feat: Move humor dataset generation script to environments directory

This commit is contained in:
Kirill Igumenshchev 2025-05-18 17:25:54 -07:00 committed by Kirill Igumenshchev (aider)
parent 7e3f32b296
commit 51fc48fd05

View file

@ -0,0 +1,48 @@
import os
import json
from dotenv import load_dotenv
from openai import OpenAI
def main():
load_dotenv()
client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
comedians = [
"Norm Macdonald",
"John Mulaney",
"Hasan Minhaj",
"Dave Chappelle",
"Ali Wong",
"Chris Rock",
]
formats = [
"haiku",
"one-liner",
"q/a over sms",
]
output_file = "humor_dataset.jsonl"
model_name = "gpt-4o-mini"
with open(output_file, "w", encoding="utf-8") as fout:
for comedian in comedians:
for fmt in formats:
question = (
f"Whats the best local LLM model to generate {fmt} jokes "
f"in the style of {comedian}? Please explain your reasoning step by step."
)
response = client.chat.completions.create(
model=model_name,
messages=[{"role": "user", "content": question}],
)
answer = response.choices[0].message.content.strip()
record = {
"comedian": comedian,
"format": fmt,
"question": question,
"response": answer,
}
fout.write(json.dumps(record, ensure_ascii=False) + "\n")
if __name__ == "__main__":
main()