|
import pandas as pd |
|
|
|
from openai import OpenAI |
|
|
|
FILE_NAME = "data/gaia_validation_20.jsonl" |
|
|
|
FINAL_ANSWER_MODEL = "gpt-4.5-preview" |
|
|
|
def get_questions(): |
|
df = pd.read_json(FILE_NAME, lines=True) |
|
result=[] |
|
|
|
for index, row in df.iterrows(): |
|
result.append([row["Level"], row["Question"], row["file_name"], row["Final answer"]]) |
|
|
|
return result |
|
|
|
def get_final_answer(question, initial_answer): |
|
prompt_template = """ |
|
You are an expert question answering assistant. Given a question and an initial answer, your task is to provide the final answer. |
|
Your final answer must be a number and/or string OR as few words as possible OR a comma-separated list of numbers and/or strings. |
|
If you are asked for a number, don't use comma to write your number neither use units such as $ or % unless specified otherwise. |
|
If you are asked for a string, don't use articles, neither abbreviations, and write the digits in plain text unless specified otherwise. |
|
If you are asked for a comma-separated list, apply the above rules depending of whether the element to be put in the list is a number or a string. |
|
If the final answer is a single word, start uppercase. |
|
|
|
**Question:** """ + question + """ |
|
|
|
**Initial answer:** """ + initial_answer + """ |
|
|
|
**Example 1:** How many 'r's are in strawberry? 3 |
|
**Example 2:** What is the opposite of black? White |
|
**Example 3:** What is the biggest city in California? Los Angeles |
|
**Example 4:** What is the superlative of good? Best |
|
**Example 5:** How many states are in the USA? 50 |
|
|
|
**Final answer:** |
|
|
|
""" |
|
|
|
client = OpenAI() |
|
completion = client.chat.completions.create( |
|
messages=[{"role": "user", "content": [{"type": "text", "text": prompt_template}]}], |
|
model=FINAL_ANSWER_MODEL |
|
) |
|
|
|
return completion.choices[0].message.content |