grady / util.py
bstraehle's picture
Update util.py
b68f7ec verified
raw
history blame
1.95 kB
import pandas as pd
from openai import OpenAI
# Path of the JSON Lines file that get_questions() loads.
FILE_NAME = "data/gaia_validation_20.jsonl"
# Model name passed to the chat completions call in get_final_answer().
FINAL_ANSWER_MODEL = "gpt-4.5-preview"
def get_questions(file_name=None):
    """Load the evaluation questions from a JSON Lines file.

    Args:
        file_name: Path of the JSON Lines file to read. When omitted (or
            ``None``), the module-level ``FILE_NAME`` is used, so existing
            ``get_questions()`` calls keep working unchanged.

    Returns:
        A list with one entry per row of the loaded data, in file order.
        Each entry is the list ``[Level, Question, file_name, Final answer]``
        built from the columns of the same names.

    Raises:
        KeyError: If one of the four columns is absent from the loaded data.
    """
    # Resolve the default at call time so the constant is only consulted
    # when the caller does not supply a path.
    path = FILE_NAME if file_name is None else file_name
    df = pd.read_json(path, lines=True)

    return [
        [row["Level"], row["Question"], row["file_name"], row["Final answer"]]
        for _, row in df.iterrows()
    ]
def get_final_answer(question, initial_answer):
    """Ask the final-answer model to condense an initial answer.

    The question and the initial answer are spliced into a fixed instruction
    prompt (formatting rules plus five worked examples), which is sent as a
    single user message through the OpenAI chat completions API using the
    model named by ``FINAL_ANSWER_MODEL``.

    Args:
        question: Question text; concatenated into the prompt as-is.
        initial_answer: Draft answer text; concatenated into the prompt as-is.

    Returns:
        The message content of the first choice in the completion.
    """
    # The prompt is assembled from three fixed segments with the two
    # caller-supplied strings placed between them.
    rules_and_question_label = """
You are an expert question answering assistant. Given a question and an initial answer, your task is to provide the final answer.
Your final answer must be a number and/or string OR as few words as possible OR a comma-separated list of numbers and/or strings.
If you are asked for a number, don't use comma to write your number neither use units such as $ or % unless specified otherwise.
If you are asked for a string, don't use articles, neither abbreviations, and write the digits in plain text unless specified otherwise.
If you are asked for a comma-separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
If the final answer is a single word, start uppercase.
**Question:** """
    initial_answer_label = """
**Initial answer:** """
    examples_and_cue = """
**Example 1:** How many 'r's are in strawberry? 3
**Example 2:** What is the opposite of black? White
**Example 3:** What is the biggest city in California? Los Angeles
**Example 4:** What is the superlative of good? Best
**Example 5:** How many states are in the USA? 50
**Final answer:**
"""
    prompt = (
        rules_and_question_label
        + question
        + initial_answer_label
        + initial_answer
        + examples_and_cue
    )

    user_message = {
        "role": "user",
        "content": [{"type": "text", "text": prompt}],
    }
    response = OpenAI().chat.completions.create(
        model=FINAL_ANSWER_MODEL,
        messages=[user_message],
    )

    first_choice = response.choices[0]
    return first_choice.message.content