Spaces:
Runtime error
Runtime error
missing
Browse files
src/leaderboard/read_evals.py
CHANGED
|
@@ -469,14 +469,14 @@ def get_raw_eval_results(results_path: str, requests_path: str, metadata) -> lis
|
|
| 469 |
|
| 470 |
print(f"Missing sbatch results:")
|
| 471 |
for r in for_run:
|
| 472 |
-
if r[0]==5 and r[1] in ['
|
| 473 |
fm=r[2]
|
| 474 |
-
script='
|
| 475 |
if ',chat' in fm:
|
| 476 |
-
script='
|
| 477 |
fm=fm.replace(',chat','')
|
| 478 |
if ',multiturn' in fm:
|
| 479 |
-
script='
|
| 480 |
fm=fm.replace(',multiturn','')
|
| 481 |
|
| 482 |
print(f'sbatch start.sh "bash {script} {r[0]} {r[1]} {fm}"')
|
|
|
|
| 469 |
|
| 470 |
print(f"Missing sbatch results:")
|
| 471 |
for r in for_run:
|
| 472 |
+
if r[0]==5 and r[1] in ['polish_eq_bench']: continue
|
| 473 |
fm=r[2]
|
| 474 |
+
script='eval_model_task_bs1.sh'
|
| 475 |
if ',chat' in fm:
|
| 476 |
+
script='eval_model_task_bs1_chat.sh'
|
| 477 |
fm=fm.replace(',chat','')
|
| 478 |
if ',multiturn' in fm:
|
| 479 |
+
script='eval_model_task_bs1_chat_few.sh'
|
| 480 |
fm=fm.replace(',multiturn','')
|
| 481 |
|
| 482 |
print(f'sbatch start.sh "bash {script} {r[0]} {r[1]} {fm}"')
|