rymc committed on
Commit
9938995
·
verified ·
1 Parent(s): c5e769d

Update leaderboard/data/leaderboard.csv

Browse files
Files changed (1) hide show
  1. leaderboard/data/leaderboard.csv +18 -18
leaderboard/data/leaderboard.csv CHANGED
@@ -1,18 +1,18 @@
1
- Models,ha_rag_rate,ha_non_rag_rate
2
- klusterai-Meta-Llama-3.1-8B-Instruct-Turbo,8.1,12.5
3
- Qwen2.5-VL-7B-Instruct,9.35,4.55
4
- Mistral-Nemo-Instruct-2407,10.63,8.74
5
- Llama-4-Maverick-17B-128E-Instruct-FP8,3.34,0.69
6
- Llama-4-Scout-17B-16E-Instruct,4.23,2.48
7
- Mistral-Small-24B-Instruct-2501,4.74,7.85
8
- Magistral-Small-2506,8.62,28.07
9
- gemma-3-27b-it,3.71,0.48
10
- klusterai-Meta-Llama-3.3-70B-Instruct-Turbo,2.12,1.09
11
- DeepSeek-V3-0324,4.66,0.91
12
- Qwen3-235B-A22B-FP8,5.04,0.88
13
- DeepSeek-R1-0528,2.26,0.78
14
- gpt-4o,6.05,0.64
15
- claude-sonnet-4,2.21,0.6
16
- gemini-2.5-pro,1.57,0.36
17
- kimi-k2,2.91,4.11
18
- qwen3-235b-a22b-07-25,7.87,0.94
 
1
+ Models,ha_rag_rate,ha_non_rag_rate
2
+ klusterai-Meta-Llama-3.1-8B-Instruct-Turbo,8.1,12.5
3
+ Qwen2.5-VL-7B-Instruct,9.35,4.55
4
+ Mistral-Nemo-Instruct-2407,10.63,8.74
5
+ Llama-4-Maverick-17B-128E-Instruct-FP8,3.34,0.69
6
+ Llama-4-Scout-17B-16E-Instruct,4.23,2.48
7
+ Mistral-Small-24B-Instruct-2501,4.74,7.85
8
+ Magistral-Small-2506,8.62,28.07
9
+ gemma-3-27b-it,3.71,0.48
10
+ klusterai-Meta-Llama-3.3-70B-Instruct-Turbo,2.12,1.09
11
+ DeepSeek-V3-0324,4.66,0.91
12
+ Qwen3-235B-A22B-FP8,5.04,0.88
13
+ DeepSeek-R1-0528,2.26,0.78
14
+ gpt-4o,6.05,0.64
15
+ claude-sonnet-4,2.21,0.6
16
+ gemini-2.5-pro,1.57,0.36
17
+ kimi-k2,2.91,4.11
18
+ Qwen3-235B-A22B-FP8-2507,7.87,0.94