Update README.md
Browse files
README.md
CHANGED
@@ -41,8 +41,8 @@ Remark: We developed the TH pair by translating the original datasets into Thai
|
|
41 |
|
42 |
| Model | ONET | IC | TGAT | TPAT-1 | A-Level | Average (ThaiExam) | MMLU |
|
43 |
| --- | --- | --- | --- | --- | --- | --- | --- |
|
44 |
-
| Typhoon-1.5X 70B | 0.565 | 0.68 | 0.778 | 0.517 | 0.56 | 0.620 | 0.7945 |
|
45 |
-
| gpt-4-0612 | 0.493 | 0.69 | 0.744 | 0.509 | 0.616 | 0.610 | 0.864** |
|
46 |
| --- | --- | --- | --- | --- | --- | --- | --- |
|
47 |
| gpt-4o | 0.62 | 0.63 | 0.789 | 0.56 | 0.623 | 0.644 | 0.887** |
|
48 |
|
@@ -52,7 +52,7 @@ Remark: We developed the TH pair by translating the original datasets into Thai
|
|
52 |
|
53 |
| Model | MT-Bench Thai | MT-Bench English |
|
54 |
| --- | --- | --- |
|
55 |
-
| Typhoon-1.5X 70B | 8.029 | 8.797 |
|
56 |
| gpt-4-0612 | 7.801 | 8.671 |
|
57 |
| --- | --- | --- |
|
58 |
| gpt-4o | 8.514 | 9.184 |
|
@@ -61,7 +61,7 @@ Remark: We developed the TH pair by translating the original datasets into Thai
|
|
61 |
|
62 |
| Model | IFEval Thai | IFEval English |
|
63 |
| --- | --- | --- |
|
64 |
-
| Typhoon-1.5X 70B | 0.645 | 0.810 |
|
65 |
| gpt-4-0612 | 0.612 | 0.793* |
|
66 |
| --- | --- | --- |
|
67 |
| gpt-4o | 0.737 | 0.871 |
|
@@ -72,9 +72,9 @@ Remark: We developed the TH pair by translating the original datasets into Thai
|
|
72 |
|
73 |
| Model | GAIA - Thai/English | GSM8K - Thai/English | HotpotQA - Thai/English |
|
74 |
| --- | --- | --- | --- |
|
75 |
-
| gpt-3.5-turbo-0125 | 18.42/37.5 | 70/80 | 39.56/59 |
|
76 |
| Typhoon-1.5X 70B | 17.10/36.25 | 80/95 | 52.7/65.83 |
|
77 |
-
| gpt-4-0612 | 17.10/38.75 | 90/100 | 56.41/76.25 |
|
78 |
| --- | --- | --- | --- |
|
79 |
| gpt-4o | 44.73/57.5 | 100/100 | 71.64/76.58 |
|
80 |
|
|
|
41 |
|
42 |
| Model | ONET | IC | TGAT | TPAT-1 | A-Level | Average (ThaiExam) | MMLU |
|
43 |
| --- | --- | --- | --- | --- | --- | --- | --- |
|
44 |
+
| Typhoon-1.5X 70B | **0.565** | 0.68 | **0.778** | **0.517** | 0.56 | **0.620** | 0.7945 |
|
45 |
+
| gpt-4-0612 | 0.493 | **0.69** | 0.744 | 0.509 | **0.616** | 0.610 | **0.864**\*\* |
|
46 |
| --- | --- | --- | --- | --- | --- | --- | --- |
|
47 |
| gpt-4o | 0.62 | 0.63 | 0.789 | 0.56 | 0.623 | 0.644 | 0.887** |
|
48 |
|
|
|
52 |
|
53 |
| Model | MT-Bench Thai | MT-Bench English |
|
54 |
| --- | --- | --- |
|
55 |
+
| Typhoon-1.5X 70B | **8.029** | **8.797** |
|
56 |
| gpt-4-0612 | 7.801 | 8.671 |
|
57 |
| --- | --- | --- |
|
58 |
| gpt-4o | 8.514 | 9.184 |
|
|
|
61 |
|
62 |
| Model | IFEval Thai | IFEval English |
|
63 |
| --- | --- | --- |
|
64 |
+
| Typhoon-1.5X 70B | **0.645** | **0.810** |
|
65 |
| gpt-4-0612 | 0.612 | 0.793* |
|
66 |
| --- | --- | --- |
|
67 |
| gpt-4o | 0.737 | 0.871 |
|
|
|
72 |
|
73 |
| Model | GAIA - Thai/English | GSM8K - Thai/English | HotpotQA - Thai/English |
|
74 |
| --- | --- | --- | --- |
|
75 |
+
| gpt-3.5-turbo-0125 | **18.42**/37.5 | 70/80 | 39.56/59 |
|
76 |
| Typhoon-1.5X 70B | 17.10/36.25 | 80/95 | 52.7/65.83 |
|
77 |
+
| gpt-4-0612 | 17.10/**38.75** | **90**/**100** | **56.41**/**76.25** |
|
78 |
| --- | --- | --- | --- |
|
79 |
| gpt-4o | 44.73/57.5 | 100/100 | 71.64/76.58 |
|
80 |
|