abrek committed on
Commit
8ce7f2f
·
verified ·
1 Parent(s): 3c1441b

Fix whitespace problem in GECTurk model responses

Browse files
results/zero-shot/CerebrumTech__cere-llama-3-8b-tr.json CHANGED
@@ -47,7 +47,7 @@
47
  {
48
  "name": "gecturk_generation",
49
  "task": "grammatical_error_correction",
50
- "exact_match": 0.013385333911117531
51
  },
52
  {
53
  "name": "xquad_tr",
 
47
  {
48
  "name": "gecturk_generation",
49
  "task": "grammatical_error_correction",
50
+ "exact_match": 0.4596
51
  },
52
  {
53
  "name": "xquad_tr",
results/zero-shot/Llama-3.3-70B-Instruct.json CHANGED
@@ -162,7 +162,7 @@
162
  {
163
  "name": "gecturk_generation",
164
  "task": "grammatical_error_correction",
165
- "exact_match": 0.0052482064615532766
166
  },
167
  {
168
  "name": "mlsum_tr",
 
162
  {
163
  "name": "gecturk_generation",
164
  "task": "grammatical_error_correction",
165
+ "exact_match": 0.441
166
  },
167
  {
168
  "name": "mlsum_tr",
results/zero-shot/Ministral-8B-Instruct.json CHANGED
@@ -166,7 +166,7 @@
166
  {
167
  "name": "gecturk_generation",
168
  "task": "grammatical_error_correction",
169
- "exact_match": 0.009003803745967548
170
  },
171
  {
172
  "name": "turkce_atasozleri",
 
166
  {
167
  "name": "gecturk_generation",
168
  "task": "grammatical_error_correction",
169
+ "exact_match": 0.3915
170
  },
171
  {
172
  "name": "turkce_atasozleri",
results/zero-shot/Mixtral-8x7B-Instruct-v0.1.json CHANGED
@@ -168,7 +168,7 @@
168
  {
169
  "name": "gecturk_generation",
170
  "task": "grammatical_error_correction",
171
- "exact_match": 0.036255958399537776
172
  },
173
  {
174
  "name": "turkce_atasozleri",
 
168
  {
169
  "name": "gecturk_generation",
170
  "task": "grammatical_error_correction",
171
+ "exact_match": 0.0364
172
  },
173
  {
174
  "name": "turkce_atasozleri",
results/zero-shot/Qwen2.5-0.5B-Instruct.json CHANGED
@@ -46,7 +46,7 @@
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
- "exact_match": 0.0005296355144686793
50
  },
51
  {
52
  "name": "xquad_tr",
 
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
+ "exact_match": 0.0177
50
  },
51
  {
52
  "name": "xquad_tr",
results/zero-shot/Qwen2.5-0.5B.json CHANGED
@@ -46,7 +46,7 @@
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
- "exact_match": 0.008859357696566999
50
  },
51
  {
52
  "name": "xquad_tr",
 
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
+ "exact_match": 0.0092
50
  },
51
  {
52
  "name": "xquad_tr",
results/zero-shot/Qwen2.5-1.5B-Instruct.json CHANGED
@@ -46,7 +46,7 @@
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
- "exact_match": 0.0012037170783379075
50
  },
51
  {
52
  "name": "xquad_tr",
 
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
+ "exact_match": 0.0361
50
  },
51
  {
52
  "name": "xquad_tr",
results/zero-shot/Qwen2.5-1.5B.json CHANGED
@@ -46,7 +46,7 @@
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
- "exact_match": 0.004188935432615918
50
  },
51
  {
52
  "name": "xquad_tr",
 
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
+ "exact_match": 0.1417
50
  },
51
  {
52
  "name": "xquad_tr",
results/zero-shot/Qwen2.5-14B-Instruct.json CHANGED
@@ -168,7 +168,7 @@
168
  {
169
  "name": "gecturk_generation",
170
  "task": "grammatical_error_correction",
171
- "exact_match": 0.00130001444460494
172
  },
173
  {
174
  "name": "turkce_atasozleri",
 
168
  {
169
  "name": "gecturk_generation",
170
  "task": "grammatical_error_correction",
171
+ "exact_match": 0.1088
172
  },
173
  {
174
  "name": "turkce_atasozleri",
results/zero-shot/Qwen2.5-14B.json CHANGED
@@ -168,7 +168,7 @@
168
  {
169
  "name": "gecturk_generation",
170
  "task": "grammatical_error_correction",
171
- "exact_match": 0.003707448601280755
172
  },
173
  {
174
  "name": "turkce_atasozleri",
 
168
  {
169
  "name": "gecturk_generation",
170
  "task": "grammatical_error_correction",
171
+ "exact_match": 0.1888
172
  },
173
  {
174
  "name": "turkce_atasozleri",
results/zero-shot/Qwen2.5-3B-Instruct.json CHANGED
@@ -46,7 +46,7 @@
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
- "exact_match": 0.0032741104530791083
50
  },
51
  {
52
  "name": "xquad_tr",
 
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
+ "exact_match": 0.0406
50
  },
51
  {
52
  "name": "xquad_tr",
results/zero-shot/Qwen2.5-3B.json CHANGED
@@ -46,7 +46,7 @@
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
- "exact_match": 0.01261495498098127
50
  },
51
  {
52
  "name": "xquad_tr",
 
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
+ "exact_match": 0.1466
50
  },
51
  {
52
  "name": "xquad_tr",
results/zero-shot/Qwen2.5-7B-Instruct.json CHANGED
@@ -46,7 +46,7 @@
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
- "exact_match": 0.0007222302470027445
50
  },
51
  {
52
  "name": "xquad_tr",
 
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
+ "exact_match": 0.0661
50
  },
51
  {
52
  "name": "xquad_tr",
results/zero-shot/Qwen2.5-7B.json CHANGED
@@ -46,7 +46,7 @@
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
- "exact_match": 0.005537098560354375
50
  },
51
  {
52
  "name": "xquad_tr",
 
46
  {
47
  "name": "gecturk_generation",
48
  "task": "grammatical_error_correction",
49
+ "exact_match": 0.2227
50
  },
51
  {
52
  "name": "xquad_tr",
results/zero-shot/aya-23-35B.json CHANGED
@@ -134,7 +134,7 @@
134
  {
135
  "name": "gecturk_generation",
136
  "task": "grammatical_error_correction",
137
- "exact_match": 0.009437141894169195
138
  },
139
  {
140
  "name": "xlsum_tr",
 
134
  {
135
  "name": "gecturk_generation",
136
  "task": "grammatical_error_correction",
137
+ "exact_match": 0.3079
138
  },
139
  {
140
  "name": "xlsum_tr",
results/zero-shot/aya-23-8b.json CHANGED
@@ -128,7 +128,7 @@
128
  {
129
  "name": "gecturk_generation",
130
  "task": "grammatical_error_correction",
131
- "exact_match": 0.008281573498964804
132
  },
133
  {
134
  "name": "mlsum_tr",
 
128
  {
129
  "name": "gecturk_generation",
130
  "task": "grammatical_error_correction",
131
+ "exact_match": 0.0429
132
  },
133
  {
134
  "name": "mlsum_tr",
results/zero-shot/aya-expanse-32b.json CHANGED
@@ -167,7 +167,7 @@
167
  {
168
  "name": "gecturk_generation",
169
  "task": "grammatical_error_correction",
170
- "exact_match": 0
171
  },
172
  {
173
  "name": "turkce_atasozleri",
 
167
  {
168
  "name": "gecturk_generation",
169
  "task": "grammatical_error_correction",
170
+ "exact_match": 0.0447
171
  },
172
  {
173
  "name": "turkce_atasozleri",
results/zero-shot/aya-expanse-8b.json CHANGED
@@ -30,7 +30,7 @@
30
  {
31
  "name": "gecturk_generation",
32
  "task": "grammatical_error_correction",
33
- "exact_match": 0.0018296499590736194
34
  },
35
  {
36
  "name": "ironytr",
 
30
  {
31
  "name": "gecturk_generation",
32
  "task": "grammatical_error_correction",
33
+ "exact_match": 0.0552
34
  },
35
  {
36
  "name": "ironytr",
results/zero-shot/aya101.json CHANGED
@@ -154,7 +154,7 @@
154
  {
155
  "name": "gecturk_generation",
156
  "task": "grammatical_error_correction",
157
- "exact_match": 0.0
158
  },
159
  {
160
  "name": "exams_tr",
 
154
  {
155
  "name": "gecturk_generation",
156
  "task": "grammatical_error_correction",
157
+ "exact_match": 0.3239
158
  },
159
  {
160
  "name": "exams_tr",
results/zero-shot/commencis-7b.json CHANGED
@@ -154,7 +154,7 @@
154
  {
155
  "name": "gecturk_generation",
156
  "task": "grammatical_error_correction",
157
- "exact_match": 0.1701574461938466
158
  },
159
  {
160
  "name": "exams_tr",
 
154
  {
155
  "name": "gecturk_generation",
156
  "task": "grammatical_error_correction",
157
+ "exact_match": 0.2371
158
  },
159
  {
160
  "name": "exams_tr",
results/zero-shot/kanarya-2b.json CHANGED
@@ -23,7 +23,7 @@
23
  {
24
  "name": "gecturk_generation",
25
  "task": "grammatical_error_correction",
26
- "exact_match": 9.62973662670326e-05
27
  },
28
  {
29
  "name": "ironytr",
 
23
  {
24
  "name": "gecturk_generation",
25
  "task": "grammatical_error_correction",
26
+ "exact_match": 0.0662
27
  },
28
  {
29
  "name": "ironytr",
results/zero-shot/llama-3-8b-instruct.json CHANGED
@@ -127,7 +127,7 @@
127
  {
128
  "name": "gecturk_generation",
129
  "task": "grammatical_error_correction",
130
- "exact_match": 0.005007463045885695
131
  },
132
  {
133
  "name": "mlsum_tr",
 
127
  {
128
  "name": "gecturk_generation",
129
  "task": "grammatical_error_correction",
130
+ "exact_match": 0.1001
131
  },
132
  {
133
  "name": "mlsum_tr",
results/zero-shot/llama-3-8b.json CHANGED
@@ -126,7 +126,7 @@
126
  {
127
  "name": "gecturk_generation",
128
  "task": "grammatical_error_correction",
129
- "exact_match": 0.006692666955558766
130
  },
131
  {
132
  "name": "mlsum_tr",
 
126
  {
127
  "name": "gecturk_generation",
128
  "task": "grammatical_error_correction",
129
+ "exact_match": 0.3412
130
  },
131
  {
132
  "name": "mlsum_tr",
results/zero-shot/llama-3.1-8b-instruct.json CHANGED
@@ -126,7 +126,7 @@
126
  {
127
  "name": "gecturk_generation",
128
  "task": "grammatical_error_correction",
129
- "exact_match": 0.006548220906158217
130
  },
131
  {
132
  "name": "mlsum_tr",
 
126
  {
127
  "name": "gecturk_generation",
128
  "task": "grammatical_error_correction",
129
+ "exact_match": 0.3149
130
  },
131
  {
132
  "name": "mlsum_tr",
results/zero-shot/llama-3.1-8b.json CHANGED
@@ -126,7 +126,7 @@
126
  {
127
  "name": "gecturk_generation",
128
  "task": "grammatical_error_correction",
129
- "exact_match": 0.006548220906158217
130
  },
131
  {
132
  "name": "mlsum_tr",
 
126
  {
127
  "name": "gecturk_generation",
128
  "task": "grammatical_error_correction",
129
+ "exact_match": 0.3527
130
  },
131
  {
132
  "name": "mlsum_tr",
results/zero-shot/llama-3.2-1b.json CHANGED
@@ -30,7 +30,7 @@
30
  {
31
  "name": "gecturk_generation",
32
  "task": "grammatical_error_correction",
33
- "exact_match": 0.00741489720256151
34
  },
35
  {
36
  "name": "ironytr",
 
30
  {
31
  "name": "gecturk_generation",
32
  "task": "grammatical_error_correction",
33
+ "exact_match": 0.181
34
  },
35
  {
36
  "name": "ironytr",
results/zero-shot/llama-3.2-3b-instruct.json CHANGED
@@ -30,7 +30,7 @@
30
  {
31
  "name": "gecturk_generation",
32
  "task": "grammatical_error_correction",
33
- "exact_match": 0.007222302470027445
34
  },
35
  {
36
  "name": "ironytr",
 
30
  {
31
  "name": "gecturk_generation",
32
  "task": "grammatical_error_correction",
33
+ "exact_match": 0.1672
34
  },
35
  {
36
  "name": "ironytr",
results/zero-shot/llama-3.2-3b.json CHANGED
@@ -120,7 +120,7 @@
120
  {
121
  "name": "gecturk_generation",
122
  "task": "grammatical_error_correction",
123
- "exact_match": 0.004670422263951081
124
  },
125
  {
126
  "name": "mlsum_tr",
 
120
  {
121
  "name": "gecturk_generation",
122
  "task": "grammatical_error_correction",
123
+ "exact_match": 0.2682
124
  },
125
  {
126
  "name": "mlsum_tr",
results/zero-shot/mistral-7b.json CHANGED
@@ -132,7 +132,7 @@
132
  {
133
  "name": "gecturk_generation",
134
  "task": "grammatical_error_correction",
135
- "exact_match": 0.20660599932591844
136
  },
137
  {
138
  "name": "mlsum_tr",
 
132
  {
133
  "name": "gecturk_generation",
134
  "task": "grammatical_error_correction",
135
+ "exact_match": 0.2084
136
  },
137
  {
138
  "name": "mlsum_tr",
results/zero-shot/trendyol-7b.json CHANGED
@@ -154,7 +154,7 @@
154
  {
155
  "name": "gecturk_generation",
156
  "task": "grammatical_error_correction",
157
- "exact_match": 0.00048148683133516297
158
  },
159
  {
160
  "name": "exams_tr",
 
154
  {
155
  "name": "gecturk_generation",
156
  "task": "grammatical_error_correction",
157
+ "exact_match": 0.0007
158
  },
159
  {
160
  "name": "exams_tr",