hunterhector committed on
Commit
e3e4276
·
verified ·
1 Parent(s): 4beacbb

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +29 -25
README.md CHANGED
@@ -31,6 +31,31 @@ datasets:
31
  model-index:
32
  - name: CrystalChat
33
  results:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  - task:
35
  type: multiple-choice # Required. Example: automatic-speech-recognition
36
  dataset:
@@ -64,9 +89,12 @@ model-index:
64
  type: winogrande # Required. Example: common_voice. Use dataset id from https://hf.co/datasets
65
  name: Winogrande # Required. A pretty name for the dataset. Example: Common Voice (French)
66
  metrics:
67
- - name: accuracy
68
  type: accuracy # Required. Example: wer. Use metric id from https://hf.co/metrics
69
  value: 70.639 # Required. Example: 41.148
 
 
 
70
  - task:
71
  type: multiple-choice # Required. Example: automatic-speech-recognition
72
  dataset:
@@ -145,30 +173,6 @@ model-index:
145
  - name: Accuracy (5 shot)
146
  type: accuracy # Required. Example: wer. Use metric id from https://hf.co/metrics
147
  value: 28.052 # Required. Example: 41.148
148
- - task:
149
- type: text-generation # Required. Example: automatic-speech-recognition
150
- dataset:
151
- type: openai_humanneval # Required. Example: common_voice. Use dataset id from https://hf.co/datasets
152
- name: OpenAI HumanEval # Required. A pretty name for the dataset. Example: Common Voice (French)
153
- metrics:
154
- - name: pass@1 (t=0.01)
155
- type: pass@1 # Required. Example: wer. Use metric id from https://hf.co/metrics
156
- value: 31.707 # Required. Example: 41.148
157
- - name: pass@10 (t=0.8)
158
- type: pass@10
159
- value: 65.755
160
- - task:
161
- type: text-generation # Required. Example: automatic-speech-recognition
162
- dataset:
163
- type: mbpp # Required. Example: common_voice. Use dataset id from https://hf.co/datasets
164
- name: Mostly Basic Python Problems (mbpp) # Required. A pretty name for the dataset. Example: Common Voice (French)
165
- metrics:
166
- - name: pass@1 (t=0.01)
167
- type: pass@1 # Required. Example: wer. Use metric id from https://hf.co/metrics
168
- value: 39.4 # Required. Example: 41.148
169
- - name: pass@10 (t=0.8)
170
- type: pass@10
171
- value: 59.895
172
  ---
173
 
174
  # CrystalChat
 
31
  model-index:
32
  - name: CrystalChat
33
  results:
34
+ - task:
35
+ type: text-generation # Required. Example: automatic-speech-recognition
36
+ dataset:
37
+ type: openai_humaneval # Required. Example: common_voice. Use dataset id from https://hf.co/datasets
38
+ name: OpenAI HumanEval # Required. A pretty name for the dataset. Example: Common Voice (French)
39
+ metrics:
40
+ - name: pass@1 (t=0.01)
41
+ type: pass@1 # Required. Example: wer. Use metric id from https://hf.co/metrics
42
+ value: 31.707 # Required. Example: 41.148
43
+ - name: pass@10 (t=0.8)
44
+ type: pass@10
45
+ value: 65.755
46
+ - task:
47
+ type: text-generation # Required. Example: automatic-speech-recognition
48
+ dataset:
49
+ type: mbpp # Required. Example: common_voice. Use dataset id from https://hf.co/datasets
50
+ name: Mostly Basic Python Problems (mbpp) # Required. A pretty name for the dataset. Example: Common Voice (French)
51
+ metrics:
52
+ - name: pass@1 (t=0.01)
53
+ type: pass@1 # Required. Example: wer. Use metric id from https://hf.co/metrics
54
+ value: 39.4 # Required. Example: 41.148
55
+ - name: pass@10 (t=0.8)
56
+ type: pass@10
57
+ value: 59.895
58
+
59
  - task:
60
  type: multiple-choice # Required. Example: automatic-speech-recognition
61
  dataset:
 
89
  type: winogrande # Required. Example: common_voice. Use dataset id from https://hf.co/datasets
90
  name: Winogrande # Required. A pretty name for the dataset. Example: Common Voice (French)
91
  metrics:
92
+ - name: Accuracy (5 shot)
93
  type: accuracy # Required. Example: wer. Use metric id from https://hf.co/metrics
94
  value: 70.639 # Required. Example: 41.148
95
+ - name: Accuracy (0 shot)
96
+ type: accuracy # Required. Example: wer. Use metric id from https://hf.co/metrics
97
+ value: 68.114 # Required. Example: 41.148
98
  - task:
99
  type: multiple-choice # Required. Example: automatic-speech-recognition
100
  dataset:
 
173
  - name: Accuracy (5 shot)
174
  type: accuracy # Required. Example: wer. Use metric id from https://hf.co/metrics
175
  value: 28.052 # Required. Example: 41.148
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
176
  ---
177
 
178
  # CrystalChat