jumelet committed on
Commit
5e6bc0c
·
1 Parent(s): 604e6ce

Training in progress, step 1757

Browse files
Files changed (4) hide show
  1. config.json +1 -1
  2. pytorch_model.bin +2 -2
  3. tokenizer.json +55 -55
  4. training_args.bin +1 -1
config.json CHANGED
@@ -19,7 +19,7 @@
19
  "layer_norm_epsilon": 1e-05,
20
  "model_type": "gpt2",
21
  "n_ctx": 1024,
22
- "n_embd": 128,
23
  "n_head": 8,
24
  "n_inner": null,
25
  "n_layer": 8,
 
19
  "layer_norm_epsilon": 1e-05,
20
  "model_type": "gpt2",
21
  "n_ctx": 1024,
22
+ "n_embd": 256,
23
  "n_head": 8,
24
  "n_inner": null,
25
  "n_layer": 8,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11cbbfa01a7706bd61b0297af02a5b8ca6c04e0b5a3f6ab01b613b346ac62350
3
- size 6438682
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a76c15c1f0c184493e6adb4a3408590a7847f6232446a7707a386a0100f3b9f
3
+ size 25427930
tokenizer.json CHANGED
@@ -104,78 +104,78 @@
104
  "he": 11,
105
  "in": 12,
106
  "Bible": 13,
107
- "n<apostrophe>t": 14,
108
- "a": 15,
109
  "here": 16,
110
  "He": 17,
111
  "to": 18,
112
  "by": 19,
113
- "<apostrophe>s": 20,
114
- "ditch": 21,
115
  "boy": 22,
116
- "knew": 23,
117
- "did": 24,
118
  "Oh": 25,
119
- "they": 26,
120
- ":": 27,
121
  "them": 28,
122
- "But": 29,
123
- "there": 30,
124
  "meant": 31,
125
- "Tuesday": 32,
126
- "find": 33,
127
- "help": 34,
128
- "Today": 35,
129
- "The": 36,
130
- "care": 37,
131
- "quite": 38,
132
- "not": 39,
133
- "really": 40,
134
- "intended": 41,
135
- "now": 42,
136
- "mattered": 43,
137
- "that": 44,
138
- "happened": 45,
139
- "should": 46,
140
- "leave": 47,
141
- "They": 48,
142
- "of": 49,
143
  "moved": 50,
144
- "finally": 51,
145
- "his": 52,
146
- "world": 53,
147
- "fingers": 54,
148
- "blackened": 55,
149
- "cows": 56,
150
- "justice": 57,
151
- "told": 58,
152
- "Because": 59,
153
- "none": 60,
154
  "class": 61,
155
- "finger": 62,
156
- "virtue": 63,
157
  "sure": 64,
158
  "what": 65,
159
  "narrowed": 66,
160
  "saw": 67,
161
  "were": 68,
162
- "even": 69,
163
- "then": 70,
164
- "And": 71,
165
  "dirt": 72,
166
  "lip": 73,
167
- "quivered": 74,
168
- "hazel": 75,
169
- "grass": 76,
170
- "baby": 77,
171
- "eyes": 78,
172
- "lower": 79,
173
- "child": 80,
174
- "darker": 81,
175
- "like": 82,
176
- "from": 83,
177
- "rising": 84,
178
- "than": 85,
179
  "silky": 86,
180
  "own": 87
181
  },
 
104
  "he": 11,
105
  "in": 12,
106
  "Bible": 13,
107
+ "a": 14,
108
+ "n<apostrophe>t": 15,
109
  "here": 16,
110
  "He": 17,
111
  "to": 18,
112
  "by": 19,
113
+ "ditch": 20,
114
+ "<apostrophe>s": 21,
115
  "boy": 22,
116
+ "did": 23,
117
+ "knew": 24,
118
  "Oh": 25,
119
+ ":": 26,
120
+ "they": 27,
121
  "them": 28,
122
+ "there": 29,
123
+ "But": 30,
124
  "meant": 31,
125
+ "that": 32,
126
+ "The": 33,
127
+ "Today": 34,
128
+ "Tuesday": 35,
129
+ "now": 36,
130
+ "find": 37,
131
+ "should": 38,
132
+ "leave": 39,
133
+ "help": 40,
134
+ "care": 41,
135
+ "not": 42,
136
+ "intended": 43,
137
+ "really": 44,
138
+ "quite": 45,
139
+ "They": 46,
140
+ "mattered": 47,
141
+ "finally": 48,
142
+ "told": 49,
143
  "moved": 50,
144
+ "blackened": 51,
145
+ "happened": 52,
146
+ "justice": 53,
147
+ "world": 54,
148
+ "fingers": 55,
149
+ "none": 56,
150
+ "his": 57,
151
+ "of": 58,
152
+ "cows": 59,
153
+ "Because": 60,
154
  "class": 61,
155
+ "virtue": 62,
156
+ "finger": 63,
157
  "sure": 64,
158
  "what": 65,
159
  "narrowed": 66,
160
  "saw": 67,
161
  "were": 68,
162
+ "And": 69,
163
+ "even": 70,
164
+ "then": 71,
165
  "dirt": 72,
166
  "lip": 73,
167
+ "baby": 74,
168
+ "grass": 75,
169
+ "hazel": 76,
170
+ "quivered": 77,
171
+ "darker": 78,
172
+ "child": 79,
173
+ "eyes": 80,
174
+ "like": 81,
175
+ "than": 82,
176
+ "rising": 83,
177
+ "from": 84,
178
+ "lower": 85,
179
  "silky": 86,
180
  "own": 87
181
  },
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce8e2e7270347d4dcb6a72fa308698c80a29e97650cbc2f94ccd57bf7d935a93
3
  size 4472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0687459bb833b211fcc325c8754de5eaee936871d5a3e7c19be03e852d3b1a9b
3
  size 4472