bobbyw committed on
Commit
c387cb4
·
verified ·
1 Parent(s): 7f97812

Training in progress, epoch 1

Browse files
added_tokens.json CHANGED
@@ -1,55 +1,67 @@
1
  {
2
- "</access_instructions>": 128042,
3
  "</accommodation>": 128002,
4
  "</activity>": 128004,
5
- "</address>": 128028,
6
- "</arrival location>": 128006,
7
  "</attendee>": 128008,
8
- "</availability>": 128050,
 
 
9
  "</cost>": 128010,
10
  "</date>": 128012,
11
- "</flight_type>": 128046,
12
- "</itenerary>": 128014,
13
- "</itinerary>": 128024,
14
- "</link>": 128036,
15
- "</location>": 128016,
16
- "</occupancy>": 128040,
17
- "</person>": 128048,
18
- "</pickup_location>": 128052,
19
- "</planner>": 128022,
20
- "</probability>": 128044,
21
- "</seat>": 128026,
22
- "</sender>": 128018,
23
- "</thing_needed>": 128030,
24
- "</time>": 128020,
25
- "</travel>": 128032,
26
- "</trip>": 128038,
27
- "</type>": 128034,
28
- "<access_instructions>": 128041,
 
 
 
 
29
  "<accommodation>": 128001,
30
  "<activity>": 128003,
31
- "<address>": 128027,
32
- "<arrival location>": 128005,
33
  "<attendee>": 128007,
34
- "<availability>": 128049,
 
 
35
  "<cost>": 128009,
36
  "<date>": 128011,
37
- "<flight_type>": 128045,
38
- "<itenerary>": 128013,
39
- "<itinerary>": 128023,
40
- "<link>": 128035,
41
- "<location>": 128015,
42
- "<occupancy>": 128039,
43
- "<person>": 128047,
44
- "<pickup_location>": 128051,
45
- "<planner>": 128021,
46
- "<probability>": 128043,
47
- "<seat>": 128025,
48
- "<sender>": 128017,
49
- "<thing_needed>": 128029,
50
- "<time>": 128019,
51
- "<travel>": 128031,
52
- "<trip>": 128037,
53
- "<type>": 128033,
 
 
 
 
54
  "[MASK]": 128000
55
  }
 
1
  {
2
+ "</access_instructions>": 128040,
3
  "</accommodation>": 128002,
4
  "</activity>": 128004,
5
+ "</address>": 128026,
6
+ "</arrival_location>": 128006,
7
  "</attendee>": 128008,
8
+ "</availability>": 128048,
9
+ "</chat_title>": 128060,
10
+ "</check_in_date>": 128056,
11
  "</cost>": 128010,
12
  "</date>": 128012,
13
+ "</flight_type>": 128044,
14
+ "</itinerary>": 128022,
15
+ "</link>": 128034,
16
+ "</location>": 128014,
17
+ "</metadata>": 128064,
18
+ "</occupancy>": 128038,
19
+ "</participants>": 128058,
20
+ "</person>": 128046,
21
+ "</pickup_location>": 128050,
22
+ "</planner>": 128020,
23
+ "</preference>": 128054,
24
+ "</probability>": 128042,
25
+ "</readable_date>": 128062,
26
+ "</seat>": 128024,
27
+ "</sender>": 128016,
28
+ "</thing_needed>": 128028,
29
+ "</time>": 128018,
30
+ "</travel>": 128030,
31
+ "</trip>": 128036,
32
+ "</type>": 128032,
33
+ "</unstructured_information>": 128052,
34
+ "<access_instructions>": 128039,
35
  "<accommodation>": 128001,
36
  "<activity>": 128003,
37
+ "<address>": 128025,
38
+ "<arrival_location>": 128005,
39
  "<attendee>": 128007,
40
+ "<availability>": 128047,
41
+ "<chat_title>": 128059,
42
+ "<check_in_date>": 128055,
43
  "<cost>": 128009,
44
  "<date>": 128011,
45
+ "<flight_type>": 128043,
46
+ "<itinerary>": 128021,
47
+ "<link>": 128033,
48
+ "<location>": 128013,
49
+ "<metadata>": 128063,
50
+ "<occupancy>": 128037,
51
+ "<participants>": 128057,
52
+ "<person>": 128045,
53
+ "<pickup_location>": 128049,
54
+ "<planner>": 128019,
55
+ "<preference>": 128053,
56
+ "<probability>": 128041,
57
+ "<readable_date>": 128061,
58
+ "<seat>": 128023,
59
+ "<sender>": 128015,
60
+ "<thing_needed>": 128027,
61
+ "<time>": 128017,
62
+ "<travel>": 128029,
63
+ "<trip>": 128035,
64
+ "<type>": 128031,
65
+ "<unstructured_information>": 128051,
66
  "[MASK]": 128000
67
  }
config.json CHANGED
@@ -70,7 +70,27 @@
70
  "59": "accommodation location",
71
  "60": "itinerary link",
72
  "61": "activity availability",
73
- "62": "activity pickup_location"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
  },
75
  "initializer_range": 0.02,
76
  "intermediate_size": 3072,
@@ -78,14 +98,18 @@
78
  "accommodation access_instructions": 41,
79
  "accommodation address": 36,
80
  "accommodation attendee": 44,
 
81
  "accommodation cost": 0,
82
  "accommodation date": 52,
83
  "accommodation link": 37,
84
  "accommodation location": 59,
85
  "accommodation occupancy": 58,
86
  "accommodation planner": 1,
 
87
  "accommodation probability": 2,
88
  "accommodation type": 3,
 
 
89
  "activity address": 31,
90
  "activity attendee": 4,
91
  "activity availability": 61,
@@ -95,23 +119,31 @@
95
  "activity location": 6,
96
  "activity pickup_location": 62,
97
  "activity planner": 7,
 
98
  "activity probability": 8,
99
  "activity restaurant": 9,
100
  "activity thing_needed": 32,
101
  "activity time": 34,
 
102
  "attendee accommodation": 57,
103
  "attendee activity": 50,
 
104
  "attendee date": 47,
105
  "attendee itinerary": 10,
106
  "attendee probability": 43,
107
  "attendee seat": 11,
 
108
  "date attendee": 12,
 
109
  "date link": 56,
 
110
  "date probability": 13,
 
111
  "itinerary attendee": 53,
112
  "itinerary date": 42,
113
  "itinerary link": 60,
114
  "itinerary probability": 14,
 
115
  "link attendee": 54,
116
  "location accommodation": 15,
117
  "location activity": 16,
@@ -120,6 +152,8 @@
120
  "location itinerary": 19,
121
  "location planner": 20,
122
  "location probability": 21,
 
 
123
  "travel arrival location": 22,
124
  "travel attendee": 23,
125
  "travel cost": 55,
@@ -127,17 +161,23 @@
127
  "travel destination": 48,
128
  "travel flight_type": 49,
129
  "travel planner": 33,
 
130
  "travel probability": 25,
131
  "travel time": 26,
132
  "travel type": 51,
 
133
  "trip accommodation": 45,
134
  "trip activity": 40,
135
  "trip attendee": 27,
136
  "trip date": 46,
 
137
  "trip link": 38,
138
  "trip location": 28,
139
  "trip travel": 29,
140
- "type probability": 30
 
 
 
141
  },
142
  "layer_norm_eps": 1e-07,
143
  "max_position_embeddings": 512,
@@ -160,7 +200,7 @@
160
  "relative_attention": true,
161
  "share_att_key": true,
162
  "torch_dtype": "float32",
163
- "transformers_version": "4.35.2",
164
  "type_vocab_size": 0,
165
- "vocab_size": 128053
166
  }
 
70
  "59": "accommodation location",
71
  "60": "itinerary link",
72
  "61": "activity availability",
73
+ "62": "activity pickup_location",
74
+ "63": "accommodation unstructured_information",
75
+ "64": "unstructured_information link",
76
+ "65": "itinerary unstructured_information",
77
+ "66": "activity unstructured_information",
78
+ "67": "activity preference",
79
+ "68": "preference attendee",
80
+ "69": "unstructured_information unstructured_information",
81
+ "70": "activity activity",
82
+ "71": "date unstructured_information",
83
+ "72": "trip itinerary",
84
+ "73": "accommodation preference",
85
+ "74": "date preference",
86
+ "75": "date date",
87
+ "76": "preference preference",
88
+ "77": "trip unstructured_information",
89
+ "78": "attendee attendee",
90
+ "79": "attendee unstructured_information",
91
+ "80": "travel preference",
92
+ "81": "travel unstructured_information",
93
+ "82": "accommodation check_in_date"
94
  },
95
  "initializer_range": 0.02,
96
  "intermediate_size": 3072,
 
98
  "accommodation access_instructions": 41,
99
  "accommodation address": 36,
100
  "accommodation attendee": 44,
101
+ "accommodation check_in_date": 82,
102
  "accommodation cost": 0,
103
  "accommodation date": 52,
104
  "accommodation link": 37,
105
  "accommodation location": 59,
106
  "accommodation occupancy": 58,
107
  "accommodation planner": 1,
108
+ "accommodation preference": 73,
109
  "accommodation probability": 2,
110
  "accommodation type": 3,
111
+ "accommodation unstructured_information": 63,
112
+ "activity activity": 70,
113
  "activity address": 31,
114
  "activity attendee": 4,
115
  "activity availability": 61,
 
119
  "activity location": 6,
120
  "activity pickup_location": 62,
121
  "activity planner": 7,
122
+ "activity preference": 67,
123
  "activity probability": 8,
124
  "activity restaurant": 9,
125
  "activity thing_needed": 32,
126
  "activity time": 34,
127
+ "activity unstructured_information": 66,
128
  "attendee accommodation": 57,
129
  "attendee activity": 50,
130
+ "attendee attendee": 78,
131
  "attendee date": 47,
132
  "attendee itinerary": 10,
133
  "attendee probability": 43,
134
  "attendee seat": 11,
135
+ "attendee unstructured_information": 79,
136
  "date attendee": 12,
137
+ "date date": 75,
138
  "date link": 56,
139
+ "date preference": 74,
140
  "date probability": 13,
141
+ "date unstructured_information": 71,
142
  "itinerary attendee": 53,
143
  "itinerary date": 42,
144
  "itinerary link": 60,
145
  "itinerary probability": 14,
146
+ "itinerary unstructured_information": 65,
147
  "link attendee": 54,
148
  "location accommodation": 15,
149
  "location activity": 16,
 
152
  "location itinerary": 19,
153
  "location planner": 20,
154
  "location probability": 21,
155
+ "preference attendee": 68,
156
+ "preference preference": 76,
157
  "travel arrival location": 22,
158
  "travel attendee": 23,
159
  "travel cost": 55,
 
161
  "travel destination": 48,
162
  "travel flight_type": 49,
163
  "travel planner": 33,
164
+ "travel preference": 80,
165
  "travel probability": 25,
166
  "travel time": 26,
167
  "travel type": 51,
168
+ "travel unstructured_information": 81,
169
  "trip accommodation": 45,
170
  "trip activity": 40,
171
  "trip attendee": 27,
172
  "trip date": 46,
173
+ "trip itinerary": 72,
174
  "trip link": 38,
175
  "trip location": 28,
176
  "trip travel": 29,
177
+ "trip unstructured_information": 77,
178
+ "type probability": 30,
179
+ "unstructured_information link": 64,
180
+ "unstructured_information unstructured_information": 69
181
  },
182
  "layer_norm_eps": 1e-07,
183
  "max_position_embeddings": 512,
 
200
  "relative_attention": true,
201
  "share_att_key": true,
202
  "torch_dtype": "float32",
203
+ "transformers_version": "4.40.0",
204
  "type_vocab_size": 0,
205
+ "vocab_size": 128065
206
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:983357b818a670c1c502a4b4f1486da0c8f5956db1e473b6bdcc60659f5a61ac
3
- size 567641820
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2625c33201b52b0ff6473145ede9473741895334b759fec91ec70e8eb53cf19
3
+ size 567740204
runs/Apr30_01-56-37_93720833cc24/events.out.tfevents.1714442226.93720833cc24.1740.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22ffeb3444005de22d75f10d05ea9027c2014e4f3e10f707be85cb647a40d382
3
+ size 10629
tokenizer.json CHANGED
@@ -86,7 +86,7 @@
86
  },
87
  {
88
  "id": 128005,
89
- "content": "<arrival location>",
90
  "single_word": false,
91
  "lstrip": false,
92
  "rstrip": false,
@@ -95,7 +95,7 @@
95
  },
96
  {
97
  "id": 128006,
98
- "content": "</arrival location>",
99
  "single_word": false,
100
  "lstrip": false,
101
  "rstrip": false,
@@ -158,7 +158,7 @@
158
  },
159
  {
160
  "id": 128013,
161
- "content": "<itenerary>",
162
  "single_word": false,
163
  "lstrip": false,
164
  "rstrip": false,
@@ -167,7 +167,7 @@
167
  },
168
  {
169
  "id": 128014,
170
- "content": "</itenerary>",
171
  "single_word": false,
172
  "lstrip": false,
173
  "rstrip": false,
@@ -176,7 +176,7 @@
176
  },
177
  {
178
  "id": 128015,
179
- "content": "<location>",
180
  "single_word": false,
181
  "lstrip": false,
182
  "rstrip": false,
@@ -185,7 +185,7 @@
185
  },
186
  {
187
  "id": 128016,
188
- "content": "</location>",
189
  "single_word": false,
190
  "lstrip": false,
191
  "rstrip": false,
@@ -194,7 +194,7 @@
194
  },
195
  {
196
  "id": 128017,
197
- "content": "<sender>",
198
  "single_word": false,
199
  "lstrip": false,
200
  "rstrip": false,
@@ -203,7 +203,7 @@
203
  },
204
  {
205
  "id": 128018,
206
- "content": "</sender>",
207
  "single_word": false,
208
  "lstrip": false,
209
  "rstrip": false,
@@ -212,7 +212,7 @@
212
  },
213
  {
214
  "id": 128019,
215
- "content": "<time>",
216
  "single_word": false,
217
  "lstrip": false,
218
  "rstrip": false,
@@ -221,7 +221,7 @@
221
  },
222
  {
223
  "id": 128020,
224
- "content": "</time>",
225
  "single_word": false,
226
  "lstrip": false,
227
  "rstrip": false,
@@ -230,7 +230,7 @@
230
  },
231
  {
232
  "id": 128021,
233
- "content": "<planner>",
234
  "single_word": false,
235
  "lstrip": false,
236
  "rstrip": false,
@@ -239,7 +239,7 @@
239
  },
240
  {
241
  "id": 128022,
242
- "content": "</planner>",
243
  "single_word": false,
244
  "lstrip": false,
245
  "rstrip": false,
@@ -248,7 +248,7 @@
248
  },
249
  {
250
  "id": 128023,
251
- "content": "<itinerary>",
252
  "single_word": false,
253
  "lstrip": false,
254
  "rstrip": false,
@@ -257,7 +257,7 @@
257
  },
258
  {
259
  "id": 128024,
260
- "content": "</itinerary>",
261
  "single_word": false,
262
  "lstrip": false,
263
  "rstrip": false,
@@ -266,7 +266,7 @@
266
  },
267
  {
268
  "id": 128025,
269
- "content": "<seat>",
270
  "single_word": false,
271
  "lstrip": false,
272
  "rstrip": false,
@@ -275,7 +275,7 @@
275
  },
276
  {
277
  "id": 128026,
278
- "content": "</seat>",
279
  "single_word": false,
280
  "lstrip": false,
281
  "rstrip": false,
@@ -284,7 +284,7 @@
284
  },
285
  {
286
  "id": 128027,
287
- "content": "<address>",
288
  "single_word": false,
289
  "lstrip": false,
290
  "rstrip": false,
@@ -293,7 +293,7 @@
293
  },
294
  {
295
  "id": 128028,
296
- "content": "</address>",
297
  "single_word": false,
298
  "lstrip": false,
299
  "rstrip": false,
@@ -302,7 +302,7 @@
302
  },
303
  {
304
  "id": 128029,
305
- "content": "<thing_needed>",
306
  "single_word": false,
307
  "lstrip": false,
308
  "rstrip": false,
@@ -311,7 +311,7 @@
311
  },
312
  {
313
  "id": 128030,
314
- "content": "</thing_needed>",
315
  "single_word": false,
316
  "lstrip": false,
317
  "rstrip": false,
@@ -320,7 +320,7 @@
320
  },
321
  {
322
  "id": 128031,
323
- "content": "<travel>",
324
  "single_word": false,
325
  "lstrip": false,
326
  "rstrip": false,
@@ -329,7 +329,7 @@
329
  },
330
  {
331
  "id": 128032,
332
- "content": "</travel>",
333
  "single_word": false,
334
  "lstrip": false,
335
  "rstrip": false,
@@ -338,7 +338,7 @@
338
  },
339
  {
340
  "id": 128033,
341
- "content": "<type>",
342
  "single_word": false,
343
  "lstrip": false,
344
  "rstrip": false,
@@ -347,7 +347,7 @@
347
  },
348
  {
349
  "id": 128034,
350
- "content": "</type>",
351
  "single_word": false,
352
  "lstrip": false,
353
  "rstrip": false,
@@ -356,7 +356,7 @@
356
  },
357
  {
358
  "id": 128035,
359
- "content": "<link>",
360
  "single_word": false,
361
  "lstrip": false,
362
  "rstrip": false,
@@ -365,7 +365,7 @@
365
  },
366
  {
367
  "id": 128036,
368
- "content": "</link>",
369
  "single_word": false,
370
  "lstrip": false,
371
  "rstrip": false,
@@ -374,7 +374,7 @@
374
  },
375
  {
376
  "id": 128037,
377
- "content": "<trip>",
378
  "single_word": false,
379
  "lstrip": false,
380
  "rstrip": false,
@@ -383,7 +383,7 @@
383
  },
384
  {
385
  "id": 128038,
386
- "content": "</trip>",
387
  "single_word": false,
388
  "lstrip": false,
389
  "rstrip": false,
@@ -392,7 +392,7 @@
392
  },
393
  {
394
  "id": 128039,
395
- "content": "<occupancy>",
396
  "single_word": false,
397
  "lstrip": false,
398
  "rstrip": false,
@@ -401,7 +401,7 @@
401
  },
402
  {
403
  "id": 128040,
404
- "content": "</occupancy>",
405
  "single_word": false,
406
  "lstrip": false,
407
  "rstrip": false,
@@ -410,7 +410,7 @@
410
  },
411
  {
412
  "id": 128041,
413
- "content": "<access_instructions>",
414
  "single_word": false,
415
  "lstrip": false,
416
  "rstrip": false,
@@ -419,7 +419,7 @@
419
  },
420
  {
421
  "id": 128042,
422
- "content": "</access_instructions>",
423
  "single_word": false,
424
  "lstrip": false,
425
  "rstrip": false,
@@ -428,7 +428,7 @@
428
  },
429
  {
430
  "id": 128043,
431
- "content": "<probability>",
432
  "single_word": false,
433
  "lstrip": false,
434
  "rstrip": false,
@@ -437,7 +437,7 @@
437
  },
438
  {
439
  "id": 128044,
440
- "content": "</probability>",
441
  "single_word": false,
442
  "lstrip": false,
443
  "rstrip": false,
@@ -446,7 +446,7 @@
446
  },
447
  {
448
  "id": 128045,
449
- "content": "<flight_type>",
450
  "single_word": false,
451
  "lstrip": false,
452
  "rstrip": false,
@@ -455,7 +455,7 @@
455
  },
456
  {
457
  "id": 128046,
458
- "content": "</flight_type>",
459
  "single_word": false,
460
  "lstrip": false,
461
  "rstrip": false,
@@ -464,7 +464,7 @@
464
  },
465
  {
466
  "id": 128047,
467
- "content": "<person>",
468
  "single_word": false,
469
  "lstrip": false,
470
  "rstrip": false,
@@ -473,7 +473,7 @@
473
  },
474
  {
475
  "id": 128048,
476
- "content": "</person>",
477
  "single_word": false,
478
  "lstrip": false,
479
  "rstrip": false,
@@ -482,7 +482,7 @@
482
  },
483
  {
484
  "id": 128049,
485
- "content": "<availability>",
486
  "single_word": false,
487
  "lstrip": false,
488
  "rstrip": false,
@@ -491,7 +491,7 @@
491
  },
492
  {
493
  "id": 128050,
494
- "content": "</availability>",
495
  "single_word": false,
496
  "lstrip": false,
497
  "rstrip": false,
@@ -500,7 +500,7 @@
500
  },
501
  {
502
  "id": 128051,
503
- "content": "<pickup_location>",
504
  "single_word": false,
505
  "lstrip": false,
506
  "rstrip": false,
@@ -509,7 +509,115 @@
509
  },
510
  {
511
  "id": 128052,
512
- "content": "</pickup_location>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
513
  "single_word": false,
514
  "lstrip": false,
515
  "rstrip": false,
@@ -544,8 +652,8 @@
544
  {
545
  "type": "Metaspace",
546
  "replacement": "▁",
547
- "add_prefix_space": true,
548
- "prepend_scheme": "always"
549
  }
550
  ]
551
  },
@@ -627,8 +735,8 @@
627
  "decoder": {
628
  "type": "Metaspace",
629
  "replacement": "▁",
630
- "add_prefix_space": true,
631
- "prepend_scheme": "always"
632
  },
633
  "model": {
634
  "type": "Unigram",
 
86
  },
87
  {
88
  "id": 128005,
89
+ "content": "<arrival_location>",
90
  "single_word": false,
91
  "lstrip": false,
92
  "rstrip": false,
 
95
  },
96
  {
97
  "id": 128006,
98
+ "content": "</arrival_location>",
99
  "single_word": false,
100
  "lstrip": false,
101
  "rstrip": false,
 
158
  },
159
  {
160
  "id": 128013,
161
+ "content": "<location>",
162
  "single_word": false,
163
  "lstrip": false,
164
  "rstrip": false,
 
167
  },
168
  {
169
  "id": 128014,
170
+ "content": "</location>",
171
  "single_word": false,
172
  "lstrip": false,
173
  "rstrip": false,
 
176
  },
177
  {
178
  "id": 128015,
179
+ "content": "<sender>",
180
  "single_word": false,
181
  "lstrip": false,
182
  "rstrip": false,
 
185
  },
186
  {
187
  "id": 128016,
188
+ "content": "</sender>",
189
  "single_word": false,
190
  "lstrip": false,
191
  "rstrip": false,
 
194
  },
195
  {
196
  "id": 128017,
197
+ "content": "<time>",
198
  "single_word": false,
199
  "lstrip": false,
200
  "rstrip": false,
 
203
  },
204
  {
205
  "id": 128018,
206
+ "content": "</time>",
207
  "single_word": false,
208
  "lstrip": false,
209
  "rstrip": false,
 
212
  },
213
  {
214
  "id": 128019,
215
+ "content": "<planner>",
216
  "single_word": false,
217
  "lstrip": false,
218
  "rstrip": false,
 
221
  },
222
  {
223
  "id": 128020,
224
+ "content": "</planner>",
225
  "single_word": false,
226
  "lstrip": false,
227
  "rstrip": false,
 
230
  },
231
  {
232
  "id": 128021,
233
+ "content": "<itinerary>",
234
  "single_word": false,
235
  "lstrip": false,
236
  "rstrip": false,
 
239
  },
240
  {
241
  "id": 128022,
242
+ "content": "</itinerary>",
243
  "single_word": false,
244
  "lstrip": false,
245
  "rstrip": false,
 
248
  },
249
  {
250
  "id": 128023,
251
+ "content": "<seat>",
252
  "single_word": false,
253
  "lstrip": false,
254
  "rstrip": false,
 
257
  },
258
  {
259
  "id": 128024,
260
+ "content": "</seat>",
261
  "single_word": false,
262
  "lstrip": false,
263
  "rstrip": false,
 
266
  },
267
  {
268
  "id": 128025,
269
+ "content": "<address>",
270
  "single_word": false,
271
  "lstrip": false,
272
  "rstrip": false,
 
275
  },
276
  {
277
  "id": 128026,
278
+ "content": "</address>",
279
  "single_word": false,
280
  "lstrip": false,
281
  "rstrip": false,
 
284
  },
285
  {
286
  "id": 128027,
287
+ "content": "<thing_needed>",
288
  "single_word": false,
289
  "lstrip": false,
290
  "rstrip": false,
 
293
  },
294
  {
295
  "id": 128028,
296
+ "content": "</thing_needed>",
297
  "single_word": false,
298
  "lstrip": false,
299
  "rstrip": false,
 
302
  },
303
  {
304
  "id": 128029,
305
+ "content": "<travel>",
306
  "single_word": false,
307
  "lstrip": false,
308
  "rstrip": false,
 
311
  },
312
  {
313
  "id": 128030,
314
+ "content": "</travel>",
315
  "single_word": false,
316
  "lstrip": false,
317
  "rstrip": false,
 
320
  },
321
  {
322
  "id": 128031,
323
+ "content": "<type>",
324
  "single_word": false,
325
  "lstrip": false,
326
  "rstrip": false,
 
329
  },
330
  {
331
  "id": 128032,
332
+ "content": "</type>",
333
  "single_word": false,
334
  "lstrip": false,
335
  "rstrip": false,
 
338
  },
339
  {
340
  "id": 128033,
341
+ "content": "<link>",
342
  "single_word": false,
343
  "lstrip": false,
344
  "rstrip": false,
 
347
  },
348
  {
349
  "id": 128034,
350
+ "content": "</link>",
351
  "single_word": false,
352
  "lstrip": false,
353
  "rstrip": false,
 
356
  },
357
  {
358
  "id": 128035,
359
+ "content": "<trip>",
360
  "single_word": false,
361
  "lstrip": false,
362
  "rstrip": false,
 
365
  },
366
  {
367
  "id": 128036,
368
+ "content": "</trip>",
369
  "single_word": false,
370
  "lstrip": false,
371
  "rstrip": false,
 
374
  },
375
  {
376
  "id": 128037,
377
+ "content": "<occupancy>",
378
  "single_word": false,
379
  "lstrip": false,
380
  "rstrip": false,
 
383
  },
384
  {
385
  "id": 128038,
386
+ "content": "</occupancy>",
387
  "single_word": false,
388
  "lstrip": false,
389
  "rstrip": false,
 
392
  },
393
  {
394
  "id": 128039,
395
+ "content": "<access_instructions>",
396
  "single_word": false,
397
  "lstrip": false,
398
  "rstrip": false,
 
401
  },
402
  {
403
  "id": 128040,
404
+ "content": "</access_instructions>",
405
  "single_word": false,
406
  "lstrip": false,
407
  "rstrip": false,
 
410
  },
411
  {
412
  "id": 128041,
413
+ "content": "<probability>",
414
  "single_word": false,
415
  "lstrip": false,
416
  "rstrip": false,
 
419
  },
420
  {
421
  "id": 128042,
422
+ "content": "</probability>",
423
  "single_word": false,
424
  "lstrip": false,
425
  "rstrip": false,
 
428
  },
429
  {
430
  "id": 128043,
431
+ "content": "<flight_type>",
432
  "single_word": false,
433
  "lstrip": false,
434
  "rstrip": false,
 
437
  },
438
  {
439
  "id": 128044,
440
+ "content": "</flight_type>",
441
  "single_word": false,
442
  "lstrip": false,
443
  "rstrip": false,
 
446
  },
447
  {
448
  "id": 128045,
449
+ "content": "<person>",
450
  "single_word": false,
451
  "lstrip": false,
452
  "rstrip": false,
 
455
  },
456
  {
457
  "id": 128046,
458
+ "content": "</person>",
459
  "single_word": false,
460
  "lstrip": false,
461
  "rstrip": false,
 
464
  },
465
  {
466
  "id": 128047,
467
+ "content": "<availability>",
468
  "single_word": false,
469
  "lstrip": false,
470
  "rstrip": false,
 
473
  },
474
  {
475
  "id": 128048,
476
+ "content": "</availability>",
477
  "single_word": false,
478
  "lstrip": false,
479
  "rstrip": false,
 
482
  },
483
  {
484
  "id": 128049,
485
+ "content": "<pickup_location>",
486
  "single_word": false,
487
  "lstrip": false,
488
  "rstrip": false,
 
491
  },
492
  {
493
  "id": 128050,
494
+ "content": "</pickup_location>",
495
  "single_word": false,
496
  "lstrip": false,
497
  "rstrip": false,
 
500
  },
501
  {
502
  "id": 128051,
503
+ "content": "<unstructured_information>",
504
  "single_word": false,
505
  "lstrip": false,
506
  "rstrip": false,
 
509
  },
510
  {
511
  "id": 128052,
512
+ "content": "</unstructured_information>",
513
+ "single_word": false,
514
+ "lstrip": false,
515
+ "rstrip": false,
516
+ "normalized": true,
517
+ "special": false
518
+ },
519
+ {
520
+ "id": 128053,
521
+ "content": "<preference>",
522
+ "single_word": false,
523
+ "lstrip": false,
524
+ "rstrip": false,
525
+ "normalized": true,
526
+ "special": false
527
+ },
528
+ {
529
+ "id": 128054,
530
+ "content": "</preference>",
531
+ "single_word": false,
532
+ "lstrip": false,
533
+ "rstrip": false,
534
+ "normalized": true,
535
+ "special": false
536
+ },
537
+ {
538
+ "id": 128055,
539
+ "content": "<check_in_date>",
540
+ "single_word": false,
541
+ "lstrip": false,
542
+ "rstrip": false,
543
+ "normalized": true,
544
+ "special": false
545
+ },
546
+ {
547
+ "id": 128056,
548
+ "content": "</check_in_date>",
549
+ "single_word": false,
550
+ "lstrip": false,
551
+ "rstrip": false,
552
+ "normalized": true,
553
+ "special": false
554
+ },
555
+ {
556
+ "id": 128057,
557
+ "content": "<participants>",
558
+ "single_word": false,
559
+ "lstrip": false,
560
+ "rstrip": false,
561
+ "normalized": true,
562
+ "special": false
563
+ },
564
+ {
565
+ "id": 128058,
566
+ "content": "</participants>",
567
+ "single_word": false,
568
+ "lstrip": false,
569
+ "rstrip": false,
570
+ "normalized": true,
571
+ "special": false
572
+ },
573
+ {
574
+ "id": 128059,
575
+ "content": "<chat_title>",
576
+ "single_word": false,
577
+ "lstrip": false,
578
+ "rstrip": false,
579
+ "normalized": true,
580
+ "special": false
581
+ },
582
+ {
583
+ "id": 128060,
584
+ "content": "</chat_title>",
585
+ "single_word": false,
586
+ "lstrip": false,
587
+ "rstrip": false,
588
+ "normalized": true,
589
+ "special": false
590
+ },
591
+ {
592
+ "id": 128061,
593
+ "content": "<readable_date>",
594
+ "single_word": false,
595
+ "lstrip": false,
596
+ "rstrip": false,
597
+ "normalized": true,
598
+ "special": false
599
+ },
600
+ {
601
+ "id": 128062,
602
+ "content": "</readable_date>",
603
+ "single_word": false,
604
+ "lstrip": false,
605
+ "rstrip": false,
606
+ "normalized": true,
607
+ "special": false
608
+ },
609
+ {
610
+ "id": 128063,
611
+ "content": "<metadata>",
612
+ "single_word": false,
613
+ "lstrip": false,
614
+ "rstrip": false,
615
+ "normalized": true,
616
+ "special": false
617
+ },
618
+ {
619
+ "id": 128064,
620
+ "content": "</metadata>",
621
  "single_word": false,
622
  "lstrip": false,
623
  "rstrip": false,
 
652
  {
653
  "type": "Metaspace",
654
  "replacement": "▁",
655
+ "prepend_scheme": "always",
656
+ "split": true
657
  }
658
  ]
659
  },
 
735
  "decoder": {
736
  "type": "Metaspace",
737
  "replacement": "▁",
738
+ "prepend_scheme": "always",
739
+ "split": true
740
  },
741
  "model": {
742
  "type": "Unigram",
tokenizer_config.json CHANGED
@@ -73,7 +73,7 @@
73
  "special": false
74
  },
75
  "128005": {
76
- "content": "<arrival location>",
77
  "lstrip": false,
78
  "normalized": true,
79
  "rstrip": false,
@@ -81,7 +81,7 @@
81
  "special": false
82
  },
83
  "128006": {
84
- "content": "</arrival location>",
85
  "lstrip": false,
86
  "normalized": true,
87
  "rstrip": false,
@@ -137,7 +137,7 @@
137
  "special": false
138
  },
139
  "128013": {
140
- "content": "<itenerary>",
141
  "lstrip": false,
142
  "normalized": true,
143
  "rstrip": false,
@@ -145,7 +145,7 @@
145
  "special": false
146
  },
147
  "128014": {
148
- "content": "</itenerary>",
149
  "lstrip": false,
150
  "normalized": true,
151
  "rstrip": false,
@@ -153,7 +153,7 @@
153
  "special": false
154
  },
155
  "128015": {
156
- "content": "<location>",
157
  "lstrip": false,
158
  "normalized": true,
159
  "rstrip": false,
@@ -161,7 +161,7 @@
161
  "special": false
162
  },
163
  "128016": {
164
- "content": "</location>",
165
  "lstrip": false,
166
  "normalized": true,
167
  "rstrip": false,
@@ -169,7 +169,7 @@
169
  "special": false
170
  },
171
  "128017": {
172
- "content": "<sender>",
173
  "lstrip": false,
174
  "normalized": true,
175
  "rstrip": false,
@@ -177,7 +177,7 @@
177
  "special": false
178
  },
179
  "128018": {
180
- "content": "</sender>",
181
  "lstrip": false,
182
  "normalized": true,
183
  "rstrip": false,
@@ -185,7 +185,7 @@
185
  "special": false
186
  },
187
  "128019": {
188
- "content": "<time>",
189
  "lstrip": false,
190
  "normalized": true,
191
  "rstrip": false,
@@ -193,7 +193,7 @@
193
  "special": false
194
  },
195
  "128020": {
196
- "content": "</time>",
197
  "lstrip": false,
198
  "normalized": true,
199
  "rstrip": false,
@@ -201,7 +201,7 @@
201
  "special": false
202
  },
203
  "128021": {
204
- "content": "<planner>",
205
  "lstrip": false,
206
  "normalized": true,
207
  "rstrip": false,
@@ -209,7 +209,7 @@
209
  "special": false
210
  },
211
  "128022": {
212
- "content": "</planner>",
213
  "lstrip": false,
214
  "normalized": true,
215
  "rstrip": false,
@@ -217,7 +217,7 @@
217
  "special": false
218
  },
219
  "128023": {
220
- "content": "<itinerary>",
221
  "lstrip": false,
222
  "normalized": true,
223
  "rstrip": false,
@@ -225,7 +225,7 @@
225
  "special": false
226
  },
227
  "128024": {
228
- "content": "</itinerary>",
229
  "lstrip": false,
230
  "normalized": true,
231
  "rstrip": false,
@@ -233,7 +233,7 @@
233
  "special": false
234
  },
235
  "128025": {
236
- "content": "<seat>",
237
  "lstrip": false,
238
  "normalized": true,
239
  "rstrip": false,
@@ -241,7 +241,7 @@
241
  "special": false
242
  },
243
  "128026": {
244
- "content": "</seat>",
245
  "lstrip": false,
246
  "normalized": true,
247
  "rstrip": false,
@@ -249,7 +249,7 @@
249
  "special": false
250
  },
251
  "128027": {
252
- "content": "<address>",
253
  "lstrip": false,
254
  "normalized": true,
255
  "rstrip": false,
@@ -257,7 +257,7 @@
257
  "special": false
258
  },
259
  "128028": {
260
- "content": "</address>",
261
  "lstrip": false,
262
  "normalized": true,
263
  "rstrip": false,
@@ -265,7 +265,7 @@
265
  "special": false
266
  },
267
  "128029": {
268
- "content": "<thing_needed>",
269
  "lstrip": false,
270
  "normalized": true,
271
  "rstrip": false,
@@ -273,7 +273,7 @@
273
  "special": false
274
  },
275
  "128030": {
276
- "content": "</thing_needed>",
277
  "lstrip": false,
278
  "normalized": true,
279
  "rstrip": false,
@@ -281,7 +281,7 @@
281
  "special": false
282
  },
283
  "128031": {
284
- "content": "<travel>",
285
  "lstrip": false,
286
  "normalized": true,
287
  "rstrip": false,
@@ -289,7 +289,7 @@
289
  "special": false
290
  },
291
  "128032": {
292
- "content": "</travel>",
293
  "lstrip": false,
294
  "normalized": true,
295
  "rstrip": false,
@@ -297,7 +297,7 @@
297
  "special": false
298
  },
299
  "128033": {
300
- "content": "<type>",
301
  "lstrip": false,
302
  "normalized": true,
303
  "rstrip": false,
@@ -305,7 +305,7 @@
305
  "special": false
306
  },
307
  "128034": {
308
- "content": "</type>",
309
  "lstrip": false,
310
  "normalized": true,
311
  "rstrip": false,
@@ -313,7 +313,7 @@
313
  "special": false
314
  },
315
  "128035": {
316
- "content": "<link>",
317
  "lstrip": false,
318
  "normalized": true,
319
  "rstrip": false,
@@ -321,7 +321,7 @@
321
  "special": false
322
  },
323
  "128036": {
324
- "content": "</link>",
325
  "lstrip": false,
326
  "normalized": true,
327
  "rstrip": false,
@@ -329,7 +329,7 @@
329
  "special": false
330
  },
331
  "128037": {
332
- "content": "<trip>",
333
  "lstrip": false,
334
  "normalized": true,
335
  "rstrip": false,
@@ -337,7 +337,7 @@
337
  "special": false
338
  },
339
  "128038": {
340
- "content": "</trip>",
341
  "lstrip": false,
342
  "normalized": true,
343
  "rstrip": false,
@@ -345,7 +345,7 @@
345
  "special": false
346
  },
347
  "128039": {
348
- "content": "<occupancy>",
349
  "lstrip": false,
350
  "normalized": true,
351
  "rstrip": false,
@@ -353,7 +353,7 @@
353
  "special": false
354
  },
355
  "128040": {
356
- "content": "</occupancy>",
357
  "lstrip": false,
358
  "normalized": true,
359
  "rstrip": false,
@@ -361,7 +361,7 @@
361
  "special": false
362
  },
363
  "128041": {
364
- "content": "<access_instructions>",
365
  "lstrip": false,
366
  "normalized": true,
367
  "rstrip": false,
@@ -369,7 +369,7 @@
369
  "special": false
370
  },
371
  "128042": {
372
- "content": "</access_instructions>",
373
  "lstrip": false,
374
  "normalized": true,
375
  "rstrip": false,
@@ -377,7 +377,7 @@
377
  "special": false
378
  },
379
  "128043": {
380
- "content": "<probability>",
381
  "lstrip": false,
382
  "normalized": true,
383
  "rstrip": false,
@@ -385,7 +385,7 @@
385
  "special": false
386
  },
387
  "128044": {
388
- "content": "</probability>",
389
  "lstrip": false,
390
  "normalized": true,
391
  "rstrip": false,
@@ -393,7 +393,7 @@
393
  "special": false
394
  },
395
  "128045": {
396
- "content": "<flight_type>",
397
  "lstrip": false,
398
  "normalized": true,
399
  "rstrip": false,
@@ -401,7 +401,7 @@
401
  "special": false
402
  },
403
  "128046": {
404
- "content": "</flight_type>",
405
  "lstrip": false,
406
  "normalized": true,
407
  "rstrip": false,
@@ -409,7 +409,7 @@
409
  "special": false
410
  },
411
  "128047": {
412
- "content": "<person>",
413
  "lstrip": false,
414
  "normalized": true,
415
  "rstrip": false,
@@ -417,7 +417,7 @@
417
  "special": false
418
  },
419
  "128048": {
420
- "content": "</person>",
421
  "lstrip": false,
422
  "normalized": true,
423
  "rstrip": false,
@@ -425,7 +425,7 @@
425
  "special": false
426
  },
427
  "128049": {
428
- "content": "<availability>",
429
  "lstrip": false,
430
  "normalized": true,
431
  "rstrip": false,
@@ -433,7 +433,7 @@
433
  "special": false
434
  },
435
  "128050": {
436
- "content": "</availability>",
437
  "lstrip": false,
438
  "normalized": true,
439
  "rstrip": false,
@@ -441,7 +441,7 @@
441
  "special": false
442
  },
443
  "128051": {
444
- "content": "<pickup_location>",
445
  "lstrip": false,
446
  "normalized": true,
447
  "rstrip": false,
@@ -449,7 +449,103 @@
449
  "special": false
450
  },
451
  "128052": {
452
- "content": "</pickup_location>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
453
  "lstrip": false,
454
  "normalized": true,
455
  "rstrip": false,
 
73
  "special": false
74
  },
75
  "128005": {
76
+ "content": "<arrival_location>",
77
  "lstrip": false,
78
  "normalized": true,
79
  "rstrip": false,
 
81
  "special": false
82
  },
83
  "128006": {
84
+ "content": "</arrival_location>",
85
  "lstrip": false,
86
  "normalized": true,
87
  "rstrip": false,
 
137
  "special": false
138
  },
139
  "128013": {
140
+ "content": "<location>",
141
  "lstrip": false,
142
  "normalized": true,
143
  "rstrip": false,
 
145
  "special": false
146
  },
147
  "128014": {
148
+ "content": "</location>",
149
  "lstrip": false,
150
  "normalized": true,
151
  "rstrip": false,
 
153
  "special": false
154
  },
155
  "128015": {
156
+ "content": "<sender>",
157
  "lstrip": false,
158
  "normalized": true,
159
  "rstrip": false,
 
161
  "special": false
162
  },
163
  "128016": {
164
+ "content": "</sender>",
165
  "lstrip": false,
166
  "normalized": true,
167
  "rstrip": false,
 
169
  "special": false
170
  },
171
  "128017": {
172
+ "content": "<time>",
173
  "lstrip": false,
174
  "normalized": true,
175
  "rstrip": false,
 
177
  "special": false
178
  },
179
  "128018": {
180
+ "content": "</time>",
181
  "lstrip": false,
182
  "normalized": true,
183
  "rstrip": false,
 
185
  "special": false
186
  },
187
  "128019": {
188
+ "content": "<planner>",
189
  "lstrip": false,
190
  "normalized": true,
191
  "rstrip": false,
 
193
  "special": false
194
  },
195
  "128020": {
196
+ "content": "</planner>",
197
  "lstrip": false,
198
  "normalized": true,
199
  "rstrip": false,
 
201
  "special": false
202
  },
203
  "128021": {
204
+ "content": "<itinerary>",
205
  "lstrip": false,
206
  "normalized": true,
207
  "rstrip": false,
 
209
  "special": false
210
  },
211
  "128022": {
212
+ "content": "</itinerary>",
213
  "lstrip": false,
214
  "normalized": true,
215
  "rstrip": false,
 
217
  "special": false
218
  },
219
  "128023": {
220
+ "content": "<seat>",
221
  "lstrip": false,
222
  "normalized": true,
223
  "rstrip": false,
 
225
  "special": false
226
  },
227
  "128024": {
228
+ "content": "</seat>",
229
  "lstrip": false,
230
  "normalized": true,
231
  "rstrip": false,
 
233
  "special": false
234
  },
235
  "128025": {
236
+ "content": "<address>",
237
  "lstrip": false,
238
  "normalized": true,
239
  "rstrip": false,
 
241
  "special": false
242
  },
243
  "128026": {
244
+ "content": "</address>",
245
  "lstrip": false,
246
  "normalized": true,
247
  "rstrip": false,
 
249
  "special": false
250
  },
251
  "128027": {
252
+ "content": "<thing_needed>",
253
  "lstrip": false,
254
  "normalized": true,
255
  "rstrip": false,
 
257
  "special": false
258
  },
259
  "128028": {
260
+ "content": "</thing_needed>",
261
  "lstrip": false,
262
  "normalized": true,
263
  "rstrip": false,
 
265
  "special": false
266
  },
267
  "128029": {
268
+ "content": "<travel>",
269
  "lstrip": false,
270
  "normalized": true,
271
  "rstrip": false,
 
273
  "special": false
274
  },
275
  "128030": {
276
+ "content": "</travel>",
277
  "lstrip": false,
278
  "normalized": true,
279
  "rstrip": false,
 
281
  "special": false
282
  },
283
  "128031": {
284
+ "content": "<type>",
285
  "lstrip": false,
286
  "normalized": true,
287
  "rstrip": false,
 
289
  "special": false
290
  },
291
  "128032": {
292
+ "content": "</type>",
293
  "lstrip": false,
294
  "normalized": true,
295
  "rstrip": false,
 
297
  "special": false
298
  },
299
  "128033": {
300
+ "content": "<link>",
301
  "lstrip": false,
302
  "normalized": true,
303
  "rstrip": false,
 
305
  "special": false
306
  },
307
  "128034": {
308
+ "content": "</link>",
309
  "lstrip": false,
310
  "normalized": true,
311
  "rstrip": false,
 
313
  "special": false
314
  },
315
  "128035": {
316
+ "content": "<trip>",
317
  "lstrip": false,
318
  "normalized": true,
319
  "rstrip": false,
 
321
  "special": false
322
  },
323
  "128036": {
324
+ "content": "</trip>",
325
  "lstrip": false,
326
  "normalized": true,
327
  "rstrip": false,
 
329
  "special": false
330
  },
331
  "128037": {
332
+ "content": "<occupancy>",
333
  "lstrip": false,
334
  "normalized": true,
335
  "rstrip": false,
 
337
  "special": false
338
  },
339
  "128038": {
340
+ "content": "</occupancy>",
341
  "lstrip": false,
342
  "normalized": true,
343
  "rstrip": false,
 
345
  "special": false
346
  },
347
  "128039": {
348
+ "content": "<access_instructions>",
349
  "lstrip": false,
350
  "normalized": true,
351
  "rstrip": false,
 
353
  "special": false
354
  },
355
  "128040": {
356
+ "content": "</access_instructions>",
357
  "lstrip": false,
358
  "normalized": true,
359
  "rstrip": false,
 
361
  "special": false
362
  },
363
  "128041": {
364
+ "content": "<probability>",
365
  "lstrip": false,
366
  "normalized": true,
367
  "rstrip": false,
 
369
  "special": false
370
  },
371
  "128042": {
372
+ "content": "</probability>",
373
  "lstrip": false,
374
  "normalized": true,
375
  "rstrip": false,
 
377
  "special": false
378
  },
379
  "128043": {
380
+ "content": "<flight_type>",
381
  "lstrip": false,
382
  "normalized": true,
383
  "rstrip": false,
 
385
  "special": false
386
  },
387
  "128044": {
388
+ "content": "</flight_type>",
389
  "lstrip": false,
390
  "normalized": true,
391
  "rstrip": false,
 
393
  "special": false
394
  },
395
  "128045": {
396
+ "content": "<person>",
397
  "lstrip": false,
398
  "normalized": true,
399
  "rstrip": false,
 
401
  "special": false
402
  },
403
  "128046": {
404
+ "content": "</person>",
405
  "lstrip": false,
406
  "normalized": true,
407
  "rstrip": false,
 
409
  "special": false
410
  },
411
  "128047": {
412
+ "content": "<availability>",
413
  "lstrip": false,
414
  "normalized": true,
415
  "rstrip": false,
 
417
  "special": false
418
  },
419
  "128048": {
420
+ "content": "</availability>",
421
  "lstrip": false,
422
  "normalized": true,
423
  "rstrip": false,
 
425
  "special": false
426
  },
427
  "128049": {
428
+ "content": "<pickup_location>",
429
  "lstrip": false,
430
  "normalized": true,
431
  "rstrip": false,
 
433
  "special": false
434
  },
435
  "128050": {
436
+ "content": "</pickup_location>",
437
  "lstrip": false,
438
  "normalized": true,
439
  "rstrip": false,
 
441
  "special": false
442
  },
443
  "128051": {
444
+ "content": "<unstructured_information>",
445
  "lstrip": false,
446
  "normalized": true,
447
  "rstrip": false,
 
449
  "special": false
450
  },
451
  "128052": {
452
+ "content": "</unstructured_information>",
453
+ "lstrip": false,
454
+ "normalized": true,
455
+ "rstrip": false,
456
+ "single_word": false,
457
+ "special": false
458
+ },
459
+ "128053": {
460
+ "content": "<preference>",
461
+ "lstrip": false,
462
+ "normalized": true,
463
+ "rstrip": false,
464
+ "single_word": false,
465
+ "special": false
466
+ },
467
+ "128054": {
468
+ "content": "</preference>",
469
+ "lstrip": false,
470
+ "normalized": true,
471
+ "rstrip": false,
472
+ "single_word": false,
473
+ "special": false
474
+ },
475
+ "128055": {
476
+ "content": "<check_in_date>",
477
+ "lstrip": false,
478
+ "normalized": true,
479
+ "rstrip": false,
480
+ "single_word": false,
481
+ "special": false
482
+ },
483
+ "128056": {
484
+ "content": "</check_in_date>",
485
+ "lstrip": false,
486
+ "normalized": true,
487
+ "rstrip": false,
488
+ "single_word": false,
489
+ "special": false
490
+ },
491
+ "128057": {
492
+ "content": "<participants>",
493
+ "lstrip": false,
494
+ "normalized": true,
495
+ "rstrip": false,
496
+ "single_word": false,
497
+ "special": false
498
+ },
499
+ "128058": {
500
+ "content": "</participants>",
501
+ "lstrip": false,
502
+ "normalized": true,
503
+ "rstrip": false,
504
+ "single_word": false,
505
+ "special": false
506
+ },
507
+ "128059": {
508
+ "content": "<chat_title>",
509
+ "lstrip": false,
510
+ "normalized": true,
511
+ "rstrip": false,
512
+ "single_word": false,
513
+ "special": false
514
+ },
515
+ "128060": {
516
+ "content": "</chat_title>",
517
+ "lstrip": false,
518
+ "normalized": true,
519
+ "rstrip": false,
520
+ "single_word": false,
521
+ "special": false
522
+ },
523
+ "128061": {
524
+ "content": "<readable_date>",
525
+ "lstrip": false,
526
+ "normalized": true,
527
+ "rstrip": false,
528
+ "single_word": false,
529
+ "special": false
530
+ },
531
+ "128062": {
532
+ "content": "</readable_date>",
533
+ "lstrip": false,
534
+ "normalized": true,
535
+ "rstrip": false,
536
+ "single_word": false,
537
+ "special": false
538
+ },
539
+ "128063": {
540
+ "content": "<metadata>",
541
+ "lstrip": false,
542
+ "normalized": true,
543
+ "rstrip": false,
544
+ "single_word": false,
545
+ "special": false
546
+ },
547
+ "128064": {
548
+ "content": "</metadata>",
549
  "lstrip": false,
550
  "normalized": true,
551
  "rstrip": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:425f276aadfa8dc84a5025bdb68eaa9b59e4d39235576178acdadc1631853855
3
- size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05b0cf070846a9c433d551fe47d44fabbb3d940bb18dd0ca9c6b6fbcc3191207
3
+ size 4984