Xenova HF staff committed on
Commit
7e875f6
·
1 Parent(s): 0e6ebb2

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -54,7 +54,7 @@
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
- "transformers_version": "4.32.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 58930
60
  }
 
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
+ "transformers_version": "4.34.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 58930
60
  }
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_from_model_config": true,
3
  "bad_words_ids": [
4
  [
5
  58929
@@ -12,5 +11,6 @@
12
  "max_length": 512,
13
  "num_beams": 4,
14
  "pad_token_id": 58929,
15
- "transformers_version": "4.32.0.dev0"
 
16
  }
 
1
  {
 
2
  "bad_words_ids": [
3
  [
4
  58929
 
11
  "max_length": 512,
12
  "num_beams": 4,
13
  "pad_token_id": 58929,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.34.0.dev0"
16
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bf78600380cd8c473dc037345641ac4a4cfa25c1885bb47723f63863ede2a84
3
- size 343834560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82f35d3553063d2cebc078473e419e38bd97f8a4ac86eace975ec14060ff2287
3
+ size 223145977
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91b188f95a7ebdbc056629202341a90c0c67adb481c5d6b0cbf47ec692292f4c
3
- size 344070042
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c09f5c5381cf2f70447d9c6a93b3f473ed429e0cb4ae9b53e7aab7256a900e44
3
+ size 223381544
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54446c39dc6c677f6942d471d0209dd7fa369afe61fab3b1377a2c407caa0cfd
3
- size 87548390
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e612107b64044539d273234c9baeea724f47d0523156443426cc781bc9834d0
3
+ size 57080168
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bebc52c0eb9526d220abc72ec77141459565c9f8285fc93f2c1a053096b3c509
3
- size 87177034
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a6f5af760f33efd9038bcb805165bf18945cc5eaa547cc69f80d94e627ff282
3
+ size 56709466
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:280b4bd4f9fe0350ce4b98e48971f76aa927a4fe4456911fae6a6cf2e3afabbe
3
- size 331184051
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a93ba4d39bb4f3d0f98660f1615b65f8ac9f19e3b199d2354291fbaf6fad5c59
3
+ size 210495468
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78689e88673cc5f714eb548b49be11ec77e544c4e9ea6e6885ca91267b9f4838
3
- size 83905570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3c98844304366b4db6ca984decde7d11eb14f95ce15cccbdcb02204502a4b67
3
+ size 53438002
quantize_config.json CHANGED
@@ -4,120 +4,120 @@
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
- "Cast",
8
- "Concat",
 
 
 
 
9
  "Softmax",
10
- "Mul",
 
 
 
 
 
 
11
  "Sqrt",
12
- "Sub",
13
  "Shape",
14
- "Unsqueeze",
15
- "MatMul",
16
  "Range",
17
- "Pow",
 
 
18
  "Reshape",
19
- "Gather",
20
- "Expand",
21
  "Transpose",
22
- "ReduceMean",
23
- "Sigmoid",
24
- "Constant",
25
- "ConstantOfShape",
26
- "Equal",
27
- "Where",
28
- "Div",
29
- "Add"
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
- "Cast",
36
- "Concat",
 
 
 
 
37
  "Softmax",
38
- "Mul",
 
 
 
 
 
 
39
  "Sqrt",
40
- "Sub",
41
  "Shape",
42
- "Unsqueeze",
43
- "MatMul",
44
  "Range",
45
- "Pow",
 
 
46
  "Reshape",
47
- "Gather",
48
- "Expand",
49
  "Transpose",
50
- "ReduceMean",
51
- "Sigmoid",
52
- "Constant",
53
- "ConstantOfShape",
54
- "Equal",
55
- "Where",
56
- "Div",
57
- "Add"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
- "decoder_model": {
62
  "op_types": [
63
- "Cast",
64
- "Concat",
 
 
 
 
65
  "Softmax",
66
- "Mul",
67
- "Slice",
 
 
 
 
 
68
  "Sqrt",
69
- "Sub",
70
  "Shape",
71
- "Unsqueeze",
72
- "MatMul",
73
- "Squeeze",
74
  "Range",
75
- "Pow",
 
 
 
76
  "Reshape",
77
- "Gather",
78
- "Expand",
79
  "Transpose",
80
- "ReduceMean",
81
- "Sigmoid",
82
- "Constant",
83
- "ConstantOfShape",
84
  "Less",
85
- "Where",
86
- "Equal",
87
- "Div",
88
- "Add"
89
  ],
90
  "weight_type": "QInt8"
91
  },
92
- "decoder_model_merged": {
93
  "op_types": [
94
- "Cast",
95
- "Concat",
 
 
 
 
96
  "Softmax",
97
- "Mul",
98
- "Slice",
 
 
 
 
 
99
  "Sqrt",
100
- "Sub",
101
  "Shape",
102
- "Unsqueeze",
103
- "MatMul",
104
- "Squeeze",
105
  "Range",
106
- "Pow",
 
 
 
107
  "Reshape",
108
- "Gather",
109
- "Expand",
110
  "Transpose",
111
- "ReduceMean",
112
- "Sigmoid",
113
- "Constant",
114
- "ConstantOfShape",
115
- "If",
116
  "Less",
117
- "Where",
118
- "Equal",
119
- "Div",
120
- "Add"
121
  ],
122
  "weight_type": "QInt8"
123
  }
 
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
+ "MatMul",
8
+ "Div",
9
+ "Sigmoid",
10
+ "Constant",
11
+ "Expand",
12
+ "Sub",
13
  "Softmax",
14
+ "Concat",
15
+ "ReduceMean",
16
+ "Add",
17
+ "Where",
18
+ "Gather",
19
+ "Pow",
20
+ "Unsqueeze",
21
  "Sqrt",
 
22
  "Shape",
 
 
23
  "Range",
24
+ "Equal",
25
+ "ConstantOfShape",
26
+ "Mul",
27
  "Reshape",
 
 
28
  "Transpose",
29
+ "Cast"
 
 
 
 
 
 
 
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
+ "MatMul",
36
+ "Div",
37
+ "Sigmoid",
38
+ "Constant",
39
+ "Expand",
40
+ "Sub",
41
  "Softmax",
42
+ "Concat",
43
+ "ReduceMean",
44
+ "Where",
45
+ "Add",
46
+ "Gather",
47
+ "Pow",
48
+ "Unsqueeze",
49
  "Sqrt",
 
50
  "Shape",
 
 
51
  "Range",
52
+ "Equal",
53
+ "ConstantOfShape",
54
+ "Mul",
55
  "Reshape",
 
 
56
  "Transpose",
57
+ "Cast"
 
 
 
 
 
 
 
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
+ "decoder_model_merged": {
62
  "op_types": [
63
+ "MatMul",
64
+ "Div",
65
+ "Sigmoid",
66
+ "Constant",
67
+ "Expand",
68
+ "Sub",
69
  "Softmax",
70
+ "Concat",
71
+ "ReduceMean",
72
+ "Add",
73
+ "Where",
74
+ "Gather",
75
+ "Pow",
76
+ "Unsqueeze",
77
  "Sqrt",
78
+ "If",
79
  "Shape",
 
 
 
80
  "Range",
81
+ "Squeeze",
82
+ "Equal",
83
+ "ConstantOfShape",
84
+ "Mul",
85
  "Reshape",
86
+ "Slice",
 
87
  "Transpose",
 
 
 
 
88
  "Less",
89
+ "Cast"
 
 
 
90
  ],
91
  "weight_type": "QInt8"
92
  },
93
+ "decoder_model": {
94
  "op_types": [
95
+ "MatMul",
96
+ "Div",
97
+ "Sigmoid",
98
+ "Constant",
99
+ "Expand",
100
+ "Sub",
101
  "Softmax",
102
+ "Concat",
103
+ "ReduceMean",
104
+ "Add",
105
+ "Where",
106
+ "Gather",
107
+ "Pow",
108
+ "Unsqueeze",
109
  "Sqrt",
 
110
  "Shape",
 
 
 
111
  "Range",
112
+ "Squeeze",
113
+ "Equal",
114
+ "ConstantOfShape",
115
+ "Mul",
116
  "Reshape",
117
+ "Slice",
 
118
  "Transpose",
 
 
 
 
 
119
  "Less",
120
+ "Cast"
 
 
 
121
  ],
122
  "weight_type": "QInt8"
123
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff