Xenova HF staff committed on
Commit
26eb644
·
1 Parent(s): a8120a7

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -54,7 +54,7 @@
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
- "transformers_version": "4.32.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 53739
60
  }
 
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
+ "transformers_version": "4.34.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 53739
60
  }
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_from_model_config": true,
3
  "bad_words_ids": [
4
  [
5
  53738
@@ -12,5 +11,6 @@
12
  "max_length": 512,
13
  "num_beams": 6,
14
  "pad_token_id": 53738,
15
- "transformers_version": "4.32.0.dev0"
 
16
  }
 
1
  {
 
2
  "bad_words_ids": [
3
  [
4
  53738
 
11
  "max_length": 512,
12
  "num_beams": 6,
13
  "pad_token_id": 53738,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.34.0.dev0"
16
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a99fb73b7a3934f524662745d11070bb1211f79eb1eb5a70aa097e2082fe393a
3
- size 322551460
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c87e35f60349bfea2fd82c59b5e06d1f8f0fdc77c77d24a00073ddfc7d1007ad
3
+ size 212494045
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7000434b1823a202bdabb4061912fc7cf24e59ce6b8bfd57751758fdcae2ad1b
3
- size 322786942
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0b29e9729f8b2c3467f9601c37bf7a4b490aaca386ac4c7571e8a8190e2e05f
3
+ size 212729612
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80862a4a8821363ed2455cc9d248364efd47e83c901acebc92bccde9e07cbe74
3
- size 82186086
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:540edbcc08bab0b42c03576a759fd9b4d5fc99996ac3178630733916dc2325cb
3
+ size 54401611
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43e9c242c6bfe83143ba529f71ed212d3c3264a94032f75511ed296c920e8e56
3
- size 81814730
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ba31d206ad237dbd35dbf46b9fe4d0368c082fd9e2d0e9603bd709facf4119d
3
+ size 54030909
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:192903fd8b7565b384618f1201530717c68916c02795c9b0ffcb811d700100d9
3
- size 309900951
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29a835ab18a732ac4d6c397ca4d5d3847d0740962763a645884725c1762bde57
3
+ size 199843536
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:646fe7bcb8f72f13cafeffc4a513d1fb2755e66047e9959b67e49eefadb580b5
3
- size 78543266
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c6208549dda986c3e6c24c650aff2b0af973b6d07260a1c8bbf3bbc0a6ad6dd
3
+ size 50759445
quantize_config.json CHANGED
@@ -4,120 +4,120 @@
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
- "Gather",
8
- "Transpose",
9
- "Cast",
10
- "Pow",
11
  "Concat",
 
 
 
12
  "Reshape",
13
- "Expand",
14
- "Constant",
15
- "Mul",
16
  "Sqrt",
17
- "ConstantOfShape",
18
- "Range",
19
- "Unsqueeze",
20
  "Where",
21
- "Sub",
22
- "ReduceMean",
23
- "Softmax",
24
- "Sigmoid",
25
- "Div",
26
- "MatMul",
27
  "Add",
 
 
 
 
 
28
  "Equal",
29
- "Shape"
 
 
 
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
- "Gather",
36
- "Transpose",
37
- "Cast",
38
- "Pow",
39
  "Concat",
 
 
 
40
  "Reshape",
41
- "Expand",
42
- "Constant",
43
- "Mul",
44
  "Sqrt",
45
- "ConstantOfShape",
46
- "Range",
47
- "Unsqueeze",
48
  "Where",
49
- "Sub",
50
- "ReduceMean",
51
- "Softmax",
52
- "Sigmoid",
53
- "Div",
54
- "MatMul",
55
  "Add",
 
 
 
 
 
56
  "Equal",
57
- "Shape"
 
 
 
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
- "decoder_model": {
62
  "op_types": [
63
- "Gather",
64
- "Transpose",
65
- "Cast",
66
- "Pow",
67
  "Concat",
 
 
 
68
  "Reshape",
69
- "Slice",
 
70
  "Squeeze",
71
- "Expand",
72
- "Constant",
73
- "Mul",
74
  "Sqrt",
75
- "ConstantOfShape",
76
- "Range",
77
- "Unsqueeze",
78
  "Where",
79
- "Sub",
80
- "Softmax",
81
- "ReduceMean",
82
- "Sigmoid",
83
- "Div",
84
- "MatMul",
85
  "Add",
 
 
 
 
 
86
  "Less",
87
  "Equal",
88
- "Shape"
 
 
 
 
89
  ],
90
  "weight_type": "QInt8"
91
  },
92
- "decoder_model_merged": {
93
  "op_types": [
94
- "Gather",
95
- "Transpose",
96
- "Cast",
97
- "Pow",
98
  "Concat",
 
 
 
99
  "Reshape",
100
- "Slice",
 
101
  "Squeeze",
102
- "Expand",
103
- "Constant",
104
- "Mul",
105
- "If",
106
  "Sqrt",
107
- "ConstantOfShape",
108
- "Range",
109
- "Unsqueeze",
110
  "Where",
111
- "Sub",
112
- "Softmax",
113
- "ReduceMean",
114
- "Sigmoid",
115
- "Div",
116
- "MatMul",
117
  "Add",
 
 
 
 
118
  "Less",
119
  "Equal",
120
- "Shape"
 
 
 
 
121
  ],
122
  "weight_type": "QInt8"
123
  }
 
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
+ "Sigmoid",
8
+ "Unsqueeze",
9
+ "Range",
 
10
  "Concat",
11
+ "Div",
12
+ "Gather",
13
+ "Shape",
14
  "Reshape",
15
+ "MatMul",
16
+ "Sub",
 
17
  "Sqrt",
 
 
 
18
  "Where",
 
 
 
 
 
 
19
  "Add",
20
+ "Softmax",
21
+ "Transpose",
22
+ "Constant",
23
+ "Mul",
24
+ "Expand",
25
  "Equal",
26
+ "ConstantOfShape",
27
+ "ReduceMean",
28
+ "Pow",
29
+ "Cast"
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
+ "Sigmoid",
36
+ "Unsqueeze",
37
+ "Range",
 
38
  "Concat",
39
+ "Div",
40
+ "Gather",
41
+ "Shape",
42
  "Reshape",
43
+ "MatMul",
44
+ "Sub",
 
45
  "Sqrt",
 
 
 
46
  "Where",
 
 
 
 
 
 
47
  "Add",
48
+ "Softmax",
49
+ "Transpose",
50
+ "Constant",
51
+ "Mul",
52
+ "Expand",
53
  "Equal",
54
+ "ConstantOfShape",
55
+ "ReduceMean",
56
+ "Pow",
57
+ "Cast"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
+ "decoder_model_merged": {
62
  "op_types": [
63
+ "Sigmoid",
64
+ "Unsqueeze",
65
+ "Range",
 
66
  "Concat",
67
+ "Div",
68
+ "Gather",
69
+ "Shape",
70
  "Reshape",
71
+ "MatMul",
72
+ "Sub",
73
  "Squeeze",
74
+ "Slice",
 
 
75
  "Sqrt",
 
 
 
76
  "Where",
 
 
 
 
 
 
77
  "Add",
78
+ "Softmax",
79
+ "Transpose",
80
+ "Constant",
81
+ "If",
82
+ "Mul",
83
  "Less",
84
  "Equal",
85
+ "ConstantOfShape",
86
+ "Expand",
87
+ "ReduceMean",
88
+ "Pow",
89
+ "Cast"
90
  ],
91
  "weight_type": "QInt8"
92
  },
93
+ "decoder_model": {
94
  "op_types": [
95
+ "Sigmoid",
96
+ "Unsqueeze",
97
+ "Range",
 
98
  "Concat",
99
+ "Div",
100
+ "Gather",
101
+ "Shape",
102
  "Reshape",
103
+ "MatMul",
104
+ "Sub",
105
  "Squeeze",
106
+ "Slice",
 
 
 
107
  "Sqrt",
 
 
 
108
  "Where",
 
 
 
 
 
 
109
  "Add",
110
+ "Softmax",
111
+ "Transpose",
112
+ "Constant",
113
+ "Mul",
114
  "Less",
115
  "Equal",
116
+ "ConstantOfShape",
117
+ "Expand",
118
+ "ReduceMean",
119
+ "Pow",
120
+ "Cast"
121
  ],
122
  "weight_type": "QInt8"
123
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff