Upload folder using huggingface_hub

Browse files

Files changed (10)

config.json +1 -1
generation_config.json +2 -2
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +73 -73
tokenizer.json +0 -0

config.json CHANGED Viewed

@@ -54,7 +54,7 @@
   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
-  "transformers_version": "4.32.0.dev0",
   "use_cache": true,
   "vocab_size": 53739
 }

   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 53739
 }

generation_config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "_from_model_config": true,
   "bad_words_ids": [
     [
       53738
@@ -12,5 +11,6 @@
   "max_length": 512,
   "num_beams": 6,
   "pad_token_id": 53738,
-  "transformers_version": "4.32.0.dev0"
 }

 {
   "bad_words_ids": [
     [
       53738
   "max_length": 512,
   "num_beams": 6,
   "pad_token_id": 53738,
+  "renormalize_logits": true,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a99fb73b7a3934f524662745d11070bb1211f79eb1eb5a70aa097e2082fe393a
-size 322551460

 version https://git-lfs.github.com/spec/v1
+oid sha256:c87e35f60349bfea2fd82c59b5e06d1f8f0fdc77c77d24a00073ddfc7d1007ad
+size 212494045

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7000434b1823a202bdabb4061912fc7cf24e59ce6b8bfd57751758fdcae2ad1b
-size 322786942

 version https://git-lfs.github.com/spec/v1
+oid sha256:a0b29e9729f8b2c3467f9601c37bf7a4b490aaca386ac4c7571e8a8190e2e05f
+size 212729612

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:80862a4a8821363ed2455cc9d248364efd47e83c901acebc92bccde9e07cbe74
-size 82186086

 version https://git-lfs.github.com/spec/v1
+oid sha256:540edbcc08bab0b42c03576a759fd9b4d5fc99996ac3178630733916dc2325cb
+size 54401611

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:43e9c242c6bfe83143ba529f71ed212d3c3264a94032f75511ed296c920e8e56
-size 81814730

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ba31d206ad237dbd35dbf46b9fe4d0368c082fd9e2d0e9603bd709facf4119d
+size 54030909

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:192903fd8b7565b384618f1201530717c68916c02795c9b0ffcb811d700100d9
-size 309900951

 version https://git-lfs.github.com/spec/v1
+oid sha256:29a835ab18a732ac4d6c397ca4d5d3847d0740962763a645884725c1762bde57
+size 199843536

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:646fe7bcb8f72f13cafeffc4a513d1fb2755e66047e9959b67e49eefadb580b5
-size 78543266

 version https://git-lfs.github.com/spec/v1
+oid sha256:8c6208549dda986c3e6c24c650aff2b0af973b6d07260a1c8bbf3bbc0a6ad6dd
+size 50759445

quantize_config.json CHANGED Viewed

@@ -4,120 +4,120 @@
     "per_model_config": {
         "encoder_model": {
             "op_types": [
-                "Gather",
-                "Transpose",
-                "Cast",
-                "Pow",
                 "Concat",
                 "Reshape",
-                "Expand",
-                "Constant",
-                "Mul",
                 "Sqrt",
-                "ConstantOfShape",
-                "Range",
-                "Unsqueeze",
                 "Where",
-                "Sub",
-                "ReduceMean",
-                "Softmax",
-                "Sigmoid",
-                "Div",
-                "MatMul",
                 "Add",
                 "Equal",
-                "Shape"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Gather",
-                "Transpose",
-                "Cast",
-                "Pow",
                 "Concat",
                 "Reshape",
-                "Expand",
-                "Constant",
-                "Mul",
                 "Sqrt",
-                "ConstantOfShape",
-                "Range",
-                "Unsqueeze",
                 "Where",
-                "Sub",
-                "ReduceMean",
-                "Softmax",
-                "Sigmoid",
-                "Div",
-                "MatMul",
                 "Add",
                 "Equal",
-                "Shape"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "Gather",
-                "Transpose",
-                "Cast",
-                "Pow",
                 "Concat",
                 "Reshape",
-                "Slice",
                 "Squeeze",
-                "Expand",
-                "Constant",
-                "Mul",
                 "Sqrt",
-                "ConstantOfShape",
-                "Range",
-                "Unsqueeze",
                 "Where",
-                "Sub",
-                "Softmax",
-                "ReduceMean",
-                "Sigmoid",
-                "Div",
-                "MatMul",
                 "Add",
                 "Less",
                 "Equal",
-                "Shape"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "Gather",
-                "Transpose",
-                "Cast",
-                "Pow",
                 "Concat",
                 "Reshape",
-                "Slice",
                 "Squeeze",
-                "Expand",
-                "Constant",
-                "Mul",
-                "If",
                 "Sqrt",
-                "ConstantOfShape",
-                "Range",
-                "Unsqueeze",
                 "Where",
-                "Sub",
-                "Softmax",
-                "ReduceMean",
-                "Sigmoid",
-                "Div",
-                "MatMul",
                 "Add",
                 "Less",
                 "Equal",
-                "Shape"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "encoder_model": {
             "op_types": [
+                "Sigmoid",
+                "Unsqueeze",
+                "Range",
                 "Concat",
+                "Div",
+                "Gather",
+                "Shape",
                 "Reshape",
+                "MatMul",
+                "Sub",
                 "Sqrt",
                 "Where",
                 "Add",
+                "Softmax",
+                "Transpose",
+                "Constant",
+                "Mul",
+                "Expand",
                 "Equal",
+                "ConstantOfShape",
+                "ReduceMean",
+                "Pow",
+                "Cast"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Sigmoid",
+                "Unsqueeze",
+                "Range",
                 "Concat",
+                "Div",
+                "Gather",
+                "Shape",
                 "Reshape",
+                "MatMul",
+                "Sub",
                 "Sqrt",
                 "Where",
                 "Add",
+                "Softmax",
+                "Transpose",
+                "Constant",
+                "Mul",
+                "Expand",
                 "Equal",
+                "ConstantOfShape",
+                "ReduceMean",
+                "Pow",
+                "Cast"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Sigmoid",
+                "Unsqueeze",
+                "Range",
                 "Concat",
+                "Div",
+                "Gather",
+                "Shape",
                 "Reshape",
+                "MatMul",
+                "Sub",
                 "Squeeze",
+                "Slice",
                 "Sqrt",
                 "Where",
                 "Add",
+                "Softmax",
+                "Transpose",
+                "Constant",
+                "If",
+                "Mul",
                 "Less",
                 "Equal",
+                "ConstantOfShape",
+                "Expand",
+                "ReduceMean",
+                "Pow",
+                "Cast"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model": {
             "op_types": [
+                "Sigmoid",
+                "Unsqueeze",
+                "Range",
                 "Concat",
+                "Div",
+                "Gather",
+                "Shape",
                 "Reshape",
+                "MatMul",
+                "Sub",
                 "Squeeze",
+                "Slice",
                 "Sqrt",
                 "Where",
                 "Add",
+                "Softmax",
+                "Transpose",
+                "Constant",
+                "Mul",
                 "Less",
                 "Equal",
+                "ConstantOfShape",
+                "Expand",
+                "ReduceMean",
+                "Pow",
+                "Cast"
             ],
             "weight_type": "QInt8"
         }

tokenizer.json CHANGED Viewed

The diff for this file is too large to render; see the raw diff.