ayousanz committed on
Commit
6982d40
·
1 Parent(s): 368b6fb

Upload folder using huggingface_hub

Browse files
cyberagent/open-calm-large/onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2c1b09cf2371f623c559779bbb9d0445828f6cbe3a03742e7617603057d8fc9
3
  size 14575707
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66a54c149f0791c1ce56fb1ab5dafd4a1250aff76118df20c8499a5be3980156
3
  size 14575707
cyberagent/open-calm-large/onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d47728243edf3c43ddb97c378304a4b39821fb587f8ae44f02e01ed2c2e53621
3
+ size 859097597
cyberagent/open-calm-large/onnx/decoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b977a5c7190d7ba9b038dd073d94a27c079c587ed10ef31988a870d918ad7b27
3
+ size 851214085
cyberagent/open-calm-large/onnx/decoder_with_past_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f18e1dbfcc2496c0323a0cc68ff8cf2a21c945afa3a71679ade88537ff0584bf
3
+ size 851254112
cyberagent/open-calm-large/quantize_config.json ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "decoder_model_merged": {
6
+ "op_types": [
7
+ "Div",
8
+ "Pow",
9
+ "Mul",
10
+ "Softmax",
11
+ "ReduceMean",
12
+ "Slice",
13
+ "Unsqueeze",
14
+ "Constant",
15
+ "Tile",
16
+ "Expand",
17
+ "Sqrt",
18
+ "Squeeze",
19
+ "Transpose",
20
+ "Gather",
21
+ "Neg",
22
+ "Add",
23
+ "Concat",
24
+ "GatherElements",
25
+ "Sub",
26
+ "Erf",
27
+ "Range",
28
+ "Reshape",
29
+ "Where",
30
+ "MatMul",
31
+ "Shape",
32
+ "Cast",
33
+ "If",
34
+ "ConstantOfShape"
35
+ ],
36
+ "weight_type": "QInt8"
37
+ },
38
+ "decoder_model": {
39
+ "op_types": [
40
+ "Div",
41
+ "Pow",
42
+ "Mul",
43
+ "Softmax",
44
+ "ReduceMean",
45
+ "Slice",
46
+ "Unsqueeze",
47
+ "Constant",
48
+ "Tile",
49
+ "Expand",
50
+ "Sqrt",
51
+ "Squeeze",
52
+ "Transpose",
53
+ "Gather",
54
+ "Neg",
55
+ "Add",
56
+ "Concat",
57
+ "GatherElements",
58
+ "Sub",
59
+ "Erf",
60
+ "Range",
61
+ "Reshape",
62
+ "Where",
63
+ "MatMul",
64
+ "Shape",
65
+ "Cast",
66
+ "ConstantOfShape"
67
+ ],
68
+ "weight_type": "QInt8"
69
+ },
70
+ "decoder_with_past_model": {
71
+ "op_types": [
72
+ "Div",
73
+ "Pow",
74
+ "Mul",
75
+ "Softmax",
76
+ "Slice",
77
+ "ReduceMean",
78
+ "Unsqueeze",
79
+ "Constant",
80
+ "Tile",
81
+ "Expand",
82
+ "Sqrt",
83
+ "Squeeze",
84
+ "Transpose",
85
+ "Gather",
86
+ "Neg",
87
+ "Add",
88
+ "Concat",
89
+ "GatherElements",
90
+ "Sub",
91
+ "Erf",
92
+ "Range",
93
+ "Reshape",
94
+ "Where",
95
+ "MatMul",
96
+ "Shape",
97
+ "Cast",
98
+ "ConstantOfShape"
99
+ ],
100
+ "weight_type": "QInt8"
101
+ }
102
+ }
103
+ }