ayousanz committed on
Commit
5ca360f
·
1 Parent(s): b0974ab

Upload folder using huggingface_hub

Browse files
cyberagent/open-calm-1b/onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:923d0b4c600f5aa35ef971cd36c4f5aa3d3d513c27169192b6d98d3a9f755192
3
- size 15624509
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f89dd892fbcce1433b977cfe5feb023932255af961fcd5aabf2b3b619afc2b0
3
+ size 15624518
cyberagent/open-calm-1b/onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2d27ab29e0f75b1a3bf0d7ac18f5e37a72c54cc46c354f8bf1f21f118a8d295
3
+ size 1443171022
cyberagent/open-calm-1b/onnx/decoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4ab6f59eaf27e20528ece176fa976fa326b9239f635e8e6403ec5d648d77a79
3
+ size 1434763065
cyberagent/open-calm-1b/onnx/decoder_with_past_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a13a3709c0529e47a6d68321173e8ddf8658270e485703ad3a072fd936e9cb4
3
+ size 1434803140
cyberagent/open-calm-1b/quantize_config.json ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "decoder_model_merged": {
6
+ "op_types": [
7
+ "Unsqueeze",
8
+ "Pow",
9
+ "Range",
10
+ "Erf",
11
+ "MatMul",
12
+ "Gather",
13
+ "Tile",
14
+ "Constant",
15
+ "Div",
16
+ "Sub",
17
+ "If",
18
+ "Transpose",
19
+ "ReduceMean",
20
+ "Squeeze",
21
+ "Reshape",
22
+ "ConstantOfShape",
23
+ "Expand",
24
+ "Sqrt",
25
+ "Mul",
26
+ "Where",
27
+ "GatherElements",
28
+ "Shape",
29
+ "Add",
30
+ "Neg",
31
+ "Slice",
32
+ "Concat",
33
+ "Softmax",
34
+ "Cast"
35
+ ],
36
+ "weight_type": "QInt8"
37
+ },
38
+ "decoder_model": {
39
+ "op_types": [
40
+ "Unsqueeze",
41
+ "Pow",
42
+ "Range",
43
+ "Erf",
44
+ "MatMul",
45
+ "Gather",
46
+ "Tile",
47
+ "Constant",
48
+ "Div",
49
+ "Sub",
50
+ "Transpose",
51
+ "ReduceMean",
52
+ "Squeeze",
53
+ "Reshape",
54
+ "ConstantOfShape",
55
+ "Expand",
56
+ "Sqrt",
57
+ "Mul",
58
+ "Where",
59
+ "GatherElements",
60
+ "Shape",
61
+ "Add",
62
+ "Neg",
63
+ "Slice",
64
+ "Concat",
65
+ "Softmax",
66
+ "Cast"
67
+ ],
68
+ "weight_type": "QInt8"
69
+ },
70
+ "decoder_with_past_model": {
71
+ "op_types": [
72
+ "Unsqueeze",
73
+ "Pow",
74
+ "Range",
75
+ "Erf",
76
+ "MatMul",
77
+ "Gather",
78
+ "Tile",
79
+ "Constant",
80
+ "Div",
81
+ "Sub",
82
+ "Transpose",
83
+ "ReduceMean",
84
+ "Squeeze",
85
+ "Reshape",
86
+ "ConstantOfShape",
87
+ "Expand",
88
+ "Sqrt",
89
+ "Mul",
90
+ "Where",
91
+ "GatherElements",
92
+ "Shape",
93
+ "Add",
94
+ "Neg",
95
+ "Slice",
96
+ "Concat",
97
+ "Softmax",
98
+ "Cast"
99
+ ],
100
+ "weight_type": "QInt8"
101
+ }
102
+ }
103
+ }