Xenova HF staff committed on
Commit
8bf38ba
·
1 Parent(s): 23b6876

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -139,8 +139,7 @@
139
  50360,
140
  50361
141
  ],
142
- "torch_dtype": "float32",
143
- "transformers_version": "4.29.2",
144
  "use_cache": true,
145
  "use_weighted_layer_sum": false,
146
  "vocab_size": 51864
 
139
  50360,
140
  50361
141
  ],
142
+ "transformers_version": "4.30.2",
 
143
  "use_cache": true,
144
  "use_weighted_layer_sum": false,
145
  "vocab_size": 51864
generation_config.json CHANGED
@@ -110,5 +110,5 @@
110
  50360,
111
  50361
112
  ],
113
- "transformers_version": "4.29.2"
114
  }
 
110
  50360,
111
  50361
112
  ],
113
+ "transformers_version": "4.30.2"
114
  }
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:407050fe2f75a5eb90b80fc7d758aabd4748c6cd24559e6a4581b6320bdaa864
3
  size 1926573
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a6bc26a22416cb5ca53f5db05a44fae39a56a38053bd172c60a77be35974151
3
  size 1926573
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c402233f1d2a50cc7f2fb96b7af97a9f0d0b9ccd151df68116408125af6f33de
3
- size 517263427
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd4c06f8bfbfb28f8a777a84618692ee05687ab598fef9dffb2fea11d3cd83c4
3
+ size 515405408
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9813464d9702b3ac296213dadf3712e1af3f1c1824ce1edb535f5541b0cb191d
3
- size 515875253
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fe4c89bbf88b377dd1d2862571d7611ce6888d8d1a055b61790050791d97deb
3
+ size 514017234
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ba30507ec53dbb96c6e55b6bc9664a3c27770b0c7fb50c807fb2c33af975d60
3
- size 464950674
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:789bc74086187043db99dd1684f3d82ec61d15464dddc2c3daba21dec6e505d5
3
+ size 463338655
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c11cab5779929dcfbfe465f640ec12a116bd41794a50ffc4815824e80aaef2d5
3
- size 314503795
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:952aacc7ab4ff86afccc732a42c4d6c8babb7651653aeb9b0ff22adcc42dcc90
3
+ size 313397176
quant_config.json ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": false,
3
+ "reduce_range": false,
4
+ "per_model_config": {
5
+ "encoder_model": {
6
+ "op_types": [
7
+ "ReduceMean",
8
+ "Sqrt",
9
+ "Reshape",
10
+ "Mul",
11
+ "Transpose",
12
+ "Shape",
13
+ "Gather",
14
+ "Sub",
15
+ "Add",
16
+ "Pow",
17
+ "Conv",
18
+ "Constant",
19
+ "MatMul",
20
+ "Erf",
21
+ "Concat",
22
+ "Unsqueeze",
23
+ "Softmax",
24
+ "Div"
25
+ ],
26
+ "weight_type": "QUInt8"
27
+ },
28
+ "decoder_model": {
29
+ "op_types": [
30
+ "Shape",
31
+ "Range",
32
+ "Expand",
33
+ "Sub",
34
+ "Sqrt",
35
+ "Reshape",
36
+ "Gather",
37
+ "Transpose",
38
+ "Add",
39
+ "Pow",
40
+ "Constant",
41
+ "Concat",
42
+ "ReduceMean",
43
+ "Mul",
44
+ "Equal",
45
+ "MatMul",
46
+ "Less",
47
+ "Where",
48
+ "Slice",
49
+ "Squeeze",
50
+ "Cast",
51
+ "Erf",
52
+ "ConstantOfShape",
53
+ "Unsqueeze",
54
+ "Softmax",
55
+ "Div"
56
+ ],
57
+ "weight_type": "QInt8"
58
+ },
59
+ "decoder_model_merged": {
60
+ "op_types": [
61
+ "If"
62
+ ],
63
+ "weight_type": "QInt8"
64
+ },
65
+ "decoder_with_past_model": {
66
+ "op_types": [
67
+ "ReduceMean",
68
+ "Sqrt",
69
+ "Reshape",
70
+ "Gather",
71
+ "Mul",
72
+ "Shape",
73
+ "Transpose",
74
+ "Add",
75
+ "Pow",
76
+ "Constant",
77
+ "MatMul",
78
+ "Softmax",
79
+ "Div",
80
+ "Erf",
81
+ "Concat",
82
+ "Unsqueeze",
83
+ "Slice",
84
+ "Sub"
85
+ ],
86
+ "weight_type": "QInt8"
87
+ }
88
+ }
89
+ }