Xenova HF staff committed on
Commit
ff92221
·
1 Parent(s): 0ca5e83

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -54,7 +54,7 @@
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
- "transformers_version": "4.32.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 61127
60
  }
 
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
+ "transformers_version": "4.34.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 61127
60
  }
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_from_model_config": true,
3
  "bad_words_ids": [
4
  [
5
  61126
@@ -12,5 +11,6 @@
12
  "max_length": 512,
13
  "num_beams": 6,
14
  "pad_token_id": 61126,
15
- "transformers_version": "4.32.0.dev0"
 
16
  }
 
1
  {
 
2
  "bad_words_ids": [
3
  [
4
  61126
 
11
  "max_length": 512,
12
  "num_beams": 6,
13
  "pad_token_id": 61126,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.34.0.dev0"
16
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3916641462dd742083ab7cdf1f592a2ef3b2b9761a7c14906f662f87b239c05
3
- size 352842260
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac3064b219ec795d5540a12883942352b9b2f214db74c551816e7065540d3c10
3
+ size 227654221
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08335fc74b027d83a19ea94d549c26e085203f6590c43e9809779f301942269a
3
- size 353077742
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a593643aed05d3a9df0199870033552e3af419dca95453bb8d50dd00478decab
3
+ size 227889788
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e1fb554b4c7d7c53b3e681ffeb6a2076034964586489597bea81d4ed3c1206a
3
- size 89817891
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52655659006c8ce742cc761282d49b3be4e73bfbf080f1b6a546aa96170d5813
3
+ size 58213820
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e7579e6fc4a745166c95b56e2adcdce7b009d51433270f47b4da6194bbd6762
3
- size 89446535
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d04d5119a4059792ac9ff48500f539535aee85283ad0a7eb3477ab5d7f4eddf3
3
+ size 57843118
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:174616b069809fa322e6ba4f3ac8f9c6d5aa8772bbfb875d3f0d98c770416593
3
- size 340191751
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a1ccd427b295dd243df1b9f5df5c410bd40cdd1a6c088d57fb4560aa7a3f517
3
+ size 215003712
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e01dec23df754a2f4a149e2beb207c50e19df07e9d24ff4ea6e4fb567ade26c0
3
- size 86175071
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63f11bce5887fe400a83ebc8842c13518fe691b623a39f9b2f4fba593c60ff0e
3
+ size 54571654
quantize_config.json CHANGED
@@ -4,120 +4,120 @@
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
- "Add",
8
- "Where",
9
  "Constant",
10
- "Mul",
 
11
  "Sqrt",
12
- "Shape",
13
- "Sub",
14
- "Softmax",
15
- "MatMul",
16
- "Reshape",
17
- "ReduceMean",
18
- "Div",
19
- "ConstantOfShape",
20
  "Pow",
 
21
  "Transpose",
22
- "Gather",
23
  "Expand",
 
 
 
 
 
 
 
 
24
  "Sigmoid",
25
  "Unsqueeze",
26
- "Concat",
27
- "Cast",
28
- "Equal",
29
- "Range"
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
- "Where",
36
- "Add",
37
  "Constant",
38
- "Mul",
 
39
  "Sqrt",
40
- "Shape",
41
- "Sub",
42
- "Softmax",
43
- "MatMul",
44
- "Reshape",
45
- "ReduceMean",
46
- "Div",
47
- "ConstantOfShape",
48
  "Pow",
 
49
  "Transpose",
50
- "Gather",
51
  "Expand",
 
 
 
 
 
 
 
 
52
  "Sigmoid",
53
  "Unsqueeze",
54
- "Concat",
55
- "Cast",
56
- "Equal",
57
- "Range"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
- "decoder_model": {
62
  "op_types": [
63
- "Add",
64
- "Where",
65
  "Constant",
66
- "Slice",
67
- "Mul",
68
  "Sqrt",
69
- "Shape",
70
- "Sub",
71
- "Softmax",
72
- "MatMul",
73
- "Reshape",
74
- "ReduceMean",
75
- "Div",
76
- "ConstantOfShape",
77
  "Pow",
 
 
78
  "Transpose",
79
- "Gather",
80
  "Expand",
 
 
 
 
 
 
 
 
 
81
  "Sigmoid",
82
  "Unsqueeze",
83
- "Concat",
84
- "Cast",
85
- "Less",
86
- "Squeeze",
87
- "Equal",
88
- "Range"
89
  ],
90
  "weight_type": "QInt8"
91
  },
92
- "decoder_model_merged": {
93
  "op_types": [
94
- "Add",
95
- "Where",
96
  "Constant",
97
- "Slice",
98
- "Mul",
99
  "Sqrt",
100
- "Shape",
101
- "Sub",
102
- "Softmax",
103
- "MatMul",
104
- "Reshape",
105
- "ReduceMean",
106
- "Div",
107
- "ConstantOfShape",
108
  "Pow",
 
 
109
  "Transpose",
110
- "Gather",
111
  "Expand",
112
- "If",
 
 
 
 
 
 
 
113
  "Sigmoid",
114
  "Unsqueeze",
115
- "Concat",
116
- "Cast",
117
- "Less",
118
- "Squeeze",
119
- "Equal",
120
- "Range"
121
  ],
122
  "weight_type": "QInt8"
123
  }
 
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
 
 
7
  "Constant",
8
+ "Add",
9
+ "Gather",
10
  "Sqrt",
11
+ "Concat",
12
+ "Equal",
 
 
 
 
 
 
13
  "Pow",
14
+ "Softmax",
15
  "Transpose",
16
+ "ReduceMean",
17
  "Expand",
18
+ "Mul",
19
+ "Sub",
20
+ "Div",
21
+ "Reshape",
22
+ "Where",
23
+ "Cast",
24
+ "Shape",
25
+ "Range",
26
  "Sigmoid",
27
  "Unsqueeze",
28
+ "ConstantOfShape",
29
+ "MatMul"
 
 
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
 
 
35
  "Constant",
36
+ "Add",
37
+ "Gather",
38
  "Sqrt",
39
+ "Concat",
40
+ "Equal",
 
 
 
 
 
 
41
  "Pow",
42
+ "Softmax",
43
  "Transpose",
44
+ "ReduceMean",
45
  "Expand",
46
+ "Mul",
47
+ "Sub",
48
+ "Div",
49
+ "Reshape",
50
+ "Where",
51
+ "Cast",
52
+ "Shape",
53
+ "Range",
54
  "Sigmoid",
55
  "Unsqueeze",
56
+ "ConstantOfShape",
57
+ "MatMul"
 
 
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
+ "decoder_model_merged": {
62
  "op_types": [
 
 
63
  "Constant",
64
+ "Add",
65
+ "Gather",
66
  "Sqrt",
67
+ "Concat",
68
+ "Equal",
 
 
 
 
 
 
69
  "Pow",
70
+ "Softmax",
71
+ "Squeeze",
72
  "Transpose",
73
+ "ReduceMean",
74
  "Expand",
75
+ "Mul",
76
+ "Sub",
77
+ "Div",
78
+ "Reshape",
79
+ "If",
80
+ "Where",
81
+ "Cast",
82
+ "Shape",
83
+ "Range",
84
  "Sigmoid",
85
  "Unsqueeze",
86
+ "ConstantOfShape",
87
+ "MatMul",
88
+ "Slice",
89
+ "Less"
 
 
90
  ],
91
  "weight_type": "QInt8"
92
  },
93
+ "decoder_model": {
94
  "op_types": [
 
 
95
  "Constant",
96
+ "Add",
97
+ "Gather",
98
  "Sqrt",
99
+ "Concat",
100
+ "Equal",
 
 
 
 
 
 
101
  "Pow",
102
+ "Softmax",
103
+ "Squeeze",
104
  "Transpose",
105
+ "ReduceMean",
106
  "Expand",
107
+ "Mul",
108
+ "Sub",
109
+ "Div",
110
+ "Reshape",
111
+ "Where",
112
+ "Cast",
113
+ "Shape",
114
+ "Range",
115
  "Sigmoid",
116
  "Unsqueeze",
117
+ "ConstantOfShape",
118
+ "MatMul",
119
+ "Slice",
120
+ "Less"
 
 
121
  ],
122
  "weight_type": "QInt8"
123
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff