fxmarty committed on
Commit
5d5b8c6
·
verified ·
1 Parent(s): 903d863

Upload folder using huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +50 -56
config.json CHANGED
@@ -21,64 +21,58 @@
21
  "pad_token_id": -1,
22
  "pretraining_tp": 1,
23
  "quantization_config": {
24
- "activation_scheme": "static",
25
- "kv_cache_scheme": null,
26
- "library": "quark",
27
- "quant_method": "fp8",
28
- "quark_config": {
29
- "algo_config": null,
30
- "exclude": [
31
- "lm_head"
32
- ],
33
- "export": {
34
- "kv_cache_group": [],
35
- "pack_method": "reorder",
36
- "weight_format": "real_quantized",
37
- "weight_merge_groups": null
 
 
 
 
 
 
 
 
38
  },
39
- "global_quant_config": {
40
- "bias": null,
41
- "input_tensors": {
42
- "ch_axis": null,
43
- "dtype": "fp8_e4m3",
44
- "group_size": null,
45
- "is_dynamic": false,
46
- "observer_cls": "PerTensorMinMaxObserver",
47
- "qscheme": "per_tensor",
48
- "round_method": null,
49
- "scale_type": null,
50
- "symmetric": null
51
- },
52
- "output_tensors": {
53
- "ch_axis": null,
54
- "dtype": "fp8_e4m3",
55
- "group_size": null,
56
- "is_dynamic": false,
57
- "observer_cls": "PerTensorMinMaxObserver",
58
- "qscheme": "per_tensor",
59
- "round_method": null,
60
- "scale_type": null,
61
- "symmetric": null
62
- },
63
- "target_device": null,
64
- "weight": {
65
- "ch_axis": null,
66
- "dtype": "fp8_e4m3",
67
- "group_size": null,
68
- "is_dynamic": false,
69
- "observer_cls": "PerTensorMinMaxObserver",
70
- "qscheme": "per_tensor",
71
- "round_method": null,
72
- "scale_type": null,
73
- "symmetric": null
74
- }
75
  },
76
- "layer_quant_config": {},
77
- "layer_type_quant_config": {},
78
- "pack_method": "reorder",
79
- "quant_method": "quark",
80
- "quant_mode": 1
81
- }
 
 
 
 
 
 
 
 
 
 
 
 
82
  },
83
  "rms_norm_eps": 1e-06,
84
  "rope_scaling": null,
 
21
  "pad_token_id": -1,
22
  "pretraining_tp": 1,
23
  "quantization_config": {
24
+ "algo_config": null,
25
+ "exclude": [
26
+ "lm_head"
27
+ ],
28
+ "export": {
29
+ "kv_cache_group": [],
30
+ "pack_method": "reorder",
31
+ "weight_format": "real_quantized",
32
+ "weight_merge_groups": null
33
+ },
34
+ "global_quant_config": {
35
+ "bias": null,
36
+ "input_tensors": {
37
+ "ch_axis": null,
38
+ "dtype": "fp8_e4m3",
39
+ "group_size": null,
40
+ "is_dynamic": false,
41
+ "observer_cls": "PerTensorMinMaxObserver",
42
+ "qscheme": "per_tensor",
43
+ "round_method": null,
44
+ "scale_type": null,
45
+ "symmetric": null
46
  },
47
+ "output_tensors": {
48
+ "ch_axis": null,
49
+ "dtype": "fp8_e4m3",
50
+ "group_size": null,
51
+ "is_dynamic": false,
52
+ "observer_cls": "PerTensorMinMaxObserver",
53
+ "qscheme": "per_tensor",
54
+ "round_method": null,
55
+ "scale_type": null,
56
+ "symmetric": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  },
58
+ "target_device": null,
59
+ "weight": {
60
+ "ch_axis": null,
61
+ "dtype": "fp8_e4m3",
62
+ "group_size": null,
63
+ "is_dynamic": false,
64
+ "observer_cls": "PerTensorMinMaxObserver",
65
+ "qscheme": "per_tensor",
66
+ "round_method": null,
67
+ "scale_type": null,
68
+ "symmetric": null
69
+ }
70
+ },
71
+ "layer_quant_config": {},
72
+ "layer_type_quant_config": {},
73
+ "pack_method": "reorder",
74
+ "quant_method": "quark",
75
+ "quant_mode": 1
76
  },
77
  "rms_norm_eps": 1e-06,
78
  "rope_scaling": null,