medimed committed on
Commit
83dc3b8
·
verified ·
1 Parent(s): aa340db

Upload Qwen3ForCausalLM

Browse files
Files changed (3) hide show
  1. config.json +43 -1
  2. model.safetensors +2 -2
  3. recipe.yaml +7 -0
config.json CHANGED
@@ -18,6 +18,48 @@
18
  "num_hidden_layers": 28,
19
  "num_key_value_heads": 8,
20
  "pad_token_id": 151643,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  "rms_norm_eps": 1e-06,
22
  "rope_scaling": null,
23
  "rope_theta": 1000000,
@@ -28,4 +70,4 @@
28
  "use_cache": true,
29
  "use_sliding_window": false,
30
  "vocab_size": 151936
31
- }
 
18
  "num_hidden_layers": 28,
19
  "num_key_value_heads": 8,
20
  "pad_token_id": 151643,
21
+ "quantization_config": {
22
+ "config_groups": {
23
+ "group_0": {
24
+ "input_activations": {
25
+ "actorder": null,
26
+ "block_structure": null,
27
+ "dynamic": true,
28
+ "group_size": null,
29
+ "num_bits": 8,
30
+ "observer": null,
31
+ "observer_kwargs": {},
32
+ "strategy": "token",
33
+ "symmetric": true,
34
+ "type": "int"
35
+ },
36
+ "output_activations": null,
37
+ "targets": [
38
+ "Linear"
39
+ ],
40
+ "weights": {
41
+ "actorder": null,
42
+ "block_structure": null,
43
+ "dynamic": false,
44
+ "group_size": null,
45
+ "num_bits": 8,
46
+ "observer": "minmax",
47
+ "observer_kwargs": {},
48
+ "strategy": "channel",
49
+ "symmetric": true,
50
+ "type": "int"
51
+ }
52
+ }
53
+ },
54
+ "format": "int-quantized",
55
+ "global_compression_ratio": null,
56
+ "ignore": [
57
+ "lm_head"
58
+ ],
59
+ "kv_cache_scheme": null,
60
+ "quant_method": "compressed-tensors",
61
+ "quantization_status": "compressed"
62
+ },
63
  "rms_norm_eps": 1e-06,
64
  "rope_scaling": null,
65
  "rope_theta": 1000000,
 
70
  "use_cache": true,
71
  "use_sliding_window": false,
72
  "vocab_size": 151936
73
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:baa3239a4c22b64f9442b9409e1ad5984719b1a4cfb83dacb7ca54d34ea8fe1d
3
- size 311308760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7340bf7b29fa08a02b1f7fbb9c30dec3cd9c3423c692d83276e410848a6664c9
3
+ size 752443720
recipe.yaml ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ default_stage:
2
+ default_modifiers:
3
+ SmoothQuantModifier: {smoothing_strength: 0.8}
4
+ GPTQModifier:
5
+ scheme: W8A8
6
+ targets: Linear
7
+ ignore: [lm_head]