iNeil77 committed on
Commit
650defe
·
verified ·
1 Parent(s): 33ab729

Upload Qwen3ForCausalLM

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. config.json +4 -4
  3. generation_config.json +2 -2
README.md CHANGED
@@ -2,4 +2,4 @@
2
  license: apache-2.0
3
  pipeline_tag: text-generation
4
  library_name: transformers
5
- ---
 
2
  license: apache-2.0
3
  pipeline_tag: text-generation
4
  library_name: transformers
5
+ ---
config.json CHANGED
@@ -4,7 +4,7 @@
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
- "bos_token_id": 151643,
8
  "dtype": "bfloat16",
9
  "eos_token_id": 151643,
10
  "head_dim": 128,
@@ -42,7 +42,7 @@
42
  "full_attention",
43
  "full_attention"
44
  ],
45
- "max_position_embeddings": 32768,
46
  "max_window_layers": 28,
47
  "model_type": "qwen3",
48
  "num_attention_heads": 16,
@@ -51,12 +51,12 @@
51
  "pad_token_id": 151656,
52
  "rms_norm_eps": 1e-06,
53
  "rope_parameters": {
54
- "rope_theta": 1000000,
55
  "rope_type": "default"
56
  },
57
  "sliding_window": null,
58
  "tie_word_embeddings": true,
59
- "transformers_version": "5.6.1",
60
  "use_cache": true,
61
  "use_sliding_window": false,
62
  "vocab_size": 151936
 
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
+ "bos_token_id": null,
8
  "dtype": "bfloat16",
9
  "eos_token_id": 151643,
10
  "head_dim": 128,
 
42
  "full_attention",
43
  "full_attention"
44
  ],
45
+ "max_position_embeddings": 131072,
46
  "max_window_layers": 28,
47
  "model_type": "qwen3",
48
  "num_attention_heads": 16,
 
51
  "pad_token_id": 151656,
52
  "rms_norm_eps": 1e-06,
53
  "rope_parameters": {
54
+ "rope_theta": 10000000,
55
  "rope_type": "default"
56
  },
57
  "sliding_window": null,
58
  "tie_word_embeddings": true,
59
+ "transformers_version": "5.8.1",
60
  "use_cache": true,
61
  "use_sliding_window": false,
62
  "vocab_size": 151936
generation_config.json CHANGED
@@ -7,6 +7,6 @@
7
  151656
8
  ],
9
  "pad_token_id": 151656,
10
- "transformers_version": "5.6.1",
11
  "trust_remote_code": true
12
- }
 
7
  151656
8
  ],
9
  "pad_token_id": 151656,
10
+ "transformers_version": "5.8.1",
11
  "trust_remote_code": true
12
+ }