danielhanchen committed on
Commit
fd98091
1 Parent(s): 13e19bc

Upload config

Browse files
Files changed (2) hide show
  1. README.md +1 -1
  2. config.json +5 -3
README.md CHANGED
@@ -1,8 +1,8 @@
1
  ---
2
  language:
3
  - en
4
- license: apache-2.0
5
  library_name: transformers
 
6
  tags:
7
  - unsloth
8
  - transformers
 
1
  ---
2
  language:
3
  - en
 
4
  library_name: transformers
5
+ license: apache-2.0
6
  tags:
7
  - unsloth
8
  - transformers
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "Qwen/Qwen2-0.5B-Instruct",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
@@ -16,12 +16,14 @@
16
  "num_attention_heads": 14,
17
  "num_hidden_layers": 24,
18
  "num_key_value_heads": 2,
 
19
  "rms_norm_eps": 1e-06,
20
  "rope_theta": 1000000.0,
21
- "sliding_window": 32768,
22
  "tie_word_embeddings": true,
23
  "torch_dtype": "bfloat16",
24
- "transformers_version": "4.41.2",
 
25
  "use_cache": true,
26
  "use_sliding_window": false,
27
  "vocab_size": 151936
 
1
  {
2
+ "_name_or_path": "unsloth/Qwen2-0.5B-Instruct",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
 
16
  "num_attention_heads": 14,
17
  "num_hidden_layers": 24,
18
  "num_key_value_heads": 2,
19
+ "pad_token_id": 151643,
20
  "rms_norm_eps": 1e-06,
21
  "rope_theta": 1000000.0,
22
+ "sliding_window": null,
23
  "tie_word_embeddings": true,
24
  "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.44.0",
26
+ "unsloth_version": "2024.8",
27
  "use_cache": true,
28
  "use_sliding_window": false,
29
  "vocab_size": 151936