Sansa committed on
Commit
72e1be8
1 Parent(s): 44d46d5

End of training

Browse files
config.json CHANGED
@@ -23,12 +23,6 @@
23
  "rope_theta": 10000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
- "task_specific_params": {
27
- "text-generation": {
28
- "do_sample": true,
29
- "max_length": 2048
30
- }
31
- },
32
  "transformers_version": "4.44.2",
33
  "use_cache": true,
34
  "vocab_size": 32000
 
23
  "rope_theta": 10000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
 
 
 
 
 
 
26
  "transformers_version": "4.44.2",
27
  "use_cache": true,
28
  "vocab_size": 32000
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30c0887fed90548d21054d3a3824c3a1e9bb62fa7849d224f14fe4cd3a5494a3
3
- size 3328345304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a81c619ae8c0c53793454282f9eb6af56ca013e95a4e4f4926ca31ab38a1af3
3
+ size 3590489392
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "metadata": {
3
- "total_size": 13214687232
4
  },
5
  "weight_map": {
6
  "denoise_model.layers.0.input_layernorm.weight": "model-00001-of-00003.safetensors",
@@ -292,6 +292,7 @@
292
  "denoise_model.layers.9.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
293
  "denoise_model.layers.9.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
294
  "denoise_model.norm.weight": "model-00003-of-00003.safetensors",
295
- "embed_tokens.weight": "model-00001-of-00003.safetensors"
 
296
  }
297
  }
 
1
  {
2
  "metadata": {
3
+ "total_size": 13476831232
4
  },
5
  "weight_map": {
6
  "denoise_model.layers.0.input_layernorm.weight": "model-00001-of-00003.safetensors",
 
292
  "denoise_model.layers.9.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
293
  "denoise_model.layers.9.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
294
  "denoise_model.norm.weight": "model-00003-of-00003.safetensors",
295
+ "embed_tokens.weight": "model-00001-of-00003.safetensors",
296
+ "lm_head.weight": "model-00003-of-00003.safetensors"
297
  }
298
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7103635ce5c20a6f6d01c93cefbc398a78e2de5a61db27adcfac95d8f56714ba
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a574afd82e6f6ababddfb8d8e5ce772823ff404fa8bb71fa77a6df3cc5f183f
3
  size 5368