Upload folder using huggingface_hub
Browse files- README.md +52 -1
- config.json +28 -0
- mergekit_config.yml +28 -0
- model-00001-of-00035.safetensors +3 -0
- model-00002-of-00035.safetensors +3 -0
- model-00003-of-00035.safetensors +3 -0
- model-00004-of-00035.safetensors +3 -0
- model-00005-of-00035.safetensors +3 -0
- model-00006-of-00035.safetensors +3 -0
- model-00007-of-00035.safetensors +3 -0
- model-00008-of-00035.safetensors +3 -0
- model-00009-of-00035.safetensors +3 -0
- model-00010-of-00035.safetensors +3 -0
- model-00011-of-00035.safetensors +3 -0
- model-00012-of-00035.safetensors +3 -0
- model-00013-of-00035.safetensors +3 -0
- model-00014-of-00035.safetensors +3 -0
- model-00015-of-00035.safetensors +3 -0
- model-00016-of-00035.safetensors +3 -0
- model-00017-of-00035.safetensors +3 -0
- model-00018-of-00035.safetensors +3 -0
- model-00019-of-00035.safetensors +3 -0
- model-00020-of-00035.safetensors +3 -0
- model-00021-of-00035.safetensors +3 -0
- model-00022-of-00035.safetensors +3 -0
- model-00023-of-00035.safetensors +3 -0
- model-00024-of-00035.safetensors +3 -0
- model-00025-of-00035.safetensors +3 -0
- model-00026-of-00035.safetensors +3 -0
- model-00027-of-00035.safetensors +3 -0
- model-00028-of-00035.safetensors +3 -0
- model-00029-of-00035.safetensors +3 -0
- model-00030-of-00035.safetensors +3 -0
- model-00031-of-00035.safetensors +3 -0
- model-00032-of-00035.safetensors +3 -0
- model-00033-of-00035.safetensors +3 -0
- model-00034-of-00035.safetensors +3 -0
- model-00035-of-00035.safetensors +3 -0
- model.safetensors.index.json +0 -0
- special_tokens_map.json +23 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +41 -0
README.md
CHANGED
@@ -1,3 +1,54 @@
|
|
1 |
---
|
2 |
-
|
|
|
|
|
|
|
|
|
3 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
---
|
2 |
+
base_model: []
|
3 |
+
tags:
|
4 |
+
- mergekit
|
5 |
+
- merge
|
6 |
+
|
7 |
---
|
8 |
+
# BigCodeLlama LFG 🚀
|
9 |
+
|
10 |
+
## Experimental CodeLlama Frankenstein merge to see how it benchmarks
|
11 |
+
|
12 |
+
### Models Merged
|
13 |
+
|
14 |
+
The following models were included in the merge:
|
15 |
+
* ../CodeLlama-70b-hf
|
16 |
+
* ../CodeLlama-70b-Instruct-hf
|
17 |
+
* ../CodeLlama-70b-Python-hf
|
18 |
+
|
19 |
+
### Configuration
|
20 |
+
|
21 |
+
The following YAML configuration was used to produce this model:
|
22 |
+
|
23 |
+
```yaml
|
24 |
+
dtype: bfloat16
|
25 |
+
merge_method: passthrough
|
26 |
+
slices:
|
27 |
+
- sources:
|
28 |
+
- layer_range: [0, 69]
|
29 |
+
model:
|
30 |
+
model:
|
31 |
+
path: ../CodeLlama-70b-hf
|
32 |
+
- sources:
|
33 |
+
- layer_range: [66, 76]
|
34 |
+
model:
|
35 |
+
model:
|
36 |
+
path: ../CodeLlama-70b-Instruct-hf
|
37 |
+
- sources:
|
38 |
+
- layer_range: [42, 66]
|
39 |
+
model:
|
40 |
+
model:
|
41 |
+
path: ../CodeLlama-70b-hf
|
42 |
+
- sources:
|
43 |
+
- layer_range: [13, 37]
|
44 |
+
model:
|
45 |
+
model:
|
46 |
+
path: ../CodeLlama-70b-Python-hf
|
47 |
+
- sources:
|
48 |
+
- layer_range: [10, 80]
|
49 |
+
model:
|
50 |
+
model:
|
51 |
+
path: ../CodeLlama-70b-Instruct-hf
|
52 |
+
```
|
53 |
+
|
54 |
+
### Stay tuned for GGUF quants
|
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "BigCodeLlama-169b",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 16384,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 197,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"pretraining_tp": 1,
|
20 |
+
"rms_norm_eps": 1e-05,
|
21 |
+
"rope_scaling": null,
|
22 |
+
"rope_theta": 1000000,
|
23 |
+
"tie_word_embeddings": false,
|
24 |
+
"torch_dtype": "bfloat16",
|
25 |
+
"transformers_version": "4.37.2",
|
26 |
+
"use_cache": true,
|
27 |
+
"vocab_size": 32016
|
28 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
dtype: bfloat16
|
2 |
+
merge_method: passthrough
|
3 |
+
slices:
|
4 |
+
- sources:
|
5 |
+
- layer_range: [0, 69]
|
6 |
+
model:
|
7 |
+
model:
|
8 |
+
path: ../CodeLlama-70b-hf
|
9 |
+
- sources:
|
10 |
+
- layer_range: [66, 76]
|
11 |
+
model:
|
12 |
+
model:
|
13 |
+
path: ../CodeLlama-70b-Instruct-hf
|
14 |
+
- sources:
|
15 |
+
- layer_range: [42, 66]
|
16 |
+
model:
|
17 |
+
model:
|
18 |
+
path: ../CodeLlama-70b-hf
|
19 |
+
- sources:
|
20 |
+
- layer_range: [13, 37]
|
21 |
+
model:
|
22 |
+
model:
|
23 |
+
path: ../CodeLlama-70b-Python-hf
|
24 |
+
- sources:
|
25 |
+
- layer_range: [10, 80]
|
26 |
+
model:
|
27 |
+
model:
|
28 |
+
path: ../CodeLlama-70b-Instruct-hf
|
model-00001-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2cdf6d49de5bd6cf36ac2ba1934691b637578e15a2545e7303bbd85bf811abb
|
3 |
+
size 9852869216
|
model-00002-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da3cfed04534b57517a985ad7562817357e189df6bc4aa78154db5c8fdcb0ffb
|
3 |
+
size 9798096232
|
model-00003-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0428161bd48d61d51eb3316e3758059f57fbe963670260dc1e590498152e481
|
3 |
+
size 9797997992
|
model-00004-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca65b7cba5706dc35657650ffa552696493e210fcb94afba110474d240a4d34d
|
3 |
+
size 9630325192
|
model-00005-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d9e1443b8809374e42982b52ddeee2a39db9d500df41961d6b737fe0f087222
|
3 |
+
size 9798096992
|
model-00006-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05425f4c273c3c9e51e40315999d6136a49b1038ea8b4b1a83ff2516f3b8b8d7
|
3 |
+
size 9798129992
|
model-00007-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:491f90efbb9c435ea88c7d8e106fe70697a507b8db8406fa6fb3ec40f977e95a
|
3 |
+
size 9999423488
|
model-00008-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdc12500041f01ffd1729b9a8b1fa8fb1dd12773ee26bc304308ce4075060bb0
|
3 |
+
size 9965868792
|
model-00009-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:102e1e2ab7e9beae5ad08f6ec0b3a7809e393bafcd3125ddd5dfdaba9f492c72
|
3 |
+
size 9932314128
|
model-00010-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bec2242b2b0e5d9945c0518af30e2e1bbd2c84dddd602d95b60e50a94fa6a46
|
3 |
+
size 9798031016
|
model-00011-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22d8d0760bd7f9ae65d6cc1de2108674517466ffb3735777db214fc0bd6806eb
|
3 |
+
size 9965853000
|
model-00012-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f5ee6252ebebbb96df56ac025693a135c7d0c6b59ca59935aebe67a6d67e06a
|
3 |
+
size 9764559544
|
model-00013-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb3aecb0bd849f22aabdd5a360d7fb6d228fcf143ecf5e7b0278b8bc709f0237
|
3 |
+
size 9798097000
|
model-00014-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e457102fc56a72492b9e7c8e49f51576108cd4f0326e2a8e8adf08ba8467261
|
3 |
+
size 9999423480
|
model-00015-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:128a39f880167a165c9c5f24ee7eddc6199f3f7b8fba46d6a7eb857b730176d1
|
3 |
+
size 9831650944
|
model-00016-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:966a1dcb03fd6e2739c9c659f1519126885fdf84d2692602a7e7b9fefdba869a
|
3 |
+
size 9764541608
|
model-00017-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2951108e876924b3543d65eebf6a43a64a3763135e6085712aba4b12d9c8b777
|
3 |
+
size 9965819992
|
model-00018-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e01ef782efcd49e1af01bb7d5863613e1094d19528826572758da92898aaa10f
|
3 |
+
size 9932282544
|
model-00019-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b24adb40483a2afd6f9a1a375a876db31e83cb1d52ea20fb8bd96574f39f0d6
|
3 |
+
size 9764576040
|
model-00020-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:874d4940d68b908eeda96cf4e943820ad05e203277033387ba2f5692c49a820a
|
3 |
+
size 9831667424
|
model-00021-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df0e31413836df6eac4870b068bfd4f51da77339e76ce2cfa43b73260105d409
|
3 |
+
size 9999439952
|
model-00022-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af7a106c8f195178d507482327840dd70f290f480d52a75961c836453fe4e733
|
3 |
+
size 9798063280
|
model-00023-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46fc216f7e14908bb68489e5c16e1a1ac8a7c294756d3a0c338c449f53fb10d0
|
3 |
+
size 9932297608
|
model-00024-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fb607ff7fbe20f2324299526cba7cd5f1fab8b28478b2ff30b4cddda9db66d6
|
3 |
+
size 9630275672
|
model-00025-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1bba5bac077377d6334041d476584d8a835435231790ddcfb13f07c21371313
|
3 |
+
size 9630292184
|
model-00026-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93562879bb415f590dddbd357d81039d2e3e930478cde61fe9cded9c7a38f91d
|
3 |
+
size 9965885288
|
model-00027-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73cc2507af8fdbba4876ad913daa67164bf23e2ad4d9fca912745d9f706d4507
|
3 |
+
size 9798113472
|
model-00028-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4118e6ea30d4a291d8e978ae6b7fcf27c5bb25bf81e33eec7514d54c5be8ceac
|
3 |
+
size 9999424168
|
model-00029-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cef6efb8985818333ae7413a911ac5594b3efa72ae4eb98d8a82e51417b4e0ec
|
3 |
+
size 9663894912
|
model-00030-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a546055b84316bdf244c9028e508669314474e24f06775225ad4cc12a829cb16
|
3 |
+
size 9764541608
|
model-00031-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbcde9f1e93113e13923c8c87357d9fcf6788bba40e2eae1b13c9c2ccaf2df0e
|
3 |
+
size 9798014496
|
model-00032-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33a2e5705ed2099ee4d6c52808426ef36b5fc2581b5bfa5622e404aded4d9cf2
|
3 |
+
size 9932315528
|
model-00033-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2368514495d6f9d515252154f3ef8a081221ee8b6a43d37226b06b52a7b0ffc5
|
3 |
+
size 9798096992
|
model-00034-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db982aa39b1ca6576bbf567411746bb8b05119f7f3e224f1d19d469d04dabd16
|
3 |
+
size 9697465384
|
model-00035-of-00035.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:150e94c99a3376ee807539545b5917f402b1085598aee299f76e9b82332f4f30
|
3 |
+
size 3779413944
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
special_tokens_map.json
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "</s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"unk_token": {
|
17 |
+
"content": "<unk>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
}
|
23 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99049b351301fb75b3b0587a484b675cbfd51abe27d2b92eabd385e4c41f97e9
|
3 |
+
size 500033
|
tokenizer_config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": true,
|
3 |
+
"add_eos_token": false,
|
4 |
+
"added_tokens_decoder": {
|
5 |
+
"0": {
|
6 |
+
"content": "<unk>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": false,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false,
|
11 |
+
"special": true
|
12 |
+
},
|
13 |
+
"1": {
|
14 |
+
"content": "<s>",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": false,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false,
|
19 |
+
"special": true
|
20 |
+
},
|
21 |
+
"2": {
|
22 |
+
"content": "</s>",
|
23 |
+
"lstrip": false,
|
24 |
+
"normalized": false,
|
25 |
+
"rstrip": false,
|
26 |
+
"single_word": false,
|
27 |
+
"special": true
|
28 |
+
}
|
29 |
+
},
|
30 |
+
"bos_token": "<s>",
|
31 |
+
"clean_up_tokenization_spaces": false,
|
32 |
+
"eos_token": "</s>",
|
33 |
+
"legacy": true,
|
34 |
+
"model_max_length": 1000000000000000019884624838656,
|
35 |
+
"pad_token": null,
|
36 |
+
"sp_model_kwargs": {},
|
37 |
+
"spaces_between_special_tokens": false,
|
38 |
+
"tokenizer_class": "LlamaTokenizer",
|
39 |
+
"unk_token": "<unk>",
|
40 |
+
"use_default_system_prompt": false
|
41 |
+
}
|