nisten committed on Jan 29

Commit

5d79425

•

1 Parent(s): 753bbe3

Upload folder using huggingface_hub

Browse files

Files changed (43) hide show

README.md +52 -1
config.json +28 -0
mergekit_config.yml +28 -0
model-00001-of-00035.safetensors +3 -0
model-00002-of-00035.safetensors +3 -0
model-00003-of-00035.safetensors +3 -0
model-00004-of-00035.safetensors +3 -0
model-00005-of-00035.safetensors +3 -0
model-00006-of-00035.safetensors +3 -0
model-00007-of-00035.safetensors +3 -0
model-00008-of-00035.safetensors +3 -0
model-00009-of-00035.safetensors +3 -0
model-00010-of-00035.safetensors +3 -0
model-00011-of-00035.safetensors +3 -0
model-00012-of-00035.safetensors +3 -0
model-00013-of-00035.safetensors +3 -0
model-00014-of-00035.safetensors +3 -0
model-00015-of-00035.safetensors +3 -0
model-00016-of-00035.safetensors +3 -0
model-00017-of-00035.safetensors +3 -0
model-00018-of-00035.safetensors +3 -0
model-00019-of-00035.safetensors +3 -0
model-00020-of-00035.safetensors +3 -0
model-00021-of-00035.safetensors +3 -0
model-00022-of-00035.safetensors +3 -0
model-00023-of-00035.safetensors +3 -0
model-00024-of-00035.safetensors +3 -0
model-00025-of-00035.safetensors +3 -0
model-00026-of-00035.safetensors +3 -0
model-00027-of-00035.safetensors +3 -0
model-00028-of-00035.safetensors +3 -0
model-00029-of-00035.safetensors +3 -0
model-00030-of-00035.safetensors +3 -0
model-00031-of-00035.safetensors +3 -0
model-00032-of-00035.safetensors +3 -0
model-00033-of-00035.safetensors +3 -0
model-00034-of-00035.safetensors +3 -0
model-00035-of-00035.safetensors +3 -0
model.safetensors.index.json +0 -0
special_tokens_map.json +23 -0
tokenizer.json +0 -0
tokenizer.model +3 -0
tokenizer_config.json +41 -0

README.md CHANGED Viewed

@@ -1,3 +1,54 @@
 ---
-license: mit
 ---

 ---
+base_model: []
+tags:
+- mergekit
+- merge
 ---
+# BigCodeLlama LFG 🚀
+## Experimental CodeLlama Frankenstein merge to see how it benchmarks
+### Models Merged
+The following models were included in the merge:
+* ../CodeLlama-70b-hf
+* ../CodeLlama-70b-Instruct-hf
+* ../CodeLlama-70b-Python-hf
+### Configuration
+The following YAML configuration was used to produce this model:
+```yaml
+dtype: bfloat16
+merge_method: passthrough
+slices:
+- sources:
+  - layer_range: [0, 69]
+    model:
+      model:
+        path: ../CodeLlama-70b-hf
+- sources:
+  - layer_range: [66, 76]
+    model:
+      model:
+        path: ../CodeLlama-70b-Instruct-hf
+- sources:
+  - layer_range: [42, 66]
+    model:
+      model:
+        path: ../CodeLlama-70b-hf
+- sources:
+  - layer_range: [13, 37]
+    model:
+      model:
+        path: ../CodeLlama-70b-Python-hf
+- sources:
+  - layer_range: [10, 80]
+    model:
+      model:
+        path: ../CodeLlama-70b-Instruct-hf
+```
+### Stay tuned for GGUF quants

config.json ADDED Viewed

	@@ -0,0 +1,28 @@

+{
+  "_name_or_path": "BigCodeLlama-169b",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 8192,
+  "initializer_range": 0.02,
+  "intermediate_size": 28672,
+  "max_position_embeddings": 16384,
+  "model_type": "llama",
+  "num_attention_heads": 64,
+  "num_hidden_layers": 197,
+  "num_key_value_heads": 8,
+  "pretraining_tp": 1,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 1000000,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.37.2",
+  "use_cache": true,
+  "vocab_size": 32016
+}

mergekit_config.yml ADDED Viewed

	@@ -0,0 +1,28 @@

+dtype: bfloat16
+merge_method: passthrough
+slices:
+- sources:
+  - layer_range: [0, 69]
+    model:
+      model:
+        path: ../CodeLlama-70b-hf
+- sources:
+  - layer_range: [66, 76]
+    model:
+      model:
+        path: ../CodeLlama-70b-Instruct-hf
+- sources:
+  - layer_range: [42, 66]
+    model:
+      model:
+        path: ../CodeLlama-70b-hf
+- sources:
+  - layer_range: [13, 37]
+    model:
+      model:
+        path: ../CodeLlama-70b-Python-hf
+- sources:
+  - layer_range: [10, 80]
+    model:
+      model:
+        path: ../CodeLlama-70b-Instruct-hf

model-00001-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2cdf6d49de5bd6cf36ac2ba1934691b637578e15a2545e7303bbd85bf811abb
+size 9852869216

model-00002-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:da3cfed04534b57517a985ad7562817357e189df6bc4aa78154db5c8fdcb0ffb
+size 9798096232

model-00003-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0428161bd48d61d51eb3316e3758059f57fbe963670260dc1e590498152e481
+size 9797997992

model-00004-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ca65b7cba5706dc35657650ffa552696493e210fcb94afba110474d240a4d34d
+size 9630325192

model-00005-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8d9e1443b8809374e42982b52ddeee2a39db9d500df41961d6b737fe0f087222
+size 9798096992

model-00006-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05425f4c273c3c9e51e40315999d6136a49b1038ea8b4b1a83ff2516f3b8b8d7
+size 9798129992

model-00007-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:491f90efbb9c435ea88c7d8e106fe70697a507b8db8406fa6fb3ec40f977e95a
+size 9999423488

model-00008-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cdc12500041f01ffd1729b9a8b1fa8fb1dd12773ee26bc304308ce4075060bb0
+size 9965868792

model-00009-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:102e1e2ab7e9beae5ad08f6ec0b3a7809e393bafcd3125ddd5dfdaba9f492c72
+size 9932314128

model-00010-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9bec2242b2b0e5d9945c0518af30e2e1bbd2c84dddd602d95b60e50a94fa6a46
+size 9798031016

model-00011-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22d8d0760bd7f9ae65d6cc1de2108674517466ffb3735777db214fc0bd6806eb
+size 9965853000

model-00012-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9f5ee6252ebebbb96df56ac025693a135c7d0c6b59ca59935aebe67a6d67e06a
+size 9764559544

model-00013-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fb3aecb0bd849f22aabdd5a360d7fb6d228fcf143ecf5e7b0278b8bc709f0237
+size 9798097000

model-00014-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1e457102fc56a72492b9e7c8e49f51576108cd4f0326e2a8e8adf08ba8467261
+size 9999423480

model-00015-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:128a39f880167a165c9c5f24ee7eddc6199f3f7b8fba46d6a7eb857b730176d1
+size 9831650944

model-00016-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:966a1dcb03fd6e2739c9c659f1519126885fdf84d2692602a7e7b9fefdba869a
+size 9764541608

model-00017-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2951108e876924b3543d65eebf6a43a64a3763135e6085712aba4b12d9c8b777
+size 9965819992

model-00018-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e01ef782efcd49e1af01bb7d5863613e1094d19528826572758da92898aaa10f
+size 9932282544

model-00019-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b24adb40483a2afd6f9a1a375a876db31e83cb1d52ea20fb8bd96574f39f0d6
+size 9764576040

model-00020-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:874d4940d68b908eeda96cf4e943820ad05e203277033387ba2f5692c49a820a
+size 9831667424

model-00021-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df0e31413836df6eac4870b068bfd4f51da77339e76ce2cfa43b73260105d409
+size 9999439952

model-00022-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af7a106c8f195178d507482327840dd70f290f480d52a75961c836453fe4e733
+size 9798063280

model-00023-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:46fc216f7e14908bb68489e5c16e1a1ac8a7c294756d3a0c338c449f53fb10d0
+size 9932297608

model-00024-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3fb607ff7fbe20f2324299526cba7cd5f1fab8b28478b2ff30b4cddda9db66d6
+size 9630275672

model-00025-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b1bba5bac077377d6334041d476584d8a835435231790ddcfb13f07c21371313
+size 9630292184

model-00026-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93562879bb415f590dddbd357d81039d2e3e930478cde61fe9cded9c7a38f91d
+size 9965885288

model-00027-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:73cc2507af8fdbba4876ad913daa67164bf23e2ad4d9fca912745d9f706d4507
+size 9798113472

model-00028-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4118e6ea30d4a291d8e978ae6b7fcf27c5bb25bf81e33eec7514d54c5be8ceac
+size 9999424168

model-00029-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cef6efb8985818333ae7413a911ac5594b3efa72ae4eb98d8a82e51417b4e0ec
+size 9663894912

model-00030-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a546055b84316bdf244c9028e508669314474e24f06775225ad4cc12a829cb16
+size 9764541608

model-00031-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dbcde9f1e93113e13923c8c87357d9fcf6788bba40e2eae1b13c9c2ccaf2df0e
+size 9798014496

model-00032-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:33a2e5705ed2099ee4d6c52808426ef36b5fc2581b5bfa5622e404aded4d9cf2
+size 9932315528

model-00033-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2368514495d6f9d515252154f3ef8a081221ee8b6a43d37226b06b52a7b0ffc5
+size 9798096992

model-00034-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:db982aa39b1ca6576bbf567411746bb8b05119f7f3e224f1d19d469d04dabd16
+size 9697465384

model-00035-of-00035.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:150e94c99a3376ee807539545b5917f402b1085598aee299f76e9b82332f4f30
+size 3779413944

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99049b351301fb75b3b0587a484b675cbfd51abe27d2b92eabd385e4c41f97e9
+size 500033

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,41 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "legacy": true,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": null,
+  "sp_model_kwargs": {},
+  "spaces_between_special_tokens": false,
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": "<unk>",
+  "use_default_system_prompt": false
+}