Upload folder using huggingface_hub (#5)
Browse files
- adfacd1fdecad3533c359c30035a150da4a6e0744babe33836ac0fdb654fbd47 (55d49b1c98c08068f079996428a06ceda4167015)
- 89d39802f0f44aab3aaec9fe367bbde5bdeb1f600dc741fc19855a66bf25179e (532a50809d5112e12c2e72cb107ca8f7739ea2a6)
- 154b6296b96d19d09f03b3a2c445b70c6254c729fee49893e751a6f8bd5f4923 (1a1feb7c86b5379c2de530a5707d09186273231f)
- 04e119436f75f623c3d09d0eed91cd5bdcec6c8aed307bdb0a418776a3ed37a3 (c8e81dd24aeddc4f4c43253c3bc3243628ee7b6c)
- aad672a5c32ccddaefef79368d8cca41096ad7c03b3d22377804b1dd0eefa803 (f00cba4ff2556bf9ab84460ee7a9ef48aeb70a34)
- 2699bd4029ecae938e19db9fe8e756f6ed9c30214508311656496453decf4e2f (23f25e7d7f13ff4626ebe028c1b6f439442febac)
- c191b597e4415146f4bb0d3df015d2bd960a03ca7ee497671c00fa16ac390ee5 (5ab58aaf5db3792643d86419f42bb2b7c6be7c78)
- .gitattributes +1 -0
- README.md +5 -4
- config.json +2 -1
- generation_config.json +1 -1
- model-00001-of-00007.safetensors +1 -1
- model-00002-of-00007.safetensors +1 -1
- model-00003-of-00007.safetensors +1 -1
- model-00004-of-00007.safetensors +1 -1
- model-00005-of-00007.safetensors +1 -1
- model-00006-of-00007.safetensors +1 -1
- tokenizer.json +0 -0
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
@@ -29,6 +29,7 @@ tags:
|
|
29 |
base_model: meta-llama/Meta-Llama-3.1-8B-Instruct
|
30 |
datasets:
|
31 |
- sequelbox/Celestia
|
|
|
32 |
- sequelbox/Supernova
|
33 |
model_type: llama
|
34 |
model-index:
|
@@ -261,9 +262,9 @@ Shining Valiant 2 is a chat model built on Llama 3.1 8b, finetuned on our data f
|
|
261 |
|
262 |
## Version
|
263 |
|
264 |
-
This is the **2024-
|
265 |
|
266 |
-
|
267 |
|
268 |
Future upgrades will continue to expand Shining Valiant's technical knowledge base.
|
269 |
|
@@ -303,9 +304,9 @@ print(outputs[0]["generated_text"][-1])
|
|
303 |
## The Model
|
304 |
Shining Valiant 2 is built on top of Llama 3.1 8b Instruct.
|
305 |
|
306 |
-
The current version of Shining Valiant 2 is trained on technical knowledge using [sequelbox/Celestia](https://huggingface.co/datasets/sequelbox/Celestia) and general chat capability using [sequelbox/Supernova](https://huggingface.co/datasets/sequelbox/Supernova).
|
307 |
|
308 |
-
|
309 |
|
310 |
|
311 |
![image/jpeg](https://cdn-uploads.huggingface.co/production/uploads/63444f2687964b331809eb55/VCJ8Fmefd8cdVhXSSxJiD.jpeg)
|
|
|
29 |
base_model: meta-llama/Meta-Llama-3.1-8B-Instruct
|
30 |
datasets:
|
31 |
- sequelbox/Celestia
|
32 |
+
- sequelbox/Spurline
|
33 |
- sequelbox/Supernova
|
34 |
model_type: llama
|
35 |
model-index:
|
|
|
262 |
|
263 |
## Version
|
264 |
|
265 |
+
This is the **2024-11-04** release of Shining Valiant 2 for Llama 3.1 8b.
|
266 |
|
267 |
+
This release uses our newest datasets, open-sourced for everyone's use, including our expanded [science-instruct dataset](https://huggingface.co/datasets/sequelbox/Celestia). This release features improvements in logical thinking and structured reasoning as well as physics, chemistry, biology, astronomy, Earth science, computer science, and information theory.
|
268 |
|
269 |
Future upgrades will continue to expand Shining Valiant's technical knowledge base.
|
270 |
|
|
|
304 |
## The Model
|
305 |
Shining Valiant 2 is built on top of Llama 3.1 8b Instruct.
|
306 |
|
307 |
+
The current version of Shining Valiant 2 is trained on technical knowledge using [sequelbox/Celestia](https://huggingface.co/datasets/sequelbox/Celestia), complex reasoning using [sequelbox/Spurline](https://huggingface.co/datasets/sequelbox/Spurline), and general chat capability using [sequelbox/Supernova](https://huggingface.co/datasets/sequelbox/Supernova).
|
308 |
|
309 |
+
We're super excited that Shining Valiant's dataset has been fully open-sourced! She's friendly, enthusiastic, insightful, knowledgeable, and loves to learn! Magical.
|
310 |
|
311 |
|
312 |
![image/jpeg](https://cdn-uploads.huggingface.co/production/uploads/63444f2687964b331809eb55/VCJ8Fmefd8cdVhXSSxJiD.jpeg)
|
@@ -11,6 +11,7 @@
|
|
11 |
128008,
|
12 |
128009
|
13 |
],
|
|
|
14 |
"hidden_act": "silu",
|
15 |
"hidden_size": 4096,
|
16 |
"initializer_range": 0.02,
|
@@ -33,7 +34,7 @@
|
|
33 |
"rope_theta": 500000.0,
|
34 |
"tie_word_embeddings": false,
|
35 |
"torch_dtype": "float32",
|
36 |
-
"transformers_version": "4.
|
37 |
"use_cache": true,
|
38 |
"vocab_size": 128256
|
39 |
}
|
|
|
11 |
128008,
|
12 |
128009
|
13 |
],
|
14 |
+
"head_dim": 128,
|
15 |
"hidden_act": "silu",
|
16 |
"hidden_size": 4096,
|
17 |
"initializer_range": 0.02,
|
|
|
34 |
"rope_theta": 500000.0,
|
35 |
"tie_word_embeddings": false,
|
36 |
"torch_dtype": "float32",
|
37 |
+
"transformers_version": "4.46.1",
|
38 |
"use_cache": true,
|
39 |
"vocab_size": 128256
|
40 |
}
|
@@ -8,5 +8,5 @@
|
|
8 |
],
|
9 |
"temperature": 0.6,
|
10 |
"top_p": 0.9,
|
11 |
-
"transformers_version": "4.
|
12 |
}
|
|
|
8 |
],
|
9 |
"temperature": 0.6,
|
10 |
"top_p": 0.9,
|
11 |
+
"transformers_version": "4.46.1"
|
12 |
}
|
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4886466168
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6efbffa72857ec90e0ea4310a6025190a4e75eef43e10ec9d46025412e1616a8
|
3 |
size 4886466168
|
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4832007448
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c569b9d9276836eb9f31fda31ea667ee3ad1c132b852ec94b4b9a7a2598db0ca
|
3 |
size 4832007448
|
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999813112
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10413c97beeea538cb108448193c790d5224192982c2837b1dc3a54a1d5ff50b
|
3 |
size 4999813112
|
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999813128
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ef021115a20513e5b0db4178345a1f4959c59eb73fbb3679aca24055ead5d0e
|
3 |
size 4999813128
|
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4832007496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26822b4a9c2cc0f9d92e0c1522f517aac4a20a6b936c706e1ca68ed1beaf8b44
|
3 |
size 4832007496
|
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999813120
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f64f7cdbfd3903f7fea88117c49a8533a1ffa928d1ce4354d0d8431faddffe4
|
3 |
size 4999813120
|
The diff for this file is too large to render.
See raw diff
|
|