End of training
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +1 -5
- adapter_config.json +3 -3
- adapter_model.safetensors +1 -1
- overlap 0.jpg +0 -0
- overlap 1.jpg +0 -0
- overlap 10.jpg +0 -0
- overlap 11.jpg +0 -0
- overlap 12.jpg +0 -0
- overlap 13.jpg +0 -0
- overlap 14.jpg +0 -0
- overlap 15.jpg +0 -0
- overlap 16.jpg +0 -0
- overlap 17.jpg +0 -0
- overlap 18.jpg +0 -0
- overlap 19.jpg +0 -0
- overlap 2.jpg +0 -0
- overlap 20.jpg +0 -0
- overlap 21.jpg +0 -0
- overlap 22.jpg +0 -0
- overlap 23.jpg +0 -0
- overlap 24.jpg +0 -0
- overlap 25.jpg +0 -0
- overlap 26.jpg +0 -0
- overlap 27.jpg +0 -0
- overlap 28.jpg +0 -0
- overlap 29.jpg +0 -0
- overlap 3.jpg +0 -0
- overlap 30.jpg +0 -0
- overlap 31.jpg +0 -0
- overlap 32.jpg +0 -0
- overlap 33.jpg +0 -0
- overlap 34.jpg +0 -0
- overlap 35.jpg +0 -0
- overlap 36.jpg +0 -0
- overlap 37.jpg +0 -0
- overlap 38.jpg +0 -0
- overlap 39.jpg +0 -0
- overlap 4.jpg +0 -0
- overlap 40.jpg +0 -0
- overlap 41.jpg +0 -0
- overlap 42.jpg +0 -0
- overlap 43.jpg +0 -0
- overlap 44.jpg +0 -0
- overlap 45.jpg +0 -0
- overlap 46.jpg +0 -0
- overlap 47.jpg +0 -0
- overlap 48.jpg +0 -0
- overlap 49.jpg +0 -0
- overlap 5.jpg +0 -0
- overlap 50.jpg +0 -0
README.md
CHANGED
@@ -43,13 +43,9 @@ The following hyperparameters were used during training:
|
|
43 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
44 |
- lr_scheduler_type: cosine
|
45 |
- lr_scheduler_warmup_ratio: 0.03
|
46 |
-
- num_epochs:
|
47 |
- mixed_precision_training: Native AMP
|
48 |
|
49 |
-
### Training results
|
50 |
-
|
51 |
-
|
52 |
-
|
53 |
### Framework versions
|
54 |
|
55 |
- PEFT 0.11.2.dev0
|
|
|
43 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
44 |
- lr_scheduler_type: cosine
|
45 |
- lr_scheduler_warmup_ratio: 0.03
|
46 |
+
- num_epochs: 3
|
47 |
- mixed_precision_training: Native AMP
|
48 |
|
|
|
|
|
|
|
|
|
49 |
### Framework versions
|
50 |
|
51 |
- PEFT 0.11.2.dev0
|
adapter_config.json
CHANGED
@@ -20,10 +20,10 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"query_key_value",
|
24 |
-
"dense_h_to_4h",
|
25 |
"dense_4h_to_h",
|
26 |
-
"
|
|
|
|
|
27 |
],
|
28 |
"task_type": "CAUSAL_LM",
|
29 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
|
|
|
|
23 |
"dense_4h_to_h",
|
24 |
+
"dense_h_to_4h",
|
25 |
+
"dense",
|
26 |
+
"query_key_value"
|
27 |
],
|
28 |
"task_type": "CAUSAL_LM",
|
29 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 100690288
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bc893b41372f260eb02048401003e6873a3340a4358fa4e9eff49be4547bb6e
|
3 |
size 100690288
|
overlap 0.jpg
ADDED
overlap 1.jpg
ADDED
overlap 10.jpg
ADDED
overlap 11.jpg
ADDED
overlap 12.jpg
ADDED
overlap 13.jpg
ADDED
overlap 14.jpg
ADDED
overlap 15.jpg
ADDED
overlap 16.jpg
ADDED
overlap 17.jpg
ADDED
overlap 18.jpg
ADDED
overlap 19.jpg
ADDED
overlap 2.jpg
ADDED
overlap 20.jpg
ADDED
overlap 21.jpg
ADDED
overlap 22.jpg
ADDED
overlap 23.jpg
ADDED
overlap 24.jpg
ADDED
overlap 25.jpg
ADDED
overlap 26.jpg
ADDED
overlap 27.jpg
ADDED
overlap 28.jpg
ADDED
overlap 29.jpg
ADDED
overlap 3.jpg
ADDED
overlap 30.jpg
ADDED
overlap 31.jpg
ADDED
overlap 32.jpg
ADDED
overlap 33.jpg
ADDED
overlap 34.jpg
ADDED
overlap 35.jpg
ADDED
overlap 36.jpg
ADDED
overlap 37.jpg
ADDED
overlap 38.jpg
ADDED
overlap 39.jpg
ADDED
overlap 4.jpg
ADDED
overlap 40.jpg
ADDED
overlap 41.jpg
ADDED
overlap 42.jpg
ADDED
overlap 43.jpg
ADDED
overlap 44.jpg
ADDED
overlap 45.jpg
ADDED
overlap 46.jpg
ADDED
overlap 47.jpg
ADDED
overlap 48.jpg
ADDED
overlap 49.jpg
ADDED
overlap 5.jpg
ADDED
overlap 50.jpg
ADDED