malibanekg committed on
Commit
e04f4ed
1 Parent(s): 32c7f35

Training in progress, step 500

Browse files
adapter_config.json CHANGED
@@ -7,14 +7,19 @@
7
  "init_lora_weights": true,
8
  "layers_pattern": null,
9
  "layers_to_transform": null,
10
- "lora_alpha": 32,
11
  "lora_dropout": 0.05,
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
- "r": 32,
15
  "revision": null,
16
  "target_modules": [
17
  "q_proj",
 
 
 
 
 
18
  "v_proj"
19
  ],
20
  "task_type": "CAUSAL_LM"
 
7
  "init_lora_weights": true,
8
  "layers_pattern": null,
9
  "layers_to_transform": null,
10
+ "lora_alpha": 64,
11
  "lora_dropout": 0.05,
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
+ "r": 16,
15
  "revision": null,
16
  "target_modules": [
17
  "q_proj",
18
+ "up_proj",
19
+ "o_proj",
20
+ "k_proj",
21
+ "down_proj",
22
+ "gate_proj",
23
  "v_proj"
24
  ],
25
  "task_type": "CAUSAL_LM"
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30ced87f7939b503d56c01b6ec9e3447cfbd1e5fc4784fdb1357e25abe3d4490
3
- size 67154893
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e55120625687c565e690bd8174332fd7986f44332a13a1e7941e1ba86c25ced5
3
+ size 160069389
runs/Dec18_23-16-55_gpu3/events.out.tfevents.1702941425.gpu3.3301.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c03e226a29cbea34ef0c20e0c69c20290767c9b278e2979fad035448068d59c
3
+ size 5169
tokenizer.json CHANGED
@@ -1,11 +1,6 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 512,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
  "padding": null,
10
  "added_tokens": [
11
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5a29bf5877a769de2ed9ae2f45be0f565b383b6404799aebf624f1ed8ded37e
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94c21d71386114f0b1a597033a9077773b7c12a5464db0762dda7c0090069363
3
  size 3963