Training in progress, step 24

Files changed (6) hide show

adapter_config.json CHANGED Viewed

@@ -13,19 +13,16 @@
   "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
-  "modules_to_save": [
-    "embed_tokens",
-    "lm_head"
-  ],
   "peft_type": "LORA",
   "r": 32,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "v_proj",
-    "q_proj",
     "o_proj",
-    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
+  "modules_to_save": null,
   "peft_type": "LORA",
   "r": 32,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "v_proj",
     "o_proj",
+    "k_proj",
+    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:af3ac1c80ecdf708b99c2f7daafdec741f36f9e7b61015425db60fee85f24489
-size 1682049472

 version https://git-lfs.github.com/spec/v1
+oid sha256:0b0fd3a3deaa32b10ddda56ff4259dcd92d17228b9f9e5c23d1a86dff1b4c016
+size 109086416

config.json CHANGED Viewed

@@ -40,5 +40,5 @@
   "torch_dtype": "bfloat16",
   "transformers_version": "4.38.2",
   "use_cache": false,
-  "vocab_size": 32002
 }

   "torch_dtype": "bfloat16",
   "transformers_version": "4.38.2",
   "use_cache": false,
+  "vocab_size": 32000
 }

tokenizer.json CHANGED Viewed

@@ -29,24 +29,6 @@
       "rstrip": false,
       "normalized": false,
       "special": true
-    },
-    {
-      "id": 32000,
-      "content": "[f]",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": false,
-      "normalized": true,
-      "special": false
-    },
-    {
-      "id": 32001,
-      "content": "[c]",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": false,
-      "normalized": true,
-      "special": false
     }
   ],
   "normalizer": {

       "rstrip": false,
       "normalized": false,
       "special": true
     }
   ],
   "normalizer": {

tokenizer_config.json CHANGED Viewed

@@ -25,22 +25,6 @@
       "rstrip": false,
       "single_word": false,
       "special": true
-    },
-    "32000": {
-      "content": "[f]",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "32001": {
-      "content": "[c]",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
     }
   },
   "additional_special_tokens": [],

       "rstrip": false,
       "single_word": false,
       "special": true
     }
   },
   "additional_special_tokens": [],

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c0b044d94ebf37a98aa662dcc3d7d1231cd55dd3890db71add4a7b5d0fe4c352
 size 5688

 version https://git-lfs.github.com/spec/v1
+oid sha256:e55e74ccda3527a8a8b79aa1749c6a5486e93f9f6c7ca173771f1b4d6214b242
 size 5688