sridhar1111111111111111 committed
Commit e96b855
1 Parent(s): ab90aef

gemma2B-It-Medical-Finetuned-2epochs

README.md CHANGED
@@ -37,13 +37,13 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 0.0002
 - train_batch_size: 2
-- eval_batch_size: 8
+- eval_batch_size: 2
 - seed: 42
 - gradient_accumulation_steps: 8
 - total_train_batch_size: 16
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- num_epochs: 2
+- training_steps: 140
 
 ### Training results
 
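The updated hyperparameters map one-to-one onto `transformers.TrainingArguments`. Below is a minimal sketch of that mapping, assuming the standard `transformers` API; the `output_dir` value is a placeholder. Note that `total_train_batch_size: 16` is derived rather than set: train_batch_size (2) x gradient_accumulation_steps (8).

```python
# Hedged sketch: the README's hyperparameters expressed as
# transformers.TrainingArguments. output_dir is a placeholder.
from transformers import TrainingArguments

args = TrainingArguments(
    output_dir="gemma2B-It-Medical-Finetuned-2epochs",  # placeholder
    learning_rate=2e-4,
    per_device_train_batch_size=2,
    per_device_eval_batch_size=2,   # changed from 8 in this commit
    gradient_accumulation_steps=8,  # effective batch: 2 * 8 = 16
    seed=42,
    lr_scheduler_type="linear",
    max_steps=140,                  # replaces the earlier num_epochs: 2
    adam_beta1=0.9,                 # Adam betas=(0.9, 0.999)
    adam_beta2=0.999,
    adam_epsilon=1e-8,              # epsilon=1e-08
)
```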
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "google/gemma-2b-it",
+  "base_model_name_or_path": null,
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -15,17 +15,17 @@
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
-  "r": 32,
+  "r": 16,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "k_proj",
-    "down_proj",
     "q_proj",
     "up_proj",
+    "down_proj",
+    "v_proj",
+    "k_proj",
     "gate_proj",
-    "o_proj",
-    "v_proj"
+    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false
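The new config corresponds to a `peft` `LoraConfig` with rank 16 targeting all seven Gemma projection modules. A minimal sketch, assuming the `peft` library's `LoraConfig` API; the `lora_alpha` value is not visible in this diff, so the one below is a placeholder:

```python
# Hedged sketch of the adapter configuration after this commit.
from peft import LoraConfig

config = LoraConfig(
    r=16,           # rank lowered from 32 in this commit
    lora_alpha=16,  # placeholder: alpha is not shown in the diff
    target_modules=[
        "q_proj", "up_proj", "down_proj", "v_proj",
        "k_proj", "gate_proj", "o_proj",
    ],
    bias="none",
    fan_in_fan_out=False,
    use_rslora=False,
    task_type="CAUSAL_LM",
)
```

Note that `base_model_name_or_path` was changed from "google/gemma-2b-it" to null, so tools that resolve the base model from the adapter config (e.g. `AutoPeftModelForCausalLM`) can no longer do so automatically; the base model has to be loaded explicitly and passed to `PeftModel.from_pretrained`.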
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:934c9dc96cbcbdf7a0291059d54fad03ea27608fa06c284ed0be9e650bc1b8c3
-size 156926880
+oid sha256:564baef948c1c3ec200d528fd06a5fcd757bff2b54a677d3190b1dae17846cb8
+size 78484352
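The new adapter checkpoint is about half the size of the old one, which is consistent with the rank change above: LoRA parameter count scales linearly with r, and r dropped from 32 to 16. A quick sanity check:

```python
# LoRA adds matrices A (r x d_in) and B (d_out x r) per target module,
# so parameter count, and hence checkpoint size, scales linearly with r.
old_size, new_size = 156_926_880, 78_484_352  # bytes, from the LFS pointers
print(old_size / new_size)  # ~2.0, matching r: 32 -> 16
```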
runs/Mar27_09-49-24_5c1c4e61306f/events.out.tfevents.1711532972.5c1c4e61306f.406.0 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e5270e5a589353335a36f2a78ad9adb0cfe06ccc49d1b674be5f333b7c32c41f
+size 4996
runs/Mar27_09-50-41_5c1c4e61306f/events.out.tfevents.1711533047.5c1c4e61306f.406.1 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be2aa91aba0cadf3fbb7987d2d125bd9d93617195d7a91e1e982786edac16a43
+size 8257
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77c7ac08fea4403b0d9beed0ef5095552d19edd85f199fb8f60683b4c33202f6
+oid sha256:d762cae44da0ef032ea87b818369afc5bca58006ca7507457c9fb71cee95e261
 size 4920