huggingartists

Files changed (9) hide show

README.md CHANGED Viewed

@@ -45,15 +45,15 @@ from datasets import load_dataset
 dataset = load_dataset("huggingartists/slava-marlow")
 ```
-[Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/dajo6l0v/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
 ## Training procedure
 The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on SLAVA MARLOW's lyrics.
-Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/1djy4mi8) for full transparency and reproducibility.
-At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/1djy4mi8/artifacts) is logged and versioned.
 ## How to use

 dataset = load_dataset("huggingartists/slava-marlow")
 ```
+[Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/1fdcz1s5/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
 ## Training procedure
 The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on SLAVA MARLOW's lyrics.
+Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/ro4q353s) for full transparency and reproducibility.
+At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/ro4q353s/artifacts) is logged and versioned.
 ## How to use

evaluation.txt CHANGED Viewed

	@@ -1 +1 @@
1	- {"eval_loss": 1.5765409469604492, "eval_runtime": 8.007, "eval_samples_per_second": 21.232, "eval_steps_per_second": 2.748, "epoch": 3.0}


1	+ {"eval_loss": 1.3606982231140137, "eval_runtime": 7.3833, "eval_samples_per_second": 21.129, "eval_steps_per_second": 2.709, "epoch": 4.0}

flax_model.msgpack CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0f31f81a0ff5da76be1d7744122ddaa1d4c33c954bdadcae9976300407273a91
 size 497764120

 version https://git-lfs.github.com/spec/v1
+oid sha256:6de5112cbe4228b802fb6b2f1d86b9101d8c460145da927df0d9af62e9757cf1
 size 497764120

optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e61f1c361c857b02d5d0830f1edf1460b1f7dab9003211a02897fe30b5bd91d1
 size 995604017

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ae00f5bac3f0549cbee7f9952c6fd26ec32ab79e31649b794d02118952f2e52
 size 995604017

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1fc237e81048121824c38df56404ddd7899a39fab731a11c12988aa8ebd5164c
 size 510403817

 version https://git-lfs.github.com/spec/v1
+oid sha256:70f27c25592190cf50121c5b3c309fea728d24a5d25c2956b78b878b1c9671b7
 size 510403817

rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5960c90ad81f7699bd122a5bfa6732fd3b57d2883f4ba4ed0d4dd0a79b0596f4
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:c45f584f404ff6c35b7f091be7f153b417156dd52345a73889f7b7af6e5bb990
 size 14503

scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8267538b8f71047573a2bf4b20b591f7a175ff510694f359e666cbbd6a22e8c0
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:268ef632d221476fc1686df5234f05a490d4a9176c570d0dcb5fdb5ff616d0fe
 size 623

trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-  "best_metric": 1.5765409469604492,
-  "best_model_checkpoint": "output/slava-marlow/checkpoint-327",
   "epoch": 3.0,
-  "global_step": 327,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -404,11 +404,25 @@
       "eval_samples_per_second": 21.227,
       "eval_steps_per_second": 2.747,
       "step": 327
     }
   ],
-  "max_steps": 327,
-  "num_train_epochs": 3,
-  "total_flos": 340594163712000.0,
   "trial_name": null,
   "trial_params": null
 }

 {
+  "best_metric": 1.3606982231140137,
+  "best_model_checkpoint": "output/slava-marlow/checkpoint-333",
   "epoch": 3.0,
+  "global_step": 333,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 21.227,
       "eval_steps_per_second": 2.747,
       "step": 327
+    },
+    {
+      "epoch": 2.97,
+      "learning_rate": 2.4713228598268823e-07,
+      "loss": 1.5213,
+      "step": 330
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 1.3606982231140137,
+      "eval_runtime": 7.4703,
+      "eval_samples_per_second": 20.883,
+      "eval_steps_per_second": 2.677,
+      "step": 333
     }
   ],
+  "max_steps": 444,
+  "num_train_epochs": 4,
+  "total_flos": 346081296384000.0,
   "trial_name": null,
   "trial_params": null
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d77fa0328ab599e88846dcdcfe668efcd1424c4a8c70e39af87fe4768ee0b599
 size 2863

 version https://git-lfs.github.com/spec/v1
+oid sha256:0bc20d77a5f3b1a200d6fd4c842752a456cf12cc4cfe556a9debe895cae75c6a
 size 2863