AlekseyKorshuk committed on
Commit
5b68e39
1 Parent(s): e8ae835

huggingartists

Browse files
README.md CHANGED
@@ -45,15 +45,15 @@ from datasets import load_dataset
45
  dataset = load_dataset("huggingartists/bring-me-the-horizon")
46
  ```
47
 
48
- [Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/1yuqm1pv/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
49
 
50
  ## Training procedure
51
 
52
  The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on Bring Me The Horizon's lyrics.
53
 
54
- Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/z98a5j5r) for full transparency and reproducibility.
55
 
56
- At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/z98a5j5r/artifacts) is logged and versioned.
57
 
58
  ## How to use
59
 
 
45
  dataset = load_dataset("huggingartists/bring-me-the-horizon")
46
  ```
47
 
48
+ [Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/1e9181i6/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
49
 
50
  ## Training procedure
51
 
52
  The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on Bring Me The Horizon's lyrics.
53
 
54
+ Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/3p7pncir) for full transparency and reproducibility.
55
 
56
+ At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/3p7pncir/artifacts) is logged and versioned.
57
 
58
  ## How to use
59
 
evaluation.txt CHANGED
@@ -1 +1 @@
1
- {"eval_loss": 1.761746883392334, "eval_runtime": 0.4813, "eval_samples_per_second": 74.8, "eval_steps_per_second": 10.389, "epoch": 52.0}
 
1
+ {"eval_loss": 1.3656095266342163, "eval_runtime": 0.4403, "eval_samples_per_second": 74.943, "eval_steps_per_second": 11.355, "epoch": 108.0}
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f60e50a7e388c49df33a2cac5abe57958ed061c6525713fbbaf0e72692b8751
3
  size 497764120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ff98a92d7a8b2e431f9a5a76dd5a5df2cc58d7364acc5e1f5d951bcf0359ec4
3
  size 497764120
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0aec99ac123784c1df18282b656728c10ab998edaa76607406f49892e8c5d190
3
  size 995603825
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4326008d729e27a10c347bbb6a46bd8799a6937e7c1eead85f7e90067bcb0243
3
  size 995603825
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00a416d9b660bc7b7cd01571f1569a51e5c89dfe326c7ea762cb31673f6bdd8a
3
  size 510403817
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6cd18063e45fc379977b2bec642a11331a4fe8b17068ee3c6c7ceb85156ee9e
3
  size 510403817
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a9eb709ab35df7f70905c14ca74e38db768088a1b8d7f8fd0df5af8ff6128c9
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41c13ff59225bf75f6e3a42ec434ae273bb624cc97eb69019e900e7a38315153
3
  size 14503
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bbb036f11beb59109336ec9fefde1522b1dc6499163e8831bd87d849eba417d
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6113b0488c437ba8d289a92febabd7916f0db341f7e47637a541e44c487c9485
3
  size 623
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 1.761746883392334,
3
- "best_model_checkpoint": "output/bring-me-the-horizon/checkpoint-208",
4
  "epoch": 8.0,
5
- "global_step": 208,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -316,11 +316,31 @@
316
  "eval_samples_per_second": 74.353,
317
  "eval_steps_per_second": 10.327,
318
  "step": 208
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
319
  }
320
  ],
321
- "max_steps": 1352,
322
- "num_train_epochs": 52,
323
- "total_flos": 215043342336000.0,
324
  "trial_name": null,
325
  "trial_params": null
326
  }
 
1
  {
2
+ "best_metric": 1.3656095266342163,
3
+ "best_model_checkpoint": "output/bring-me-the-horizon/checkpoint-216",
4
  "epoch": 8.0,
5
+ "global_step": 216,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
316
  "eval_samples_per_second": 74.353,
317
  "eval_steps_per_second": 10.327,
318
  "step": 208
319
+ },
320
+ {
321
+ "epoch": 7.78,
322
+ "learning_rate": 0.00012115064879796188,
323
+ "loss": 1.688,
324
+ "step": 210
325
+ },
326
+ {
327
+ "epoch": 7.96,
328
+ "learning_rate": 0.00013673615134109727,
329
+ "loss": 1.5172,
330
+ "step": 215
331
+ },
332
+ {
333
+ "epoch": 8.0,
334
+ "eval_loss": 1.3656095266342163,
335
+ "eval_runtime": 0.4451,
336
+ "eval_samples_per_second": 74.143,
337
+ "eval_steps_per_second": 11.234,
338
+ "step": 216
339
  }
340
  ],
341
+ "max_steps": 2916,
342
+ "num_train_epochs": 108,
343
+ "total_flos": 222490165248000.0,
344
  "trial_name": null,
345
  "trial_params": null
346
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a61175f6b4282876536474ec422652e78dcd99a973713a9795eb16ce4347ccb
3
  size 2863
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77d7737b562948aaba74d132cdb2242f8cd3659133b02f42a93887fc2f475c32
3
  size 2863