AlekseyKorshuk committed on
Commit
c134d7b
1 Parent(s): b5d5f55

huggingartists

Browse files
README.md CHANGED
@@ -45,15 +45,15 @@ from datasets import load_dataset
45
  dataset = load_dataset("huggingartists/og-buda")
46
  ```
47
 
48
- [Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/3fm004ry/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
49
 
50
  ## Training procedure
51
 
52
  The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on OG Buda's lyrics.
53
 
54
- Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/3r1oo0se) for full transparency and reproducibility.
55
 
56
- At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/3r1oo0se/artifacts) is logged and versioned.
57
 
58
  ## How to use
59
 
 
45
  dataset = load_dataset("huggingartists/og-buda")
46
  ```
47
 
48
+ [Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/19koddag/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
49
 
50
  ## Training procedure
51
 
52
  The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on OG Buda's lyrics.
53
 
54
+ Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/2pjx3dty) for full transparency and reproducibility.
55
 
56
+ At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/2pjx3dty/artifacts) is logged and versioned.
57
 
58
  ## How to use
59
 
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "gpt2",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -35,7 +35,7 @@
35
  }
36
  },
37
  "torch_dtype": "float32",
38
- "transformers_version": "4.10.0",
39
  "use_cache": true,
40
  "vocab_size": 50257
41
  }
 
1
  {
2
+ "_name_or_path": "huggingartists/og-buda",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
35
  }
36
  },
37
  "torch_dtype": "float32",
38
+ "transformers_version": "4.10.2",
39
  "use_cache": true,
40
  "vocab_size": 50257
41
  }
evaluation.txt CHANGED
@@ -1 +1 @@
1
- {"eval_loss": 1.7267966270446777, "eval_runtime": 9.827, "eval_samples_per_second": 22.082, "eval_steps_per_second": 2.849, "epoch": 3.0}
 
1
+ {"eval_loss": 1.6688779592514038, "eval_runtime": 9.5584, "eval_samples_per_second": 20.819, "eval_steps_per_second": 2.616, "epoch": 4.0}
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2b95c809621b3aecc74a1c90f3c824a1a3a2d6ce143dee337193937ebba7bd0
3
  size 497764120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e333fb388e02210c1f3ff984ad6c4d21e6d008bcab46dfd83e150235f59d89bc
3
  size 497764120
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f804530839f0ce5add3c90035df250c1e521fbcfc6c6b9411ff5d93495bc79f
3
  size 995604017
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ebbd0aa38a33ae4017b166fd8f1134893410206219de2130750e6d7d5f39b3e
3
  size 995604017
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:860c0ba6e9c4d2a7b8cf3014a15ef0dd7d194bc3e7624e85d836256662aaeb56
3
  size 510403817
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cb6cef5d2d7cbde31a058ffa3aefb7f08a7a2e4806e882a70db75aeff20abb1
3
  size 510403817
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9ef718cfc6030c7cccdc844d0b97e7bd680aadecd264b3ef13b83e80663d3b7
3
  size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a598a815349f8b1988c86709fdd881dafa589aaad49c7f20d98d3860abe8f36f
3
  size 14567
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5824e0331cc12edcb39b03d3f95b3b9ecd34a42ea9c54b7208dfa4115ef580e
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e86c0f8b5c2b1ad48d13df79807268e5d50299fba1287501961674ecf5c92d8c
3
  size 623
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"unk_token": "<|endoftext|>", "bos_token": "<|endoftext|>", "eos_token": "<|endoftext|>", "add_prefix_space": false, "model_max_length": 1024, "special_tokens_map_file": null, "name_or_path": "gpt2", "tokenizer_class": "GPT2Tokenizer"}
 
1
+ {"unk_token": "<|endoftext|>", "bos_token": "<|endoftext|>", "eos_token": "<|endoftext|>", "add_prefix_space": false, "model_max_length": 1024, "special_tokens_map_file": null, "name_or_path": "huggingartists/og-buda", "tokenizer_class": "GPT2Tokenizer"}
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 1.7267966270446777,
3
- "best_model_checkpoint": "output/og-buda/checkpoint-456",
4
  "epoch": 3.0,
5
- "global_step": 456,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -576,11 +576,25 @@
576
  "eval_samples_per_second": 22.262,
577
  "eval_steps_per_second": 2.872,
578
  "step": 456
 
 
 
 
 
 
 
 
 
 
 
 
 
 
579
  }
580
  ],
581
- "max_steps": 456,
582
- "num_train_epochs": 3,
583
- "total_flos": 475028914176000.0,
584
  "trial_name": null,
585
  "trial_params": null
586
  }
 
1
  {
2
+ "best_metric": 1.6688779592514038,
3
+ "best_model_checkpoint": "output/og-buda/checkpoint-462",
4
  "epoch": 3.0,
5
+ "global_step": 462,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
576
  "eval_samples_per_second": 22.262,
577
  "eval_steps_per_second": 2.872,
578
  "step": 456
579
+ },
580
+ {
581
+ "epoch": 2.99,
582
+ "learning_rate": 5.708896496161406e-08,
583
+ "loss": 1.777,
584
+ "step": 460
585
+ },
586
+ {
587
+ "epoch": 3.0,
588
+ "eval_loss": 1.6688779592514038,
589
+ "eval_runtime": 9.6717,
590
+ "eval_samples_per_second": 20.576,
591
+ "eval_steps_per_second": 2.585,
592
+ "step": 462
593
  }
594
  ],
595
+ "max_steps": 616,
596
+ "num_train_epochs": 4,
597
+ "total_flos": 481038630912000.0,
598
  "trial_name": null,
599
  "trial_params": null
600
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c861e4bf6fefedbd0432d0ecc6f44737e89f7d8fcebe4c1d079577fd5ea0a59
3
  size 2671
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14e6c3bf99fa49e34d3e8e2fd8f9080f73be0573bb5ad5de841304e2c8bb6fc0
3
  size 2671