sanchit-gandhi HF staff committed on
Commit
c415bc5
1 Parent(s): 6fd09e1

End of training

Browse files
Files changed (5) hide show
  1. README.md +6 -1
  2. all_results.json +11 -11
  3. eval_results.json +6 -6
  4. train_results.json +6 -6
  5. trainer_state.json +40 -255
README.md CHANGED
@@ -2,6 +2,8 @@
2
  license: cc-by-nc-4.0
3
  library_name: peft
4
  tags:
 
 
5
  - generated_from_trainer
6
  base_model: facebook/musicgen-melody-large
7
  model-index:
@@ -16,7 +18,10 @@ should probably proofread and complete it, then remove this comment. -->
16
  [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/sanchit-gandhi/black-eyed-peas/runs/6y8tlzp8)
17
  # black-eyed-peas-v1-unprompted
18
 
19
- This model is a fine-tuned version of [facebook/musicgen-melody-large](https://huggingface.co/facebook/musicgen-melody-large) on an unknown dataset.
 
 
 
20
 
21
  ## Model description
22
 
 
2
  license: cc-by-nc-4.0
3
  library_name: peft
4
  tags:
5
+ - text-to-audio
6
+ - sweet-dreambooths/black-eyed-peas-v1
7
  - generated_from_trainer
8
  base_model: facebook/musicgen-melody-large
9
  model-index:
 
18
  [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/sanchit-gandhi/black-eyed-peas/runs/6y8tlzp8)
19
  # black-eyed-peas-v1-unprompted
20
 
21
+ This model is a fine-tuned version of [facebook/musicgen-melody-large](https://huggingface.co/facebook/musicgen-melody-large) on the SWEET-DREAMBOOTHS/BLACK-EYED-PEAS-V1 - DEFAULT dataset.
22
+ It achieves the following results on the evaluation set:
23
+ - Loss: 3.0117
24
+ - Clap: 0.0264
25
 
26
  ## Model description
27
 
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
- "epoch": 1.9834710743801653,
3
- "eval_clap": -0.06337755173444748,
4
- "eval_loss": 5.031132698059082,
5
- "eval_runtime": 238.3424,
6
  "eval_samples": 8,
7
- "eval_samples_per_second": 0.034,
8
- "eval_steps_per_second": 0.034,
9
- "total_flos": 26305190573760.0,
10
- "train_loss": 6.993270270029703,
11
- "train_runtime": 2006.6605,
12
  "train_samples": 121,
13
- "train_samples_per_second": 0.121,
14
- "train_steps_per_second": 0.015
15
  }
 
1
  {
2
+ "epoch": 0.9256198347107438,
3
+ "eval_clap": 0.026393521577119827,
4
+ "eval_loss": 3.011723279953003,
5
+ "eval_runtime": 167.6466,
6
  "eval_samples": 8,
7
+ "eval_samples_per_second": 0.048,
8
+ "eval_steps_per_second": 0.048,
9
+ "total_flos": 12275755601088.0,
10
+ "train_loss": 9.150690759931292,
11
+ "train_runtime": 313.5661,
12
  "train_samples": 121,
13
+ "train_samples_per_second": 0.386,
14
+ "train_steps_per_second": 0.022
15
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 1.9834710743801653,
3
- "eval_clap": -0.06337755173444748,
4
- "eval_loss": 5.031132698059082,
5
- "eval_runtime": 238.3424,
6
  "eval_samples": 8,
7
- "eval_samples_per_second": 0.034,
8
- "eval_steps_per_second": 0.034
9
  }
 
1
  {
2
+ "epoch": 0.9256198347107438,
3
+ "eval_clap": 0.026393521577119827,
4
+ "eval_loss": 3.011723279953003,
5
+ "eval_runtime": 167.6466,
6
  "eval_samples": 8,
7
+ "eval_samples_per_second": 0.048,
8
+ "eval_steps_per_second": 0.048
9
  }
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 1.9834710743801653,
3
- "total_flos": 26305190573760.0,
4
- "train_loss": 6.993270270029703,
5
- "train_runtime": 2006.6605,
6
  "train_samples": 121,
7
- "train_samples_per_second": 0.121,
8
- "train_steps_per_second": 0.015
9
  }
 
1
  {
2
+ "epoch": 0.9256198347107438,
3
+ "total_flos": 12275755601088.0,
4
+ "train_loss": 9.150690759931292,
5
+ "train_runtime": 313.5661,
6
  "train_samples": 121,
7
+ "train_samples_per_second": 0.386,
8
+ "train_steps_per_second": 0.022
9
  }
trainer_state.json CHANGED
@@ -1,291 +1,76 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.9834710743801653,
5
- "eval_steps": 5,
6
- "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
- {
12
- "epoch": 0.06611570247933884,
13
- "grad_norm": 1.9830907583236694,
14
- "learning_rate": 0.00019333333333333333,
15
- "loss": 10.1125,
16
- "step": 1
17
- },
18
  {
19
  "epoch": 0.1322314049586777,
20
- "grad_norm": 2.0950465202331543,
21
- "learning_rate": 0.0001866666666666667,
22
- "loss": 9.9005,
23
- "step": 2
24
- },
25
- {
26
- "epoch": 0.19834710743801653,
27
- "grad_norm": 2.9728968143463135,
28
- "learning_rate": 0.00018,
29
- "loss": 9.7099,
30
- "step": 3
31
  },
32
  {
33
  "epoch": 0.2644628099173554,
34
- "grad_norm": 3.350935935974121,
35
- "learning_rate": 0.00017333333333333334,
36
- "loss": 8.944,
37
- "step": 4
38
- },
39
- {
40
- "epoch": 0.3305785123966942,
41
- "grad_norm": 3.183183431625366,
42
- "learning_rate": 0.0001666666666666667,
43
- "loss": 8.2807,
44
- "step": 5
45
- },
46
- {
47
- "epoch": 0.3305785123966942,
48
- "eval_clap": 0.016216065734624863,
49
- "eval_loss": 3.0157957077026367,
50
- "eval_runtime": 243.8548,
51
- "eval_samples_per_second": 0.033,
52
- "eval_steps_per_second": 0.033,
53
- "step": 5
54
  },
55
  {
56
  "epoch": 0.39669421487603307,
57
- "grad_norm": 4.646206855773926,
58
- "learning_rate": 0.00016,
59
- "loss": 7.7738,
60
- "step": 6
61
- },
62
- {
63
- "epoch": 0.4628099173553719,
64
- "grad_norm": 7.790807723999023,
65
- "learning_rate": 0.00015333333333333334,
66
- "loss": 7.5699,
67
- "step": 7
68
  },
69
  {
70
  "epoch": 0.5289256198347108,
71
- "grad_norm": 5.643434047698975,
72
- "learning_rate": 0.00014666666666666666,
73
- "loss": 7.139,
74
- "step": 8
75
- },
76
- {
77
- "epoch": 0.5950413223140496,
78
- "grad_norm": 3.7166173458099365,
79
- "learning_rate": 0.00014,
80
- "loss": 7.129,
81
- "step": 9
82
- },
83
- {
84
- "epoch": 0.6611570247933884,
85
- "grad_norm": 2.310825824737549,
86
- "learning_rate": 0.00013333333333333334,
87
- "loss": 6.536,
88
- "step": 10
89
  },
90
  {
91
  "epoch": 0.6611570247933884,
92
- "eval_clap": 0.007407550700008869,
93
- "eval_loss": 3.2537384033203125,
94
- "eval_runtime": 229.6949,
95
- "eval_samples_per_second": 0.035,
96
- "eval_steps_per_second": 0.035,
97
- "step": 10
98
- },
99
- {
100
- "epoch": 0.7272727272727273,
101
- "grad_norm": 3.1138978004455566,
102
- "learning_rate": 0.00012666666666666666,
103
- "loss": 7.0649,
104
- "step": 11
105
  },
106
  {
107
  "epoch": 0.7933884297520661,
108
- "grad_norm": 1.9888191223144531,
109
- "learning_rate": 0.00012,
110
- "loss": 6.579,
111
- "step": 12
112
- },
113
- {
114
- "epoch": 0.859504132231405,
115
- "grad_norm": 2.7568395137786865,
116
- "learning_rate": 0.00011333333333333334,
117
- "loss": 6.927,
118
- "step": 13
119
  },
120
  {
121
  "epoch": 0.9256198347107438,
122
- "grad_norm": 1.5047709941864014,
123
- "learning_rate": 0.00010666666666666667,
124
- "loss": 6.4366,
125
- "step": 14
126
- },
127
- {
128
- "epoch": 0.9917355371900827,
129
- "grad_norm": 1.930873155593872,
130
- "learning_rate": 0.0001,
131
- "loss": 6.1596,
132
- "step": 15
133
- },
134
- {
135
- "epoch": 0.9917355371900827,
136
- "eval_clap": -0.039488501846790314,
137
- "eval_loss": 4.296116828918457,
138
- "eval_runtime": 237.1954,
139
- "eval_samples_per_second": 0.034,
140
- "eval_steps_per_second": 0.034,
141
- "step": 15
142
- },
143
- {
144
- "epoch": 1.0578512396694215,
145
- "grad_norm": 1.186317801475525,
146
- "learning_rate": 9.333333333333334e-05,
147
- "loss": 6.3429,
148
- "step": 16
149
- },
150
- {
151
- "epoch": 1.1239669421487604,
152
- "grad_norm": 1.2925118207931519,
153
- "learning_rate": 8.666666666666667e-05,
154
- "loss": 6.1757,
155
- "step": 17
156
- },
157
- {
158
- "epoch": 1.1900826446280992,
159
- "grad_norm": 0.9777997136116028,
160
- "learning_rate": 8e-05,
161
- "loss": 6.2497,
162
- "step": 18
163
- },
164
- {
165
- "epoch": 1.256198347107438,
166
- "grad_norm": 1.5951266288757324,
167
- "learning_rate": 7.333333333333333e-05,
168
- "loss": 6.3316,
169
- "step": 19
170
- },
171
- {
172
- "epoch": 1.322314049586777,
173
- "grad_norm": 1.7874397039413452,
174
- "learning_rate": 6.666666666666667e-05,
175
- "loss": 6.44,
176
- "step": 20
177
- },
178
- {
179
- "epoch": 1.322314049586777,
180
- "eval_clap": -0.038016706705093384,
181
- "eval_loss": 4.876384258270264,
182
- "eval_runtime": 233.9024,
183
- "eval_samples_per_second": 0.034,
184
- "eval_steps_per_second": 0.034,
185
- "step": 20
186
- },
187
- {
188
- "epoch": 1.3884297520661157,
189
- "grad_norm": 1.0251847505569458,
190
- "learning_rate": 6e-05,
191
- "loss": 6.0348,
192
- "step": 21
193
- },
194
- {
195
- "epoch": 1.4545454545454546,
196
- "grad_norm": 0.8240154981613159,
197
- "learning_rate": 5.333333333333333e-05,
198
- "loss": 6.1891,
199
- "step": 22
200
- },
201
- {
202
- "epoch": 1.5206611570247934,
203
- "grad_norm": 1.571574091911316,
204
- "learning_rate": 4.666666666666667e-05,
205
- "loss": 5.89,
206
- "step": 23
207
- },
208
- {
209
- "epoch": 1.5867768595041323,
210
- "grad_norm": 0.9506106376647949,
211
- "learning_rate": 4e-05,
212
- "loss": 6.2511,
213
- "step": 24
214
- },
215
- {
216
- "epoch": 1.6528925619834711,
217
- "grad_norm": 1.503645420074463,
218
- "learning_rate": 3.3333333333333335e-05,
219
- "loss": 6.4944,
220
- "step": 25
221
- },
222
- {
223
- "epoch": 1.6528925619834711,
224
- "eval_clap": -0.05864603444933891,
225
- "eval_loss": 5.022668361663818,
226
- "eval_runtime": 237.1887,
227
- "eval_samples_per_second": 0.034,
228
- "eval_steps_per_second": 0.034,
229
- "step": 25
230
- },
231
- {
232
- "epoch": 1.71900826446281,
233
- "grad_norm": 1.0225498676300049,
234
- "learning_rate": 2.6666666666666667e-05,
235
- "loss": 6.2162,
236
- "step": 26
237
- },
238
- {
239
- "epoch": 1.7851239669421488,
240
- "grad_norm": 1.566749930381775,
241
- "learning_rate": 2e-05,
242
- "loss": 6.2582,
243
- "step": 27
244
- },
245
- {
246
- "epoch": 1.8512396694214877,
247
- "grad_norm": 1.3055825233459473,
248
- "learning_rate": 1.3333333333333333e-05,
249
- "loss": 6.1079,
250
- "step": 28
251
- },
252
- {
253
- "epoch": 1.9173553719008265,
254
- "grad_norm": 0.9658945798873901,
255
- "learning_rate": 6.666666666666667e-06,
256
- "loss": 6.1765,
257
- "step": 29
258
- },
259
- {
260
- "epoch": 1.9834710743801653,
261
- "grad_norm": 1.0808743238449097,
262
  "learning_rate": 0.0,
263
- "loss": 6.3776,
264
- "step": 30
265
- },
266
- {
267
- "epoch": 1.9834710743801653,
268
- "eval_clap": -0.05411681905388832,
269
- "eval_loss": 5.031132698059082,
270
- "eval_runtime": 232.4736,
271
- "eval_samples_per_second": 0.034,
272
- "eval_steps_per_second": 0.034,
273
- "step": 30
274
  },
275
  {
276
- "epoch": 1.9834710743801653,
277
- "step": 30,
278
- "total_flos": 26305190573760.0,
279
- "train_loss": 6.993270270029703,
280
- "train_runtime": 2006.6605,
281
- "train_samples_per_second": 0.121,
282
- "train_steps_per_second": 0.015
283
  }
284
  ],
285
  "logging_steps": 1.0,
286
- "max_steps": 30,
287
  "num_input_tokens_seen": 0,
288
- "num_train_epochs": 2,
289
  "save_steps": 500,
290
  "stateful_callbacks": {
291
  "TrainerControl": {
@@ -299,7 +84,7 @@
299
  "attributes": {}
300
  }
301
  },
302
- "total_flos": 26305190573760.0,
303
  "train_batch_size": 1,
304
  "trial_name": null,
305
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9256198347107438,
5
+ "eval_steps": 30,
6
+ "global_step": 7,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
11
  {
12
  "epoch": 0.1322314049586777,
13
+ "grad_norm": 1.7038763761520386,
14
+ "learning_rate": 0.00017142857142857143,
15
+ "loss": 10.0955,
16
+ "step": 1
 
 
 
 
 
 
 
17
  },
18
  {
19
  "epoch": 0.2644628099173554,
20
+ "grad_norm": 1.7832878828048706,
21
+ "learning_rate": 0.00014285714285714287,
22
+ "loss": 10.0281,
23
+ "step": 2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
24
  },
25
  {
26
  "epoch": 0.39669421487603307,
27
+ "grad_norm": 2.6710143089294434,
28
+ "learning_rate": 0.00011428571428571428,
29
+ "loss": 9.5219,
30
+ "step": 3
 
 
 
 
 
 
 
31
  },
32
  {
33
  "epoch": 0.5289256198347108,
34
+ "grad_norm": 3.564816951751709,
35
+ "learning_rate": 8.571428571428571e-05,
36
+ "loss": 9.0921,
37
+ "step": 4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
  },
39
  {
40
  "epoch": 0.6611570247933884,
41
+ "grad_norm": 3.5809993743896484,
42
+ "learning_rate": 5.714285714285714e-05,
43
+ "loss": 8.6465,
44
+ "step": 5
 
 
 
 
 
 
 
 
 
45
  },
46
  {
47
  "epoch": 0.7933884297520661,
48
+ "grad_norm": 2.9257972240448,
49
+ "learning_rate": 2.857142857142857e-05,
50
+ "loss": 8.3989,
51
+ "step": 6
 
 
 
 
 
 
 
52
  },
53
  {
54
  "epoch": 0.9256198347107438,
55
+ "grad_norm": 3.141226291656494,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
56
  "learning_rate": 0.0,
57
+ "loss": 8.2718,
58
+ "step": 7
 
 
 
 
 
 
 
 
 
59
  },
60
  {
61
+ "epoch": 0.9256198347107438,
62
+ "step": 7,
63
+ "total_flos": 12275755601088.0,
64
+ "train_loss": 9.150690759931292,
65
+ "train_runtime": 313.5661,
66
+ "train_samples_per_second": 0.386,
67
+ "train_steps_per_second": 0.022
68
  }
69
  ],
70
  "logging_steps": 1.0,
71
+ "max_steps": 7,
72
  "num_input_tokens_seen": 0,
73
+ "num_train_epochs": 1,
74
  "save_steps": 500,
75
  "stateful_callbacks": {
76
  "TrainerControl": {
 
84
  "attributes": {}
85
  }
86
  },
87
+ "total_flos": 12275755601088.0,
88
  "train_batch_size": 1,
89
  "trial_name": null,
90
  "trial_params": null