Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8a043da359e951e6996e778beed5122d81d075566be927632d84938826a8e47
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9604bdd336350d342e616cfb7a56db3fb21f064fe8ef2bc9113733c502c4d3e
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81405a8c8546822be2693be905dc62e59a56142d229cee21fc214d56bbd5dfda
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63f129be760a286f5a80a006036753c37e86aa084acfce99dba6218705fd5ce7
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -58,3 +58,29 @@
|
|
58 |
{"current_steps": 560, "total_steps": 825, "loss": 0.6351, "learning_rate": 5e-06, "epoch": 2.036363636363636, "percentage": 67.88, "elapsed_time": "0:59:27", "remaining_time": "0:28:08"}
|
59 |
{"current_steps": 570, "total_steps": 825, "loss": 0.6307, "learning_rate": 5e-06, "epoch": 2.0727272727272728, "percentage": 69.09, "elapsed_time": "1:00:26", "remaining_time": "0:27:02"}
|
60 |
{"current_steps": 580, "total_steps": 825, "loss": 0.6357, "learning_rate": 5e-06, "epoch": 2.109090909090909, "percentage": 70.3, "elapsed_time": "1:01:25", "remaining_time": "0:25:56"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
58 |
{"current_steps": 560, "total_steps": 825, "loss": 0.6351, "learning_rate": 5e-06, "epoch": 2.036363636363636, "percentage": 67.88, "elapsed_time": "0:59:27", "remaining_time": "0:28:08"}
|
59 |
{"current_steps": 570, "total_steps": 825, "loss": 0.6307, "learning_rate": 5e-06, "epoch": 2.0727272727272728, "percentage": 69.09, "elapsed_time": "1:00:26", "remaining_time": "0:27:02"}
|
60 |
{"current_steps": 580, "total_steps": 825, "loss": 0.6357, "learning_rate": 5e-06, "epoch": 2.109090909090909, "percentage": 70.3, "elapsed_time": "1:01:25", "remaining_time": "0:25:56"}
|
61 |
+
{"current_steps": 590, "total_steps": 825, "loss": 0.6375, "learning_rate": 5e-06, "epoch": 2.1454545454545455, "percentage": 71.52, "elapsed_time": "1:02:24", "remaining_time": "0:24:51"}
|
62 |
+
{"current_steps": 600, "total_steps": 825, "loss": 0.635, "learning_rate": 5e-06, "epoch": 2.1818181818181817, "percentage": 72.73, "elapsed_time": "1:03:23", "remaining_time": "0:23:46"}
|
63 |
+
{"current_steps": 610, "total_steps": 825, "loss": 0.6383, "learning_rate": 5e-06, "epoch": 2.2181818181818183, "percentage": 73.94, "elapsed_time": "1:04:22", "remaining_time": "0:22:41"}
|
64 |
+
{"current_steps": 620, "total_steps": 825, "loss": 0.6321, "learning_rate": 5e-06, "epoch": 2.2545454545454544, "percentage": 75.15, "elapsed_time": "1:05:21", "remaining_time": "0:21:36"}
|
65 |
+
{"current_steps": 630, "total_steps": 825, "loss": 0.6341, "learning_rate": 5e-06, "epoch": 2.290909090909091, "percentage": 76.36, "elapsed_time": "1:06:21", "remaining_time": "0:20:32"}
|
66 |
+
{"current_steps": 640, "total_steps": 825, "loss": 0.6326, "learning_rate": 5e-06, "epoch": 2.327272727272727, "percentage": 77.58, "elapsed_time": "1:07:20", "remaining_time": "0:19:27"}
|
67 |
+
{"current_steps": 650, "total_steps": 825, "loss": 0.6385, "learning_rate": 5e-06, "epoch": 2.3636363636363638, "percentage": 78.79, "elapsed_time": "1:08:19", "remaining_time": "0:18:23"}
|
68 |
+
{"current_steps": 660, "total_steps": 825, "loss": 0.6373, "learning_rate": 5e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "1:09:19", "remaining_time": "0:17:19"}
|
69 |
+
{"current_steps": 670, "total_steps": 825, "loss": 0.6399, "learning_rate": 5e-06, "epoch": 2.4363636363636365, "percentage": 81.21, "elapsed_time": "1:10:17", "remaining_time": "0:16:15"}
|
70 |
+
{"current_steps": 680, "total_steps": 825, "loss": 0.6393, "learning_rate": 5e-06, "epoch": 2.4727272727272727, "percentage": 82.42, "elapsed_time": "1:11:16", "remaining_time": "0:15:11"}
|
71 |
+
{"current_steps": 690, "total_steps": 825, "loss": 0.6405, "learning_rate": 5e-06, "epoch": 2.509090909090909, "percentage": 83.64, "elapsed_time": "1:12:15", "remaining_time": "0:14:08"}
|
72 |
+
{"current_steps": 700, "total_steps": 825, "loss": 0.6385, "learning_rate": 5e-06, "epoch": 2.5454545454545454, "percentage": 84.85, "elapsed_time": "1:13:15", "remaining_time": "0:13:04"}
|
73 |
+
{"current_steps": 710, "total_steps": 825, "loss": 0.6377, "learning_rate": 5e-06, "epoch": 2.581818181818182, "percentage": 86.06, "elapsed_time": "1:14:15", "remaining_time": "0:12:01"}
|
74 |
+
{"current_steps": 720, "total_steps": 825, "loss": 0.6427, "learning_rate": 5e-06, "epoch": 2.618181818181818, "percentage": 87.27, "elapsed_time": "1:15:14", "remaining_time": "0:10:58"}
|
75 |
+
{"current_steps": 730, "total_steps": 825, "loss": 0.6346, "learning_rate": 5e-06, "epoch": 2.6545454545454543, "percentage": 88.48, "elapsed_time": "1:16:14", "remaining_time": "0:09:55"}
|
76 |
+
{"current_steps": 740, "total_steps": 825, "loss": 0.6414, "learning_rate": 5e-06, "epoch": 2.690909090909091, "percentage": 89.7, "elapsed_time": "1:17:13", "remaining_time": "0:08:52"}
|
77 |
+
{"current_steps": 750, "total_steps": 825, "loss": 0.6363, "learning_rate": 5e-06, "epoch": 2.7272727272727275, "percentage": 90.91, "elapsed_time": "1:18:13", "remaining_time": "0:07:49"}
|
78 |
+
{"current_steps": 760, "total_steps": 825, "loss": 0.6421, "learning_rate": 5e-06, "epoch": 2.7636363636363637, "percentage": 92.12, "elapsed_time": "1:19:12", "remaining_time": "0:06:46"}
|
79 |
+
{"current_steps": 770, "total_steps": 825, "loss": 0.6356, "learning_rate": 5e-06, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "1:20:10", "remaining_time": "0:05:43"}
|
80 |
+
{"current_steps": 780, "total_steps": 825, "loss": 0.6425, "learning_rate": 5e-06, "epoch": 2.8363636363636364, "percentage": 94.55, "elapsed_time": "1:21:09", "remaining_time": "0:04:40"}
|
81 |
+
{"current_steps": 790, "total_steps": 825, "loss": 0.6368, "learning_rate": 5e-06, "epoch": 2.8727272727272726, "percentage": 95.76, "elapsed_time": "1:22:08", "remaining_time": "0:03:38"}
|
82 |
+
{"current_steps": 800, "total_steps": 825, "loss": 0.6405, "learning_rate": 5e-06, "epoch": 2.909090909090909, "percentage": 96.97, "elapsed_time": "1:23:07", "remaining_time": "0:02:35"}
|
83 |
+
{"current_steps": 810, "total_steps": 825, "loss": 0.6357, "learning_rate": 5e-06, "epoch": 2.9454545454545453, "percentage": 98.18, "elapsed_time": "1:24:07", "remaining_time": "0:01:33"}
|
84 |
+
{"current_steps": 820, "total_steps": 825, "loss": 0.6412, "learning_rate": 5e-06, "epoch": 2.981818181818182, "percentage": 99.39, "elapsed_time": "1:25:06", "remaining_time": "0:00:31"}
|
85 |
+
{"current_steps": 825, "total_steps": 825, "eval_loss": 0.7299705147743225, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:27:36", "remaining_time": "0:00:00"}
|
86 |
+
{"current_steps": 825, "total_steps": 825, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:29:09", "remaining_time": "0:00:00"}
|