File size: 17,628 Bytes
a8aec59
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
{"current_steps": 10, "total_steps": 2724, "loss": 0.7005, "learning_rate": 5e-06, "epoch": 0.01100715465052284, "percentage": 0.37, "elapsed_time": "0:01:32", "remaining_time": "6:58:19"}
{"current_steps": 20, "total_steps": 2724, "loss": 0.6377, "learning_rate": 5e-06, "epoch": 0.02201430930104568, "percentage": 0.73, "elapsed_time": "0:02:56", "remaining_time": "6:36:35"}
{"current_steps": 30, "total_steps": 2724, "loss": 0.6063, "learning_rate": 5e-06, "epoch": 0.03302146395156852, "percentage": 1.1, "elapsed_time": "0:04:19", "remaining_time": "6:28:02"}
{"current_steps": 40, "total_steps": 2724, "loss": 0.5969, "learning_rate": 5e-06, "epoch": 0.04402861860209136, "percentage": 1.47, "elapsed_time": "0:05:42", "remaining_time": "6:22:59"}
{"current_steps": 50, "total_steps": 2724, "loss": 0.5714, "learning_rate": 5e-06, "epoch": 0.0550357732526142, "percentage": 1.84, "elapsed_time": "0:07:05", "remaining_time": "6:19:29"}
{"current_steps": 60, "total_steps": 2724, "loss": 0.5648, "learning_rate": 5e-06, "epoch": 0.06604292790313704, "percentage": 2.2, "elapsed_time": "0:08:29", "remaining_time": "6:16:51"}
{"current_steps": 70, "total_steps": 2724, "loss": 0.5611, "learning_rate": 5e-06, "epoch": 0.07705008255365987, "percentage": 2.57, "elapsed_time": "0:09:52", "remaining_time": "6:14:27"}
{"current_steps": 80, "total_steps": 2724, "loss": 0.5512, "learning_rate": 5e-06, "epoch": 0.08805723720418272, "percentage": 2.94, "elapsed_time": "0:11:16", "remaining_time": "6:12:22"}
{"current_steps": 90, "total_steps": 2724, "loss": 0.5485, "learning_rate": 5e-06, "epoch": 0.09906439185470556, "percentage": 3.3, "elapsed_time": "0:12:39", "remaining_time": "6:10:30"}
{"current_steps": 100, "total_steps": 2724, "loss": 0.5509, "learning_rate": 5e-06, "epoch": 0.1100715465052284, "percentage": 3.67, "elapsed_time": "0:14:03", "remaining_time": "6:08:44"}
{"current_steps": 110, "total_steps": 2724, "loss": 0.5408, "learning_rate": 5e-06, "epoch": 0.12107870115575124, "percentage": 4.04, "elapsed_time": "0:15:26", "remaining_time": "6:06:54"}
{"current_steps": 120, "total_steps": 2724, "loss": 0.5454, "learning_rate": 5e-06, "epoch": 0.13208585580627408, "percentage": 4.41, "elapsed_time": "0:16:49", "remaining_time": "6:05:11"}
{"current_steps": 130, "total_steps": 2724, "loss": 0.547, "learning_rate": 5e-06, "epoch": 0.14309301045679693, "percentage": 4.77, "elapsed_time": "0:18:13", "remaining_time": "6:03:33"}
{"current_steps": 140, "total_steps": 2724, "loss": 0.5355, "learning_rate": 5e-06, "epoch": 0.15410016510731975, "percentage": 5.14, "elapsed_time": "0:19:36", "remaining_time": "6:01:58"}
{"current_steps": 150, "total_steps": 2724, "loss": 0.5401, "learning_rate": 5e-06, "epoch": 0.1651073197578426, "percentage": 5.51, "elapsed_time": "0:21:00", "remaining_time": "6:00:21"}
{"current_steps": 160, "total_steps": 2724, "loss": 0.5382, "learning_rate": 5e-06, "epoch": 0.17611447440836545, "percentage": 5.87, "elapsed_time": "0:22:23", "remaining_time": "5:58:43"}
{"current_steps": 170, "total_steps": 2724, "loss": 0.5375, "learning_rate": 5e-06, "epoch": 0.18712162905888827, "percentage": 6.24, "elapsed_time": "0:23:45", "remaining_time": "5:57:02"}
{"current_steps": 180, "total_steps": 2724, "loss": 0.5293, "learning_rate": 5e-06, "epoch": 0.19812878370941112, "percentage": 6.61, "elapsed_time": "0:25:08", "remaining_time": "5:55:23"}
{"current_steps": 190, "total_steps": 2724, "loss": 0.529, "learning_rate": 5e-06, "epoch": 0.20913593835993396, "percentage": 6.98, "elapsed_time": "0:26:31", "remaining_time": "5:53:48"}
{"current_steps": 200, "total_steps": 2724, "loss": 0.5374, "learning_rate": 5e-06, "epoch": 0.2201430930104568, "percentage": 7.34, "elapsed_time": "0:27:55", "remaining_time": "5:52:19"}
{"current_steps": 210, "total_steps": 2724, "loss": 0.5244, "learning_rate": 5e-06, "epoch": 0.23115024766097964, "percentage": 7.71, "elapsed_time": "0:29:18", "remaining_time": "5:50:51"}
{"current_steps": 220, "total_steps": 2724, "loss": 0.5239, "learning_rate": 5e-06, "epoch": 0.24215740231150248, "percentage": 8.08, "elapsed_time": "0:30:42", "remaining_time": "5:49:27"}
{"current_steps": 230, "total_steps": 2724, "loss": 0.5208, "learning_rate": 5e-06, "epoch": 0.25316455696202533, "percentage": 8.44, "elapsed_time": "0:32:05", "remaining_time": "5:47:59"}
{"current_steps": 240, "total_steps": 2724, "loss": 0.5235, "learning_rate": 5e-06, "epoch": 0.26417171161254815, "percentage": 8.81, "elapsed_time": "0:33:28", "remaining_time": "5:46:30"}
{"current_steps": 250, "total_steps": 2724, "loss": 0.5208, "learning_rate": 5e-06, "epoch": 0.275178866263071, "percentage": 9.18, "elapsed_time": "0:34:52", "remaining_time": "5:45:04"}
{"current_steps": 260, "total_steps": 2724, "loss": 0.5221, "learning_rate": 5e-06, "epoch": 0.28618602091359385, "percentage": 9.54, "elapsed_time": "0:36:15", "remaining_time": "5:43:41"}
{"current_steps": 270, "total_steps": 2724, "loss": 0.5208, "learning_rate": 5e-06, "epoch": 0.2971931755641167, "percentage": 9.91, "elapsed_time": "0:37:39", "remaining_time": "5:42:15"}
{"current_steps": 280, "total_steps": 2724, "loss": 0.5197, "learning_rate": 5e-06, "epoch": 0.3082003302146395, "percentage": 10.28, "elapsed_time": "0:39:02", "remaining_time": "5:40:49"}
{"current_steps": 290, "total_steps": 2724, "loss": 0.5184, "learning_rate": 5e-06, "epoch": 0.31920748486516237, "percentage": 10.65, "elapsed_time": "0:40:26", "remaining_time": "5:39:23"}
{"current_steps": 300, "total_steps": 2724, "loss": 0.5212, "learning_rate": 5e-06, "epoch": 0.3302146395156852, "percentage": 11.01, "elapsed_time": "0:41:49", "remaining_time": "5:37:57"}
{"current_steps": 310, "total_steps": 2724, "loss": 0.5184, "learning_rate": 5e-06, "epoch": 0.341221794166208, "percentage": 11.38, "elapsed_time": "0:43:13", "remaining_time": "5:36:31"}
{"current_steps": 320, "total_steps": 2724, "loss": 0.5117, "learning_rate": 5e-06, "epoch": 0.3522289488167309, "percentage": 11.75, "elapsed_time": "0:44:36", "remaining_time": "5:35:06"}
{"current_steps": 330, "total_steps": 2724, "loss": 0.5168, "learning_rate": 5e-06, "epoch": 0.3632361034672537, "percentage": 12.11, "elapsed_time": "0:45:59", "remaining_time": "5:33:41"}
{"current_steps": 340, "total_steps": 2724, "loss": 0.5112, "learning_rate": 5e-06, "epoch": 0.37424325811777653, "percentage": 12.48, "elapsed_time": "0:47:23", "remaining_time": "5:32:16"}
{"current_steps": 350, "total_steps": 2724, "loss": 0.5093, "learning_rate": 5e-06, "epoch": 0.3852504127682994, "percentage": 12.85, "elapsed_time": "0:48:46", "remaining_time": "5:30:50"}
{"current_steps": 360, "total_steps": 2724, "loss": 0.5089, "learning_rate": 5e-06, "epoch": 0.39625756741882223, "percentage": 13.22, "elapsed_time": "0:50:10", "remaining_time": "5:29:25"}
{"current_steps": 370, "total_steps": 2724, "loss": 0.5119, "learning_rate": 5e-06, "epoch": 0.40726472206934505, "percentage": 13.58, "elapsed_time": "0:51:33", "remaining_time": "5:28:02"}
{"current_steps": 380, "total_steps": 2724, "loss": 0.5114, "learning_rate": 5e-06, "epoch": 0.41827187671986793, "percentage": 13.95, "elapsed_time": "0:52:57", "remaining_time": "5:26:39"}
{"current_steps": 390, "total_steps": 2724, "loss": 0.5099, "learning_rate": 5e-06, "epoch": 0.42927903137039075, "percentage": 14.32, "elapsed_time": "0:54:21", "remaining_time": "5:25:17"}
{"current_steps": 400, "total_steps": 2724, "loss": 0.5052, "learning_rate": 5e-06, "epoch": 0.4402861860209136, "percentage": 14.68, "elapsed_time": "0:55:45", "remaining_time": "5:23:57"}
{"current_steps": 410, "total_steps": 2724, "loss": 0.5101, "learning_rate": 5e-06, "epoch": 0.45129334067143645, "percentage": 15.05, "elapsed_time": "0:57:09", "remaining_time": "5:22:37"}
{"current_steps": 420, "total_steps": 2724, "loss": 0.5052, "learning_rate": 5e-06, "epoch": 0.46230049532195927, "percentage": 15.42, "elapsed_time": "0:58:34", "remaining_time": "5:21:17"}
{"current_steps": 430, "total_steps": 2724, "loss": 0.5071, "learning_rate": 5e-06, "epoch": 0.4733076499724821, "percentage": 15.79, "elapsed_time": "0:59:58", "remaining_time": "5:19:57"}
{"current_steps": 440, "total_steps": 2724, "loss": 0.5087, "learning_rate": 5e-06, "epoch": 0.48431480462300497, "percentage": 16.15, "elapsed_time": "1:01:22", "remaining_time": "5:18:36"}
{"current_steps": 450, "total_steps": 2724, "loss": 0.5037, "learning_rate": 5e-06, "epoch": 0.4953219592735278, "percentage": 16.52, "elapsed_time": "1:02:46", "remaining_time": "5:17:12"}
{"current_steps": 460, "total_steps": 2724, "loss": 0.5017, "learning_rate": 5e-06, "epoch": 0.5063291139240507, "percentage": 16.89, "elapsed_time": "1:04:09", "remaining_time": "5:15:46"}
{"current_steps": 470, "total_steps": 2724, "loss": 0.5027, "learning_rate": 5e-06, "epoch": 0.5173362685745735, "percentage": 17.25, "elapsed_time": "1:05:33", "remaining_time": "5:14:22"}
{"current_steps": 480, "total_steps": 2724, "loss": 0.4956, "learning_rate": 5e-06, "epoch": 0.5283434232250963, "percentage": 17.62, "elapsed_time": "1:06:57", "remaining_time": "5:13:00"}
{"current_steps": 490, "total_steps": 2724, "loss": 0.508, "learning_rate": 5e-06, "epoch": 0.5393505778756191, "percentage": 17.99, "elapsed_time": "1:08:21", "remaining_time": "5:11:37"}
{"current_steps": 500, "total_steps": 2724, "loss": 0.5055, "learning_rate": 5e-06, "epoch": 0.550357732526142, "percentage": 18.36, "elapsed_time": "1:09:44", "remaining_time": "5:10:13"}
{"current_steps": 510, "total_steps": 2724, "loss": 0.5039, "learning_rate": 5e-06, "epoch": 0.5613648871766649, "percentage": 18.72, "elapsed_time": "1:11:07", "remaining_time": "5:08:47"}
{"current_steps": 520, "total_steps": 2724, "loss": 0.4977, "learning_rate": 5e-06, "epoch": 0.5723720418271877, "percentage": 19.09, "elapsed_time": "1:12:31", "remaining_time": "5:07:22"}
{"current_steps": 530, "total_steps": 2724, "loss": 0.4998, "learning_rate": 5e-06, "epoch": 0.5833791964777105, "percentage": 19.46, "elapsed_time": "1:13:54", "remaining_time": "5:05:58"}
{"current_steps": 540, "total_steps": 2724, "loss": 0.5056, "learning_rate": 5e-06, "epoch": 0.5943863511282333, "percentage": 19.82, "elapsed_time": "1:15:18", "remaining_time": "5:04:36"}
{"current_steps": 550, "total_steps": 2724, "loss": 0.4987, "learning_rate": 5e-06, "epoch": 0.6053935057787562, "percentage": 20.19, "elapsed_time": "1:16:42", "remaining_time": "5:03:12"}
{"current_steps": 560, "total_steps": 2724, "loss": 0.501, "learning_rate": 5e-06, "epoch": 0.616400660429279, "percentage": 20.56, "elapsed_time": "1:18:06", "remaining_time": "5:01:50"}
{"current_steps": 570, "total_steps": 2724, "loss": 0.4962, "learning_rate": 5e-06, "epoch": 0.6274078150798019, "percentage": 20.93, "elapsed_time": "1:19:30", "remaining_time": "5:00:26"}
{"current_steps": 580, "total_steps": 2724, "loss": 0.4999, "learning_rate": 5e-06, "epoch": 0.6384149697303247, "percentage": 21.29, "elapsed_time": "1:20:53", "remaining_time": "4:59:02"}
{"current_steps": 590, "total_steps": 2724, "loss": 0.5039, "learning_rate": 5e-06, "epoch": 0.6494221243808476, "percentage": 21.66, "elapsed_time": "1:22:17", "remaining_time": "4:57:38"}
{"current_steps": 600, "total_steps": 2724, "loss": 0.4997, "learning_rate": 5e-06, "epoch": 0.6604292790313704, "percentage": 22.03, "elapsed_time": "1:23:40", "remaining_time": "4:56:14"}
{"current_steps": 610, "total_steps": 2724, "loss": 0.4953, "learning_rate": 5e-06, "epoch": 0.6714364336818932, "percentage": 22.39, "elapsed_time": "1:25:04", "remaining_time": "4:54:50"}
{"current_steps": 620, "total_steps": 2724, "loss": 0.492, "learning_rate": 5e-06, "epoch": 0.682443588332416, "percentage": 22.76, "elapsed_time": "1:26:27", "remaining_time": "4:53:25"}
{"current_steps": 630, "total_steps": 2724, "loss": 0.4953, "learning_rate": 5e-06, "epoch": 0.693450742982939, "percentage": 23.13, "elapsed_time": "1:27:51", "remaining_time": "4:52:00"}
{"current_steps": 640, "total_steps": 2724, "loss": 0.4889, "learning_rate": 5e-06, "epoch": 0.7044578976334618, "percentage": 23.49, "elapsed_time": "1:29:14", "remaining_time": "4:50:35"}
{"current_steps": 650, "total_steps": 2724, "loss": 0.5007, "learning_rate": 5e-06, "epoch": 0.7154650522839846, "percentage": 23.86, "elapsed_time": "1:30:37", "remaining_time": "4:49:10"}
{"current_steps": 660, "total_steps": 2724, "loss": 0.4938, "learning_rate": 5e-06, "epoch": 0.7264722069345074, "percentage": 24.23, "elapsed_time": "1:32:01", "remaining_time": "4:47:46"}
{"current_steps": 670, "total_steps": 2724, "loss": 0.4999, "learning_rate": 5e-06, "epoch": 0.7374793615850302, "percentage": 24.6, "elapsed_time": "1:33:24", "remaining_time": "4:46:22"}
{"current_steps": 680, "total_steps": 2724, "loss": 0.502, "learning_rate": 5e-06, "epoch": 0.7484865162355531, "percentage": 24.96, "elapsed_time": "1:34:48", "remaining_time": "4:44:59"}
{"current_steps": 690, "total_steps": 2724, "loss": 0.4967, "learning_rate": 5e-06, "epoch": 0.759493670886076, "percentage": 25.33, "elapsed_time": "1:36:13", "remaining_time": "4:43:38"}
{"current_steps": 700, "total_steps": 2724, "loss": 0.4927, "learning_rate": 5e-06, "epoch": 0.7705008255365988, "percentage": 25.7, "elapsed_time": "1:37:36", "remaining_time": "4:42:15"}
{"current_steps": 710, "total_steps": 2724, "loss": 0.4896, "learning_rate": 5e-06, "epoch": 0.7815079801871216, "percentage": 26.06, "elapsed_time": "1:39:00", "remaining_time": "4:40:51"}
{"current_steps": 720, "total_steps": 2724, "loss": 0.4897, "learning_rate": 5e-06, "epoch": 0.7925151348376445, "percentage": 26.43, "elapsed_time": "1:40:24", "remaining_time": "4:39:28"}
{"current_steps": 730, "total_steps": 2724, "loss": 0.488, "learning_rate": 5e-06, "epoch": 0.8035222894881673, "percentage": 26.8, "elapsed_time": "1:41:48", "remaining_time": "4:38:04"}
{"current_steps": 740, "total_steps": 2724, "loss": 0.4934, "learning_rate": 5e-06, "epoch": 0.8145294441386901, "percentage": 27.17, "elapsed_time": "1:43:12", "remaining_time": "4:36:42"}
{"current_steps": 750, "total_steps": 2724, "loss": 0.4892, "learning_rate": 5e-06, "epoch": 0.825536598789213, "percentage": 27.53, "elapsed_time": "1:44:36", "remaining_time": "4:35:19"}
{"current_steps": 760, "total_steps": 2724, "loss": 0.479, "learning_rate": 5e-06, "epoch": 0.8365437534397359, "percentage": 27.9, "elapsed_time": "1:46:00", "remaining_time": "4:33:56"}
{"current_steps": 770, "total_steps": 2724, "loss": 0.4918, "learning_rate": 5e-06, "epoch": 0.8475509080902587, "percentage": 28.27, "elapsed_time": "1:47:24", "remaining_time": "4:32:33"}
{"current_steps": 780, "total_steps": 2724, "loss": 0.4936, "learning_rate": 5e-06, "epoch": 0.8585580627407815, "percentage": 28.63, "elapsed_time": "1:48:48", "remaining_time": "4:31:10"}
{"current_steps": 790, "total_steps": 2724, "loss": 0.4912, "learning_rate": 5e-06, "epoch": 0.8695652173913043, "percentage": 29.0, "elapsed_time": "1:50:11", "remaining_time": "4:29:46"}
{"current_steps": 800, "total_steps": 2724, "loss": 0.4874, "learning_rate": 5e-06, "epoch": 0.8805723720418271, "percentage": 29.37, "elapsed_time": "1:51:35", "remaining_time": "4:28:23"}
{"current_steps": 810, "total_steps": 2724, "loss": 0.4898, "learning_rate": 5e-06, "epoch": 0.8915795266923501, "percentage": 29.74, "elapsed_time": "1:53:00", "remaining_time": "4:27:01"}
{"current_steps": 820, "total_steps": 2724, "loss": 0.4871, "learning_rate": 5e-06, "epoch": 0.9025866813428729, "percentage": 30.1, "elapsed_time": "1:54:24", "remaining_time": "4:25:38"}
{"current_steps": 830, "total_steps": 2724, "loss": 0.4874, "learning_rate": 5e-06, "epoch": 0.9135938359933957, "percentage": 30.47, "elapsed_time": "1:55:47", "remaining_time": "4:24:14"}
{"current_steps": 840, "total_steps": 2724, "loss": 0.4833, "learning_rate": 5e-06, "epoch": 0.9246009906439185, "percentage": 30.84, "elapsed_time": "1:57:11", "remaining_time": "4:22:49"}
{"current_steps": 850, "total_steps": 2724, "loss": 0.4854, "learning_rate": 5e-06, "epoch": 0.9356081452944414, "percentage": 31.2, "elapsed_time": "1:58:34", "remaining_time": "4:21:24"}
{"current_steps": 860, "total_steps": 2724, "loss": 0.4891, "learning_rate": 5e-06, "epoch": 0.9466152999449642, "percentage": 31.57, "elapsed_time": "1:59:57", "remaining_time": "4:20:00"}
{"current_steps": 870, "total_steps": 2724, "loss": 0.486, "learning_rate": 5e-06, "epoch": 0.9576224545954871, "percentage": 31.94, "elapsed_time": "2:01:20", "remaining_time": "4:18:35"}
{"current_steps": 880, "total_steps": 2724, "loss": 0.4865, "learning_rate": 5e-06, "epoch": 0.9686296092460099, "percentage": 32.31, "elapsed_time": "2:02:43", "remaining_time": "4:17:10"}
{"current_steps": 890, "total_steps": 2724, "loss": 0.487, "learning_rate": 5e-06, "epoch": 0.9796367638965328, "percentage": 32.67, "elapsed_time": "2:04:06", "remaining_time": "4:15:45"}
{"current_steps": 900, "total_steps": 2724, "loss": 0.4816, "learning_rate": 5e-06, "epoch": 0.9906439185470556, "percentage": 33.04, "elapsed_time": "2:05:30", "remaining_time": "4:14:21"}
{"current_steps": 908, "total_steps": 2724, "eval_loss": 0.4856513738632202, "epoch": 0.9994496422674739, "percentage": 33.33, "elapsed_time": "2:09:20", "remaining_time": "4:18:41"}
{"current_steps": 910, "total_steps": 2724, "loss": 0.481, "learning_rate": 5e-06, "epoch": 1.0016510731975785, "percentage": 33.41, "elapsed_time": "2:10:26", "remaining_time": "4:20:00"}
{"current_steps": 920, "total_steps": 2724, "loss": 0.4391, "learning_rate": 5e-06, "epoch": 1.0126582278481013, "percentage": 33.77, "elapsed_time": "2:11:48", "remaining_time": "4:18:28"}