File size: 4,279 Bytes
747a654
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
epoch: 1, batch: 100, avg loss: 1.035541, avg ranking loss: 0.016568, avg mle loss: 8.698632
learning rate: 0.000000

epoch: 1, batch: 200, avg loss: 0.939091, avg ranking loss: 0.015825, avg mle loss: 7.808369
learning rate: 0.000000

epoch: 1, batch: 300, avg loss: 0.786419, avg ranking loss: 0.015178, avg mle loss: 6.346376
learning rate: 0.000001

epoch: 1, batch: 400, avg loss: 0.653152, avg ranking loss: 0.014788, avg mle loss: 5.052757
learning rate: 0.000001

epoch: 1, batch: 500, avg loss: 0.583150, avg ranking loss: 0.014760, avg mle loss: 4.355531
learning rate: 0.000001

epoch: 1, batch: 600, avg loss: 0.531894, avg ranking loss: 0.014850, avg mle loss: 3.833926
learning rate: 0.000001

epoch: 1, batch: 700, avg loss: 0.496518, avg ranking loss: 0.014805, avg mle loss: 3.484637
learning rate: 0.000001

epoch: 1, batch: 800, avg loss: 0.470519, avg ranking loss: 0.014618, avg mle loss: 3.243440
learning rate: 0.000002

epoch: 1, batch: 900, avg loss: 0.449544, avg ranking loss: 0.014501, avg mle loss: 3.045354
learning rate: 0.000002

epoch: 1, batch: 1000, avg loss: 0.431474, avg ranking loss: 0.014440, avg mle loss: 2.870745
learning rate: 0.000002

best ranking loss - epoch: 0, batch: 999
val ranking loss: 0.729979
val ranking rouge1: 0.629180, rouge2: 0.334733, rougeLsum: 0.599455
best generation loss - epoch: 0, batch: 999
val generation loss: 0.885783
val generation rouge1: 0.321491, rouge2: 0.134002, rougeLsum: 0.299572
epoch: 1, batch: 1100, avg loss: 0.419558, avg ranking loss: 0.014534, avg mle loss: 2.742168
learning rate: 0.000002

epoch: 1, batch: 1200, avg loss: 0.405170, avg ranking loss: 0.014500, avg mle loss: 2.601675
learning rate: 0.000002

epoch: 1, batch: 1300, avg loss: 0.394226, avg ranking loss: 0.014297, avg mle loss: 2.512567
learning rate: 0.000003

epoch: 1, batch: 1400, avg loss: 0.388203, avg ranking loss: 0.014295, avg mle loss: 2.452513
learning rate: 0.000003

epoch: 1, batch: 1500, avg loss: 0.379525, avg ranking loss: 0.014269, avg mle loss: 2.368302
learning rate: 0.000003

epoch: 1, batch: 1600, avg loss: 0.375064, avg ranking loss: 0.014436, avg mle loss: 2.307035
learning rate: 0.000003

epoch: 1, batch: 1700, avg loss: 0.364328, avg ranking loss: 0.014073, avg mle loss: 2.235932
learning rate: 0.000003

epoch: 1, batch: 1800, avg loss: 0.362203, avg ranking loss: 0.014417, avg mle loss: 2.180354
learning rate: 0.000004

epoch: 1, batch: 1900, avg loss: 0.358076, avg ranking loss: 0.014373, avg mle loss: 2.143419
learning rate: 0.000004

epoch: 1, batch: 2000, avg loss: 0.351821, avg ranking loss: 0.014282, avg mle loss: 2.089963
learning rate: 0.000004

val ranking loss: 0.734460
val ranking rouge1: 0.620741, rouge2: 0.331641, rougeLsum: 0.590756
val generation loss: 0.885808
val generation rouge1: 0.314677, rouge2: 0.155852, rougeLsum: 0.293533
epoch: 1, batch: 2100, avg loss: 0.349724, avg ranking loss: 0.014392, avg mle loss: 2.058075
learning rate: 0.000004

epoch: 1, batch: 2200, avg loss: 0.343959, avg ranking loss: 0.014182, avg mle loss: 2.021375
learning rate: 0.000004

epoch: 1, batch: 2300, avg loss: 0.340133, avg ranking loss: 0.014330, avg mle loss: 1.968376
learning rate: 0.000005

epoch: 1, batch: 2400, avg loss: 0.336417, avg ranking loss: 0.014204, avg mle loss: 1.943732
learning rate: 0.000005

epoch: 1, batch: 2500, avg loss: 0.330869, avg ranking loss: 0.014164, avg mle loss: 1.892253
learning rate: 0.000005

epoch: 1, batch: 2600, avg loss: 0.329880, avg ranking loss: 0.014310, avg mle loss: 1.867807
learning rate: 0.000005

epoch: 1, batch: 2700, avg loss: 0.326743, avg ranking loss: 0.014328, avg mle loss: 1.834671
learning rate: 0.000005

epoch: 1, batch: 2800, avg loss: 0.323882, avg ranking loss: 0.014190, avg mle loss: 1.819801
learning rate: 0.000006

epoch: 1, batch: 2900, avg loss: 0.320222, avg ranking loss: 0.013906, avg mle loss: 1.811585
learning rate: 0.000006

epoch: 1, batch: 3000, avg loss: 0.317352, avg ranking loss: 0.014259, avg mle loss: 1.747636
learning rate: 0.000006

val ranking loss: 0.736030
val ranking rouge1: 0.617348, rouge2: 0.330589, rougeLsum: 0.587821
best generation loss - epoch: 0, batch: 2999
val generation loss: 0.884436
val generation rouge1: 0.314360, rouge2: 0.161066, rougeLsum: 0.296060