ruihanglai commited on
Commit
494f611
1 Parent(s): c9ff6a7

Initial commit

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
logs.txt ADDED
@@ -0,0 +1,261 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/195 [00:00<?, ?it/s]
1
 
 
2
  0%| | 0/195 [00:00<?, ?it/s]
3
 
 
4
  0%| | 0/195 [00:08<?, ?it/s]
5
  1%| | 1/195 [00:09<29:48, 9.22s/it]
6
 
 
7
  1%| | 1/195 [00:09<29:48, 9.22s/it]
8
 
 
9
  1%| | 1/195 [00:09<29:48, 9.22s/it]
10
  2%|▏ | 3/195 [00:09<07:58, 2.49s/it]
11
 
 
12
  2%|▏ | 3/195 [00:09<07:58, 2.49s/it]
13
  2%|▏ | 4/195 [00:10<06:17, 1.98s/it]
14
 
 
15
  2%|▏ | 4/195 [00:10<06:17, 1.98s/it]
16
 
 
17
  2%|▏ | 4/195 [00:10<06:17, 1.98s/it]
18
  3%|▎ | 6/195 [00:10<03:28, 1.10s/it]
19
 
 
20
  3%|▎ | 6/195 [00:10<03:28, 1.10s/it]
21
  4%|▎ | 7/195 [00:11<02:38, 1.19it/s]
22
 
 
23
  4%|▎ | 7/195 [00:11<02:38, 1.19it/s]
24
 
 
25
  4%|▎ | 7/195 [00:11<02:38, 1.19it/s]
26
  5%|▍ | 9/195 [00:11<01:39, 1.87it/s]
27
 
 
28
  5%|▍ | 9/195 [00:11<01:39, 1.87it/s]
29
  5%|▌ | 10/195 [00:12<02:00, 1.54it/s]
30
 
 
31
  5%|▌ | 10/195 [00:12<02:00, 1.54it/s]
32
 
 
33
  5%|▌ | 10/195 [00:12<02:00, 1.54it/s]
34
  6%|▌ | 12/195 [00:12<01:24, 2.15it/s]
35
 
 
36
  6%|▌ | 12/195 [00:12<01:24, 2.15it/s]
37
  7%|▋ | 13/195 [00:12<01:09, 2.61it/s]
38
 
 
39
  7%|▋ | 13/195 [00:12<01:09, 2.61it/s]
40
 
 
41
  7%|▋ | 13/195 [00:12<01:09, 2.61it/s]
42
  8%|▊ | 15/195 [00:13<00:50, 3.53it/s]
43
 
 
44
  8%|▊ | 15/195 [00:13<00:50, 3.53it/s]
45
  8%|▊ | 16/195 [00:13<01:15, 2.36it/s]
46
 
 
47
  8%|▊ | 16/195 [00:13<01:15, 2.36it/s]
48
 
 
49
  8%|▊ | 16/195 [00:14<01:15, 2.36it/s]
50
  9%|▉ | 18/195 [00:14<00:58, 3.04it/s]
51
 
 
52
  9%|▉ | 18/195 [00:14<00:58, 3.04it/s]
53
  10%|▉ | 19/195 [00:14<00:49, 3.57it/s]
54
 
 
55
  10%|▉ | 19/195 [00:14<00:49, 3.57it/s]
56
 
 
57
  10%|▉ | 19/195 [00:14<00:49, 3.57it/s]
58
  11%|█ | 21/195 [00:14<00:38, 4.53it/s]
59
 
 
60
  11%|█ | 21/195 [00:14<00:38, 4.53it/s]
61
  11%|█▏ | 22/195 [00:15<00:55, 3.11it/s]
62
 
 
63
  11%|█▏ | 22/195 [00:15<00:55, 3.11it/s]
64
 
 
65
  11%|█▏ | 22/195 [00:15<00:55, 3.11it/s]
66
  12%|█▏ | 24/195 [00:15<00:44, 3.87it/s]
67
 
 
68
  12%|█▏ | 24/195 [00:15<00:44, 3.87it/s]
69
  13%|█▎ | 25/195 [00:15<00:38, 4.45it/s]
70
 
 
71
  13%|█▎ | 25/195 [00:15<00:38, 4.45it/s]
72
 
 
73
  13%|█▎ | 25/195 [00:15<00:38, 4.45it/s]
74
  14%|█▍ | 27/195 [00:16<00:31, 5.38it/s]
75
 
 
76
  14%|█▍ | 27/195 [00:16<00:31, 5.38it/s]
77
  14%|█▍ | 28/195 [00:16<00:53, 3.14it/s]
78
 
 
79
  14%|█▍ | 28/195 [00:16<00:53, 3.14it/s]
80
 
 
81
  14%|█▍ | 28/195 [00:16<00:53, 3.14it/s]
82
  15%|█▌ | 30/195 [00:17<00:42, 3.89it/s]
83
 
 
84
  15%|█▌ | 30/195 [00:17<00:42, 3.89it/s]
85
  16%|█▌ | 31/195 [00:17<00:36, 4.47it/s]
86
 
 
87
  16%|█▌ | 31/195 [00:17<00:36, 4.47it/s]
88
 
 
89
  16%|█▌ | 31/195 [00:17<00:36, 4.47it/s]
90
  17%|█▋ | 33/195 [00:17<00:32, 4.97it/s]
91
 
 
92
  17%|█▋ | 33/195 [00:17<00:32, 4.97it/s]
93
  17%|█▋ | 34/195 [00:18<00:51, 3.12it/s]
94
 
 
95
  17%|█▋ | 34/195 [00:18<00:51, 3.12it/s]
96
 
 
97
  17%|█▋ | 34/195 [00:18<00:51, 3.12it/s]
98
  18%|█▊ | 36/195 [00:18<00:42, 3.77it/s]
99
 
 
100
  18%|█▊ | 36/195 [00:18<00:42, 3.77it/s]
101
 
 
102
  18%|█▊ | 36/195 [00:18<00:42, 3.77it/s]
103
  19%|█▉ | 38/195 [00:18<00:29, 5.26it/s]
104
 
 
105
  19%|█▉ | 38/195 [00:18<00:29, 5.26it/s]
106
  20%|██ | 39/195 [00:19<00:31, 5.02it/s]
107
 
 
108
  20%|██ | 39/195 [00:19<00:31, 5.02it/s]
109
  21%|██ | 40/195 [00:19<00:46, 3.35it/s]
110
 
 
111
  21%|██ | 40/195 [00:19<00:46, 3.35it/s]
112
 
 
113
  21%|██ | 40/195 [00:19<00:46, 3.35it/s]
114
  22%|██▏ | 42/195 [00:19<00:37, 4.12it/s]
115
 
 
116
  22%|██▏ | 42/195 [00:19<00:37, 4.12it/s]
117
  22%|██▏ | 43/195 [00:20<00:32, 4.72it/s]
118
 
 
119
  22%|██▏ | 43/195 [00:20<00:32, 4.72it/s]
120
 
 
121
  22%|██▏ | 43/195 [00:20<00:32, 4.72it/s]
122
  23%|██▎ | 45/195 [00:20<00:26, 5.62it/s]
123
 
 
124
  23%|██▎ | 45/195 [00:20<00:26, 5.62it/s]
125
  24%|██▎ | 46/195 [00:21<00:44, 3.35it/s]
126
 
 
127
  24%|██▎ | 46/195 [00:21<00:44, 3.35it/s]
128
 
 
129
  24%|██▎ | 46/195 [00:21<00:44, 3.35it/s]
130
  25%|██▍ | 48/195 [00:21<00:35, 4.11it/s]
131
 
 
132
  25%|██▍ | 48/195 [00:21<00:35, 4.11it/s]
133
  25%|██▌ | 49/195 [00:21<00:31, 4.70it/s]
134
 
 
135
  25%|██▌ | 49/195 [00:21<00:31, 4.70it/s]
136
 
 
137
  25%|██▌ | 49/195 [00:21<00:31, 4.70it/s]
138
 
 
139
  25%|██▌ | 49/195 [00:21<00:31, 4.70it/s]
140
 
 
141
  25%|██▌ | 49/195 [00:58<00:31, 4.70it/s]
142
  26%|██▌ | 51/195 [00:58<17:18, 7.21s/it]
143
 
 
144
  26%|██▌ | 51/195 [00:58<17:18, 7.21s/it]
145
 
 
146
  26%|██▌ | 51/195 [00:58<17:18, 7.21s/it]
147
  27%|██▋ | 53/195 [00:59<11:13, 4.74s/it]
148
 
 
149
  27%|██▋ | 53/195 [00:59<11:13, 4.74s/it]
150
  28%|██▊ | 54/195 [01:00<09:23, 4.00s/it]
151
 
 
152
  28%|██▊ | 54/195 [01:00<09:23, 4.00s/it]
153
 
 
154
  28%|██▊ | 54/195 [01:00<09:23, 4.00s/it]
155
  29%|██▊ | 56/195 [01:00<06:03, 2.61s/it]
156
 
 
157
  29%|██▊ | 56/195 [01:00<06:03, 2.61s/it]
158
  29%|██▉ | 57/195 [01:00<04:50, 2.10s/it]
159
 
 
160
  29%|██▉ | 57/195 [01:00<04:50, 2.10s/it]
161
 
 
162
  29%|██▉ | 57/195 [01:00<04:50, 2.10s/it]
163
  30%|███ | 59/195 [01:01<03:07, 1.38s/it]
164
 
 
165
  30%|███ | 59/195 [01:01<03:07, 1.38s/it]
166
  31%|███ | 60/195 [01:01<02:47, 1.24s/it]
167
 
 
168
  31%|███ | 60/195 [01:01<02:47, 1.24s/it]
169
 
 
170
  31%|███ | 60/195 [01:01<02:47, 1.24s/it]
171
  32%|███▏ | 62/195 [01:02<01:52, 1.18it/s]
172
 
 
173
  32%|███▏ | 62/195 [01:02<01:52, 1.18it/s]
174
  32%|███▏ | 63/195 [01:02<01:31, 1.44it/s]
175
 
 
176
  32%|███▏ | 63/195 [01:02<01:31, 1.44it/s]
177
 
 
178
  32%|███▏ | 63/195 [01:02<01:31, 1.44it/s]
179
  33%|███▎ | 65/195 [01:02<01:03, 2.04it/s]
180
 
 
181
  33%|███▎ | 65/195 [01:02<01:03, 2.04it/s]
182
  34%|███▍ | 66/195 [01:03<01:08, 1.90it/s]
183
 
 
184
  34%|███▍ | 66/195 [01:03<01:08, 1.90it/s]
185
 
 
186
  34%|███▍ | 66/195 [01:03<01:08, 1.90it/s]
187
  35%|███▍ | 68/195 [01:03<00:48, 2.61it/s]
188
 
 
189
  35%|███▍ | 68/195 [01:03<00:48, 2.61it/s]
190
 
 
191
  35%|███▍ | 68/195 [01:03<00:48, 2.61it/s]
192
 
 
193
  35%|███▍ | 68/195 [01:03<00:48, 2.61it/s]
194
  36%|███▋ | 71/195 [01:03<00:32, 3.82it/s]
195
 
 
196
  36%|███▋ | 71/195 [01:03<00:32, 3.82it/s]
197
  37%|███▋ | 72/195 [01:04<00:37, 3.31it/s]
198
 
 
199
  37%|███▋ | 72/195 [01:04<00:37, 3.31it/s]
200
 
 
201
  37%|███▋ | 72/195 [01:04<00:37, 3.31it/s]
202
  38%|███▊ | 74/195 [01:04<00:30, 4.02it/s]
203
 
 
204
  38%|███▊ | 74/195 [01:04<00:30, 4.02it/s]
205
 
 
206
  38%|███▊ | 74/195 [01:04<00:30, 4.02it/s]
207
 
 
208
  38%|███▊ | 74/195 [01:04<00:30, 4.02it/s]
209
  39%|███▉ | 77/195 [01:04<00:22, 5.26it/s]
210
 
 
211
  39%|███▉ | 77/195 [01:05<00:22, 5.26it/s]
212
  40%|████ | 78/195 [01:05<00:27, 4.18it/s]
213
 
 
214
  40%|████ | 78/195 [01:05<00:27, 4.18it/s]
215
 
 
216
  40%|████ | 78/195 [01:05<00:27, 4.18it/s]
217
  41%|████ | 80/195 [01:05<00:23, 4.83it/s]
218
 
 
219
  41%|████ | 80/195 [01:05<00:23, 4.83it/s]
220
 
 
221
  41%|████ | 80/195 [01:05<00:23, 4.83it/s]
222
 
 
223
  41%|████ | 80/195 [01:05<00:23, 4.83it/s]
224
  43%|████▎ | 83/195 [01:06<00:18, 6.01it/s]
225
 
 
226
  43%|████▎ | 83/195 [01:06<00:18, 6.01it/s]
227
  43%|████▎ | 84/195 [01:06<00:24, 4.57it/s]
228
 
 
229
  43%|████▎ | 84/195 [01:06<00:24, 4.57it/s]
230
 
 
231
  43%|████▎ | 84/195 [01:06<00:24, 4.57it/s]
232
  44%|████▍ | 86/195 [01:06<00:20, 5.19it/s]
233
 
 
234
  44%|████▍ | 86/195 [01:06<00:20, 5.19it/s]
235
 
 
236
  44%|████▍ | 86/195 [01:06<00:20, 5.19it/s]
237
 
 
238
  44%|████▍ | 86/195 [01:06<00:20, 5.19it/s]
239
  46%|████▌ | 89/195 [01:07<00:16, 6.37it/s]
240
 
 
241
  46%|████▌ | 89/195 [01:07<00:16, 6.37it/s]
242
  46%|████▌ | 90/195 [01:07<00:21, 4.80it/s]
243
 
 
244
  46%|████▌ | 90/195 [01:07<00:21, 4.80it/s]
245
 
 
246
  46%|████▌ | 90/195 [01:07<00:21, 4.80it/s]
247
  47%|████▋ | 92/195 [01:07<00:19, 5.41it/s]
248
 
 
249
  47%|████▋ | 92/195 [01:07<00:19, 5.41it/s]
250
 
 
251
  47%|████▋ | 92/195 [01:07<00:19, 5.41it/s]
252
 
 
253
  47%|████▋ | 92/195 [01:07<00:19, 5.41it/s]
254
  49%|████▊ | 95/195 [01:08<00:15, 6.51it/s]
255
 
 
256
  49%|████▊ | 95/195 [01:08<00:15, 6.51it/s]
257
  49%|████▉ | 96/195 [01:08<00:20, 4.81it/s]
258
 
 
259
  49%|████▉ | 96/195 [01:08<00:20, 4.81it/s]
260
 
 
261
  49%|████▉ | 96/195 [01:08<00:20, 4.81it/s]
262
  50%|█████ | 98/195 [01:08<00:17, 5.41it/s]
263
 
 
264
  50%|█████ | 98/195 [01:08<00:17, 5.41it/s]
265
 
 
266
  50%|█████ | 98/195 [01:09<00:17, 5.41it/s]
267
 
 
268
  50%|█████ | 98/195 [01:09<00:17, 5.41it/s]
269
  52%|█████▏ | 101/195 [01:09<00:14, 6.58it/s]
270
 
 
271
  52%|█████▏ | 101/195 [01:09<00:14, 6.58it/s]
272
  52%|█████▏ | 102/195 [01:09<00:18, 4.92it/s]
273
 
 
274
  52%|█████▏ | 102/195 [01:09<00:18, 4.92it/s]
275
 
 
276
  52%|█████▏ | 102/195 [01:09<00:18, 4.92it/s]
277
  53%|█████▎ | 104/195 [01:10<00:16, 5.44it/s]
278
 
 
279
  53%|█████▎ | 104/195 [01:10<00:16, 5.44it/s]
280
 
 
281
  53%|█████▎ | 104/195 [01:10<00:16, 5.44it/s]
282
 
 
283
  53%|█████▎ | 104/195 [01:10<00:16, 5.44it/s]
284
  55%|█████▍ | 107/195 [01:10<00:13, 6.60it/s]
285
 
 
286
  55%|█████▍ | 107/195 [01:10<00:13, 6.60it/s]
287
  55%|█████▌ | 108/195 [01:10<00:17, 4.94it/s]
288
 
 
289
  55%|█████▌ | 108/195 [01:10<00:17, 4.94it/s]
290
 
 
291
  55%|█████▌ | 108/195 [01:10<00:17, 4.94it/s]
292
  56%|█████▋ | 110/195 [01:11<00:15, 5.47it/s]
293
 
 
294
  56%|█████▋ | 110/195 [01:11<00:15, 5.47it/s]
295
 
 
296
  56%|█████▋ | 110/195 [01:11<00:15, 5.47it/s]
297
 
 
298
  56%|█████▋ | 110/195 [01:11<00:15, 5.47it/s]
299
  58%|█████▊ | 113/195 [01:11<00:12, 6.62it/s]
300
 
 
301
  58%|█████▊ | 113/195 [01:11<00:12, 6.62it/s]
302
  58%|█████▊ | 114/195 [01:11<00:16, 4.95it/s]
303
 
 
304
  58%|█████▊ | 114/195 [01:11<00:16, 4.95it/s]
305
 
 
306
  58%|█████▊ | 114/195 [01:11<00:16, 4.95it/s]
307
  59%|█████▉ | 116/195 [01:12<00:14, 5.55it/s]
308
 
 
309
  59%|█████▉ | 116/195 [01:12<00:14, 5.55it/s]
310
 
 
311
  59%|█████▉ | 116/195 [01:12<00:14, 5.55it/s]
312
 
 
313
  59%|█████▉ | 116/195 [01:12<00:14, 5.55it/s]
314
  61%|██████ | 119/195 [01:12<00:11, 6.63it/s]
315
 
 
316
  61%|██████ | 119/195 [01:12<00:11, 6.63it/s]
317
  62%|██████▏ | 120/195 [01:12<00:15, 4.78it/s]
318
 
 
319
  62%|██████▏ | 120/195 [01:12<00:15, 4.78it/s]
320
 
 
321
  62%|██████▏ | 120/195 [01:13<00:15, 4.78it/s]
322
  63%|██████▎ | 122/195 [01:13<00:13, 5.33it/s]
323
 
 
324
  63%|██████▎ | 122/195 [01:13<00:13, 5.33it/s]
325
 
 
326
  63%|██████▎ | 122/195 [01:13<00:13, 5.33it/s]
327
 
 
328
  63%|██████▎ | 122/195 [01:13<00:13, 5.33it/s]
329
  64%|██████▍ | 125/195 [01:13<00:10, 6.42it/s]
330
 
 
331
  64%|██████▍ | 125/195 [01:13<00:10, 6.42it/s]
332
  65%|██████▍ | 126/195 [01:14<00:14, 4.77it/s]
333
 
 
334
  65%|██████▍ | 126/195 [01:14<00:14, 4.77it/s]
335
 
 
336
  65%|██████▍ | 126/195 [01:14<00:14, 4.77it/s]
337
  66%|██████▌ | 128/195 [01:14<00:12, 5.32it/s]
338
 
 
339
  66%|██████▌ | 128/195 [01:14<00:12, 5.32it/s]
340
 
 
341
  66%|██████▌ | 128/195 [01:14<00:12, 5.32it/s]
342
 
 
343
  66%|██████▌ | 128/195 [01:14<00:12, 5.32it/s]
344
  67%|██████▋ | 131/195 [01:14<00:09, 6.50it/s]
345
 
 
346
  67%|██████▋ | 131/195 [01:14<00:09, 6.50it/s]
347
  68%|██████▊ | 132/195 [01:15<00:12, 4.89it/s]
348
 
 
349
  68%|██████▊ | 132/195 [01:15<00:12, 4.89it/s]
350
 
 
351
  68%|██████▊ | 132/195 [01:15<00:12, 4.89it/s]
352
  69%|██████▊ | 134/195 [01:15<00:11, 5.50it/s]
353
 
 
354
  69%|██████▊ | 134/195 [01:15<00:11, 5.50it/s]
355
 
 
356
  69%|██████▊ | 134/195 [01:15<00:11, 5.50it/s]
357
 
 
358
  69%|██████▊ | 134/195 [01:15<00:11, 5.50it/s]
359
  70%|███████ | 137/195 [01:15<00:08, 6.58it/s]
360
 
 
361
  70%|███████ | 137/195 [01:15<00:08, 6.58it/s]
362
  71%|███████ | 138/195 [01:16<00:11, 4.80it/s]
363
 
 
364
  71%|███████ | 138/195 [01:16<00:11, 4.80it/s]
365
 
 
366
  71%|███████ | 138/195 [01:16<00:11, 4.80it/s]
367
  72%|███████▏ | 140/195 [01:16<00:10, 5.42it/s]
368
 
 
369
  72%|███████▏ | 140/195 [01:16<00:10, 5.42it/s]
370
 
 
371
  72%|███████▏ | 140/195 [01:16<00:10, 5.42it/s]
372
 
 
373
  72%|███████▏ | 140/195 [01:16<00:10, 5.42it/s]
374
  73%|███████▎ | 143/195 [01:16<00:07, 6.51it/s]
375
 
 
376
  73%|███████▎ | 143/195 [01:16<00:07, 6.51it/s]
377
  74%|███████▍ | 144/195 [01:17<00:10, 4.87it/s]
378
 
 
379
  74%|███████▍ | 144/195 [01:17<00:10, 4.87it/s]
380
 
 
381
  74%|███████▍ | 144/195 [01:17<00:10, 4.87it/s]
382
  75%|███████▍ | 146/195 [01:17<00:09, 5.41it/s]
383
 
 
384
  75%|███████▍ | 146/195 [01:17<00:09, 5.41it/s]
385
 
 
386
  75%|███████▍ | 146/195 [01:17<00:09, 5.41it/s]
387
 
 
388
  75%|███████▍ | 146/195 [01:17<00:09, 5.41it/s]
389
  76%|███████▋ | 149/195 [01:17<00:06, 6.58it/s]
390
 
 
391
  76%|███████▋ | 149/195 [01:17<00:06, 6.58it/s]
392
  77%|███████▋ | 150/195 [01:18<00:09, 4.82it/s]
393
 
 
394
  77%|███████▋ | 150/195 [01:18<00:09, 4.82it/s]
395
 
 
396
  77%|███████▋ | 150/195 [01:18<00:09, 4.82it/s]
397
  78%|███████▊ | 152/195 [01:18<00:07, 5.44it/s]
398
 
 
399
  78%|███████▊ | 152/195 [01:18<00:07, 5.44it/s]
400
 
 
401
  78%|███████▊ | 152/195 [01:18<00:07, 5.44it/s]
402
 
 
403
  78%|███████▊ | 152/195 [01:18<00:07, 5.44it/s]
404
  79%|███████▉ | 155/195 [01:18<00:06, 6.53it/s]
405
 
 
406
  79%|███████▉ | 155/195 [01:19<00:06, 6.53it/s]
407
  80%|████████ | 156/195 [01:19<00:08, 4.72it/s]
408
 
 
409
  80%|████████ | 156/195 [01:19<00:08, 4.72it/s]
410
 
 
411
  80%|████████ | 156/195 [01:19<00:08, 4.72it/s]
412
  81%|████████ | 158/195 [01:19<00:06, 5.33it/s]
413
 
 
414
  81%|████████ | 158/195 [01:19<00:06, 5.33it/s]
415
 
 
416
  81%|████████ | 158/195 [01:19<00:06, 5.33it/s]
417
 
 
418
  81%|████████ | 158/195 [01:19<00:06, 5.33it/s]
419
  83%|████████▎ | 161/195 [01:20<00:05, 6.51it/s]
420
 
 
421
  83%|████████▎ | 161/195 [01:20<00:05, 6.51it/s]
422
  83%|████████▎ | 162/195 [01:20<00:06, 4.83it/s]
423
 
 
424
  83%|████████▎ | 162/195 [01:20<00:06, 4.83it/s]
425
 
 
426
  83%|████████▎ | 162/195 [01:20<00:06, 4.83it/s]
427
  84%|████████▍ | 164/195 [01:20<00:05, 5.43it/s]
428
 
 
429
  84%|████████▍ | 164/195 [01:20<00:05, 5.43it/s]
430
 
 
431
  84%|████████▍ | 164/195 [01:20<00:05, 5.43it/s]
432
 
 
433
  84%|████████▍ | 164/195 [01:20<00:05, 5.43it/s]
434
  86%|████████▌ | 167/195 [01:21<00:04, 6.52it/s]
435
 
 
436
  86%|████████▌ | 167/195 [01:21<00:04, 6.52it/s]
437
  86%|████████▌ | 168/195 [01:21<00:05, 4.74it/s]
438
 
 
439
  86%|████████▌ | 168/195 [01:21<00:05, 4.74it/s]
440
 
 
441
  86%|████████▌ | 168/195 [01:21<00:05, 4.74it/s]
442
  87%|████████▋ | 170/195 [01:21<00:04, 5.35it/s]
443
 
 
444
  87%|████████▋ | 170/195 [01:21<00:04, 5.35it/s]
445
 
 
446
  87%|████████▋ | 170/195 [01:21<00:04, 5.35it/s]
447
 
 
448
  87%|████████▋ | 170/195 [01:22<00:04, 5.35it/s]
449
  89%|████████▊ | 173/195 [01:22<00:03, 6.53it/s]
450
 
 
451
  89%|████████▊ | 173/195 [01:22<00:03, 6.53it/s]
452
  89%|████████▉ | 174/195 [01:22<00:04, 4.84it/s]
453
 
 
454
  89%|████████▉ | 174/195 [01:22<00:04, 4.84it/s]
455
 
 
456
  89%|████████▉ | 174/195 [01:22<00:04, 4.84it/s]
457
  90%|█████████ | 176/195 [01:22<00:03, 5.38it/s]
458
 
 
459
  90%|█████████ | 176/195 [01:22<00:03, 5.38it/s]
460
 
 
461
  90%|█████████ | 176/195 [01:23<00:03, 5.38it/s]
462
 
 
463
  90%|█████████ | 176/195 [01:23<00:03, 5.38it/s]
464
  92%|█████████▏| 179/195 [01:23<00:02, 6.56it/s]
465
 
 
466
  92%|█████████▏| 179/195 [01:23<00:02, 6.56it/s]
467
  92%|█████████▏| 180/195 [01:23<00:03, 4.82it/s]
468
 
 
469
  92%|█████████▏| 180/195 [01:23<00:03, 4.82it/s]
470
 
 
471
  92%|█████████▏| 180/195 [01:23<00:03, 4.82it/s]
472
  93%|█████████▎| 182/195 [01:24<00:02, 5.43it/s]
473
 
 
474
  93%|█████████▎| 182/195 [01:24<00:02, 5.43it/s]
475
 
 
476
  93%|█████████▎| 182/195 [01:24<00:02, 5.43it/s]
477
 
 
478
  93%|█████████▎| 182/195 [01:24<00:02, 5.43it/s]
479
  95%|█████████▍| 185/195 [01:24<00:01, 5.69it/s]
480
 
 
481
  95%|█████████▍| 185/195 [01:24<00:01, 5.69it/s]
482
  95%|█████████▌| 186/195 [01:25<00:02, 4.42it/s]
483
 
 
484
  95%|█████████▌| 186/195 [01:25<00:02, 4.42it/s]
485
 
 
486
  95%|█████████▌| 186/195 [01:25<00:02, 4.42it/s]
487
  96%|█████████▋| 188/195 [01:25<00:01, 5.07it/s]
488
 
 
489
  96%|█████████▋| 188/195 [01:25<00:01, 5.07it/s]
490
 
 
491
  96%|█████████▋| 188/195 [01:25<00:01, 5.07it/s]
492
 
 
493
  96%|█████████▋| 188/195 [01:25<00:01, 5.07it/s]
494
  98%|█████████▊| 191/195 [01:25<00:00, 6.28it/s]
495
 
 
496
  98%|█████████▊| 191/195 [01:25<00:00, 6.28it/s]
497
  98%|█████████▊| 192/195 [01:26<00:00, 4.79it/s]
498
 
 
499
  98%|█████████▊| 192/195 [01:26<00:00, 4.79it/s]
500
 
 
501
  98%|█████████▊| 192/195 [01:26<00:00, 4.79it/s]
502
  99%|█████████▉| 194/195 [01:26<00:00, 5.34it/s]
503
 
 
504
  99%|█████████▉| 194/195 [01:26<00:00, 5.34it/s]
 
 
 
 
 
 
 
 
 
 
1
+ /home/ruihang/Workspace/miniconda3/envs/python311/bin/python -m mlc_llm gen_config /models/Llama-2-7b-chat-hf --quantization q0f16 --conv-template llama-2 --output /tmp/tmp8ew5r2yr
2
+ [2024-05-22 00:30:05] INFO auto_config.py:115: Found model configuration: /models/Llama-2-7b-chat-hf/config.json
3
+ [2024-05-22 00:30:05] INFO auto_config.py:153: Found model type: llama. Use `--model-type` to override.
4
+ [2024-05-22 00:30:05] INFO llama_model.py:52: context_window_size not found in config.json. Falling back to max_position_embeddings (4096)
5
+ [2024-05-22 00:30:05] INFO llama_model.py:72: prefill_chunk_size defaults to 2048
6
+ [2024-05-22 00:30:05] INFO config.py:106: Overriding max_batch_size from 1 to 80
7
+ [2024-05-22 00:30:05] INFO gen_config.py:255: [generation_config.json] Setting bos_token_id: 1
8
+ [2024-05-22 00:30:05] INFO gen_config.py:255: [generation_config.json] Setting eos_token_id: 2
9
+ [2024-05-22 00:30:05] INFO gen_config.py:255: [generation_config.json] Setting pad_token_id: 0
10
+ [2024-05-22 00:30:05] INFO gen_config.py:255: [generation_config.json] Setting temperature: 0.6
11
+ [2024-05-22 00:30:05] INFO gen_config.py:255: [generation_config.json] Setting top_p: 0.9
12
+ [2024-05-22 00:30:05] INFO gen_config.py:267: Found tokenizer config: /models/Llama-2-7b-chat-hf/tokenizer.model. Copying to /tmp/tmp8ew5r2yr/tokenizer.model
13
+ [2024-05-22 00:30:05] INFO gen_config.py:267: Found tokenizer config: /models/Llama-2-7b-chat-hf/tokenizer.json. Copying to /tmp/tmp8ew5r2yr/tokenizer.json
14
+ [2024-05-22 00:30:05] INFO gen_config.py:269: Not found tokenizer config: /models/Llama-2-7b-chat-hf/vocab.json
15
+ [2024-05-22 00:30:05] INFO gen_config.py:269: Not found tokenizer config: /models/Llama-2-7b-chat-hf/merges.txt
16
+ [2024-05-22 00:30:05] INFO gen_config.py:269: Not found tokenizer config: /models/Llama-2-7b-chat-hf/added_tokens.json
17
+ [2024-05-22 00:30:05] INFO gen_config.py:267: Found tokenizer config: /models/Llama-2-7b-chat-hf/tokenizer_config.json. Copying to /tmp/tmp8ew5r2yr/tokenizer_config.json
18
+ [2024-05-22 00:30:05] INFO gen_config.py:80: [System default] Setting presence_penalty: 0.0
19
+ [2024-05-22 00:30:05] INFO gen_config.py:80: [System default] Setting frequency_penalty: 0.0
20
+ [2024-05-22 00:30:05] INFO gen_config.py:80: [System default] Setting repetition_penalty: 1.0
21
+ [2024-05-22 00:30:05] INFO gen_config.py:80: [System default] Setting mean_gen_len: 128
22
+ [2024-05-22 00:30:05] INFO gen_config.py:80: [System default] Setting max_gen_len: 512
23
+ [2024-05-22 00:30:05] INFO gen_config.py:80: [System default] Setting shift_fill_factor: 0.3
24
+ [2024-05-22 00:30:05] INFO gen_config.py:335: Dumping configuration file to: /tmp/tmp8ew5r2yr/mlc-chat-config.json
25
+ /home/ruihang/Workspace/miniconda3/envs/python311/bin/python -m mlc_llm convert_weight /models/Llama-2-7b-chat-hf --quantization q0f16 --source-format auto --output /tmp/tmp8ew5r2yr
26
+ [2024-05-22 00:30:06] INFO auto_config.py:115: Found model configuration: /models/Llama-2-7b-chat-hf/config.json
27
+ [2024-05-22 00:30:06] INFO auto_device.py:79: Found device: cuda:0
28
+ [2024-05-22 00:30:06] INFO auto_device.py:79: Found device: cuda:1
29
+ [2024-05-22 00:30:07] INFO auto_device.py:88: Not found device: rocm:0
30
+ [2024-05-22 00:30:08] INFO auto_device.py:88: Not found device: metal:0
31
+ [2024-05-22 00:30:09] INFO auto_device.py:79: Found device: vulkan:0
32
+ [2024-05-22 00:30:09] INFO auto_device.py:79: Found device: vulkan:1
33
+ [2024-05-22 00:30:09] INFO auto_device.py:79: Found device: vulkan:2
34
+ [2024-05-22 00:30:10] INFO auto_device.py:79: Found device: opencl:0
35
+ [2024-05-22 00:30:10] INFO auto_device.py:79: Found device: opencl:1
36
+ [2024-05-22 00:30:10] INFO auto_device.py:35: Using device: cuda:0
37
+ [2024-05-22 00:30:10] INFO auto_weight.py:70: Finding weights in: /models/Llama-2-7b-chat-hf
38
+ [2024-05-22 00:30:10] INFO auto_weight.py:120: Found source weight format: huggingface-torch. Source configuration: /models/Llama-2-7b-chat-hf/pytorch_model.bin.index.json
39
+ [2024-05-22 00:30:10] INFO auto_weight.py:143: Found source weight format: huggingface-safetensor. Source configuration: /models/Llama-2-7b-chat-hf/model.safetensors.index.json
40
+ [2024-05-22 00:30:10] INFO auto_weight.py:106: Using source weight configuration: /models/Llama-2-7b-chat-hf/pytorch_model.bin.index.json. Use `--source` to override.
41
+ [2024-05-22 00:30:10] INFO auto_weight.py:110: Using source weight format: huggingface-torch. Use `--source-format` to override.
42
+ [2024-05-22 00:30:10] INFO auto_config.py:153: Found model type: llama. Use `--model-type` to override.
43
+ [2024-05-22 00:30:10] INFO llama_model.py:52: context_window_size not found in config.json. Falling back to max_position_embeddings (4096)
44
+ [2024-05-22 00:30:10] INFO llama_model.py:72: prefill_chunk_size defaults to 2048
45
+ Weight conversion with arguments:
46
+ --config /models/Llama-2-7b-chat-hf/config.json
47
+ --quantization NoQuantize(name='q0f16', kind='no-quant', model_dtype='float16')
48
+ --model-type llama
49
+ --device cuda:0
50
+ --source /models/Llama-2-7b-chat-hf/pytorch_model.bin.index.json
51
+ --source-format huggingface-torch
52
+ --output /tmp/tmp8ew5r2yr
53
+ Start storing to cache /tmp/tmp8ew5r2yr
54
+
55
  0%| | 0/195 [00:00<?, ?it/s]
56
 
57
+
58
  0%| | 0/195 [00:00<?, ?it/s]
59
 
60
+
61
  0%| | 0/195 [00:08<?, ?it/s]
62
  1%| | 1/195 [00:09<29:48, 9.22s/it]
63
 
64
+
65
  1%| | 1/195 [00:09<29:48, 9.22s/it]
66
 
67
+
68
  1%| | 1/195 [00:09<29:48, 9.22s/it]
69
  2%|▏ | 3/195 [00:09<07:58, 2.49s/it]
70
 
71
+
72
  2%|▏ | 3/195 [00:09<07:58, 2.49s/it]
73
  2%|▏ | 4/195 [00:10<06:17, 1.98s/it]
74
 
75
+
76
  2%|▏ | 4/195 [00:10<06:17, 1.98s/it]
77
 
78
+
79
  2%|▏ | 4/195 [00:10<06:17, 1.98s/it]
80
  3%|▎ | 6/195 [00:10<03:28, 1.10s/it]
81
 
82
+
83
  3%|▎ | 6/195 [00:10<03:28, 1.10s/it]
84
  4%|▎ | 7/195 [00:11<02:38, 1.19it/s]
85
 
86
+
87
  4%|▎ | 7/195 [00:11<02:38, 1.19it/s]
88
 
89
+
90
  4%|▎ | 7/195 [00:11<02:38, 1.19it/s]
91
  5%|▍ | 9/195 [00:11<01:39, 1.87it/s]
92
 
93
+
94
  5%|▍ | 9/195 [00:11<01:39, 1.87it/s]
95
  5%|▌ | 10/195 [00:12<02:00, 1.54it/s]
96
 
97
+
98
  5%|▌ | 10/195 [00:12<02:00, 1.54it/s]
99
 
100
+
101
  5%|▌ | 10/195 [00:12<02:00, 1.54it/s]
102
  6%|▌ | 12/195 [00:12<01:24, 2.15it/s]
103
 
104
+
105
  6%|▌ | 12/195 [00:12<01:24, 2.15it/s]
106
  7%|▋ | 13/195 [00:12<01:09, 2.61it/s]
107
 
108
+
109
  7%|▋ | 13/195 [00:12<01:09, 2.61it/s]
110
 
111
+
112
  7%|▋ | 13/195 [00:12<01:09, 2.61it/s]
113
  8%|▊ | 15/195 [00:13<00:50, 3.53it/s]
114
 
115
+
116
  8%|▊ | 15/195 [00:13<00:50, 3.53it/s]
117
  8%|▊ | 16/195 [00:13<01:15, 2.36it/s]
118
 
119
+
120
  8%|▊ | 16/195 [00:13<01:15, 2.36it/s]
121
 
122
+
123
  8%|▊ | 16/195 [00:14<01:15, 2.36it/s]
124
  9%|▉ | 18/195 [00:14<00:58, 3.04it/s]
125
 
126
+
127
  9%|▉ | 18/195 [00:14<00:58, 3.04it/s]
128
  10%|▉ | 19/195 [00:14<00:49, 3.57it/s]
129
 
130
+
131
  10%|▉ | 19/195 [00:14<00:49, 3.57it/s]
132
 
133
+
134
  10%|▉ | 19/195 [00:14<00:49, 3.57it/s]
135
  11%|█ | 21/195 [00:14<00:38, 4.53it/s]
136
 
137
+
138
  11%|█ | 21/195 [00:14<00:38, 4.53it/s]
139
  11%|█▏ | 22/195 [00:15<00:55, 3.11it/s]
140
 
141
+
142
  11%|█▏ | 22/195 [00:15<00:55, 3.11it/s]
143
 
144
+
145
  11%|█▏ | 22/195 [00:15<00:55, 3.11it/s]
146
  12%|█▏ | 24/195 [00:15<00:44, 3.87it/s]
147
 
148
+
149
  12%|█▏ | 24/195 [00:15<00:44, 3.87it/s]
150
  13%|█▎ | 25/195 [00:15<00:38, 4.45it/s]
151
 
152
+
153
  13%|█▎ | 25/195 [00:15<00:38, 4.45it/s]
154
 
155
+
156
  13%|█▎ | 25/195 [00:15<00:38, 4.45it/s]
157
  14%|█▍ | 27/195 [00:16<00:31, 5.38it/s]
158
 
159
+
160
  14%|█▍ | 27/195 [00:16<00:31, 5.38it/s]
161
  14%|█▍ | 28/195 [00:16<00:53, 3.14it/s]
162
 
163
+
164
  14%|█▍ | 28/195 [00:16<00:53, 3.14it/s]
165
 
166
+
167
  14%|█▍ | 28/195 [00:16<00:53, 3.14it/s]
168
  15%|█▌ | 30/195 [00:17<00:42, 3.89it/s]
169
 
170
+
171
  15%|█▌ | 30/195 [00:17<00:42, 3.89it/s]
172
  16%|█▌ | 31/195 [00:17<00:36, 4.47it/s]
173
 
174
+
175
  16%|█▌ | 31/195 [00:17<00:36, 4.47it/s]
176
 
177
+
178
  16%|█▌ | 31/195 [00:17<00:36, 4.47it/s]
179
  17%|█▋ | 33/195 [00:17<00:32, 4.97it/s]
180
 
181
+
182
  17%|█▋ | 33/195 [00:17<00:32, 4.97it/s]
183
  17%|█▋ | 34/195 [00:18<00:51, 3.12it/s]
184
 
185
+
186
  17%|█▋ | 34/195 [00:18<00:51, 3.12it/s]
187
 
188
+
189
  17%|█▋ | 34/195 [00:18<00:51, 3.12it/s]
190
  18%|█▊ | 36/195 [00:18<00:42, 3.77it/s]
191
 
192
+
193
  18%|█▊ | 36/195 [00:18<00:42, 3.77it/s]
194
 
195
+
196
  18%|█▊ | 36/195 [00:18<00:42, 3.77it/s]
197
  19%|█▉ | 38/195 [00:18<00:29, 5.26it/s]
198
 
199
+
200
  19%|█▉ | 38/195 [00:18<00:29, 5.26it/s]
201
  20%|██ | 39/195 [00:19<00:31, 5.02it/s]
202
 
203
+
204
  20%|██ | 39/195 [00:19<00:31, 5.02it/s]
205
  21%|██ | 40/195 [00:19<00:46, 3.35it/s]
206
 
207
+
208
  21%|██ | 40/195 [00:19<00:46, 3.35it/s]
209
 
210
+
211
  21%|██ | 40/195 [00:19<00:46, 3.35it/s]
212
  22%|██▏ | 42/195 [00:19<00:37, 4.12it/s]
213
 
214
+
215
  22%|██▏ | 42/195 [00:19<00:37, 4.12it/s]
216
  22%|██▏ | 43/195 [00:20<00:32, 4.72it/s]
217
 
218
+
219
  22%|██▏ | 43/195 [00:20<00:32, 4.72it/s]
220
 
221
+
222
  22%|██▏ | 43/195 [00:20<00:32, 4.72it/s]
223
  23%|██▎ | 45/195 [00:20<00:26, 5.62it/s]
224
 
225
+
226
  23%|██▎ | 45/195 [00:20<00:26, 5.62it/s]
227
  24%|██▎ | 46/195 [00:21<00:44, 3.35it/s]
228
 
229
+
230
  24%|██▎ | 46/195 [00:21<00:44, 3.35it/s]
231
 
232
+
233
  24%|██▎ | 46/195 [00:21<00:44, 3.35it/s]
234
  25%|██▍ | 48/195 [00:21<00:35, 4.11it/s]
235
 
236
+
237
  25%|██▍ | 48/195 [00:21<00:35, 4.11it/s]
238
  25%|██▌ | 49/195 [00:21<00:31, 4.70it/s]
239
 
240
+
241
  25%|██▌ | 49/195 [00:21<00:31, 4.70it/s]
242
 
243
+
244
  25%|██▌ | 49/195 [00:21<00:31, 4.70it/s]
245
 
246
+
247
  25%|██▌ | 49/195 [00:21<00:31, 4.70it/s]
248
 
249
+
250
  25%|██▌ | 49/195 [00:58<00:31, 4.70it/s]
251
  26%|██▌ | 51/195 [00:58<17:18, 7.21s/it]
252
 
253
+
254
  26%|██▌ | 51/195 [00:58<17:18, 7.21s/it]
255
 
256
+
257
  26%|██▌ | 51/195 [00:58<17:18, 7.21s/it]
258
  27%|██▋ | 53/195 [00:59<11:13, 4.74s/it]
259
 
260
+
261
  27%|██▋ | 53/195 [00:59<11:13, 4.74s/it]
262
  28%|██▊ | 54/195 [01:00<09:23, 4.00s/it]
263
 
264
+
265
  28%|██▊ | 54/195 [01:00<09:23, 4.00s/it]
266
 
267
+
268
  28%|██▊ | 54/195 [01:00<09:23, 4.00s/it]
269
  29%|██▊ | 56/195 [01:00<06:03, 2.61s/it]
270
 
271
+
272
  29%|██▊ | 56/195 [01:00<06:03, 2.61s/it]
273
  29%|██▉ | 57/195 [01:00<04:50, 2.10s/it]
274
 
275
+
276
  29%|██▉ | 57/195 [01:00<04:50, 2.10s/it]
277
 
278
+
279
  29%|██▉ | 57/195 [01:00<04:50, 2.10s/it]
280
  30%|███ | 59/195 [01:01<03:07, 1.38s/it]
281
 
282
+
283
  30%|███ | 59/195 [01:01<03:07, 1.38s/it]
284
  31%|███ | 60/195 [01:01<02:47, 1.24s/it]
285
 
286
+
287
  31%|███ | 60/195 [01:01<02:47, 1.24s/it]
288
 
289
+
290
  31%|███ | 60/195 [01:01<02:47, 1.24s/it]
291
  32%|███▏ | 62/195 [01:02<01:52, 1.18it/s]
292
 
293
+
294
  32%|███▏ | 62/195 [01:02<01:52, 1.18it/s]
295
  32%|███▏ | 63/195 [01:02<01:31, 1.44it/s]
296
 
297
+
298
  32%|███▏ | 63/195 [01:02<01:31, 1.44it/s]
299
 
300
+
301
  32%|███▏ | 63/195 [01:02<01:31, 1.44it/s]
302
  33%|███▎ | 65/195 [01:02<01:03, 2.04it/s]
303
 
304
+
305
  33%|███▎ | 65/195 [01:02<01:03, 2.04it/s]
306
  34%|███▍ | 66/195 [01:03<01:08, 1.90it/s]
307
 
308
+
309
  34%|███▍ | 66/195 [01:03<01:08, 1.90it/s]
310
 
311
+
312
  34%|███▍ | 66/195 [01:03<01:08, 1.90it/s]
313
  35%|███▍ | 68/195 [01:03<00:48, 2.61it/s]
314
 
315
+
316
  35%|███▍ | 68/195 [01:03<00:48, 2.61it/s]
317
 
318
+
319
  35%|███▍ | 68/195 [01:03<00:48, 2.61it/s]
320
 
321
+
322
  35%|███▍ | 68/195 [01:03<00:48, 2.61it/s]
323
  36%|███▋ | 71/195 [01:03<00:32, 3.82it/s]
324
 
325
+
326
  36%|███▋ | 71/195 [01:03<00:32, 3.82it/s]
327
  37%|███▋ | 72/195 [01:04<00:37, 3.31it/s]
328
 
329
+
330
  37%|███▋ | 72/195 [01:04<00:37, 3.31it/s]
331
 
332
+
333
  37%|███▋ | 72/195 [01:04<00:37, 3.31it/s]
334
  38%|███▊ | 74/195 [01:04<00:30, 4.02it/s]
335
 
336
+
337
  38%|███▊ | 74/195 [01:04<00:30, 4.02it/s]
338
 
339
+
340
  38%|███▊ | 74/195 [01:04<00:30, 4.02it/s]
341
 
342
+
343
  38%|███▊ | 74/195 [01:04<00:30, 4.02it/s]
344
  39%|███▉ | 77/195 [01:04<00:22, 5.26it/s]
345
 
346
+
347
  39%|███▉ | 77/195 [01:05<00:22, 5.26it/s]
348
  40%|████ | 78/195 [01:05<00:27, 4.18it/s]
349
 
350
+
351
  40%|████ | 78/195 [01:05<00:27, 4.18it/s]
352
 
353
+
354
  40%|████ | 78/195 [01:05<00:27, 4.18it/s]
355
  41%|████ | 80/195 [01:05<00:23, 4.83it/s]
356
 
357
+
358
  41%|████ | 80/195 [01:05<00:23, 4.83it/s]
359
 
360
+
361
  41%|████ | 80/195 [01:05<00:23, 4.83it/s]
362
 
363
+
364
  41%|████ | 80/195 [01:05<00:23, 4.83it/s]
365
  43%|████▎ | 83/195 [01:06<00:18, 6.01it/s]
366
 
367
+
368
  43%|████▎ | 83/195 [01:06<00:18, 6.01it/s]
369
  43%|████▎ | 84/195 [01:06<00:24, 4.57it/s]
370
 
371
+
372
  43%|████▎ | 84/195 [01:06<00:24, 4.57it/s]
373
 
374
+
375
  43%|████▎ | 84/195 [01:06<00:24, 4.57it/s]
376
  44%|████▍ | 86/195 [01:06<00:20, 5.19it/s]
377
 
378
+
379
  44%|████▍ | 86/195 [01:06<00:20, 5.19it/s]
380
 
381
+
382
  44%|████▍ | 86/195 [01:06<00:20, 5.19it/s]
383
 
384
+
385
  44%|████▍ | 86/195 [01:06<00:20, 5.19it/s]
386
  46%|████▌ | 89/195 [01:07<00:16, 6.37it/s]
387
 
388
+
389
  46%|████▌ | 89/195 [01:07<00:16, 6.37it/s]
390
  46%|████▌ | 90/195 [01:07<00:21, 4.80it/s]
391
 
392
+
393
  46%|████▌ | 90/195 [01:07<00:21, 4.80it/s]
394
 
395
+
396
  46%|████▌ | 90/195 [01:07<00:21, 4.80it/s]
397
  47%|████▋ | 92/195 [01:07<00:19, 5.41it/s]
398
 
399
+
400
  47%|████▋ | 92/195 [01:07<00:19, 5.41it/s]
401
 
402
+
403
  47%|████▋ | 92/195 [01:07<00:19, 5.41it/s]
404
 
405
+
406
  47%|████▋ | 92/195 [01:07<00:19, 5.41it/s]
407
  49%|████▊ | 95/195 [01:08<00:15, 6.51it/s]
408
 
409
+
410
  49%|████▊ | 95/195 [01:08<00:15, 6.51it/s]
411
  49%|████▉ | 96/195 [01:08<00:20, 4.81it/s]
412
 
413
+
414
  49%|████▉ | 96/195 [01:08<00:20, 4.81it/s]
415
 
416
+
417
  49%|████▉ | 96/195 [01:08<00:20, 4.81it/s]
418
  50%|█████ | 98/195 [01:08<00:17, 5.41it/s]
419
 
420
+
421
  50%|█████ | 98/195 [01:08<00:17, 5.41it/s]
422
 
423
+
424
  50%|█████ | 98/195 [01:09<00:17, 5.41it/s]
425
 
426
+
427
  50%|█████ | 98/195 [01:09<00:17, 5.41it/s]
428
  52%|█████▏ | 101/195 [01:09<00:14, 6.58it/s]
429
 
430
+
431
  52%|█████▏ | 101/195 [01:09<00:14, 6.58it/s]
432
  52%|█████▏ | 102/195 [01:09<00:18, 4.92it/s]
433
 
434
+
435
  52%|█████▏ | 102/195 [01:09<00:18, 4.92it/s]
436
 
437
+
438
  52%|█████▏ | 102/195 [01:09<00:18, 4.92it/s]
439
  53%|█████▎ | 104/195 [01:10<00:16, 5.44it/s]
440
 
441
+
442
  53%|█████▎ | 104/195 [01:10<00:16, 5.44it/s]
443
 
444
+
445
  53%|█████▎ | 104/195 [01:10<00:16, 5.44it/s]
446
 
447
+
448
  53%|█████▎ | 104/195 [01:10<00:16, 5.44it/s]
449
  55%|█████▍ | 107/195 [01:10<00:13, 6.60it/s]
450
 
451
+
452
  55%|█████▍ | 107/195 [01:10<00:13, 6.60it/s]
453
  55%|█████▌ | 108/195 [01:10<00:17, 4.94it/s]
454
 
455
+
456
  55%|█████▌ | 108/195 [01:10<00:17, 4.94it/s]
457
 
458
+
459
  55%|█████▌ | 108/195 [01:10<00:17, 4.94it/s]
460
  56%|█████▋ | 110/195 [01:11<00:15, 5.47it/s]
461
 
462
+
463
  56%|█████▋ | 110/195 [01:11<00:15, 5.47it/s]
464
 
465
+
466
  56%|█████▋ | 110/195 [01:11<00:15, 5.47it/s]
467
 
468
+
469
  56%|█████▋ | 110/195 [01:11<00:15, 5.47it/s]
470
  58%|█████▊ | 113/195 [01:11<00:12, 6.62it/s]
471
 
472
+
473
  58%|█████▊ | 113/195 [01:11<00:12, 6.62it/s]
474
  58%|█████▊ | 114/195 [01:11<00:16, 4.95it/s]
475
 
476
+
477
  58%|█████▊ | 114/195 [01:11<00:16, 4.95it/s]
478
 
479
+
480
  58%|█████▊ | 114/195 [01:11<00:16, 4.95it/s]
481
  59%|█████▉ | 116/195 [01:12<00:14, 5.55it/s]
482
 
483
+
484
  59%|█████▉ | 116/195 [01:12<00:14, 5.55it/s]
485
 
486
+
487
  59%|█████▉ | 116/195 [01:12<00:14, 5.55it/s]
488
 
489
+
490
  59%|█████▉ | 116/195 [01:12<00:14, 5.55it/s]
491
  61%|██████ | 119/195 [01:12<00:11, 6.63it/s]
492
 
493
+
494
  61%|██████ | 119/195 [01:12<00:11, 6.63it/s]
495
  62%|██████▏ | 120/195 [01:12<00:15, 4.78it/s]
496
 
497
+
498
  62%|██████▏ | 120/195 [01:12<00:15, 4.78it/s]
499
 
500
+
501
  62%|██████▏ | 120/195 [01:13<00:15, 4.78it/s]
502
  63%|██████▎ | 122/195 [01:13<00:13, 5.33it/s]
503
 
504
+
505
  63%|██████▎ | 122/195 [01:13<00:13, 5.33it/s]
506
 
507
+
508
  63%|██████▎ | 122/195 [01:13<00:13, 5.33it/s]
509
 
510
+
511
  63%|██████▎ | 122/195 [01:13<00:13, 5.33it/s]
512
  64%|██████▍ | 125/195 [01:13<00:10, 6.42it/s]
513
 
514
+
515
  64%|██████▍ | 125/195 [01:13<00:10, 6.42it/s]
516
  65%|██████▍ | 126/195 [01:14<00:14, 4.77it/s]
517
 
518
+
519
  65%|██████▍ | 126/195 [01:14<00:14, 4.77it/s]
520
 
521
+
522
  65%|██████▍ | 126/195 [01:14<00:14, 4.77it/s]
523
  66%|██████▌ | 128/195 [01:14<00:12, 5.32it/s]
524
 
525
+
526
  66%|██████▌ | 128/195 [01:14<00:12, 5.32it/s]
527
 
528
+
529
  66%|██████▌ | 128/195 [01:14<00:12, 5.32it/s]
530
 
531
+
532
  66%|██████▌ | 128/195 [01:14<00:12, 5.32it/s]
533
  67%|██████▋ | 131/195 [01:14<00:09, 6.50it/s]
534
 
535
+
536
  67%|██████▋ | 131/195 [01:14<00:09, 6.50it/s]
537
  68%|██████▊ | 132/195 [01:15<00:12, 4.89it/s]
538
 
539
+
540
  68%|██████▊ | 132/195 [01:15<00:12, 4.89it/s]
541
 
542
+
543
  68%|██████▊ | 132/195 [01:15<00:12, 4.89it/s]
544
  69%|██████▊ | 134/195 [01:15<00:11, 5.50it/s]
545
 
546
+
547
  69%|██████▊ | 134/195 [01:15<00:11, 5.50it/s]
548
 
549
+
550
  69%|██████▊ | 134/195 [01:15<00:11, 5.50it/s]
551
 
552
+
553
  69%|██████▊ | 134/195 [01:15<00:11, 5.50it/s]
554
  70%|███████ | 137/195 [01:15<00:08, 6.58it/s]
555
 
556
+
557
  70%|███████ | 137/195 [01:15<00:08, 6.58it/s]
558
  71%|███████ | 138/195 [01:16<00:11, 4.80it/s]
559
 
560
+
561
  71%|███████ | 138/195 [01:16<00:11, 4.80it/s]
562
 
563
+
564
  71%|███████ | 138/195 [01:16<00:11, 4.80it/s]
565
  72%|███████▏ | 140/195 [01:16<00:10, 5.42it/s]
566
 
567
+
568
  72%|███████▏ | 140/195 [01:16<00:10, 5.42it/s]
569
 
570
+
571
  72%|███████▏ | 140/195 [01:16<00:10, 5.42it/s]
572
 
573
+
574
  72%|███████▏ | 140/195 [01:16<00:10, 5.42it/s]
575
  73%|███████▎ | 143/195 [01:16<00:07, 6.51it/s]
576
 
577
+
578
  73%|███████▎ | 143/195 [01:16<00:07, 6.51it/s]
579
  74%|███████▍ | 144/195 [01:17<00:10, 4.87it/s]
580
 
581
+
582
  74%|███████▍ | 144/195 [01:17<00:10, 4.87it/s]
583
 
584
+
585
  74%|███████▍ | 144/195 [01:17<00:10, 4.87it/s]
586
  75%|███████▍ | 146/195 [01:17<00:09, 5.41it/s]
587
 
588
+
589
  75%|███████▍ | 146/195 [01:17<00:09, 5.41it/s]
590
 
591
+
592
  75%|███████▍ | 146/195 [01:17<00:09, 5.41it/s]
593
 
594
+
595
  75%|███████▍ | 146/195 [01:17<00:09, 5.41it/s]
596
  76%|███████▋ | 149/195 [01:17<00:06, 6.58it/s]
597
 
598
+
599
  76%|███████▋ | 149/195 [01:17<00:06, 6.58it/s]
600
  77%|███████▋ | 150/195 [01:18<00:09, 4.82it/s]
601
 
602
+
603
  77%|███████▋ | 150/195 [01:18<00:09, 4.82it/s]
604
 
605
+
606
  77%|███████▋ | 150/195 [01:18<00:09, 4.82it/s]
607
  78%|███████▊ | 152/195 [01:18<00:07, 5.44it/s]
608
 
609
+
610
  78%|███████▊ | 152/195 [01:18<00:07, 5.44it/s]
611
 
612
+
613
  78%|███████▊ | 152/195 [01:18<00:07, 5.44it/s]
614
 
615
+
616
  78%|███████▊ | 152/195 [01:18<00:07, 5.44it/s]
617
  79%|███████▉ | 155/195 [01:18<00:06, 6.53it/s]
618
 
619
+
620
  79%|███████▉ | 155/195 [01:19<00:06, 6.53it/s]
621
  80%|████████ | 156/195 [01:19<00:08, 4.72it/s]
622
 
623
+
624
  80%|████████ | 156/195 [01:19<00:08, 4.72it/s]
625
 
626
+
627
  80%|████████ | 156/195 [01:19<00:08, 4.72it/s]
628
  81%|████████ | 158/195 [01:19<00:06, 5.33it/s]
629
 
630
+
631
  81%|████████ | 158/195 [01:19<00:06, 5.33it/s]
632
 
633
+
634
  81%|████████ | 158/195 [01:19<00:06, 5.33it/s]
635
 
636
+
637
  81%|████████ | 158/195 [01:19<00:06, 5.33it/s]
638
  83%|████████▎ | 161/195 [01:20<00:05, 6.51it/s]
639
 
640
+
641
  83%|████████▎ | 161/195 [01:20<00:05, 6.51it/s]
642
  83%|████████▎ | 162/195 [01:20<00:06, 4.83it/s]
643
 
644
+
645
  83%|████████▎ | 162/195 [01:20<00:06, 4.83it/s]
646
 
647
+
648
  83%|████████▎ | 162/195 [01:20<00:06, 4.83it/s]
649
  84%|████████▍ | 164/195 [01:20<00:05, 5.43it/s]
650
 
651
+
652
  84%|████████▍ | 164/195 [01:20<00:05, 5.43it/s]
653
 
654
+
655
  84%|████████▍ | 164/195 [01:20<00:05, 5.43it/s]
656
 
657
+
658
  84%|████████▍ | 164/195 [01:20<00:05, 5.43it/s]
659
  86%|████████▌ | 167/195 [01:21<00:04, 6.52it/s]
660
 
661
+
662
  86%|████████▌ | 167/195 [01:21<00:04, 6.52it/s]
663
  86%|████████▌ | 168/195 [01:21<00:05, 4.74it/s]
664
 
665
+
666
  86%|████████▌ | 168/195 [01:21<00:05, 4.74it/s]
667
 
668
+
669
  86%|████████▌ | 168/195 [01:21<00:05, 4.74it/s]
670
  87%|████████▋ | 170/195 [01:21<00:04, 5.35it/s]
671
 
672
+
673
  87%|████████▋ | 170/195 [01:21<00:04, 5.35it/s]
674
 
675
+
676
  87%|████████▋ | 170/195 [01:21<00:04, 5.35it/s]
677
 
678
+
679
  87%|████████▋ | 170/195 [01:22<00:04, 5.35it/s]
680
  89%|████████▊ | 173/195 [01:22<00:03, 6.53it/s]
681
 
682
+
683
  89%|████████▊ | 173/195 [01:22<00:03, 6.53it/s]
684
  89%|████████▉ | 174/195 [01:22<00:04, 4.84it/s]
685
 
686
+
687
  89%|████████▉ | 174/195 [01:22<00:04, 4.84it/s]
688
 
689
+
690
  89%|████████▉ | 174/195 [01:22<00:04, 4.84it/s]
691
  90%|█████████ | 176/195 [01:22<00:03, 5.38it/s]
692
 
693
+
694
  90%|█████████ | 176/195 [01:22<00:03, 5.38it/s]
695
 
696
+
697
  90%|█████████ | 176/195 [01:23<00:03, 5.38it/s]
698
 
699
+
700
  90%|█████████ | 176/195 [01:23<00:03, 5.38it/s]
701
  92%|█████████▏| 179/195 [01:23<00:02, 6.56it/s]
702
 
703
+
704
  92%|█████████▏| 179/195 [01:23<00:02, 6.56it/s]
705
  92%|█████████▏| 180/195 [01:23<00:03, 4.82it/s]
706
 
707
+
708
  92%|█████████▏| 180/195 [01:23<00:03, 4.82it/s]
709
 
710
+
711
  92%|█████████▏| 180/195 [01:23<00:03, 4.82it/s]
712
  93%|█████████▎| 182/195 [01:24<00:02, 5.43it/s]
713
 
714
+
715
  93%|█████████▎| 182/195 [01:24<00:02, 5.43it/s]
716
 
717
+
718
  93%|█████████▎| 182/195 [01:24<00:02, 5.43it/s]
719
 
720
+
721
  93%|█████████▎| 182/195 [01:24<00:02, 5.43it/s]
722
  95%|█████████▍| 185/195 [01:24<00:01, 5.69it/s]
723
 
724
+
725
  95%|█████████▍| 185/195 [01:24<00:01, 5.69it/s]
726
  95%|█████████▌| 186/195 [01:25<00:02, 4.42it/s]
727
 
728
+
729
  95%|█████████▌| 186/195 [01:25<00:02, 4.42it/s]
730
 
731
+
732
  95%|█████████▌| 186/195 [01:25<00:02, 4.42it/s]
733
  96%|█████████▋| 188/195 [01:25<00:01, 5.07it/s]
734
 
735
+
736
  96%|█████████▋| 188/195 [01:25<00:01, 5.07it/s]
737
 
738
+
739
  96%|█████████▋| 188/195 [01:25<00:01, 5.07it/s]
740
 
741
+
742
  96%|█████████▋| 188/195 [01:25<00:01, 5.07it/s]
743
  98%|█████████▊| 191/195 [01:25<00:00, 6.28it/s]
744
 
745
+
746
  98%|█████████▊| 191/195 [01:25<00:00, 6.28it/s]
747
  98%|█████████▊| 192/195 [01:26<00:00, 4.79it/s]
748
 
749
+
750
  98%|█████████▊| 192/195 [01:26<00:00, 4.79it/s]
751
 
752
+
753
  98%|█████████▊| 192/195 [01:26<00:00, 4.79it/s]
754
  99%|█████████▉| 194/195 [01:26<00:00, 5.34it/s]
755
 
756
+
757
  99%|█████████▉| 194/195 [01:26<00:00, 5.34it/s]
758
+ [2024-05-22 00:31:37] INFO huggingface_loader.py:196: Unloading HF weight file: /models/Llama-2-7b-chat-hf/pytorch_model-00001-of-00002.bin
759
+ [2024-05-22 00:31:38] INFO stats.py:76: Time usage: HF loading: 44.115 sec; Pre-quantization mapping: 7.475 sec; Quantization: 0.000 sec
760
+ [2024-05-22 00:31:38] INFO stats.py:90: RAM usage: Peak RAM: 9.291 GB. Total bytes loaded from disk: 12.551 GB
761
+ [2024-05-22 00:31:38] INFO convert_weight.py:155: Parameter size after quantization: 12.551 GB
762
+ [2024-05-22 00:31:38] INFO convert_weight.py:160: Total parameters: 6,738,415,616
763
+ [2024-05-22 00:31:38] INFO convert_weight.py:161: Bits per parameter: 16.000
764
+ [2024-05-22 00:31:38] INFO convert_weight.py:166: Saved to directory: /tmp/tmp8ew5r2yr
765
+
766
+ All finished, 131 total shards committed, record saved to /tmp/tmp8ew5r2yr/ndarray-cache.json
mlc-chat-config.json ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "llama",
3
+ "quantization": "q0f16",
4
+ "model_config": {
5
+ "hidden_size": 4096,
6
+ "intermediate_size": 11008,
7
+ "num_attention_heads": 32,
8
+ "num_hidden_layers": 32,
9
+ "rms_norm_eps": 1e-06,
10
+ "vocab_size": 32000,
11
+ "position_embedding_base": 10000,
12
+ "context_window_size": 4096,
13
+ "prefill_chunk_size": 2048,
14
+ "num_key_value_heads": 32,
15
+ "head_dim": 128,
16
+ "tensor_parallel_shards": 1,
17
+ "max_batch_size": 80
18
+ },
19
+ "vocab_size": 32000,
20
+ "context_window_size": 4096,
21
+ "sliding_window_size": -1,
22
+ "prefill_chunk_size": 2048,
23
+ "attention_sink_size": -1,
24
+ "tensor_parallel_shards": 1,
25
+ "mean_gen_len": 128,
26
+ "max_gen_len": 512,
27
+ "shift_fill_factor": 0.3,
28
+ "temperature": 0.6,
29
+ "presence_penalty": 0.0,
30
+ "frequency_penalty": 0.0,
31
+ "repetition_penalty": 1.0,
32
+ "top_p": 0.9,
33
+ "conv_template": {
34
+ "name": "llama-2",
35
+ "system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n",
36
+ "system_message": "You are a helpful, respectful and honest assistant.",
37
+ "system_prefix_token_ids": [
38
+ 1
39
+ ],
40
+ "add_role_after_system_message": false,
41
+ "roles": {
42
+ "user": "<s>[INST]",
43
+ "assistant": "[/INST]",
44
+ "tool": "[INST]"
45
+ },
46
+ "role_templates": {
47
+ "user": "{user_message}",
48
+ "assistant": "{assistant_message}",
49
+ "tool": "{tool_message}"
50
+ },
51
+ "messages": [],
52
+ "seps": [
53
+ " ",
54
+ " </s>"
55
+ ],
56
+ "role_content_sep": " ",
57
+ "role_empty_sep": " ",
58
+ "stop_str": [
59
+ "[INST]"
60
+ ],
61
+ "stop_token_ids": [
62
+ 2
63
+ ],
64
+ "function_string": "",
65
+ "use_function_calling": false
66
+ },
67
+ "pad_token_id": 0,
68
+ "bos_token_id": 1,
69
+ "eos_token_id": 2,
70
+ "tokenizer_files": [
71
+ "tokenizer.model",
72
+ "tokenizer.json",
73
+ "tokenizer_config.json"
74
+ ],
75
+ "token_table_postproc_method": "byte_fallback",
76
+ "version": "0.1.0"
77
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c82acf0f390411b8f3e071702ab6cb79d05d6b2b894af831001f25d32e0ab1e1
3
+ size 262144000
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:106e8a821011d724b7f1241642ecf78879e826319f95c3cb286f8cda78edfbd4
3
+ size 90177536
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe1e3fafa7c030fabc2555a4aec0f69754ccea75810b99b6cb25032481828cf6
3
+ size 180355072
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f86376cd89a5d6c2871f92df82ee8a8ac2fb3719bd76990f7a8c3751ced05d9e
3
+ size 100663296
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a23209c92a4de08f01f590e86c05550d4f9cd7b09026cf7db3889fa2f7631292
3
+ size 33554432
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5c431da9b0c87ae1ea137823781c5f59bd7a3a4208235c03bbdddeba1a50bd1
3
+ size 90177536
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:890556b34cf64071ae1e2d963246e721228abf101f1beaf668330689aa411e60
3
+ size 180355072
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7ea55b7ecb31513ecddbaf5d2af31677c680c8c1df70e2fe461f65d3097e58b
3
+ size 100663296
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd25f92eb7d9989192ee70823f46221d2e34021a40299703a0aff4da3fe577b6
3
+ size 33554432
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fb5921bffeec01dcbde3337439cbbe7a17af324342c4692f829717fa635f95b
3
+ size 90177536
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:412a16b7382f43671eca72726d7c1c6aa5c5457dc31d21d3ca0322c6e874510f
3
+ size 180355072
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1c0fbc97262d1f66587d3cdab0d6ba796030dc5aa3bb39e1940548d25798b66
3
+ size 100663296
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecdc141700f1211748c51581929cd3ef008f0cf90984d8b99c72d511fe933228
3
+ size 33554432
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a91698047e5e2cdf10352fbae0a543b00f0b5ee5f5641f14e4a5dfcbae38b87
3
+ size 100663296
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f7663ae3cb01aa5ef0f5faf0c3501e5866c4e5b00f431fb5870027d26dec1b4
3
+ size 90177536
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6f27eca17673b962330affcf8be33f6376443cda6246b669d6d22abbe8400d2
3
+ size 180355072
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcb7fe8fff62cdd3ad71c57834f4968e1f0535ed8c22796c9740955c57aa9358
3
+ size 100663296
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91b72108e1ee3f8a888e23f76dcdf65d70ae78b27bef12a31c71199d5a109071
3
+ size 33554432
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99834e9dc3779a64632e87d38dccd40bec3cfd29433ae68b1fd56408cee35dbd
3
+ size 90177536
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b54b37221472531b9617451ed64277ac6127cd527d8a152b9cf6524baadd579d
3
+ size 180355072
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8254d40a5ff399a0d4d69311a918c0c28b38905dcf88881f82351d7cffaca307
3
+ size 100663296
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1175e3d5178225b867ad5744133215c98f62f7a7dc7da2e449a2d1a5dc1b77f
3
+ size 33554432
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8da1458efd7b705a77bd0fb2462a4ca699b99f499e62f5df060cf2c4d24367a4
3
+ size 90177536
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:308fd51e6030ac6a1aa00d594646a3461259f106c64921319f4e5a9f4672eb4d
3
+ size 180355072
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dfd67a74420433e411bae645b94f80e59b159727635b819bd9580d292c8ea33
3
+ size 33554432
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:454f659581268e99fa93293fdb1ed6eb1b0d6ddf57dfd50964d6afa0ee465312
3
+ size 100663296
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:866706c3393eb7d12e673f5cadbe0999809e21b5513caedcece80bf8228de2a0
3
+ size 33554432
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bcff9547e262f5a79d8c44f19f8744e3574458f253fa36ae804eace6ebb48ab
3
+ size 90177536
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2a1035caf4b9073d2a67b3493b1b9392bef7d274814f14ac2d7e140108abeba
3
+ size 180355072
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f49cb1d10398bf5e6512839fad0d6e55bd3e08139064b38fa881c605b2f5f17d
3
+ size 100663296
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02686f613907af9428296a15bc1a50f137c3176979756bcaef84fd535326ffa9
3
+ size 33554432
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fac7c9231aeb4cbf40c86d2efa8dbfdae0f935678e89d0ed1e5932843b46a63b
3
+ size 90177536
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:537a0ae2ef4d887c43193ee94748dca11b8b497ec3445521f370c368f9a8db22
3
+ size 180355072
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cecbb255e4aa37e122de9783c67676c7404447e155f041df09e256e9b1c0eba
3
+ size 100663296
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40cbdf9e6fc55d6db597c1997c557f1be3d7528bfb9f5e749cde4efa11de8b99
3
+ size 33554432
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:415c8fce0ef3057da704a879a037349d482953604d5f1b13d0094ead6f8bbff8
3
+ size 90177536
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5313166331b4b3cbbdf6e6eb14575e543271969c134affeb8c24b0819c46e999
3
+ size 532480
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c068d9a20dc11e42a1758a204d5089bc448e533e06ca91ae8f088e8c81784301
3
+ size 180355072
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42359fda2ba2830d26593cde8177763c7b230f8c06cd2be170748384b051a59b
3
+ size 100663296
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf39454db1d0ea4263c5932bc08cf8d20fe9362e91f2df99994ce686e0783c9a
3
+ size 33554432
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d27836197f2185bf5e156879999766a58a174ca68ee82d3ac7d1dc3cd71ada71
3
+ size 90177536
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d60cf0ee0435346f25a60771f1f7160369c59cca4e7a4c4f6cf3fe6a2df920e2
3
+ size 180355072
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2825c85d632bffcd7b09242da7c7fba10b678827db4af10255f7c0d4f82e72d5
3
+ size 100663296
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ead039b62eb49d02d56d611e4c4683dbbcd30d53860ac4c015108040cebc3546
3
+ size 180355072
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79565c3ce00cd083ac33beef8c1d48e4342a16fc77456514b7ccf2e1e2325f1d
3
+ size 33554432
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2d349cad6eeca2eaa53c09059a6812ccfd31546711e60fdac425ecdeb8245f9
3
+ size 90177536
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5424bb60b1830416c670a528e0a3c8cfdac621edee256fadfc9e521c0d017b6d
3
+ size 180355072