mengshyu committed on
Commit
7d2985c
1 Parent(s): 74f29ca

Initial commit

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
added_tokens.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<|endoftext|>": 32000,
3
+ "<|assistant|>": 32001,
4
+ "<|placeholder1|>": 32002,
5
+ "<|placeholder2|>": 32003,
6
+ "<|placeholder3|>": 32004,
7
+ "<|placeholder4|>": 32005,
8
+ "<|system|>": 32006,
9
+ "<|end|>": 32007,
10
+ "<|placeholder5|>": 32008,
11
+ "<|placeholder6|>": 32009,
12
+ "<|user|>": 32010
13
+ }
logs.txt ADDED
@@ -0,0 +1,262 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/195 [00:00<?, ?it/s]
1
 
 
2
  0%| | 0/195 [00:00<?, ?it/s]
3
 
 
4
  0%| | 0/195 [00:01<?, ?it/s]/home/msyu/workspace/venv/lib/python3.10/site-packages/numpy/core/getlimits.py:549: UserWarning: The value of the smallest subnormal for <class 'numpy.float32'> type is zero.
 
 
 
 
5
  1%| | 1/195 [00:02<07:35, 2.35s/it]
6
 
 
7
  1%| | 1/195 [00:02<07:35, 2.35s/it]
8
 
 
9
  1%| | 1/195 [00:02<07:35, 2.35s/it]
10
  2%|▏ | 3/195 [00:02<02:14, 1.43it/s]
11
 
 
12
  2%|▏ | 3/195 [00:02<02:14, 1.43it/s]
13
  2%|▏ | 4/195 [00:03<01:58, 1.61it/s]
14
 
 
15
  2%|▏ | 4/195 [00:03<01:58, 1.61it/s]
16
 
 
17
  2%|▏ | 4/195 [00:03<01:58, 1.61it/s]
18
  3%|▎ | 6/195 [00:03<01:11, 2.64it/s]
19
 
 
20
  3%|▎ | 6/195 [00:03<01:11, 2.64it/s]
21
 
 
22
  3%|▎ | 6/195 [00:03<01:11, 2.64it/s]
23
  4%|▍ | 8/195 [00:03<00:50, 3.69it/s]
24
 
 
25
  4%|▍ | 8/195 [00:03<00:50, 3.69it/s]
26
  5%|▍ | 9/195 [00:04<00:58, 3.16it/s]
27
 
 
28
  5%|▍ | 9/195 [00:04<00:58, 3.16it/s]
29
 
 
30
  5%|▍ | 9/195 [00:04<00:58, 3.16it/s]
31
 
 
32
  5%|▍ | 9/195 [00:04<00:58, 3.16it/s]
33
  6%|▌ | 12/195 [00:04<00:39, 4.64it/s]
34
 
 
35
  6%|▌ | 12/195 [00:04<00:39, 4.64it/s]
36
 
 
37
  6%|▌ | 12/195 [00:04<00:39, 4.64it/s]
38
  7%|▋ | 14/195 [00:04<00:33, 5.41it/s]
39
 
 
40
  7%|▋ | 14/195 [00:04<00:33, 5.41it/s]
41
  8%|▊ | 15/195 [00:05<00:42, 4.21it/s]
42
 
 
43
  8%|▊ | 15/195 [00:05<00:42, 4.21it/s]
44
 
 
45
  8%|▊ | 15/195 [00:05<00:42, 4.21it/s]
46
 
 
47
  8%|▊ | 15/195 [00:05<00:42, 4.21it/s]
48
  9%|▉ | 18/195 [00:05<00:32, 5.42it/s]
49
 
 
50
  9%|▉ | 18/195 [00:05<00:32, 5.42it/s]
51
 
 
52
  9%|▉ | 18/195 [00:05<00:32, 5.42it/s]
53
  10%|█ | 20/195 [00:05<00:28, 6.06it/s]
54
 
 
55
  10%|█ | 20/195 [00:05<00:28, 6.06it/s]
56
  11%|█ | 21/195 [00:06<00:37, 4.59it/s]
57
 
 
58
  11%|█ | 21/195 [00:06<00:37, 4.59it/s]
59
 
 
60
  11%|█ | 21/195 [00:06<00:37, 4.59it/s]
61
 
 
62
  11%|█ | 21/195 [00:06<00:37, 4.59it/s]
63
  12%|█▏ | 24/195 [00:06<00:29, 5.72it/s]
64
 
 
65
  12%|█▏ | 24/195 [00:06<00:29, 5.72it/s]
66
 
 
67
  12%|█▏ | 24/195 [00:06<00:29, 5.72it/s]
68
  13%|█▎ | 26/195 [00:06<00:26, 6.30it/s]
69
 
 
70
  13%|█▎ | 26/195 [00:06<00:26, 6.30it/s]
71
  14%|█▍ | 27/195 [00:07<00:37, 4.54it/s]
72
 
 
73
  14%|█▍ | 27/195 [00:07<00:37, 4.54it/s]
74
 
 
75
  14%|█▍ | 27/195 [00:07<00:37, 4.54it/s]
76
 
 
77
  14%|█▍ | 27/195 [00:07<00:37, 4.54it/s]
78
  15%|█▌ | 30/195 [00:07<00:29, 5.66it/s]
79
 
 
80
  15%|█▌ | 30/195 [00:07<00:29, 5.66it/s]
81
 
 
82
  15%|█▌ | 30/195 [00:07<00:29, 5.66it/s]
83
  16%|█▋ | 32/195 [00:07<00:26, 6.24it/s]
84
 
 
85
  16%|█▋ | 32/195 [00:07<00:26, 6.24it/s]
86
  17%|█▋ | 33/195 [00:08<00:36, 4.46it/s]
87
 
 
88
  17%|█▋ | 33/195 [00:08<00:36, 4.46it/s]
89
 
 
90
  17%|█▋ | 33/195 [00:08<00:36, 4.46it/s]
91
 
 
92
  17%|█▋ | 33/195 [00:08<00:36, 4.46it/s]
93
  18%|█▊ | 36/195 [00:08<00:28, 5.59it/s]
94
 
 
95
  18%|█▊ | 36/195 [00:08<00:28, 5.59it/s]
96
 
 
97
  18%|█▊ | 36/195 [00:08<00:28, 5.59it/s]
98
  19%|█▉ | 38/195 [00:09<00:30, 5.13it/s]
99
 
 
100
  19%|█▉ | 38/195 [00:09<00:30, 5.13it/s]
101
  20%|██ | 39/195 [00:09<00:39, 3.90it/s]
102
 
 
103
  20%|██ | 39/195 [00:09<00:39, 3.90it/s]
104
 
 
105
  20%|██ | 39/195 [00:09<00:39, 3.90it/s]
106
 
 
107
  20%|██ | 39/195 [00:09<00:39, 3.90it/s]
108
  22%|██▏ | 42/195 [00:10<00:30, 5.06it/s]
109
 
 
110
  22%|██▏ | 42/195 [00:10<00:30, 5.06it/s]
111
 
 
112
  22%|██▏ | 42/195 [00:10<00:30, 5.06it/s]
113
  23%|██▎ | 44/195 [00:10<00:26, 5.71it/s]
114
 
 
115
  23%|██▎ | 44/195 [00:10<00:26, 5.71it/s]
116
  23%|██▎ | 45/195 [00:10<00:35, 4.21it/s]
117
 
 
118
  23%|██▎ | 45/195 [00:10<00:35, 4.21it/s]
119
 
 
120
  23%|██▎ | 45/195 [00:10<00:35, 4.21it/s]
121
 
 
122
  23%|██▎ | 45/195 [00:10<00:35, 4.21it/s]
123
  25%|██▍ | 48/195 [00:11<00:27, 5.34it/s]
124
 
 
125
  25%|██▍ | 48/195 [00:11<00:27, 5.34it/s]
126
 
 
127
  25%|██▍ | 48/195 [00:11<00:27, 5.34it/s]
128
  26%|██▌ | 50/195 [00:11<00:24, 5.96it/s]
129
 
 
130
  26%|██▌ | 50/195 [00:11<00:24, 5.96it/s]
131
  26%|██▌ | 51/195 [00:12<00:33, 4.29it/s]
132
 
 
133
  26%|██▌ | 51/195 [00:12<00:33, 4.29it/s]
134
 
 
135
  26%|██▌ | 51/195 [00:12<00:33, 4.29it/s]
136
 
 
137
  26%|██▌ | 51/195 [00:12<00:33, 4.29it/s]
138
  28%|██▊ | 54/195 [00:12<00:25, 5.43it/s]
139
 
 
140
  28%|██▊ | 54/195 [00:12<00:25, 5.43it/s]
141
 
 
142
  28%|██▊ | 54/195 [00:12<00:25, 5.43it/s]
143
  29%|██▊ | 56/195 [00:12<00:23, 6.03it/s]
144
 
 
145
  29%|██▊ | 56/195 [00:12<00:23, 6.03it/s]
146
  29%|██▉ | 57/195 [00:13<00:32, 4.28it/s]
147
 
 
148
  29%|██▉ | 57/195 [00:13<00:32, 4.28it/s]
149
 
 
150
  29%|██▉ | 57/195 [00:13<00:32, 4.28it/s]
151
 
 
152
  29%|██▉ | 57/195 [00:13<00:32, 4.28it/s]
153
  31%|███ | 60/195 [00:13<00:24, 5.42it/s]
154
 
 
155
  31%|███ | 60/195 [00:13<00:24, 5.42it/s]
156
 
 
157
  31%|███ | 60/195 [00:13<00:24, 5.42it/s]
158
  32%|███▏ | 62/195 [00:13<00:22, 6.02it/s]
159
 
 
160
  32%|███▏ | 62/195 [00:13<00:22, 6.02it/s]
161
  32%|███▏ | 63/195 [00:14<00:44, 2.96it/s]
162
 
 
163
  32%|███▏ | 63/195 [00:14<00:44, 2.96it/s]
164
 
 
165
  32%|███▏ | 63/195 [00:14<00:44, 2.96it/s]
166
 
 
167
  32%|███▏ | 63/195 [00:15<00:44, 2.96it/s]
168
  34%|███▍ | 66/195 [00:15<00:31, 4.05it/s]
169
 
 
170
  34%|███▍ | 66/195 [00:15<00:31, 4.05it/s]
171
 
 
172
  34%|███▍ | 66/195 [00:15<00:31, 4.05it/s]
173
 
 
174
  34%|███▍ | 66/195 [00:15<00:31, 4.05it/s]
175
 
 
176
  34%|███▍ | 66/195 [00:16<00:31, 4.05it/s]
177
  35%|███▍ | 68/195 [00:17<01:01, 2.08it/s]
178
 
 
179
  35%|███▍ | 68/195 [00:17<01:01, 2.08it/s]
180
 
 
181
  35%|███▍ | 68/195 [00:17<01:01, 2.08it/s]
182
  36%|███▌ | 70/195 [00:17<00:47, 2.65it/s]
183
 
 
184
  36%|███▌ | 70/195 [00:17<00:47, 2.65it/s]
185
  36%|███▋ | 71/195 [00:18<00:48, 2.55it/s]
186
 
 
187
  36%|███▋ | 71/195 [00:18<00:48, 2.55it/s]
188
 
 
189
  36%|███▋ | 71/195 [00:18<00:48, 2.55it/s]
190
 
 
191
  36%|███▋ | 71/195 [00:18<00:48, 2.55it/s]
192
  38%|███▊ | 74/195 [00:18<00:33, 3.61it/s]
193
 
 
194
  38%|███▊ | 74/195 [00:18<00:33, 3.61it/s]
195
 
 
196
  38%|███▊ | 74/195 [00:18<00:33, 3.61it/s]
197
  39%|███▉ | 76/195 [00:18<00:27, 4.32it/s]
198
 
 
199
  39%|███▉ | 76/195 [00:18<00:27, 4.32it/s]
200
  39%|███▉ | 77/195 [00:19<00:32, 3.67it/s]
201
 
 
202
  39%|███▉ | 77/195 [00:19<00:32, 3.67it/s]
203
 
 
204
  39%|███▉ | 77/195 [00:19<00:32, 3.67it/s]
205
 
 
206
  39%|███▉ | 77/195 [00:19<00:32, 3.67it/s]
207
  41%|████ | 80/195 [00:19<00:23, 4.82it/s]
208
 
 
209
  41%|████ | 80/195 [00:19<00:23, 4.82it/s]
210
 
 
211
  41%|████ | 80/195 [00:19<00:23, 4.82it/s]
212
  42%|████▏ | 82/195 [00:19<00:20, 5.49it/s]
213
 
 
214
  42%|████▏ | 82/195 [00:19<00:20, 5.49it/s]
215
  43%|████▎ | 83/195 [00:20<00:25, 4.33it/s]
216
 
 
217
  43%|████▎ | 83/195 [00:20<00:25, 4.33it/s]
218
 
 
219
  43%|████▎ | 83/195 [00:20<00:25, 4.33it/s]
220
 
 
221
  43%|████▎ | 83/195 [00:20<00:25, 4.33it/s]
222
  44%|████▍ | 86/195 [00:20<00:20, 5.45it/s]
223
 
 
224
  44%|████▍ | 86/195 [00:20<00:20, 5.45it/s]
225
 
 
226
  44%|████▍ | 86/195 [00:20<00:20, 5.45it/s]
227
  45%|████▌ | 88/195 [00:20<00:17, 6.06it/s]
228
 
 
229
  45%|████▌ | 88/195 [00:20<00:17, 6.06it/s]
230
  46%|████▌ | 89/195 [00:21<00:22, 4.62it/s]
231
 
 
232
  46%|████▌ | 89/195 [00:21<00:22, 4.62it/s]
233
 
 
234
  46%|████▌ | 89/195 [00:21<00:22, 4.62it/s]
235
 
 
236
  46%|████▌ | 89/195 [00:21<00:22, 4.62it/s]
237
  47%|████▋ | 92/195 [00:21<00:18, 5.71it/s]
238
 
 
239
  47%|████▋ | 92/195 [00:21<00:18, 5.71it/s]
240
 
 
241
  47%|████▋ | 92/195 [00:21<00:18, 5.71it/s]
242
  48%|████▊ | 94/195 [00:21<00:16, 6.29it/s]
243
 
 
244
  48%|████▊ | 94/195 [00:21<00:16, 6.29it/s]
245
  49%|████▊ | 95/195 [00:22<00:21, 4.69it/s]
246
 
 
247
  49%|████▊ | 95/195 [00:22<00:21, 4.69it/s]
248
 
 
249
  49%|████▊ | 95/195 [00:22<00:21, 4.69it/s]
250
 
 
251
  49%|████▊ | 95/195 [00:22<00:21, 4.69it/s]
252
  50%|█████ | 98/195 [00:22<00:16, 5.77it/s]
253
 
 
254
  50%|█████ | 98/195 [00:22<00:16, 5.77it/s]
255
 
 
256
  50%|█████ | 98/195 [00:22<00:16, 5.77it/s]
257
  51%|█████▏ | 100/195 [00:23<00:14, 6.34it/s]
258
 
 
259
  51%|█████▏ | 100/195 [00:23<00:14, 6.34it/s]
260
  52%|█████▏ | 101/195 [00:23<00:20, 4.67it/s]
261
 
 
262
  52%|█████▏ | 101/195 [00:23<00:20, 4.67it/s]
263
 
 
264
  52%|█████▏ | 101/195 [00:23<00:20, 4.67it/s]
265
 
 
266
  52%|█████▏ | 101/195 [00:23<00:20, 4.67it/s]
267
  53%|█████▎ | 104/195 [00:23<00:15, 5.75it/s]
268
 
 
269
  53%|█████▎ | 104/195 [00:23<00:15, 5.75it/s]
270
 
 
271
  53%|█████▎ | 104/195 [00:23<00:15, 5.75it/s]
272
  54%|█████▍ | 106/195 [00:24<00:14, 6.33it/s]
273
 
 
274
  54%|█████▍ | 106/195 [00:24<00:14, 6.33it/s]
275
  55%|█████▍ | 107/195 [00:24<00:18, 4.69it/s]
276
 
 
277
  55%|█████▍ | 107/195 [00:24<00:18, 4.69it/s]
278
 
 
279
  55%|█████▍ | 107/195 [00:24<00:18, 4.69it/s]
280
 
 
281
  55%|█████▍ | 107/195 [00:24<00:18, 4.69it/s]
282
  56%|█████▋ | 110/195 [00:24<00:14, 5.77it/s]
283
 
 
284
  56%|█████▋ | 110/195 [00:24<00:14, 5.77it/s]
285
 
 
286
  56%|█████▋ | 110/195 [00:24<00:14, 5.77it/s]
287
  57%|█████▋ | 112/195 [00:25<00:13, 6.34it/s]
288
 
 
289
  57%|█████▋ | 112/195 [00:25<00:13, 6.34it/s]
290
  58%|█████▊ | 113/195 [00:25<00:17, 4.65it/s]
291
 
 
292
  58%|█████▊ | 113/195 [00:25<00:17, 4.65it/s]
293
 
 
294
  58%|█████▊ | 113/195 [00:25<00:17, 4.65it/s]
295
 
 
296
  58%|█████▊ | 113/195 [00:25<00:17, 4.65it/s]
297
  59%|█████▉ | 116/195 [00:26<00:13, 5.70it/s]
298
 
 
299
  59%|█████▉ | 116/195 [00:26<00:13, 5.70it/s]
300
 
 
301
  59%|█████▉ | 116/195 [00:26<00:13, 5.70it/s]
302
  61%|██████ | 118/195 [00:26<00:12, 6.22it/s]
303
 
 
304
  61%|██████ | 118/195 [00:26<00:12, 6.22it/s]
305
  61%|██████ | 119/195 [00:26<00:17, 4.47it/s]
306
 
 
307
  61%|██████ | 119/195 [00:26<00:17, 4.47it/s]
308
 
 
309
  61%|██████ | 119/195 [00:26<00:17, 4.47it/s]
310
 
 
311
  61%|██████ | 119/195 [00:26<00:17, 4.47it/s]
312
  63%|██████▎ | 122/195 [00:27<00:13, 5.57it/s]
313
 
 
314
  63%|██████▎ | 122/195 [00:27<00:13, 5.57it/s]
315
 
 
316
  63%|██████▎ | 122/195 [00:27<00:13, 5.57it/s]
317
  64%|██████▎ | 124/195 [00:27<00:11, 6.17it/s]
318
 
 
319
  64%|██████▎ | 124/195 [00:27<00:11, 6.17it/s]
320
  64%|██████▍ | 125/195 [00:27<00:15, 4.56it/s]
321
 
 
322
  64%|██████▍ | 125/195 [00:27<00:15, 4.56it/s]
323
 
 
324
  64%|██████▍ | 125/195 [00:27<00:15, 4.56it/s]
325
 
 
326
  64%|██████▍ | 125/195 [00:28<00:15, 4.56it/s]
327
  66%|██████▌ | 128/195 [00:28<00:11, 5.65it/s]
328
 
 
329
  66%|██████▌ | 128/195 [00:28<00:11, 5.65it/s]
330
 
 
331
  66%|██████▌ | 128/195 [00:28<00:11, 5.65it/s]
332
  67%|██████▋ | 130/195 [00:28<00:10, 6.24it/s]
333
 
 
334
  67%|██████▋ | 130/195 [00:28<00:10, 6.24it/s]
335
  67%|██████▋ | 131/195 [00:29<00:13, 4.60it/s]
336
 
 
337
  67%|██████▋ | 131/195 [00:29<00:13, 4.60it/s]
338
 
 
339
  67%|██████▋ | 131/195 [00:29<00:13, 4.60it/s]
340
 
 
341
  67%|██████▋ | 131/195 [00:29<00:13, 4.60it/s]
342
  69%|██████▊ | 134/195 [00:29<00:10, 5.69it/s]
343
 
 
344
  69%|██████▊ | 134/195 [00:29<00:10, 5.69it/s]
345
 
 
346
  69%|██████▊ | 134/195 [00:29<00:10, 5.69it/s]
347
  70%|██████▉ | 136/195 [00:29<00:09, 6.28it/s]
348
 
 
349
  70%|██████▉ | 136/195 [00:29<00:09, 6.28it/s]
350
  70%|███████ | 137/195 [00:30<00:13, 4.27it/s]
351
 
 
352
  70%|███████ | 137/195 [00:30<00:13, 4.27it/s]
353
 
 
354
  70%|███████ | 137/195 [00:30<00:13, 4.27it/s]
355
 
 
356
  70%|███████ | 137/195 [00:30<00:13, 4.27it/s]
357
  72%|███████▏ | 140/195 [00:30<00:10, 5.33it/s]
358
 
 
359
  72%|███████▏ | 140/195 [00:30<00:10, 5.33it/s]
360
 
 
361
  72%|███████▏ | 140/195 [00:30<00:10, 5.33it/s]
362
  73%|███████▎ | 142/195 [00:30<00:08, 5.93it/s]
363
 
 
364
  73%|███████▎ | 142/195 [00:30<00:08, 5.93it/s]
365
  73%|███████▎ | 143/195 [00:31<00:11, 4.50it/s]
366
 
 
367
  73%|███████▎ | 143/195 [00:31<00:11, 4.50it/s]
368
 
 
369
  73%|███████▎ | 143/195 [00:31<00:11, 4.50it/s]
370
 
 
371
  73%|███████▎ | 143/195 [00:31<00:11, 4.50it/s]
372
  75%|███████▍ | 146/195 [00:31<00:08, 5.60it/s]
373
 
 
374
  75%|███████▍ | 146/195 [00:31<00:08, 5.60it/s]
375
 
 
376
  75%|███████▍ | 146/195 [00:31<00:08, 5.60it/s]
377
  76%|███████▌ | 148/195 [00:31<00:07, 6.20it/s]
378
 
 
379
  76%|███████▌ | 148/195 [00:31<00:07, 6.20it/s]
380
  76%|███████▋ | 149/195 [00:32<00:10, 4.39it/s]
381
 
 
382
  76%|███████▋ | 149/195 [00:32<00:10, 4.39it/s]
383
 
 
384
  76%|███████▋ | 149/195 [00:32<00:10, 4.39it/s]
385
 
 
386
  76%|███████▋ | 149/195 [00:32<00:10, 4.39it/s]
387
  78%|███████▊ | 152/195 [00:32<00:07, 5.50it/s]
388
 
 
389
  78%|███████▊ | 152/195 [00:32<00:07, 5.50it/s]
390
 
 
391
  78%|███████▊ | 152/195 [00:32<00:07, 5.50it/s]
392
 
 
393
  78%|███████▊ | 152/195 [00:32<00:07, 5.50it/s]
394
  79%|███████▉ | 155/195 [00:33<00:06, 6.52it/s]
395
 
 
396
  79%|███████▉ | 155/195 [00:33<00:06, 6.52it/s]
397
  80%|████████ | 156/195 [00:33<00:08, 4.86it/s]
398
 
 
399
  80%|████████ | 156/195 [00:33<00:08, 4.86it/s]
400
 
 
401
  80%|████████ | 156/195 [00:33<00:08, 4.86it/s]
402
 
 
403
  80%|████████ | 156/195 [00:33<00:08, 4.86it/s]
404
  82%|████████▏ | 159/195 [00:33<00:06, 5.83it/s]
405
 
 
406
  82%|████████▏ | 159/195 [00:33<00:06, 5.83it/s]
407
 
 
408
  82%|████████▏ | 159/195 [00:33<00:06, 5.83it/s]
409
  83%|████████▎ | 161/195 [00:34<00:05, 6.30it/s]
410
 
 
411
  83%|████████▎ | 161/195 [00:34<00:05, 6.30it/s]
412
  83%|████████▎ | 162/195 [00:34<00:08, 4.00it/s]
413
 
 
414
  83%|████████▎ | 162/195 [00:34<00:08, 4.00it/s]
415
 
 
416
  83%|████████▎ | 162/195 [00:34<00:08, 4.00it/s]
417
 
 
418
  83%|████████▎ | 162/195 [00:35<00:08, 4.00it/s]
419
  85%|████████▍ | 165/195 [00:35<00:05, 5.09it/s]
420
 
 
421
  85%|████████▍ | 165/195 [00:35<00:05, 5.09it/s]
422
 
 
423
  85%|████████▍ | 165/195 [00:35<00:05, 5.09it/s]
424
  86%|████████▌ | 167/195 [00:35<00:04, 5.72it/s]
425
 
 
426
  86%|████████▌ | 167/195 [00:35<00:04, 5.72it/s]
427
  86%|████████▌ | 168/195 [00:36<00:06, 4.25it/s]
428
 
 
429
  86%|████████▌ | 168/195 [00:36<00:06, 4.25it/s]
430
 
 
431
  86%|████████▌ | 168/195 [00:36<00:06, 4.25it/s]
432
 
 
433
  86%|████████▌ | 168/195 [00:36<00:06, 4.25it/s]
434
  88%|████████▊ | 171/195 [00:36<00:04, 5.34it/s]
435
 
 
436
  88%|████████▊ | 171/195 [00:36<00:04, 5.34it/s]
437
 
 
438
  88%|████████▊ | 171/195 [00:36<00:04, 5.34it/s]
439
  89%|████████▊ | 173/195 [00:36<00:03, 5.95it/s]
440
 
 
441
  89%|████████▊ | 173/195 [00:36<00:03, 5.95it/s]
442
  89%|████████▉ | 174/195 [00:37<00:04, 4.39it/s]
443
 
 
444
  89%|████████▉ | 174/195 [00:37<00:04, 4.39it/s]
445
 
 
446
  89%|████████▉ | 174/195 [00:37<00:04, 4.39it/s]
447
 
 
448
  89%|████████▉ | 174/195 [00:37<00:04, 4.39it/s]
449
  91%|█████████ | 177/195 [00:37<00:03, 5.50it/s]
450
 
 
451
  91%|█████████ | 177/195 [00:37<00:03, 5.50it/s]
452
 
 
453
  91%|█████████ | 177/195 [00:37<00:03, 5.50it/s]
454
  92%|█████████▏| 179/195 [00:37<00:02, 6.11it/s]
455
 
 
456
  92%|█████████▏| 179/195 [00:37<00:02, 6.11it/s]
457
  92%|█████████▏| 180/195 [00:38<00:03, 4.52it/s]
458
 
 
459
  92%|█████████▏| 180/195 [00:38<00:03, 4.52it/s]
460
 
 
461
  92%|█████████▏| 180/195 [00:38<00:03, 4.52it/s]
462
 
 
463
  92%|█████████▏| 180/195 [00:38<00:03, 4.52it/s]
464
  94%|█████████▍| 183/195 [00:38<00:02, 5.62it/s]
465
 
 
466
  94%|█████████▍| 183/195 [00:38<00:02, 5.62it/s]
467
 
 
468
  94%|█████████▍| 183/195 [00:38<00:02, 5.62it/s]
469
  95%|█████████▍| 185/195 [00:38<00:01, 6.21it/s]
470
 
 
471
  95%|█████████▍| 185/195 [00:38<00:01, 6.21it/s]
472
  95%|█████████▌| 186/195 [00:39<00:02, 4.07it/s]
473
 
 
474
  95%|█████████▌| 186/195 [00:39<00:02, 4.07it/s]
475
 
 
476
  95%|█████████▌| 186/195 [00:39<00:02, 4.07it/s]
477
 
 
478
  95%|█████████▌| 186/195 [00:39<00:02, 4.07it/s]
479
  97%|█████████▋| 189/195 [00:39<00:01, 5.21it/s]
480
 
 
481
  97%|█████████▋| 189/195 [00:39<00:01, 5.21it/s]
482
 
 
483
  97%|█████████▋| 189/195 [00:39<00:01, 5.21it/s]
484
  98%|█████████▊| 191/195 [00:40<00:00, 5.85it/s]
485
 
 
486
  98%|█████████▊| 191/195 [00:40<00:00, 5.85it/s]
487
  98%|█████████▊| 192/195 [00:40<00:00, 4.37it/s]
488
 
 
489
  98%|█████████▊| 192/195 [00:40<00:00, 4.37it/s]
490
 
 
491
  98%|█████████▊| 192/195 [00:40<00:00, 4.37it/s]
492
 
 
493
  98%|█████████▊| 192/195 [00:40<00:00, 4.37it/s]
 
 
 
 
 
 
 
 
 
 
 
1
+ /home/msyu/workspace/venv/bin/python -m mlc_llm gen_config /tmp/tmpy7oe9l51/repo --quantization q0f32 --conv-template phi-3 --output /tmp/tmptqlm3cdw
2
+ [2024-05-08 13:34:15] INFO auto_config.py:115: Found model configuration: /tmp/tmpy7oe9l51/repo/config.json
3
+ [2024-05-08 13:34:15] INFO auto_config.py:153: Found model type: phi3. Use `--model-type` to override.
4
+ [2024-05-08 13:34:15] INFO phi3_model.py:53: context_window_size not found in config.json. Falling back to max_position_embeddings (4096)
5
+ [2024-05-08 13:34:15] INFO phi3_model.py:68: prefill_chunk_size defaults to 2048
6
+ [2024-05-08 13:34:15] INFO config.py:106: Overriding max_batch_size from 1 to 80
7
+ [2024-05-08 13:34:15] INFO gen_config.py:255: [generation_config.json] Setting bos_token_id: 1
8
+ [2024-05-08 13:34:15] INFO gen_config.py:255: [generation_config.json] Setting eos_token_id: [32000, 32001, 32007]
9
+ [2024-05-08 13:34:15] INFO gen_config.py:255: [generation_config.json] Setting pad_token_id: 32000
10
+ [2024-05-08 13:34:15] INFO gen_config.py:267: Found tokenizer config: /tmp/tmpy7oe9l51/repo/tokenizer.model. Copying to /tmp/tmptqlm3cdw/tokenizer.model
11
+ [2024-05-08 13:34:15] INFO gen_config.py:267: Found tokenizer config: /tmp/tmpy7oe9l51/repo/tokenizer.json. Copying to /tmp/tmptqlm3cdw/tokenizer.json
12
+ [2024-05-08 13:34:15] INFO gen_config.py:269: Not found tokenizer config: /tmp/tmpy7oe9l51/repo/vocab.json
13
+ [2024-05-08 13:34:15] INFO gen_config.py:269: Not found tokenizer config: /tmp/tmpy7oe9l51/repo/merges.txt
14
+ [2024-05-08 13:34:15] INFO gen_config.py:267: Found tokenizer config: /tmp/tmpy7oe9l51/repo/added_tokens.json. Copying to /tmp/tmptqlm3cdw/added_tokens.json
15
+ [2024-05-08 13:34:15] INFO gen_config.py:267: Found tokenizer config: /tmp/tmpy7oe9l51/repo/tokenizer_config.json. Copying to /tmp/tmptqlm3cdw/tokenizer_config.json
16
+ [2024-05-08 13:34:15] INFO gen_config.py:80: [System default] Setting temperature: 0.7
17
+ [2024-05-08 13:34:15] INFO gen_config.py:80: [System default] Setting presence_penalty: 0.0
18
+ [2024-05-08 13:34:15] INFO gen_config.py:80: [System default] Setting frequency_penalty: 0.0
19
+ [2024-05-08 13:34:15] INFO gen_config.py:80: [System default] Setting repetition_penalty: 1.0
20
+ [2024-05-08 13:34:15] INFO gen_config.py:80: [System default] Setting top_p: 0.95
21
+ [2024-05-08 13:34:15] INFO gen_config.py:80: [System default] Setting mean_gen_len: 128
22
+ [2024-05-08 13:34:15] INFO gen_config.py:80: [System default] Setting max_gen_len: 512
23
+ [2024-05-08 13:34:15] INFO gen_config.py:80: [System default] Setting shift_fill_factor: 0.3
24
+ [2024-05-08 13:34:15] INFO gen_config.py:335: Dumping configuration file to: /tmp/tmptqlm3cdw/mlc-chat-config.json
25
+ /home/msyu/workspace/venv/bin/python -m mlc_llm convert_weight /tmp/tmpy7oe9l51/repo --quantization q0f32 --source-format auto --output /tmp/tmptqlm3cdw
26
+ [2024-05-08 13:34:16] INFO auto_config.py:115: Found model configuration: /tmp/tmpy7oe9l51/repo/config.json
27
+ [2024-05-08 13:34:16] INFO auto_device.py:79: Found device: cuda:0
28
+ [2024-05-08 13:34:17] INFO auto_device.py:88: Not found device: rocm:0
29
+ [2024-05-08 13:34:18] INFO auto_device.py:88: Not found device: metal:0
30
+ [2024-05-08 13:34:18] INFO auto_device.py:88: Not found device: vulkan:0
31
+ [2024-05-08 13:34:19] INFO auto_device.py:79: Found device: opencl:0
32
+ [2024-05-08 13:34:19] INFO auto_device.py:35: Using device: cuda:0
33
+ [2024-05-08 13:34:19] INFO auto_weight.py:70: Finding weights in: /tmp/tmpy7oe9l51/repo
34
+ [2024-05-08 13:34:19] INFO auto_weight.py:136: Not found Huggingface PyTorch
35
+ [2024-05-08 13:34:19] INFO auto_weight.py:143: Found source weight format: huggingface-safetensor. Source configuration: /tmp/tmpy7oe9l51/repo/model.safetensors.index.json
36
+ [2024-05-08 13:34:19] INFO auto_weight.py:106: Using source weight configuration: /tmp/tmpy7oe9l51/repo/model.safetensors.index.json. Use `--source` to override.
37
+ [2024-05-08 13:34:19] INFO auto_weight.py:110: Using source weight format: huggingface-safetensor. Use `--source-format` to override.
38
+ [2024-05-08 13:34:19] INFO auto_config.py:153: Found model type: phi3. Use `--model-type` to override.
39
+ [2024-05-08 13:34:19] INFO phi3_model.py:53: context_window_size not found in config.json. Falling back to max_position_embeddings (4096)
40
+ [2024-05-08 13:34:19] INFO phi3_model.py:68: prefill_chunk_size defaults to 2048
41
+ Weight conversion with arguments:
42
+ --config /tmp/tmpy7oe9l51/repo/config.json
43
+ --quantization NoQuantize(name='q0f32', kind='no-quant', model_dtype='float32')
44
+ --model-type phi3
45
+ --device cuda:0
46
+ --source /tmp/tmpy7oe9l51/repo/model.safetensors.index.json
47
+ --source-format huggingface-safetensor
48
+ --output /tmp/tmptqlm3cdw
49
+ Start storing to cache /tmp/tmptqlm3cdw
50
+
51
  0%| | 0/195 [00:00<?, ?it/s]
52
 
53
+
54
  0%| | 0/195 [00:00<?, ?it/s]
55
 
56
+
57
  0%| | 0/195 [00:01<?, ?it/s]/home/msyu/workspace/venv/lib/python3.10/site-packages/numpy/core/getlimits.py:549: UserWarning: The value of the smallest subnormal for <class 'numpy.float32'> type is zero.
58
+ setattr(self, word, getattr(machar, word).flat[0])
59
+ /home/msyu/workspace/venv/lib/python3.10/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for <class 'numpy.float32'> type is zero.
60
+ return self._float_to_str(self.smallest_subnormal)
61
+
62
  1%| | 1/195 [00:02<07:35, 2.35s/it]
63
 
64
+
65
  1%| | 1/195 [00:02<07:35, 2.35s/it]
66
 
67
+
68
  1%| | 1/195 [00:02<07:35, 2.35s/it]
69
  2%|▏ | 3/195 [00:02<02:14, 1.43it/s]
70
 
71
+
72
  2%|▏ | 3/195 [00:02<02:14, 1.43it/s]
73
  2%|▏ | 4/195 [00:03<01:58, 1.61it/s]
74
 
75
+
76
  2%|▏ | 4/195 [00:03<01:58, 1.61it/s]
77
 
78
+
79
  2%|▏ | 4/195 [00:03<01:58, 1.61it/s]
80
  3%|▎ | 6/195 [00:03<01:11, 2.64it/s]
81
 
82
+
83
  3%|▎ | 6/195 [00:03<01:11, 2.64it/s]
84
 
85
+
86
  3%|▎ | 6/195 [00:03<01:11, 2.64it/s]
87
  4%|▍ | 8/195 [00:03<00:50, 3.69it/s]
88
 
89
+
90
  4%|▍ | 8/195 [00:03<00:50, 3.69it/s]
91
  5%|▍ | 9/195 [00:04<00:58, 3.16it/s]
92
 
93
+
94
  5%|▍ | 9/195 [00:04<00:58, 3.16it/s]
95
 
96
+
97
  5%|▍ | 9/195 [00:04<00:58, 3.16it/s]
98
 
99
+
100
  5%|▍ | 9/195 [00:04<00:58, 3.16it/s]
101
  6%|▌ | 12/195 [00:04<00:39, 4.64it/s]
102
 
103
+
104
  6%|▌ | 12/195 [00:04<00:39, 4.64it/s]
105
 
106
+
107
  6%|▌ | 12/195 [00:04<00:39, 4.64it/s]
108
  7%|▋ | 14/195 [00:04<00:33, 5.41it/s]
109
 
110
+
111
  7%|▋ | 14/195 [00:04<00:33, 5.41it/s]
112
  8%|▊ | 15/195 [00:05<00:42, 4.21it/s]
113
 
114
+
115
  8%|▊ | 15/195 [00:05<00:42, 4.21it/s]
116
 
117
+
118
  8%|▊ | 15/195 [00:05<00:42, 4.21it/s]
119
 
120
+
121
  8%|▊ | 15/195 [00:05<00:42, 4.21it/s]
122
  9%|▉ | 18/195 [00:05<00:32, 5.42it/s]
123
 
124
+
125
  9%|▉ | 18/195 [00:05<00:32, 5.42it/s]
126
 
127
+
128
  9%|▉ | 18/195 [00:05<00:32, 5.42it/s]
129
  10%|█ | 20/195 [00:05<00:28, 6.06it/s]
130
 
131
+
132
  10%|█ | 20/195 [00:05<00:28, 6.06it/s]
133
  11%|█ | 21/195 [00:06<00:37, 4.59it/s]
134
 
135
+
136
  11%|█ | 21/195 [00:06<00:37, 4.59it/s]
137
 
138
+
139
  11%|█ | 21/195 [00:06<00:37, 4.59it/s]
140
 
141
+
142
  11%|█ | 21/195 [00:06<00:37, 4.59it/s]
143
  12%|█▏ | 24/195 [00:06<00:29, 5.72it/s]
144
 
145
+
146
  12%|█▏ | 24/195 [00:06<00:29, 5.72it/s]
147
 
148
+
149
  12%|█▏ | 24/195 [00:06<00:29, 5.72it/s]
150
  13%|█▎ | 26/195 [00:06<00:26, 6.30it/s]
151
 
152
+
153
  13%|█▎ | 26/195 [00:06<00:26, 6.30it/s]
154
  14%|█▍ | 27/195 [00:07<00:37, 4.54it/s]
155
 
156
+
157
  14%|█▍ | 27/195 [00:07<00:37, 4.54it/s]
158
 
159
+
160
  14%|█▍ | 27/195 [00:07<00:37, 4.54it/s]
161
 
162
+
163
  14%|█▍ | 27/195 [00:07<00:37, 4.54it/s]
164
  15%|█▌ | 30/195 [00:07<00:29, 5.66it/s]
165
 
166
+
167
  15%|█▌ | 30/195 [00:07<00:29, 5.66it/s]
168
 
169
+
170
  15%|█▌ | 30/195 [00:07<00:29, 5.66it/s]
171
  16%|█▋ | 32/195 [00:07<00:26, 6.24it/s]
172
 
173
+
174
  16%|█▋ | 32/195 [00:07<00:26, 6.24it/s]
175
  17%|█▋ | 33/195 [00:08<00:36, 4.46it/s]
176
 
177
+
178
  17%|█▋ | 33/195 [00:08<00:36, 4.46it/s]
179
 
180
+
181
  17%|█▋ | 33/195 [00:08<00:36, 4.46it/s]
182
 
183
+
184
  17%|█▋ | 33/195 [00:08<00:36, 4.46it/s]
185
  18%|█▊ | 36/195 [00:08<00:28, 5.59it/s]
186
 
187
+
188
  18%|█▊ | 36/195 [00:08<00:28, 5.59it/s]
189
 
190
+
191
  18%|█▊ | 36/195 [00:08<00:28, 5.59it/s]
192
  19%|█▉ | 38/195 [00:09<00:30, 5.13it/s]
193
 
194
+
195
  19%|█▉ | 38/195 [00:09<00:30, 5.13it/s]
196
  20%|██ | 39/195 [00:09<00:39, 3.90it/s]
197
 
198
+
199
  20%|██ | 39/195 [00:09<00:39, 3.90it/s]
200
 
201
+
202
  20%|██ | 39/195 [00:09<00:39, 3.90it/s]
203
 
204
+
205
  20%|██ | 39/195 [00:09<00:39, 3.90it/s]
206
  22%|██▏ | 42/195 [00:10<00:30, 5.06it/s]
207
 
208
+
209
  22%|██▏ | 42/195 [00:10<00:30, 5.06it/s]
210
 
211
+
212
  22%|██▏ | 42/195 [00:10<00:30, 5.06it/s]
213
  23%|██▎ | 44/195 [00:10<00:26, 5.71it/s]
214
 
215
+
216
  23%|██▎ | 44/195 [00:10<00:26, 5.71it/s]
217
  23%|██▎ | 45/195 [00:10<00:35, 4.21it/s]
218
 
219
+
220
  23%|██▎ | 45/195 [00:10<00:35, 4.21it/s]
221
 
222
+
223
  23%|██▎ | 45/195 [00:10<00:35, 4.21it/s]
224
 
225
+
226
  23%|██▎ | 45/195 [00:10<00:35, 4.21it/s]
227
  25%|██▍ | 48/195 [00:11<00:27, 5.34it/s]
228
 
229
+
230
  25%|██▍ | 48/195 [00:11<00:27, 5.34it/s]
231
 
232
+
233
  25%|██▍ | 48/195 [00:11<00:27, 5.34it/s]
234
  26%|██▌ | 50/195 [00:11<00:24, 5.96it/s]
235
 
236
+
237
  26%|██▌ | 50/195 [00:11<00:24, 5.96it/s]
238
  26%|██▌ | 51/195 [00:12<00:33, 4.29it/s]
239
 
240
+
241
  26%|██▌ | 51/195 [00:12<00:33, 4.29it/s]
242
 
243
+
244
  26%|██▌ | 51/195 [00:12<00:33, 4.29it/s]
245
 
246
+
247
  26%|██▌ | 51/195 [00:12<00:33, 4.29it/s]
248
  28%|██▊ | 54/195 [00:12<00:25, 5.43it/s]
249
 
250
+
251
  28%|██▊ | 54/195 [00:12<00:25, 5.43it/s]
252
 
253
+
254
  28%|██▊ | 54/195 [00:12<00:25, 5.43it/s]
255
  29%|██▊ | 56/195 [00:12<00:23, 6.03it/s]
256
 
257
+
258
  29%|██▊ | 56/195 [00:12<00:23, 6.03it/s]
259
  29%|██▉ | 57/195 [00:13<00:32, 4.28it/s]
260
 
261
+
262
  29%|██▉ | 57/195 [00:13<00:32, 4.28it/s]
263
 
264
+
265
  29%|██▉ | 57/195 [00:13<00:32, 4.28it/s]
266
 
267
+
268
  29%|██▉ | 57/195 [00:13<00:32, 4.28it/s]
269
  31%|███ | 60/195 [00:13<00:24, 5.42it/s]
270
 
271
+
272
  31%|███ | 60/195 [00:13<00:24, 5.42it/s]
273
 
274
+
275
  31%|███ | 60/195 [00:13<00:24, 5.42it/s]
276
  32%|███▏ | 62/195 [00:13<00:22, 6.02it/s]
277
 
278
+
279
  32%|███▏ | 62/195 [00:13<00:22, 6.02it/s]
280
  32%|███▏ | 63/195 [00:14<00:44, 2.96it/s]
281
 
282
+
283
  32%|███▏ | 63/195 [00:14<00:44, 2.96it/s]
284
 
285
+
286
  32%|███▏ | 63/195 [00:14<00:44, 2.96it/s]
287
 
288
+
289
  32%|███▏ | 63/195 [00:15<00:44, 2.96it/s]
290
  34%|███▍ | 66/195 [00:15<00:31, 4.05it/s]
291
 
292
+
293
  34%|███▍ | 66/195 [00:15<00:31, 4.05it/s]
294
 
295
+
296
  34%|███▍ | 66/195 [00:15<00:31, 4.05it/s]
297
 
298
+
299
  34%|███▍ | 66/195 [00:15<00:31, 4.05it/s]
300
 
301
+
302
  34%|███▍ | 66/195 [00:16<00:31, 4.05it/s]
303
  35%|███▍ | 68/195 [00:17<01:01, 2.08it/s]
304
 
305
+
306
  35%|███▍ | 68/195 [00:17<01:01, 2.08it/s]
307
 
308
+
309
  35%|███▍ | 68/195 [00:17<01:01, 2.08it/s]
310
  36%|███▌ | 70/195 [00:17<00:47, 2.65it/s]
311
 
312
+
313
  36%|███▌ | 70/195 [00:17<00:47, 2.65it/s]
314
  36%|███▋ | 71/195 [00:18<00:48, 2.55it/s]
315
 
316
+
317
  36%|███▋ | 71/195 [00:18<00:48, 2.55it/s]
318
 
319
+
320
  36%|███▋ | 71/195 [00:18<00:48, 2.55it/s]
321
 
322
+
323
  36%|███▋ | 71/195 [00:18<00:48, 2.55it/s]
324
  38%|███▊ | 74/195 [00:18<00:33, 3.61it/s]
325
 
326
+
327
  38%|███▊ | 74/195 [00:18<00:33, 3.61it/s]
328
 
329
+
330
  38%|███▊ | 74/195 [00:18<00:33, 3.61it/s]
331
  39%|███▉ | 76/195 [00:18<00:27, 4.32it/s]
332
 
333
+
334
  39%|███▉ | 76/195 [00:18<00:27, 4.32it/s]
335
  39%|███▉ | 77/195 [00:19<00:32, 3.67it/s]
336
 
337
+
338
  39%|███▉ | 77/195 [00:19<00:32, 3.67it/s]
339
 
340
+
341
  39%|███▉ | 77/195 [00:19<00:32, 3.67it/s]
342
 
343
+
344
  39%|███▉ | 77/195 [00:19<00:32, 3.67it/s]
345
  41%|████ | 80/195 [00:19<00:23, 4.82it/s]
346
 
347
+
348
  41%|████ | 80/195 [00:19<00:23, 4.82it/s]
349
 
350
+
351
  41%|████ | 80/195 [00:19<00:23, 4.82it/s]
352
  42%|████▏ | 82/195 [00:19<00:20, 5.49it/s]
353
 
354
+
355
  42%|████▏ | 82/195 [00:19<00:20, 5.49it/s]
356
  43%|████▎ | 83/195 [00:20<00:25, 4.33it/s]
357
 
358
+
359
  43%|████▎ | 83/195 [00:20<00:25, 4.33it/s]
360
 
361
+
362
  43%|████▎ | 83/195 [00:20<00:25, 4.33it/s]
363
 
364
+
365
  43%|████▎ | 83/195 [00:20<00:25, 4.33it/s]
366
  44%|████▍ | 86/195 [00:20<00:20, 5.45it/s]
367
 
368
+
369
  44%|████▍ | 86/195 [00:20<00:20, 5.45it/s]
370
 
371
+
372
  44%|████▍ | 86/195 [00:20<00:20, 5.45it/s]
373
  45%|████▌ | 88/195 [00:20<00:17, 6.06it/s]
374
 
375
+
376
  45%|████▌ | 88/195 [00:20<00:17, 6.06it/s]
377
  46%|████▌ | 89/195 [00:21<00:22, 4.62it/s]
378
 
379
+
380
  46%|████▌ | 89/195 [00:21<00:22, 4.62it/s]
381
 
382
+
383
  46%|████▌ | 89/195 [00:21<00:22, 4.62it/s]
384
 
385
+
386
  46%|████▌ | 89/195 [00:21<00:22, 4.62it/s]
387
  47%|████▋ | 92/195 [00:21<00:18, 5.71it/s]
388
 
389
+
390
  47%|████▋ | 92/195 [00:21<00:18, 5.71it/s]
391
 
392
+
393
  47%|████▋ | 92/195 [00:21<00:18, 5.71it/s]
394
  48%|████▊ | 94/195 [00:21<00:16, 6.29it/s]
395
 
396
+
397
  48%|████▊ | 94/195 [00:21<00:16, 6.29it/s]
398
  49%|████▊ | 95/195 [00:22<00:21, 4.69it/s]
399
 
400
+
401
  49%|████▊ | 95/195 [00:22<00:21, 4.69it/s]
402
 
403
+
404
  49%|████▊ | 95/195 [00:22<00:21, 4.69it/s]
405
 
406
+
407
  49%|████▊ | 95/195 [00:22<00:21, 4.69it/s]
408
  50%|█████ | 98/195 [00:22<00:16, 5.77it/s]
409
 
410
+
411
  50%|█████ | 98/195 [00:22<00:16, 5.77it/s]
412
 
413
+
414
  50%|█████ | 98/195 [00:22<00:16, 5.77it/s]
415
  51%|█████▏ | 100/195 [00:23<00:14, 6.34it/s]
416
 
417
+
418
  51%|█████▏ | 100/195 [00:23<00:14, 6.34it/s]
419
  52%|█████▏ | 101/195 [00:23<00:20, 4.67it/s]
420
 
421
+
422
  52%|█████▏ | 101/195 [00:23<00:20, 4.67it/s]
423
 
424
+
425
  52%|█████▏ | 101/195 [00:23<00:20, 4.67it/s]
426
 
427
+
428
  52%|█████▏ | 101/195 [00:23<00:20, 4.67it/s]
429
  53%|█████▎ | 104/195 [00:23<00:15, 5.75it/s]
430
 
431
+
432
  53%|█████▎ | 104/195 [00:23<00:15, 5.75it/s]
433
 
434
+
435
  53%|█████▎ | 104/195 [00:23<00:15, 5.75it/s]
436
  54%|█████▍ | 106/195 [00:24<00:14, 6.33it/s]
437
 
438
+
439
  54%|█████▍ | 106/195 [00:24<00:14, 6.33it/s]
440
  55%|█████▍ | 107/195 [00:24<00:18, 4.69it/s]
441
 
442
+
443
  55%|█████▍ | 107/195 [00:24<00:18, 4.69it/s]
444
 
445
+
446
  55%|█████▍ | 107/195 [00:24<00:18, 4.69it/s]
447
 
448
+
449
  55%|█████▍ | 107/195 [00:24<00:18, 4.69it/s]
450
  56%|█████▋ | 110/195 [00:24<00:14, 5.77it/s]
451
 
452
+
453
  56%|█████▋ | 110/195 [00:24<00:14, 5.77it/s]
454
 
455
+
456
  56%|█████▋ | 110/195 [00:24<00:14, 5.77it/s]
457
  57%|█████▋ | 112/195 [00:25<00:13, 6.34it/s]
458
 
459
+
460
  57%|█████▋ | 112/195 [00:25<00:13, 6.34it/s]
461
  58%|█████▊ | 113/195 [00:25<00:17, 4.65it/s]
462
 
463
+
464
  58%|█████▊ | 113/195 [00:25<00:17, 4.65it/s]
465
 
466
+
467
  58%|█████▊ | 113/195 [00:25<00:17, 4.65it/s]
468
 
469
+
470
  58%|█████▊ | 113/195 [00:25<00:17, 4.65it/s]
471
  59%|█████▉ | 116/195 [00:26<00:13, 5.70it/s]
472
 
473
+
474
  59%|█████▉ | 116/195 [00:26<00:13, 5.70it/s]
475
 
476
+
477
  59%|█████▉ | 116/195 [00:26<00:13, 5.70it/s]
478
  61%|██████ | 118/195 [00:26<00:12, 6.22it/s]
479
 
480
+
481
  61%|██████ | 118/195 [00:26<00:12, 6.22it/s]
482
  61%|██████ | 119/195 [00:26<00:17, 4.47it/s]
483
 
484
+
485
  61%|██████ | 119/195 [00:26<00:17, 4.47it/s]
486
 
487
+
488
  61%|██████ | 119/195 [00:26<00:17, 4.47it/s]
489
 
490
+
491
  61%|██████ | 119/195 [00:26<00:17, 4.47it/s]
492
  63%|██████▎ | 122/195 [00:27<00:13, 5.57it/s]
493
 
494
+
495
  63%|██████▎ | 122/195 [00:27<00:13, 5.57it/s]
496
 
497
+
498
  63%|██████▎ | 122/195 [00:27<00:13, 5.57it/s]
499
  64%|██████▎ | 124/195 [00:27<00:11, 6.17it/s]
500
 
501
+
502
  64%|██████▎ | 124/195 [00:27<00:11, 6.17it/s]
503
  64%|██████▍ | 125/195 [00:27<00:15, 4.56it/s]
504
 
505
+
506
  64%|██████▍ | 125/195 [00:27<00:15, 4.56it/s]
507
 
508
+
509
  64%|██████▍ | 125/195 [00:27<00:15, 4.56it/s]
510
 
511
+
512
  64%|██████▍ | 125/195 [00:28<00:15, 4.56it/s]
513
  66%|██████▌ | 128/195 [00:28<00:11, 5.65it/s]
514
 
515
+
516
  66%|██████▌ | 128/195 [00:28<00:11, 5.65it/s]
517
 
518
+
519
  66%|██████▌ | 128/195 [00:28<00:11, 5.65it/s]
520
  67%|██████▋ | 130/195 [00:28<00:10, 6.24it/s]
521
 
522
+
523
  67%|██████▋ | 130/195 [00:28<00:10, 6.24it/s]
524
  67%|██████▋ | 131/195 [00:29<00:13, 4.60it/s]
525
 
526
+
527
  67%|██████▋ | 131/195 [00:29<00:13, 4.60it/s]
528
 
529
+
530
  67%|██████▋ | 131/195 [00:29<00:13, 4.60it/s]
531
 
532
+
533
  67%|██████▋ | 131/195 [00:29<00:13, 4.60it/s]
534
  69%|██████▊ | 134/195 [00:29<00:10, 5.69it/s]
535
 
536
+
537
  69%|██████▊ | 134/195 [00:29<00:10, 5.69it/s]
538
 
539
+
540
  69%|██████▊ | 134/195 [00:29<00:10, 5.69it/s]
541
  70%|██████▉ | 136/195 [00:29<00:09, 6.28it/s]
542
 
543
+
544
  70%|██████▉ | 136/195 [00:29<00:09, 6.28it/s]
545
  70%|███████ | 137/195 [00:30<00:13, 4.27it/s]
546
 
547
+
548
  70%|███████ | 137/195 [00:30<00:13, 4.27it/s]
549
 
550
+
551
  70%|███████ | 137/195 [00:30<00:13, 4.27it/s]
552
 
553
+
554
  70%|███████ | 137/195 [00:30<00:13, 4.27it/s]
555
  72%|███████▏ | 140/195 [00:30<00:10, 5.33it/s]
556
 
557
+
558
  72%|███████▏ | 140/195 [00:30<00:10, 5.33it/s]
559
 
560
+
561
  72%|███████▏ | 140/195 [00:30<00:10, 5.33it/s]
562
  73%|███████▎ | 142/195 [00:30<00:08, 5.93it/s]
563
 
564
+
565
  73%|███████▎ | 142/195 [00:30<00:08, 5.93it/s]
566
  73%|███████▎ | 143/195 [00:31<00:11, 4.50it/s]
567
 
568
+
569
  73%|███████▎ | 143/195 [00:31<00:11, 4.50it/s]
570
 
571
+
572
  73%|███████▎ | 143/195 [00:31<00:11, 4.50it/s]
573
 
574
+
575
  73%|███████▎ | 143/195 [00:31<00:11, 4.50it/s]
576
  75%|███████▍ | 146/195 [00:31<00:08, 5.60it/s]
577
 
578
+
579
  75%|███████▍ | 146/195 [00:31<00:08, 5.60it/s]
580
 
581
+
582
  75%|███████▍ | 146/195 [00:31<00:08, 5.60it/s]
583
  76%|███████▌ | 148/195 [00:31<00:07, 6.20it/s]
584
 
585
+
586
  76%|███████▌ | 148/195 [00:31<00:07, 6.20it/s]
587
  76%|███████▋ | 149/195 [00:32<00:10, 4.39it/s]
588
 
589
+
590
  76%|███████▋ | 149/195 [00:32<00:10, 4.39it/s]
591
 
592
+
593
  76%|███████▋ | 149/195 [00:32<00:10, 4.39it/s]
594
 
595
+
596
  76%|███████▋ | 149/195 [00:32<00:10, 4.39it/s]
597
  78%|███████▊ | 152/195 [00:32<00:07, 5.50it/s]
598
 
599
+
600
  78%|███████▊ | 152/195 [00:32<00:07, 5.50it/s]
601
 
602
+
603
  78%|███████▊ | 152/195 [00:32<00:07, 5.50it/s]
604
 
605
+
606
  78%|███████▊ | 152/195 [00:32<00:07, 5.50it/s]
607
  79%|███████▉ | 155/195 [00:33<00:06, 6.52it/s]
608
 
609
+
610
  79%|███████▉ | 155/195 [00:33<00:06, 6.52it/s]
611
  80%|████████ | 156/195 [00:33<00:08, 4.86it/s]
612
 
613
+
614
  80%|████████ | 156/195 [00:33<00:08, 4.86it/s]
615
 
616
+
617
  80%|████████ | 156/195 [00:33<00:08, 4.86it/s]
618
 
619
+
620
  80%|████████ | 156/195 [00:33<00:08, 4.86it/s]
621
  82%|████████▏ | 159/195 [00:33<00:06, 5.83it/s]
622
 
623
+
624
  82%|████████▏ | 159/195 [00:33<00:06, 5.83it/s]
625
 
626
+
627
  82%|████████▏ | 159/195 [00:33<00:06, 5.83it/s]
628
  83%|████████▎ | 161/195 [00:34<00:05, 6.30it/s]
629
 
630
+
631
  83%|████████▎ | 161/195 [00:34<00:05, 6.30it/s]
632
  83%|████████▎ | 162/195 [00:34<00:08, 4.00it/s]
633
 
634
+
635
  83%|████████▎ | 162/195 [00:34<00:08, 4.00it/s]
636
 
637
+
638
  83%|████████▎ | 162/195 [00:34<00:08, 4.00it/s]
639
 
640
+
641
  83%|████████▎ | 162/195 [00:35<00:08, 4.00it/s]
642
  85%|████████▍ | 165/195 [00:35<00:05, 5.09it/s]
643
 
644
+
645
  85%|████████▍ | 165/195 [00:35<00:05, 5.09it/s]
646
 
647
+
648
  85%|████████▍ | 165/195 [00:35<00:05, 5.09it/s]
649
  86%|████████▌ | 167/195 [00:35<00:04, 5.72it/s]
650
 
651
+
652
  86%|████████▌ | 167/195 [00:35<00:04, 5.72it/s]
653
  86%|████████▌ | 168/195 [00:36<00:06, 4.25it/s]
654
 
655
+
656
  86%|████████▌ | 168/195 [00:36<00:06, 4.25it/s]
657
 
658
+
659
  86%|████████▌ | 168/195 [00:36<00:06, 4.25it/s]
660
 
661
+
662
  86%|████████▌ | 168/195 [00:36<00:06, 4.25it/s]
663
  88%|████████▊ | 171/195 [00:36<00:04, 5.34it/s]
664
 
665
+
666
  88%|████████▊ | 171/195 [00:36<00:04, 5.34it/s]
667
 
668
+
669
  88%|████████▊ | 171/195 [00:36<00:04, 5.34it/s]
670
  89%|████████▊ | 173/195 [00:36<00:03, 5.95it/s]
671
 
672
+
673
  89%|████████▊ | 173/195 [00:36<00:03, 5.95it/s]
674
  89%|████████▉ | 174/195 [00:37<00:04, 4.39it/s]
675
 
676
+
677
  89%|████████▉ | 174/195 [00:37<00:04, 4.39it/s]
678
 
679
+
680
  89%|████████▉ | 174/195 [00:37<00:04, 4.39it/s]
681
 
682
+
683
  89%|████████▉ | 174/195 [00:37<00:04, 4.39it/s]
684
  91%|█████████ | 177/195 [00:37<00:03, 5.50it/s]
685
 
686
+
687
  91%|█████████ | 177/195 [00:37<00:03, 5.50it/s]
688
 
689
+
690
  91%|█████████ | 177/195 [00:37<00:03, 5.50it/s]
691
  92%|█████████▏| 179/195 [00:37<00:02, 6.11it/s]
692
 
693
+
694
  92%|█████████▏| 179/195 [00:37<00:02, 6.11it/s]
695
  92%|█████████▏| 180/195 [00:38<00:03, 4.52it/s]
696
 
697
+
698
  92%|█████████▏| 180/195 [00:38<00:03, 4.52it/s]
699
 
700
+
701
  92%|█████████▏| 180/195 [00:38<00:03, 4.52it/s]
702
 
703
+
704
  92%|█████████▏| 180/195 [00:38<00:03, 4.52it/s]
705
  94%|█████████▍| 183/195 [00:38<00:02, 5.62it/s]
706
 
707
+
708
  94%|█████████▍| 183/195 [00:38<00:02, 5.62it/s]
709
 
710
+
711
  94%|█████████▍| 183/195 [00:38<00:02, 5.62it/s]
712
  95%|█████████▍| 185/195 [00:38<00:01, 6.21it/s]
713
 
714
+
715
  95%|█████████▍| 185/195 [00:38<00:01, 6.21it/s]
716
  95%|█████████▌| 186/195 [00:39<00:02, 4.07it/s]
717
 
718
+
719
  95%|█████████▌| 186/195 [00:39<00:02, 4.07it/s]
720
 
721
+
722
  95%|█████████▌| 186/195 [00:39<00:02, 4.07it/s]
723
 
724
+
725
  95%|█████████▌| 186/195 [00:39<00:02, 4.07it/s]
726
  97%|█████████▋| 189/195 [00:39<00:01, 5.21it/s]
727
 
728
+
729
  97%|█████████▋| 189/195 [00:39<00:01, 5.21it/s]
730
 
731
+
732
  97%|█████████▋| 189/195 [00:39<00:01, 5.21it/s]
733
  98%|█████████▊| 191/195 [00:40<00:00, 5.85it/s]
734
 
735
+
736
  98%|█████████▊| 191/195 [00:40<00:00, 5.85it/s]
737
  98%|█████████▊| 192/195 [00:40<00:00, 4.37it/s]
738
 
739
+
740
  98%|█████████▊| 192/195 [00:40<00:00, 4.37it/s]
741
 
742
+
743
  98%|█████████▊| 192/195 [00:40<00:00, 4.37it/s]
744
 
745
+
746
  98%|█████████▊| 192/195 [00:40<00:00, 4.37it/s]
747
+ [2024-05-08 13:35:01] INFO huggingface_loader.py:196: Unloading HF weight file: /tmp/tmpy7oe9l51/repo/model-00001-of-00002.safetensors
748
+ [2024-05-08 13:35:01] INFO stats.py:76: Time usage: HF loading: 1.642 sec; Pre-quantization mapping: 2.009 sec; Quantization: 0.000 sec
749
+ [2024-05-08 13:35:01] INFO stats.py:90: RAM usage: Peak RAM: 9.262 GB. Total bytes loaded from disk: 14.235 GB
750
+ [2024-05-08 13:35:01] INFO convert_weight.py:155: Parameter size after quantization: 14.235 GB
751
+ [2024-05-08 13:35:01] INFO convert_weight.py:160: Total parameters: 3,821,079,552
752
+ [2024-05-08 13:35:01] INFO convert_weight.py:161: Bits per parameter: 32.000
753
+ [2024-05-08 13:35:01] INFO convert_weight.py:166: Saved to directory: /tmp/tmptqlm3cdw
754
+
755
+ All finished, 130 total shards committed, record saved to /tmp/tmptqlm3cdw/ndarray-cache.json
756
+ Also saved a bf16 record to /tmp/tmptqlm3cdw/ndarray-cache-b16.json
mlc-chat-config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "phi3",
3
+ "quantization": "q0f32",
4
+ "model_config": {
5
+ "model_type": "phi3",
6
+ "hidden_size": 3072,
7
+ "vocab_size": 32064,
8
+ "num_hidden_layers": 32,
9
+ "num_attention_heads": 32,
10
+ "intermediate_size": 8192,
11
+ "rms_norm_eps": 1e-05,
12
+ "num_key_value_heads": 32,
13
+ "position_embedding_base": 10000.0,
14
+ "context_window_size": 4096,
15
+ "prefill_chunk_size": 2048,
16
+ "head_dim": 96,
17
+ "tensor_parallel_shards": 1,
18
+ "max_batch_size": 80
19
+ },
20
+ "vocab_size": 32064,
21
+ "context_window_size": 4096,
22
+ "sliding_window_size": -1,
23
+ "prefill_chunk_size": 2048,
24
+ "attention_sink_size": -1,
25
+ "tensor_parallel_shards": 1,
26
+ "mean_gen_len": 128,
27
+ "max_gen_len": 512,
28
+ "shift_fill_factor": 0.3,
29
+ "temperature": 0.7,
30
+ "presence_penalty": 0.0,
31
+ "frequency_penalty": 0.0,
32
+ "repetition_penalty": 1.0,
33
+ "top_p": 0.95,
34
+ "conv_template": {
35
+ "name": "phi-3",
36
+ "system_template": "<|system|>\n{system_message}",
37
+ "system_message": "You are a helpful digital assistant. Please provide safe, ethical and accurate information to the user.",
38
+ "system_prefix_token_ids": [
39
+ 1
40
+ ],
41
+ "add_role_after_system_message": true,
42
+ "roles": {
43
+ "user": "<|user|>",
44
+ "assistant": "<|assistant|>"
45
+ },
46
+ "role_templates": {
47
+ "user": "{user_message}",
48
+ "assistant": "{assistant_message}",
49
+ "tool": "{tool_message}"
50
+ },
51
+ "messages": [],
52
+ "seps": [
53
+ "<|end|>\n"
54
+ ],
55
+ "role_content_sep": "\n",
56
+ "role_empty_sep": "\n",
57
+ "stop_str": [
58
+ "<|endoftext|>"
59
+ ],
60
+ "stop_token_ids": [
61
+ 32000,
62
+ 32001,
63
+ 32007
64
+ ],
65
+ "function_string": "",
66
+ "use_function_calling": false
67
+ },
68
+ "pad_token_id": 32000,
69
+ "bos_token_id": 1,
70
+ "eos_token_id": [
71
+ 32000,
72
+ 32001,
73
+ 32007
74
+ ],
75
+ "tokenizer_files": [
76
+ "tokenizer.model",
77
+ "tokenizer.json",
78
+ "added_tokens.json",
79
+ "tokenizer_config.json"
80
+ ],
81
+ "token_table_postproc_method": "byte_fallback",
82
+ "version": "0.1.0"
83
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df40c10192dc1d5fb2a479458331624e60788db5eb0fe0f980dbb12fe145d5ce
3
+ size 197001216
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b4ad850b996123270c49e890d324832aef9ad842b0f085a4174c22c6ea9ac4f
3
+ size 50331648
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:badbb9cb80505c83e58953c232c913bed654cdef67751b6a5b70d5dab8eca86e
3
+ size 56623104
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:207ebe99c8f06f7288e7ba173d6e36084af20f9c8de4e27ba4b52fcc560334a6
3
+ size 18874368
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d2d9322f60c900e0ff3364c1f62a7b0d35efcb3b5840a91c364e37992d466ba
3
+ size 50331648
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:756b23bca7d41c4b433888ab5192f1b650c758de4517763fca3ae6869f559733
3
+ size 100663296
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f8c99368645eb0d21cd6dfb0264c174654e8129977342f5df0fdcd0179007c3
3
+ size 18874368
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:850a3986780bb9c3a1e63de782a12d663aae0a79d3c1f7b249017f36996fced3
3
+ size 56623104
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:568d0db6c28d7b3d6baa666b64345cf2b6836529de0003249bf7e4c8a9bdbcb8
3
+ size 50331648
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7107f3106c0ee833abed7814b83b829966102f26768b47e6b56d141e2c04b393
3
+ size 100663296
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6def91230ee779540606cc520b363ccd4a7a465edafe860ce62675fa62ffc2a4
3
+ size 18874368
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ef70e94a1c3b26fe07d5c8140b2f4dd4f8fd5fc2be2f1077a62f7ec31fd63fa
3
+ size 56623104
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e35c5f8f8e6e21570c43e1ff5d0d52954b7d1e68182f3069f854bbde76358a0
3
+ size 50331648
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eb65496e2e29c9149be95cb2bf60606203e46c7046cd52dae1bc6ac31cbe910
3
+ size 50331648
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35cf2575eee6a7d7d64118137c3aab99579e5572a386a6ccb6388dd932c9ed9f
3
+ size 100663296
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86eb0a68e0f8260a26fdc8901a1e938b90ebdd7f39e5622501232b4b91144920
3
+ size 18874368
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29941b1c4548474d7349ae2d41ec7a090b551e49ae9baa0948420c72c5fe752d
3
+ size 56623104
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76184f2b8c3467da81d709db403f96a676f6deae0e82bc02bb1dca9bd20a3544
3
+ size 50331648
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acd4ffcf9e4789486406d3af35f01e3d24e0c0134cc666ea38a22757a04b5198
3
+ size 100663296
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8c4c6de39b700f2d8883c09af80c2cb554074aed2cc3a566f4b3f3eb4a21942
3
+ size 18874368
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d92740f6f3251b459e7796659f2dfb7c6d571bc83e485d40169480268d4b4517
3
+ size 56623104
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f535eb5e731a9b2f83261e5d16b6e62dc1b581a63e160b47f1f018f042384d75
3
+ size 50331648
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:940a93cd2993ff0e923f289065cd8b5427ca4a33aff3663523be20571f0a5fb9
3
+ size 100663296
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c95f7116592c307a1595d8887823ee034b7944bf13c2780eca78e0b338b297c
3
+ size 18874368
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4b455769067c13c1e5f3702d706acd54280c7b500341d0035cad9b1a319b2cd
3
+ size 100663296
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e24163d1d43008028d92397784b9ba3b9c58010df8e12714936c07f58a404518
3
+ size 56623104
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40876c08372b681f538e4bc69e67d16b8a64a4bd550fc79bd2d542b6fa629d4c
3
+ size 50331648
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16c52e0ce73001358aea309436290c1e3bbfccd70fd2bcadd1338f39acb4676f
3
+ size 100663296
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4524d9a09a673e8da60d27a1a67c83db7d24328a4ce3492bcc4f9fd145915af8
3
+ size 18874368
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54217b91a8efb4783c40b3e656d88817119c62b0f048c077bb6c20073f8195fb
3
+ size 56623104
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd7b2cec79a4030e9b409d26b79f90699ff5d28a2231131b8a7384b7e1618992
3
+ size 50331648
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:795f480da5b514707722f6fbe61c1a673fe0abe660f5e6ededb1135c69255f80
3
+ size 100663296
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f32e96798292d13375e6cb5552b9a103e3480711b38abcf2dc7c6766c821c2d
3
+ size 18874368
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62a0766014a78e224a4b9d4e5b6003fed054026b8323bcab1e5a212cba92fa01
3
+ size 56623104
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:411a07a5a91c9fdccc790a8c3fff772dcf54e4b03e785143c181ffab2a4a2574
3
+ size 19273728
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b946c82d0b0f6443fc055c5e003f071e7aeb7cc8b24b5fbd7b7b35aeaa2c011
3
+ size 18874368
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e309714d37f4b9aa563cc3eab2db1ab37bdafb6794e9d1d8de000d9b0e57b58
3
+ size 56623104
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4102c4beb346759b4a31ba3354065fd51c33e42fa0b37f0468e7c7425e41ad30
3
+ size 50331648
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03db7cd6203ddf201640a3e40d882d8018c8a33c2c3f93677dbfae99fbbc2c19
3
+ size 100663296
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:030014e969aab1f7481055a88259693df5692e1c9915a82dade58b74b44198e8
3
+ size 18874368
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfa919d46d844ae86da262825c2f198e286d903127bf0d8a01b3717a4fbb4795
3
+ size 56623104
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0891fb0de46c30c2bcd54f23dc8abf76e2d1ac3e6d580757284c9ea8485441b
3
+ size 50331648
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30af31bad6d767386c3da1b59187ba23e7d0350e485cfcb5585c5bc2305e7470
3
+ size 100663296
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:326512b72da0579fa64dc0ce9259ca4f3a410f5f8efe75c2269c0f594de1b64c
3
+ size 100663296
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b19c200637a7c08a44919b66687e67100c2e76ef192fee8ec2692bdea4c8a3f2
3
+ size 18874368