sy1998 committed on
Commit
38fccd8
1 Parent(s): e98ef20

Delete VideoXL_weight_8

Browse files
VideoXL_weight_8/config.json DELETED
@@ -1,880 +0,0 @@
1
- {
2
- "_name_or_path": "/share/junjie/shuyan/Qwen2-7B-Instruct",
3
- "architectures": [
4
- "LlavaQwenForCausalLM"
5
- ],
6
- "attention_dropout": 0.0,
7
- "beacon_accum": true,
8
- "beacon_attend_prev": true,
9
- "beacon_attn": "full-coverage",
10
- "beacon_embed_init": "eos",
11
- "beacon_parallel_window": 1,
12
- "beacon_param": [
13
- "q",
14
- "k",
15
- "v"
16
- ],
17
- "beacon_pos": "interleave",
18
- "beacon_ratio": [
19
- 2,
20
- 4,
21
- 8
22
- ],
23
- "beacon_ratio_mix": "step-random",
24
- "beacon_sink_size": 0,
25
- "beacon_stride": 1440,
26
- "beacon_window": 1440,
27
- "bos_token_id": 151643,
28
- "enable_beacon": true,
29
- "eos_token_id": 151645,
30
- "freeze_mm_mlp_adapter": false,
31
- "freeze_mm_vision_resampler": false,
32
- "hidden_act": "silu",
33
- "hidden_size": 3584,
34
- "image_aspect_ratio": "anyres",
35
- "image_crop_resolution": null,
36
- "image_grid_pinpoints": [
37
- [
38
- 336,
39
- 672
40
- ],
41
- [
42
- 336,
43
- 1008
44
- ],
45
- [
46
- 336,
47
- 1344
48
- ],
49
- [
50
- 336,
51
- 1680
52
- ],
53
- [
54
- 336,
55
- 2016
56
- ],
57
- [
58
- 336,
59
- 2352
60
- ],
61
- [
62
- 336,
63
- 2688
64
- ],
65
- [
66
- 336,
67
- 3024
68
- ],
69
- [
70
- 336,
71
- 3360
72
- ],
73
- [
74
- 336,
75
- 3696
76
- ],
77
- [
78
- 336,
79
- 4032
80
- ],
81
- [
82
- 336,
83
- 4368
84
- ],
85
- [
86
- 336,
87
- 4704
88
- ],
89
- [
90
- 336,
91
- 5040
92
- ],
93
- [
94
- 336,
95
- 5376
96
- ],
97
- [
98
- 336,
99
- 5712
100
- ],
101
- [
102
- 336,
103
- 6048
104
- ],
105
- [
106
- 336,
107
- 6384
108
- ],
109
- [
110
- 336,
111
- 6720
112
- ],
113
- [
114
- 336,
115
- 7056
116
- ],
117
- [
118
- 336,
119
- 7392
120
- ],
121
- [
122
- 336,
123
- 7728
124
- ],
125
- [
126
- 336,
127
- 8064
128
- ],
129
- [
130
- 336,
131
- 8400
132
- ],
133
- [
134
- 336,
135
- 8736
136
- ],
137
- [
138
- 336,
139
- 9072
140
- ],
141
- [
142
- 336,
143
- 9408
144
- ],
145
- [
146
- 336,
147
- 9744
148
- ],
149
- [
150
- 336,
151
- 10080
152
- ],
153
- [
154
- 336,
155
- 10416
156
- ],
157
- [
158
- 336,
159
- 10752
160
- ],
161
- [
162
- 336,
163
- 11088
164
- ],
165
- [
166
- 336,
167
- 11424
168
- ],
169
- [
170
- 336,
171
- 11760
172
- ],
173
- [
174
- 336,
175
- 12096
176
- ],
177
- [
178
- 336,
179
- 12432
180
- ],
181
- [
182
- 336,
183
- 12768
184
- ],
185
- [
186
- 336,
187
- 13104
188
- ],
189
- [
190
- 336,
191
- 13440
192
- ],
193
- [
194
- 336,
195
- 13776
196
- ],
197
- [
198
- 336,
199
- 14112
200
- ],
201
- [
202
- 336,
203
- 14448
204
- ],
205
- [
206
- 336,
207
- 14784
208
- ],
209
- [
210
- 336,
211
- 15120
212
- ],
213
- [
214
- 336,
215
- 15456
216
- ],
217
- [
218
- 336,
219
- 15792
220
- ],
221
- [
222
- 336,
223
- 16128
224
- ],
225
- [
226
- 336,
227
- 16464
228
- ],
229
- [
230
- 672,
231
- 336
232
- ],
233
- [
234
- 672,
235
- 672
236
- ],
237
- [
238
- 672,
239
- 1008
240
- ],
241
- [
242
- 672,
243
- 1344
244
- ],
245
- [
246
- 672,
247
- 1680
248
- ],
249
- [
250
- 672,
251
- 2016
252
- ],
253
- [
254
- 672,
255
- 2352
256
- ],
257
- [
258
- 672,
259
- 2688
260
- ],
261
- [
262
- 672,
263
- 3024
264
- ],
265
- [
266
- 672,
267
- 3360
268
- ],
269
- [
270
- 672,
271
- 3696
272
- ],
273
- [
274
- 672,
275
- 4032
276
- ],
277
- [
278
- 672,
279
- 4368
280
- ],
281
- [
282
- 672,
283
- 4704
284
- ],
285
- [
286
- 672,
287
- 5040
288
- ],
289
- [
290
- 672,
291
- 5376
292
- ],
293
- [
294
- 672,
295
- 5712
296
- ],
297
- [
298
- 672,
299
- 6048
300
- ],
301
- [
302
- 672,
303
- 6384
304
- ],
305
- [
306
- 672,
307
- 6720
308
- ],
309
- [
310
- 672,
311
- 7056
312
- ],
313
- [
314
- 672,
315
- 7392
316
- ],
317
- [
318
- 672,
319
- 7728
320
- ],
321
- [
322
- 672,
323
- 8064
324
- ],
325
- [
326
- 1008,
327
- 336
328
- ],
329
- [
330
- 1008,
331
- 672
332
- ],
333
- [
334
- 1008,
335
- 1008
336
- ],
337
- [
338
- 1008,
339
- 1344
340
- ],
341
- [
342
- 1008,
343
- 1680
344
- ],
345
- [
346
- 1008,
347
- 2016
348
- ],
349
- [
350
- 1008,
351
- 2352
352
- ],
353
- [
354
- 1008,
355
- 2688
356
- ],
357
- [
358
- 1008,
359
- 3024
360
- ],
361
- [
362
- 1008,
363
- 3360
364
- ],
365
- [
366
- 1008,
367
- 3696
368
- ],
369
- [
370
- 1008,
371
- 4032
372
- ],
373
- [
374
- 1008,
375
- 4368
376
- ],
377
- [
378
- 1008,
379
- 4704
380
- ],
381
- [
382
- 1008,
383
- 5040
384
- ],
385
- [
386
- 1008,
387
- 5376
388
- ],
389
- [
390
- 1344,
391
- 336
392
- ],
393
- [
394
- 1344,
395
- 672
396
- ],
397
- [
398
- 1344,
399
- 1008
400
- ],
401
- [
402
- 1344,
403
- 1344
404
- ],
405
- [
406
- 1344,
407
- 1680
408
- ],
409
- [
410
- 1344,
411
- 2016
412
- ],
413
- [
414
- 1344,
415
- 2352
416
- ],
417
- [
418
- 1344,
419
- 2688
420
- ],
421
- [
422
- 1344,
423
- 3024
424
- ],
425
- [
426
- 1344,
427
- 3360
428
- ],
429
- [
430
- 1344,
431
- 3696
432
- ],
433
- [
434
- 1344,
435
- 4032
436
- ],
437
- [
438
- 1680,
439
- 336
440
- ],
441
- [
442
- 1680,
443
- 672
444
- ],
445
- [
446
- 1680,
447
- 1008
448
- ],
449
- [
450
- 1680,
451
- 1344
452
- ],
453
- [
454
- 1680,
455
- 1680
456
- ],
457
- [
458
- 1680,
459
- 2016
460
- ],
461
- [
462
- 1680,
463
- 2352
464
- ],
465
- [
466
- 1680,
467
- 2688
468
- ],
469
- [
470
- 1680,
471
- 3024
472
- ],
473
- [
474
- 2016,
475
- 336
476
- ],
477
- [
478
- 2016,
479
- 672
480
- ],
481
- [
482
- 2016,
483
- 1008
484
- ],
485
- [
486
- 2016,
487
- 1344
488
- ],
489
- [
490
- 2016,
491
- 1680
492
- ],
493
- [
494
- 2016,
495
- 2016
496
- ],
497
- [
498
- 2016,
499
- 2352
500
- ],
501
- [
502
- 2016,
503
- 2688
504
- ],
505
- [
506
- 2352,
507
- 336
508
- ],
509
- [
510
- 2352,
511
- 672
512
- ],
513
- [
514
- 2352,
515
- 1008
516
- ],
517
- [
518
- 2352,
519
- 1344
520
- ],
521
- [
522
- 2352,
523
- 1680
524
- ],
525
- [
526
- 2352,
527
- 2016
528
- ],
529
- [
530
- 2352,
531
- 2352
532
- ],
533
- [
534
- 2688,
535
- 336
536
- ],
537
- [
538
- 2688,
539
- 672
540
- ],
541
- [
542
- 2688,
543
- 1008
544
- ],
545
- [
546
- 2688,
547
- 1344
548
- ],
549
- [
550
- 2688,
551
- 1680
552
- ],
553
- [
554
- 2688,
555
- 2016
556
- ],
557
- [
558
- 3024,
559
- 336
560
- ],
561
- [
562
- 3024,
563
- 672
564
- ],
565
- [
566
- 3024,
567
- 1008
568
- ],
569
- [
570
- 3024,
571
- 1344
572
- ],
573
- [
574
- 3024,
575
- 1680
576
- ],
577
- [
578
- 3360,
579
- 336
580
- ],
581
- [
582
- 3360,
583
- 672
584
- ],
585
- [
586
- 3360,
587
- 1008
588
- ],
589
- [
590
- 3360,
591
- 1344
592
- ],
593
- [
594
- 3696,
595
- 336
596
- ],
597
- [
598
- 3696,
599
- 672
600
- ],
601
- [
602
- 3696,
603
- 1008
604
- ],
605
- [
606
- 3696,
607
- 1344
608
- ],
609
- [
610
- 4032,
611
- 336
612
- ],
613
- [
614
- 4032,
615
- 672
616
- ],
617
- [
618
- 4032,
619
- 1008
620
- ],
621
- [
622
- 4032,
623
- 1344
624
- ],
625
- [
626
- 4368,
627
- 336
628
- ],
629
- [
630
- 4368,
631
- 672
632
- ],
633
- [
634
- 4368,
635
- 1008
636
- ],
637
- [
638
- 4704,
639
- 336
640
- ],
641
- [
642
- 4704,
643
- 672
644
- ],
645
- [
646
- 4704,
647
- 1008
648
- ],
649
- [
650
- 5040,
651
- 336
652
- ],
653
- [
654
- 5040,
655
- 672
656
- ],
657
- [
658
- 5040,
659
- 1008
660
- ],
661
- [
662
- 5376,
663
- 336
664
- ],
665
- [
666
- 5376,
667
- 672
668
- ],
669
- [
670
- 5376,
671
- 1008
672
- ],
673
- [
674
- 5712,
675
- 336
676
- ],
677
- [
678
- 5712,
679
- 672
680
- ],
681
- [
682
- 6048,
683
- 336
684
- ],
685
- [
686
- 6048,
687
- 672
688
- ],
689
- [
690
- 6384,
691
- 336
692
- ],
693
- [
694
- 6384,
695
- 672
696
- ],
697
- [
698
- 6720,
699
- 336
700
- ],
701
- [
702
- 6720,
703
- 672
704
- ],
705
- [
706
- 7056,
707
- 336
708
- ],
709
- [
710
- 7056,
711
- 672
712
- ],
713
- [
714
- 7392,
715
- 336
716
- ],
717
- [
718
- 7392,
719
- 672
720
- ],
721
- [
722
- 7728,
723
- 336
724
- ],
725
- [
726
- 7728,
727
- 672
728
- ],
729
- [
730
- 8064,
731
- 336
732
- ],
733
- [
734
- 8064,
735
- 672
736
- ],
737
- [
738
- 8400,
739
- 336
740
- ],
741
- [
742
- 8736,
743
- 336
744
- ],
745
- [
746
- 9072,
747
- 336
748
- ],
749
- [
750
- 9408,
751
- 336
752
- ],
753
- [
754
- 9744,
755
- 336
756
- ],
757
- [
758
- 10080,
759
- 336
760
- ],
761
- [
762
- 10416,
763
- 336
764
- ],
765
- [
766
- 10752,
767
- 336
768
- ],
769
- [
770
- 11088,
771
- 336
772
- ],
773
- [
774
- 11424,
775
- 336
776
- ],
777
- [
778
- 11760,
779
- 336
780
- ],
781
- [
782
- 12096,
783
- 336
784
- ],
785
- [
786
- 12432,
787
- 336
788
- ],
789
- [
790
- 12768,
791
- 336
792
- ],
793
- [
794
- 13104,
795
- 336
796
- ],
797
- [
798
- 13440,
799
- 336
800
- ],
801
- [
802
- 13776,
803
- 336
804
- ],
805
- [
806
- 14112,
807
- 336
808
- ],
809
- [
810
- 14448,
811
- 336
812
- ],
813
- [
814
- 14784,
815
- 336
816
- ],
817
- [
818
- 15120,
819
- 336
820
- ],
821
- [
822
- 15456,
823
- 336
824
- ],
825
- [
826
- 15792,
827
- 336
828
- ],
829
- [
830
- 16128,
831
- 336
832
- ],
833
- [
834
- 16464,
835
- 336
836
- ]
837
- ],
838
- "image_split_resolution": null,
839
- "initializer_range": 0.02,
840
- "intermediate_size": 18944,
841
- "max_position_embeddings": 32768,
842
- "max_window_layers": 28,
843
- "mm_hidden_size": 1024,
844
- "mm_patch_merge_type": "unires",
845
- "mm_projector_lr": null,
846
- "mm_projector_type": "mlp2x_gelu",
847
- "mm_resampler_type": "spatial_pool",
848
- "mm_spatial_pool_mode": "average",
849
- "mm_spatial_pool_out_channels": 1024,
850
- "mm_spatial_pool_stride": 2,
851
- "mm_use_im_patch_token": false,
852
- "mm_use_im_start_end": false,
853
- "mm_vision_select_feature": "patch",
854
- "mm_vision_select_layer": -1,
855
- "mm_vision_tower": "/share/junjie/shuyan/clip-vit-large-patch14-336",
856
- "mm_vision_tower_lr": null,
857
- "model_type": "qwen2",
858
- "num_attention_heads": 28,
859
- "num_hidden_layers": 28,
860
- "num_key_value_heads": 4,
861
- "pos_skipping_range": 4096,
862
- "rms_norm_eps": 1e-06,
863
- "rope_scaling": null,
864
- "rope_theta": 1000000.0,
865
- "sliding_window": 131072,
866
- "tie_word_embeddings": false,
867
- "tokenizer_model_max_length": 32768,
868
- "tokenizer_padding_side": "right",
869
- "torch_dtype": "bfloat16",
870
- "transformers_version": "4.39.2",
871
- "tune_mm_mlp_adapter": false,
872
- "tune_mm_vision_resampler": false,
873
- "unfreeze_mm_vision_tower": true,
874
- "use_cache": false,
875
- "use_mm_proj": true,
876
- "use_pos_skipping": false,
877
- "use_sliding_window": false,
878
- "vision_tower_pretrained": null,
879
- "vocab_size": 152064
880
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
VideoXL_weight_8/latest DELETED
@@ -1 +0,0 @@
1
- global_step15000
 
 
VideoXL_weight_8/model-00002-of-00004.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:440fc3d8b28f82f1ad817d368d3a4c74467341c84297b8b5c40a6afb2f381324
3
- size 4991570400
 
 
 
 
VideoXL_weight_8/model-00003-of-00004.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3db1423d451c8045375b5248ff01ffaae92a348e8000f2b4b2261a2cc9ff4dd
3
- size 4991570464
 
 
 
 
VideoXL_weight_8/rng_state_1.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:27091615c47a5f03f833ce157986890dc26d2d4ede28d06870ca0c96c37e3b6c
3
- size 15984
 
 
 
 
VideoXL_weight_8/trainer_state.json DELETED
The diff for this file is too large to render. See raw diff
 
VideoXL_weight_8/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:70b3fb3b86cd0c94d13a93bdc080bee40afe65820d8d57848cc5106c1d0d6a4f
3
- size 7032
 
 
 
 
VideoXL_weight_8/vocab.json DELETED
The diff for this file is too large to render. See raw diff