lxr2003 committed on
Commit
8393537
·
verified ·
1 Parent(s): 9a2445a

Upload folder using huggingface_hub

Browse files
.ipynb_checkpoints/config-checkpoint.json ADDED
@@ -0,0 +1,880 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/share/LXRlxr0_0/code/Qwen/Qwen2.5-3B-Instruct",
3
+ "architectures": [
4
+ "LlavaQwenForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "beacon_accum": true,
8
+ "beacon_attend_prev": true,
9
+ "beacon_attn": "full-coverage",
10
+ "beacon_embed_init": "eos",
11
+ "beacon_parallel_window": 1,
12
+ "beacon_param": [
13
+ "q",
14
+ "k",
15
+ "v"
16
+ ],
17
+ "beacon_pos": "interleave",
18
+ "beacon_ratio": [
19
+ 2,
20
+ 4,
21
+ 8
22
+ ],
23
+ "beacon_ratio_mix": "step-random",
24
+ "beacon_sink_size": 0,
25
+ "beacon_stride": 1440,
26
+ "beacon_window": 1440,
27
+ "bos_token_id": 151643,
28
+ "enable_beacon": true,
29
+ "eos_token_id": 151645,
30
+ "freeze_mm_mlp_adapter": false,
31
+ "freeze_mm_vision_resampler": false,
32
+ "hidden_act": "silu",
33
+ "hidden_size": 2048,
34
+ "image_aspect_ratio": "anyres",
35
+ "image_crop_resolution": null,
36
+ "image_grid_pinpoints": [
37
+ [
38
+ 336,
39
+ 672
40
+ ],
41
+ [
42
+ 336,
43
+ 1008
44
+ ],
45
+ [
46
+ 336,
47
+ 1344
48
+ ],
49
+ [
50
+ 336,
51
+ 1680
52
+ ],
53
+ [
54
+ 336,
55
+ 2016
56
+ ],
57
+ [
58
+ 336,
59
+ 2352
60
+ ],
61
+ [
62
+ 336,
63
+ 2688
64
+ ],
65
+ [
66
+ 336,
67
+ 3024
68
+ ],
69
+ [
70
+ 336,
71
+ 3360
72
+ ],
73
+ [
74
+ 336,
75
+ 3696
76
+ ],
77
+ [
78
+ 336,
79
+ 4032
80
+ ],
81
+ [
82
+ 336,
83
+ 4368
84
+ ],
85
+ [
86
+ 336,
87
+ 4704
88
+ ],
89
+ [
90
+ 336,
91
+ 5040
92
+ ],
93
+ [
94
+ 336,
95
+ 5376
96
+ ],
97
+ [
98
+ 336,
99
+ 5712
100
+ ],
101
+ [
102
+ 336,
103
+ 6048
104
+ ],
105
+ [
106
+ 336,
107
+ 6384
108
+ ],
109
+ [
110
+ 336,
111
+ 6720
112
+ ],
113
+ [
114
+ 336,
115
+ 7056
116
+ ],
117
+ [
118
+ 336,
119
+ 7392
120
+ ],
121
+ [
122
+ 336,
123
+ 7728
124
+ ],
125
+ [
126
+ 336,
127
+ 8064
128
+ ],
129
+ [
130
+ 336,
131
+ 8400
132
+ ],
133
+ [
134
+ 336,
135
+ 8736
136
+ ],
137
+ [
138
+ 336,
139
+ 9072
140
+ ],
141
+ [
142
+ 336,
143
+ 9408
144
+ ],
145
+ [
146
+ 336,
147
+ 9744
148
+ ],
149
+ [
150
+ 336,
151
+ 10080
152
+ ],
153
+ [
154
+ 336,
155
+ 10416
156
+ ],
157
+ [
158
+ 336,
159
+ 10752
160
+ ],
161
+ [
162
+ 336,
163
+ 11088
164
+ ],
165
+ [
166
+ 336,
167
+ 11424
168
+ ],
169
+ [
170
+ 336,
171
+ 11760
172
+ ],
173
+ [
174
+ 336,
175
+ 12096
176
+ ],
177
+ [
178
+ 336,
179
+ 12432
180
+ ],
181
+ [
182
+ 336,
183
+ 12768
184
+ ],
185
+ [
186
+ 336,
187
+ 13104
188
+ ],
189
+ [
190
+ 336,
191
+ 13440
192
+ ],
193
+ [
194
+ 336,
195
+ 13776
196
+ ],
197
+ [
198
+ 336,
199
+ 14112
200
+ ],
201
+ [
202
+ 336,
203
+ 14448
204
+ ],
205
+ [
206
+ 336,
207
+ 14784
208
+ ],
209
+ [
210
+ 336,
211
+ 15120
212
+ ],
213
+ [
214
+ 336,
215
+ 15456
216
+ ],
217
+ [
218
+ 336,
219
+ 15792
220
+ ],
221
+ [
222
+ 336,
223
+ 16128
224
+ ],
225
+ [
226
+ 336,
227
+ 16464
228
+ ],
229
+ [
230
+ 672,
231
+ 336
232
+ ],
233
+ [
234
+ 672,
235
+ 672
236
+ ],
237
+ [
238
+ 672,
239
+ 1008
240
+ ],
241
+ [
242
+ 672,
243
+ 1344
244
+ ],
245
+ [
246
+ 672,
247
+ 1680
248
+ ],
249
+ [
250
+ 672,
251
+ 2016
252
+ ],
253
+ [
254
+ 672,
255
+ 2352
256
+ ],
257
+ [
258
+ 672,
259
+ 2688
260
+ ],
261
+ [
262
+ 672,
263
+ 3024
264
+ ],
265
+ [
266
+ 672,
267
+ 3360
268
+ ],
269
+ [
270
+ 672,
271
+ 3696
272
+ ],
273
+ [
274
+ 672,
275
+ 4032
276
+ ],
277
+ [
278
+ 672,
279
+ 4368
280
+ ],
281
+ [
282
+ 672,
283
+ 4704
284
+ ],
285
+ [
286
+ 672,
287
+ 5040
288
+ ],
289
+ [
290
+ 672,
291
+ 5376
292
+ ],
293
+ [
294
+ 672,
295
+ 5712
296
+ ],
297
+ [
298
+ 672,
299
+ 6048
300
+ ],
301
+ [
302
+ 672,
303
+ 6384
304
+ ],
305
+ [
306
+ 672,
307
+ 6720
308
+ ],
309
+ [
310
+ 672,
311
+ 7056
312
+ ],
313
+ [
314
+ 672,
315
+ 7392
316
+ ],
317
+ [
318
+ 672,
319
+ 7728
320
+ ],
321
+ [
322
+ 672,
323
+ 8064
324
+ ],
325
+ [
326
+ 1008,
327
+ 336
328
+ ],
329
+ [
330
+ 1008,
331
+ 672
332
+ ],
333
+ [
334
+ 1008,
335
+ 1008
336
+ ],
337
+ [
338
+ 1008,
339
+ 1344
340
+ ],
341
+ [
342
+ 1008,
343
+ 1680
344
+ ],
345
+ [
346
+ 1008,
347
+ 2016
348
+ ],
349
+ [
350
+ 1008,
351
+ 2352
352
+ ],
353
+ [
354
+ 1008,
355
+ 2688
356
+ ],
357
+ [
358
+ 1008,
359
+ 3024
360
+ ],
361
+ [
362
+ 1008,
363
+ 3360
364
+ ],
365
+ [
366
+ 1008,
367
+ 3696
368
+ ],
369
+ [
370
+ 1008,
371
+ 4032
372
+ ],
373
+ [
374
+ 1008,
375
+ 4368
376
+ ],
377
+ [
378
+ 1008,
379
+ 4704
380
+ ],
381
+ [
382
+ 1008,
383
+ 5040
384
+ ],
385
+ [
386
+ 1008,
387
+ 5376
388
+ ],
389
+ [
390
+ 1344,
391
+ 336
392
+ ],
393
+ [
394
+ 1344,
395
+ 672
396
+ ],
397
+ [
398
+ 1344,
399
+ 1008
400
+ ],
401
+ [
402
+ 1344,
403
+ 1344
404
+ ],
405
+ [
406
+ 1344,
407
+ 1680
408
+ ],
409
+ [
410
+ 1344,
411
+ 2016
412
+ ],
413
+ [
414
+ 1344,
415
+ 2352
416
+ ],
417
+ [
418
+ 1344,
419
+ 2688
420
+ ],
421
+ [
422
+ 1344,
423
+ 3024
424
+ ],
425
+ [
426
+ 1344,
427
+ 3360
428
+ ],
429
+ [
430
+ 1344,
431
+ 3696
432
+ ],
433
+ [
434
+ 1344,
435
+ 4032
436
+ ],
437
+ [
438
+ 1680,
439
+ 336
440
+ ],
441
+ [
442
+ 1680,
443
+ 672
444
+ ],
445
+ [
446
+ 1680,
447
+ 1008
448
+ ],
449
+ [
450
+ 1680,
451
+ 1344
452
+ ],
453
+ [
454
+ 1680,
455
+ 1680
456
+ ],
457
+ [
458
+ 1680,
459
+ 2016
460
+ ],
461
+ [
462
+ 1680,
463
+ 2352
464
+ ],
465
+ [
466
+ 1680,
467
+ 2688
468
+ ],
469
+ [
470
+ 1680,
471
+ 3024
472
+ ],
473
+ [
474
+ 2016,
475
+ 336
476
+ ],
477
+ [
478
+ 2016,
479
+ 672
480
+ ],
481
+ [
482
+ 2016,
483
+ 1008
484
+ ],
485
+ [
486
+ 2016,
487
+ 1344
488
+ ],
489
+ [
490
+ 2016,
491
+ 1680
492
+ ],
493
+ [
494
+ 2016,
495
+ 2016
496
+ ],
497
+ [
498
+ 2016,
499
+ 2352
500
+ ],
501
+ [
502
+ 2016,
503
+ 2688
504
+ ],
505
+ [
506
+ 2352,
507
+ 336
508
+ ],
509
+ [
510
+ 2352,
511
+ 672
512
+ ],
513
+ [
514
+ 2352,
515
+ 1008
516
+ ],
517
+ [
518
+ 2352,
519
+ 1344
520
+ ],
521
+ [
522
+ 2352,
523
+ 1680
524
+ ],
525
+ [
526
+ 2352,
527
+ 2016
528
+ ],
529
+ [
530
+ 2352,
531
+ 2352
532
+ ],
533
+ [
534
+ 2688,
535
+ 336
536
+ ],
537
+ [
538
+ 2688,
539
+ 672
540
+ ],
541
+ [
542
+ 2688,
543
+ 1008
544
+ ],
545
+ [
546
+ 2688,
547
+ 1344
548
+ ],
549
+ [
550
+ 2688,
551
+ 1680
552
+ ],
553
+ [
554
+ 2688,
555
+ 2016
556
+ ],
557
+ [
558
+ 3024,
559
+ 336
560
+ ],
561
+ [
562
+ 3024,
563
+ 672
564
+ ],
565
+ [
566
+ 3024,
567
+ 1008
568
+ ],
569
+ [
570
+ 3024,
571
+ 1344
572
+ ],
573
+ [
574
+ 3024,
575
+ 1680
576
+ ],
577
+ [
578
+ 3360,
579
+ 336
580
+ ],
581
+ [
582
+ 3360,
583
+ 672
584
+ ],
585
+ [
586
+ 3360,
587
+ 1008
588
+ ],
589
+ [
590
+ 3360,
591
+ 1344
592
+ ],
593
+ [
594
+ 3696,
595
+ 336
596
+ ],
597
+ [
598
+ 3696,
599
+ 672
600
+ ],
601
+ [
602
+ 3696,
603
+ 1008
604
+ ],
605
+ [
606
+ 3696,
607
+ 1344
608
+ ],
609
+ [
610
+ 4032,
611
+ 336
612
+ ],
613
+ [
614
+ 4032,
615
+ 672
616
+ ],
617
+ [
618
+ 4032,
619
+ 1008
620
+ ],
621
+ [
622
+ 4032,
623
+ 1344
624
+ ],
625
+ [
626
+ 4368,
627
+ 336
628
+ ],
629
+ [
630
+ 4368,
631
+ 672
632
+ ],
633
+ [
634
+ 4368,
635
+ 1008
636
+ ],
637
+ [
638
+ 4704,
639
+ 336
640
+ ],
641
+ [
642
+ 4704,
643
+ 672
644
+ ],
645
+ [
646
+ 4704,
647
+ 1008
648
+ ],
649
+ [
650
+ 5040,
651
+ 336
652
+ ],
653
+ [
654
+ 5040,
655
+ 672
656
+ ],
657
+ [
658
+ 5040,
659
+ 1008
660
+ ],
661
+ [
662
+ 5376,
663
+ 336
664
+ ],
665
+ [
666
+ 5376,
667
+ 672
668
+ ],
669
+ [
670
+ 5376,
671
+ 1008
672
+ ],
673
+ [
674
+ 5712,
675
+ 336
676
+ ],
677
+ [
678
+ 5712,
679
+ 672
680
+ ],
681
+ [
682
+ 6048,
683
+ 336
684
+ ],
685
+ [
686
+ 6048,
687
+ 672
688
+ ],
689
+ [
690
+ 6384,
691
+ 336
692
+ ],
693
+ [
694
+ 6384,
695
+ 672
696
+ ],
697
+ [
698
+ 6720,
699
+ 336
700
+ ],
701
+ [
702
+ 6720,
703
+ 672
704
+ ],
705
+ [
706
+ 7056,
707
+ 336
708
+ ],
709
+ [
710
+ 7056,
711
+ 672
712
+ ],
713
+ [
714
+ 7392,
715
+ 336
716
+ ],
717
+ [
718
+ 7392,
719
+ 672
720
+ ],
721
+ [
722
+ 7728,
723
+ 336
724
+ ],
725
+ [
726
+ 7728,
727
+ 672
728
+ ],
729
+ [
730
+ 8064,
731
+ 336
732
+ ],
733
+ [
734
+ 8064,
735
+ 672
736
+ ],
737
+ [
738
+ 8400,
739
+ 336
740
+ ],
741
+ [
742
+ 8736,
743
+ 336
744
+ ],
745
+ [
746
+ 9072,
747
+ 336
748
+ ],
749
+ [
750
+ 9408,
751
+ 336
752
+ ],
753
+ [
754
+ 9744,
755
+ 336
756
+ ],
757
+ [
758
+ 10080,
759
+ 336
760
+ ],
761
+ [
762
+ 10416,
763
+ 336
764
+ ],
765
+ [
766
+ 10752,
767
+ 336
768
+ ],
769
+ [
770
+ 11088,
771
+ 336
772
+ ],
773
+ [
774
+ 11424,
775
+ 336
776
+ ],
777
+ [
778
+ 11760,
779
+ 336
780
+ ],
781
+ [
782
+ 12096,
783
+ 336
784
+ ],
785
+ [
786
+ 12432,
787
+ 336
788
+ ],
789
+ [
790
+ 12768,
791
+ 336
792
+ ],
793
+ [
794
+ 13104,
795
+ 336
796
+ ],
797
+ [
798
+ 13440,
799
+ 336
800
+ ],
801
+ [
802
+ 13776,
803
+ 336
804
+ ],
805
+ [
806
+ 14112,
807
+ 336
808
+ ],
809
+ [
810
+ 14448,
811
+ 336
812
+ ],
813
+ [
814
+ 14784,
815
+ 336
816
+ ],
817
+ [
818
+ 15120,
819
+ 336
820
+ ],
821
+ [
822
+ 15456,
823
+ 336
824
+ ],
825
+ [
826
+ 15792,
827
+ 336
828
+ ],
829
+ [
830
+ 16128,
831
+ 336
832
+ ],
833
+ [
834
+ 16464,
835
+ 336
836
+ ]
837
+ ],
838
+ "image_split_resolution": null,
839
+ "initializer_range": 0.02,
840
+ "intermediate_size": 11008,
841
+ "max_position_embeddings": 32768,
842
+ "max_window_layers": 70,
843
+ "mm_hidden_size": 1152,
844
+ "mm_patch_merge_type": "unires",
845
+ "mm_projector_lr": null,
846
+ "mm_projector_type": "mlp2x_gelu",
847
+ "mm_resampler_type": "spatial_pool",
848
+ "mm_spatial_pool_mode": "average",
849
+ "mm_spatial_pool_out_channels": 1152,
850
+ "mm_spatial_pool_stride": 2,
851
+ "mm_use_im_patch_token": false,
852
+ "mm_use_im_start_end": false,
853
+ "mm_vision_select_feature": "patch",
854
+ "mm_vision_select_layer": -1,
855
+ "mm_vision_tower": "/share/LXRlxr0_0/code/videoxlturbo2.0/videoxl/google/siglip-so400m-patch14-384",
856
+ "mm_vision_tower_lr": null,
857
+ "model_type": "qwen2",
858
+ "num_attention_heads": 16,
859
+ "num_hidden_layers": 36,
860
+ "num_key_value_heads": 2,
861
+ "pos_skipping_range": 4096,
862
+ "rms_norm_eps": 1e-06,
863
+ "rope_scaling": null,
864
+ "rope_theta": 1000000.0,
865
+ "sliding_window": null,
866
+ "tie_word_embeddings": true,
867
+ "tokenizer_model_max_length": 32768,
868
+ "tokenizer_padding_side": "right",
869
+ "torch_dtype": "bfloat16",
870
+ "transformers_version": "4.43.0",
871
+ "tune_mm_mlp_adapter": false,
872
+ "tune_mm_vision_resampler": false,
873
+ "unfreeze_mm_vision_tower": true,
874
+ "use_cache": true,
875
+ "use_mm_proj": true,
876
+ "use_pos_skipping": false,
877
+ "use_sliding_window": false,
878
+ "vision_tower_pretrained": null,
879
+ "vocab_size": 151936
880
+ }
.ipynb_checkpoints/model.safetensors.index-checkpoint.json ADDED
The diff for this file is too large to render. See raw diff
 
.ipynb_checkpoints/special_tokens_map-checkpoint.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>",
5
+ "<|object_ref_start|>",
6
+ "<|object_ref_end|>",
7
+ "<|box_start|>",
8
+ "<|box_end|>",
9
+ "<|quad_start|>",
10
+ "<|quad_end|>",
11
+ "<|vision_start|>",
12
+ "<|vision_end|>",
13
+ "<|vision_pad|>",
14
+ "<|image_pad|>",
15
+ "<|video_pad|>"
16
+ ],
17
+ "eos_token": {
18
+ "content": "<|im_end|>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ },
24
+ "pad_token": {
25
+ "content": "<|endoftext|>",
26
+ "lstrip": false,
27
+ "normalized": false,
28
+ "rstrip": false,
29
+ "single_word": false
30
+ }
31
+ }
.ipynb_checkpoints/vocab-checkpoint.json ADDED
The diff for this file is too large to render. See raw diff
 
added_tokens.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</tool_call>": 151658,
3
+ "<tool_call>": 151657,
4
+ "<|box_end|>": 151649,
5
+ "<|box_start|>": 151648,
6
+ "<|endoftext|>": 151643,
7
+ "<|file_sep|>": 151664,
8
+ "<|fim_middle|>": 151660,
9
+ "<|fim_pad|>": 151662,
10
+ "<|fim_prefix|>": 151659,
11
+ "<|fim_suffix|>": 151661,
12
+ "<|im_end|>": 151645,
13
+ "<|im_start|>": 151644,
14
+ "<|image_pad|>": 151655,
15
+ "<|object_ref_end|>": 151647,
16
+ "<|object_ref_start|>": 151646,
17
+ "<|quad_end|>": 151651,
18
+ "<|quad_start|>": 151650,
19
+ "<|repo_name|>": 151663,
20
+ "<|video_pad|>": 151656,
21
+ "<|vision_end|>": 151653,
22
+ "<|vision_pad|>": 151654,
23
+ "<|vision_start|>": 151652
24
+ }
config.json ADDED
@@ -0,0 +1,880 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/share/LXRlxr0_0/code/Qwen/Qwen2.5-3B-Instruct",
3
+ "architectures": [
4
+ "LlavaQwenForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "beacon_accum": true,
8
+ "beacon_attend_prev": true,
9
+ "beacon_attn": "full-coverage",
10
+ "beacon_embed_init": "eos",
11
+ "beacon_parallel_window": 1,
12
+ "beacon_param": [
13
+ "q",
14
+ "k",
15
+ "v"
16
+ ],
17
+ "beacon_pos": "interleave",
18
+ "beacon_ratio": [
19
+ 2,
20
+ 4,
21
+ 8
22
+ ],
23
+ "beacon_ratio_mix": "step-random",
24
+ "beacon_sink_size": 0,
25
+ "beacon_stride": 1440,
26
+ "beacon_window": 1440,
27
+ "bos_token_id": 151643,
28
+ "enable_beacon": true,
29
+ "eos_token_id": 151645,
30
+ "freeze_mm_mlp_adapter": false,
31
+ "freeze_mm_vision_resampler": false,
32
+ "hidden_act": "silu",
33
+ "hidden_size": 2048,
34
+ "image_aspect_ratio": "anyres",
35
+ "image_crop_resolution": null,
36
+ "image_grid_pinpoints": [
37
+ [
38
+ 336,
39
+ 672
40
+ ],
41
+ [
42
+ 336,
43
+ 1008
44
+ ],
45
+ [
46
+ 336,
47
+ 1344
48
+ ],
49
+ [
50
+ 336,
51
+ 1680
52
+ ],
53
+ [
54
+ 336,
55
+ 2016
56
+ ],
57
+ [
58
+ 336,
59
+ 2352
60
+ ],
61
+ [
62
+ 336,
63
+ 2688
64
+ ],
65
+ [
66
+ 336,
67
+ 3024
68
+ ],
69
+ [
70
+ 336,
71
+ 3360
72
+ ],
73
+ [
74
+ 336,
75
+ 3696
76
+ ],
77
+ [
78
+ 336,
79
+ 4032
80
+ ],
81
+ [
82
+ 336,
83
+ 4368
84
+ ],
85
+ [
86
+ 336,
87
+ 4704
88
+ ],
89
+ [
90
+ 336,
91
+ 5040
92
+ ],
93
+ [
94
+ 336,
95
+ 5376
96
+ ],
97
+ [
98
+ 336,
99
+ 5712
100
+ ],
101
+ [
102
+ 336,
103
+ 6048
104
+ ],
105
+ [
106
+ 336,
107
+ 6384
108
+ ],
109
+ [
110
+ 336,
111
+ 6720
112
+ ],
113
+ [
114
+ 336,
115
+ 7056
116
+ ],
117
+ [
118
+ 336,
119
+ 7392
120
+ ],
121
+ [
122
+ 336,
123
+ 7728
124
+ ],
125
+ [
126
+ 336,
127
+ 8064
128
+ ],
129
+ [
130
+ 336,
131
+ 8400
132
+ ],
133
+ [
134
+ 336,
135
+ 8736
136
+ ],
137
+ [
138
+ 336,
139
+ 9072
140
+ ],
141
+ [
142
+ 336,
143
+ 9408
144
+ ],
145
+ [
146
+ 336,
147
+ 9744
148
+ ],
149
+ [
150
+ 336,
151
+ 10080
152
+ ],
153
+ [
154
+ 336,
155
+ 10416
156
+ ],
157
+ [
158
+ 336,
159
+ 10752
160
+ ],
161
+ [
162
+ 336,
163
+ 11088
164
+ ],
165
+ [
166
+ 336,
167
+ 11424
168
+ ],
169
+ [
170
+ 336,
171
+ 11760
172
+ ],
173
+ [
174
+ 336,
175
+ 12096
176
+ ],
177
+ [
178
+ 336,
179
+ 12432
180
+ ],
181
+ [
182
+ 336,
183
+ 12768
184
+ ],
185
+ [
186
+ 336,
187
+ 13104
188
+ ],
189
+ [
190
+ 336,
191
+ 13440
192
+ ],
193
+ [
194
+ 336,
195
+ 13776
196
+ ],
197
+ [
198
+ 336,
199
+ 14112
200
+ ],
201
+ [
202
+ 336,
203
+ 14448
204
+ ],
205
+ [
206
+ 336,
207
+ 14784
208
+ ],
209
+ [
210
+ 336,
211
+ 15120
212
+ ],
213
+ [
214
+ 336,
215
+ 15456
216
+ ],
217
+ [
218
+ 336,
219
+ 15792
220
+ ],
221
+ [
222
+ 336,
223
+ 16128
224
+ ],
225
+ [
226
+ 336,
227
+ 16464
228
+ ],
229
+ [
230
+ 672,
231
+ 336
232
+ ],
233
+ [
234
+ 672,
235
+ 672
236
+ ],
237
+ [
238
+ 672,
239
+ 1008
240
+ ],
241
+ [
242
+ 672,
243
+ 1344
244
+ ],
245
+ [
246
+ 672,
247
+ 1680
248
+ ],
249
+ [
250
+ 672,
251
+ 2016
252
+ ],
253
+ [
254
+ 672,
255
+ 2352
256
+ ],
257
+ [
258
+ 672,
259
+ 2688
260
+ ],
261
+ [
262
+ 672,
263
+ 3024
264
+ ],
265
+ [
266
+ 672,
267
+ 3360
268
+ ],
269
+ [
270
+ 672,
271
+ 3696
272
+ ],
273
+ [
274
+ 672,
275
+ 4032
276
+ ],
277
+ [
278
+ 672,
279
+ 4368
280
+ ],
281
+ [
282
+ 672,
283
+ 4704
284
+ ],
285
+ [
286
+ 672,
287
+ 5040
288
+ ],
289
+ [
290
+ 672,
291
+ 5376
292
+ ],
293
+ [
294
+ 672,
295
+ 5712
296
+ ],
297
+ [
298
+ 672,
299
+ 6048
300
+ ],
301
+ [
302
+ 672,
303
+ 6384
304
+ ],
305
+ [
306
+ 672,
307
+ 6720
308
+ ],
309
+ [
310
+ 672,
311
+ 7056
312
+ ],
313
+ [
314
+ 672,
315
+ 7392
316
+ ],
317
+ [
318
+ 672,
319
+ 7728
320
+ ],
321
+ [
322
+ 672,
323
+ 8064
324
+ ],
325
+ [
326
+ 1008,
327
+ 336
328
+ ],
329
+ [
330
+ 1008,
331
+ 672
332
+ ],
333
+ [
334
+ 1008,
335
+ 1008
336
+ ],
337
+ [
338
+ 1008,
339
+ 1344
340
+ ],
341
+ [
342
+ 1008,
343
+ 1680
344
+ ],
345
+ [
346
+ 1008,
347
+ 2016
348
+ ],
349
+ [
350
+ 1008,
351
+ 2352
352
+ ],
353
+ [
354
+ 1008,
355
+ 2688
356
+ ],
357
+ [
358
+ 1008,
359
+ 3024
360
+ ],
361
+ [
362
+ 1008,
363
+ 3360
364
+ ],
365
+ [
366
+ 1008,
367
+ 3696
368
+ ],
369
+ [
370
+ 1008,
371
+ 4032
372
+ ],
373
+ [
374
+ 1008,
375
+ 4368
376
+ ],
377
+ [
378
+ 1008,
379
+ 4704
380
+ ],
381
+ [
382
+ 1008,
383
+ 5040
384
+ ],
385
+ [
386
+ 1008,
387
+ 5376
388
+ ],
389
+ [
390
+ 1344,
391
+ 336
392
+ ],
393
+ [
394
+ 1344,
395
+ 672
396
+ ],
397
+ [
398
+ 1344,
399
+ 1008
400
+ ],
401
+ [
402
+ 1344,
403
+ 1344
404
+ ],
405
+ [
406
+ 1344,
407
+ 1680
408
+ ],
409
+ [
410
+ 1344,
411
+ 2016
412
+ ],
413
+ [
414
+ 1344,
415
+ 2352
416
+ ],
417
+ [
418
+ 1344,
419
+ 2688
420
+ ],
421
+ [
422
+ 1344,
423
+ 3024
424
+ ],
425
+ [
426
+ 1344,
427
+ 3360
428
+ ],
429
+ [
430
+ 1344,
431
+ 3696
432
+ ],
433
+ [
434
+ 1344,
435
+ 4032
436
+ ],
437
+ [
438
+ 1680,
439
+ 336
440
+ ],
441
+ [
442
+ 1680,
443
+ 672
444
+ ],
445
+ [
446
+ 1680,
447
+ 1008
448
+ ],
449
+ [
450
+ 1680,
451
+ 1344
452
+ ],
453
+ [
454
+ 1680,
455
+ 1680
456
+ ],
457
+ [
458
+ 1680,
459
+ 2016
460
+ ],
461
+ [
462
+ 1680,
463
+ 2352
464
+ ],
465
+ [
466
+ 1680,
467
+ 2688
468
+ ],
469
+ [
470
+ 1680,
471
+ 3024
472
+ ],
473
+ [
474
+ 2016,
475
+ 336
476
+ ],
477
+ [
478
+ 2016,
479
+ 672
480
+ ],
481
+ [
482
+ 2016,
483
+ 1008
484
+ ],
485
+ [
486
+ 2016,
487
+ 1344
488
+ ],
489
+ [
490
+ 2016,
491
+ 1680
492
+ ],
493
+ [
494
+ 2016,
495
+ 2016
496
+ ],
497
+ [
498
+ 2016,
499
+ 2352
500
+ ],
501
+ [
502
+ 2016,
503
+ 2688
504
+ ],
505
+ [
506
+ 2352,
507
+ 336
508
+ ],
509
+ [
510
+ 2352,
511
+ 672
512
+ ],
513
+ [
514
+ 2352,
515
+ 1008
516
+ ],
517
+ [
518
+ 2352,
519
+ 1344
520
+ ],
521
+ [
522
+ 2352,
523
+ 1680
524
+ ],
525
+ [
526
+ 2352,
527
+ 2016
528
+ ],
529
+ [
530
+ 2352,
531
+ 2352
532
+ ],
533
+ [
534
+ 2688,
535
+ 336
536
+ ],
537
+ [
538
+ 2688,
539
+ 672
540
+ ],
541
+ [
542
+ 2688,
543
+ 1008
544
+ ],
545
+ [
546
+ 2688,
547
+ 1344
548
+ ],
549
+ [
550
+ 2688,
551
+ 1680
552
+ ],
553
+ [
554
+ 2688,
555
+ 2016
556
+ ],
557
+ [
558
+ 3024,
559
+ 336
560
+ ],
561
+ [
562
+ 3024,
563
+ 672
564
+ ],
565
+ [
566
+ 3024,
567
+ 1008
568
+ ],
569
+ [
570
+ 3024,
571
+ 1344
572
+ ],
573
+ [
574
+ 3024,
575
+ 1680
576
+ ],
577
+ [
578
+ 3360,
579
+ 336
580
+ ],
581
+ [
582
+ 3360,
583
+ 672
584
+ ],
585
+ [
586
+ 3360,
587
+ 1008
588
+ ],
589
+ [
590
+ 3360,
591
+ 1344
592
+ ],
593
+ [
594
+ 3696,
595
+ 336
596
+ ],
597
+ [
598
+ 3696,
599
+ 672
600
+ ],
601
+ [
602
+ 3696,
603
+ 1008
604
+ ],
605
+ [
606
+ 3696,
607
+ 1344
608
+ ],
609
+ [
610
+ 4032,
611
+ 336
612
+ ],
613
+ [
614
+ 4032,
615
+ 672
616
+ ],
617
+ [
618
+ 4032,
619
+ 1008
620
+ ],
621
+ [
622
+ 4032,
623
+ 1344
624
+ ],
625
+ [
626
+ 4368,
627
+ 336
628
+ ],
629
+ [
630
+ 4368,
631
+ 672
632
+ ],
633
+ [
634
+ 4368,
635
+ 1008
636
+ ],
637
+ [
638
+ 4704,
639
+ 336
640
+ ],
641
+ [
642
+ 4704,
643
+ 672
644
+ ],
645
+ [
646
+ 4704,
647
+ 1008
648
+ ],
649
+ [
650
+ 5040,
651
+ 336
652
+ ],
653
+ [
654
+ 5040,
655
+ 672
656
+ ],
657
+ [
658
+ 5040,
659
+ 1008
660
+ ],
661
+ [
662
+ 5376,
663
+ 336
664
+ ],
665
+ [
666
+ 5376,
667
+ 672
668
+ ],
669
+ [
670
+ 5376,
671
+ 1008
672
+ ],
673
+ [
674
+ 5712,
675
+ 336
676
+ ],
677
+ [
678
+ 5712,
679
+ 672
680
+ ],
681
+ [
682
+ 6048,
683
+ 336
684
+ ],
685
+ [
686
+ 6048,
687
+ 672
688
+ ],
689
+ [
690
+ 6384,
691
+ 336
692
+ ],
693
+ [
694
+ 6384,
695
+ 672
696
+ ],
697
+ [
698
+ 6720,
699
+ 336
700
+ ],
701
+ [
702
+ 6720,
703
+ 672
704
+ ],
705
+ [
706
+ 7056,
707
+ 336
708
+ ],
709
+ [
710
+ 7056,
711
+ 672
712
+ ],
713
+ [
714
+ 7392,
715
+ 336
716
+ ],
717
+ [
718
+ 7392,
719
+ 672
720
+ ],
721
+ [
722
+ 7728,
723
+ 336
724
+ ],
725
+ [
726
+ 7728,
727
+ 672
728
+ ],
729
+ [
730
+ 8064,
731
+ 336
732
+ ],
733
+ [
734
+ 8064,
735
+ 672
736
+ ],
737
+ [
738
+ 8400,
739
+ 336
740
+ ],
741
+ [
742
+ 8736,
743
+ 336
744
+ ],
745
+ [
746
+ 9072,
747
+ 336
748
+ ],
749
+ [
750
+ 9408,
751
+ 336
752
+ ],
753
+ [
754
+ 9744,
755
+ 336
756
+ ],
757
+ [
758
+ 10080,
759
+ 336
760
+ ],
761
+ [
762
+ 10416,
763
+ 336
764
+ ],
765
+ [
766
+ 10752,
767
+ 336
768
+ ],
769
+ [
770
+ 11088,
771
+ 336
772
+ ],
773
+ [
774
+ 11424,
775
+ 336
776
+ ],
777
+ [
778
+ 11760,
779
+ 336
780
+ ],
781
+ [
782
+ 12096,
783
+ 336
784
+ ],
785
+ [
786
+ 12432,
787
+ 336
788
+ ],
789
+ [
790
+ 12768,
791
+ 336
792
+ ],
793
+ [
794
+ 13104,
795
+ 336
796
+ ],
797
+ [
798
+ 13440,
799
+ 336
800
+ ],
801
+ [
802
+ 13776,
803
+ 336
804
+ ],
805
+ [
806
+ 14112,
807
+ 336
808
+ ],
809
+ [
810
+ 14448,
811
+ 336
812
+ ],
813
+ [
814
+ 14784,
815
+ 336
816
+ ],
817
+ [
818
+ 15120,
819
+ 336
820
+ ],
821
+ [
822
+ 15456,
823
+ 336
824
+ ],
825
+ [
826
+ 15792,
827
+ 336
828
+ ],
829
+ [
830
+ 16128,
831
+ 336
832
+ ],
833
+ [
834
+ 16464,
835
+ 336
836
+ ]
837
+ ],
838
+ "image_split_resolution": null,
839
+ "initializer_range": 0.02,
840
+ "intermediate_size": 11008,
841
+ "max_position_embeddings": 32768,
842
+ "max_window_layers": 70,
843
+ "mm_hidden_size": 1152,
844
+ "mm_patch_merge_type": "unires",
845
+ "mm_projector_lr": null,
846
+ "mm_projector_type": "mlp2x_gelu",
847
+ "mm_resampler_type": "spatial_pool",
848
+ "mm_spatial_pool_mode": "average",
849
+ "mm_spatial_pool_out_channels": 1152,
850
+ "mm_spatial_pool_stride": 2,
851
+ "mm_use_im_patch_token": false,
852
+ "mm_use_im_start_end": false,
853
+ "mm_vision_select_feature": "patch",
854
+ "mm_vision_select_layer": -1,
855
+ "mm_vision_tower": "/share/LXRlxr0_0/code/videoxlturbo2.0/videoxl_adaptfps/google/siglip-so400m-patch14-384",
856
+ "mm_vision_tower_lr": null,
857
+ "model_type": "qwen2",
858
+ "num_attention_heads": 16,
859
+ "num_hidden_layers": 36,
860
+ "num_key_value_heads": 2,
861
+ "pos_skipping_range": 4096,
862
+ "rms_norm_eps": 1e-06,
863
+ "rope_scaling": null,
864
+ "rope_theta": 1000000.0,
865
+ "sliding_window": null,
866
+ "tie_word_embeddings": true,
867
+ "tokenizer_model_max_length": 32768,
868
+ "tokenizer_padding_side": "right",
869
+ "torch_dtype": "bfloat16",
870
+ "transformers_version": "4.43.0",
871
+ "tune_mm_mlp_adapter": false,
872
+ "tune_mm_vision_resampler": false,
873
+ "unfreeze_mm_vision_tower": true,
874
+ "use_cache": true,
875
+ "use_mm_proj": true,
876
+ "use_pos_skipping": false,
877
+ "use_sliding_window": false,
878
+ "vision_tower_pretrained": null,
879
+ "vocab_size": 151936
880
+ }
generation_config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 151643,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "pad_token_id": 151643,
9
+ "repetition_penalty": 1.05,
10
+ "temperature": 0.7,
11
+ "top_k": 20,
12
+ "top_p": 0.8,
13
+ "transformers_version": "4.43.0"
14
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:482a5114f34c14d352dc9765e39c755cd3c27bd8efc4bc42886c8fdd699a5543
3
+ size 4977615904
model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7e8e43de53317dbe90e98a2e51554edc1cb4cdfbbf0d7f00a59f011e56f1438
3
+ size 3198470440
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>",
5
+ "<|object_ref_start|>",
6
+ "<|object_ref_end|>",
7
+ "<|box_start|>",
8
+ "<|box_end|>",
9
+ "<|quad_start|>",
10
+ "<|quad_end|>",
11
+ "<|vision_start|>",
12
+ "<|vision_end|>",
13
+ "<|vision_pad|>",
14
+ "<|image_pad|>",
15
+ "<|video_pad|>"
16
+ ],
17
+ "eos_token": {
18
+ "content": "<|im_end|>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ },
24
+ "pad_token": {
25
+ "content": "<|endoftext|>",
26
+ "lstrip": false,
27
+ "normalized": false,
28
+ "rstrip": false,
29
+ "single_word": false
30
+ }
31
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": false,
3
+ "add_prefix_space": false,
4
+ "added_tokens_decoder": {
5
+ "151643": {
6
+ "content": "<|endoftext|>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "151644": {
14
+ "content": "<|im_start|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "151645": {
22
+ "content": "<|im_end|>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ },
29
+ "151646": {
30
+ "content": "<|object_ref_start|>",
31
+ "lstrip": false,
32
+ "normalized": false,
33
+ "rstrip": false,
34
+ "single_word": false,
35
+ "special": true
36
+ },
37
+ "151647": {
38
+ "content": "<|object_ref_end|>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false,
43
+ "special": true
44
+ },
45
+ "151648": {
46
+ "content": "<|box_start|>",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false,
51
+ "special": true
52
+ },
53
+ "151649": {
54
+ "content": "<|box_end|>",
55
+ "lstrip": false,
56
+ "normalized": false,
57
+ "rstrip": false,
58
+ "single_word": false,
59
+ "special": true
60
+ },
61
+ "151650": {
62
+ "content": "<|quad_start|>",
63
+ "lstrip": false,
64
+ "normalized": false,
65
+ "rstrip": false,
66
+ "single_word": false,
67
+ "special": true
68
+ },
69
+ "151651": {
70
+ "content": "<|quad_end|>",
71
+ "lstrip": false,
72
+ "normalized": false,
73
+ "rstrip": false,
74
+ "single_word": false,
75
+ "special": true
76
+ },
77
+ "151652": {
78
+ "content": "<|vision_start|>",
79
+ "lstrip": false,
80
+ "normalized": false,
81
+ "rstrip": false,
82
+ "single_word": false,
83
+ "special": true
84
+ },
85
+ "151653": {
86
+ "content": "<|vision_end|>",
87
+ "lstrip": false,
88
+ "normalized": false,
89
+ "rstrip": false,
90
+ "single_word": false,
91
+ "special": true
92
+ },
93
+ "151654": {
94
+ "content": "<|vision_pad|>",
95
+ "lstrip": false,
96
+ "normalized": false,
97
+ "rstrip": false,
98
+ "single_word": false,
99
+ "special": true
100
+ },
101
+ "151655": {
102
+ "content": "<|image_pad|>",
103
+ "lstrip": false,
104
+ "normalized": false,
105
+ "rstrip": false,
106
+ "single_word": false,
107
+ "special": true
108
+ },
109
+ "151656": {
110
+ "content": "<|video_pad|>",
111
+ "lstrip": false,
112
+ "normalized": false,
113
+ "rstrip": false,
114
+ "single_word": false,
115
+ "special": true
116
+ },
117
+ "151657": {
118
+ "content": "<tool_call>",
119
+ "lstrip": false,
120
+ "normalized": false,
121
+ "rstrip": false,
122
+ "single_word": false,
123
+ "special": false
124
+ },
125
+ "151658": {
126
+ "content": "</tool_call>",
127
+ "lstrip": false,
128
+ "normalized": false,
129
+ "rstrip": false,
130
+ "single_word": false,
131
+ "special": false
132
+ },
133
+ "151659": {
134
+ "content": "<|fim_prefix|>",
135
+ "lstrip": false,
136
+ "normalized": false,
137
+ "rstrip": false,
138
+ "single_word": false,
139
+ "special": false
140
+ },
141
+ "151660": {
142
+ "content": "<|fim_middle|>",
143
+ "lstrip": false,
144
+ "normalized": false,
145
+ "rstrip": false,
146
+ "single_word": false,
147
+ "special": false
148
+ },
149
+ "151661": {
150
+ "content": "<|fim_suffix|>",
151
+ "lstrip": false,
152
+ "normalized": false,
153
+ "rstrip": false,
154
+ "single_word": false,
155
+ "special": false
156
+ },
157
+ "151662": {
158
+ "content": "<|fim_pad|>",
159
+ "lstrip": false,
160
+ "normalized": false,
161
+ "rstrip": false,
162
+ "single_word": false,
163
+ "special": false
164
+ },
165
+ "151663": {
166
+ "content": "<|repo_name|>",
167
+ "lstrip": false,
168
+ "normalized": false,
169
+ "rstrip": false,
170
+ "single_word": false,
171
+ "special": false
172
+ },
173
+ "151664": {
174
+ "content": "<|file_sep|>",
175
+ "lstrip": false,
176
+ "normalized": false,
177
+ "rstrip": false,
178
+ "single_word": false,
179
+ "special": false
180
+ }
181
+ },
182
+ "additional_special_tokens": [
183
+ "<|im_start|>",
184
+ "<|im_end|>",
185
+ "<|object_ref_start|>",
186
+ "<|object_ref_end|>",
187
+ "<|box_start|>",
188
+ "<|box_end|>",
189
+ "<|quad_start|>",
190
+ "<|quad_end|>",
191
+ "<|vision_start|>",
192
+ "<|vision_end|>",
193
+ "<|vision_pad|>",
194
+ "<|image_pad|>",
195
+ "<|video_pad|>"
196
+ ],
197
+ "bos_token": null,
198
+ "chat_template": "{%- if tools %}\n {{- '<|im_start|>system\\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] }}\n {%- else %}\n {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }}\n {%- endif %}\n {{- \"\\n\\n# Tools\\n\\nYou may call one or more functions to assist with the user query.\\n\\nYou are provided with function signatures within <tools></tools> XML tags:\\n<tools>\" }}\n {%- for tool in tools %}\n {{- \"\\n\" }}\n {{- tool | tojson }}\n {%- endfor %}\n {{- \"\\n</tools>\\n\\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\\n<tool_call>\\n{\\\"name\\\": <function-name>, \\\"arguments\\\": <args-json-object>}\\n</tool_call><|im_end|>\\n\" }}\n{%- else %}\n {%- if messages[0]['role'] == 'system' %}\n {{- '<|im_start|>system\\n' + messages[0]['content'] + '<|im_end|>\\n' }}\n {%- else %}\n {{- '<|im_start|>system\\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and not message.tool_calls) %}\n {{- '<|im_start|>' + message.role + '\\n' + message.content + '<|im_end|>' + '\\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role }}\n {%- if message.content %}\n {{- '\\n' + message.content }}\n {%- endif %}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '\\n<tool_call>\\n{\"name\": \"' }}\n {{- tool_call.name }}\n {{- '\", \"arguments\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- '}\\n</tool_call>' }}\n {%- endfor %}\n {{- '<|im_end|>\\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != \"tool\") %}\n {{- '<|im_start|>user' }}\n {%- endif %}\n {{- '\\n<tool_response>\\n' }}\n {{- message.content }}\n {{- '\\n</tool_response>' }}\n {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n {{- '<|im_end|>\\n' }}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\\n' }}\n{%- endif %}\n",
199
+ "clean_up_tokenization_spaces": false,
200
+ "eos_token": "<|im_end|>",
201
+ "errors": "replace",
202
+ "model_max_length": 32768,
203
+ "pad_token": "<|endoftext|>",
204
+ "padding_side": "right",
205
+ "split_special_tokens": false,
206
+ "tokenizer_class": "Qwen2Tokenizer",
207
+ "unk_token": null
208
+ }
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75fdc26965f066ea3a3653fe2cb89637260eb67c664cc2a8c6fae40eeaa9fbc6
3
+ size 7352
vocab.json ADDED
The diff for this file is too large to render. See raw diff