Regenerate the model to ensure successful execution on vLLM
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +312 -126
- model-00001-of-00054.safetensors +2 -2
- model-00002-of-00054.safetensors +2 -2
- model-00003-of-00054.safetensors +2 -2
- model-00004-of-00054.safetensors +2 -2
- model-00005-of-00054.safetensors +2 -2
- model-00006-of-00054.safetensors +2 -2
- model-00007-of-00054.safetensors +2 -2
- model-00008-of-00054.safetensors +2 -2
- model-00009-of-00054.safetensors +2 -2
- model-00010-of-00054.safetensors +2 -2
- model-00011-of-00054.safetensors +2 -2
- model-00012-of-00054.safetensors +2 -2
- model-00013-of-00054.safetensors +2 -2
- model-00014-of-00054.safetensors +2 -2
- model-00015-of-00054.safetensors +2 -2
- model-00016-of-00054.safetensors +2 -2
- model-00017-of-00054.safetensors +2 -2
- model-00018-of-00054.safetensors +2 -2
- model-00019-of-00054.safetensors +2 -2
- model-00020-of-00054.safetensors +2 -2
- model-00021-of-00054.safetensors +2 -2
- model-00022-of-00054.safetensors +2 -2
- model-00023-of-00054.safetensors +2 -2
- model-00024-of-00054.safetensors +2 -2
- model-00025-of-00054.safetensors +2 -2
- model-00026-of-00054.safetensors +2 -2
- model-00027-of-00054.safetensors +2 -2
- model-00028-of-00054.safetensors +2 -2
- model-00029-of-00054.safetensors +2 -2
- model-00030-of-00054.safetensors +2 -2
- model-00031-of-00054.safetensors +2 -2
- model-00032-of-00054.safetensors +2 -2
- model-00033-of-00054.safetensors +2 -2
- model-00034-of-00054.safetensors +2 -2
- model-00035-of-00054.safetensors +2 -2
- model-00036-of-00054.safetensors +2 -2
- model-00037-of-00054.safetensors +2 -2
- model-00038-of-00054.safetensors +2 -2
- model-00039-of-00054.safetensors +2 -2
- model-00040-of-00054.safetensors +2 -2
- model-00041-of-00054.safetensors +2 -2
- model-00042-of-00054.safetensors +2 -2
- model-00043-of-00054.safetensors +2 -2
- model-00044-of-00054.safetensors +2 -2
- model-00045-of-00054.safetensors +2 -2
- model-00046-of-00054.safetensors +2 -2
- model-00047-of-00054.safetensors +2 -2
- model-00048-of-00054.safetensors +2 -2
- model-00049-of-00054.safetensors +2 -2
config.json
CHANGED
|
@@ -25,13 +25,12 @@
|
|
| 25 |
"output_router_logits": false,
|
| 26 |
"qkv_bias": false,
|
| 27 |
"quantization_config": {
|
| 28 |
-
"autoround_version": "0.6.
|
| 29 |
"bits": 4,
|
| 30 |
"data_type": "int",
|
| 31 |
"extra_config": {
|
| 32 |
"model.layers.0.mlp.gate": {
|
| 33 |
-
"bits":
|
| 34 |
-
"group_size": 128
|
| 35 |
},
|
| 36 |
"model.layers.0.self_attn.k_proj": {
|
| 37 |
"bits": 8,
|
|
@@ -50,8 +49,7 @@
|
|
| 50 |
"group_size": 128
|
| 51 |
},
|
| 52 |
"model.layers.1.mlp.gate": {
|
| 53 |
-
"bits":
|
| 54 |
-
"group_size": 128
|
| 55 |
},
|
| 56 |
"model.layers.1.self_attn.k_proj": {
|
| 57 |
"bits": 8,
|
|
@@ -70,8 +68,7 @@
|
|
| 70 |
"group_size": 128
|
| 71 |
},
|
| 72 |
"model.layers.10.mlp.gate": {
|
| 73 |
-
"bits":
|
| 74 |
-
"group_size": 128
|
| 75 |
},
|
| 76 |
"model.layers.10.self_attn.k_proj": {
|
| 77 |
"bits": 8,
|
|
@@ -90,8 +87,7 @@
|
|
| 90 |
"group_size": 128
|
| 91 |
},
|
| 92 |
"model.layers.11.mlp.gate": {
|
| 93 |
-
"bits":
|
| 94 |
-
"group_size": 128
|
| 95 |
},
|
| 96 |
"model.layers.11.self_attn.k_proj": {
|
| 97 |
"bits": 8,
|
|
@@ -110,8 +106,7 @@
|
|
| 110 |
"group_size": 128
|
| 111 |
},
|
| 112 |
"model.layers.12.mlp.gate": {
|
| 113 |
-
"bits":
|
| 114 |
-
"group_size": 128
|
| 115 |
},
|
| 116 |
"model.layers.12.self_attn.k_proj": {
|
| 117 |
"bits": 8,
|
|
@@ -130,8 +125,7 @@
|
|
| 130 |
"group_size": 128
|
| 131 |
},
|
| 132 |
"model.layers.13.mlp.gate": {
|
| 133 |
-
"bits":
|
| 134 |
-
"group_size": 128
|
| 135 |
},
|
| 136 |
"model.layers.13.self_attn.k_proj": {
|
| 137 |
"bits": 8,
|
|
@@ -150,8 +144,7 @@
|
|
| 150 |
"group_size": 128
|
| 151 |
},
|
| 152 |
"model.layers.14.mlp.gate": {
|
| 153 |
-
"bits":
|
| 154 |
-
"group_size": 128
|
| 155 |
},
|
| 156 |
"model.layers.14.self_attn.k_proj": {
|
| 157 |
"bits": 8,
|
|
@@ -170,8 +163,7 @@
|
|
| 170 |
"group_size": 128
|
| 171 |
},
|
| 172 |
"model.layers.15.mlp.gate": {
|
| 173 |
-
"bits":
|
| 174 |
-
"group_size": 128
|
| 175 |
},
|
| 176 |
"model.layers.15.self_attn.k_proj": {
|
| 177 |
"bits": 8,
|
|
@@ -190,8 +182,7 @@
|
|
| 190 |
"group_size": 128
|
| 191 |
},
|
| 192 |
"model.layers.16.mlp.gate": {
|
| 193 |
-
"bits":
|
| 194 |
-
"group_size": 128
|
| 195 |
},
|
| 196 |
"model.layers.16.self_attn.k_proj": {
|
| 197 |
"bits": 8,
|
|
@@ -210,8 +201,7 @@
|
|
| 210 |
"group_size": 128
|
| 211 |
},
|
| 212 |
"model.layers.17.mlp.gate": {
|
| 213 |
-
"bits":
|
| 214 |
-
"group_size": 128
|
| 215 |
},
|
| 216 |
"model.layers.17.self_attn.k_proj": {
|
| 217 |
"bits": 8,
|
|
@@ -230,8 +220,7 @@
|
|
| 230 |
"group_size": 128
|
| 231 |
},
|
| 232 |
"model.layers.18.mlp.gate": {
|
| 233 |
-
"bits":
|
| 234 |
-
"group_size": 128
|
| 235 |
},
|
| 236 |
"model.layers.18.self_attn.k_proj": {
|
| 237 |
"bits": 8,
|
|
@@ -250,8 +239,7 @@
|
|
| 250 |
"group_size": 128
|
| 251 |
},
|
| 252 |
"model.layers.19.mlp.gate": {
|
| 253 |
-
"bits":
|
| 254 |
-
"group_size": 128
|
| 255 |
},
|
| 256 |
"model.layers.19.self_attn.k_proj": {
|
| 257 |
"bits": 8,
|
|
@@ -270,8 +258,7 @@
|
|
| 270 |
"group_size": 128
|
| 271 |
},
|
| 272 |
"model.layers.2.mlp.gate": {
|
| 273 |
-
"bits":
|
| 274 |
-
"group_size": 128
|
| 275 |
},
|
| 276 |
"model.layers.2.self_attn.k_proj": {
|
| 277 |
"bits": 8,
|
|
@@ -290,8 +277,7 @@
|
|
| 290 |
"group_size": 128
|
| 291 |
},
|
| 292 |
"model.layers.20.mlp.gate": {
|
| 293 |
-
"bits":
|
| 294 |
-
"group_size": 128
|
| 295 |
},
|
| 296 |
"model.layers.20.self_attn.k_proj": {
|
| 297 |
"bits": 8,
|
|
@@ -310,8 +296,7 @@
|
|
| 310 |
"group_size": 128
|
| 311 |
},
|
| 312 |
"model.layers.21.mlp.gate": {
|
| 313 |
-
"bits":
|
| 314 |
-
"group_size": 128
|
| 315 |
},
|
| 316 |
"model.layers.21.self_attn.k_proj": {
|
| 317 |
"bits": 8,
|
|
@@ -330,8 +315,7 @@
|
|
| 330 |
"group_size": 128
|
| 331 |
},
|
| 332 |
"model.layers.22.mlp.gate": {
|
| 333 |
-
"bits":
|
| 334 |
-
"group_size": 128
|
| 335 |
},
|
| 336 |
"model.layers.22.self_attn.k_proj": {
|
| 337 |
"bits": 8,
|
|
@@ -350,8 +334,7 @@
|
|
| 350 |
"group_size": 128
|
| 351 |
},
|
| 352 |
"model.layers.23.mlp.gate": {
|
| 353 |
-
"bits":
|
| 354 |
-
"group_size": 128
|
| 355 |
},
|
| 356 |
"model.layers.23.self_attn.k_proj": {
|
| 357 |
"bits": 8,
|
|
@@ -370,8 +353,7 @@
|
|
| 370 |
"group_size": 128
|
| 371 |
},
|
| 372 |
"model.layers.24.mlp.gate": {
|
| 373 |
-
"bits":
|
| 374 |
-
"group_size": 128
|
| 375 |
},
|
| 376 |
"model.layers.24.self_attn.k_proj": {
|
| 377 |
"bits": 8,
|
|
@@ -390,8 +372,7 @@
|
|
| 390 |
"group_size": 128
|
| 391 |
},
|
| 392 |
"model.layers.25.mlp.gate": {
|
| 393 |
-
"bits":
|
| 394 |
-
"group_size": 128
|
| 395 |
},
|
| 396 |
"model.layers.25.self_attn.k_proj": {
|
| 397 |
"bits": 8,
|
|
@@ -410,8 +391,7 @@
|
|
| 410 |
"group_size": 128
|
| 411 |
},
|
| 412 |
"model.layers.26.mlp.gate": {
|
| 413 |
-
"bits":
|
| 414 |
-
"group_size": 128
|
| 415 |
},
|
| 416 |
"model.layers.26.self_attn.k_proj": {
|
| 417 |
"bits": 8,
|
|
@@ -430,8 +410,7 @@
|
|
| 430 |
"group_size": 128
|
| 431 |
},
|
| 432 |
"model.layers.27.mlp.gate": {
|
| 433 |
-
"bits":
|
| 434 |
-
"group_size": 128
|
| 435 |
},
|
| 436 |
"model.layers.27.self_attn.k_proj": {
|
| 437 |
"bits": 8,
|
|
@@ -450,8 +429,7 @@
|
|
| 450 |
"group_size": 128
|
| 451 |
},
|
| 452 |
"model.layers.28.mlp.gate": {
|
| 453 |
-
"bits":
|
| 454 |
-
"group_size": 128
|
| 455 |
},
|
| 456 |
"model.layers.28.self_attn.k_proj": {
|
| 457 |
"bits": 8,
|
|
@@ -470,8 +448,7 @@
|
|
| 470 |
"group_size": 128
|
| 471 |
},
|
| 472 |
"model.layers.29.mlp.gate": {
|
| 473 |
-
"bits":
|
| 474 |
-
"group_size": 128
|
| 475 |
},
|
| 476 |
"model.layers.29.self_attn.k_proj": {
|
| 477 |
"bits": 8,
|
|
@@ -490,8 +467,7 @@
|
|
| 490 |
"group_size": 128
|
| 491 |
},
|
| 492 |
"model.layers.3.mlp.gate": {
|
| 493 |
-
"bits":
|
| 494 |
-
"group_size": 128
|
| 495 |
},
|
| 496 |
"model.layers.3.self_attn.k_proj": {
|
| 497 |
"bits": 8,
|
|
@@ -510,8 +486,7 @@
|
|
| 510 |
"group_size": 128
|
| 511 |
},
|
| 512 |
"model.layers.30.mlp.gate": {
|
| 513 |
-
"bits":
|
| 514 |
-
"group_size": 128
|
| 515 |
},
|
| 516 |
"model.layers.30.self_attn.k_proj": {
|
| 517 |
"bits": 8,
|
|
@@ -530,8 +505,7 @@
|
|
| 530 |
"group_size": 128
|
| 531 |
},
|
| 532 |
"model.layers.31.mlp.gate": {
|
| 533 |
-
"bits":
|
| 534 |
-
"group_size": 128
|
| 535 |
},
|
| 536 |
"model.layers.31.self_attn.k_proj": {
|
| 537 |
"bits": 8,
|
|
@@ -550,8 +524,7 @@
|
|
| 550 |
"group_size": 128
|
| 551 |
},
|
| 552 |
"model.layers.32.mlp.gate": {
|
| 553 |
-
"bits":
|
| 554 |
-
"group_size": 128
|
| 555 |
},
|
| 556 |
"model.layers.32.self_attn.k_proj": {
|
| 557 |
"bits": 8,
|
|
@@ -570,8 +543,7 @@
|
|
| 570 |
"group_size": 128
|
| 571 |
},
|
| 572 |
"model.layers.33.mlp.gate": {
|
| 573 |
-
"bits":
|
| 574 |
-
"group_size": 128
|
| 575 |
},
|
| 576 |
"model.layers.33.self_attn.k_proj": {
|
| 577 |
"bits": 8,
|
|
@@ -590,8 +562,7 @@
|
|
| 590 |
"group_size": 128
|
| 591 |
},
|
| 592 |
"model.layers.34.mlp.gate": {
|
| 593 |
-
"bits":
|
| 594 |
-
"group_size": 128
|
| 595 |
},
|
| 596 |
"model.layers.34.self_attn.k_proj": {
|
| 597 |
"bits": 8,
|
|
@@ -610,8 +581,7 @@
|
|
| 610 |
"group_size": 128
|
| 611 |
},
|
| 612 |
"model.layers.35.mlp.gate": {
|
| 613 |
-
"bits":
|
| 614 |
-
"group_size": 128
|
| 615 |
},
|
| 616 |
"model.layers.35.self_attn.k_proj": {
|
| 617 |
"bits": 8,
|
|
@@ -630,8 +600,7 @@
|
|
| 630 |
"group_size": 128
|
| 631 |
},
|
| 632 |
"model.layers.36.mlp.gate": {
|
| 633 |
-
"bits":
|
| 634 |
-
"group_size": 128
|
| 635 |
},
|
| 636 |
"model.layers.36.self_attn.k_proj": {
|
| 637 |
"bits": 8,
|
|
@@ -650,8 +619,7 @@
|
|
| 650 |
"group_size": 128
|
| 651 |
},
|
| 652 |
"model.layers.37.mlp.gate": {
|
| 653 |
-
"bits":
|
| 654 |
-
"group_size": 128
|
| 655 |
},
|
| 656 |
"model.layers.37.self_attn.k_proj": {
|
| 657 |
"bits": 8,
|
|
@@ -670,8 +638,7 @@
|
|
| 670 |
"group_size": 128
|
| 671 |
},
|
| 672 |
"model.layers.38.mlp.gate": {
|
| 673 |
-
"bits":
|
| 674 |
-
"group_size": 128
|
| 675 |
},
|
| 676 |
"model.layers.38.self_attn.k_proj": {
|
| 677 |
"bits": 8,
|
|
@@ -690,8 +657,7 @@
|
|
| 690 |
"group_size": 128
|
| 691 |
},
|
| 692 |
"model.layers.39.mlp.gate": {
|
| 693 |
-
"bits":
|
| 694 |
-
"group_size": 128
|
| 695 |
},
|
| 696 |
"model.layers.39.self_attn.k_proj": {
|
| 697 |
"bits": 8,
|
|
@@ -710,8 +676,7 @@
|
|
| 710 |
"group_size": 128
|
| 711 |
},
|
| 712 |
"model.layers.4.mlp.gate": {
|
| 713 |
-
"bits":
|
| 714 |
-
"group_size": 128
|
| 715 |
},
|
| 716 |
"model.layers.4.self_attn.k_proj": {
|
| 717 |
"bits": 8,
|
|
@@ -730,8 +695,7 @@
|
|
| 730 |
"group_size": 128
|
| 731 |
},
|
| 732 |
"model.layers.40.mlp.gate": {
|
| 733 |
-
"bits":
|
| 734 |
-
"group_size": 128
|
| 735 |
},
|
| 736 |
"model.layers.40.self_attn.k_proj": {
|
| 737 |
"bits": 8,
|
|
@@ -750,8 +714,7 @@
|
|
| 750 |
"group_size": 128
|
| 751 |
},
|
| 752 |
"model.layers.41.mlp.gate": {
|
| 753 |
-
"bits":
|
| 754 |
-
"group_size": 128
|
| 755 |
},
|
| 756 |
"model.layers.41.self_attn.k_proj": {
|
| 757 |
"bits": 8,
|
|
@@ -770,8 +733,7 @@
|
|
| 770 |
"group_size": 128
|
| 771 |
},
|
| 772 |
"model.layers.42.mlp.gate": {
|
| 773 |
-
"bits":
|
| 774 |
-
"group_size": 128
|
| 775 |
},
|
| 776 |
"model.layers.42.self_attn.k_proj": {
|
| 777 |
"bits": 8,
|
|
@@ -790,8 +752,7 @@
|
|
| 790 |
"group_size": 128
|
| 791 |
},
|
| 792 |
"model.layers.43.mlp.gate": {
|
| 793 |
-
"bits":
|
| 794 |
-
"group_size": 128
|
| 795 |
},
|
| 796 |
"model.layers.43.self_attn.k_proj": {
|
| 797 |
"bits": 8,
|
|
@@ -810,8 +771,7 @@
|
|
| 810 |
"group_size": 128
|
| 811 |
},
|
| 812 |
"model.layers.44.mlp.gate": {
|
| 813 |
-
"bits":
|
| 814 |
-
"group_size": 128
|
| 815 |
},
|
| 816 |
"model.layers.44.self_attn.k_proj": {
|
| 817 |
"bits": 8,
|
|
@@ -830,8 +790,7 @@
|
|
| 830 |
"group_size": 128
|
| 831 |
},
|
| 832 |
"model.layers.45.mlp.gate": {
|
| 833 |
-
"bits":
|
| 834 |
-
"group_size": 128
|
| 835 |
},
|
| 836 |
"model.layers.45.self_attn.k_proj": {
|
| 837 |
"bits": 8,
|
|
@@ -850,8 +809,7 @@
|
|
| 850 |
"group_size": 128
|
| 851 |
},
|
| 852 |
"model.layers.46.mlp.gate": {
|
| 853 |
-
"bits":
|
| 854 |
-
"group_size": 128
|
| 855 |
},
|
| 856 |
"model.layers.46.self_attn.k_proj": {
|
| 857 |
"bits": 8,
|
|
@@ -870,8 +828,7 @@
|
|
| 870 |
"group_size": 128
|
| 871 |
},
|
| 872 |
"model.layers.47.mlp.gate": {
|
| 873 |
-
"bits":
|
| 874 |
-
"group_size": 128
|
| 875 |
},
|
| 876 |
"model.layers.47.self_attn.k_proj": {
|
| 877 |
"bits": 8,
|
|
@@ -890,8 +847,7 @@
|
|
| 890 |
"group_size": 128
|
| 891 |
},
|
| 892 |
"model.layers.48.mlp.gate": {
|
| 893 |
-
"bits":
|
| 894 |
-
"group_size": 128
|
| 895 |
},
|
| 896 |
"model.layers.48.self_attn.k_proj": {
|
| 897 |
"bits": 8,
|
|
@@ -910,8 +866,7 @@
|
|
| 910 |
"group_size": 128
|
| 911 |
},
|
| 912 |
"model.layers.49.mlp.gate": {
|
| 913 |
-
"bits":
|
| 914 |
-
"group_size": 128
|
| 915 |
},
|
| 916 |
"model.layers.49.self_attn.k_proj": {
|
| 917 |
"bits": 8,
|
|
@@ -930,8 +885,7 @@
|
|
| 930 |
"group_size": 128
|
| 931 |
},
|
| 932 |
"model.layers.5.mlp.gate": {
|
| 933 |
-
"bits":
|
| 934 |
-
"group_size": 128
|
| 935 |
},
|
| 936 |
"model.layers.5.self_attn.k_proj": {
|
| 937 |
"bits": 8,
|
|
@@ -950,8 +904,7 @@
|
|
| 950 |
"group_size": 128
|
| 951 |
},
|
| 952 |
"model.layers.50.mlp.gate": {
|
| 953 |
-
"bits":
|
| 954 |
-
"group_size": 128
|
| 955 |
},
|
| 956 |
"model.layers.50.self_attn.k_proj": {
|
| 957 |
"bits": 8,
|
|
@@ -970,8 +923,7 @@
|
|
| 970 |
"group_size": 128
|
| 971 |
},
|
| 972 |
"model.layers.51.mlp.gate": {
|
| 973 |
-
"bits":
|
| 974 |
-
"group_size": 128
|
| 975 |
},
|
| 976 |
"model.layers.51.self_attn.k_proj": {
|
| 977 |
"bits": 8,
|
|
@@ -990,8 +942,7 @@
|
|
| 990 |
"group_size": 128
|
| 991 |
},
|
| 992 |
"model.layers.52.mlp.gate": {
|
| 993 |
-
"bits":
|
| 994 |
-
"group_size": 128
|
| 995 |
},
|
| 996 |
"model.layers.52.self_attn.k_proj": {
|
| 997 |
"bits": 8,
|
|
@@ -1010,8 +961,7 @@
|
|
| 1010 |
"group_size": 128
|
| 1011 |
},
|
| 1012 |
"model.layers.53.mlp.gate": {
|
| 1013 |
-
"bits":
|
| 1014 |
-
"group_size": 128
|
| 1015 |
},
|
| 1016 |
"model.layers.53.self_attn.k_proj": {
|
| 1017 |
"bits": 8,
|
|
@@ -1030,8 +980,7 @@
|
|
| 1030 |
"group_size": 128
|
| 1031 |
},
|
| 1032 |
"model.layers.54.mlp.gate": {
|
| 1033 |
-
"bits":
|
| 1034 |
-
"group_size": 128
|
| 1035 |
},
|
| 1036 |
"model.layers.54.self_attn.k_proj": {
|
| 1037 |
"bits": 8,
|
|
@@ -1050,8 +999,7 @@
|
|
| 1050 |
"group_size": 128
|
| 1051 |
},
|
| 1052 |
"model.layers.55.mlp.gate": {
|
| 1053 |
-
"bits":
|
| 1054 |
-
"group_size": 128
|
| 1055 |
},
|
| 1056 |
"model.layers.55.self_attn.k_proj": {
|
| 1057 |
"bits": 8,
|
|
@@ -1070,8 +1018,7 @@
|
|
| 1070 |
"group_size": 128
|
| 1071 |
},
|
| 1072 |
"model.layers.56.mlp.gate": {
|
| 1073 |
-
"bits":
|
| 1074 |
-
"group_size": 128
|
| 1075 |
},
|
| 1076 |
"model.layers.56.self_attn.k_proj": {
|
| 1077 |
"bits": 8,
|
|
@@ -1090,8 +1037,7 @@
|
|
| 1090 |
"group_size": 128
|
| 1091 |
},
|
| 1092 |
"model.layers.57.mlp.gate": {
|
| 1093 |
-
"bits":
|
| 1094 |
-
"group_size": 128
|
| 1095 |
},
|
| 1096 |
"model.layers.57.self_attn.k_proj": {
|
| 1097 |
"bits": 8,
|
|
@@ -1110,8 +1056,7 @@
|
|
| 1110 |
"group_size": 128
|
| 1111 |
},
|
| 1112 |
"model.layers.58.mlp.gate": {
|
| 1113 |
-
"bits":
|
| 1114 |
-
"group_size": 128
|
| 1115 |
},
|
| 1116 |
"model.layers.58.self_attn.k_proj": {
|
| 1117 |
"bits": 8,
|
|
@@ -1130,8 +1075,7 @@
|
|
| 1130 |
"group_size": 128
|
| 1131 |
},
|
| 1132 |
"model.layers.59.mlp.gate": {
|
| 1133 |
-
"bits":
|
| 1134 |
-
"group_size": 128
|
| 1135 |
},
|
| 1136 |
"model.layers.59.self_attn.k_proj": {
|
| 1137 |
"bits": 8,
|
|
@@ -1150,8 +1094,7 @@
|
|
| 1150 |
"group_size": 128
|
| 1151 |
},
|
| 1152 |
"model.layers.6.mlp.gate": {
|
| 1153 |
-
"bits":
|
| 1154 |
-
"group_size": 128
|
| 1155 |
},
|
| 1156 |
"model.layers.6.self_attn.k_proj": {
|
| 1157 |
"bits": 8,
|
|
@@ -1170,8 +1113,7 @@
|
|
| 1170 |
"group_size": 128
|
| 1171 |
},
|
| 1172 |
"model.layers.60.mlp.gate": {
|
| 1173 |
-
"bits":
|
| 1174 |
-
"group_size": 128
|
| 1175 |
},
|
| 1176 |
"model.layers.60.self_attn.k_proj": {
|
| 1177 |
"bits": 8,
|
|
@@ -1190,8 +1132,7 @@
|
|
| 1190 |
"group_size": 128
|
| 1191 |
},
|
| 1192 |
"model.layers.61.mlp.gate": {
|
| 1193 |
-
"bits":
|
| 1194 |
-
"group_size": 128
|
| 1195 |
},
|
| 1196 |
"model.layers.61.self_attn.k_proj": {
|
| 1197 |
"bits": 8,
|
|
@@ -1210,8 +1151,7 @@
|
|
| 1210 |
"group_size": 128
|
| 1211 |
},
|
| 1212 |
"model.layers.7.mlp.gate": {
|
| 1213 |
-
"bits":
|
| 1214 |
-
"group_size": 128
|
| 1215 |
},
|
| 1216 |
"model.layers.7.self_attn.k_proj": {
|
| 1217 |
"bits": 8,
|
|
@@ -1230,8 +1170,7 @@
|
|
| 1230 |
"group_size": 128
|
| 1231 |
},
|
| 1232 |
"model.layers.8.mlp.gate": {
|
| 1233 |
-
"bits":
|
| 1234 |
-
"group_size": 128
|
| 1235 |
},
|
| 1236 |
"model.layers.8.self_attn.k_proj": {
|
| 1237 |
"bits": 8,
|
|
@@ -1250,8 +1189,7 @@
|
|
| 1250 |
"group_size": 128
|
| 1251 |
},
|
| 1252 |
"model.layers.9.mlp.gate": {
|
| 1253 |
-
"bits":
|
| 1254 |
-
"group_size": 128
|
| 1255 |
},
|
| 1256 |
"model.layers.9.self_attn.k_proj": {
|
| 1257 |
"bits": 8,
|
|
@@ -1268,6 +1206,254 @@
|
|
| 1268 |
"model.layers.9.self_attn.v_proj": {
|
| 1269 |
"bits": 8,
|
| 1270 |
"group_size": 128
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1271 |
}
|
| 1272 |
},
|
| 1273 |
"group_size": 64,
|
|
@@ -1289,4 +1475,4 @@
|
|
| 1289 |
"use_qk_norm": true,
|
| 1290 |
"use_sliding_window": false,
|
| 1291 |
"vocab_size": 151936
|
| 1292 |
-
}
|
|
|
|
| 25 |
"output_router_logits": false,
|
| 26 |
"qkv_bias": false,
|
| 27 |
"quantization_config": {
|
| 28 |
+
"autoround_version": "0.6.1.dev",
|
| 29 |
"bits": 4,
|
| 30 |
"data_type": "int",
|
| 31 |
"extra_config": {
|
| 32 |
"model.layers.0.mlp.gate": {
|
| 33 |
+
"bits": 16
|
|
|
|
| 34 |
},
|
| 35 |
"model.layers.0.self_attn.k_proj": {
|
| 36 |
"bits": 8,
|
|
|
|
| 49 |
"group_size": 128
|
| 50 |
},
|
| 51 |
"model.layers.1.mlp.gate": {
|
| 52 |
+
"bits": 16
|
|
|
|
| 53 |
},
|
| 54 |
"model.layers.1.self_attn.k_proj": {
|
| 55 |
"bits": 8,
|
|
|
|
| 68 |
"group_size": 128
|
| 69 |
},
|
| 70 |
"model.layers.10.mlp.gate": {
|
| 71 |
+
"bits": 16
|
|
|
|
| 72 |
},
|
| 73 |
"model.layers.10.self_attn.k_proj": {
|
| 74 |
"bits": 8,
|
|
|
|
| 87 |
"group_size": 128
|
| 88 |
},
|
| 89 |
"model.layers.11.mlp.gate": {
|
| 90 |
+
"bits": 16
|
|
|
|
| 91 |
},
|
| 92 |
"model.layers.11.self_attn.k_proj": {
|
| 93 |
"bits": 8,
|
|
|
|
| 106 |
"group_size": 128
|
| 107 |
},
|
| 108 |
"model.layers.12.mlp.gate": {
|
| 109 |
+
"bits": 16
|
|
|
|
| 110 |
},
|
| 111 |
"model.layers.12.self_attn.k_proj": {
|
| 112 |
"bits": 8,
|
|
|
|
| 125 |
"group_size": 128
|
| 126 |
},
|
| 127 |
"model.layers.13.mlp.gate": {
|
| 128 |
+
"bits": 16
|
|
|
|
| 129 |
},
|
| 130 |
"model.layers.13.self_attn.k_proj": {
|
| 131 |
"bits": 8,
|
|
|
|
| 144 |
"group_size": 128
|
| 145 |
},
|
| 146 |
"model.layers.14.mlp.gate": {
|
| 147 |
+
"bits": 16
|
|
|
|
| 148 |
},
|
| 149 |
"model.layers.14.self_attn.k_proj": {
|
| 150 |
"bits": 8,
|
|
|
|
| 163 |
"group_size": 128
|
| 164 |
},
|
| 165 |
"model.layers.15.mlp.gate": {
|
| 166 |
+
"bits": 16
|
|
|
|
| 167 |
},
|
| 168 |
"model.layers.15.self_attn.k_proj": {
|
| 169 |
"bits": 8,
|
|
|
|
| 182 |
"group_size": 128
|
| 183 |
},
|
| 184 |
"model.layers.16.mlp.gate": {
|
| 185 |
+
"bits": 16
|
|
|
|
| 186 |
},
|
| 187 |
"model.layers.16.self_attn.k_proj": {
|
| 188 |
"bits": 8,
|
|
|
|
| 201 |
"group_size": 128
|
| 202 |
},
|
| 203 |
"model.layers.17.mlp.gate": {
|
| 204 |
+
"bits": 16
|
|
|
|
| 205 |
},
|
| 206 |
"model.layers.17.self_attn.k_proj": {
|
| 207 |
"bits": 8,
|
|
|
|
| 220 |
"group_size": 128
|
| 221 |
},
|
| 222 |
"model.layers.18.mlp.gate": {
|
| 223 |
+
"bits": 16
|
|
|
|
| 224 |
},
|
| 225 |
"model.layers.18.self_attn.k_proj": {
|
| 226 |
"bits": 8,
|
|
|
|
| 239 |
"group_size": 128
|
| 240 |
},
|
| 241 |
"model.layers.19.mlp.gate": {
|
| 242 |
+
"bits": 16
|
|
|
|
| 243 |
},
|
| 244 |
"model.layers.19.self_attn.k_proj": {
|
| 245 |
"bits": 8,
|
|
|
|
| 258 |
"group_size": 128
|
| 259 |
},
|
| 260 |
"model.layers.2.mlp.gate": {
|
| 261 |
+
"bits": 16
|
|
|
|
| 262 |
},
|
| 263 |
"model.layers.2.self_attn.k_proj": {
|
| 264 |
"bits": 8,
|
|
|
|
| 277 |
"group_size": 128
|
| 278 |
},
|
| 279 |
"model.layers.20.mlp.gate": {
|
| 280 |
+
"bits": 16
|
|
|
|
| 281 |
},
|
| 282 |
"model.layers.20.self_attn.k_proj": {
|
| 283 |
"bits": 8,
|
|
|
|
| 296 |
"group_size": 128
|
| 297 |
},
|
| 298 |
"model.layers.21.mlp.gate": {
|
| 299 |
+
"bits": 16
|
|
|
|
| 300 |
},
|
| 301 |
"model.layers.21.self_attn.k_proj": {
|
| 302 |
"bits": 8,
|
|
|
|
| 315 |
"group_size": 128
|
| 316 |
},
|
| 317 |
"model.layers.22.mlp.gate": {
|
| 318 |
+
"bits": 16
|
|
|
|
| 319 |
},
|
| 320 |
"model.layers.22.self_attn.k_proj": {
|
| 321 |
"bits": 8,
|
|
|
|
| 334 |
"group_size": 128
|
| 335 |
},
|
| 336 |
"model.layers.23.mlp.gate": {
|
| 337 |
+
"bits": 16
|
|
|
|
| 338 |
},
|
| 339 |
"model.layers.23.self_attn.k_proj": {
|
| 340 |
"bits": 8,
|
|
|
|
| 353 |
"group_size": 128
|
| 354 |
},
|
| 355 |
"model.layers.24.mlp.gate": {
|
| 356 |
+
"bits": 16
|
|
|
|
| 357 |
},
|
| 358 |
"model.layers.24.self_attn.k_proj": {
|
| 359 |
"bits": 8,
|
|
|
|
| 372 |
"group_size": 128
|
| 373 |
},
|
| 374 |
"model.layers.25.mlp.gate": {
|
| 375 |
+
"bits": 16
|
|
|
|
| 376 |
},
|
| 377 |
"model.layers.25.self_attn.k_proj": {
|
| 378 |
"bits": 8,
|
|
|
|
| 391 |
"group_size": 128
|
| 392 |
},
|
| 393 |
"model.layers.26.mlp.gate": {
|
| 394 |
+
"bits": 16
|
|
|
|
| 395 |
},
|
| 396 |
"model.layers.26.self_attn.k_proj": {
|
| 397 |
"bits": 8,
|
|
|
|
| 410 |
"group_size": 128
|
| 411 |
},
|
| 412 |
"model.layers.27.mlp.gate": {
|
| 413 |
+
"bits": 16
|
|
|
|
| 414 |
},
|
| 415 |
"model.layers.27.self_attn.k_proj": {
|
| 416 |
"bits": 8,
|
|
|
|
| 429 |
"group_size": 128
|
| 430 |
},
|
| 431 |
"model.layers.28.mlp.gate": {
|
| 432 |
+
"bits": 16
|
|
|
|
| 433 |
},
|
| 434 |
"model.layers.28.self_attn.k_proj": {
|
| 435 |
"bits": 8,
|
|
|
|
| 448 |
"group_size": 128
|
| 449 |
},
|
| 450 |
"model.layers.29.mlp.gate": {
|
| 451 |
+
"bits": 16
|
|
|
|
| 452 |
},
|
| 453 |
"model.layers.29.self_attn.k_proj": {
|
| 454 |
"bits": 8,
|
|
|
|
| 467 |
"group_size": 128
|
| 468 |
},
|
| 469 |
"model.layers.3.mlp.gate": {
|
| 470 |
+
"bits": 16
|
|
|
|
| 471 |
},
|
| 472 |
"model.layers.3.self_attn.k_proj": {
|
| 473 |
"bits": 8,
|
|
|
|
| 486 |
"group_size": 128
|
| 487 |
},
|
| 488 |
"model.layers.30.mlp.gate": {
|
| 489 |
+
"bits": 16
|
|
|
|
| 490 |
},
|
| 491 |
"model.layers.30.self_attn.k_proj": {
|
| 492 |
"bits": 8,
|
|
|
|
| 505 |
"group_size": 128
|
| 506 |
},
|
| 507 |
"model.layers.31.mlp.gate": {
|
| 508 |
+
"bits": 16
|
|
|
|
| 509 |
},
|
| 510 |
"model.layers.31.self_attn.k_proj": {
|
| 511 |
"bits": 8,
|
|
|
|
| 524 |
"group_size": 128
|
| 525 |
},
|
| 526 |
"model.layers.32.mlp.gate": {
|
| 527 |
+
"bits": 16
|
|
|
|
| 528 |
},
|
| 529 |
"model.layers.32.self_attn.k_proj": {
|
| 530 |
"bits": 8,
|
|
|
|
| 543 |
"group_size": 128
|
| 544 |
},
|
| 545 |
"model.layers.33.mlp.gate": {
|
| 546 |
+
"bits": 16
|
|
|
|
| 547 |
},
|
| 548 |
"model.layers.33.self_attn.k_proj": {
|
| 549 |
"bits": 8,
|
|
|
|
| 562 |
"group_size": 128
|
| 563 |
},
|
| 564 |
"model.layers.34.mlp.gate": {
|
| 565 |
+
"bits": 16
|
|
|
|
| 566 |
},
|
| 567 |
"model.layers.34.self_attn.k_proj": {
|
| 568 |
"bits": 8,
|
|
|
|
| 581 |
"group_size": 128
|
| 582 |
},
|
| 583 |
"model.layers.35.mlp.gate": {
|
| 584 |
+
"bits": 16
|
|
|
|
| 585 |
},
|
| 586 |
"model.layers.35.self_attn.k_proj": {
|
| 587 |
"bits": 8,
|
|
|
|
| 600 |
"group_size": 128
|
| 601 |
},
|
| 602 |
"model.layers.36.mlp.gate": {
|
| 603 |
+
"bits": 16
|
|
|
|
| 604 |
},
|
| 605 |
"model.layers.36.self_attn.k_proj": {
|
| 606 |
"bits": 8,
|
|
|
|
| 619 |
"group_size": 128
|
| 620 |
},
|
| 621 |
"model.layers.37.mlp.gate": {
|
| 622 |
+
"bits": 16
|
|
|
|
| 623 |
},
|
| 624 |
"model.layers.37.self_attn.k_proj": {
|
| 625 |
"bits": 8,
|
|
|
|
| 638 |
"group_size": 128
|
| 639 |
},
|
| 640 |
"model.layers.38.mlp.gate": {
|
| 641 |
+
"bits": 16
|
|
|
|
| 642 |
},
|
| 643 |
"model.layers.38.self_attn.k_proj": {
|
| 644 |
"bits": 8,
|
|
|
|
| 657 |
"group_size": 128
|
| 658 |
},
|
| 659 |
"model.layers.39.mlp.gate": {
|
| 660 |
+
"bits": 16
|
|
|
|
| 661 |
},
|
| 662 |
"model.layers.39.self_attn.k_proj": {
|
| 663 |
"bits": 8,
|
|
|
|
| 676 |
"group_size": 128
|
| 677 |
},
|
| 678 |
"model.layers.4.mlp.gate": {
|
| 679 |
+
"bits": 16
|
|
|
|
| 680 |
},
|
| 681 |
"model.layers.4.self_attn.k_proj": {
|
| 682 |
"bits": 8,
|
|
|
|
| 695 |
"group_size": 128
|
| 696 |
},
|
| 697 |
"model.layers.40.mlp.gate": {
|
| 698 |
+
"bits": 16
|
|
|
|
| 699 |
},
|
| 700 |
"model.layers.40.self_attn.k_proj": {
|
| 701 |
"bits": 8,
|
|
|
|
| 714 |
"group_size": 128
|
| 715 |
},
|
| 716 |
"model.layers.41.mlp.gate": {
|
| 717 |
+
"bits": 16
|
|
|
|
| 718 |
},
|
| 719 |
"model.layers.41.self_attn.k_proj": {
|
| 720 |
"bits": 8,
|
|
|
|
| 733 |
"group_size": 128
|
| 734 |
},
|
| 735 |
"model.layers.42.mlp.gate": {
|
| 736 |
+
"bits": 16
|
|
|
|
| 737 |
},
|
| 738 |
"model.layers.42.self_attn.k_proj": {
|
| 739 |
"bits": 8,
|
|
|
|
| 752 |
"group_size": 128
|
| 753 |
},
|
| 754 |
"model.layers.43.mlp.gate": {
|
| 755 |
+
"bits": 16
|
|
|
|
| 756 |
},
|
| 757 |
"model.layers.43.self_attn.k_proj": {
|
| 758 |
"bits": 8,
|
|
|
|
| 771 |
"group_size": 128
|
| 772 |
},
|
| 773 |
"model.layers.44.mlp.gate": {
|
| 774 |
+
"bits": 16
|
|
|
|
| 775 |
},
|
| 776 |
"model.layers.44.self_attn.k_proj": {
|
| 777 |
"bits": 8,
|
|
|
|
| 790 |
"group_size": 128
|
| 791 |
},
|
| 792 |
"model.layers.45.mlp.gate": {
|
| 793 |
+
"bits": 16
|
|
|
|
| 794 |
},
|
| 795 |
"model.layers.45.self_attn.k_proj": {
|
| 796 |
"bits": 8,
|
|
|
|
| 809 |
"group_size": 128
|
| 810 |
},
|
| 811 |
"model.layers.46.mlp.gate": {
|
| 812 |
+
"bits": 16
|
|
|
|
| 813 |
},
|
| 814 |
"model.layers.46.self_attn.k_proj": {
|
| 815 |
"bits": 8,
|
|
|
|
| 828 |
"group_size": 128
|
| 829 |
},
|
| 830 |
"model.layers.47.mlp.gate": {
|
| 831 |
+
"bits": 16
|
|
|
|
| 832 |
},
|
| 833 |
"model.layers.47.self_attn.k_proj": {
|
| 834 |
"bits": 8,
|
|
|
|
| 847 |
"group_size": 128
|
| 848 |
},
|
| 849 |
"model.layers.48.mlp.gate": {
|
| 850 |
+
"bits": 16
|
|
|
|
| 851 |
},
|
| 852 |
"model.layers.48.self_attn.k_proj": {
|
| 853 |
"bits": 8,
|
|
|
|
| 866 |
"group_size": 128
|
| 867 |
},
|
| 868 |
"model.layers.49.mlp.gate": {
|
| 869 |
+
"bits": 16
|
|
|
|
| 870 |
},
|
| 871 |
"model.layers.49.self_attn.k_proj": {
|
| 872 |
"bits": 8,
|
|
|
|
| 885 |
"group_size": 128
|
| 886 |
},
|
| 887 |
"model.layers.5.mlp.gate": {
|
| 888 |
+
"bits": 16
|
|
|
|
| 889 |
},
|
| 890 |
"model.layers.5.self_attn.k_proj": {
|
| 891 |
"bits": 8,
|
|
|
|
| 904 |
"group_size": 128
|
| 905 |
},
|
| 906 |
"model.layers.50.mlp.gate": {
|
| 907 |
+
"bits": 16
|
|
|
|
| 908 |
},
|
| 909 |
"model.layers.50.self_attn.k_proj": {
|
| 910 |
"bits": 8,
|
|
|
|
| 923 |
"group_size": 128
|
| 924 |
},
|
| 925 |
"model.layers.51.mlp.gate": {
|
| 926 |
+
"bits": 16
|
|
|
|
| 927 |
},
|
| 928 |
"model.layers.51.self_attn.k_proj": {
|
| 929 |
"bits": 8,
|
|
|
|
| 942 |
"group_size": 128
|
| 943 |
},
|
| 944 |
"model.layers.52.mlp.gate": {
|
| 945 |
+
"bits": 16
|
|
|
|
| 946 |
},
|
| 947 |
"model.layers.52.self_attn.k_proj": {
|
| 948 |
"bits": 8,
|
|
|
|
| 961 |
"group_size": 128
|
| 962 |
},
|
| 963 |
"model.layers.53.mlp.gate": {
|
| 964 |
+
"bits": 16
|
|
|
|
| 965 |
},
|
| 966 |
"model.layers.53.self_attn.k_proj": {
|
| 967 |
"bits": 8,
|
|
|
|
| 980 |
"group_size": 128
|
| 981 |
},
|
| 982 |
"model.layers.54.mlp.gate": {
|
| 983 |
+
"bits": 16
|
|
|
|
| 984 |
},
|
| 985 |
"model.layers.54.self_attn.k_proj": {
|
| 986 |
"bits": 8,
|
|
|
|
| 999 |
"group_size": 128
|
| 1000 |
},
|
| 1001 |
"model.layers.55.mlp.gate": {
|
| 1002 |
+
"bits": 16
|
|
|
|
| 1003 |
},
|
| 1004 |
"model.layers.55.self_attn.k_proj": {
|
| 1005 |
"bits": 8,
|
|
|
|
| 1018 |
"group_size": 128
|
| 1019 |
},
|
| 1020 |
"model.layers.56.mlp.gate": {
|
| 1021 |
+
"bits": 16
|
|
|
|
| 1022 |
},
|
| 1023 |
"model.layers.56.self_attn.k_proj": {
|
| 1024 |
"bits": 8,
|
|
|
|
| 1037 |
"group_size": 128
|
| 1038 |
},
|
| 1039 |
"model.layers.57.mlp.gate": {
|
| 1040 |
+
"bits": 16
|
|
|
|
| 1041 |
},
|
| 1042 |
"model.layers.57.self_attn.k_proj": {
|
| 1043 |
"bits": 8,
|
|
|
|
| 1056 |
"group_size": 128
|
| 1057 |
},
|
| 1058 |
"model.layers.58.mlp.gate": {
|
| 1059 |
+
"bits": 16
|
|
|
|
| 1060 |
},
|
| 1061 |
"model.layers.58.self_attn.k_proj": {
|
| 1062 |
"bits": 8,
|
|
|
|
| 1075 |
"group_size": 128
|
| 1076 |
},
|
| 1077 |
"model.layers.59.mlp.gate": {
|
| 1078 |
+
"bits": 16
|
|
|
|
| 1079 |
},
|
| 1080 |
"model.layers.59.self_attn.k_proj": {
|
| 1081 |
"bits": 8,
|
|
|
|
| 1094 |
"group_size": 128
|
| 1095 |
},
|
| 1096 |
"model.layers.6.mlp.gate": {
|
| 1097 |
+
"bits": 16
|
|
|
|
| 1098 |
},
|
| 1099 |
"model.layers.6.self_attn.k_proj": {
|
| 1100 |
"bits": 8,
|
|
|
|
| 1113 |
"group_size": 128
|
| 1114 |
},
|
| 1115 |
"model.layers.60.mlp.gate": {
|
| 1116 |
+
"bits": 16
|
|
|
|
| 1117 |
},
|
| 1118 |
"model.layers.60.self_attn.k_proj": {
|
| 1119 |
"bits": 8,
|
|
|
|
| 1132 |
"group_size": 128
|
| 1133 |
},
|
| 1134 |
"model.layers.61.mlp.gate": {
|
| 1135 |
+
"bits": 16
|
|
|
|
| 1136 |
},
|
| 1137 |
"model.layers.61.self_attn.k_proj": {
|
| 1138 |
"bits": 8,
|
|
|
|
| 1151 |
"group_size": 128
|
| 1152 |
},
|
| 1153 |
"model.layers.7.mlp.gate": {
|
| 1154 |
+
"bits": 16
|
|
|
|
| 1155 |
},
|
| 1156 |
"model.layers.7.self_attn.k_proj": {
|
| 1157 |
"bits": 8,
|
|
|
|
| 1170 |
"group_size": 128
|
| 1171 |
},
|
| 1172 |
"model.layers.8.mlp.gate": {
|
| 1173 |
+
"bits": 16
|
|
|
|
| 1174 |
},
|
| 1175 |
"model.layers.8.self_attn.k_proj": {
|
| 1176 |
"bits": 8,
|
|
|
|
| 1189 |
"group_size": 128
|
| 1190 |
},
|
| 1191 |
"model.layers.9.mlp.gate": {
|
| 1192 |
+
"bits": 16
|
|
|
|
| 1193 |
},
|
| 1194 |
"model.layers.9.self_attn.k_proj": {
|
| 1195 |
"bits": 8,
|
|
|
|
| 1206 |
"model.layers.9.self_attn.v_proj": {
|
| 1207 |
"bits": 8,
|
| 1208 |
"group_size": 128
|
| 1209 |
+
},
|
| 1210 |
+
"model.layers.0.self_attn.qkv_proj": {
|
| 1211 |
+
"bits": 8,
|
| 1212 |
+
"group_size": 128
|
| 1213 |
+
},
|
| 1214 |
+
"model.layers.1.self_attn.qkv_proj": {
|
| 1215 |
+
"bits": 8,
|
| 1216 |
+
"group_size": 128
|
| 1217 |
+
},
|
| 1218 |
+
"model.layers.2.self_attn.qkv_proj": {
|
| 1219 |
+
"bits": 8,
|
| 1220 |
+
"group_size": 128
|
| 1221 |
+
},
|
| 1222 |
+
"model.layers.3.self_attn.qkv_proj": {
|
| 1223 |
+
"bits": 8,
|
| 1224 |
+
"group_size": 128
|
| 1225 |
+
},
|
| 1226 |
+
"model.layers.4.self_attn.qkv_proj": {
|
| 1227 |
+
"bits": 8,
|
| 1228 |
+
"group_size": 128
|
| 1229 |
+
},
|
| 1230 |
+
"model.layers.5.self_attn.qkv_proj": {
|
| 1231 |
+
"bits": 8,
|
| 1232 |
+
"group_size": 128
|
| 1233 |
+
},
|
| 1234 |
+
"model.layers.6.self_attn.qkv_proj": {
|
| 1235 |
+
"bits": 8,
|
| 1236 |
+
"group_size": 128
|
| 1237 |
+
},
|
| 1238 |
+
"model.layers.7.self_attn.qkv_proj": {
|
| 1239 |
+
"bits": 8,
|
| 1240 |
+
"group_size": 128
|
| 1241 |
+
},
|
| 1242 |
+
"model.layers.8.self_attn.qkv_proj": {
|
| 1243 |
+
"bits": 8,
|
| 1244 |
+
"group_size": 128
|
| 1245 |
+
},
|
| 1246 |
+
"model.layers.9.self_attn.qkv_proj": {
|
| 1247 |
+
"bits": 8,
|
| 1248 |
+
"group_size": 128
|
| 1249 |
+
},
|
| 1250 |
+
"model.layers.10.self_attn.qkv_proj": {
|
| 1251 |
+
"bits": 8,
|
| 1252 |
+
"group_size": 128
|
| 1253 |
+
},
|
| 1254 |
+
"model.layers.11.self_attn.qkv_proj": {
|
| 1255 |
+
"bits": 8,
|
| 1256 |
+
"group_size": 128
|
| 1257 |
+
},
|
| 1258 |
+
"model.layers.12.self_attn.qkv_proj": {
|
| 1259 |
+
"bits": 8,
|
| 1260 |
+
"group_size": 128
|
| 1261 |
+
},
|
| 1262 |
+
"model.layers.13.self_attn.qkv_proj": {
|
| 1263 |
+
"bits": 8,
|
| 1264 |
+
"group_size": 128
|
| 1265 |
+
},
|
| 1266 |
+
"model.layers.14.self_attn.qkv_proj": {
|
| 1267 |
+
"bits": 8,
|
| 1268 |
+
"group_size": 128
|
| 1269 |
+
},
|
| 1270 |
+
"model.layers.15.self_attn.qkv_proj": {
|
| 1271 |
+
"bits": 8,
|
| 1272 |
+
"group_size": 128
|
| 1273 |
+
},
|
| 1274 |
+
"model.layers.16.self_attn.qkv_proj": {
|
| 1275 |
+
"bits": 8,
|
| 1276 |
+
"group_size": 128
|
| 1277 |
+
},
|
| 1278 |
+
"model.layers.17.self_attn.qkv_proj": {
|
| 1279 |
+
"bits": 8,
|
| 1280 |
+
"group_size": 128
|
| 1281 |
+
},
|
| 1282 |
+
"model.layers.18.self_attn.qkv_proj": {
|
| 1283 |
+
"bits": 8,
|
| 1284 |
+
"group_size": 128
|
| 1285 |
+
},
|
| 1286 |
+
"model.layers.19.self_attn.qkv_proj": {
|
| 1287 |
+
"bits": 8,
|
| 1288 |
+
"group_size": 128
|
| 1289 |
+
},
|
| 1290 |
+
"model.layers.20.self_attn.qkv_proj": {
|
| 1291 |
+
"bits": 8,
|
| 1292 |
+
"group_size": 128
|
| 1293 |
+
},
|
| 1294 |
+
"model.layers.21.self_attn.qkv_proj": {
|
| 1295 |
+
"bits": 8,
|
| 1296 |
+
"group_size": 128
|
| 1297 |
+
},
|
| 1298 |
+
"model.layers.22.self_attn.qkv_proj": {
|
| 1299 |
+
"bits": 8,
|
| 1300 |
+
"group_size": 128
|
| 1301 |
+
},
|
| 1302 |
+
"model.layers.23.self_attn.qkv_proj": {
|
| 1303 |
+
"bits": 8,
|
| 1304 |
+
"group_size": 128
|
| 1305 |
+
},
|
| 1306 |
+
"model.layers.24.self_attn.qkv_proj": {
|
| 1307 |
+
"bits": 8,
|
| 1308 |
+
"group_size": 128
|
| 1309 |
+
},
|
| 1310 |
+
"model.layers.25.self_attn.qkv_proj": {
|
| 1311 |
+
"bits": 8,
|
| 1312 |
+
"group_size": 128
|
| 1313 |
+
},
|
| 1314 |
+
"model.layers.26.self_attn.qkv_proj": {
|
| 1315 |
+
"bits": 8,
|
| 1316 |
+
"group_size": 128
|
| 1317 |
+
},
|
| 1318 |
+
"model.layers.27.self_attn.qkv_proj": {
|
| 1319 |
+
"bits": 8,
|
| 1320 |
+
"group_size": 128
|
| 1321 |
+
},
|
| 1322 |
+
"model.layers.28.self_attn.qkv_proj": {
|
| 1323 |
+
"bits": 8,
|
| 1324 |
+
"group_size": 128
|
| 1325 |
+
},
|
| 1326 |
+
"model.layers.29.self_attn.qkv_proj": {
|
| 1327 |
+
"bits": 8,
|
| 1328 |
+
"group_size": 128
|
| 1329 |
+
},
|
| 1330 |
+
"model.layers.30.self_attn.qkv_proj": {
|
| 1331 |
+
"bits": 8,
|
| 1332 |
+
"group_size": 128
|
| 1333 |
+
},
|
| 1334 |
+
"model.layers.31.self_attn.qkv_proj": {
|
| 1335 |
+
"bits": 8,
|
| 1336 |
+
"group_size": 128
|
| 1337 |
+
},
|
| 1338 |
+
"model.layers.32.self_attn.qkv_proj": {
|
| 1339 |
+
"bits": 8,
|
| 1340 |
+
"group_size": 128
|
| 1341 |
+
},
|
| 1342 |
+
"model.layers.33.self_attn.qkv_proj": {
|
| 1343 |
+
"bits": 8,
|
| 1344 |
+
"group_size": 128
|
| 1345 |
+
},
|
| 1346 |
+
"model.layers.34.self_attn.qkv_proj": {
|
| 1347 |
+
"bits": 8,
|
| 1348 |
+
"group_size": 128
|
| 1349 |
+
},
|
| 1350 |
+
"model.layers.35.self_attn.qkv_proj": {
|
| 1351 |
+
"bits": 8,
|
| 1352 |
+
"group_size": 128
|
| 1353 |
+
},
|
| 1354 |
+
"model.layers.36.self_attn.qkv_proj": {
|
| 1355 |
+
"bits": 8,
|
| 1356 |
+
"group_size": 128
|
| 1357 |
+
},
|
| 1358 |
+
"model.layers.37.self_attn.qkv_proj": {
|
| 1359 |
+
"bits": 8,
|
| 1360 |
+
"group_size": 128
|
| 1361 |
+
},
|
| 1362 |
+
"model.layers.38.self_attn.qkv_proj": {
|
| 1363 |
+
"bits": 8,
|
| 1364 |
+
"group_size": 128
|
| 1365 |
+
},
|
| 1366 |
+
"model.layers.39.self_attn.qkv_proj": {
|
| 1367 |
+
"bits": 8,
|
| 1368 |
+
"group_size": 128
|
| 1369 |
+
},
|
| 1370 |
+
"model.layers.40.self_attn.qkv_proj": {
|
| 1371 |
+
"bits": 8,
|
| 1372 |
+
"group_size": 128
|
| 1373 |
+
},
|
| 1374 |
+
"model.layers.41.self_attn.qkv_proj": {
|
| 1375 |
+
"bits": 8,
|
| 1376 |
+
"group_size": 128
|
| 1377 |
+
},
|
| 1378 |
+
"model.layers.42.self_attn.qkv_proj": {
|
| 1379 |
+
"bits": 8,
|
| 1380 |
+
"group_size": 128
|
| 1381 |
+
},
|
| 1382 |
+
"model.layers.43.self_attn.qkv_proj": {
|
| 1383 |
+
"bits": 8,
|
| 1384 |
+
"group_size": 128
|
| 1385 |
+
},
|
| 1386 |
+
"model.layers.44.self_attn.qkv_proj": {
|
| 1387 |
+
"bits": 8,
|
| 1388 |
+
"group_size": 128
|
| 1389 |
+
},
|
| 1390 |
+
"model.layers.45.self_attn.qkv_proj": {
|
| 1391 |
+
"bits": 8,
|
| 1392 |
+
"group_size": 128
|
| 1393 |
+
},
|
| 1394 |
+
"model.layers.46.self_attn.qkv_proj": {
|
| 1395 |
+
"bits": 8,
|
| 1396 |
+
"group_size": 128
|
| 1397 |
+
},
|
| 1398 |
+
"model.layers.47.self_attn.qkv_proj": {
|
| 1399 |
+
"bits": 8,
|
| 1400 |
+
"group_size": 128
|
| 1401 |
+
},
|
| 1402 |
+
"model.layers.48.self_attn.qkv_proj": {
|
| 1403 |
+
"bits": 8,
|
| 1404 |
+
"group_size": 128
|
| 1405 |
+
},
|
| 1406 |
+
"model.layers.49.self_attn.qkv_proj": {
|
| 1407 |
+
"bits": 8,
|
| 1408 |
+
"group_size": 128
|
| 1409 |
+
},
|
| 1410 |
+
"model.layers.50.self_attn.qkv_proj": {
|
| 1411 |
+
"bits": 8,
|
| 1412 |
+
"group_size": 128
|
| 1413 |
+
},
|
| 1414 |
+
"model.layers.51.self_attn.qkv_proj": {
|
| 1415 |
+
"bits": 8,
|
| 1416 |
+
"group_size": 128
|
| 1417 |
+
},
|
| 1418 |
+
"model.layers.52.self_attn.qkv_proj": {
|
| 1419 |
+
"bits": 8,
|
| 1420 |
+
"group_size": 128
|
| 1421 |
+
},
|
| 1422 |
+
"model.layers.53.self_attn.qkv_proj": {
|
| 1423 |
+
"bits": 8,
|
| 1424 |
+
"group_size": 128
|
| 1425 |
+
},
|
| 1426 |
+
"model.layers.54.self_attn.qkv_proj": {
|
| 1427 |
+
"bits": 8,
|
| 1428 |
+
"group_size": 128
|
| 1429 |
+
},
|
| 1430 |
+
"model.layers.55.self_attn.qkv_proj": {
|
| 1431 |
+
"bits": 8,
|
| 1432 |
+
"group_size": 128
|
| 1433 |
+
},
|
| 1434 |
+
"model.layers.56.self_attn.qkv_proj": {
|
| 1435 |
+
"bits": 8,
|
| 1436 |
+
"group_size": 128
|
| 1437 |
+
},
|
| 1438 |
+
"model.layers.57.self_attn.qkv_proj": {
|
| 1439 |
+
"bits": 8,
|
| 1440 |
+
"group_size": 128
|
| 1441 |
+
},
|
| 1442 |
+
"model.layers.58.self_attn.qkv_proj": {
|
| 1443 |
+
"bits": 8,
|
| 1444 |
+
"group_size": 128
|
| 1445 |
+
},
|
| 1446 |
+
"model.layers.59.self_attn.qkv_proj": {
|
| 1447 |
+
"bits": 8,
|
| 1448 |
+
"group_size": 128
|
| 1449 |
+
},
|
| 1450 |
+
"model.layers.60.self_attn.qkv_proj": {
|
| 1451 |
+
"bits": 8,
|
| 1452 |
+
"group_size": 128
|
| 1453 |
+
},
|
| 1454 |
+
"model.layers.61.self_attn.qkv_proj": {
|
| 1455 |
+
"bits": 8,
|
| 1456 |
+
"group_size": 128
|
| 1457 |
}
|
| 1458 |
},
|
| 1459 |
"group_size": 64,
|
|
|
|
| 1475 |
"use_qk_norm": true,
|
| 1476 |
"use_sliding_window": false,
|
| 1477 |
"vocab_size": 151936
|
| 1478 |
+
}
|
model-00001-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0848401550a548d5906c1301e8818d99bff4c97376009e96546ae69ac23e74b
|
| 3 |
+
size 4995569896
|
model-00002-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1dd26b9529cb11cbd9863e9c53c85729c10eb2a8961dc2c6f39993b3f6bff20
|
| 3 |
+
size 4994004384
|
model-00003-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:badcc4a6981a6a0c0246619d5b53bee8b3b9855d077c890e54fd9fb0f2a5d87e
|
| 3 |
+
size 4993827288
|
model-00004-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ddd33a0f576ea0fe2e16be5909ed992b41a7ce0a079b489747970cf354b9723
|
| 3 |
+
size 4994004104
|
model-00005-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a137d0c16758a6acdad9e1ee71dacee0b9825e411a1ac9f0dc9946afffe0417d
|
| 3 |
+
size 4994004120
|
model-00006-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb752749d800f0a93803f756300f8c88ad7ddfb923fb5f90665d2653841ad046
|
| 3 |
+
size 4994004120
|
model-00007-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd65b9a2271e46eadbaf89d05e957bcc36b18d4309a5082a53e504aa4b357f57
|
| 3 |
+
size 4994004368
|
model-00008-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18581e49da6ccdefdabc2c5813d4edacf55e99a0b1394c2b3f12fd68ddacd4ba
|
| 3 |
+
size 4994004392
|
model-00009-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a792cf65f6c3a78a4bb7864072047b4f200f9b03046421e36fc0d0746a66c1a
|
| 3 |
+
size 4993827440
|
model-00010-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a36b2931c2944c29ce46d15b5a89668526fa16d3b800014cfe901dea9628eef
|
| 3 |
+
size 4994005840
|
model-00011-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eaad473812203b936e13e641e71a49b2a185525c4fae744e5034817c91aa7ae9
|
| 3 |
+
size 4994005840
|
model-00012-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ecf5628353f6e41cc1962eb7d3561355bb99f8c52693699ffac540e802e628a
|
| 3 |
+
size 4994005928
|
model-00013-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d1feea16eb58c466f54e531725f13f17f4d4dcdf4da0d6b1d98c72f21e416c0
|
| 3 |
+
size 4994006104
|
model-00014-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58c2784a1519f13e7aa7d5a3028fd18a6794399d4c25a0758f6f5cb906af2674
|
| 3 |
+
size 4993829088
|
model-00015-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a813925b4c7d96e6c1ff39a61b46af9d22dc5b871476bc2f4dc96a6661846964
|
| 3 |
+
size 4994005768
|
model-00016-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6211af418b67ccb9c319cd23df0007b8b6e6ca713059a443795c4d08204f64e5
|
| 3 |
+
size 4994005848
|
model-00017-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a943e51d7c7d50214433fafebf34c39dba7a7dabcbc8aa217778935ac00f517
|
| 3 |
+
size 4994005840
|
model-00018-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a20ae1bd085948eb35f286cbe6f11b8b74d2178558cdbd6a9894ea16bd1a7597
|
| 3 |
+
size 4994006024
|
model-00019-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:123bbbe2777c2bea5caf9245d660b50d0378b7e41eac404db606ab79c68fb0a4
|
| 3 |
+
size 4994006112
|
model-00020-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c40086af51c56e4802326be567d9e0d4a3cbbdcad822ccf0f90a38263f500e33
|
| 3 |
+
size 4993828920
|
model-00021-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7908c705352f541e9a16963000b2cc8bb3dd8187fab675add635ec1c5ad70432
|
| 3 |
+
size 4994005840
|
model-00022-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08307afb9cac64194c37b7953362c7e2c4f32a7569fec3b1a0db0afe84c72338
|
| 3 |
+
size 4994005840
|
model-00023-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c800fa3c36db20eddbf0be35219027d92ec5cb93eb16fd47420f3282b0afc90
|
| 3 |
+
size 4994005864
|
model-00024-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec1c7404cc437df075df3bf095a66a4db8bb768dc31de1d01448a15c9d3285d8
|
| 3 |
+
size 4994006104
|
model-00025-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d6fd36aa70586fbd5a2cdd5a5c6e9287766c826b5555ebb170a6ee40e020fb2e
|
| 3 |
+
size 4951635464
|
model-00026-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5a7a058b27b6838999f17cf9c2c05510efe3ef47e64400be20fd06bc76ef7a06
|
| 3 |
+
size 4993804024
|
model-00027-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b016131a085b46ef04604b4d681f9bb7bfb356083bdd363556356af454ece465
|
| 3 |
+
size 4994005840
|
model-00028-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a830f1e5368ff967acce3ff2c179db6aeafa0d40c64b5372c3ba4f4f6bdeae50
|
| 3 |
+
size 4994005848
|
model-00029-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dba0de06df718829cbfbd7f41787873d1149333fb355659d5022c22bc5da6960
|
| 3 |
+
size 4994005952
|
model-00030-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48d0d93aae5f0f175ca080ad70cefa6335ca29b3614c193f2332a5c307f14a0e
|
| 3 |
+
size 4994006104
|
model-00031-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d9987c96f8c7ffe014870f57e0ecd166350caacd2040a2d8c07d372f8464107
|
| 3 |
+
size 4993829040
|
model-00032-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8be8f330ee0e975a9c9e524f236dad761b74829a4f4190c4e14d43ee7dbb19f4
|
| 3 |
+
size 4994005800
|
model-00033-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:710a7fce80a3ef7172ff052544db60de516a44c3e456a64f25da566eff973496
|
| 3 |
+
size 4994005840
|
model-00034-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86d68aa8604e0f242527003962f0b9b8fa8c691d9dd5a641815ba09a7ee0bd45
|
| 3 |
+
size 4994005840
|
model-00035-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e200b058c24d7dd4b9c82ffb34d602c817110aaeb2226bea238ac4826cd044b
|
| 3 |
+
size 4994006056
|
model-00036-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a206147ee64bba963754d817263a23502c6ffca77aedeee725136098571049dd
|
| 3 |
+
size 4994006104
|
model-00037-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7f8a652119c77dfb9f42ed389c2547dbcbca965ee35d5f5418919aef31a2326
|
| 3 |
+
size 4993828896
|
model-00038-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91e648e4103e4bf1053a72594b982a5416cce3afbe686017ab95f12cd846cb7f
|
| 3 |
+
size 4994005840
|
model-00039-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:52f012cb2f2f58d92290011cad7fc15df8e6d8141a0c73f29e2f8d0bd8b65753
|
| 3 |
+
size 4994005848
|
model-00040-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8952a7a915140fc9dcbb8e96b9a9f6eb037fb20e9d99f2e5366f7c404fcd9745
|
| 3 |
+
size 4994005888
|
model-00041-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d515b56490be523cbd51d17b720c02443d0598604ac34b42be2deca2ac17a40d
|
| 3 |
+
size 4994006104
|
model-00042-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f84cd7e83e532697b4b5b1789a54aa24680120be41f964d40ae477303918813d
|
| 3 |
+
size 4973948552
|
model-00043-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ebe4924e524fa4ea02ecf0892b0e532a9e304e52702816e220f60b09639f24f3
|
| 3 |
+
size 4996928176
|
model-00044-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43dc8b0f880a6d5356561dda31f3eed4dd89bf6f488f01ba3f482ba7fda72af4
|
| 3 |
+
size 4994005848
|
model-00045-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9525e8b95c7b51d832b2dd5f12ee4866e869f20511fc8460adc528171301697d
|
| 3 |
+
size 4994005840
|
model-00046-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68260ef3af4e5a5eace88d3a7a52a1879537df4a713f807cfeb35147abbd9f00
|
| 3 |
+
size 4994005984
|
model-00047-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70b56a69be788efe0baeff1eb627f652a4e98468eb7d6f7a830cf8d0aeb86009
|
| 3 |
+
size 4994006112
|
model-00048-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69919089db2b0abb9396bf7f4cf9a15dd67350ff90d8d1871ea920d63cad3eb3
|
| 3 |
+
size 4993828976
|
model-00049-of-00054.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f16d301d1a796bb1bfe9b9c42ec0b8ebb6d017d3979ed483a6b05dab8984181a
|
| 3 |
+
size 4994005824
|