Upload folder using huggingface_hub
Browse files- config.json +28 -28
- model-00003-of-00061.safetensors +2 -2
- model-00005-of-00061.safetensors +2 -2
- model-00007-of-00061.safetensors +2 -2
- model-00009-of-00061.safetensors +2 -2
- model-00011-of-00061.safetensors +2 -2
- model-00014-of-00061.safetensors +2 -2
- model-00016-of-00061.safetensors +2 -2
- model-00018-of-00061.safetensors +2 -2
- model-00020-of-00061.safetensors +2 -2
- model-00022-of-00061.safetensors +2 -2
- model-00024-of-00061.safetensors +2 -2
- model-00026-of-00061.safetensors +2 -2
- model-00029-of-00061.safetensors +2 -2
- model-00031-of-00061.safetensors +2 -2
- model-00033-of-00061.safetensors +2 -2
- model-00035-of-00061.safetensors +2 -2
- model-00037-of-00061.safetensors +2 -2
- model-00039-of-00061.safetensors +2 -2
- model-00041-of-00061.safetensors +2 -2
- model-00044-of-00061.safetensors +2 -2
- model-00046-of-00061.safetensors +2 -2
- model-00048-of-00061.safetensors +2 -2
- model-00050-of-00061.safetensors +2 -2
- model-00052-of-00061.safetensors +2 -2
- model-00054-of-00061.safetensors +2 -2
- model-00056-of-00061.safetensors +2 -2
- model-00059-of-00061.safetensors +2 -2
- model-00061-of-00061.safetensors +2 -2
- model.safetensors.index.json +2 -2
- quantization_config.json +28 -28
config.json
CHANGED
|
@@ -40,7 +40,7 @@
|
|
| 40 |
"extra_config": {
|
| 41 |
"model.layers.0.mlp.router.classifier": {
|
| 42 |
"act_bits": 16,
|
| 43 |
-
"bits":
|
| 44 |
"data_type": "int",
|
| 45 |
"group_size": 128,
|
| 46 |
"sym": true
|
|
@@ -159,7 +159,7 @@
|
|
| 159 |
},
|
| 160 |
"model.layers.1.mlp.router.classifier": {
|
| 161 |
"act_bits": 16,
|
| 162 |
-
"bits":
|
| 163 |
"data_type": "int",
|
| 164 |
"group_size": 128,
|
| 165 |
"sym": true
|
|
@@ -278,7 +278,7 @@
|
|
| 278 |
},
|
| 279 |
"model.layers.10.mlp.router.classifier": {
|
| 280 |
"act_bits": 16,
|
| 281 |
-
"bits":
|
| 282 |
"data_type": "int",
|
| 283 |
"group_size": 128,
|
| 284 |
"sym": true
|
|
@@ -397,7 +397,7 @@
|
|
| 397 |
},
|
| 398 |
"model.layers.11.mlp.router.classifier": {
|
| 399 |
"act_bits": 16,
|
| 400 |
-
"bits":
|
| 401 |
"data_type": "int",
|
| 402 |
"group_size": 128,
|
| 403 |
"sym": true
|
|
@@ -516,7 +516,7 @@
|
|
| 516 |
},
|
| 517 |
"model.layers.12.mlp.router.classifier": {
|
| 518 |
"act_bits": 16,
|
| 519 |
-
"bits":
|
| 520 |
"data_type": "int",
|
| 521 |
"group_size": 128,
|
| 522 |
"sym": true
|
|
@@ -635,7 +635,7 @@
|
|
| 635 |
},
|
| 636 |
"model.layers.13.mlp.router.classifier": {
|
| 637 |
"act_bits": 16,
|
| 638 |
-
"bits":
|
| 639 |
"data_type": "int",
|
| 640 |
"group_size": 128,
|
| 641 |
"sym": true
|
|
@@ -754,7 +754,7 @@
|
|
| 754 |
},
|
| 755 |
"model.layers.14.mlp.router.classifier": {
|
| 756 |
"act_bits": 16,
|
| 757 |
-
"bits":
|
| 758 |
"data_type": "int",
|
| 759 |
"group_size": 128,
|
| 760 |
"sym": true
|
|
@@ -873,7 +873,7 @@
|
|
| 873 |
},
|
| 874 |
"model.layers.15.mlp.router.classifier": {
|
| 875 |
"act_bits": 16,
|
| 876 |
-
"bits":
|
| 877 |
"data_type": "int",
|
| 878 |
"group_size": 128,
|
| 879 |
"sym": true
|
|
@@ -992,7 +992,7 @@
|
|
| 992 |
},
|
| 993 |
"model.layers.16.mlp.router.classifier": {
|
| 994 |
"act_bits": 16,
|
| 995 |
-
"bits":
|
| 996 |
"data_type": "int",
|
| 997 |
"group_size": 128,
|
| 998 |
"sym": true
|
|
@@ -1111,7 +1111,7 @@
|
|
| 1111 |
},
|
| 1112 |
"model.layers.17.mlp.router.classifier": {
|
| 1113 |
"act_bits": 16,
|
| 1114 |
-
"bits":
|
| 1115 |
"data_type": "int",
|
| 1116 |
"group_size": 128,
|
| 1117 |
"sym": true
|
|
@@ -1230,7 +1230,7 @@
|
|
| 1230 |
},
|
| 1231 |
"model.layers.18.mlp.router.classifier": {
|
| 1232 |
"act_bits": 16,
|
| 1233 |
-
"bits":
|
| 1234 |
"data_type": "int",
|
| 1235 |
"group_size": 128,
|
| 1236 |
"sym": true
|
|
@@ -1349,7 +1349,7 @@
|
|
| 1349 |
},
|
| 1350 |
"model.layers.19.mlp.router.classifier": {
|
| 1351 |
"act_bits": 16,
|
| 1352 |
-
"bits":
|
| 1353 |
"data_type": "int",
|
| 1354 |
"group_size": 128,
|
| 1355 |
"sym": true
|
|
@@ -1468,7 +1468,7 @@
|
|
| 1468 |
},
|
| 1469 |
"model.layers.2.mlp.router.classifier": {
|
| 1470 |
"act_bits": 16,
|
| 1471 |
-
"bits":
|
| 1472 |
"data_type": "int",
|
| 1473 |
"group_size": 128,
|
| 1474 |
"sym": true
|
|
@@ -1587,7 +1587,7 @@
|
|
| 1587 |
},
|
| 1588 |
"model.layers.20.mlp.router.classifier": {
|
| 1589 |
"act_bits": 16,
|
| 1590 |
-
"bits":
|
| 1591 |
"data_type": "int",
|
| 1592 |
"group_size": 128,
|
| 1593 |
"sym": true
|
|
@@ -1706,7 +1706,7 @@
|
|
| 1706 |
},
|
| 1707 |
"model.layers.21.mlp.router.classifier": {
|
| 1708 |
"act_bits": 16,
|
| 1709 |
-
"bits":
|
| 1710 |
"data_type": "int",
|
| 1711 |
"group_size": 128,
|
| 1712 |
"sym": true
|
|
@@ -1825,7 +1825,7 @@
|
|
| 1825 |
},
|
| 1826 |
"model.layers.22.mlp.router.classifier": {
|
| 1827 |
"act_bits": 16,
|
| 1828 |
-
"bits":
|
| 1829 |
"data_type": "int",
|
| 1830 |
"group_size": 128,
|
| 1831 |
"sym": true
|
|
@@ -1944,7 +1944,7 @@
|
|
| 1944 |
},
|
| 1945 |
"model.layers.23.mlp.router.classifier": {
|
| 1946 |
"act_bits": 16,
|
| 1947 |
-
"bits":
|
| 1948 |
"data_type": "int",
|
| 1949 |
"group_size": 128,
|
| 1950 |
"sym": true
|
|
@@ -2063,7 +2063,7 @@
|
|
| 2063 |
},
|
| 2064 |
"model.layers.24.mlp.router.classifier": {
|
| 2065 |
"act_bits": 16,
|
| 2066 |
-
"bits":
|
| 2067 |
"data_type": "int",
|
| 2068 |
"group_size": 128,
|
| 2069 |
"sym": true
|
|
@@ -2182,7 +2182,7 @@
|
|
| 2182 |
},
|
| 2183 |
"model.layers.25.mlp.router.classifier": {
|
| 2184 |
"act_bits": 16,
|
| 2185 |
-
"bits":
|
| 2186 |
"data_type": "int",
|
| 2187 |
"group_size": 128,
|
| 2188 |
"sym": true
|
|
@@ -2301,7 +2301,7 @@
|
|
| 2301 |
},
|
| 2302 |
"model.layers.26.mlp.router.classifier": {
|
| 2303 |
"act_bits": 16,
|
| 2304 |
-
"bits":
|
| 2305 |
"data_type": "int",
|
| 2306 |
"group_size": 128,
|
| 2307 |
"sym": true
|
|
@@ -2420,7 +2420,7 @@
|
|
| 2420 |
},
|
| 2421 |
"model.layers.27.mlp.router.classifier": {
|
| 2422 |
"act_bits": 16,
|
| 2423 |
-
"bits":
|
| 2424 |
"data_type": "int",
|
| 2425 |
"group_size": 128,
|
| 2426 |
"sym": true
|
|
@@ -2539,7 +2539,7 @@
|
|
| 2539 |
},
|
| 2540 |
"model.layers.3.mlp.router.classifier": {
|
| 2541 |
"act_bits": 16,
|
| 2542 |
-
"bits":
|
| 2543 |
"data_type": "int",
|
| 2544 |
"group_size": 128,
|
| 2545 |
"sym": true
|
|
@@ -2658,7 +2658,7 @@
|
|
| 2658 |
},
|
| 2659 |
"model.layers.4.mlp.router.classifier": {
|
| 2660 |
"act_bits": 16,
|
| 2661 |
-
"bits":
|
| 2662 |
"data_type": "int",
|
| 2663 |
"group_size": 128,
|
| 2664 |
"sym": true
|
|
@@ -2777,7 +2777,7 @@
|
|
| 2777 |
},
|
| 2778 |
"model.layers.5.mlp.router.classifier": {
|
| 2779 |
"act_bits": 16,
|
| 2780 |
-
"bits":
|
| 2781 |
"data_type": "int",
|
| 2782 |
"group_size": 128,
|
| 2783 |
"sym": true
|
|
@@ -2896,7 +2896,7 @@
|
|
| 2896 |
},
|
| 2897 |
"model.layers.6.mlp.router.classifier": {
|
| 2898 |
"act_bits": 16,
|
| 2899 |
-
"bits":
|
| 2900 |
"data_type": "int",
|
| 2901 |
"group_size": 128,
|
| 2902 |
"sym": true
|
|
@@ -3015,7 +3015,7 @@
|
|
| 3015 |
},
|
| 3016 |
"model.layers.7.mlp.router.classifier": {
|
| 3017 |
"act_bits": 16,
|
| 3018 |
-
"bits":
|
| 3019 |
"data_type": "int",
|
| 3020 |
"group_size": 128,
|
| 3021 |
"sym": true
|
|
@@ -3134,7 +3134,7 @@
|
|
| 3134 |
},
|
| 3135 |
"model.layers.8.mlp.router.classifier": {
|
| 3136 |
"act_bits": 16,
|
| 3137 |
-
"bits":
|
| 3138 |
"data_type": "int",
|
| 3139 |
"group_size": 128,
|
| 3140 |
"sym": true
|
|
@@ -3253,7 +3253,7 @@
|
|
| 3253 |
},
|
| 3254 |
"model.layers.9.mlp.router.classifier": {
|
| 3255 |
"act_bits": 16,
|
| 3256 |
-
"bits":
|
| 3257 |
"data_type": "int",
|
| 3258 |
"group_size": 128,
|
| 3259 |
"sym": true
|
|
|
|
| 40 |
"extra_config": {
|
| 41 |
"model.layers.0.mlp.router.classifier": {
|
| 42 |
"act_bits": 16,
|
| 43 |
+
"bits": 16,
|
| 44 |
"data_type": "int",
|
| 45 |
"group_size": 128,
|
| 46 |
"sym": true
|
|
|
|
| 159 |
},
|
| 160 |
"model.layers.1.mlp.router.classifier": {
|
| 161 |
"act_bits": 16,
|
| 162 |
+
"bits": 16,
|
| 163 |
"data_type": "int",
|
| 164 |
"group_size": 128,
|
| 165 |
"sym": true
|
|
|
|
| 278 |
},
|
| 279 |
"model.layers.10.mlp.router.classifier": {
|
| 280 |
"act_bits": 16,
|
| 281 |
+
"bits": 16,
|
| 282 |
"data_type": "int",
|
| 283 |
"group_size": 128,
|
| 284 |
"sym": true
|
|
|
|
| 397 |
},
|
| 398 |
"model.layers.11.mlp.router.classifier": {
|
| 399 |
"act_bits": 16,
|
| 400 |
+
"bits": 16,
|
| 401 |
"data_type": "int",
|
| 402 |
"group_size": 128,
|
| 403 |
"sym": true
|
|
|
|
| 516 |
},
|
| 517 |
"model.layers.12.mlp.router.classifier": {
|
| 518 |
"act_bits": 16,
|
| 519 |
+
"bits": 16,
|
| 520 |
"data_type": "int",
|
| 521 |
"group_size": 128,
|
| 522 |
"sym": true
|
|
|
|
| 635 |
},
|
| 636 |
"model.layers.13.mlp.router.classifier": {
|
| 637 |
"act_bits": 16,
|
| 638 |
+
"bits": 16,
|
| 639 |
"data_type": "int",
|
| 640 |
"group_size": 128,
|
| 641 |
"sym": true
|
|
|
|
| 754 |
},
|
| 755 |
"model.layers.14.mlp.router.classifier": {
|
| 756 |
"act_bits": 16,
|
| 757 |
+
"bits": 16,
|
| 758 |
"data_type": "int",
|
| 759 |
"group_size": 128,
|
| 760 |
"sym": true
|
|
|
|
| 873 |
},
|
| 874 |
"model.layers.15.mlp.router.classifier": {
|
| 875 |
"act_bits": 16,
|
| 876 |
+
"bits": 16,
|
| 877 |
"data_type": "int",
|
| 878 |
"group_size": 128,
|
| 879 |
"sym": true
|
|
|
|
| 992 |
},
|
| 993 |
"model.layers.16.mlp.router.classifier": {
|
| 994 |
"act_bits": 16,
|
| 995 |
+
"bits": 16,
|
| 996 |
"data_type": "int",
|
| 997 |
"group_size": 128,
|
| 998 |
"sym": true
|
|
|
|
| 1111 |
},
|
| 1112 |
"model.layers.17.mlp.router.classifier": {
|
| 1113 |
"act_bits": 16,
|
| 1114 |
+
"bits": 16,
|
| 1115 |
"data_type": "int",
|
| 1116 |
"group_size": 128,
|
| 1117 |
"sym": true
|
|
|
|
| 1230 |
},
|
| 1231 |
"model.layers.18.mlp.router.classifier": {
|
| 1232 |
"act_bits": 16,
|
| 1233 |
+
"bits": 16,
|
| 1234 |
"data_type": "int",
|
| 1235 |
"group_size": 128,
|
| 1236 |
"sym": true
|
|
|
|
| 1349 |
},
|
| 1350 |
"model.layers.19.mlp.router.classifier": {
|
| 1351 |
"act_bits": 16,
|
| 1352 |
+
"bits": 16,
|
| 1353 |
"data_type": "int",
|
| 1354 |
"group_size": 128,
|
| 1355 |
"sym": true
|
|
|
|
| 1468 |
},
|
| 1469 |
"model.layers.2.mlp.router.classifier": {
|
| 1470 |
"act_bits": 16,
|
| 1471 |
+
"bits": 16,
|
| 1472 |
"data_type": "int",
|
| 1473 |
"group_size": 128,
|
| 1474 |
"sym": true
|
|
|
|
| 1587 |
},
|
| 1588 |
"model.layers.20.mlp.router.classifier": {
|
| 1589 |
"act_bits": 16,
|
| 1590 |
+
"bits": 16,
|
| 1591 |
"data_type": "int",
|
| 1592 |
"group_size": 128,
|
| 1593 |
"sym": true
|
|
|
|
| 1706 |
},
|
| 1707 |
"model.layers.21.mlp.router.classifier": {
|
| 1708 |
"act_bits": 16,
|
| 1709 |
+
"bits": 16,
|
| 1710 |
"data_type": "int",
|
| 1711 |
"group_size": 128,
|
| 1712 |
"sym": true
|
|
|
|
| 1825 |
},
|
| 1826 |
"model.layers.22.mlp.router.classifier": {
|
| 1827 |
"act_bits": 16,
|
| 1828 |
+
"bits": 16,
|
| 1829 |
"data_type": "int",
|
| 1830 |
"group_size": 128,
|
| 1831 |
"sym": true
|
|
|
|
| 1944 |
},
|
| 1945 |
"model.layers.23.mlp.router.classifier": {
|
| 1946 |
"act_bits": 16,
|
| 1947 |
+
"bits": 16,
|
| 1948 |
"data_type": "int",
|
| 1949 |
"group_size": 128,
|
| 1950 |
"sym": true
|
|
|
|
| 2063 |
},
|
| 2064 |
"model.layers.24.mlp.router.classifier": {
|
| 2065 |
"act_bits": 16,
|
| 2066 |
+
"bits": 16,
|
| 2067 |
"data_type": "int",
|
| 2068 |
"group_size": 128,
|
| 2069 |
"sym": true
|
|
|
|
| 2182 |
},
|
| 2183 |
"model.layers.25.mlp.router.classifier": {
|
| 2184 |
"act_bits": 16,
|
| 2185 |
+
"bits": 16,
|
| 2186 |
"data_type": "int",
|
| 2187 |
"group_size": 128,
|
| 2188 |
"sym": true
|
|
|
|
| 2301 |
},
|
| 2302 |
"model.layers.26.mlp.router.classifier": {
|
| 2303 |
"act_bits": 16,
|
| 2304 |
+
"bits": 16,
|
| 2305 |
"data_type": "int",
|
| 2306 |
"group_size": 128,
|
| 2307 |
"sym": true
|
|
|
|
| 2420 |
},
|
| 2421 |
"model.layers.27.mlp.router.classifier": {
|
| 2422 |
"act_bits": 16,
|
| 2423 |
+
"bits": 16,
|
| 2424 |
"data_type": "int",
|
| 2425 |
"group_size": 128,
|
| 2426 |
"sym": true
|
|
|
|
| 2539 |
},
|
| 2540 |
"model.layers.3.mlp.router.classifier": {
|
| 2541 |
"act_bits": 16,
|
| 2542 |
+
"bits": 16,
|
| 2543 |
"data_type": "int",
|
| 2544 |
"group_size": 128,
|
| 2545 |
"sym": true
|
|
|
|
| 2658 |
},
|
| 2659 |
"model.layers.4.mlp.router.classifier": {
|
| 2660 |
"act_bits": 16,
|
| 2661 |
+
"bits": 16,
|
| 2662 |
"data_type": "int",
|
| 2663 |
"group_size": 128,
|
| 2664 |
"sym": true
|
|
|
|
| 2777 |
},
|
| 2778 |
"model.layers.5.mlp.router.classifier": {
|
| 2779 |
"act_bits": 16,
|
| 2780 |
+
"bits": 16,
|
| 2781 |
"data_type": "int",
|
| 2782 |
"group_size": 128,
|
| 2783 |
"sym": true
|
|
|
|
| 2896 |
},
|
| 2897 |
"model.layers.6.mlp.router.classifier": {
|
| 2898 |
"act_bits": 16,
|
| 2899 |
+
"bits": 16,
|
| 2900 |
"data_type": "int",
|
| 2901 |
"group_size": 128,
|
| 2902 |
"sym": true
|
|
|
|
| 3015 |
},
|
| 3016 |
"model.layers.7.mlp.router.classifier": {
|
| 3017 |
"act_bits": 16,
|
| 3018 |
+
"bits": 16,
|
| 3019 |
"data_type": "int",
|
| 3020 |
"group_size": 128,
|
| 3021 |
"sym": true
|
|
|
|
| 3134 |
},
|
| 3135 |
"model.layers.8.mlp.router.classifier": {
|
| 3136 |
"act_bits": 16,
|
| 3137 |
+
"bits": 16,
|
| 3138 |
"data_type": "int",
|
| 3139 |
"group_size": 128,
|
| 3140 |
"sym": true
|
|
|
|
| 3253 |
},
|
| 3254 |
"model.layers.9.mlp.router.classifier": {
|
| 3255 |
"act_bits": 16,
|
| 3256 |
+
"bits": 16,
|
| 3257 |
"data_type": "int",
|
| 3258 |
"group_size": 128,
|
| 3259 |
"sym": true
|
model-00003-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dedc7cc247bfef2604688a1f817b76a682d77808369de8bab2938cf04364654e
|
| 3 |
+
size 4999445736
|
model-00005-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:458569aa745d82c9eae7d984a09fbcc291caa854325e55619ff72bf257c60a8e
|
| 3 |
+
size 4999445736
|
model-00007-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:96a545be84b9f1decd636a7f8a32c6a1f59eaa8c9493d1965e6e378d0f7963e5
|
| 3 |
+
size 4999446056
|
model-00009-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61164ac03a9044caed24b3f1e1a97e061f1823b0c7e1f11e32f8e2e03b309e21
|
| 3 |
+
size 4999446384
|
model-00011-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e323febb7264e73adece23d2e2010b4b29756dd1349459ae79a18512c20ea0f8
|
| 3 |
+
size 4988689384
|
model-00014-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:014d65d3759dde7c6cb63849792513034e8d1f388429939a6ddf19ded11ed12f
|
| 3 |
+
size 4999446088
|
model-00016-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b64f6c1cfb5cfd8fc0246c22a8c24b7a9c8179a12836102c76d183a6c1dca0b4
|
| 3 |
+
size 4999445816
|
model-00018-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c8f7c80573cac968f511a278ed3974eb62a4e825f210b95f525812b04c7513f
|
| 3 |
+
size 4999445744
|
model-00020-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:44e7c239cf28b5abc3927372ec97ece605e1483270461f532d74f78922c78f4a
|
| 3 |
+
size 4999445744
|
model-00022-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d9e4f1fc277bc5c16e807510eefb6d387efbfe7ca32fe52326723de67a763b0
|
| 3 |
+
size 4999446648
|
model-00024-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e2a9b63cf5906e1074387a4d54f99f4f29f31debbc4997fbc3569dea906eeb07
|
| 3 |
+
size 4999448416
|
model-00026-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:801ba1f6ea68f631111e892766db3962e4b1308345e2f3b2065b7868a3df57a9
|
| 3 |
+
size 4942928384
|
model-00029-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b142a7a6f72b2982886c282ff1dba662de2a7f7a43acc9e9d41a3a65618a07f0
|
| 3 |
+
size 4999448136
|
model-00031-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:40c208573805fa73c4f08272f5c40bcde198e7c1790e8d16279e158e8ee6fe6e
|
| 3 |
+
size 4999447864
|
model-00033-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03640c2d908660045dddaf193587accdf89d264da037617c085b2f8ea271bebe
|
| 3 |
+
size 4999447792
|
model-00035-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9bf8787c73a75db7f12ea04ea556c62e79cde235ff2554f233eb64f17a1c6eff
|
| 3 |
+
size 4999447792
|
model-00037-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b414f11d43d7dd7375ba73a3725c7fdd100ff355f830ff3a9575e01210532229
|
| 3 |
+
size 4999448096
|
model-00039-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74b41a6733cb5ea91712444c332140a56991242b8875ec4384616b9b16dc2208
|
| 3 |
+
size 4999448416
|
model-00041-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aeb052399b4e15ff0e7f18d1cb1b8020e4b2de0cabe550c99a9706a15f737b40
|
| 3 |
+
size 4942928384
|
model-00044-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2254af31b5909d75ffafb56598cd532e856a9bbf5c2ed002a1c42f25f6677a1
|
| 3 |
+
size 4999448136
|
model-00046-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37eabf9a7037fd2c2ffd3a70eb4ce5b0f4f85a9203148ed61fd99dd07288acd5
|
| 3 |
+
size 4999447864
|
model-00048-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f2557997e77f70df97ecaf17b4eba26d8f79f0796fae1979a5f01de33e71b0f
|
| 3 |
+
size 4999447792
|
model-00050-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97ee5c182390e75fb8736c516dd064e031ca391be9aee2a3e5194458e6949e8c
|
| 3 |
+
size 4999447792
|
model-00052-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:941662f827317e364b30eea0b5d0056c1a8485fcf410c437e300ae4beedcf527
|
| 3 |
+
size 4999448096
|
model-00054-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c98b13d488bf63e2f18c6a74380edf8e3ea2ba7069d790c6e7e1e68c1843c97
|
| 3 |
+
size 4999448416
|
model-00056-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f234f8078fda6d34c033d698fd16e3135c2314343c636c655433f8b16889b872
|
| 3 |
+
size 4942928384
|
model-00059-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0bff1fa67b62fd1ad55b3b14b9593d63cc82f0c5c957f504b44cc0981947b13e
|
| 3 |
+
size 4999448136
|
model-00061-of-00061.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa45e514a5a410aea388eccb4e3db5635f5cdd658015f9ef80a7b0ce43db138f
|
| 3 |
+
size 3177840888
|
model.safetensors.index.json
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90806d9ddadc141bb5e0c218e12847f692be28410ce9a8d9c76ab18d88e529d9
|
| 3 |
+
size 11895025
|
quantization_config.json
CHANGED
|
@@ -9,7 +9,7 @@
|
|
| 9 |
"packing_format": "auto_round:auto_gptq",
|
| 10 |
"extra_config": {
|
| 11 |
"model.layers.0.mlp.router.classifier": {
|
| 12 |
-
"bits":
|
| 13 |
"group_size": 128,
|
| 14 |
"sym": true,
|
| 15 |
"data_type": "int",
|
|
@@ -128,7 +128,7 @@
|
|
| 128 |
"act_bits": 16
|
| 129 |
},
|
| 130 |
"model.layers.1.mlp.router.classifier": {
|
| 131 |
-
"bits":
|
| 132 |
"group_size": 128,
|
| 133 |
"sym": true,
|
| 134 |
"data_type": "int",
|
|
@@ -247,7 +247,7 @@
|
|
| 247 |
"act_bits": 16
|
| 248 |
},
|
| 249 |
"model.layers.2.mlp.router.classifier": {
|
| 250 |
-
"bits":
|
| 251 |
"group_size": 128,
|
| 252 |
"sym": true,
|
| 253 |
"data_type": "int",
|
|
@@ -366,7 +366,7 @@
|
|
| 366 |
"act_bits": 16
|
| 367 |
},
|
| 368 |
"model.layers.3.mlp.router.classifier": {
|
| 369 |
-
"bits":
|
| 370 |
"group_size": 128,
|
| 371 |
"sym": true,
|
| 372 |
"data_type": "int",
|
|
@@ -485,7 +485,7 @@
|
|
| 485 |
"act_bits": 16
|
| 486 |
},
|
| 487 |
"model.layers.4.mlp.router.classifier": {
|
| 488 |
-
"bits":
|
| 489 |
"group_size": 128,
|
| 490 |
"sym": true,
|
| 491 |
"data_type": "int",
|
|
@@ -604,7 +604,7 @@
|
|
| 604 |
"act_bits": 16
|
| 605 |
},
|
| 606 |
"model.layers.5.mlp.router.classifier": {
|
| 607 |
-
"bits":
|
| 608 |
"group_size": 128,
|
| 609 |
"sym": true,
|
| 610 |
"data_type": "int",
|
|
@@ -723,7 +723,7 @@
|
|
| 723 |
"act_bits": 16
|
| 724 |
},
|
| 725 |
"model.layers.6.mlp.router.classifier": {
|
| 726 |
-
"bits":
|
| 727 |
"group_size": 128,
|
| 728 |
"sym": true,
|
| 729 |
"data_type": "int",
|
|
@@ -842,7 +842,7 @@
|
|
| 842 |
"act_bits": 16
|
| 843 |
},
|
| 844 |
"model.layers.7.mlp.router.classifier": {
|
| 845 |
-
"bits":
|
| 846 |
"group_size": 128,
|
| 847 |
"sym": true,
|
| 848 |
"data_type": "int",
|
|
@@ -961,7 +961,7 @@
|
|
| 961 |
"act_bits": 16
|
| 962 |
},
|
| 963 |
"model.layers.8.mlp.router.classifier": {
|
| 964 |
-
"bits":
|
| 965 |
"group_size": 128,
|
| 966 |
"sym": true,
|
| 967 |
"data_type": "int",
|
|
@@ -1080,7 +1080,7 @@
|
|
| 1080 |
"act_bits": 16
|
| 1081 |
},
|
| 1082 |
"model.layers.9.mlp.router.classifier": {
|
| 1083 |
-
"bits":
|
| 1084 |
"group_size": 128,
|
| 1085 |
"sym": true,
|
| 1086 |
"data_type": "int",
|
|
@@ -1199,7 +1199,7 @@
|
|
| 1199 |
"act_bits": 16
|
| 1200 |
},
|
| 1201 |
"model.layers.10.mlp.router.classifier": {
|
| 1202 |
-
"bits":
|
| 1203 |
"group_size": 128,
|
| 1204 |
"sym": true,
|
| 1205 |
"data_type": "int",
|
|
@@ -1318,7 +1318,7 @@
|
|
| 1318 |
"act_bits": 16
|
| 1319 |
},
|
| 1320 |
"model.layers.11.mlp.router.classifier": {
|
| 1321 |
-
"bits":
|
| 1322 |
"group_size": 128,
|
| 1323 |
"sym": true,
|
| 1324 |
"data_type": "int",
|
|
@@ -1437,7 +1437,7 @@
|
|
| 1437 |
"act_bits": 16
|
| 1438 |
},
|
| 1439 |
"model.layers.12.mlp.router.classifier": {
|
| 1440 |
-
"bits":
|
| 1441 |
"group_size": 128,
|
| 1442 |
"sym": true,
|
| 1443 |
"data_type": "int",
|
|
@@ -1556,7 +1556,7 @@
|
|
| 1556 |
"act_bits": 16
|
| 1557 |
},
|
| 1558 |
"model.layers.13.mlp.router.classifier": {
|
| 1559 |
-
"bits":
|
| 1560 |
"group_size": 128,
|
| 1561 |
"sym": true,
|
| 1562 |
"data_type": "int",
|
|
@@ -1675,7 +1675,7 @@
|
|
| 1675 |
"act_bits": 16
|
| 1676 |
},
|
| 1677 |
"model.layers.14.mlp.router.classifier": {
|
| 1678 |
-
"bits":
|
| 1679 |
"group_size": 128,
|
| 1680 |
"sym": true,
|
| 1681 |
"data_type": "int",
|
|
@@ -1794,7 +1794,7 @@
|
|
| 1794 |
"act_bits": 16
|
| 1795 |
},
|
| 1796 |
"model.layers.15.mlp.router.classifier": {
|
| 1797 |
-
"bits":
|
| 1798 |
"group_size": 128,
|
| 1799 |
"sym": true,
|
| 1800 |
"data_type": "int",
|
|
@@ -1913,7 +1913,7 @@
|
|
| 1913 |
"act_bits": 16
|
| 1914 |
},
|
| 1915 |
"model.layers.16.mlp.router.classifier": {
|
| 1916 |
-
"bits":
|
| 1917 |
"group_size": 128,
|
| 1918 |
"sym": true,
|
| 1919 |
"data_type": "int",
|
|
@@ -2032,7 +2032,7 @@
|
|
| 2032 |
"act_bits": 16
|
| 2033 |
},
|
| 2034 |
"model.layers.17.mlp.router.classifier": {
|
| 2035 |
-
"bits":
|
| 2036 |
"group_size": 128,
|
| 2037 |
"sym": true,
|
| 2038 |
"data_type": "int",
|
|
@@ -2151,7 +2151,7 @@
|
|
| 2151 |
"act_bits": 16
|
| 2152 |
},
|
| 2153 |
"model.layers.18.mlp.router.classifier": {
|
| 2154 |
-
"bits":
|
| 2155 |
"group_size": 128,
|
| 2156 |
"sym": true,
|
| 2157 |
"data_type": "int",
|
|
@@ -2270,7 +2270,7 @@
|
|
| 2270 |
"act_bits": 16
|
| 2271 |
},
|
| 2272 |
"model.layers.19.mlp.router.classifier": {
|
| 2273 |
-
"bits":
|
| 2274 |
"group_size": 128,
|
| 2275 |
"sym": true,
|
| 2276 |
"data_type": "int",
|
|
@@ -2389,7 +2389,7 @@
|
|
| 2389 |
"act_bits": 16
|
| 2390 |
},
|
| 2391 |
"model.layers.20.mlp.router.classifier": {
|
| 2392 |
-
"bits":
|
| 2393 |
"group_size": 128,
|
| 2394 |
"sym": true,
|
| 2395 |
"data_type": "int",
|
|
@@ -2508,7 +2508,7 @@
|
|
| 2508 |
"act_bits": 16
|
| 2509 |
},
|
| 2510 |
"model.layers.21.mlp.router.classifier": {
|
| 2511 |
-
"bits":
|
| 2512 |
"group_size": 128,
|
| 2513 |
"sym": true,
|
| 2514 |
"data_type": "int",
|
|
@@ -2627,7 +2627,7 @@
|
|
| 2627 |
"act_bits": 16
|
| 2628 |
},
|
| 2629 |
"model.layers.22.mlp.router.classifier": {
|
| 2630 |
-
"bits":
|
| 2631 |
"group_size": 128,
|
| 2632 |
"sym": true,
|
| 2633 |
"data_type": "int",
|
|
@@ -2746,7 +2746,7 @@
|
|
| 2746 |
"act_bits": 16
|
| 2747 |
},
|
| 2748 |
"model.layers.23.mlp.router.classifier": {
|
| 2749 |
-
"bits":
|
| 2750 |
"group_size": 128,
|
| 2751 |
"sym": true,
|
| 2752 |
"data_type": "int",
|
|
@@ -2865,7 +2865,7 @@
|
|
| 2865 |
"act_bits": 16
|
| 2866 |
},
|
| 2867 |
"model.layers.24.mlp.router.classifier": {
|
| 2868 |
-
"bits":
|
| 2869 |
"group_size": 128,
|
| 2870 |
"sym": true,
|
| 2871 |
"data_type": "int",
|
|
@@ -2984,7 +2984,7 @@
|
|
| 2984 |
"act_bits": 16
|
| 2985 |
},
|
| 2986 |
"model.layers.25.mlp.router.classifier": {
|
| 2987 |
-
"bits":
|
| 2988 |
"group_size": 128,
|
| 2989 |
"sym": true,
|
| 2990 |
"data_type": "int",
|
|
@@ -3103,7 +3103,7 @@
|
|
| 3103 |
"act_bits": 16
|
| 3104 |
},
|
| 3105 |
"model.layers.26.mlp.router.classifier": {
|
| 3106 |
-
"bits":
|
| 3107 |
"group_size": 128,
|
| 3108 |
"sym": true,
|
| 3109 |
"data_type": "int",
|
|
@@ -3222,7 +3222,7 @@
|
|
| 3222 |
"act_bits": 16
|
| 3223 |
},
|
| 3224 |
"model.layers.27.mlp.router.classifier": {
|
| 3225 |
-
"bits":
|
| 3226 |
"group_size": 128,
|
| 3227 |
"sym": true,
|
| 3228 |
"data_type": "int",
|
|
|
|
| 9 |
"packing_format": "auto_round:auto_gptq",
|
| 10 |
"extra_config": {
|
| 11 |
"model.layers.0.mlp.router.classifier": {
|
| 12 |
+
"bits": 16,
|
| 13 |
"group_size": 128,
|
| 14 |
"sym": true,
|
| 15 |
"data_type": "int",
|
|
|
|
| 128 |
"act_bits": 16
|
| 129 |
},
|
| 130 |
"model.layers.1.mlp.router.classifier": {
|
| 131 |
+
"bits": 16,
|
| 132 |
"group_size": 128,
|
| 133 |
"sym": true,
|
| 134 |
"data_type": "int",
|
|
|
|
| 247 |
"act_bits": 16
|
| 248 |
},
|
| 249 |
"model.layers.2.mlp.router.classifier": {
|
| 250 |
+
"bits": 16,
|
| 251 |
"group_size": 128,
|
| 252 |
"sym": true,
|
| 253 |
"data_type": "int",
|
|
|
|
| 366 |
"act_bits": 16
|
| 367 |
},
|
| 368 |
"model.layers.3.mlp.router.classifier": {
|
| 369 |
+
"bits": 16,
|
| 370 |
"group_size": 128,
|
| 371 |
"sym": true,
|
| 372 |
"data_type": "int",
|
|
|
|
| 485 |
"act_bits": 16
|
| 486 |
},
|
| 487 |
"model.layers.4.mlp.router.classifier": {
|
| 488 |
+
"bits": 16,
|
| 489 |
"group_size": 128,
|
| 490 |
"sym": true,
|
| 491 |
"data_type": "int",
|
|
|
|
| 604 |
"act_bits": 16
|
| 605 |
},
|
| 606 |
"model.layers.5.mlp.router.classifier": {
|
| 607 |
+
"bits": 16,
|
| 608 |
"group_size": 128,
|
| 609 |
"sym": true,
|
| 610 |
"data_type": "int",
|
|
|
|
| 723 |
"act_bits": 16
|
| 724 |
},
|
| 725 |
"model.layers.6.mlp.router.classifier": {
|
| 726 |
+
"bits": 16,
|
| 727 |
"group_size": 128,
|
| 728 |
"sym": true,
|
| 729 |
"data_type": "int",
|
|
|
|
| 842 |
"act_bits": 16
|
| 843 |
},
|
| 844 |
"model.layers.7.mlp.router.classifier": {
|
| 845 |
+
"bits": 16,
|
| 846 |
"group_size": 128,
|
| 847 |
"sym": true,
|
| 848 |
"data_type": "int",
|
|
|
|
| 961 |
"act_bits": 16
|
| 962 |
},
|
| 963 |
"model.layers.8.mlp.router.classifier": {
|
| 964 |
+
"bits": 16,
|
| 965 |
"group_size": 128,
|
| 966 |
"sym": true,
|
| 967 |
"data_type": "int",
|
|
|
|
| 1080 |
"act_bits": 16
|
| 1081 |
},
|
| 1082 |
"model.layers.9.mlp.router.classifier": {
|
| 1083 |
+
"bits": 16,
|
| 1084 |
"group_size": 128,
|
| 1085 |
"sym": true,
|
| 1086 |
"data_type": "int",
|
|
|
|
| 1199 |
"act_bits": 16
|
| 1200 |
},
|
| 1201 |
"model.layers.10.mlp.router.classifier": {
|
| 1202 |
+
"bits": 16,
|
| 1203 |
"group_size": 128,
|
| 1204 |
"sym": true,
|
| 1205 |
"data_type": "int",
|
|
|
|
| 1318 |
"act_bits": 16
|
| 1319 |
},
|
| 1320 |
"model.layers.11.mlp.router.classifier": {
|
| 1321 |
+
"bits": 16,
|
| 1322 |
"group_size": 128,
|
| 1323 |
"sym": true,
|
| 1324 |
"data_type": "int",
|
|
|
|
| 1437 |
"act_bits": 16
|
| 1438 |
},
|
| 1439 |
"model.layers.12.mlp.router.classifier": {
|
| 1440 |
+
"bits": 16,
|
| 1441 |
"group_size": 128,
|
| 1442 |
"sym": true,
|
| 1443 |
"data_type": "int",
|
|
|
|
| 1556 |
"act_bits": 16
|
| 1557 |
},
|
| 1558 |
"model.layers.13.mlp.router.classifier": {
|
| 1559 |
+
"bits": 16,
|
| 1560 |
"group_size": 128,
|
| 1561 |
"sym": true,
|
| 1562 |
"data_type": "int",
|
|
|
|
| 1675 |
"act_bits": 16
|
| 1676 |
},
|
| 1677 |
"model.layers.14.mlp.router.classifier": {
|
| 1678 |
+
"bits": 16,
|
| 1679 |
"group_size": 128,
|
| 1680 |
"sym": true,
|
| 1681 |
"data_type": "int",
|
|
|
|
| 1794 |
"act_bits": 16
|
| 1795 |
},
|
| 1796 |
"model.layers.15.mlp.router.classifier": {
|
| 1797 |
+
"bits": 16,
|
| 1798 |
"group_size": 128,
|
| 1799 |
"sym": true,
|
| 1800 |
"data_type": "int",
|
|
|
|
| 1913 |
"act_bits": 16
|
| 1914 |
},
|
| 1915 |
"model.layers.16.mlp.router.classifier": {
|
| 1916 |
+
"bits": 16,
|
| 1917 |
"group_size": 128,
|
| 1918 |
"sym": true,
|
| 1919 |
"data_type": "int",
|
|
|
|
| 2032 |
"act_bits": 16
|
| 2033 |
},
|
| 2034 |
"model.layers.17.mlp.router.classifier": {
|
| 2035 |
+
"bits": 16,
|
| 2036 |
"group_size": 128,
|
| 2037 |
"sym": true,
|
| 2038 |
"data_type": "int",
|
|
|
|
| 2151 |
"act_bits": 16
|
| 2152 |
},
|
| 2153 |
"model.layers.18.mlp.router.classifier": {
|
| 2154 |
+
"bits": 16,
|
| 2155 |
"group_size": 128,
|
| 2156 |
"sym": true,
|
| 2157 |
"data_type": "int",
|
|
|
|
| 2270 |
"act_bits": 16
|
| 2271 |
},
|
| 2272 |
"model.layers.19.mlp.router.classifier": {
|
| 2273 |
+
"bits": 16,
|
| 2274 |
"group_size": 128,
|
| 2275 |
"sym": true,
|
| 2276 |
"data_type": "int",
|
|
|
|
| 2389 |
"act_bits": 16
|
| 2390 |
},
|
| 2391 |
"model.layers.20.mlp.router.classifier": {
|
| 2392 |
+
"bits": 16,
|
| 2393 |
"group_size": 128,
|
| 2394 |
"sym": true,
|
| 2395 |
"data_type": "int",
|
|
|
|
| 2508 |
"act_bits": 16
|
| 2509 |
},
|
| 2510 |
"model.layers.21.mlp.router.classifier": {
|
| 2511 |
+
"bits": 16,
|
| 2512 |
"group_size": 128,
|
| 2513 |
"sym": true,
|
| 2514 |
"data_type": "int",
|
|
|
|
| 2627 |
"act_bits": 16
|
| 2628 |
},
|
| 2629 |
"model.layers.22.mlp.router.classifier": {
|
| 2630 |
+
"bits": 16,
|
| 2631 |
"group_size": 128,
|
| 2632 |
"sym": true,
|
| 2633 |
"data_type": "int",
|
|
|
|
| 2746 |
"act_bits": 16
|
| 2747 |
},
|
| 2748 |
"model.layers.23.mlp.router.classifier": {
|
| 2749 |
+
"bits": 16,
|
| 2750 |
"group_size": 128,
|
| 2751 |
"sym": true,
|
| 2752 |
"data_type": "int",
|
|
|
|
| 2865 |
"act_bits": 16
|
| 2866 |
},
|
| 2867 |
"model.layers.24.mlp.router.classifier": {
|
| 2868 |
+
"bits": 16,
|
| 2869 |
"group_size": 128,
|
| 2870 |
"sym": true,
|
| 2871 |
"data_type": "int",
|
|
|
|
| 2984 |
"act_bits": 16
|
| 2985 |
},
|
| 2986 |
"model.layers.25.mlp.router.classifier": {
|
| 2987 |
+
"bits": 16,
|
| 2988 |
"group_size": 128,
|
| 2989 |
"sym": true,
|
| 2990 |
"data_type": "int",
|
|
|
|
| 3103 |
"act_bits": 16
|
| 3104 |
},
|
| 3105 |
"model.layers.26.mlp.router.classifier": {
|
| 3106 |
+
"bits": 16,
|
| 3107 |
"group_size": 128,
|
| 3108 |
"sym": true,
|
| 3109 |
"data_type": "int",
|
|
|
|
| 3222 |
"act_bits": 16
|
| 3223 |
},
|
| 3224 |
"model.layers.27.mlp.router.classifier": {
|
| 3225 |
+
"bits": 16,
|
| 3226 |
"group_size": 128,
|
| 3227 |
"sym": true,
|
| 3228 |
"data_type": "int",
|