INC4AI committed on
Commit
0455f52
·
verified ·
1 Parent(s): 6148d4c

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -40,7 +40,7 @@
40
  "extra_config": {
41
  "model.layers.0.mlp.router.classifier": {
42
  "act_bits": 16,
43
- "bits": 8,
44
  "data_type": "int",
45
  "group_size": 128,
46
  "sym": true
@@ -159,7 +159,7 @@
159
  },
160
  "model.layers.1.mlp.router.classifier": {
161
  "act_bits": 16,
162
- "bits": 8,
163
  "data_type": "int",
164
  "group_size": 128,
165
  "sym": true
@@ -278,7 +278,7 @@
278
  },
279
  "model.layers.10.mlp.router.classifier": {
280
  "act_bits": 16,
281
- "bits": 8,
282
  "data_type": "int",
283
  "group_size": 128,
284
  "sym": true
@@ -397,7 +397,7 @@
397
  },
398
  "model.layers.11.mlp.router.classifier": {
399
  "act_bits": 16,
400
- "bits": 8,
401
  "data_type": "int",
402
  "group_size": 128,
403
  "sym": true
@@ -516,7 +516,7 @@
516
  },
517
  "model.layers.12.mlp.router.classifier": {
518
  "act_bits": 16,
519
- "bits": 8,
520
  "data_type": "int",
521
  "group_size": 128,
522
  "sym": true
@@ -635,7 +635,7 @@
635
  },
636
  "model.layers.13.mlp.router.classifier": {
637
  "act_bits": 16,
638
- "bits": 8,
639
  "data_type": "int",
640
  "group_size": 128,
641
  "sym": true
@@ -754,7 +754,7 @@
754
  },
755
  "model.layers.14.mlp.router.classifier": {
756
  "act_bits": 16,
757
- "bits": 8,
758
  "data_type": "int",
759
  "group_size": 128,
760
  "sym": true
@@ -873,7 +873,7 @@
873
  },
874
  "model.layers.15.mlp.router.classifier": {
875
  "act_bits": 16,
876
- "bits": 8,
877
  "data_type": "int",
878
  "group_size": 128,
879
  "sym": true
@@ -992,7 +992,7 @@
992
  },
993
  "model.layers.16.mlp.router.classifier": {
994
  "act_bits": 16,
995
- "bits": 8,
996
  "data_type": "int",
997
  "group_size": 128,
998
  "sym": true
@@ -1111,7 +1111,7 @@
1111
  },
1112
  "model.layers.17.mlp.router.classifier": {
1113
  "act_bits": 16,
1114
- "bits": 8,
1115
  "data_type": "int",
1116
  "group_size": 128,
1117
  "sym": true
@@ -1230,7 +1230,7 @@
1230
  },
1231
  "model.layers.18.mlp.router.classifier": {
1232
  "act_bits": 16,
1233
- "bits": 8,
1234
  "data_type": "int",
1235
  "group_size": 128,
1236
  "sym": true
@@ -1349,7 +1349,7 @@
1349
  },
1350
  "model.layers.19.mlp.router.classifier": {
1351
  "act_bits": 16,
1352
- "bits": 8,
1353
  "data_type": "int",
1354
  "group_size": 128,
1355
  "sym": true
@@ -1468,7 +1468,7 @@
1468
  },
1469
  "model.layers.2.mlp.router.classifier": {
1470
  "act_bits": 16,
1471
- "bits": 8,
1472
  "data_type": "int",
1473
  "group_size": 128,
1474
  "sym": true
@@ -1587,7 +1587,7 @@
1587
  },
1588
  "model.layers.20.mlp.router.classifier": {
1589
  "act_bits": 16,
1590
- "bits": 8,
1591
  "data_type": "int",
1592
  "group_size": 128,
1593
  "sym": true
@@ -1706,7 +1706,7 @@
1706
  },
1707
  "model.layers.21.mlp.router.classifier": {
1708
  "act_bits": 16,
1709
- "bits": 8,
1710
  "data_type": "int",
1711
  "group_size": 128,
1712
  "sym": true
@@ -1825,7 +1825,7 @@
1825
  },
1826
  "model.layers.22.mlp.router.classifier": {
1827
  "act_bits": 16,
1828
- "bits": 8,
1829
  "data_type": "int",
1830
  "group_size": 128,
1831
  "sym": true
@@ -1944,7 +1944,7 @@
1944
  },
1945
  "model.layers.23.mlp.router.classifier": {
1946
  "act_bits": 16,
1947
- "bits": 8,
1948
  "data_type": "int",
1949
  "group_size": 128,
1950
  "sym": true
@@ -2063,7 +2063,7 @@
2063
  },
2064
  "model.layers.24.mlp.router.classifier": {
2065
  "act_bits": 16,
2066
- "bits": 8,
2067
  "data_type": "int",
2068
  "group_size": 128,
2069
  "sym": true
@@ -2182,7 +2182,7 @@
2182
  },
2183
  "model.layers.25.mlp.router.classifier": {
2184
  "act_bits": 16,
2185
- "bits": 8,
2186
  "data_type": "int",
2187
  "group_size": 128,
2188
  "sym": true
@@ -2301,7 +2301,7 @@
2301
  },
2302
  "model.layers.26.mlp.router.classifier": {
2303
  "act_bits": 16,
2304
- "bits": 8,
2305
  "data_type": "int",
2306
  "group_size": 128,
2307
  "sym": true
@@ -2420,7 +2420,7 @@
2420
  },
2421
  "model.layers.27.mlp.router.classifier": {
2422
  "act_bits": 16,
2423
- "bits": 8,
2424
  "data_type": "int",
2425
  "group_size": 128,
2426
  "sym": true
@@ -2539,7 +2539,7 @@
2539
  },
2540
  "model.layers.3.mlp.router.classifier": {
2541
  "act_bits": 16,
2542
- "bits": 8,
2543
  "data_type": "int",
2544
  "group_size": 128,
2545
  "sym": true
@@ -2658,7 +2658,7 @@
2658
  },
2659
  "model.layers.4.mlp.router.classifier": {
2660
  "act_bits": 16,
2661
- "bits": 8,
2662
  "data_type": "int",
2663
  "group_size": 128,
2664
  "sym": true
@@ -2777,7 +2777,7 @@
2777
  },
2778
  "model.layers.5.mlp.router.classifier": {
2779
  "act_bits": 16,
2780
- "bits": 8,
2781
  "data_type": "int",
2782
  "group_size": 128,
2783
  "sym": true
@@ -2896,7 +2896,7 @@
2896
  },
2897
  "model.layers.6.mlp.router.classifier": {
2898
  "act_bits": 16,
2899
- "bits": 8,
2900
  "data_type": "int",
2901
  "group_size": 128,
2902
  "sym": true
@@ -3015,7 +3015,7 @@
3015
  },
3016
  "model.layers.7.mlp.router.classifier": {
3017
  "act_bits": 16,
3018
- "bits": 8,
3019
  "data_type": "int",
3020
  "group_size": 128,
3021
  "sym": true
@@ -3134,7 +3134,7 @@
3134
  },
3135
  "model.layers.8.mlp.router.classifier": {
3136
  "act_bits": 16,
3137
- "bits": 8,
3138
  "data_type": "int",
3139
  "group_size": 128,
3140
  "sym": true
@@ -3253,7 +3253,7 @@
3253
  },
3254
  "model.layers.9.mlp.router.classifier": {
3255
  "act_bits": 16,
3256
- "bits": 8,
3257
  "data_type": "int",
3258
  "group_size": 128,
3259
  "sym": true
 
40
  "extra_config": {
41
  "model.layers.0.mlp.router.classifier": {
42
  "act_bits": 16,
43
+ "bits": 16,
44
  "data_type": "int",
45
  "group_size": 128,
46
  "sym": true
 
159
  },
160
  "model.layers.1.mlp.router.classifier": {
161
  "act_bits": 16,
162
+ "bits": 16,
163
  "data_type": "int",
164
  "group_size": 128,
165
  "sym": true
 
278
  },
279
  "model.layers.10.mlp.router.classifier": {
280
  "act_bits": 16,
281
+ "bits": 16,
282
  "data_type": "int",
283
  "group_size": 128,
284
  "sym": true
 
397
  },
398
  "model.layers.11.mlp.router.classifier": {
399
  "act_bits": 16,
400
+ "bits": 16,
401
  "data_type": "int",
402
  "group_size": 128,
403
  "sym": true
 
516
  },
517
  "model.layers.12.mlp.router.classifier": {
518
  "act_bits": 16,
519
+ "bits": 16,
520
  "data_type": "int",
521
  "group_size": 128,
522
  "sym": true
 
635
  },
636
  "model.layers.13.mlp.router.classifier": {
637
  "act_bits": 16,
638
+ "bits": 16,
639
  "data_type": "int",
640
  "group_size": 128,
641
  "sym": true
 
754
  },
755
  "model.layers.14.mlp.router.classifier": {
756
  "act_bits": 16,
757
+ "bits": 16,
758
  "data_type": "int",
759
  "group_size": 128,
760
  "sym": true
 
873
  },
874
  "model.layers.15.mlp.router.classifier": {
875
  "act_bits": 16,
876
+ "bits": 16,
877
  "data_type": "int",
878
  "group_size": 128,
879
  "sym": true
 
992
  },
993
  "model.layers.16.mlp.router.classifier": {
994
  "act_bits": 16,
995
+ "bits": 16,
996
  "data_type": "int",
997
  "group_size": 128,
998
  "sym": true
 
1111
  },
1112
  "model.layers.17.mlp.router.classifier": {
1113
  "act_bits": 16,
1114
+ "bits": 16,
1115
  "data_type": "int",
1116
  "group_size": 128,
1117
  "sym": true
 
1230
  },
1231
  "model.layers.18.mlp.router.classifier": {
1232
  "act_bits": 16,
1233
+ "bits": 16,
1234
  "data_type": "int",
1235
  "group_size": 128,
1236
  "sym": true
 
1349
  },
1350
  "model.layers.19.mlp.router.classifier": {
1351
  "act_bits": 16,
1352
+ "bits": 16,
1353
  "data_type": "int",
1354
  "group_size": 128,
1355
  "sym": true
 
1468
  },
1469
  "model.layers.2.mlp.router.classifier": {
1470
  "act_bits": 16,
1471
+ "bits": 16,
1472
  "data_type": "int",
1473
  "group_size": 128,
1474
  "sym": true
 
1587
  },
1588
  "model.layers.20.mlp.router.classifier": {
1589
  "act_bits": 16,
1590
+ "bits": 16,
1591
  "data_type": "int",
1592
  "group_size": 128,
1593
  "sym": true
 
1706
  },
1707
  "model.layers.21.mlp.router.classifier": {
1708
  "act_bits": 16,
1709
+ "bits": 16,
1710
  "data_type": "int",
1711
  "group_size": 128,
1712
  "sym": true
 
1825
  },
1826
  "model.layers.22.mlp.router.classifier": {
1827
  "act_bits": 16,
1828
+ "bits": 16,
1829
  "data_type": "int",
1830
  "group_size": 128,
1831
  "sym": true
 
1944
  },
1945
  "model.layers.23.mlp.router.classifier": {
1946
  "act_bits": 16,
1947
+ "bits": 16,
1948
  "data_type": "int",
1949
  "group_size": 128,
1950
  "sym": true
 
2063
  },
2064
  "model.layers.24.mlp.router.classifier": {
2065
  "act_bits": 16,
2066
+ "bits": 16,
2067
  "data_type": "int",
2068
  "group_size": 128,
2069
  "sym": true
 
2182
  },
2183
  "model.layers.25.mlp.router.classifier": {
2184
  "act_bits": 16,
2185
+ "bits": 16,
2186
  "data_type": "int",
2187
  "group_size": 128,
2188
  "sym": true
 
2301
  },
2302
  "model.layers.26.mlp.router.classifier": {
2303
  "act_bits": 16,
2304
+ "bits": 16,
2305
  "data_type": "int",
2306
  "group_size": 128,
2307
  "sym": true
 
2420
  },
2421
  "model.layers.27.mlp.router.classifier": {
2422
  "act_bits": 16,
2423
+ "bits": 16,
2424
  "data_type": "int",
2425
  "group_size": 128,
2426
  "sym": true
 
2539
  },
2540
  "model.layers.3.mlp.router.classifier": {
2541
  "act_bits": 16,
2542
+ "bits": 16,
2543
  "data_type": "int",
2544
  "group_size": 128,
2545
  "sym": true
 
2658
  },
2659
  "model.layers.4.mlp.router.classifier": {
2660
  "act_bits": 16,
2661
+ "bits": 16,
2662
  "data_type": "int",
2663
  "group_size": 128,
2664
  "sym": true
 
2777
  },
2778
  "model.layers.5.mlp.router.classifier": {
2779
  "act_bits": 16,
2780
+ "bits": 16,
2781
  "data_type": "int",
2782
  "group_size": 128,
2783
  "sym": true
 
2896
  },
2897
  "model.layers.6.mlp.router.classifier": {
2898
  "act_bits": 16,
2899
+ "bits": 16,
2900
  "data_type": "int",
2901
  "group_size": 128,
2902
  "sym": true
 
3015
  },
3016
  "model.layers.7.mlp.router.classifier": {
3017
  "act_bits": 16,
3018
+ "bits": 16,
3019
  "data_type": "int",
3020
  "group_size": 128,
3021
  "sym": true
 
3134
  },
3135
  "model.layers.8.mlp.router.classifier": {
3136
  "act_bits": 16,
3137
+ "bits": 16,
3138
  "data_type": "int",
3139
  "group_size": 128,
3140
  "sym": true
 
3253
  },
3254
  "model.layers.9.mlp.router.classifier": {
3255
  "act_bits": 16,
3256
+ "bits": 16,
3257
  "data_type": "int",
3258
  "group_size": 128,
3259
  "sym": true
model-00003-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43d02bed6dafc4e1334cd2c60cf7f569717f7cd95b0062508c5ff0bc351257cc
3
- size 4994837976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dedc7cc247bfef2604688a1f817b76a682d77808369de8bab2938cf04364654e
3
+ size 4999445736
model-00005-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d49176fc6b3671651f67f94850370834813a212ed700a91e74c3de37537b6dd
3
- size 4994837976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:458569aa745d82c9eae7d984a09fbcc291caa854325e55619ff72bf257c60a8e
3
+ size 4999445736
model-00007-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36466d48d5edc97cf3a76142cdc5d01030769842eef2d7ba64917698deec6cf8
3
- size 4994838296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96a545be84b9f1decd636a7f8a32c6a1f59eaa8c9493d1965e6e378d0f7963e5
3
+ size 4999446056
model-00009-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d981cf843ec2d7fae26ad08d860800ca3c22812113183eb9a221444a51fb9278
3
- size 4994838616
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61164ac03a9044caed24b3f1e1a97e061f1823b0c7e1f11e32f8e2e03b309e21
3
+ size 4999446384
model-00011-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c6c717aef80208f00a380123622a02ace04a7a7da82b0b2c97c0c0bf59665c9
3
- size 4984081616
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e323febb7264e73adece23d2e2010b4b29756dd1349459ae79a18512c20ea0f8
3
+ size 4988689384
model-00014-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e01b088d9549be6c444e0f692ecec71dd4c89b8ba9184baef36b0dcafaf42bbd
3
- size 4994838320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:014d65d3759dde7c6cb63849792513034e8d1f388429939a6ddf19ded11ed12f
3
+ size 4999446088
model-00016-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b02b4c1ebd5b7427934142ec19988a8f71587dd7a0d7d3f3a3a5c25c9c0e28b
3
- size 4994838048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b64f6c1cfb5cfd8fc0246c22a8c24b7a9c8179a12836102c76d183a6c1dca0b4
3
+ size 4999445816
model-00018-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21b21568b9b92054203df88b5bae4da191ca5c3fccf267f4b5e0f6c497152add
3
- size 4994837984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c8f7c80573cac968f511a278ed3974eb62a4e825f210b95f525812b04c7513f
3
+ size 4999445744
model-00020-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66eca59142fa91e054960f63f53f1766ee52f261c58dacdfc5bb01943dfc7e04
3
- size 4994837984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44e7c239cf28b5abc3927372ec97ece605e1483270461f532d74f78922c78f4a
3
+ size 4999445744
model-00022-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c28a516a40d9590937fc3089ade4ceeee8a7537197b24f1680bb0a80fbaad01
3
- size 4994838880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d9e4f1fc277bc5c16e807510eefb6d387efbfe7ca32fe52326723de67a763b0
3
+ size 4999446648
model-00024-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3ed027e8b89b7211f234bb47e922dc73defb3ae6d8667e6aa763d818600c653
3
- size 4994840656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2a9b63cf5906e1074387a4d54f99f4f29f31debbc4997fbc3569dea906eeb07
3
+ size 4999448416
model-00026-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53e201e958133f95c45041443ce76a1eca26ba4a0a58aef47416181b72f68e67
3
- size 4938320624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:801ba1f6ea68f631111e892766db3962e4b1308345e2f3b2065b7868a3df57a9
3
+ size 4942928384
model-00029-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda3b5139bedf8f1f0be069b682b4a339bc280544335d9a29afa1de1e6284bed
3
- size 4994840368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b142a7a6f72b2982886c282ff1dba662de2a7f7a43acc9e9d41a3a65618a07f0
3
+ size 4999448136
model-00031-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4ed47b1db1ae5ddbd50a54e5ca93a2f6e15ce07dc4efcf3b50d84f9254d0c73
3
- size 4994840096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40c208573805fa73c4f08272f5c40bcde198e7c1790e8d16279e158e8ee6fe6e
3
+ size 4999447864
model-00033-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40e97cf44ba6d1027dfb3213402380a6c5d4ef451934233a11161d33d7976c69
3
- size 4994840032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03640c2d908660045dddaf193587accdf89d264da037617c085b2f8ea271bebe
3
+ size 4999447792
model-00035-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ea7ba424a4846c69bfd08bcec57f9061370ce6977dd6d44d02096ccf48d956d
3
- size 4994840032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bf8787c73a75db7f12ea04ea556c62e79cde235ff2554f233eb64f17a1c6eff
3
+ size 4999447792
model-00037-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cdc005d94768c7f8ca78ee526967aa804f86b49e84ff91153c8e9517f7d34453
3
- size 4994840328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b414f11d43d7dd7375ba73a3725c7fdd100ff355f830ff3a9575e01210532229
3
+ size 4999448096
model-00039-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:993f0113cf108afd6c56ee3ddefd906155f4338c2b2091ccb346158e71025842
3
- size 4994840656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74b41a6733cb5ea91712444c332140a56991242b8875ec4384616b9b16dc2208
3
+ size 4999448416
model-00041-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9bdb5d4e9a80cba58b4fbd232505b8cf659864c6f7406e756b8e5e6eb047987
3
- size 4938320624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb052399b4e15ff0e7f18d1cb1b8020e4b2de0cabe550c99a9706a15f737b40
3
+ size 4942928384
model-00044-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4bdf3f368b90b16998fa8a3e0ace222411bf42b91b9f0afc9351bdbc66aac70
3
- size 4994840368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2254af31b5909d75ffafb56598cd532e856a9bbf5c2ed002a1c42f25f6677a1
3
+ size 4999448136
model-00046-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:107f2fbaa9d60a185e2a5c64677da647957c757df8a6b93e508c3d4d8f31ad4b
3
- size 4994840096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37eabf9a7037fd2c2ffd3a70eb4ce5b0f4f85a9203148ed61fd99dd07288acd5
3
+ size 4999447864
model-00048-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d54454f233919dec55278bf15671968aeebf40ccf0820564e5a9373e26d7b1f6
3
- size 4994840032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f2557997e77f70df97ecaf17b4eba26d8f79f0796fae1979a5f01de33e71b0f
3
+ size 4999447792
model-00050-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8eb9d5743a197cc9272419e8c0d815e126edd246b49ef587a97bc229488ac304
3
- size 4994840032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97ee5c182390e75fb8736c516dd064e031ca391be9aee2a3e5194458e6949e8c
3
+ size 4999447792
model-00052-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c78c0a9e71cc759eebd11a9b575565499dd384a2c91242864e0254535b831f77
3
- size 4994840328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:941662f827317e364b30eea0b5d0056c1a8485fcf410c437e300ae4beedcf527
3
+ size 4999448096
model-00054-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0601777c0dc6e3e86a732173d95508ffd113b4fce94174fa9b9c90142031f9ab
3
- size 4994840656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c98b13d488bf63e2f18c6a74380edf8e3ea2ba7069d790c6e7e1e68c1843c97
3
+ size 4999448416
model-00056-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77958c4d4008ef133217ce283486720d1e225270139616cb3b0bda744dc67ab8
3
- size 4938320624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f234f8078fda6d34c033d698fd16e3135c2314343c636c655433f8b16889b872
3
+ size 4942928384
model-00059-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:784e3152e28322fa1df0427da54f0e02e1ebf753487b957ba8d50c65050531a6
3
- size 4994840368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bff1fa67b62fd1ad55b3b14b9593d63cc82f0c5c957f504b44cc0981947b13e
3
+ size 4999448136
model-00061-of-00061.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cef6c1244848727dab395b62706d513d4aebac102e20fb31a7cd09e7dd88167e
3
- size 3173233120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa45e514a5a410aea388eccb4e3db5635f5cdd658015f9ef80a7b0ce43db138f
3
+ size 3177840888
model.safetensors.index.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd11a4516d45204e651cbb7593c2153dcf7de411f75bc89fa7634f0e3131b1cc
3
- size 11899961
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90806d9ddadc141bb5e0c218e12847f692be28410ce9a8d9c76ab18d88e529d9
3
+ size 11895025
quantization_config.json CHANGED
@@ -9,7 +9,7 @@
9
  "packing_format": "auto_round:auto_gptq",
10
  "extra_config": {
11
  "model.layers.0.mlp.router.classifier": {
12
- "bits": 8,
13
  "group_size": 128,
14
  "sym": true,
15
  "data_type": "int",
@@ -128,7 +128,7 @@
128
  "act_bits": 16
129
  },
130
  "model.layers.1.mlp.router.classifier": {
131
- "bits": 8,
132
  "group_size": 128,
133
  "sym": true,
134
  "data_type": "int",
@@ -247,7 +247,7 @@
247
  "act_bits": 16
248
  },
249
  "model.layers.2.mlp.router.classifier": {
250
- "bits": 8,
251
  "group_size": 128,
252
  "sym": true,
253
  "data_type": "int",
@@ -366,7 +366,7 @@
366
  "act_bits": 16
367
  },
368
  "model.layers.3.mlp.router.classifier": {
369
- "bits": 8,
370
  "group_size": 128,
371
  "sym": true,
372
  "data_type": "int",
@@ -485,7 +485,7 @@
485
  "act_bits": 16
486
  },
487
  "model.layers.4.mlp.router.classifier": {
488
- "bits": 8,
489
  "group_size": 128,
490
  "sym": true,
491
  "data_type": "int",
@@ -604,7 +604,7 @@
604
  "act_bits": 16
605
  },
606
  "model.layers.5.mlp.router.classifier": {
607
- "bits": 8,
608
  "group_size": 128,
609
  "sym": true,
610
  "data_type": "int",
@@ -723,7 +723,7 @@
723
  "act_bits": 16
724
  },
725
  "model.layers.6.mlp.router.classifier": {
726
- "bits": 8,
727
  "group_size": 128,
728
  "sym": true,
729
  "data_type": "int",
@@ -842,7 +842,7 @@
842
  "act_bits": 16
843
  },
844
  "model.layers.7.mlp.router.classifier": {
845
- "bits": 8,
846
  "group_size": 128,
847
  "sym": true,
848
  "data_type": "int",
@@ -961,7 +961,7 @@
961
  "act_bits": 16
962
  },
963
  "model.layers.8.mlp.router.classifier": {
964
- "bits": 8,
965
  "group_size": 128,
966
  "sym": true,
967
  "data_type": "int",
@@ -1080,7 +1080,7 @@
1080
  "act_bits": 16
1081
  },
1082
  "model.layers.9.mlp.router.classifier": {
1083
- "bits": 8,
1084
  "group_size": 128,
1085
  "sym": true,
1086
  "data_type": "int",
@@ -1199,7 +1199,7 @@
1199
  "act_bits": 16
1200
  },
1201
  "model.layers.10.mlp.router.classifier": {
1202
- "bits": 8,
1203
  "group_size": 128,
1204
  "sym": true,
1205
  "data_type": "int",
@@ -1318,7 +1318,7 @@
1318
  "act_bits": 16
1319
  },
1320
  "model.layers.11.mlp.router.classifier": {
1321
- "bits": 8,
1322
  "group_size": 128,
1323
  "sym": true,
1324
  "data_type": "int",
@@ -1437,7 +1437,7 @@
1437
  "act_bits": 16
1438
  },
1439
  "model.layers.12.mlp.router.classifier": {
1440
- "bits": 8,
1441
  "group_size": 128,
1442
  "sym": true,
1443
  "data_type": "int",
@@ -1556,7 +1556,7 @@
1556
  "act_bits": 16
1557
  },
1558
  "model.layers.13.mlp.router.classifier": {
1559
- "bits": 8,
1560
  "group_size": 128,
1561
  "sym": true,
1562
  "data_type": "int",
@@ -1675,7 +1675,7 @@
1675
  "act_bits": 16
1676
  },
1677
  "model.layers.14.mlp.router.classifier": {
1678
- "bits": 8,
1679
  "group_size": 128,
1680
  "sym": true,
1681
  "data_type": "int",
@@ -1794,7 +1794,7 @@
1794
  "act_bits": 16
1795
  },
1796
  "model.layers.15.mlp.router.classifier": {
1797
- "bits": 8,
1798
  "group_size": 128,
1799
  "sym": true,
1800
  "data_type": "int",
@@ -1913,7 +1913,7 @@
1913
  "act_bits": 16
1914
  },
1915
  "model.layers.16.mlp.router.classifier": {
1916
- "bits": 8,
1917
  "group_size": 128,
1918
  "sym": true,
1919
  "data_type": "int",
@@ -2032,7 +2032,7 @@
2032
  "act_bits": 16
2033
  },
2034
  "model.layers.17.mlp.router.classifier": {
2035
- "bits": 8,
2036
  "group_size": 128,
2037
  "sym": true,
2038
  "data_type": "int",
@@ -2151,7 +2151,7 @@
2151
  "act_bits": 16
2152
  },
2153
  "model.layers.18.mlp.router.classifier": {
2154
- "bits": 8,
2155
  "group_size": 128,
2156
  "sym": true,
2157
  "data_type": "int",
@@ -2270,7 +2270,7 @@
2270
  "act_bits": 16
2271
  },
2272
  "model.layers.19.mlp.router.classifier": {
2273
- "bits": 8,
2274
  "group_size": 128,
2275
  "sym": true,
2276
  "data_type": "int",
@@ -2389,7 +2389,7 @@
2389
  "act_bits": 16
2390
  },
2391
  "model.layers.20.mlp.router.classifier": {
2392
- "bits": 8,
2393
  "group_size": 128,
2394
  "sym": true,
2395
  "data_type": "int",
@@ -2508,7 +2508,7 @@
2508
  "act_bits": 16
2509
  },
2510
  "model.layers.21.mlp.router.classifier": {
2511
- "bits": 8,
2512
  "group_size": 128,
2513
  "sym": true,
2514
  "data_type": "int",
@@ -2627,7 +2627,7 @@
2627
  "act_bits": 16
2628
  },
2629
  "model.layers.22.mlp.router.classifier": {
2630
- "bits": 8,
2631
  "group_size": 128,
2632
  "sym": true,
2633
  "data_type": "int",
@@ -2746,7 +2746,7 @@
2746
  "act_bits": 16
2747
  },
2748
  "model.layers.23.mlp.router.classifier": {
2749
- "bits": 8,
2750
  "group_size": 128,
2751
  "sym": true,
2752
  "data_type": "int",
@@ -2865,7 +2865,7 @@
2865
  "act_bits": 16
2866
  },
2867
  "model.layers.24.mlp.router.classifier": {
2868
- "bits": 8,
2869
  "group_size": 128,
2870
  "sym": true,
2871
  "data_type": "int",
@@ -2984,7 +2984,7 @@
2984
  "act_bits": 16
2985
  },
2986
  "model.layers.25.mlp.router.classifier": {
2987
- "bits": 8,
2988
  "group_size": 128,
2989
  "sym": true,
2990
  "data_type": "int",
@@ -3103,7 +3103,7 @@
3103
  "act_bits": 16
3104
  },
3105
  "model.layers.26.mlp.router.classifier": {
3106
- "bits": 8,
3107
  "group_size": 128,
3108
  "sym": true,
3109
  "data_type": "int",
@@ -3222,7 +3222,7 @@
3222
  "act_bits": 16
3223
  },
3224
  "model.layers.27.mlp.router.classifier": {
3225
- "bits": 8,
3226
  "group_size": 128,
3227
  "sym": true,
3228
  "data_type": "int",
 
9
  "packing_format": "auto_round:auto_gptq",
10
  "extra_config": {
11
  "model.layers.0.mlp.router.classifier": {
12
+ "bits": 16,
13
  "group_size": 128,
14
  "sym": true,
15
  "data_type": "int",
 
128
  "act_bits": 16
129
  },
130
  "model.layers.1.mlp.router.classifier": {
131
+ "bits": 16,
132
  "group_size": 128,
133
  "sym": true,
134
  "data_type": "int",
 
247
  "act_bits": 16
248
  },
249
  "model.layers.2.mlp.router.classifier": {
250
+ "bits": 16,
251
  "group_size": 128,
252
  "sym": true,
253
  "data_type": "int",
 
366
  "act_bits": 16
367
  },
368
  "model.layers.3.mlp.router.classifier": {
369
+ "bits": 16,
370
  "group_size": 128,
371
  "sym": true,
372
  "data_type": "int",
 
485
  "act_bits": 16
486
  },
487
  "model.layers.4.mlp.router.classifier": {
488
+ "bits": 16,
489
  "group_size": 128,
490
  "sym": true,
491
  "data_type": "int",
 
604
  "act_bits": 16
605
  },
606
  "model.layers.5.mlp.router.classifier": {
607
+ "bits": 16,
608
  "group_size": 128,
609
  "sym": true,
610
  "data_type": "int",
 
723
  "act_bits": 16
724
  },
725
  "model.layers.6.mlp.router.classifier": {
726
+ "bits": 16,
727
  "group_size": 128,
728
  "sym": true,
729
  "data_type": "int",
 
842
  "act_bits": 16
843
  },
844
  "model.layers.7.mlp.router.classifier": {
845
+ "bits": 16,
846
  "group_size": 128,
847
  "sym": true,
848
  "data_type": "int",
 
961
  "act_bits": 16
962
  },
963
  "model.layers.8.mlp.router.classifier": {
964
+ "bits": 16,
965
  "group_size": 128,
966
  "sym": true,
967
  "data_type": "int",
 
1080
  "act_bits": 16
1081
  },
1082
  "model.layers.9.mlp.router.classifier": {
1083
+ "bits": 16,
1084
  "group_size": 128,
1085
  "sym": true,
1086
  "data_type": "int",
 
1199
  "act_bits": 16
1200
  },
1201
  "model.layers.10.mlp.router.classifier": {
1202
+ "bits": 16,
1203
  "group_size": 128,
1204
  "sym": true,
1205
  "data_type": "int",
 
1318
  "act_bits": 16
1319
  },
1320
  "model.layers.11.mlp.router.classifier": {
1321
+ "bits": 16,
1322
  "group_size": 128,
1323
  "sym": true,
1324
  "data_type": "int",
 
1437
  "act_bits": 16
1438
  },
1439
  "model.layers.12.mlp.router.classifier": {
1440
+ "bits": 16,
1441
  "group_size": 128,
1442
  "sym": true,
1443
  "data_type": "int",
 
1556
  "act_bits": 16
1557
  },
1558
  "model.layers.13.mlp.router.classifier": {
1559
+ "bits": 16,
1560
  "group_size": 128,
1561
  "sym": true,
1562
  "data_type": "int",
 
1675
  "act_bits": 16
1676
  },
1677
  "model.layers.14.mlp.router.classifier": {
1678
+ "bits": 16,
1679
  "group_size": 128,
1680
  "sym": true,
1681
  "data_type": "int",
 
1794
  "act_bits": 16
1795
  },
1796
  "model.layers.15.mlp.router.classifier": {
1797
+ "bits": 16,
1798
  "group_size": 128,
1799
  "sym": true,
1800
  "data_type": "int",
 
1913
  "act_bits": 16
1914
  },
1915
  "model.layers.16.mlp.router.classifier": {
1916
+ "bits": 16,
1917
  "group_size": 128,
1918
  "sym": true,
1919
  "data_type": "int",
 
2032
  "act_bits": 16
2033
  },
2034
  "model.layers.17.mlp.router.classifier": {
2035
+ "bits": 16,
2036
  "group_size": 128,
2037
  "sym": true,
2038
  "data_type": "int",
 
2151
  "act_bits": 16
2152
  },
2153
  "model.layers.18.mlp.router.classifier": {
2154
+ "bits": 16,
2155
  "group_size": 128,
2156
  "sym": true,
2157
  "data_type": "int",
 
2270
  "act_bits": 16
2271
  },
2272
  "model.layers.19.mlp.router.classifier": {
2273
+ "bits": 16,
2274
  "group_size": 128,
2275
  "sym": true,
2276
  "data_type": "int",
 
2389
  "act_bits": 16
2390
  },
2391
  "model.layers.20.mlp.router.classifier": {
2392
+ "bits": 16,
2393
  "group_size": 128,
2394
  "sym": true,
2395
  "data_type": "int",
 
2508
  "act_bits": 16
2509
  },
2510
  "model.layers.21.mlp.router.classifier": {
2511
+ "bits": 16,
2512
  "group_size": 128,
2513
  "sym": true,
2514
  "data_type": "int",
 
2627
  "act_bits": 16
2628
  },
2629
  "model.layers.22.mlp.router.classifier": {
2630
+ "bits": 16,
2631
  "group_size": 128,
2632
  "sym": true,
2633
  "data_type": "int",
 
2746
  "act_bits": 16
2747
  },
2748
  "model.layers.23.mlp.router.classifier": {
2749
+ "bits": 16,
2750
  "group_size": 128,
2751
  "sym": true,
2752
  "data_type": "int",
 
2865
  "act_bits": 16
2866
  },
2867
  "model.layers.24.mlp.router.classifier": {
2868
+ "bits": 16,
2869
  "group_size": 128,
2870
  "sym": true,
2871
  "data_type": "int",
 
2984
  "act_bits": 16
2985
  },
2986
  "model.layers.25.mlp.router.classifier": {
2987
+ "bits": 16,
2988
  "group_size": 128,
2989
  "sym": true,
2990
  "data_type": "int",
 
3103
  "act_bits": 16
3104
  },
3105
  "model.layers.26.mlp.router.classifier": {
3106
+ "bits": 16,
3107
  "group_size": 128,
3108
  "sym": true,
3109
  "data_type": "int",
 
3222
  "act_bits": 16
3223
  },
3224
  "model.layers.27.mlp.router.classifier": {
3225
+ "bits": 16,
3226
  "group_size": 128,
3227
  "sym": true,
3228
  "data_type": "int",