NicoNico6 committed on
Commit
db2b361
1 Parent(s): 7a7c71f
Files changed (2) hide show
  1. model.safetensors +2 -2
  2. quant_strategy.json +93 -93
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1479d41168e66acccc7278685851fca7d327062f186688b09d20c635ab7d6362
3
- size 2817405528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f49bd33dea3023b79936ea738a31c465f42f0d369f2387e61b8ef6ae3a1a7489
3
+ size 2817405544
quant_strategy.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "measurement": {
3
  "model.layers.0": {
4
- "accuracy": 0.877131462097168,
5
- "total_bits": 606753024,
6
  "q_proj": {
7
  "group_size": {
8
  "2": 64
@@ -17,10 +17,10 @@
17
  },
18
  "k_proj": {
19
  "group_size": {
20
- "2": 64
21
  },
22
  "bits": [
23
- 2
24
  ],
25
  "bits_prop": [
26
  1
@@ -41,10 +41,10 @@
41
  },
42
  "o_proj": {
43
  "group_size": {
44
- "4": 128
45
  },
46
  "bits": [
47
- 4
48
  ],
49
  "bits_prop": [
50
  1
@@ -77,10 +77,10 @@
77
  },
78
  "down_proj": {
79
  "group_size": {
80
- "4": 128
81
  },
82
  "bits": [
83
- 4
84
  ],
85
  "bits_prop": [
86
  1
@@ -89,8 +89,8 @@
89
  }
90
  },
91
  "model.layers.1": {
92
- "accuracy": 0.8948612213134766,
93
- "total_bits": 573724416,
94
  "q_proj": {
95
  "group_size": {
96
  "2": 64
@@ -165,10 +165,10 @@
165
  },
166
  "down_proj": {
167
  "group_size": {
168
- "4": 128
169
  },
170
  "bits": [
171
- 4
172
  ],
173
  "bits_prop": [
174
  1
@@ -177,7 +177,7 @@
177
  }
178
  },
179
  "model.layers.2": {
180
- "accuracy": 0.9520481824874878,
181
  "total_bits": 458124288,
182
  "q_proj": {
183
  "group_size": {
@@ -265,8 +265,8 @@
265
  }
266
  },
267
  "model.layers.3": {
268
- "accuracy": 0.9584293961524963,
269
- "total_bits": 466380288,
270
  "q_proj": {
271
  "group_size": {
272
  "2": 64
@@ -281,10 +281,10 @@
281
  },
282
  "k_proj": {
283
  "group_size": {
284
- "4": 128
285
  },
286
  "bits": [
287
- 4
288
  ],
289
  "bits_prop": [
290
  1
@@ -353,7 +353,7 @@
353
  }
354
  },
355
  "model.layers.4": {
356
- "accuracy": 0.9498380422592163,
357
  "total_bits": 458124288,
358
  "q_proj": {
359
  "group_size": {
@@ -441,7 +441,7 @@
441
  }
442
  },
443
  "model.layers.5": {
444
- "accuracy": 0.9403245449066162,
445
  "total_bits": 458124288,
446
  "q_proj": {
447
  "group_size": {
@@ -529,7 +529,7 @@
529
  }
530
  },
531
  "model.layers.6": {
532
- "accuracy": 0.9329239130020142,
533
  "total_bits": 458124288,
534
  "q_proj": {
535
  "group_size": {
@@ -617,7 +617,7 @@
617
  }
618
  },
619
  "model.layers.7": {
620
- "accuracy": 0.9157736301422119,
621
  "total_bits": 458124288,
622
  "q_proj": {
623
  "group_size": {
@@ -705,8 +705,8 @@
705
  }
706
  },
707
  "model.layers.8": {
708
- "accuracy": 0.9307241439819336,
709
- "total_bits": 491152896,
710
  "q_proj": {
711
  "group_size": {
712
  "2": 64
@@ -745,10 +745,10 @@
745
  },
746
  "o_proj": {
747
  "group_size": {
748
- "4": 128
749
  },
750
  "bits": [
751
- 4
752
  ],
753
  "bits_prop": [
754
  1
@@ -793,7 +793,7 @@
793
  }
794
  },
795
  "model.layers.9": {
796
- "accuracy": 0.9189841747283936,
797
  "total_bits": 458124288,
798
  "q_proj": {
799
  "group_size": {
@@ -881,7 +881,7 @@
881
  }
882
  },
883
  "model.layers.10": {
884
- "accuracy": 0.9128692150115967,
885
  "total_bits": 458124288,
886
  "q_proj": {
887
  "group_size": {
@@ -969,7 +969,7 @@
969
  }
970
  },
971
  "model.layers.11": {
972
- "accuracy": 0.9105658531188965,
973
  "total_bits": 458124288,
974
  "q_proj": {
975
  "group_size": {
@@ -1057,14 +1057,14 @@
1057
  }
1058
  },
1059
  "model.layers.12": {
1060
- "accuracy": 0.9119572639465332,
1061
- "total_bits": 491152896,
1062
  "q_proj": {
1063
  "group_size": {
1064
- "4": 128
1065
  },
1066
  "bits": [
1067
- 4
1068
  ],
1069
  "bits_prop": [
1070
  1
@@ -1073,10 +1073,10 @@
1073
  },
1074
  "k_proj": {
1075
  "group_size": {
1076
- "2": 64
1077
  },
1078
  "bits": [
1079
- 2
1080
  ],
1081
  "bits_prop": [
1082
  1
@@ -1145,7 +1145,7 @@
1145
  }
1146
  },
1147
  "model.layers.13": {
1148
- "accuracy": 0.9047572612762451,
1149
  "total_bits": 458124288,
1150
  "q_proj": {
1151
  "group_size": {
@@ -1233,7 +1233,7 @@
1233
  }
1234
  },
1235
  "model.layers.14": {
1236
- "accuracy": 0.8954880237579346,
1237
  "total_bits": 458124288,
1238
  "q_proj": {
1239
  "group_size": {
@@ -1321,7 +1321,7 @@
1321
  }
1322
  },
1323
  "model.layers.15": {
1324
- "accuracy": 0.8818550109863281,
1325
  "total_bits": 458124288,
1326
  "q_proj": {
1327
  "group_size": {
@@ -1409,7 +1409,7 @@
1409
  }
1410
  },
1411
  "model.layers.16": {
1412
- "accuracy": 0.8823418617248535,
1413
  "total_bits": 458124288,
1414
  "q_proj": {
1415
  "group_size": {
@@ -1497,8 +1497,8 @@
1497
  }
1498
  },
1499
  "model.layers.17": {
1500
- "accuracy": 0.8916378021240234,
1501
- "total_bits": 491152896,
1502
  "q_proj": {
1503
  "group_size": {
1504
  "2": 64
@@ -1513,10 +1513,10 @@
1513
  },
1514
  "k_proj": {
1515
  "group_size": {
1516
- "2": 64
1517
  },
1518
  "bits": [
1519
- 2
1520
  ],
1521
  "bits_prop": [
1522
  1
@@ -1537,10 +1537,10 @@
1537
  },
1538
  "o_proj": {
1539
  "group_size": {
1540
- "4": 128
1541
  },
1542
  "bits": [
1543
- 4
1544
  ],
1545
  "bits_prop": [
1546
  1
@@ -1585,8 +1585,8 @@
1585
  }
1586
  },
1587
  "model.layers.18": {
1588
- "accuracy": 0.8813910484313965,
1589
- "total_bits": 491152896,
1590
  "q_proj": {
1591
  "group_size": {
1592
  "2": 64
@@ -1601,10 +1601,10 @@
1601
  },
1602
  "k_proj": {
1603
  "group_size": {
1604
- "2": 64
1605
  },
1606
  "bits": [
1607
- 2
1608
  ],
1609
  "bits_prop": [
1610
  1
@@ -1625,10 +1625,10 @@
1625
  },
1626
  "o_proj": {
1627
  "group_size": {
1628
- "4": 128
1629
  },
1630
  "bits": [
1631
- 4
1632
  ],
1633
  "bits_prop": [
1634
  1
@@ -1673,8 +1673,8 @@
1673
  }
1674
  },
1675
  "model.layers.19": {
1676
- "accuracy": 0.879364013671875,
1677
- "total_bits": 491152896,
1678
  "q_proj": {
1679
  "group_size": {
1680
  "2": 64
@@ -1713,10 +1713,10 @@
1713
  },
1714
  "o_proj": {
1715
  "group_size": {
1716
- "4": 128
1717
  },
1718
  "bits": [
1719
- 4
1720
  ],
1721
  "bits_prop": [
1722
  1
@@ -1761,8 +1761,8 @@
1761
  }
1762
  },
1763
  "model.layers.20": {
1764
- "accuracy": 0.8831210136413574,
1765
- "total_bits": 458124288,
1766
  "q_proj": {
1767
  "group_size": {
1768
  "2": 64
@@ -1777,10 +1777,10 @@
1777
  },
1778
  "k_proj": {
1779
  "group_size": {
1780
- "2": 64
1781
  },
1782
  "bits": [
1783
- 2
1784
  ],
1785
  "bits_prop": [
1786
  1
@@ -1849,7 +1849,7 @@
1849
  }
1850
  },
1851
  "model.layers.21": {
1852
- "accuracy": 0.8880167007446289,
1853
  "total_bits": 458124288,
1854
  "q_proj": {
1855
  "group_size": {
@@ -1937,7 +1937,7 @@
1937
  }
1938
  },
1939
  "model.layers.22": {
1940
- "accuracy": 0.8944659233093262,
1941
  "total_bits": 458124288,
1942
  "q_proj": {
1943
  "group_size": {
@@ -2025,8 +2025,8 @@
2025
  }
2026
  },
2027
  "model.layers.23": {
2028
- "accuracy": 0.8957762718200684,
2029
- "total_bits": 466380288,
2030
  "q_proj": {
2031
  "group_size": {
2032
  "2": 64
@@ -2041,10 +2041,10 @@
2041
  },
2042
  "k_proj": {
2043
  "group_size": {
2044
- "4": 128
2045
  },
2046
  "bits": [
2047
- 4
2048
  ],
2049
  "bits_prop": [
2050
  1
@@ -2113,7 +2113,7 @@
2113
  }
2114
  },
2115
  "model.layers.24": {
2116
- "accuracy": 0.892493724822998,
2117
  "total_bits": 458124288,
2118
  "q_proj": {
2119
  "group_size": {
@@ -2201,7 +2201,7 @@
2201
  }
2202
  },
2203
  "model.layers.25": {
2204
- "accuracy": 0.8929567337036133,
2205
  "total_bits": 458124288,
2206
  "q_proj": {
2207
  "group_size": {
@@ -2289,8 +2289,8 @@
2289
  }
2290
  },
2291
  "model.layers.26": {
2292
- "accuracy": 0.8940300941467285,
2293
- "total_bits": 466380288,
2294
  "q_proj": {
2295
  "group_size": {
2296
  "2": 64
@@ -2305,10 +2305,10 @@
2305
  },
2306
  "k_proj": {
2307
  "group_size": {
2308
- "4": 128
2309
  },
2310
  "bits": [
2311
- 4
2312
  ],
2313
  "bits_prop": [
2314
  1
@@ -2377,8 +2377,8 @@
2377
  }
2378
  },
2379
  "model.layers.27": {
2380
- "accuracy": 0.8957915306091309,
2381
- "total_bits": 466380288,
2382
  "q_proj": {
2383
  "group_size": {
2384
  "2": 64
@@ -2393,10 +2393,10 @@
2393
  },
2394
  "k_proj": {
2395
  "group_size": {
2396
- "4": 128
2397
  },
2398
  "bits": [
2399
- 4
2400
  ],
2401
  "bits_prop": [
2402
  1
@@ -2465,7 +2465,7 @@
2465
  }
2466
  },
2467
  "model.layers.28": {
2468
- "accuracy": 0.8838896751403809,
2469
  "total_bits": 458124288,
2470
  "q_proj": {
2471
  "group_size": {
@@ -2553,8 +2553,8 @@
2553
  }
2554
  },
2555
  "model.layers.29": {
2556
- "accuracy": 0.8807954788208008,
2557
- "total_bits": 458124288,
2558
  "q_proj": {
2559
  "group_size": {
2560
  "2": 64
@@ -2629,10 +2629,10 @@
2629
  },
2630
  "down_proj": {
2631
  "group_size": {
2632
- "2": 64
2633
  },
2634
  "bits": [
2635
- 2
2636
  ],
2637
  "bits_prop": [
2638
  1
@@ -2641,8 +2641,8 @@
2641
  }
2642
  },
2643
  "model.layers.30": {
2644
- "accuracy": 0.9012184143066406,
2645
- "total_bits": 573724416,
2646
  "q_proj": {
2647
  "group_size": {
2648
  "2": 64
@@ -2681,10 +2681,10 @@
2681
  },
2682
  "o_proj": {
2683
  "group_size": {
2684
- "2": 64
2685
  },
2686
  "bits": [
2687
- 2
2688
  ],
2689
  "bits_prop": [
2690
  1
@@ -2729,8 +2729,8 @@
2729
  }
2730
  },
2731
  "model.layers.31": {
2732
- "accuracy": 0.8941550254821777,
2733
- "total_bits": 573724416,
2734
  "q_proj": {
2735
  "group_size": {
2736
  "2": 64
@@ -2745,10 +2745,10 @@
2745
  },
2746
  "k_proj": {
2747
  "group_size": {
2748
- "2": 64
2749
  },
2750
  "bits": [
2751
- 2
2752
  ],
2753
  "bits_prop": [
2754
  1
@@ -2769,10 +2769,10 @@
2769
  },
2770
  "o_proj": {
2771
  "group_size": {
2772
- "2": 64
2773
  },
2774
  "bits": [
2775
- 2
2776
  ],
2777
  "bits_prop": [
2778
  1
@@ -2781,10 +2781,10 @@
2781
  },
2782
  "up_proj": {
2783
  "group_size": {
2784
- "2": 64
2785
  },
2786
  "bits": [
2787
- 2
2788
  ],
2789
  "bits_prop": [
2790
  1
@@ -2793,10 +2793,10 @@
2793
  },
2794
  "gate_proj": {
2795
  "group_size": {
2796
- "2": 64
2797
  },
2798
  "bits": [
2799
- 2
2800
  ],
2801
  "bits_prop": [
2802
  1
 
1
  {
2
  "measurement": {
3
  "model.layers.0": {
4
+ "accuracy": 0.7869586944580078,
5
+ "total_bits": 466380288,
6
  "q_proj": {
7
  "group_size": {
8
  "2": 64
 
17
  },
18
  "k_proj": {
19
  "group_size": {
20
+ "4": 128
21
  },
22
  "bits": [
23
+ 4
24
  ],
25
  "bits_prop": [
26
  1
 
41
  },
42
  "o_proj": {
43
  "group_size": {
44
+ "2": 64
45
  },
46
  "bits": [
47
+ 2
48
  ],
49
  "bits_prop": [
50
  1
 
77
  },
78
  "down_proj": {
79
  "group_size": {
80
+ "2": 64
81
  },
82
  "bits": [
83
+ 2
84
  ],
85
  "bits_prop": [
86
  1
 
89
  }
90
  },
91
  "model.layers.1": {
92
+ "accuracy": 0.647979736328125,
93
+ "total_bits": 458124288,
94
  "q_proj": {
95
  "group_size": {
96
  "2": 64
 
165
  },
166
  "down_proj": {
167
  "group_size": {
168
+ "2": 64
169
  },
170
  "bits": [
171
+ 2
172
  ],
173
  "bits_prop": [
174
  1
 
177
  }
178
  },
179
  "model.layers.2": {
180
+ "accuracy": 0.9489546418190002,
181
  "total_bits": 458124288,
182
  "q_proj": {
183
  "group_size": {
 
265
  }
266
  },
267
  "model.layers.3": {
268
+ "accuracy": 0.9539257287979126,
269
+ "total_bits": 458124288,
270
  "q_proj": {
271
  "group_size": {
272
  "2": 64
 
281
  },
282
  "k_proj": {
283
  "group_size": {
284
+ "2": 64
285
  },
286
  "bits": [
287
+ 2
288
  ],
289
  "bits_prop": [
290
  1
 
353
  }
354
  },
355
  "model.layers.4": {
356
+ "accuracy": 0.948026180267334,
357
  "total_bits": 458124288,
358
  "q_proj": {
359
  "group_size": {
 
441
  }
442
  },
443
  "model.layers.5": {
444
+ "accuracy": 0.938827395439148,
445
  "total_bits": 458124288,
446
  "q_proj": {
447
  "group_size": {
 
529
  }
530
  },
531
  "model.layers.6": {
532
+ "accuracy": 0.9337625503540039,
533
  "total_bits": 458124288,
534
  "q_proj": {
535
  "group_size": {
 
617
  }
618
  },
619
  "model.layers.7": {
620
+ "accuracy": 0.9189379215240479,
621
  "total_bits": 458124288,
622
  "q_proj": {
623
  "group_size": {
 
705
  }
706
  },
707
  "model.layers.8": {
708
+ "accuracy": 0.9234421253204346,
709
+ "total_bits": 458124288,
710
  "q_proj": {
711
  "group_size": {
712
  "2": 64
 
745
  },
746
  "o_proj": {
747
  "group_size": {
748
+ "2": 64
749
  },
750
  "bits": [
751
+ 2
752
  ],
753
  "bits_prop": [
754
  1
 
793
  }
794
  },
795
  "model.layers.9": {
796
+ "accuracy": 0.9196293354034424,
797
  "total_bits": 458124288,
798
  "q_proj": {
799
  "group_size": {
 
881
  }
882
  },
883
  "model.layers.10": {
884
+ "accuracy": 0.9117538928985596,
885
  "total_bits": 458124288,
886
  "q_proj": {
887
  "group_size": {
 
969
  }
970
  },
971
  "model.layers.11": {
972
+ "accuracy": 0.9103360176086426,
973
  "total_bits": 458124288,
974
  "q_proj": {
975
  "group_size": {
 
1057
  }
1058
  },
1059
  "model.layers.12": {
1060
+ "accuracy": 0.9095911979675293,
1061
+ "total_bits": 466380288,
1062
  "q_proj": {
1063
  "group_size": {
1064
+ "2": 64
1065
  },
1066
  "bits": [
1067
+ 2
1068
  ],
1069
  "bits_prop": [
1070
  1
 
1073
  },
1074
  "k_proj": {
1075
  "group_size": {
1076
+ "4": 128
1077
  },
1078
  "bits": [
1079
+ 4
1080
  ],
1081
  "bits_prop": [
1082
  1
 
1145
  }
1146
  },
1147
  "model.layers.13": {
1148
+ "accuracy": 0.9048597812652588,
1149
  "total_bits": 458124288,
1150
  "q_proj": {
1151
  "group_size": {
 
1233
  }
1234
  },
1235
  "model.layers.14": {
1236
+ "accuracy": 0.8939895629882812,
1237
  "total_bits": 458124288,
1238
  "q_proj": {
1239
  "group_size": {
 
1321
  }
1322
  },
1323
  "model.layers.15": {
1324
+ "accuracy": 0.88232421875,
1325
  "total_bits": 458124288,
1326
  "q_proj": {
1327
  "group_size": {
 
1409
  }
1410
  },
1411
  "model.layers.16": {
1412
+ "accuracy": 0.8802495002746582,
1413
  "total_bits": 458124288,
1414
  "q_proj": {
1415
  "group_size": {
 
1497
  }
1498
  },
1499
  "model.layers.17": {
1500
+ "accuracy": 0.8810954093933105,
1501
+ "total_bits": 466380288,
1502
  "q_proj": {
1503
  "group_size": {
1504
  "2": 64
 
1513
  },
1514
  "k_proj": {
1515
  "group_size": {
1516
+ "4": 128
1517
  },
1518
  "bits": [
1519
+ 4
1520
  ],
1521
  "bits_prop": [
1522
  1
 
1537
  },
1538
  "o_proj": {
1539
  "group_size": {
1540
+ "2": 64
1541
  },
1542
  "bits": [
1543
+ 2
1544
  ],
1545
  "bits_prop": [
1546
  1
 
1585
  }
1586
  },
1587
  "model.layers.18": {
1588
+ "accuracy": 0.8681793212890625,
1589
+ "total_bits": 466380288,
1590
  "q_proj": {
1591
  "group_size": {
1592
  "2": 64
 
1601
  },
1602
  "k_proj": {
1603
  "group_size": {
1604
+ "4": 128
1605
  },
1606
  "bits": [
1607
+ 4
1608
  ],
1609
  "bits_prop": [
1610
  1
 
1625
  },
1626
  "o_proj": {
1627
  "group_size": {
1628
+ "2": 64
1629
  },
1630
  "bits": [
1631
+ 2
1632
  ],
1633
  "bits_prop": [
1634
  1
 
1673
  }
1674
  },
1675
  "model.layers.19": {
1676
+ "accuracy": 0.865323543548584,
1677
+ "total_bits": 458124288,
1678
  "q_proj": {
1679
  "group_size": {
1680
  "2": 64
 
1713
  },
1714
  "o_proj": {
1715
  "group_size": {
1716
+ "2": 64
1717
  },
1718
  "bits": [
1719
+ 2
1720
  ],
1721
  "bits_prop": [
1722
  1
 
1761
  }
1762
  },
1763
  "model.layers.20": {
1764
+ "accuracy": 0.8790159225463867,
1765
+ "total_bits": 466380288,
1766
  "q_proj": {
1767
  "group_size": {
1768
  "2": 64
 
1777
  },
1778
  "k_proj": {
1779
  "group_size": {
1780
+ "4": 128
1781
  },
1782
  "bits": [
1783
+ 4
1784
  ],
1785
  "bits_prop": [
1786
  1
 
1849
  }
1850
  },
1851
  "model.layers.21": {
1852
+ "accuracy": 0.8824334144592285,
1853
  "total_bits": 458124288,
1854
  "q_proj": {
1855
  "group_size": {
 
1937
  }
1938
  },
1939
  "model.layers.22": {
1940
+ "accuracy": 0.8895416259765625,
1941
  "total_bits": 458124288,
1942
  "q_proj": {
1943
  "group_size": {
 
2025
  }
2026
  },
2027
  "model.layers.23": {
2028
+ "accuracy": 0.889040470123291,
2029
+ "total_bits": 458124288,
2030
  "q_proj": {
2031
  "group_size": {
2032
  "2": 64
 
2041
  },
2042
  "k_proj": {
2043
  "group_size": {
2044
+ "2": 64
2045
  },
2046
  "bits": [
2047
+ 2
2048
  ],
2049
  "bits_prop": [
2050
  1
 
2113
  }
2114
  },
2115
  "model.layers.24": {
2116
+ "accuracy": 0.8891377449035645,
2117
  "total_bits": 458124288,
2118
  "q_proj": {
2119
  "group_size": {
 
2201
  }
2202
  },
2203
  "model.layers.25": {
2204
+ "accuracy": 0.888709545135498,
2205
  "total_bits": 458124288,
2206
  "q_proj": {
2207
  "group_size": {
 
2289
  }
2290
  },
2291
  "model.layers.26": {
2292
+ "accuracy": 0.8839888572692871,
2293
+ "total_bits": 458124288,
2294
  "q_proj": {
2295
  "group_size": {
2296
  "2": 64
 
2305
  },
2306
  "k_proj": {
2307
  "group_size": {
2308
+ "2": 64
2309
  },
2310
  "bits": [
2311
+ 2
2312
  ],
2313
  "bits_prop": [
2314
  1
 
2377
  }
2378
  },
2379
  "model.layers.27": {
2380
+ "accuracy": 0.8789157867431641,
2381
+ "total_bits": 458124288,
2382
  "q_proj": {
2383
  "group_size": {
2384
  "2": 64
 
2393
  },
2394
  "k_proj": {
2395
  "group_size": {
2396
+ "2": 64
2397
  },
2398
  "bits": [
2399
+ 2
2400
  ],
2401
  "bits_prop": [
2402
  1
 
2465
  }
2466
  },
2467
  "model.layers.28": {
2468
+ "accuracy": 0.8596110343933105,
2469
  "total_bits": 458124288,
2470
  "q_proj": {
2471
  "group_size": {
 
2553
  }
2554
  },
2555
  "model.layers.29": {
2556
+ "accuracy": 0.8909573554992676,
2557
+ "total_bits": 573724416,
2558
  "q_proj": {
2559
  "group_size": {
2560
  "2": 64
 
2629
  },
2630
  "down_proj": {
2631
  "group_size": {
2632
+ "4": 128
2633
  },
2634
  "bits": [
2635
+ 4
2636
  ],
2637
  "bits_prop": [
2638
  1
 
2641
  }
2642
  },
2643
  "model.layers.30": {
2644
+ "accuracy": 0.8890519142150879,
2645
+ "total_bits": 606753024,
2646
  "q_proj": {
2647
  "group_size": {
2648
  "2": 64
 
2681
  },
2682
  "o_proj": {
2683
  "group_size": {
2684
+ "4": 128
2685
  },
2686
  "bits": [
2687
+ 4
2688
  ],
2689
  "bits_prop": [
2690
  1
 
2729
  }
2730
  },
2731
  "model.layers.31": {
2732
+ "accuracy": 0.9532780647277832,
2733
+ "total_bits": 846216960,
2734
  "q_proj": {
2735
  "group_size": {
2736
  "2": 64
 
2745
  },
2746
  "k_proj": {
2747
  "group_size": {
2748
+ "4": 128
2749
  },
2750
  "bits": [
2751
+ 4
2752
  ],
2753
  "bits_prop": [
2754
  1
 
2769
  },
2770
  "o_proj": {
2771
  "group_size": {
2772
+ "4": 128
2773
  },
2774
  "bits": [
2775
+ 4
2776
  ],
2777
  "bits_prop": [
2778
  1
 
2781
  },
2782
  "up_proj": {
2783
  "group_size": {
2784
+ "4": 128
2785
  },
2786
  "bits": [
2787
+ 4
2788
  ],
2789
  "bits_prop": [
2790
  1
 
2793
  },
2794
  "gate_proj": {
2795
  "group_size": {
2796
+ "4": 128
2797
  },
2798
  "bits": [
2799
+ 4
2800
  ],
2801
  "bits_prop": [
2802
  1