Upload folder using huggingface_hub
Browse files- config.json +1 -1
- model.safetensors +2 -2
- quant_log.csv +168 -168
- quantize_config.json +1 -1
config.json
CHANGED
|
@@ -47,7 +47,7 @@
|
|
| 47 |
"bits": 4,
|
| 48 |
"checkpoint_format": "gptq",
|
| 49 |
"desc_act": false,
|
| 50 |
-
"group_size":
|
| 51 |
"lm_head": false,
|
| 52 |
"meta": {
|
| 53 |
"act_group_aware": true,
|
|
|
|
| 47 |
"bits": 4,
|
| 48 |
"checkpoint_format": "gptq",
|
| 49 |
"desc_act": false,
|
| 50 |
+
"group_size": 32,
|
| 51 |
"lm_head": false,
|
| 52 |
"meta": {
|
| 53 |
"act_group_aware": true,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5431a0944d541d6043c2541ccdc041cc5abccb2148eb43433ea55ebe726d0afb
|
| 3 |
+
size 480351195
|
quant_log.csv
CHANGED
|
@@ -1,169 +1,169 @@
|
|
| 1 |
layer,module,loss,samples,damp,time
|
| 2 |
-
0,self_attn.k_proj,0.
|
| 3 |
-
0,self_attn.v_proj,0.
|
| 4 |
-
0,self_attn.q_proj,0.
|
| 5 |
-
0,self_attn.o_proj,0.
|
| 6 |
-
0,mlp.up_proj,0.
|
| 7 |
-
0,mlp.gate_proj,0.
|
| 8 |
-
0,mlp.down_proj,0.
|
| 9 |
-
1,self_attn.k_proj,0.
|
| 10 |
-
1,self_attn.
|
| 11 |
-
1,self_attn.
|
| 12 |
-
1,self_attn.o_proj,0.
|
| 13 |
-
1,mlp.
|
| 14 |
-
1,mlp.
|
| 15 |
-
1,mlp.down_proj,0.
|
| 16 |
-
2,self_attn.k_proj,0.
|
| 17 |
-
2,self_attn.v_proj,0.
|
| 18 |
-
2,self_attn.q_proj,0.
|
| 19 |
-
2,self_attn.o_proj,0.
|
| 20 |
-
2,mlp.
|
| 21 |
-
2,mlp.
|
| 22 |
-
2,mlp.down_proj,0.
|
| 23 |
-
3,self_attn.k_proj,0.
|
| 24 |
-
3,self_attn.v_proj,0.
|
| 25 |
-
3,self_attn.q_proj,0.
|
| 26 |
-
3,self_attn.o_proj,0.
|
| 27 |
-
3,mlp.gate_proj,0.
|
| 28 |
-
3,mlp.up_proj,0.
|
| 29 |
-
3,mlp.down_proj,0.
|
| 30 |
-
4,self_attn.
|
| 31 |
-
4,self_attn.q_proj,0.
|
| 32 |
-
4,self_attn.
|
| 33 |
-
4,self_attn.o_proj,0.
|
| 34 |
-
4,mlp.up_proj,0.
|
| 35 |
-
4,mlp.gate_proj,0.
|
| 36 |
-
4,mlp.down_proj,0.
|
| 37 |
-
5,self_attn.k_proj,0.
|
| 38 |
-
5,self_attn.v_proj,0.
|
| 39 |
-
5,self_attn.q_proj,0.
|
| 40 |
-
5,self_attn.o_proj,0.
|
| 41 |
-
5,mlp.gate_proj,0.
|
| 42 |
-
5,mlp.up_proj,0.
|
| 43 |
-
5,mlp.down_proj,0.
|
| 44 |
-
6,self_attn.k_proj,0.
|
| 45 |
-
6,self_attn.
|
| 46 |
-
6,self_attn.
|
| 47 |
-
6,self_attn.o_proj,0.
|
| 48 |
-
6,mlp.
|
| 49 |
-
6,mlp.
|
| 50 |
-
6,mlp.down_proj,0.
|
| 51 |
-
7,self_attn.k_proj,0.
|
| 52 |
-
7,self_attn.q_proj,0.
|
| 53 |
-
7,self_attn.v_proj,0.
|
| 54 |
-
7,self_attn.o_proj,0.
|
| 55 |
-
7,mlp.
|
| 56 |
-
7,mlp.
|
| 57 |
-
7,mlp.down_proj,0.
|
| 58 |
-
8,self_attn.k_proj,0.
|
| 59 |
-
8,self_attn.
|
| 60 |
-
8,self_attn.
|
| 61 |
-
8,self_attn.o_proj,0.
|
| 62 |
-
8,mlp.
|
| 63 |
-
8,mlp.
|
| 64 |
-
8,mlp.down_proj,0.
|
| 65 |
-
9,self_attn.k_proj,0.
|
| 66 |
-
9,self_attn.
|
| 67 |
-
9,self_attn.
|
| 68 |
-
9,self_attn.o_proj,0.
|
| 69 |
-
9,mlp.gate_proj,0.
|
| 70 |
-
9,mlp.up_proj,0.
|
| 71 |
-
9,mlp.down_proj,0.
|
| 72 |
-
10,self_attn.k_proj,0.
|
| 73 |
-
10,self_attn.
|
| 74 |
-
10,self_attn.
|
| 75 |
-
10,self_attn.o_proj,0.
|
| 76 |
-
10,mlp.
|
| 77 |
-
10,mlp.
|
| 78 |
-
10,mlp.down_proj,0.
|
| 79 |
-
11,self_attn.
|
| 80 |
-
11,self_attn.
|
| 81 |
-
11,self_attn.
|
| 82 |
-
11,self_attn.o_proj,0.
|
| 83 |
-
11,mlp.gate_proj,0.
|
| 84 |
-
11,mlp.up_proj,0.
|
| 85 |
-
11,mlp.down_proj,0.
|
| 86 |
-
12,self_attn.
|
| 87 |
-
12,self_attn.
|
| 88 |
-
12,self_attn.
|
| 89 |
-
12,self_attn.o_proj,0.
|
| 90 |
-
12,mlp.
|
| 91 |
-
12,mlp.
|
| 92 |
-
12,mlp.down_proj,0.
|
| 93 |
-
13,self_attn.
|
| 94 |
-
13,self_attn.
|
| 95 |
-
13,self_attn.
|
| 96 |
-
13,self_attn.o_proj,0.
|
| 97 |
-
13,mlp.gate_proj,0.
|
| 98 |
-
13,mlp.up_proj,0.
|
| 99 |
-
13,mlp.down_proj,0.
|
| 100 |
-
14,self_attn.k_proj,0.
|
| 101 |
-
14,self_attn.q_proj,0.
|
| 102 |
-
14,self_attn.v_proj,0.
|
| 103 |
-
14,self_attn.o_proj,0.
|
| 104 |
-
14,mlp.up_proj,0.
|
| 105 |
-
14,mlp.gate_proj,0.
|
| 106 |
-
14,mlp.down_proj,0.
|
| 107 |
-
15,self_attn.k_proj,0.
|
| 108 |
-
15,self_attn.
|
| 109 |
-
15,self_attn.
|
| 110 |
-
15,self_attn.o_proj,0.
|
| 111 |
-
15,mlp.gate_proj,0.
|
| 112 |
-
15,mlp.up_proj,0.
|
| 113 |
-
15,mlp.down_proj,0.
|
| 114 |
-
16,self_attn.k_proj,0.
|
| 115 |
-
16,self_attn.v_proj,0.
|
| 116 |
-
16,self_attn.q_proj,0.
|
| 117 |
-
16,self_attn.o_proj,0.
|
| 118 |
-
16,mlp.
|
| 119 |
-
16,mlp.
|
| 120 |
-
16,mlp.down_proj,0.
|
| 121 |
-
17,self_attn.k_proj,0.
|
| 122 |
-
17,self_attn.q_proj,0.
|
| 123 |
-
17,self_attn.v_proj,0.
|
| 124 |
-
17,self_attn.o_proj,0.
|
| 125 |
-
17,mlp.
|
| 126 |
-
17,mlp.
|
| 127 |
-
17,mlp.down_proj,0.
|
| 128 |
-
18,self_attn.
|
| 129 |
-
18,self_attn.
|
| 130 |
-
18,self_attn.
|
| 131 |
-
18,self_attn.o_proj,0.
|
| 132 |
-
18,mlp.up_proj,0.
|
| 133 |
-
18,mlp.gate_proj,0.
|
| 134 |
-
18,mlp.down_proj,0.
|
| 135 |
-
19,self_attn.k_proj,0.
|
| 136 |
-
19,self_attn.
|
| 137 |
-
19,self_attn.
|
| 138 |
-
19,self_attn.o_proj,0.
|
| 139 |
-
19,mlp.
|
| 140 |
-
19,mlp.
|
| 141 |
-
19,mlp.down_proj,0.
|
| 142 |
-
20,self_attn.k_proj,0.
|
| 143 |
-
20,self_attn.
|
| 144 |
-
20,self_attn.
|
| 145 |
-
20,self_attn.o_proj,0.
|
| 146 |
-
20,mlp.up_proj,0.
|
| 147 |
-
20,mlp.gate_proj,0.
|
| 148 |
-
20,mlp.down_proj,0.
|
| 149 |
-
21,self_attn.k_proj,0.
|
| 150 |
-
21,self_attn.
|
| 151 |
-
21,self_attn.
|
| 152 |
-
21,self_attn.o_proj,0.
|
| 153 |
-
21,mlp.
|
| 154 |
-
21,mlp.
|
| 155 |
-
21,mlp.down_proj,0.
|
| 156 |
-
22,self_attn.k_proj,0.
|
| 157 |
-
22,self_attn.
|
| 158 |
-
22,self_attn.
|
| 159 |
-
22,self_attn.o_proj,0.
|
| 160 |
-
22,mlp.
|
| 161 |
-
22,mlp.
|
| 162 |
-
22,mlp.down_proj,0.
|
| 163 |
-
23,self_attn.k_proj,0.
|
| 164 |
-
23,self_attn.
|
| 165 |
-
23,self_attn.
|
| 166 |
-
23,self_attn.o_proj,0.
|
| 167 |
-
23,mlp.gate_proj,0.
|
| 168 |
-
23,mlp.up_proj,0.
|
| 169 |
-
23,mlp.down_proj,0.
|
|
|
|
| 1 |
layer,module,loss,samples,damp,time
|
| 2 |
+
0,self_attn.k_proj,0.0000001374,0.05000,0.411
|
| 3 |
+
0,self_attn.v_proj,0.0000000028,0.05000,0.584
|
| 4 |
+
0,self_attn.q_proj,0.0000008549,0.05000,0.584
|
| 5 |
+
0,self_attn.o_proj,0.0000000005,0.05000,0.248
|
| 6 |
+
0,mlp.up_proj,0.0000120706,0.05000,0.277
|
| 7 |
+
0,mlp.gate_proj,0.0000190739,0.05000,0.312
|
| 8 |
+
0,mlp.down_proj,0.0000002370,0.05000,1.265
|
| 9 |
+
1,self_attn.k_proj,0.0000014250,0.05000,0.297
|
| 10 |
+
1,self_attn.q_proj,0.0000049810,0.05000,0.346
|
| 11 |
+
1,self_attn.v_proj,0.0000001409,0.05000,0.369
|
| 12 |
+
1,self_attn.o_proj,0.0000000737,0.05000,0.239
|
| 13 |
+
1,mlp.gate_proj,0.0000336152,0.05000,0.245
|
| 14 |
+
1,mlp.up_proj,0.0000177082,0.05000,0.262
|
| 15 |
+
1,mlp.down_proj,0.0000002587,0.05000,1.278
|
| 16 |
+
2,self_attn.k_proj,0.0000030212,0.05000,0.289
|
| 17 |
+
2,self_attn.v_proj,0.0000003602,0.05000,0.443
|
| 18 |
+
2,self_attn.q_proj,0.0000104272,0.05000,0.447
|
| 19 |
+
2,self_attn.o_proj,0.0000000885,0.05000,0.270
|
| 20 |
+
2,mlp.up_proj,0.0000254395,0.05000,0.270
|
| 21 |
+
2,mlp.gate_proj,0.0000473820,0.05000,0.284
|
| 22 |
+
2,mlp.down_proj,0.0000063855,0.05000,1.350
|
| 23 |
+
3,self_attn.k_proj,0.0000036164,0.05000,0.276
|
| 24 |
+
3,self_attn.v_proj,0.0000008465,0.05000,0.425
|
| 25 |
+
3,self_attn.q_proj,0.0000145756,0.05000,0.441
|
| 26 |
+
3,self_attn.o_proj,0.0000001321,0.05000,0.236
|
| 27 |
+
3,mlp.gate_proj,0.0000963621,0.05000,0.259
|
| 28 |
+
3,mlp.up_proj,0.0000551544,0.05000,0.288
|
| 29 |
+
3,mlp.down_proj,0.0000118582,0.05000,1.231
|
| 30 |
+
4,self_attn.k_proj,0.0000022631,0.05000,0.307
|
| 31 |
+
4,self_attn.q_proj,0.0000111644,0.05000,0.412
|
| 32 |
+
4,self_attn.v_proj,0.0000010152,0.05000,0.417
|
| 33 |
+
4,self_attn.o_proj,0.0000002745,0.05000,0.240
|
| 34 |
+
4,mlp.up_proj,0.0000394713,0.05000,0.259
|
| 35 |
+
4,mlp.gate_proj,0.0000614217,0.05000,0.286
|
| 36 |
+
4,mlp.down_proj,0.0000007736,0.05000,1.260
|
| 37 |
+
5,self_attn.k_proj,0.0000028338,0.05000,0.261
|
| 38 |
+
5,self_attn.v_proj,0.0000013757,0.05000,0.496
|
| 39 |
+
5,self_attn.q_proj,0.0000140757,0.05000,0.508
|
| 40 |
+
5,self_attn.o_proj,0.0000002477,0.05000,0.286
|
| 41 |
+
5,mlp.gate_proj,0.0001037606,0.05000,0.313
|
| 42 |
+
5,mlp.up_proj,0.0000515816,0.05000,0.318
|
| 43 |
+
5,mlp.down_proj,0.0000008419,0.05000,1.268
|
| 44 |
+
6,self_attn.k_proj,0.0000025804,0.05000,0.257
|
| 45 |
+
6,self_attn.v_proj,0.0000007676,0.05000,0.399
|
| 46 |
+
6,self_attn.q_proj,0.0000114309,0.05000,0.400
|
| 47 |
+
6,self_attn.o_proj,0.0000002146,0.05000,0.251
|
| 48 |
+
6,mlp.gate_proj,0.0000600376,0.05000,0.267
|
| 49 |
+
6,mlp.up_proj,0.0000420924,0.05000,0.276
|
| 50 |
+
6,mlp.down_proj,0.0000009019,0.05000,1.338
|
| 51 |
+
7,self_attn.k_proj,0.0000039587,0.05000,0.267
|
| 52 |
+
7,self_attn.q_proj,0.0000166899,0.05000,0.389
|
| 53 |
+
7,self_attn.v_proj,0.0000013533,0.05000,0.391
|
| 54 |
+
7,self_attn.o_proj,0.0000003905,0.05000,0.282
|
| 55 |
+
7,mlp.gate_proj,0.0000611757,0.05000,0.305
|
| 56 |
+
7,mlp.up_proj,0.0000478114,0.05000,0.308
|
| 57 |
+
7,mlp.down_proj,0.0000011080,0.05000,1.370
|
| 58 |
+
8,self_attn.k_proj,0.0000030156,0.05000,0.240
|
| 59 |
+
8,self_attn.q_proj,0.0000151704,0.05000,0.440
|
| 60 |
+
8,self_attn.v_proj,0.0000010115,0.05000,0.443
|
| 61 |
+
8,self_attn.o_proj,0.0000004879,0.05000,0.233
|
| 62 |
+
8,mlp.gate_proj,0.0000540080,0.05000,0.284
|
| 63 |
+
8,mlp.up_proj,0.0000413425,0.05000,0.298
|
| 64 |
+
8,mlp.down_proj,0.0000007874,0.05000,1.348
|
| 65 |
+
9,self_attn.k_proj,0.0000090284,0.05000,0.236
|
| 66 |
+
9,self_attn.v_proj,0.0000023909,0.05000,0.394
|
| 67 |
+
9,self_attn.q_proj,0.0000352399,0.05000,0.423
|
| 68 |
+
9,self_attn.o_proj,0.0000003621,0.05000,0.238
|
| 69 |
+
9,mlp.gate_proj,0.0000505815,0.05000,0.237
|
| 70 |
+
9,mlp.up_proj,0.0000433161,0.05000,0.265
|
| 71 |
+
9,mlp.down_proj,0.0000008689,0.05000,1.370
|
| 72 |
+
10,self_attn.k_proj,0.0000025689,0.05000,0.246
|
| 73 |
+
10,self_attn.v_proj,0.0000018463,0.05000,0.368
|
| 74 |
+
10,self_attn.q_proj,0.0000134080,0.05000,0.373
|
| 75 |
+
10,self_attn.o_proj,0.0000004496,0.05000,0.223
|
| 76 |
+
10,mlp.up_proj,0.0000373606,0.05000,0.249
|
| 77 |
+
10,mlp.gate_proj,0.0000484065,0.05000,0.285
|
| 78 |
+
10,mlp.down_proj,0.0000007205,0.05000,1.319
|
| 79 |
+
11,self_attn.k_proj,0.0000096949,0.05000,0.277
|
| 80 |
+
11,self_attn.q_proj,0.0000358525,0.05000,0.465
|
| 81 |
+
11,self_attn.v_proj,0.0000026096,0.05000,0.469
|
| 82 |
+
11,self_attn.o_proj,0.0000003160,0.05000,0.245
|
| 83 |
+
11,mlp.gate_proj,0.0000471413,0.05000,0.256
|
| 84 |
+
11,mlp.up_proj,0.0000432136,0.05000,0.275
|
| 85 |
+
11,mlp.down_proj,0.0000010805,0.05000,1.266
|
| 86 |
+
12,self_attn.k_proj,0.0000025656,0.05000,0.277
|
| 87 |
+
12,self_attn.q_proj,0.0000143737,0.05000,0.480
|
| 88 |
+
12,self_attn.v_proj,0.0000016514,0.05000,0.485
|
| 89 |
+
12,self_attn.o_proj,0.0000005012,0.05000,0.252
|
| 90 |
+
12,mlp.up_proj,0.0000396000,0.05000,0.251
|
| 91 |
+
12,mlp.gate_proj,0.0000438130,0.05000,0.274
|
| 92 |
+
12,mlp.down_proj,0.0000008642,0.05000,1.347
|
| 93 |
+
13,self_attn.k_proj,0.0000047205,0.05000,0.264
|
| 94 |
+
13,self_attn.q_proj,0.0000238298,0.05000,0.530
|
| 95 |
+
13,self_attn.v_proj,0.0000020183,0.05000,0.534
|
| 96 |
+
13,self_attn.o_proj,0.0000004878,0.05000,0.262
|
| 97 |
+
13,mlp.gate_proj,0.0000470698,0.05000,0.246
|
| 98 |
+
13,mlp.up_proj,0.0000468081,0.05000,0.260
|
| 99 |
+
13,mlp.down_proj,0.0000011870,0.05000,1.242
|
| 100 |
+
14,self_attn.k_proj,0.0000033385,0.05000,0.275
|
| 101 |
+
14,self_attn.q_proj,0.0000209151,0.05000,0.441
|
| 102 |
+
14,self_attn.v_proj,0.0000030890,0.05000,0.447
|
| 103 |
+
14,self_attn.o_proj,0.0000010850,0.05000,0.270
|
| 104 |
+
14,mlp.up_proj,0.0000475374,0.05000,0.226
|
| 105 |
+
14,mlp.gate_proj,0.0000534707,0.05000,0.294
|
| 106 |
+
14,mlp.down_proj,0.0000014841,0.05000,1.378
|
| 107 |
+
15,self_attn.k_proj,0.0000037106,0.05000,0.280
|
| 108 |
+
15,self_attn.q_proj,0.0000186038,0.05000,0.407
|
| 109 |
+
15,self_attn.v_proj,0.0000024893,0.05000,0.410
|
| 110 |
+
15,self_attn.o_proj,0.0000006463,0.05000,0.247
|
| 111 |
+
15,mlp.gate_proj,0.0000625236,0.05000,0.269
|
| 112 |
+
15,mlp.up_proj,0.0000601912,0.05000,0.285
|
| 113 |
+
15,mlp.down_proj,0.0000019398,0.05000,1.263
|
| 114 |
+
16,self_attn.k_proj,0.0000071184,0.05000,0.239
|
| 115 |
+
16,self_attn.v_proj,0.0000057205,0.05000,0.528
|
| 116 |
+
16,self_attn.q_proj,0.0000406430,0.05000,0.543
|
| 117 |
+
16,self_attn.o_proj,0.0000005914,0.05000,0.268
|
| 118 |
+
16,mlp.up_proj,0.0000715898,0.05000,0.255
|
| 119 |
+
16,mlp.gate_proj,0.0000915251,0.05000,0.266
|
| 120 |
+
16,mlp.down_proj,0.0000035746,0.05000,1.357
|
| 121 |
+
17,self_attn.k_proj,0.0000038815,0.05000,0.244
|
| 122 |
+
17,self_attn.q_proj,0.0000259958,0.05000,0.342
|
| 123 |
+
17,self_attn.v_proj,0.0000036715,0.05000,0.342
|
| 124 |
+
17,self_attn.o_proj,0.0000004955,0.05000,0.261
|
| 125 |
+
17,mlp.gate_proj,0.0001284090,0.05000,0.227
|
| 126 |
+
17,mlp.up_proj,0.0000846460,0.05000,0.239
|
| 127 |
+
17,mlp.down_proj,0.0000032604,0.05000,1.224
|
| 128 |
+
18,self_attn.k_proj,0.0000044824,0.05000,0.252
|
| 129 |
+
18,self_attn.q_proj,0.0000252827,0.05000,0.333
|
| 130 |
+
18,self_attn.v_proj,0.0000040620,0.05000,0.336
|
| 131 |
+
18,self_attn.o_proj,0.0000007172,0.05000,0.221
|
| 132 |
+
18,mlp.up_proj,0.0000873495,0.05000,0.270
|
| 133 |
+
18,mlp.gate_proj,0.0001080927,0.05000,0.279
|
| 134 |
+
18,mlp.down_proj,0.0000040154,0.05000,1.300
|
| 135 |
+
19,self_attn.k_proj,0.0000040385,0.05000,0.257
|
| 136 |
+
19,self_attn.v_proj,0.0000038138,0.05000,0.393
|
| 137 |
+
19,self_attn.q_proj,0.0000248874,0.05000,0.409
|
| 138 |
+
19,self_attn.o_proj,0.0000008094,0.05000,0.230
|
| 139 |
+
19,mlp.gate_proj,0.0001446683,0.05000,0.232
|
| 140 |
+
19,mlp.up_proj,0.0001231465,0.05000,0.265
|
| 141 |
+
19,mlp.down_proj,0.0000073288,0.05000,1.241
|
| 142 |
+
20,self_attn.k_proj,0.0000051520,0.05000,0.257
|
| 143 |
+
20,self_attn.v_proj,0.0000102601,0.05000,0.331
|
| 144 |
+
20,self_attn.q_proj,0.0000350694,0.05000,0.341
|
| 145 |
+
20,self_attn.o_proj,0.0000015609,0.05000,0.217
|
| 146 |
+
20,mlp.up_proj,0.0001401550,0.05000,0.235
|
| 147 |
+
20,mlp.gate_proj,0.0001513926,0.05000,0.260
|
| 148 |
+
20,mlp.down_proj,0.0000101059,0.05000,1.319
|
| 149 |
+
21,self_attn.k_proj,0.0000052119,0.05000,0.259
|
| 150 |
+
21,self_attn.v_proj,0.0000155353,0.05000,0.418
|
| 151 |
+
21,self_attn.q_proj,0.0000392914,0.05000,0.429
|
| 152 |
+
21,self_attn.o_proj,0.0000030117,0.05000,0.243
|
| 153 |
+
21,mlp.gate_proj,0.0001529105,0.05000,0.236
|
| 154 |
+
21,mlp.up_proj,0.0001498237,0.05000,0.251
|
| 155 |
+
21,mlp.down_proj,0.0000403716,0.05000,1.181
|
| 156 |
+
22,self_attn.k_proj,0.0000048279,0.05000,0.280
|
| 157 |
+
22,self_attn.q_proj,0.0000367167,0.05000,0.423
|
| 158 |
+
22,self_attn.v_proj,0.0000140020,0.05000,0.435
|
| 159 |
+
22,self_attn.o_proj,0.0000014592,0.05000,0.233
|
| 160 |
+
22,mlp.gate_proj,0.0001180850,0.05000,0.251
|
| 161 |
+
22,mlp.up_proj,0.0001251401,0.05000,0.263
|
| 162 |
+
22,mlp.down_proj,0.0000136729,0.05000,1.290
|
| 163 |
+
23,self_attn.k_proj,0.0000055235,0.05000,0.273
|
| 164 |
+
23,self_attn.q_proj,0.0000443739,0.05000,0.404
|
| 165 |
+
23,self_attn.v_proj,0.0000110931,0.05000,0.414
|
| 166 |
+
23,self_attn.o_proj,0.0000029716,0.05000,0.235
|
| 167 |
+
23,mlp.gate_proj,0.0001360635,0.05000,0.258
|
| 168 |
+
23,mlp.up_proj,0.0001328737,0.05000,0.277
|
| 169 |
+
23,mlp.down_proj,0.0000243960,0.05000,1.267
|
quantize_config.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"bits": 4,
|
| 3 |
-
"group_size":
|
| 4 |
"desc_act": false,
|
| 5 |
"sym": true,
|
| 6 |
"lm_head": false,
|
|
|
|
| 1 |
{
|
| 2 |
"bits": 4,
|
| 3 |
+
"group_size": 32,
|
| 4 |
"desc_act": false,
|
| 5 |
"sym": true,
|
| 6 |
"lm_head": false,
|