|
layer,module,loss,damp,time
|
|
0,self_attn.k_proj,0.20627,0.01000,0.986
|
|
0,self_attn.v_proj,0.00507,0.01000,0.607
|
|
0,self_attn.q_proj,0.42227,0.01000,0.610
|
|
0,self_attn.o_proj,0.00047,0.01000,0.603
|
|
0,mlp.up_proj,0.35409,0.01000,0.636
|
|
0,mlp.gate_proj,0.44565,0.01000,0.749
|
|
0,mlp.down_proj,0.00251,0.01000,2.774
|
|
1,self_attn.k_proj,0.33142,0.01000,0.600
|
|
1,self_attn.v_proj,0.01882,0.01000,0.615
|
|
1,self_attn.q_proj,0.61006,0.01000,0.611
|
|
1,self_attn.o_proj,0.00132,0.01000,0.608
|
|
1,mlp.up_proj,0.50808,0.01000,0.643
|
|
1,mlp.gate_proj,0.69618,0.01000,0.790
|
|
1,mlp.down_proj,1.31996,0.01000,2.535
|
|
2,self_attn.k_proj,0.65871,0.01000,0.607
|
|
2,self_attn.v_proj,0.04459,0.01000,0.610
|
|
2,self_attn.q_proj,1.27351,0.01000,0.619
|
|
2,self_attn.o_proj,0.00206,0.01000,0.596
|
|
2,mlp.up_proj,0.65205,0.01000,0.631
|
|
2,mlp.gate_proj,1.04195,0.01000,0.784
|
|
2,mlp.down_proj,0.00808,0.01000,2.504
|
|
3,self_attn.k_proj,0.43784,0.01000,0.592
|
|
3,self_attn.v_proj,0.05698,0.01000,0.586
|
|
3,self_attn.q_proj,0.94526,0.01000,0.610
|
|
3,self_attn.o_proj,0.00391,0.01000,0.644
|
|
3,mlp.up_proj,0.79450,0.01000,0.621
|
|
3,mlp.gate_proj,1.58985,0.01000,0.798
|
|
3,mlp.down_proj,0.01225,0.01000,2.532
|
|
4,self_attn.k_proj,0.46703,0.01000,0.583
|
|
4,self_attn.v_proj,0.05344,0.01000,0.588
|
|
4,self_attn.q_proj,0.95165,0.01000,0.609
|
|
4,self_attn.o_proj,0.00573,0.01000,0.604
|
|
4,mlp.up_proj,0.80078,0.01000,0.630
|
|
4,mlp.gate_proj,1.73697,0.01000,0.794
|
|
4,mlp.down_proj,0.01413,0.01000,2.501
|
|
5,self_attn.k_proj,0.69090,0.01000,0.596
|
|
5,self_attn.v_proj,0.04588,0.01000,0.589
|
|
5,self_attn.q_proj,1.21408,0.01000,0.664
|
|
5,self_attn.o_proj,0.00586,0.01000,0.612
|
|
5,mlp.up_proj,0.86928,0.01000,0.637
|
|
5,mlp.gate_proj,1.61338,0.01000,0.800
|
|
5,mlp.down_proj,0.01706,0.01000,2.504
|
|
6,self_attn.k_proj,0.56137,0.01000,0.592
|
|
6,self_attn.v_proj,0.05914,0.01000,0.583
|
|
6,self_attn.q_proj,0.88346,0.01000,0.589
|
|
6,self_attn.o_proj,0.00905,0.01000,0.614
|
|
6,mlp.up_proj,0.88001,0.01000,0.630
|
|
6,mlp.gate_proj,1.59125,0.01000,0.793
|
|
6,mlp.down_proj,0.01736,0.01000,2.431
|
|
7,self_attn.k_proj,0.56204,0.01000,0.584
|
|
7,self_attn.v_proj,0.06787,0.01000,0.578
|
|
7,self_attn.q_proj,1.04871,0.01000,0.627
|
|
7,self_attn.o_proj,0.00866,0.01000,0.598
|
|
7,mlp.up_proj,0.91172,0.01000,0.630
|
|
7,mlp.gate_proj,1.47971,0.01000,0.801
|
|
7,mlp.down_proj,0.01878,0.01000,2.453
|
|
8,self_attn.k_proj,0.65364,0.01000,0.587
|
|
8,self_attn.v_proj,0.06459,0.01000,0.599
|
|
8,self_attn.q_proj,1.06362,0.01000,0.589
|
|
8,self_attn.o_proj,0.01113,0.01000,0.585
|
|
8,mlp.up_proj,1.00755,0.01000,0.611
|
|
8,mlp.gate_proj,1.59544,0.01000,0.796
|
|
8,mlp.down_proj,0.02531,0.01000,2.416
|
|
9,self_attn.k_proj,0.54082,0.01000,0.584
|
|
9,self_attn.v_proj,0.07637,0.01000,0.580
|
|
9,self_attn.q_proj,1.30084,0.01000,0.591
|
|
9,self_attn.o_proj,0.01507,0.01000,0.603
|
|
9,mlp.up_proj,1.07703,0.01000,0.622
|
|
9,mlp.gate_proj,1.76000,0.01000,0.796
|
|
9,mlp.down_proj,0.03086,0.01000,2.426
|
|
10,self_attn.k_proj,0.66062,0.01000,0.590
|
|
10,self_attn.v_proj,0.08113,0.01000,0.583
|
|
10,self_attn.q_proj,1.32715,0.01000,0.583
|
|
10,self_attn.o_proj,0.01019,0.01000,0.594
|
|
10,mlp.up_proj,1.28599,0.01000,0.622
|
|
10,mlp.gate_proj,2.02958,0.01000,0.791
|
|
10,mlp.down_proj,0.03905,0.01000,2.438
|
|
11,self_attn.k_proj,0.79215,0.01000,0.583
|
|
11,self_attn.v_proj,0.08159,0.01000,0.590
|
|
11,self_attn.q_proj,1.31279,0.01000,0.571
|
|
11,self_attn.o_proj,0.00862,0.01000,0.625
|
|
11,mlp.up_proj,1.42253,0.01000,0.641
|
|
11,mlp.gate_proj,2.19144,0.01000,0.801
|
|
11,mlp.down_proj,0.04266,0.01000,2.499
|
|
12,self_attn.k_proj,0.76721,0.01000,0.585
|
|
12,self_attn.v_proj,0.08425,0.01000,0.580
|
|
12,self_attn.q_proj,1.29475,0.01000,0.582
|
|
12,self_attn.o_proj,0.00837,0.01000,0.586
|
|
12,mlp.up_proj,1.47983,0.01000,0.626
|
|
12,mlp.gate_proj,2.15212,0.01000,0.804
|
|
12,mlp.down_proj,0.04750,0.01000,2.422
|
|
13,self_attn.k_proj,0.73892,0.01000,0.589
|
|
13,self_attn.v_proj,0.13723,0.01000,0.574
|
|
13,self_attn.q_proj,1.45466,0.01000,0.589
|
|
13,self_attn.o_proj,0.01131,0.01000,0.578
|
|
13,mlp.up_proj,1.73117,0.01000,0.623
|
|
13,mlp.gate_proj,2.29325,0.01000,0.791
|
|
13,mlp.down_proj,0.06902,0.01000,2.415
|
|
14,self_attn.k_proj,0.79778,0.01000,0.588
|
|
14,self_attn.v_proj,0.29438,0.01000,0.582
|
|
14,self_attn.q_proj,1.52455,0.01000,0.580
|
|
14,self_attn.o_proj,0.02765,0.01000,0.586
|
|
14,mlp.up_proj,1.98990,0.01000,0.606
|
|
14,mlp.gate_proj,2.84552,0.01000,0.621
|
|
14,mlp.down_proj,0.09091,0.01000,2.440
|
|
15,self_attn.k_proj,0.71842,0.01000,0.607
|
|
15,self_attn.v_proj,0.31329,0.01000,0.577
|
|
15,self_attn.q_proj,1.39225,0.01000,0.585
|
|
15,self_attn.o_proj,0.09505,0.01000,0.585
|
|
15,mlp.up_proj,2.41008,0.01000,0.636
|
|
15,mlp.gate_proj,3.18340,0.01000,0.802
|
|
15,mlp.down_proj,0.21390,0.01000,2.454
|
|
|