|
layer,module,loss,samples,damp,time
|
|
0,self_attn.k_proj,0.0000002985,0.01000,4.947
|
|
0,self_attn.v_proj,0.0000000628,0.01000,1.884
|
|
0,self_attn.q_proj,0.0000008087,0.01000,1.865
|
|
0,self_attn.o_proj,0.0000009411,0.01000,1.889
|
|
0,mlp.up_proj,0.0000003857,0.01000,1.936
|
|
0,mlp.gate_proj,0.0000004343,0.01000,1.944
|
|
0,mlp.down_proj,0.0000008139,0.01000,6.115
|
|
1,self_attn.k_proj,0.0000000138,0.01000,1.904
|
|
1,self_attn.v_proj,0.0000000049,0.01000,1.858
|
|
1,self_attn.q_proj,0.0000000554,0.01000,1.897
|
|
1,self_attn.o_proj,0.0000000136,0.01000,1.902
|
|
1,mlp.up_proj,0.0000018059,0.01000,1.992
|
|
1,mlp.gate_proj,0.0000048088,0.01000,1.986
|
|
1,mlp.down_proj,0.0000000962,0.01000,6.180
|
|
2,self_attn.k_proj,0.0000000607,0.01000,1.859
|
|
2,self_attn.v_proj,0.0000000150,0.01000,1.884
|
|
2,self_attn.q_proj,0.0000001718,0.01000,1.890
|
|
2,self_attn.o_proj,0.0000000996,0.01000,1.952
|
|
2,mlp.up_proj,0.0000043320,0.01000,2.028
|
|
2,mlp.gate_proj,0.0000081417,0.01000,1.956
|
|
2,mlp.down_proj,0.0000004419,0.01000,6.144
|
|
3,self_attn.k_proj,0.0000003379,0.01000,1.877
|
|
3,self_attn.v_proj,0.0000000693,0.01000,1.870
|
|
3,self_attn.q_proj,0.0000009042,0.01000,1.892
|
|
3,self_attn.o_proj,0.0000002491,0.01000,1.931
|
|
3,mlp.up_proj,0.0000050404,0.01000,1.994
|
|
3,mlp.gate_proj,0.0000106641,0.01000,1.996
|
|
3,mlp.down_proj,0.0000007892,0.01000,6.105
|
|
4,self_attn.k_proj,0.0000003962,0.01000,1.884
|
|
4,self_attn.v_proj,0.0000001156,0.01000,1.823
|
|
4,self_attn.q_proj,0.0000010681,0.01000,1.846
|
|
4,self_attn.o_proj,0.0000004779,0.01000,1.910
|
|
4,mlp.up_proj,0.0000107675,0.01000,2.053
|
|
4,mlp.gate_proj,0.0000199058,0.01000,2.028
|
|
4,mlp.down_proj,0.0013483506,0.01000,6.148
|
|
5,self_attn.k_proj,0.0000013836,0.01000,1.869
|
|
5,self_attn.v_proj,0.0000005688,0.01000,1.827
|
|
5,self_attn.q_proj,0.0000044049,0.01000,1.926
|
|
5,self_attn.o_proj,0.0000007381,0.01000,1.906
|
|
5,mlp.up_proj,0.0000180994,0.01000,1.995
|
|
5,mlp.gate_proj,0.0000349824,0.01000,1.990
|
|
5,mlp.down_proj,0.0000037041,0.01000,6.229
|
|
6,self_attn.k_proj,0.0000015295,0.01000,1.891
|
|
6,self_attn.v_proj,0.0000008116,0.01000,1.841
|
|
6,self_attn.q_proj,0.0000052489,0.01000,1.904
|
|
6,self_attn.o_proj,0.0000006595,0.01000,1.914
|
|
6,mlp.up_proj,0.0000294027,0.01000,2.036
|
|
6,mlp.gate_proj,0.0000543190,0.01000,2.000
|
|
6,mlp.down_proj,0.0000033944,0.01000,6.185
|
|
7,self_attn.k_proj,0.0000022324,0.01000,1.848
|
|
7,self_attn.v_proj,0.0000012807,0.01000,1.836
|
|
7,self_attn.q_proj,0.0000077740,0.01000,1.898
|
|
7,self_attn.o_proj,0.0000006588,0.01000,1.889
|
|
7,mlp.up_proj,0.0000377604,0.01000,2.007
|
|
7,mlp.gate_proj,0.0000714821,0.01000,2.013
|
|
7,mlp.down_proj,0.0000025652,0.01000,6.107
|
|
8,self_attn.k_proj,0.0000024254,0.01000,1.863
|
|
8,self_attn.v_proj,0.0000010471,0.01000,1.841
|
|
8,self_attn.q_proj,0.0000081145,0.01000,1.936
|
|
8,self_attn.o_proj,0.0000005655,0.01000,1.886
|
|
8,mlp.up_proj,0.0000263257,0.01000,2.090
|
|
8,mlp.gate_proj,0.0000475203,0.01000,2.009
|
|
8,mlp.down_proj,0.0000034082,0.01000,6.117
|
|
9,self_attn.k_proj,0.0000022917,0.01000,1.865
|
|
9,self_attn.v_proj,0.0000013029,0.01000,1.832
|
|
9,self_attn.q_proj,0.0000077636,0.01000,1.919
|
|
9,self_attn.o_proj,0.0000010365,0.01000,1.908
|
|
9,mlp.up_proj,0.0000193074,0.01000,1.997
|
|
9,mlp.gate_proj,0.0000211020,0.01000,2.014
|
|
9,mlp.down_proj,0.0000048219,0.01000,6.151
|
|
10,self_attn.k_proj,0.0000034324,0.01000,1.867
|
|
10,self_attn.v_proj,0.0000019137,0.01000,1.831
|
|
10,self_attn.q_proj,0.0000121056,0.01000,1.897
|
|
10,self_attn.o_proj,0.0000010023,0.01000,1.873
|
|
10,mlp.up_proj,0.0000224903,0.01000,2.013
|
|
10,mlp.gate_proj,0.0000246599,0.01000,2.011
|
|
10,mlp.down_proj,0.0000059849,0.01000,6.103
|
|
11,self_attn.k_proj,0.0000025495,0.01000,1.908
|
|
11,self_attn.v_proj,0.0000012462,0.01000,1.865
|
|
11,self_attn.q_proj,0.0000090048,0.01000,1.923
|
|
11,self_attn.o_proj,0.0000014718,0.01000,1.924
|
|
11,mlp.up_proj,0.0000258469,0.01000,2.027
|
|
11,mlp.gate_proj,0.0000321958,0.01000,1.986
|
|
11,mlp.down_proj,0.0000051555,0.01000,6.087
|
|
12,self_attn.k_proj,0.0000031215,0.01000,1.847
|
|
12,self_attn.v_proj,0.0000014327,0.01000,1.841
|
|
12,self_attn.q_proj,0.0000111406,0.01000,1.893
|
|
12,self_attn.o_proj,0.0000017573,0.01000,1.957
|
|
12,mlp.up_proj,0.0000284193,0.01000,2.017
|
|
12,mlp.gate_proj,0.0000301645,0.01000,1.993
|
|
12,mlp.down_proj,0.0000064959,0.01000,6.090
|
|
13,self_attn.k_proj,0.0000034285,0.01000,1.923
|
|
13,self_attn.v_proj,0.0000017783,0.01000,1.831
|
|
13,self_attn.q_proj,0.0000119425,0.01000,1.911
|
|
13,self_attn.o_proj,0.0000020312,0.01000,1.861
|
|
13,mlp.up_proj,0.0000325586,0.01000,2.011
|
|
13,mlp.gate_proj,0.0000345637,0.01000,1.978
|
|
13,mlp.down_proj,0.0000076320,0.01000,6.090
|
|
14,self_attn.k_proj,0.0000042219,0.01000,1.872
|
|
14,self_attn.v_proj,0.0000019629,0.01000,1.827
|
|
14,self_attn.q_proj,0.0000144176,0.01000,1.895
|
|
14,self_attn.o_proj,0.0000020731,0.01000,1.931
|
|
14,mlp.up_proj,0.0000335783,0.01000,2.019
|
|
14,mlp.gate_proj,0.0000354549,0.01000,2.017
|
|
14,mlp.down_proj,0.0000079941,0.01000,6.158
|
|
15,self_attn.k_proj,0.0000036243,0.01000,1.894
|
|
15,self_attn.v_proj,0.0000022559,0.01000,1.827
|
|
15,self_attn.q_proj,0.0000129040,0.01000,1.897
|
|
15,self_attn.o_proj,0.0000027518,0.01000,1.912
|
|
15,mlp.up_proj,0.0000350510,0.01000,2.121
|
|
15,mlp.gate_proj,0.0000385737,0.01000,1.996
|
|
15,mlp.down_proj,0.0000085556,0.01000,6.094
|
|
16,self_attn.k_proj,0.0000036654,0.01000,1.849
|
|
16,self_attn.v_proj,0.0000015336,0.01000,1.822
|
|
16,self_attn.q_proj,0.0000115880,0.01000,1.872
|
|
16,self_attn.o_proj,0.0000024392,0.01000,1.921
|
|
16,mlp.up_proj,0.0000326376,0.01000,2.085
|
|
16,mlp.gate_proj,0.0000331992,0.01000,2.003
|
|
16,mlp.down_proj,0.0000084625,0.01000,6.173
|
|
17,self_attn.k_proj,0.0000040579,0.01000,1.885
|
|
17,self_attn.v_proj,0.0000018465,0.01000,1.861
|
|
17,self_attn.q_proj,0.0000138158,0.01000,1.906
|
|
17,self_attn.o_proj,0.0000025808,0.01000,1.932
|
|
17,mlp.up_proj,0.0000322729,0.01000,2.001
|
|
17,mlp.gate_proj,0.0000317870,0.01000,1.997
|
|
17,mlp.down_proj,0.0000080485,0.01000,6.129
|
|
18,self_attn.k_proj,0.0000039598,0.01000,1.839
|
|
18,self_attn.v_proj,0.0000020382,0.01000,1.798
|
|
18,self_attn.q_proj,0.0000137095,0.01000,1.895
|
|
18,self_attn.o_proj,0.0000029167,0.01000,1.892
|
|
18,mlp.up_proj,0.0000323423,0.01000,1.998
|
|
18,mlp.gate_proj,0.0000308571,0.01000,2.011
|
|
18,mlp.down_proj,0.0000081186,0.01000,6.181
|
|
19,self_attn.k_proj,0.0000043350,0.01000,1.867
|
|
19,self_attn.v_proj,0.0000020963,0.01000,1.811
|
|
19,self_attn.q_proj,0.0000163849,0.01000,1.886
|
|
19,self_attn.o_proj,0.0000022194,0.01000,1.976
|
|
19,mlp.up_proj,0.0000333286,0.01000,2.074
|
|
19,mlp.gate_proj,0.0000317924,0.01000,2.042
|
|
19,mlp.down_proj,0.0000083289,0.01000,6.124
|
|
20,self_attn.k_proj,0.0000045548,0.01000,1.827
|
|
20,self_attn.v_proj,0.0000019402,0.01000,1.863
|
|
20,self_attn.q_proj,0.0000157211,0.01000,1.926
|
|
20,self_attn.o_proj,0.0000029912,0.01000,1.890
|
|
20,mlp.up_proj,0.0000323250,0.01000,2.020
|
|
20,mlp.gate_proj,0.0000292523,0.01000,1.999
|
|
20,mlp.down_proj,0.0000087532,0.01000,6.119
|
|
21,self_attn.k_proj,0.0000042023,0.01000,1.894
|
|
21,self_attn.v_proj,0.0000019321,0.01000,1.853
|
|
21,self_attn.q_proj,0.0000144628,0.01000,1.918
|
|
21,self_attn.o_proj,0.0000030416,0.01000,1.891
|
|
21,mlp.up_proj,0.0000326811,0.01000,1.994
|
|
21,mlp.gate_proj,0.0000293238,0.01000,1.979
|
|
21,mlp.down_proj,0.0000085412,0.01000,6.151
|
|
22,self_attn.k_proj,0.0000046789,0.01000,1.887
|
|
22,self_attn.v_proj,0.0000028668,0.01000,1.833
|
|
22,self_attn.q_proj,0.0000161835,0.01000,1.896
|
|
22,self_attn.o_proj,0.0000038789,0.01000,1.901
|
|
22,mlp.up_proj,0.0000331632,0.01000,2.071
|
|
22,mlp.gate_proj,0.0000295798,0.01000,1.978
|
|
22,mlp.down_proj,0.0000096156,0.01000,6.178
|
|
23,self_attn.k_proj,0.0000043162,0.01000,1.860
|
|
23,self_attn.v_proj,0.0000028849,0.01000,1.833
|
|
23,self_attn.q_proj,0.0000160021,0.01000,1.861
|
|
23,self_attn.o_proj,0.0000037945,0.01000,1.923
|
|
23,mlp.up_proj,0.0000337720,0.01000,2.003
|
|
23,mlp.gate_proj,0.0000317463,0.01000,2.011
|
|
23,mlp.down_proj,0.0000093671,0.01000,6.194
|
|
24,self_attn.k_proj,0.0000057187,0.01000,1.942
|
|
24,self_attn.v_proj,0.0000024407,0.01000,1.866
|
|
24,self_attn.q_proj,0.0000181873,0.01000,1.904
|
|
24,self_attn.o_proj,0.0000041032,0.01000,1.924
|
|
24,mlp.up_proj,0.0000324691,0.01000,2.000
|
|
24,mlp.gate_proj,0.0000301167,0.01000,1.985
|
|
24,mlp.down_proj,0.0000084492,0.01000,6.136
|
|
25,self_attn.k_proj,0.0000055621,0.01000,1.846
|
|
25,self_attn.v_proj,0.0000031424,0.01000,1.823
|
|
25,self_attn.q_proj,0.0000198023,0.01000,1.922
|
|
25,self_attn.o_proj,0.0000028802,0.01000,1.885
|
|
25,mlp.up_proj,0.0000330885,0.01000,2.068
|
|
25,mlp.gate_proj,0.0000296588,0.01000,2.031
|
|
25,mlp.down_proj,0.0000089875,0.01000,6.062
|
|
26,self_attn.k_proj,0.0000050286,0.01000,1.858
|
|
26,self_attn.v_proj,0.0000021552,0.01000,1.866
|
|
26,self_attn.q_proj,0.0000176642,0.01000,1.899
|
|
26,self_attn.o_proj,0.0000031027,0.01000,1.904
|
|
26,mlp.up_proj,0.0000356900,0.01000,2.014
|
|
26,mlp.gate_proj,0.0000308428,0.01000,1.988
|
|
26,mlp.down_proj,0.0000103464,0.01000,6.112
|
|
27,self_attn.k_proj,0.0000050559,0.01000,1.826
|
|
27,self_attn.v_proj,0.0000026083,0.01000,1.817
|
|
27,self_attn.q_proj,0.0000170910,0.01000,1.898
|
|
27,self_attn.o_proj,0.0000044997,0.01000,1.891
|
|
27,mlp.up_proj,0.0000373241,0.01000,2.002
|
|
27,mlp.gate_proj,0.0000323265,0.01000,2.026
|
|
27,mlp.down_proj,0.0000123207,0.01000,6.172
|
|
28,self_attn.k_proj,0.0000042150,0.01000,1.883
|
|
28,self_attn.v_proj,0.0000037593,0.01000,1.861
|
|
28,self_attn.q_proj,0.0000171301,0.01000,1.885
|
|
28,self_attn.o_proj,0.0000054424,0.01000,1.916
|
|
28,mlp.up_proj,0.0000382802,0.01000,1.990
|
|
28,mlp.gate_proj,0.0000329041,0.01000,2.059
|
|
28,mlp.down_proj,0.0000136056,0.01000,6.099
|
|
29,self_attn.k_proj,0.0000055420,0.01000,1.847
|
|
29,self_attn.v_proj,0.0000036558,0.01000,1.942
|
|
29,self_attn.q_proj,0.0000196112,0.01000,1.991
|
|
29,self_attn.o_proj,0.0000046135,0.01000,1.879
|
|
29,mlp.up_proj,0.0000391342,0.01000,2.033
|
|
29,mlp.gate_proj,0.0000337284,0.01000,1.968
|
|
29,mlp.down_proj,0.0000148448,0.01000,6.136
|
|
30,self_attn.k_proj,0.0000047346,0.01000,1.847
|
|
30,self_attn.v_proj,0.0000041514,0.01000,1.863
|
|
30,self_attn.q_proj,0.0000184229,0.01000,1.959
|
|
30,self_attn.o_proj,0.0000064813,0.01000,1.855
|
|
30,mlp.up_proj,0.0000411291,0.01000,2.034
|
|
30,mlp.gate_proj,0.0000354981,0.01000,2.003
|
|
30,mlp.down_proj,0.0000166990,0.01000,6.158
|
|
31,self_attn.k_proj,0.0000048687,0.01000,1.867
|
|
31,self_attn.v_proj,0.0000040193,0.01000,1.842
|
|
31,self_attn.q_proj,0.0000189473,0.01000,1.897
|
|
31,self_attn.o_proj,0.0000054662,0.01000,1.928
|
|
31,mlp.up_proj,0.0000457638,0.01000,2.001
|
|
31,mlp.gate_proj,0.0000403368,0.01000,2.053
|
|
31,mlp.down_proj,0.0000203712,0.01000,6.115
|
|
32,self_attn.k_proj,0.0000053250,0.01000,1.836
|
|
32,self_attn.v_proj,0.0000053774,0.01000,1.829
|
|
32,self_attn.q_proj,0.0000208265,0.01000,1.948
|
|
32,self_attn.o_proj,0.0000054974,0.01000,1.923
|
|
32,mlp.up_proj,0.0000489943,0.01000,2.010
|
|
32,mlp.gate_proj,0.0000443471,0.01000,2.022
|
|
32,mlp.down_proj,0.0000236334,0.01000,6.119
|
|
33,self_attn.k_proj,0.0000055528,0.01000,1.860
|
|
33,self_attn.v_proj,0.0000053279,0.01000,1.855
|
|
33,self_attn.q_proj,0.0000225135,0.01000,1.882
|
|
33,self_attn.o_proj,0.0000065416,0.01000,1.911
|
|
33,mlp.up_proj,0.0000581524,0.01000,1.989
|
|
33,mlp.gate_proj,0.0000532374,0.01000,1.992
|
|
33,mlp.down_proj,0.0000341816,0.01000,6.194
|
|
34,self_attn.k_proj,0.0000057969,0.01000,1.865
|
|
34,self_attn.v_proj,0.0000065100,0.01000,1.820
|
|
34,self_attn.q_proj,0.0000247060,0.01000,1.933
|
|
34,self_attn.o_proj,0.0000064140,0.01000,1.974
|
|
34,mlp.up_proj,0.0000676059,0.01000,1.996
|
|
34,mlp.gate_proj,0.0000639034,0.01000,1.969
|
|
34,mlp.down_proj,0.0000421207,0.01000,6.114
|
|
35,self_attn.k_proj,0.0000056806,0.01000,1.843
|
|
35,self_attn.v_proj,0.0000058037,0.01000,1.859
|
|
35,self_attn.q_proj,0.0000227509,0.01000,1.864
|
|
35,self_attn.o_proj,0.0000107215,0.01000,1.953
|
|
35,mlp.up_proj,0.0000773738,0.01000,2.075
|
|
35,mlp.gate_proj,0.0000748045,0.01000,2.003
|
|
35,mlp.down_proj,0.0000531376,0.01000,6.151
|
|
36,self_attn.k_proj,0.0000064778,0.01000,1.826
|
|
36,self_attn.v_proj,0.0000105387,0.01000,1.820
|
|
36,self_attn.q_proj,0.0000284083,0.01000,1.898
|
|
36,self_attn.o_proj,0.0000097221,0.01000,1.959
|
|
36,mlp.up_proj,0.0000858965,0.01000,2.012
|
|
36,mlp.gate_proj,0.0000823549,0.01000,2.042
|
|
36,mlp.down_proj,0.0000657707,0.01000,6.164
|
|
37,self_attn.k_proj,0.0000074679,0.01000,1.836
|
|
37,self_attn.v_proj,0.0000103437,0.01000,1.870
|
|
37,self_attn.q_proj,0.0000301686,0.01000,1.843
|
|
37,self_attn.o_proj,0.0000103363,0.01000,1.949
|
|
37,mlp.up_proj,0.0000963696,0.01000,2.029
|
|
37,mlp.gate_proj,0.0000927627,0.01000,1.995
|
|
37,mlp.down_proj,0.0000759659,0.01000,6.172
|
|
38,self_attn.k_proj,0.0000072543,0.01000,1.906
|
|
38,self_attn.v_proj,0.0000103870,0.01000,1.833
|
|
38,self_attn.q_proj,0.0000302236,0.01000,1.885
|
|
38,self_attn.o_proj,0.0000106793,0.01000,1.909
|
|
38,mlp.up_proj,0.0001080096,0.01000,1.994
|
|
38,mlp.gate_proj,0.0001029393,0.01000,2.037
|
|
38,mlp.down_proj,0.0000864311,0.01000,6.118
|
|
39,self_attn.k_proj,0.0000070753,0.01000,1.848
|
|
39,self_attn.v_proj,0.0000115101,0.01000,1.855
|
|
39,self_attn.q_proj,0.0000317167,0.01000,1.926
|
|
39,self_attn.o_proj,0.0000149693,0.01000,1.908
|
|
39,mlp.up_proj,0.0001216658,0.01000,2.038
|
|
39,mlp.gate_proj,0.0001149202,0.01000,2.005
|
|
39,mlp.down_proj,0.0001039416,0.01000,6.191
|
|
40,self_attn.k_proj,0.0000081462,0.01000,1.824
|
|
40,self_attn.v_proj,0.0000157852,0.01000,1.910
|
|
40,self_attn.q_proj,0.0000353841,0.01000,1.991
|
|
40,self_attn.o_proj,0.0000151671,0.01000,1.913
|
|
40,mlp.up_proj,0.0001326770,0.01000,2.002
|
|
40,mlp.gate_proj,0.0001247391,0.01000,2.012
|
|
40,mlp.down_proj,0.0001193831,0.01000,6.104
|
|
41,self_attn.k_proj,0.0000079063,0.01000,1.881
|
|
41,self_attn.v_proj,0.0000165749,0.01000,1.930
|
|
41,self_attn.q_proj,0.0000366510,0.01000,1.896
|
|
41,self_attn.o_proj,0.0000124038,0.01000,1.877
|
|
41,mlp.up_proj,0.0001447803,0.01000,1.999
|
|
41,mlp.gate_proj,0.0001340893,0.01000,1.963
|
|
41,mlp.down_proj,0.0001349494,0.01000,6.061
|
|
42,self_attn.k_proj,0.0000083146,0.01000,1.833
|
|
42,self_attn.v_proj,0.0000181338,0.01000,1.793
|
|
42,self_attn.q_proj,0.0000357798,0.01000,1.855
|
|
42,self_attn.o_proj,0.0000141514,0.01000,1.914
|
|
42,mlp.up_proj,0.0001559160,0.01000,1.990
|
|
42,mlp.gate_proj,0.0001425551,0.01000,1.997
|
|
42,mlp.down_proj,0.0001580665,0.01000,6.099
|
|
43,self_attn.k_proj,0.0000083956,0.01000,1.822
|
|
43,self_attn.v_proj,0.0000256210,0.01000,1.813
|
|
43,self_attn.q_proj,0.0000399949,0.01000,1.861
|
|
43,self_attn.o_proj,0.0000247247,0.01000,1.883
|
|
43,mlp.up_proj,0.0001706939,0.01000,2.020
|
|
43,mlp.gate_proj,0.0001531956,0.01000,2.037
|
|
43,mlp.down_proj,0.0001867778,0.01000,6.179
|
|
44,self_attn.k_proj,0.0000076330,0.01000,1.852
|
|
44,self_attn.v_proj,0.0000281914,0.01000,1.820
|
|
44,self_attn.q_proj,0.0000391793,0.01000,1.889
|
|
44,self_attn.o_proj,0.0000360502,0.01000,1.884
|
|
44,mlp.up_proj,0.0001831046,0.01000,1.963
|
|
44,mlp.gate_proj,0.0001616602,0.01000,1.966
|
|
44,mlp.down_proj,0.0002535868,0.01000,6.108
|
|
45,self_attn.k_proj,0.0000079784,0.01000,1.892
|
|
45,self_attn.v_proj,0.0000340295,0.01000,1.838
|
|
45,self_attn.q_proj,0.0000422606,0.01000,1.895
|
|
45,self_attn.o_proj,0.0000337677,0.01000,1.944
|
|
45,mlp.up_proj,0.0001918452,0.01000,1.990
|
|
45,mlp.gate_proj,0.0001717587,0.01000,1.985
|
|
45,mlp.down_proj,0.0002833572,0.01000,6.189
|
|
46,self_attn.k_proj,0.0000071048,0.01000,1.838
|
|
46,self_attn.v_proj,0.0000363993,0.01000,1.838
|
|
46,self_attn.q_proj,0.0000375253,0.01000,1.876
|
|
46,self_attn.o_proj,0.0000640068,0.01000,1.919
|
|
46,mlp.up_proj,0.0001911036,0.01000,2.009
|
|
46,mlp.gate_proj,0.0001784168,0.01000,2.081
|
|
46,mlp.down_proj,0.0004206370,0.01000,6.225
|
|
47,self_attn.k_proj,0.0000061165,0.01000,1.837
|
|
47,self_attn.v_proj,0.0000228788,0.01000,1.920
|
|
47,self_attn.q_proj,0.0000279219,0.01000,1.940
|
|
47,self_attn.o_proj,0.0000288922,0.01000,1.906
|
|
47,mlp.up_proj,0.0002043838,0.01000,2.035
|
|
47,mlp.gate_proj,0.0001966780,0.01000,2.033
|
|
47,mlp.down_proj,0.0006320129,0.01000,6.199
|
|
|