File size: 15,567 Bytes
a6baa9c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 |
layer,module,loss,damp,time
0,self_attn.k_proj,0.0000002985,0.01000,4.947
0,self_attn.v_proj,0.0000000628,0.01000,1.884
0,self_attn.q_proj,0.0000008087,0.01000,1.865
0,self_attn.o_proj,0.0000009411,0.01000,1.889
0,mlp.up_proj,0.0000003857,0.01000,1.936
0,mlp.gate_proj,0.0000004343,0.01000,1.944
0,mlp.down_proj,0.0000008139,0.01000,6.115
1,self_attn.k_proj,0.0000000138,0.01000,1.904
1,self_attn.v_proj,0.0000000049,0.01000,1.858
1,self_attn.q_proj,0.0000000554,0.01000,1.897
1,self_attn.o_proj,0.0000000136,0.01000,1.902
1,mlp.up_proj,0.0000018059,0.01000,1.992
1,mlp.gate_proj,0.0000048088,0.01000,1.986
1,mlp.down_proj,0.0000000962,0.01000,6.180
2,self_attn.k_proj,0.0000000607,0.01000,1.859
2,self_attn.v_proj,0.0000000150,0.01000,1.884
2,self_attn.q_proj,0.0000001718,0.01000,1.890
2,self_attn.o_proj,0.0000000996,0.01000,1.952
2,mlp.up_proj,0.0000043320,0.01000,2.028
2,mlp.gate_proj,0.0000081417,0.01000,1.956
2,mlp.down_proj,0.0000004419,0.01000,6.144
3,self_attn.k_proj,0.0000003379,0.01000,1.877
3,self_attn.v_proj,0.0000000693,0.01000,1.870
3,self_attn.q_proj,0.0000009042,0.01000,1.892
3,self_attn.o_proj,0.0000002491,0.01000,1.931
3,mlp.up_proj,0.0000050404,0.01000,1.994
3,mlp.gate_proj,0.0000106641,0.01000,1.996
3,mlp.down_proj,0.0000007892,0.01000,6.105
4,self_attn.k_proj,0.0000003962,0.01000,1.884
4,self_attn.v_proj,0.0000001156,0.01000,1.823
4,self_attn.q_proj,0.0000010681,0.01000,1.846
4,self_attn.o_proj,0.0000004779,0.01000,1.910
4,mlp.up_proj,0.0000107675,0.01000,2.053
4,mlp.gate_proj,0.0000199058,0.01000,2.028
4,mlp.down_proj,0.0013483506,0.01000,6.148
5,self_attn.k_proj,0.0000013836,0.01000,1.869
5,self_attn.v_proj,0.0000005688,0.01000,1.827
5,self_attn.q_proj,0.0000044049,0.01000,1.926
5,self_attn.o_proj,0.0000007381,0.01000,1.906
5,mlp.up_proj,0.0000180994,0.01000,1.995
5,mlp.gate_proj,0.0000349824,0.01000,1.990
5,mlp.down_proj,0.0000037041,0.01000,6.229
6,self_attn.k_proj,0.0000015295,0.01000,1.891
6,self_attn.v_proj,0.0000008116,0.01000,1.841
6,self_attn.q_proj,0.0000052489,0.01000,1.904
6,self_attn.o_proj,0.0000006595,0.01000,1.914
6,mlp.up_proj,0.0000294027,0.01000,2.036
6,mlp.gate_proj,0.0000543190,0.01000,2.000
6,mlp.down_proj,0.0000033944,0.01000,6.185
7,self_attn.k_proj,0.0000022324,0.01000,1.848
7,self_attn.v_proj,0.0000012807,0.01000,1.836
7,self_attn.q_proj,0.0000077740,0.01000,1.898
7,self_attn.o_proj,0.0000006588,0.01000,1.889
7,mlp.up_proj,0.0000377604,0.01000,2.007
7,mlp.gate_proj,0.0000714821,0.01000,2.013
7,mlp.down_proj,0.0000025652,0.01000,6.107
8,self_attn.k_proj,0.0000024254,0.01000,1.863
8,self_attn.v_proj,0.0000010471,0.01000,1.841
8,self_attn.q_proj,0.0000081145,0.01000,1.936
8,self_attn.o_proj,0.0000005655,0.01000,1.886
8,mlp.up_proj,0.0000263257,0.01000,2.090
8,mlp.gate_proj,0.0000475203,0.01000,2.009
8,mlp.down_proj,0.0000034082,0.01000,6.117
9,self_attn.k_proj,0.0000022917,0.01000,1.865
9,self_attn.v_proj,0.0000013029,0.01000,1.832
9,self_attn.q_proj,0.0000077636,0.01000,1.919
9,self_attn.o_proj,0.0000010365,0.01000,1.908
9,mlp.up_proj,0.0000193074,0.01000,1.997
9,mlp.gate_proj,0.0000211020,0.01000,2.014
9,mlp.down_proj,0.0000048219,0.01000,6.151
10,self_attn.k_proj,0.0000034324,0.01000,1.867
10,self_attn.v_proj,0.0000019137,0.01000,1.831
10,self_attn.q_proj,0.0000121056,0.01000,1.897
10,self_attn.o_proj,0.0000010023,0.01000,1.873
10,mlp.up_proj,0.0000224903,0.01000,2.013
10,mlp.gate_proj,0.0000246599,0.01000,2.011
10,mlp.down_proj,0.0000059849,0.01000,6.103
11,self_attn.k_proj,0.0000025495,0.01000,1.908
11,self_attn.v_proj,0.0000012462,0.01000,1.865
11,self_attn.q_proj,0.0000090048,0.01000,1.923
11,self_attn.o_proj,0.0000014718,0.01000,1.924
11,mlp.up_proj,0.0000258469,0.01000,2.027
11,mlp.gate_proj,0.0000321958,0.01000,1.986
11,mlp.down_proj,0.0000051555,0.01000,6.087
12,self_attn.k_proj,0.0000031215,0.01000,1.847
12,self_attn.v_proj,0.0000014327,0.01000,1.841
12,self_attn.q_proj,0.0000111406,0.01000,1.893
12,self_attn.o_proj,0.0000017573,0.01000,1.957
12,mlp.up_proj,0.0000284193,0.01000,2.017
12,mlp.gate_proj,0.0000301645,0.01000,1.993
12,mlp.down_proj,0.0000064959,0.01000,6.090
13,self_attn.k_proj,0.0000034285,0.01000,1.923
13,self_attn.v_proj,0.0000017783,0.01000,1.831
13,self_attn.q_proj,0.0000119425,0.01000,1.911
13,self_attn.o_proj,0.0000020312,0.01000,1.861
13,mlp.up_proj,0.0000325586,0.01000,2.011
13,mlp.gate_proj,0.0000345637,0.01000,1.978
13,mlp.down_proj,0.0000076320,0.01000,6.090
14,self_attn.k_proj,0.0000042219,0.01000,1.872
14,self_attn.v_proj,0.0000019629,0.01000,1.827
14,self_attn.q_proj,0.0000144176,0.01000,1.895
14,self_attn.o_proj,0.0000020731,0.01000,1.931
14,mlp.up_proj,0.0000335783,0.01000,2.019
14,mlp.gate_proj,0.0000354549,0.01000,2.017
14,mlp.down_proj,0.0000079941,0.01000,6.158
15,self_attn.k_proj,0.0000036243,0.01000,1.894
15,self_attn.v_proj,0.0000022559,0.01000,1.827
15,self_attn.q_proj,0.0000129040,0.01000,1.897
15,self_attn.o_proj,0.0000027518,0.01000,1.912
15,mlp.up_proj,0.0000350510,0.01000,2.121
15,mlp.gate_proj,0.0000385737,0.01000,1.996
15,mlp.down_proj,0.0000085556,0.01000,6.094
16,self_attn.k_proj,0.0000036654,0.01000,1.849
16,self_attn.v_proj,0.0000015336,0.01000,1.822
16,self_attn.q_proj,0.0000115880,0.01000,1.872
16,self_attn.o_proj,0.0000024392,0.01000,1.921
16,mlp.up_proj,0.0000326376,0.01000,2.085
16,mlp.gate_proj,0.0000331992,0.01000,2.003
16,mlp.down_proj,0.0000084625,0.01000,6.173
17,self_attn.k_proj,0.0000040579,0.01000,1.885
17,self_attn.v_proj,0.0000018465,0.01000,1.861
17,self_attn.q_proj,0.0000138158,0.01000,1.906
17,self_attn.o_proj,0.0000025808,0.01000,1.932
17,mlp.up_proj,0.0000322729,0.01000,2.001
17,mlp.gate_proj,0.0000317870,0.01000,1.997
17,mlp.down_proj,0.0000080485,0.01000,6.129
18,self_attn.k_proj,0.0000039598,0.01000,1.839
18,self_attn.v_proj,0.0000020382,0.01000,1.798
18,self_attn.q_proj,0.0000137095,0.01000,1.895
18,self_attn.o_proj,0.0000029167,0.01000,1.892
18,mlp.up_proj,0.0000323423,0.01000,1.998
18,mlp.gate_proj,0.0000308571,0.01000,2.011
18,mlp.down_proj,0.0000081186,0.01000,6.181
19,self_attn.k_proj,0.0000043350,0.01000,1.867
19,self_attn.v_proj,0.0000020963,0.01000,1.811
19,self_attn.q_proj,0.0000163849,0.01000,1.886
19,self_attn.o_proj,0.0000022194,0.01000,1.976
19,mlp.up_proj,0.0000333286,0.01000,2.074
19,mlp.gate_proj,0.0000317924,0.01000,2.042
19,mlp.down_proj,0.0000083289,0.01000,6.124
20,self_attn.k_proj,0.0000045548,0.01000,1.827
20,self_attn.v_proj,0.0000019402,0.01000,1.863
20,self_attn.q_proj,0.0000157211,0.01000,1.926
20,self_attn.o_proj,0.0000029912,0.01000,1.890
20,mlp.up_proj,0.0000323250,0.01000,2.020
20,mlp.gate_proj,0.0000292523,0.01000,1.999
20,mlp.down_proj,0.0000087532,0.01000,6.119
21,self_attn.k_proj,0.0000042023,0.01000,1.894
21,self_attn.v_proj,0.0000019321,0.01000,1.853
21,self_attn.q_proj,0.0000144628,0.01000,1.918
21,self_attn.o_proj,0.0000030416,0.01000,1.891
21,mlp.up_proj,0.0000326811,0.01000,1.994
21,mlp.gate_proj,0.0000293238,0.01000,1.979
21,mlp.down_proj,0.0000085412,0.01000,6.151
22,self_attn.k_proj,0.0000046789,0.01000,1.887
22,self_attn.v_proj,0.0000028668,0.01000,1.833
22,self_attn.q_proj,0.0000161835,0.01000,1.896
22,self_attn.o_proj,0.0000038789,0.01000,1.901
22,mlp.up_proj,0.0000331632,0.01000,2.071
22,mlp.gate_proj,0.0000295798,0.01000,1.978
22,mlp.down_proj,0.0000096156,0.01000,6.178
23,self_attn.k_proj,0.0000043162,0.01000,1.860
23,self_attn.v_proj,0.0000028849,0.01000,1.833
23,self_attn.q_proj,0.0000160021,0.01000,1.861
23,self_attn.o_proj,0.0000037945,0.01000,1.923
23,mlp.up_proj,0.0000337720,0.01000,2.003
23,mlp.gate_proj,0.0000317463,0.01000,2.011
23,mlp.down_proj,0.0000093671,0.01000,6.194
24,self_attn.k_proj,0.0000057187,0.01000,1.942
24,self_attn.v_proj,0.0000024407,0.01000,1.866
24,self_attn.q_proj,0.0000181873,0.01000,1.904
24,self_attn.o_proj,0.0000041032,0.01000,1.924
24,mlp.up_proj,0.0000324691,0.01000,2.000
24,mlp.gate_proj,0.0000301167,0.01000,1.985
24,mlp.down_proj,0.0000084492,0.01000,6.136
25,self_attn.k_proj,0.0000055621,0.01000,1.846
25,self_attn.v_proj,0.0000031424,0.01000,1.823
25,self_attn.q_proj,0.0000198023,0.01000,1.922
25,self_attn.o_proj,0.0000028802,0.01000,1.885
25,mlp.up_proj,0.0000330885,0.01000,2.068
25,mlp.gate_proj,0.0000296588,0.01000,2.031
25,mlp.down_proj,0.0000089875,0.01000,6.062
26,self_attn.k_proj,0.0000050286,0.01000,1.858
26,self_attn.v_proj,0.0000021552,0.01000,1.866
26,self_attn.q_proj,0.0000176642,0.01000,1.899
26,self_attn.o_proj,0.0000031027,0.01000,1.904
26,mlp.up_proj,0.0000356900,0.01000,2.014
26,mlp.gate_proj,0.0000308428,0.01000,1.988
26,mlp.down_proj,0.0000103464,0.01000,6.112
27,self_attn.k_proj,0.0000050559,0.01000,1.826
27,self_attn.v_proj,0.0000026083,0.01000,1.817
27,self_attn.q_proj,0.0000170910,0.01000,1.898
27,self_attn.o_proj,0.0000044997,0.01000,1.891
27,mlp.up_proj,0.0000373241,0.01000,2.002
27,mlp.gate_proj,0.0000323265,0.01000,2.026
27,mlp.down_proj,0.0000123207,0.01000,6.172
28,self_attn.k_proj,0.0000042150,0.01000,1.883
28,self_attn.v_proj,0.0000037593,0.01000,1.861
28,self_attn.q_proj,0.0000171301,0.01000,1.885
28,self_attn.o_proj,0.0000054424,0.01000,1.916
28,mlp.up_proj,0.0000382802,0.01000,1.990
28,mlp.gate_proj,0.0000329041,0.01000,2.059
28,mlp.down_proj,0.0000136056,0.01000,6.099
29,self_attn.k_proj,0.0000055420,0.01000,1.847
29,self_attn.v_proj,0.0000036558,0.01000,1.942
29,self_attn.q_proj,0.0000196112,0.01000,1.991
29,self_attn.o_proj,0.0000046135,0.01000,1.879
29,mlp.up_proj,0.0000391342,0.01000,2.033
29,mlp.gate_proj,0.0000337284,0.01000,1.968
29,mlp.down_proj,0.0000148448,0.01000,6.136
30,self_attn.k_proj,0.0000047346,0.01000,1.847
30,self_attn.v_proj,0.0000041514,0.01000,1.863
30,self_attn.q_proj,0.0000184229,0.01000,1.959
30,self_attn.o_proj,0.0000064813,0.01000,1.855
30,mlp.up_proj,0.0000411291,0.01000,2.034
30,mlp.gate_proj,0.0000354981,0.01000,2.003
30,mlp.down_proj,0.0000166990,0.01000,6.158
31,self_attn.k_proj,0.0000048687,0.01000,1.867
31,self_attn.v_proj,0.0000040193,0.01000,1.842
31,self_attn.q_proj,0.0000189473,0.01000,1.897
31,self_attn.o_proj,0.0000054662,0.01000,1.928
31,mlp.up_proj,0.0000457638,0.01000,2.001
31,mlp.gate_proj,0.0000403368,0.01000,2.053
31,mlp.down_proj,0.0000203712,0.01000,6.115
32,self_attn.k_proj,0.0000053250,0.01000,1.836
32,self_attn.v_proj,0.0000053774,0.01000,1.829
32,self_attn.q_proj,0.0000208265,0.01000,1.948
32,self_attn.o_proj,0.0000054974,0.01000,1.923
32,mlp.up_proj,0.0000489943,0.01000,2.010
32,mlp.gate_proj,0.0000443471,0.01000,2.022
32,mlp.down_proj,0.0000236334,0.01000,6.119
33,self_attn.k_proj,0.0000055528,0.01000,1.860
33,self_attn.v_proj,0.0000053279,0.01000,1.855
33,self_attn.q_proj,0.0000225135,0.01000,1.882
33,self_attn.o_proj,0.0000065416,0.01000,1.911
33,mlp.up_proj,0.0000581524,0.01000,1.989
33,mlp.gate_proj,0.0000532374,0.01000,1.992
33,mlp.down_proj,0.0000341816,0.01000,6.194
34,self_attn.k_proj,0.0000057969,0.01000,1.865
34,self_attn.v_proj,0.0000065100,0.01000,1.820
34,self_attn.q_proj,0.0000247060,0.01000,1.933
34,self_attn.o_proj,0.0000064140,0.01000,1.974
34,mlp.up_proj,0.0000676059,0.01000,1.996
34,mlp.gate_proj,0.0000639034,0.01000,1.969
34,mlp.down_proj,0.0000421207,0.01000,6.114
35,self_attn.k_proj,0.0000056806,0.01000,1.843
35,self_attn.v_proj,0.0000058037,0.01000,1.859
35,self_attn.q_proj,0.0000227509,0.01000,1.864
35,self_attn.o_proj,0.0000107215,0.01000,1.953
35,mlp.up_proj,0.0000773738,0.01000,2.075
35,mlp.gate_proj,0.0000748045,0.01000,2.003
35,mlp.down_proj,0.0000531376,0.01000,6.151
36,self_attn.k_proj,0.0000064778,0.01000,1.826
36,self_attn.v_proj,0.0000105387,0.01000,1.820
36,self_attn.q_proj,0.0000284083,0.01000,1.898
36,self_attn.o_proj,0.0000097221,0.01000,1.959
36,mlp.up_proj,0.0000858965,0.01000,2.012
36,mlp.gate_proj,0.0000823549,0.01000,2.042
36,mlp.down_proj,0.0000657707,0.01000,6.164
37,self_attn.k_proj,0.0000074679,0.01000,1.836
37,self_attn.v_proj,0.0000103437,0.01000,1.870
37,self_attn.q_proj,0.0000301686,0.01000,1.843
37,self_attn.o_proj,0.0000103363,0.01000,1.949
37,mlp.up_proj,0.0000963696,0.01000,2.029
37,mlp.gate_proj,0.0000927627,0.01000,1.995
37,mlp.down_proj,0.0000759659,0.01000,6.172
38,self_attn.k_proj,0.0000072543,0.01000,1.906
38,self_attn.v_proj,0.0000103870,0.01000,1.833
38,self_attn.q_proj,0.0000302236,0.01000,1.885
38,self_attn.o_proj,0.0000106793,0.01000,1.909
38,mlp.up_proj,0.0001080096,0.01000,1.994
38,mlp.gate_proj,0.0001029393,0.01000,2.037
38,mlp.down_proj,0.0000864311,0.01000,6.118
39,self_attn.k_proj,0.0000070753,0.01000,1.848
39,self_attn.v_proj,0.0000115101,0.01000,1.855
39,self_attn.q_proj,0.0000317167,0.01000,1.926
39,self_attn.o_proj,0.0000149693,0.01000,1.908
39,mlp.up_proj,0.0001216658,0.01000,2.038
39,mlp.gate_proj,0.0001149202,0.01000,2.005
39,mlp.down_proj,0.0001039416,0.01000,6.191
40,self_attn.k_proj,0.0000081462,0.01000,1.824
40,self_attn.v_proj,0.0000157852,0.01000,1.910
40,self_attn.q_proj,0.0000353841,0.01000,1.991
40,self_attn.o_proj,0.0000151671,0.01000,1.913
40,mlp.up_proj,0.0001326770,0.01000,2.002
40,mlp.gate_proj,0.0001247391,0.01000,2.012
40,mlp.down_proj,0.0001193831,0.01000,6.104
41,self_attn.k_proj,0.0000079063,0.01000,1.881
41,self_attn.v_proj,0.0000165749,0.01000,1.930
41,self_attn.q_proj,0.0000366510,0.01000,1.896
41,self_attn.o_proj,0.0000124038,0.01000,1.877
41,mlp.up_proj,0.0001447803,0.01000,1.999
41,mlp.gate_proj,0.0001340893,0.01000,1.963
41,mlp.down_proj,0.0001349494,0.01000,6.061
42,self_attn.k_proj,0.0000083146,0.01000,1.833
42,self_attn.v_proj,0.0000181338,0.01000,1.793
42,self_attn.q_proj,0.0000357798,0.01000,1.855
42,self_attn.o_proj,0.0000141514,0.01000,1.914
42,mlp.up_proj,0.0001559160,0.01000,1.990
42,mlp.gate_proj,0.0001425551,0.01000,1.997
42,mlp.down_proj,0.0001580665,0.01000,6.099
43,self_attn.k_proj,0.0000083956,0.01000,1.822
43,self_attn.v_proj,0.0000256210,0.01000,1.813
43,self_attn.q_proj,0.0000399949,0.01000,1.861
43,self_attn.o_proj,0.0000247247,0.01000,1.883
43,mlp.up_proj,0.0001706939,0.01000,2.020
43,mlp.gate_proj,0.0001531956,0.01000,2.037
43,mlp.down_proj,0.0001867778,0.01000,6.179
44,self_attn.k_proj,0.0000076330,0.01000,1.852
44,self_attn.v_proj,0.0000281914,0.01000,1.820
44,self_attn.q_proj,0.0000391793,0.01000,1.889
44,self_attn.o_proj,0.0000360502,0.01000,1.884
44,mlp.up_proj,0.0001831046,0.01000,1.963
44,mlp.gate_proj,0.0001616602,0.01000,1.966
44,mlp.down_proj,0.0002535868,0.01000,6.108
45,self_attn.k_proj,0.0000079784,0.01000,1.892
45,self_attn.v_proj,0.0000340295,0.01000,1.838
45,self_attn.q_proj,0.0000422606,0.01000,1.895
45,self_attn.o_proj,0.0000337677,0.01000,1.944
45,mlp.up_proj,0.0001918452,0.01000,1.990
45,mlp.gate_proj,0.0001717587,0.01000,1.985
45,mlp.down_proj,0.0002833572,0.01000,6.189
46,self_attn.k_proj,0.0000071048,0.01000,1.838
46,self_attn.v_proj,0.0000363993,0.01000,1.838
46,self_attn.q_proj,0.0000375253,0.01000,1.876
46,self_attn.o_proj,0.0000640068,0.01000,1.919
46,mlp.up_proj,0.0001911036,0.01000,2.009
46,mlp.gate_proj,0.0001784168,0.01000,2.081
46,mlp.down_proj,0.0004206370,0.01000,6.225
47,self_attn.k_proj,0.0000061165,0.01000,1.837
47,self_attn.v_proj,0.0000228788,0.01000,1.920
47,self_attn.q_proj,0.0000279219,0.01000,1.940
47,self_attn.o_proj,0.0000288922,0.01000,1.906
47,mlp.up_proj,0.0002043838,0.01000,2.035
47,mlp.gate_proj,0.0001966780,0.01000,2.033
47,mlp.down_proj,0.0006320129,0.01000,6.199
|