File size: 19,239 Bytes
098533b | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 | layer,module,loss,samples,damp,time
0,linear_attn.in_proj_qkv,0.0000002075,0.05000,1.370
0,linear_attn.in_proj_z,0.0000001358,0.05000,1.004
0,linear_attn.out_proj,0.0000000001,0.05000,1.244
0,mlp.up_proj,0.0000000012,0.05000,1.379
0,mlp.gate_proj,0.0000000013,0.05000,1.396
0,mlp.down_proj,0.0000000000,0.05000,3.793
1,linear_attn.in_proj_qkv,0.0000000111,0.05000,1.035
1,linear_attn.in_proj_z,0.0000000068,0.05000,1.032
1,linear_attn.out_proj,0.0000000000,0.05000,1.236
1,mlp.up_proj,0.0000000026,0.05000,1.413
1,mlp.gate_proj,0.0000000028,0.05000,1.457
1,mlp.down_proj,0.0000000000,0.05000,3.695
2,linear_attn.in_proj_qkv,0.0000000156,0.05000,1.028
2,linear_attn.in_proj_z,0.0000000094,0.05000,1.029
2,linear_attn.out_proj,0.0000000000,0.05000,1.230
2,mlp.up_proj,0.0000000042,0.05000,1.426
2,mlp.gate_proj,0.0000000045,0.05000,1.470
2,mlp.down_proj,0.0000000001,0.05000,3.677
3,self_attn.q_proj,0.0000001636,0.05000,1.746
3,self_attn.v_proj,0.0000000129,0.05000,1.758
3,self_attn.k_proj,0.0000000128,0.05000,1.780
3,self_attn.o_proj,0.0000000000,0.05000,1.231
3,mlp.gate_proj,0.0000000052,0.05000,1.425
3,mlp.up_proj,0.0000000050,0.05000,1.430
3,mlp.down_proj,0.0000000000,0.05000,3.709
4,linear_attn.in_proj_qkv,0.0000000191,0.05000,1.034
4,linear_attn.in_proj_z,0.0000000122,0.05000,1.032
4,linear_attn.out_proj,0.0000000001,0.05000,1.229
4,mlp.up_proj,0.0000000066,0.05000,1.453
4,mlp.gate_proj,0.0000000069,0.05000,1.485
4,mlp.down_proj,0.0000000000,0.05000,3.699
5,linear_attn.in_proj_qkv,0.0000000245,0.05000,1.044
5,linear_attn.in_proj_z,0.0000000158,0.05000,1.019
5,linear_attn.out_proj,0.0000000001,0.05000,1.222
5,mlp.gate_proj,0.0000000087,0.05000,1.436
5,mlp.up_proj,0.0000000082,0.05000,1.456
5,mlp.down_proj,0.0000000001,0.05000,3.728
6,linear_attn.in_proj_qkv,0.0000000396,0.05000,1.041
6,linear_attn.in_proj_z,0.0000000235,0.05000,1.026
6,linear_attn.out_proj,0.0000000001,0.05000,1.227
6,mlp.gate_proj,0.0000000126,0.05000,1.474
6,mlp.up_proj,0.0000000116,0.05000,1.478
6,mlp.down_proj,0.0000000001,0.05000,3.676
7,self_attn.q_proj,0.0000001413,0.05000,1.711
7,self_attn.v_proj,0.0000000113,0.05000,1.726
7,self_attn.k_proj,0.0000000121,0.05000,1.752
7,self_attn.o_proj,0.0000000001,0.05000,1.225
7,mlp.up_proj,0.0000000127,0.05000,1.418
7,mlp.gate_proj,0.0000000137,0.05000,1.421
7,mlp.down_proj,0.0000000002,0.05000,3.712
8,linear_attn.in_proj_qkv,0.0000000387,0.05000,1.035
8,linear_attn.in_proj_z,0.0000000243,0.05000,1.015
8,linear_attn.out_proj,0.0000000002,0.05000,1.225
8,mlp.up_proj,0.0000000147,0.05000,1.425
8,mlp.gate_proj,0.0000000157,0.05000,1.457
8,mlp.down_proj,0.0000000002,0.05000,3.715
9,linear_attn.in_proj_qkv,0.0000000406,0.05000,1.034
9,linear_attn.in_proj_z,0.0000000246,0.05000,1.008
9,linear_attn.out_proj,0.0000000002,0.05000,1.228
9,mlp.gate_proj,0.0000000178,0.05000,1.450
9,mlp.up_proj,0.0000000167,0.05000,1.469
9,mlp.down_proj,0.0000000003,0.05000,3.706
10,linear_attn.in_proj_qkv,0.0000000437,0.05000,1.030
10,linear_attn.in_proj_z,0.0000000256,0.05000,1.004
10,linear_attn.out_proj,0.0000000002,0.05000,1.237
10,mlp.up_proj,0.0000000178,0.05000,1.444
10,mlp.gate_proj,0.0000000189,0.05000,1.458
10,mlp.down_proj,0.0000000003,0.05000,3.636
11,self_attn.k_proj,0.0000000117,0.05000,1.733
11,self_attn.q_proj,0.0000001285,0.05000,1.733
11,self_attn.v_proj,0.0000000104,0.05000,1.742
11,self_attn.o_proj,0.0000000002,0.05000,1.227
11,mlp.gate_proj,0.0000000206,0.05000,1.423
11,mlp.up_proj,0.0000000196,0.05000,1.430
11,mlp.down_proj,0.0000000004,0.05000,3.723
12,linear_attn.in_proj_qkv,0.0000000517,0.05000,1.036
12,linear_attn.in_proj_z,0.0000000303,0.05000,1.009
12,linear_attn.out_proj,0.0000000003,0.05000,1.227
12,mlp.gate_proj,0.0000000217,0.05000,1.387
12,mlp.up_proj,0.0000000206,0.05000,1.396
12,mlp.down_proj,0.0000000004,0.05000,3.688
13,linear_attn.in_proj_qkv,0.0000000543,0.05000,1.022
13,linear_attn.in_proj_z,0.0000000303,0.05000,1.012
13,linear_attn.out_proj,0.0000000004,0.05000,1.231
13,mlp.gate_proj,0.0000000234,0.05000,1.392
13,mlp.up_proj,0.0000000223,0.05000,1.414
13,mlp.down_proj,0.0000000005,0.05000,3.705
14,linear_attn.in_proj_qkv,0.0000000611,0.05000,1.010
14,linear_attn.in_proj_z,0.0000000349,0.05000,1.027
14,linear_attn.out_proj,0.0000000005,0.05000,1.224
14,mlp.gate_proj,0.0000000249,0.05000,1.391
14,mlp.up_proj,0.0000000238,0.05000,1.413
14,mlp.down_proj,0.0000000005,0.05000,3.677
15,self_attn.v_proj,0.0000000096,0.05000,1.707
15,self_attn.q_proj,0.0000001083,0.05000,1.713
15,self_attn.k_proj,0.0000000100,0.05000,1.761
15,self_attn.o_proj,0.0000000003,0.05000,1.232
15,mlp.up_proj,0.0000000278,0.05000,1.418
15,mlp.gate_proj,0.0000000289,0.05000,1.426
15,mlp.down_proj,0.0000000007,0.05000,3.684
16,linear_attn.in_proj_qkv,0.0000000651,0.05000,1.008
16,linear_attn.in_proj_z,0.0000000368,0.05000,1.011
16,linear_attn.out_proj,0.0000000005,0.05000,1.229
16,mlp.gate_proj,0.0000000321,0.05000,1.423
16,mlp.up_proj,0.0000000307,0.05000,1.444
16,mlp.down_proj,0.0000000008,0.05000,3.675
17,linear_attn.in_proj_qkv,0.0000000748,0.05000,1.021
17,linear_attn.in_proj_z,0.0000000373,0.05000,1.012
17,linear_attn.out_proj,0.0000000007,0.05000,1.231
17,mlp.gate_proj,0.0000000371,0.05000,1.425
17,mlp.up_proj,0.0000000355,0.05000,1.433
17,mlp.down_proj,0.0000000011,0.05000,3.682
18,linear_attn.in_proj_qkv,0.0000000799,0.05000,1.029
18,linear_attn.in_proj_z,0.0000000435,0.05000,1.011
18,linear_attn.out_proj,0.0000000009,0.05000,1.237
18,mlp.up_proj,0.0000000432,0.05000,1.412
18,mlp.gate_proj,0.0000000469,0.05000,1.430
18,mlp.down_proj,0.0000000017,0.05000,3.702
19,self_attn.q_proj,0.0000001313,0.05000,1.704
19,self_attn.k_proj,0.0000000129,0.05000,1.721
19,self_attn.v_proj,0.0000000148,0.05000,1.732
19,self_attn.o_proj,0.0000000014,0.05000,1.228
19,mlp.gate_proj,0.0000000578,0.05000,1.389
19,mlp.up_proj,0.0000000545,0.05000,1.400
19,mlp.down_proj,0.0000000023,0.05000,3.726
20,linear_attn.in_proj_qkv,0.0000001444,0.05000,1.033
20,linear_attn.in_proj_z,0.0000000797,0.05000,1.030
20,linear_attn.out_proj,0.0000000014,0.05000,1.230
20,mlp.up_proj,0.0000000645,0.05000,1.407
20,mlp.gate_proj,0.0000000699,0.05000,1.447
20,mlp.down_proj,0.0000000026,0.05000,3.746
21,linear_attn.in_proj_qkv,0.0000001775,0.05000,1.028
21,linear_attn.in_proj_z,0.0000001111,0.05000,1.027
21,linear_attn.out_proj,0.0000000019,0.05000,1.229
21,mlp.gate_proj,0.0000000760,0.05000,1.414
21,mlp.up_proj,0.0000000707,0.05000,1.419
21,mlp.down_proj,0.0000000028,0.05000,3.753
22,linear_attn.in_proj_qkv,0.0000001534,0.05000,1.023
22,linear_attn.in_proj_z,0.0000000923,0.05000,1.035
22,linear_attn.out_proj,0.0000000017,0.05000,1.229
22,mlp.up_proj,0.0000000799,0.05000,1.397
22,mlp.gate_proj,0.0000000898,0.05000,1.398
22,mlp.down_proj,0.0000000033,0.05000,3.691
23,self_attn.k_proj,0.0000000186,0.05000,1.713
23,self_attn.v_proj,0.0000000191,0.05000,1.733
23,self_attn.q_proj,0.0000001725,0.05000,1.747
23,self_attn.o_proj,0.0000000017,0.05000,1.243
23,mlp.gate_proj,0.0000000931,0.05000,1.417
23,mlp.up_proj,0.0000000854,0.05000,1.428
23,mlp.down_proj,0.0000000034,0.05000,3.725
24,linear_attn.in_proj_qkv,0.0000001517,0.05000,1.022
24,linear_attn.in_proj_z,0.0000000844,0.05000,1.036
24,linear_attn.out_proj,0.0000000021,0.05000,1.229
24,mlp.gate_proj,0.0000001015,0.05000,1.445
24,mlp.up_proj,0.0000000928,0.05000,1.457
24,mlp.down_proj,0.0000000040,0.05000,3.743
25,linear_attn.in_proj_qkv,0.0000001549,0.05000,1.033
25,linear_attn.in_proj_z,0.0000000803,0.05000,1.032
25,linear_attn.out_proj,0.0000000022,0.05000,1.216
25,mlp.gate_proj,0.0000000983,0.05000,1.438
25,mlp.up_proj,0.0000000952,0.05000,1.442
25,mlp.down_proj,0.0000000041,0.05000,3.747
26,linear_attn.in_proj_qkv,0.0000001424,0.05000,1.024
26,linear_attn.in_proj_z,0.0000000707,0.05000,1.034
26,linear_attn.out_proj,0.0000000023,0.05000,1.207
26,mlp.gate_proj,0.0000000940,0.05000,1.456
26,mlp.up_proj,0.0000000966,0.05000,1.468
26,mlp.down_proj,0.0000000043,0.05000,3.704
27,self_attn.k_proj,0.0000000177,0.05000,1.741
27,self_attn.q_proj,0.0000001626,0.05000,1.761
27,self_attn.v_proj,0.0000000154,0.05000,1.770
27,self_attn.o_proj,0.0000000032,0.05000,1.254
27,mlp.gate_proj,0.0000000972,0.05000,1.431
27,mlp.up_proj,0.0000001030,0.05000,1.440
27,mlp.down_proj,0.0000000047,0.05000,3.722
28,linear_attn.in_proj_qkv,0.0000001435,0.05000,1.030
28,linear_attn.in_proj_z,0.0000000666,0.05000,1.040
28,linear_attn.out_proj,0.0000000029,0.05000,1.216
28,mlp.gate_proj,0.0000000946,0.05000,1.425
28,mlp.up_proj,0.0000001020,0.05000,1.432
28,mlp.down_proj,0.0000000050,0.05000,3.754
29,linear_attn.in_proj_qkv,0.0000001544,0.05000,1.028
29,linear_attn.in_proj_z,0.0000000705,0.05000,1.027
29,linear_attn.out_proj,0.0000000025,0.05000,1.214
29,mlp.gate_proj,0.0000000945,0.05000,1.439
29,mlp.up_proj,0.0000001026,0.05000,1.465
29,mlp.down_proj,0.0000000050,0.05000,3.763
30,linear_attn.in_proj_qkv,0.0000001554,0.05000,1.043
30,linear_attn.in_proj_z,0.0000000724,0.05000,1.068
30,linear_attn.out_proj,0.0000000033,0.05000,1.230
30,mlp.gate_proj,0.0000000917,0.05000,1.436
30,mlp.up_proj,0.0000001018,0.05000,1.448
30,mlp.down_proj,0.0000000049,0.05000,3.706
31,self_attn.v_proj,0.0000000185,0.05000,1.734
31,self_attn.q_proj,0.0000001505,0.05000,1.766
31,self_attn.k_proj,0.0000000166,0.05000,1.770
31,self_attn.o_proj,0.0000000040,0.05000,1.211
31,mlp.up_proj,0.0000001088,0.05000,1.442
31,mlp.gate_proj,0.0000000964,0.05000,1.472
31,mlp.down_proj,0.0000000053,0.05000,3.693
32,linear_attn.in_proj_qkv,0.0000001616,0.05000,1.040
32,linear_attn.in_proj_z,0.0000000702,0.05000,1.029
32,linear_attn.out_proj,0.0000000033,0.05000,1.232
32,mlp.gate_proj,0.0000001028,0.05000,1.418
32,mlp.up_proj,0.0000001162,0.05000,1.447
32,mlp.down_proj,0.0000000058,0.05000,3.762
33,linear_attn.in_proj_qkv,0.0000001914,0.05000,1.022
33,linear_attn.in_proj_z,0.0000000784,0.05000,1.034
33,linear_attn.out_proj,0.0000000039,0.05000,1.222
33,mlp.up_proj,0.0000001207,0.05000,1.393
33,mlp.gate_proj,0.0000001067,0.05000,1.399
33,mlp.down_proj,0.0000000059,0.05000,3.754
34,linear_attn.in_proj_qkv,0.0000001861,0.05000,1.026
34,linear_attn.in_proj_z,0.0000000843,0.05000,1.032
34,linear_attn.out_proj,0.0000000041,0.05000,1.230
34,mlp.gate_proj,0.0000001186,0.05000,1.425
34,mlp.up_proj,0.0000001293,0.05000,1.436
34,mlp.down_proj,0.0000000078,0.05000,3.695
35,self_attn.v_proj,0.0000000283,0.05000,1.770
35,self_attn.q_proj,0.0000001840,0.05000,1.786
35,self_attn.k_proj,0.0000000199,0.05000,1.801
35,self_attn.o_proj,0.0000000071,0.05000,1.228
35,mlp.up_proj,0.0000001330,0.05000,1.440
35,mlp.gate_proj,0.0000001239,0.05000,1.460
35,mlp.down_proj,0.0000000088,0.05000,3.733
36,linear_attn.in_proj_qkv,0.0000002602,0.05000,1.038
36,linear_attn.in_proj_z,0.0000001298,0.05000,1.035
36,linear_attn.out_proj,0.0000000037,0.05000,1.233
36,mlp.up_proj,0.0000001317,0.05000,1.429
36,mlp.gate_proj,0.0000001379,0.05000,1.470
36,mlp.down_proj,0.0000000081,0.05000,3.742
37,linear_attn.in_proj_qkv,0.0000002863,0.05000,1.028
37,linear_attn.in_proj_z,0.0000001613,0.05000,1.045
37,linear_attn.out_proj,0.0000000043,0.05000,1.226
37,mlp.up_proj,0.0000001320,0.05000,1.414
37,mlp.gate_proj,0.0000001398,0.05000,1.429
37,mlp.down_proj,0.0000000078,0.05000,3.719
38,linear_attn.in_proj_qkv,0.0000002546,0.05000,1.024
38,linear_attn.in_proj_z,0.0000001477,0.05000,1.026
38,linear_attn.out_proj,0.0000000032,0.05000,1.228
38,mlp.gate_proj,0.0000001848,0.05000,1.467
38,mlp.up_proj,0.0000001489,0.05000,1.517
38,mlp.down_proj,0.0000000082,0.05000,3.692
39,self_attn.k_proj,0.0000000249,0.05000,1.712
39,self_attn.v_proj,0.0000000300,0.05000,1.727
39,self_attn.q_proj,0.0000002229,0.05000,1.746
39,self_attn.o_proj,0.0000000049,0.05000,1.231
39,mlp.gate_proj,0.0000001662,0.05000,1.488
39,mlp.up_proj,0.0000001445,0.05000,1.489
39,mlp.down_proj,0.0000000080,0.05000,3.701
40,linear_attn.in_proj_qkv,0.0000002447,0.05000,1.026
40,linear_attn.in_proj_z,0.0000001349,0.05000,1.036
40,linear_attn.out_proj,0.0000000040,0.05000,1.232
40,mlp.up_proj,0.0000001539,0.05000,1.413
40,mlp.gate_proj,0.0000001819,0.05000,1.448
40,mlp.down_proj,0.0000000083,0.05000,3.806
41,linear_attn.in_proj_qkv,0.0000002201,0.05000,1.022
41,linear_attn.in_proj_z,0.0000001207,0.05000,1.030
41,linear_attn.out_proj,0.0000000035,0.05000,1.221
41,mlp.up_proj,0.0000001497,0.05000,1.471
41,mlp.gate_proj,0.0000001583,0.05000,1.473
41,mlp.down_proj,0.0000000083,0.05000,3.754
42,linear_attn.in_proj_qkv,0.0000002117,0.05000,1.028
42,linear_attn.in_proj_z,0.0000001109,0.05000,1.028
42,linear_attn.out_proj,0.0000000042,0.05000,1.236
42,mlp.gate_proj,0.0000001501,0.05000,1.430
42,mlp.up_proj,0.0000001533,0.05000,1.449
42,mlp.down_proj,0.0000000093,0.05000,3.761
43,self_attn.k_proj,0.0000000260,0.05000,1.730
43,self_attn.q_proj,0.0000002219,0.05000,1.731
43,self_attn.v_proj,0.0000000303,0.05000,1.771
43,self_attn.o_proj,0.0000000069,0.05000,1.220
43,mlp.up_proj,0.0000001592,0.05000,1.462
43,mlp.gate_proj,0.0000001490,0.05000,1.475
43,mlp.down_proj,0.0000000100,0.05000,3.767
44,linear_attn.in_proj_qkv,0.0000002080,0.05000,1.036
44,linear_attn.in_proj_z,0.0000001016,0.05000,1.032
44,linear_attn.out_proj,0.0000000061,0.05000,1.241
44,mlp.up_proj,0.0000001637,0.05000,1.431
44,mlp.gate_proj,0.0000001513,0.05000,1.432
44,mlp.down_proj,0.0000000115,0.05000,3.686
45,linear_attn.in_proj_qkv,0.0000002124,0.05000,1.032
45,linear_attn.in_proj_z,0.0000001036,0.05000,1.036
45,linear_attn.out_proj,0.0000000054,0.05000,1.239
45,mlp.gate_proj,0.0000001512,0.05000,1.415
45,mlp.up_proj,0.0000001650,0.05000,1.427
45,mlp.down_proj,0.0000000120,0.05000,3.729
46,linear_attn.in_proj_qkv,0.0000002224,0.05000,1.027
46,linear_attn.in_proj_z,0.0000001100,0.05000,1.042
46,linear_attn.out_proj,0.0000000082,0.05000,1.233
46,mlp.gate_proj,0.0000001491,0.05000,1.447
46,mlp.up_proj,0.0000001676,0.05000,1.473
46,mlp.down_proj,0.0000000132,0.05000,3.803
47,self_attn.q_proj,0.0000002389,0.05000,1.770
47,self_attn.k_proj,0.0000000255,0.05000,1.771
47,self_attn.v_proj,0.0000000391,0.05000,1.806
47,self_attn.o_proj,0.0000000089,0.05000,1.225
47,mlp.up_proj,0.0000001848,0.05000,1.439
47,mlp.gate_proj,0.0000001653,0.05000,1.443
47,mlp.down_proj,0.0000000162,0.05000,3.724
48,linear_attn.in_proj_qkv,0.0000002445,0.05000,1.042
48,linear_attn.in_proj_z,0.0000001161,0.05000,1.022
48,linear_attn.out_proj,0.0000000094,0.05000,1.247
48,mlp.gate_proj,0.0000001822,0.05000,1.439
48,mlp.up_proj,0.0000002028,0.05000,1.475
48,mlp.down_proj,0.0000000198,0.05000,3.687
49,linear_attn.in_proj_qkv,0.0000002972,0.05000,1.048
49,linear_attn.in_proj_z,0.0000001243,0.05000,1.020
49,linear_attn.out_proj,0.0000000127,0.05000,1.247
49,mlp.gate_proj,0.0000002012,0.05000,1.429
49,mlp.up_proj,0.0000002182,0.05000,1.436
49,mlp.down_proj,0.0000000258,0.05000,3.678
50,linear_attn.in_proj_qkv,0.0000003036,0.05000,1.038
50,linear_attn.in_proj_z,0.0000001385,0.05000,1.036
50,linear_attn.out_proj,0.0000000192,0.05000,1.246
50,mlp.gate_proj,0.0000002451,0.05000,1.427
50,mlp.up_proj,0.0000002521,0.05000,1.467
50,mlp.down_proj,0.0000000435,0.05000,3.690
51,self_attn.v_proj,0.0000000820,0.05000,1.735
51,self_attn.k_proj,0.0000000351,0.05000,1.748
51,self_attn.q_proj,0.0000003200,0.05000,1.751
51,self_attn.o_proj,0.0000000278,0.05000,1.241
51,mlp.up_proj,0.0000002922,0.05000,1.427
51,mlp.gate_proj,0.0000002748,0.05000,1.440
51,mlp.down_proj,0.0000000544,0.05000,3.721
52,linear_attn.in_proj_qkv,0.0000004735,0.05000,1.035
52,linear_attn.in_proj_z,0.0000002124,0.05000,1.033
52,linear_attn.out_proj,0.0000000231,0.05000,1.243
52,mlp.gate_proj,0.0000003281,0.05000,1.440
52,mlp.up_proj,0.0000003091,0.05000,1.457
52,mlp.down_proj,0.0000000524,0.05000,3.701
53,linear_attn.in_proj_qkv,0.0000004603,0.05000,1.067
53,linear_attn.in_proj_z,0.0000002217,0.05000,1.029
53,linear_attn.out_proj,0.0000000243,0.05000,1.285
53,mlp.gate_proj,0.0000003586,0.05000,1.436
53,mlp.up_proj,0.0000003214,0.05000,1.453
53,mlp.down_proj,0.0000000558,0.05000,3.702
54,linear_attn.in_proj_qkv,0.0000004444,0.05000,1.035
54,linear_attn.in_proj_z,0.0000002355,0.05000,1.034
54,linear_attn.out_proj,0.0000000238,0.05000,1.284
54,mlp.gate_proj,0.0000004498,0.05000,1.457
54,mlp.up_proj,0.0000003799,0.05000,1.459
54,mlp.down_proj,0.0000000769,0.05000,3.709
55,self_attn.q_proj,0.0000004171,0.05000,1.702
55,self_attn.v_proj,0.0000001058,0.05000,1.715
55,self_attn.k_proj,0.0000000506,0.05000,1.764
55,self_attn.o_proj,0.0000000284,0.05000,1.233
55,mlp.up_proj,0.0000003784,0.05000,1.428
55,mlp.gate_proj,0.0000004249,0.05000,1.451
55,mlp.down_proj,0.0000000625,0.05000,3.718
56,linear_attn.in_proj_qkv,0.0000004994,0.05000,1.030
56,linear_attn.in_proj_z,0.0000002452,0.05000,1.016
56,linear_attn.out_proj,0.0000000310,0.05000,1.245
56,mlp.gate_proj,0.0000004580,0.05000,1.428
56,mlp.up_proj,0.0000003986,0.05000,1.458
56,mlp.down_proj,0.0000000565,0.05000,3.724
57,linear_attn.in_proj_qkv,0.0000005406,0.05000,1.065
57,linear_attn.in_proj_z,0.0000002603,0.05000,1.041
57,linear_attn.out_proj,0.0000000297,0.05000,1.294
57,mlp.gate_proj,0.0000005248,0.05000,1.438
57,mlp.up_proj,0.0000004510,0.05000,1.470
57,mlp.down_proj,0.0000000598,0.05000,3.737
58,linear_attn.in_proj_qkv,0.0000005110,0.05000,1.052
58,linear_attn.in_proj_z,0.0000002702,0.05000,1.040
58,linear_attn.out_proj,0.0000000303,0.05000,1.231
58,mlp.up_proj,0.0000005175,0.05000,1.446
58,mlp.gate_proj,0.0000006045,0.05000,1.452
58,mlp.down_proj,0.0000000817,0.05000,3.716
59,self_attn.v_proj,0.0000002233,0.05000,1.734
59,self_attn.q_proj,0.0000004970,0.05000,1.753
59,self_attn.k_proj,0.0000000637,0.05000,1.772
59,self_attn.o_proj,0.0000000789,0.05000,1.238
59,mlp.gate_proj,0.0000005972,0.05000,1.396
59,mlp.up_proj,0.0000005255,0.05000,1.418
59,mlp.down_proj,0.0000000991,0.05000,3.727
60,linear_attn.in_proj_qkv,0.0000006119,0.05000,1.024
60,linear_attn.in_proj_z,0.0000002857,0.05000,1.027
60,linear_attn.out_proj,0.0000000744,0.05000,1.249
60,mlp.up_proj,0.0000005230,0.05000,1.451
60,mlp.gate_proj,0.0000005900,0.05000,1.456
60,mlp.down_proj,0.0000001247,0.05000,3.711
61,linear_attn.in_proj_qkv,0.0000004431,0.05000,1.027
61,linear_attn.in_proj_z,0.0000002485,0.05000,1.025
61,linear_attn.out_proj,0.0000000689,0.05000,1.219
61,mlp.gate_proj,0.0000006208,0.05000,1.409
61,mlp.up_proj,0.0000005521,0.05000,1.425
61,mlp.down_proj,0.0000001618,0.05000,3.708
62,linear_attn.in_proj_qkv,0.0000004958,0.05000,1.027
62,linear_attn.in_proj_z,0.0000002576,0.05000,1.038
62,linear_attn.out_proj,0.0000001895,0.05000,1.220
62,mlp.gate_proj,0.0000005716,0.05000,1.410
62,mlp.up_proj,0.0000005109,0.05000,1.443
62,mlp.down_proj,0.0000002368,0.05000,3.673
63,self_attn.q_proj,0.0000004438,0.05000,1.753
63,self_attn.k_proj,0.0000000597,0.05000,1.773
63,self_attn.v_proj,0.0000001823,0.05000,1.774
63,self_attn.o_proj,0.0000002019,0.05000,1.217
63,mlp.gate_proj,0.0000004743,0.05000,1.410
63,mlp.up_proj,0.0000004088,0.05000,1.411
63,mlp.down_proj,0.0000004359,0.05000,3.645
|