|
layer,module,loss,damp,time
|
|
0,self_attn.k_proj,0.04410,0.01000,0.681
|
|
0,self_attn.v_proj,0.00009,0.01000,0.501
|
|
0,self_attn.q_proj,0.04807,0.01000,0.533
|
|
0,self_attn.o_proj,0.00000,0.01000,0.508
|
|
0,mlp.up_proj,0.01518,0.01000,0.556
|
|
0,mlp.gate_proj,0.01725,0.01000,0.543
|
|
0,mlp.down_proj,0.00004,0.01000,1.501
|
|
1,self_attn.k_proj,0.00021,0.01000,0.527
|
|
1,self_attn.v_proj,0.00000,0.01000,0.525
|
|
1,self_attn.q_proj,0.00030,0.01000,0.544
|
|
1,self_attn.o_proj,0.00000,0.01000,0.567
|
|
1,mlp.up_proj,0.00012,0.01000,0.559
|
|
1,mlp.gate_proj,0.00014,0.01000,0.568
|
|
1,mlp.down_proj,0.00000,0.01000,1.511
|
|
|