iproskurina's picture
Add files using upload-large-folder tool
97bcd9f verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.01193101,0.01000,0.766
0,self_attn.v_proj,0.00204742,0.01000,0.744
0,self_attn.q_proj,0.01151794,0.01000,0.751
0,self_attn.out_proj,0.00000879,0.01000,0.750
0,fc1,0.07220605,0.01000,0.777
0,fc2,0.00009904,0.01000,3.377
1,self_attn.k_proj,0.02748547,0.01000,0.773
1,self_attn.v_proj,0.00377348,0.01000,0.771
1,self_attn.q_proj,0.03053766,0.01000,0.799
1,self_attn.out_proj,0.00000212,0.01000,0.788
1,fc1,0.10564113,0.01000,0.766
1,fc2,0.00011769,0.01000,3.389
2,self_attn.k_proj,0.03364365,0.01000,0.774
2,self_attn.v_proj,0.00638163,0.01000,0.770
2,self_attn.q_proj,0.03404787,0.01000,0.763
2,self_attn.out_proj,0.00000442,0.01000,0.761
2,fc1,0.10685527,0.01000,0.783
2,fc2,0.00007892,0.01000,3.447
3,self_attn.k_proj,0.03226093,0.01000,0.772
3,self_attn.v_proj,0.00772221,0.01000,0.755
3,self_attn.q_proj,0.03518277,0.01000,0.763
3,self_attn.out_proj,0.00000809,0.01000,0.790
3,fc1,0.09162843,0.01000,0.769
3,fc2,0.00007157,0.01000,3.342
4,self_attn.k_proj,0.03976664,0.01000,0.771
4,self_attn.v_proj,0.00833308,0.01000,0.770
4,self_attn.q_proj,0.04298474,0.01000,0.770
4,self_attn.out_proj,0.00001194,0.01000,0.785
4,fc1,0.08744164,0.01000,0.789
4,fc2,0.00008075,0.01000,3.376
5,self_attn.k_proj,0.04211287,0.01000,0.773
5,self_attn.v_proj,0.00969345,0.01000,0.766
5,self_attn.q_proj,0.04678004,0.01000,0.765
5,self_attn.out_proj,0.00001155,0.01000,0.764
5,fc1,0.08947679,0.01000,0.773
5,fc2,0.00009699,0.01000,3.370
6,self_attn.k_proj,0.06050922,0.01000,0.801
6,self_attn.v_proj,0.01090727,0.01000,0.750
6,self_attn.q_proj,0.05891616,0.01000,0.755
6,self_attn.out_proj,0.00003464,0.01000,0.763
6,fc1,0.09683321,0.01000,0.768
6,fc2,0.00013900,0.01000,3.376
7,self_attn.k_proj,0.06143640,0.01000,0.792
7,self_attn.v_proj,0.01166906,0.01000,0.763
7,self_attn.q_proj,0.05640485,0.01000,0.786
7,self_attn.out_proj,0.00004408,0.01000,0.763
7,fc1,0.10895248,0.01000,0.778
7,fc2,0.00020347,0.01000,3.344
8,self_attn.k_proj,0.06507521,0.01000,0.768
8,self_attn.v_proj,0.01208323,0.01000,0.777
8,self_attn.q_proj,0.05399566,0.01000,0.760
8,self_attn.out_proj,0.00005616,0.01000,0.763
8,fc1,0.11881161,0.01000,0.782
8,fc2,0.00026443,0.01000,3.333
9,self_attn.k_proj,0.06506123,0.01000,0.786
9,self_attn.v_proj,0.01248781,0.01000,0.765
9,self_attn.q_proj,0.05453248,0.01000,0.783
9,self_attn.out_proj,0.00007938,0.01000,0.764
9,fc1,0.12274915,0.01000,0.769
9,fc2,0.00035536,0.01000,3.326
10,self_attn.k_proj,0.06140727,0.01000,0.768
10,self_attn.v_proj,0.01420014,0.01000,0.767
10,self_attn.q_proj,0.05016806,0.01000,0.763
10,self_attn.out_proj,0.00011017,0.01000,0.760
10,fc1,0.12526228,0.01000,0.774
10,fc2,0.00056714,0.01000,3.383
11,self_attn.k_proj,0.05852431,0.01000,0.759
11,self_attn.v_proj,0.01596023,0.01000,0.767
11,self_attn.q_proj,0.04750057,0.01000,0.764
11,self_attn.out_proj,0.00014029,0.01000,0.774
11,fc1,0.12785329,0.01000,0.775
11,fc2,0.00075469,0.01000,3.320
12,self_attn.k_proj,0.06211779,0.01000,0.773
12,self_attn.v_proj,0.01650352,0.01000,0.763
12,self_attn.q_proj,0.04717031,0.01000,0.777
12,self_attn.out_proj,0.00022129,0.01000,0.761
12,fc1,0.12406510,0.01000,0.769
12,fc2,0.00102223,0.01000,3.390
13,self_attn.k_proj,0.06443056,0.01000,0.781
13,self_attn.v_proj,0.01726957,0.01000,0.772
13,self_attn.q_proj,0.04661303,0.01000,0.758
13,self_attn.out_proj,0.00023633,0.01000,0.765
13,fc1,0.13054048,0.01000,0.792
13,fc2,0.00139816,0.01000,3.390
14,self_attn.k_proj,0.05847587,0.01000,0.771
14,self_attn.v_proj,0.02090536,0.01000,0.770
14,self_attn.q_proj,0.04376426,0.01000,0.788
14,self_attn.out_proj,0.00027757,0.01000,0.761
14,fc1,0.13830929,0.01000,0.779
14,fc2,0.00192462,0.01000,3.343
15,self_attn.k_proj,0.05246258,0.01000,0.773
15,self_attn.v_proj,0.02610055,0.01000,0.773
15,self_attn.q_proj,0.04327298,0.01000,0.758
15,self_attn.out_proj,0.00027173,0.01000,0.767
15,fc1,0.14475755,0.01000,0.775
15,fc2,0.00244589,0.01000,3.321
16,self_attn.k_proj,0.05219132,0.01000,0.786
16,self_attn.v_proj,0.02799954,0.01000,0.762
16,self_attn.q_proj,0.03783621,0.01000,0.763
16,self_attn.out_proj,0.00039026,0.01000,0.769
16,fc1,0.15572587,0.01000,0.782
16,fc2,0.00316169,0.01000,3.376
17,self_attn.k_proj,0.05054565,0.01000,0.830
17,self_attn.v_proj,0.03031302,0.01000,0.771
17,self_attn.q_proj,0.03752312,0.01000,0.761
17,self_attn.out_proj,0.00044570,0.01000,0.765
17,fc1,0.16843134,0.01000,0.772
17,fc2,0.00403455,0.01000,3.315
18,self_attn.k_proj,0.04542822,0.01000,0.766
18,self_attn.v_proj,0.03442155,0.01000,0.753
18,self_attn.q_proj,0.03605321,0.01000,0.759
18,self_attn.out_proj,0.00034129,0.01000,0.769
18,fc1,0.17829082,0.01000,0.769
18,fc2,0.00384275,0.01000,3.513
19,self_attn.k_proj,0.04639758,0.01000,0.772
19,self_attn.v_proj,0.04432996,0.01000,0.771
19,self_attn.q_proj,0.03613599,0.01000,0.770
19,self_attn.out_proj,0.00052690,0.01000,0.781
19,fc1,0.19145459,0.01000,0.782
19,fc2,0.00470920,0.01000,3.507
20,self_attn.k_proj,0.04799912,0.01000,0.791
20,self_attn.v_proj,0.05039908,0.01000,0.762
20,self_attn.q_proj,0.03520311,0.01000,0.781
20,self_attn.out_proj,0.00063094,0.01000,0.774
20,fc1,0.19941745,0.01000,0.783
20,fc2,0.00606712,0.01000,3.514
21,self_attn.k_proj,0.04461705,0.01000,0.797
21,self_attn.v_proj,0.05256410,0.01000,0.784
21,self_attn.q_proj,0.03900132,0.01000,0.821
21,self_attn.out_proj,0.00054641,0.01000,0.773
21,fc1,0.20300829,0.01000,0.783
21,fc2,0.00714681,0.01000,3.591
22,self_attn.k_proj,0.04705104,0.01000,0.829
22,self_attn.v_proj,0.06090737,0.01000,0.750
22,self_attn.q_proj,0.04897617,0.01000,0.805
22,self_attn.out_proj,0.00065823,0.01000,0.755
22,fc1,0.20262627,0.01000,0.766
22,fc2,0.00769133,0.01000,3.481
23,self_attn.k_proj,0.06682779,0.01000,0.775
23,self_attn.v_proj,0.04476626,0.01000,0.787
23,self_attn.q_proj,0.11386553,0.01000,0.775
23,self_attn.out_proj,0.00203764,0.01000,0.774
23,fc1,0.19634233,0.01000,0.810
23,fc2,0.00576396,0.01000,3.536