File size: 8,882 Bytes
fc418c2 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 |
layer,module,loss,damp,time
0,self_attn.k_proj,0.06161176,0.01000,0.932
0,self_attn.v_proj,0.05438014,0.01000,0.723
0,self_attn.q_proj,0.12705065,0.01000,0.915
0,self_attn.o_proj,0.17126846,0.01000,0.846
0,mlp.up_proj,0.80178344,0.01000,1.060
0,mlp.gate_proj,1.22950339,0.01000,1.030
0,mlp.down_proj,0.29198846,0.01000,0.589
1,self_attn.k_proj,0.04196536,0.01000,0.766
1,self_attn.v_proj,0.04195968,0.01000,0.801
1,self_attn.q_proj,0.08776645,0.01000,0.850
1,self_attn.o_proj,0.05204657,0.01000,0.786
1,mlp.up_proj,7.74701595,0.01000,0.884
1,mlp.gate_proj,19.37592506,0.01000,-1.316
1,mlp.down_proj,0.42635429,0.01000,2.649
2,self_attn.k_proj,0.08282123,0.01000,0.777
2,self_attn.v_proj,0.08251686,0.01000,0.780
2,self_attn.q_proj,0.18313025,0.01000,0.831
2,self_attn.o_proj,0.09041101,0.01000,0.758
2,mlp.up_proj,6.97388744,0.01000,0.819
2,mlp.gate_proj,17.37420845,0.01000,0.842
2,mlp.down_proj,555.31311035,0.01000,2.470
3,self_attn.k_proj,0.66062665,0.01000,0.745
3,self_attn.v_proj,0.66629398,0.01000,0.738
3,self_attn.q_proj,1.30134702,0.01000,0.779
3,self_attn.o_proj,0.19163772,0.01000,0.752
3,mlp.up_proj,9.49505615,0.01000,0.824
3,mlp.gate_proj,22.15675545,0.01000,0.830
3,mlp.down_proj,1.11858487,0.01000,2.587
4,self_attn.k_proj,0.60883915,0.01000,0.758
4,self_attn.v_proj,0.65701765,0.01000,0.766
4,self_attn.q_proj,1.25714827,0.01000,0.778
4,self_attn.o_proj,0.33684582,0.01000,0.767
4,mlp.up_proj,10.67844296,0.01000,0.800
4,mlp.gate_proj,22.64768982,0.01000,0.814
4,mlp.down_proj,1.57849216,0.01000,2.662
5,self_attn.k_proj,0.86607969,0.01000,0.761
5,self_attn.v_proj,0.95299339,0.01000,0.767
5,self_attn.q_proj,1.92915726,0.01000,0.806
5,self_attn.o_proj,0.51527029,0.01000,0.788
5,mlp.up_proj,8.11690903,0.01000,0.815
5,mlp.gate_proj,11.88039017,0.01000,0.810
5,mlp.down_proj,2.06314588,0.01000,2.476
6,self_attn.k_proj,0.84522438,0.01000,0.771
6,self_attn.v_proj,0.79271960,0.01000,0.758
6,self_attn.q_proj,1.74664021,0.01000,0.806
6,self_attn.o_proj,0.51649594,0.01000,0.770
6,mlp.up_proj,11.36476040,0.01000,0.821
6,mlp.gate_proj,16.26104736,0.01000,0.898
6,mlp.down_proj,3.12330055,0.01000,2.463
7,self_attn.k_proj,1.74236369,0.01000,0.763
7,self_attn.v_proj,1.94380081,0.01000,0.762
7,self_attn.q_proj,4.01041460,0.01000,0.794
7,self_attn.o_proj,0.80392551,0.01000,0.767
7,mlp.up_proj,15.10862732,0.01000,0.819
7,mlp.gate_proj,22.81257248,0.01000,0.837
7,mlp.down_proj,3.62108111,0.01000,2.464
8,self_attn.k_proj,2.43949366,0.01000,0.745
8,self_attn.v_proj,2.31129289,0.01000,0.943
8,self_attn.q_proj,5.06256580,0.01000,1.057
8,self_attn.o_proj,0.60827088,0.01000,0.802
8,mlp.up_proj,15.40246868,0.01000,0.809
8,mlp.gate_proj,20.87147713,0.01000,0.801
8,mlp.down_proj,4.27449131,0.01000,2.384
9,self_attn.k_proj,4.37583876,0.01000,-0.010
9,self_attn.v_proj,4.23343515,0.01000,0.706
9,self_attn.q_proj,9.79721832,0.01000,0.719
9,self_attn.o_proj,1.85169268,0.01000,0.739
9,mlp.up_proj,16.51148033,0.01000,0.745
9,mlp.gate_proj,20.53764725,0.01000,0.745
9,mlp.down_proj,6.68374157,0.01000,2.179
10,self_attn.k_proj,3.51351452,0.01000,0.692
10,self_attn.v_proj,3.65583849,0.01000,0.691
10,self_attn.q_proj,7.80333757,0.01000,0.702
10,self_attn.o_proj,1.93884957,0.01000,0.745
10,mlp.up_proj,17.16555405,0.01000,0.722
10,mlp.gate_proj,20.50786018,0.01000,0.751
10,mlp.down_proj,9.01197052,0.01000,2.197
11,self_attn.k_proj,6.72875261,0.01000,0.697
11,self_attn.v_proj,5.92448235,0.01000,0.648
11,self_attn.q_proj,15.31981468,0.01000,0.650
11,self_attn.o_proj,4.41754627,0.01000,0.755
11,mlp.up_proj,18.27470398,0.01000,0.786
11,mlp.gate_proj,18.97273636,0.01000,0.760
11,mlp.down_proj,10.93863583,0.01000,2.211
12,self_attn.k_proj,6.80087852,0.01000,0.664
12,self_attn.v_proj,6.75032997,0.01000,0.680
12,self_attn.q_proj,15.24656105,0.01000,0.685
12,self_attn.o_proj,2.62905002,0.01000,0.684
12,mlp.up_proj,18.10563850,0.01000,0.837
12,mlp.gate_proj,17.88245010,0.01000,0.808
12,mlp.down_proj,10.52472878,0.01000,1.750
13,self_attn.k_proj,8.15466690,0.01000,0.707
13,self_attn.v_proj,8.60487556,0.01000,0.702
13,self_attn.q_proj,21.30573654,0.01000,0.736
13,self_attn.o_proj,3.62042069,0.01000,0.731
13,mlp.up_proj,18.99537659,0.01000,0.764
13,mlp.gate_proj,18.67168045,0.01000,0.876
13,mlp.down_proj,13.00555801,0.01000,2.089
14,self_attn.k_proj,13.40824318,0.01000,0.727
14,self_attn.v_proj,13.49943829,0.01000,0.687
14,self_attn.q_proj,32.17544556,0.01000,0.673
14,self_attn.o_proj,4.37822676,0.01000,0.702
14,mlp.up_proj,20.30528450,0.01000,0.753
14,mlp.gate_proj,19.48166656,0.01000,0.776
14,mlp.down_proj,16.70061111,0.01000,2.228
15,self_attn.k_proj,25.33942032,0.01000,0.636
15,self_attn.v_proj,29.75099182,0.01000,0.648
15,self_attn.q_proj,74.12033844,0.01000,0.662
15,self_attn.o_proj,9.15364933,0.01000,0.649
15,mlp.up_proj,23.37993050,0.01000,0.699
15,mlp.gate_proj,21.96615601,0.01000,0.709
15,mlp.down_proj,24.15357208,0.01000,2.310
16,self_attn.k_proj,37.24622726,0.01000,0.711
16,self_attn.v_proj,33.53807831,0.01000,0.698
16,self_attn.q_proj,92.94651794,0.01000,0.715
16,self_attn.o_proj,10.30152321,0.01000,0.665
16,mlp.up_proj,29.35601807,0.01000,0.695
16,mlp.gate_proj,25.80093002,0.01000,0.200
16,mlp.down_proj,60.27460098,0.01000,2.165
17,self_attn.k_proj,95.47402954,0.01000,0.684
17,self_attn.v_proj,105.25405884,0.01000,0.674
17,self_attn.q_proj,253.24885559,0.01000,0.657
17,self_attn.o_proj,28.11261368,0.01000,0.670
17,mlp.up_proj,42.57036591,0.01000,0.704
17,mlp.gate_proj,36.58126831,0.01000,0.717
17,mlp.down_proj,81.79136658,0.01000,2.167
18,self_attn.k_proj,102.99479675,0.01000,0.644
18,self_attn.v_proj,101.50364685,0.01000,0.670
18,self_attn.q_proj,275.00637817,0.01000,0.704
18,self_attn.o_proj,21.60307312,0.01000,0.651
18,mlp.up_proj,54.27608109,0.01000,0.661
18,mlp.gate_proj,46.83805847,0.01000,0.716
18,mlp.down_proj,132.89431763,0.01000,2.199
19,self_attn.k_proj,178.74481201,0.01000,0.711
19,self_attn.v_proj,189.77200317,0.01000,0.786
19,self_attn.q_proj,486.16369629,0.01000,0.783
19,self_attn.o_proj,41.97334290,0.01000,0.726
19,mlp.up_proj,73.76881409,0.01000,0.756
19,mlp.gate_proj,62.54061508,0.01000,0.787
19,mlp.down_proj,308.76110840,0.01000,2.161
20,self_attn.k_proj,298.62933350,0.01000,0.629
20,self_attn.v_proj,316.93182373,0.01000,0.640
20,self_attn.q_proj,764.87170410,0.01000,0.705
20,self_attn.o_proj,67.96992493,0.01000,0.644
20,mlp.up_proj,94.94843292,0.01000,0.728
20,mlp.gate_proj,82.94094849,0.01000,0.693
20,mlp.down_proj,463.50665283,0.01000,2.142
21,self_attn.k_proj,478.08056641,0.01000,0.662
21,self_attn.v_proj,546.54919434,0.01000,0.660
21,self_attn.q_proj,1147.31347656,0.01000,0.683
21,self_attn.o_proj,118.71049500,0.01000,0.655
21,mlp.up_proj,120.02677917,0.01000,0.708
21,mlp.gate_proj,103.04946899,0.01000,0.708
21,mlp.down_proj,659.67437744,0.01000,2.128
22,self_attn.k_proj,593.22070312,0.01000,0.665
22,self_attn.v_proj,763.92529297,0.01000,0.669
22,self_attn.q_proj,1391.22949219,0.01000,0.679
22,self_attn.o_proj,101.20243835,0.01000,0.657
22,mlp.up_proj,135.26795959,0.01000,0.796
22,mlp.gate_proj,118.14506531,0.01000,0.779
22,mlp.down_proj,766.93237305,0.01000,2.130
23,self_attn.k_proj,817.42401123,0.01000,0.667
23,self_attn.v_proj,912.42480469,0.01000,0.663
23,self_attn.q_proj,1677.90209961,0.01000,0.679
23,self_attn.o_proj,115.38923645,0.01000,0.684
23,mlp.up_proj,160.92965698,0.01000,0.767
23,mlp.gate_proj,142.50930786,0.01000,0.720
23,mlp.down_proj,837.10455322,0.01000,2.173
24,self_attn.k_proj,1420.40991211,0.01000,0.793
24,self_attn.v_proj,1595.83715820,0.01000,0.683
24,self_attn.q_proj,3344.17285156,0.01000,0.736
24,self_attn.o_proj,152.69662476,0.01000,0.738
24,mlp.up_proj,158.49810791,0.01000,0.714
24,mlp.gate_proj,136.60337830,0.01000,0.771
24,mlp.down_proj,973.98236084,0.01000,2.152
25,self_attn.k_proj,1685.52282715,0.01000,0.890
25,self_attn.v_proj,2474.76318359,0.01000,0.920
25,self_attn.q_proj,3874.19628906,0.01000,0.971
25,self_attn.o_proj,197.16078186,0.01000,0.679
25,mlp.up_proj,151.62023926,0.01000,0.738
25,mlp.gate_proj,128.06694031,0.01000,0.745
25,mlp.down_proj,1148.98022461,0.01000,2.151
26,self_attn.k_proj,1625.11279297,0.01000,0.675
26,self_attn.v_proj,2256.05908203,0.01000,0.691
26,self_attn.q_proj,3975.20971680,0.01000,0.716
26,self_attn.o_proj,443.28439331,0.01000,0.676
26,mlp.up_proj,148.50442505,0.01000,0.720
26,mlp.gate_proj,127.99733734,0.01000,0.741
26,mlp.down_proj,1423.76660156,0.01000,2.141
27,self_attn.k_proj,793.07702637,0.01000,0.666
27,self_attn.v_proj,898.25610352,0.01000,0.678
27,self_attn.q_proj,1676.92187500,0.01000,0.674
27,self_attn.o_proj,251.81840515,0.01000,0.676
27,mlp.up_proj,196.21633911,0.01000,0.717
27,mlp.gate_proj,199.20074463,0.01000,0.710
27,mlp.down_proj,2001.17333984,0.01000,2.171
|