File size: 8,882 Bytes
fc418c2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.06161176,0.01000,0.932
0,self_attn.v_proj,0.05438014,0.01000,0.723
0,self_attn.q_proj,0.12705065,0.01000,0.915
0,self_attn.o_proj,0.17126846,0.01000,0.846
0,mlp.up_proj,0.80178344,0.01000,1.060
0,mlp.gate_proj,1.22950339,0.01000,1.030
0,mlp.down_proj,0.29198846,0.01000,0.589
1,self_attn.k_proj,0.04196536,0.01000,0.766
1,self_attn.v_proj,0.04195968,0.01000,0.801
1,self_attn.q_proj,0.08776645,0.01000,0.850
1,self_attn.o_proj,0.05204657,0.01000,0.786
1,mlp.up_proj,7.74701595,0.01000,0.884
1,mlp.gate_proj,19.37592506,0.01000,-1.316
1,mlp.down_proj,0.42635429,0.01000,2.649
2,self_attn.k_proj,0.08282123,0.01000,0.777
2,self_attn.v_proj,0.08251686,0.01000,0.780
2,self_attn.q_proj,0.18313025,0.01000,0.831
2,self_attn.o_proj,0.09041101,0.01000,0.758
2,mlp.up_proj,6.97388744,0.01000,0.819
2,mlp.gate_proj,17.37420845,0.01000,0.842
2,mlp.down_proj,555.31311035,0.01000,2.470
3,self_attn.k_proj,0.66062665,0.01000,0.745
3,self_attn.v_proj,0.66629398,0.01000,0.738
3,self_attn.q_proj,1.30134702,0.01000,0.779
3,self_attn.o_proj,0.19163772,0.01000,0.752
3,mlp.up_proj,9.49505615,0.01000,0.824
3,mlp.gate_proj,22.15675545,0.01000,0.830
3,mlp.down_proj,1.11858487,0.01000,2.587
4,self_attn.k_proj,0.60883915,0.01000,0.758
4,self_attn.v_proj,0.65701765,0.01000,0.766
4,self_attn.q_proj,1.25714827,0.01000,0.778
4,self_attn.o_proj,0.33684582,0.01000,0.767
4,mlp.up_proj,10.67844296,0.01000,0.800
4,mlp.gate_proj,22.64768982,0.01000,0.814
4,mlp.down_proj,1.57849216,0.01000,2.662
5,self_attn.k_proj,0.86607969,0.01000,0.761
5,self_attn.v_proj,0.95299339,0.01000,0.767
5,self_attn.q_proj,1.92915726,0.01000,0.806
5,self_attn.o_proj,0.51527029,0.01000,0.788
5,mlp.up_proj,8.11690903,0.01000,0.815
5,mlp.gate_proj,11.88039017,0.01000,0.810
5,mlp.down_proj,2.06314588,0.01000,2.476
6,self_attn.k_proj,0.84522438,0.01000,0.771
6,self_attn.v_proj,0.79271960,0.01000,0.758
6,self_attn.q_proj,1.74664021,0.01000,0.806
6,self_attn.o_proj,0.51649594,0.01000,0.770
6,mlp.up_proj,11.36476040,0.01000,0.821
6,mlp.gate_proj,16.26104736,0.01000,0.898
6,mlp.down_proj,3.12330055,0.01000,2.463
7,self_attn.k_proj,1.74236369,0.01000,0.763
7,self_attn.v_proj,1.94380081,0.01000,0.762
7,self_attn.q_proj,4.01041460,0.01000,0.794
7,self_attn.o_proj,0.80392551,0.01000,0.767
7,mlp.up_proj,15.10862732,0.01000,0.819
7,mlp.gate_proj,22.81257248,0.01000,0.837
7,mlp.down_proj,3.62108111,0.01000,2.464
8,self_attn.k_proj,2.43949366,0.01000,0.745
8,self_attn.v_proj,2.31129289,0.01000,0.943
8,self_attn.q_proj,5.06256580,0.01000,1.057
8,self_attn.o_proj,0.60827088,0.01000,0.802
8,mlp.up_proj,15.40246868,0.01000,0.809
8,mlp.gate_proj,20.87147713,0.01000,0.801
8,mlp.down_proj,4.27449131,0.01000,2.384
9,self_attn.k_proj,4.37583876,0.01000,-0.010
9,self_attn.v_proj,4.23343515,0.01000,0.706
9,self_attn.q_proj,9.79721832,0.01000,0.719
9,self_attn.o_proj,1.85169268,0.01000,0.739
9,mlp.up_proj,16.51148033,0.01000,0.745
9,mlp.gate_proj,20.53764725,0.01000,0.745
9,mlp.down_proj,6.68374157,0.01000,2.179
10,self_attn.k_proj,3.51351452,0.01000,0.692
10,self_attn.v_proj,3.65583849,0.01000,0.691
10,self_attn.q_proj,7.80333757,0.01000,0.702
10,self_attn.o_proj,1.93884957,0.01000,0.745
10,mlp.up_proj,17.16555405,0.01000,0.722
10,mlp.gate_proj,20.50786018,0.01000,0.751
10,mlp.down_proj,9.01197052,0.01000,2.197
11,self_attn.k_proj,6.72875261,0.01000,0.697
11,self_attn.v_proj,5.92448235,0.01000,0.648
11,self_attn.q_proj,15.31981468,0.01000,0.650
11,self_attn.o_proj,4.41754627,0.01000,0.755
11,mlp.up_proj,18.27470398,0.01000,0.786
11,mlp.gate_proj,18.97273636,0.01000,0.760
11,mlp.down_proj,10.93863583,0.01000,2.211
12,self_attn.k_proj,6.80087852,0.01000,0.664
12,self_attn.v_proj,6.75032997,0.01000,0.680
12,self_attn.q_proj,15.24656105,0.01000,0.685
12,self_attn.o_proj,2.62905002,0.01000,0.684
12,mlp.up_proj,18.10563850,0.01000,0.837
12,mlp.gate_proj,17.88245010,0.01000,0.808
12,mlp.down_proj,10.52472878,0.01000,1.750
13,self_attn.k_proj,8.15466690,0.01000,0.707
13,self_attn.v_proj,8.60487556,0.01000,0.702
13,self_attn.q_proj,21.30573654,0.01000,0.736
13,self_attn.o_proj,3.62042069,0.01000,0.731
13,mlp.up_proj,18.99537659,0.01000,0.764
13,mlp.gate_proj,18.67168045,0.01000,0.876
13,mlp.down_proj,13.00555801,0.01000,2.089
14,self_attn.k_proj,13.40824318,0.01000,0.727
14,self_attn.v_proj,13.49943829,0.01000,0.687
14,self_attn.q_proj,32.17544556,0.01000,0.673
14,self_attn.o_proj,4.37822676,0.01000,0.702
14,mlp.up_proj,20.30528450,0.01000,0.753
14,mlp.gate_proj,19.48166656,0.01000,0.776
14,mlp.down_proj,16.70061111,0.01000,2.228
15,self_attn.k_proj,25.33942032,0.01000,0.636
15,self_attn.v_proj,29.75099182,0.01000,0.648
15,self_attn.q_proj,74.12033844,0.01000,0.662
15,self_attn.o_proj,9.15364933,0.01000,0.649
15,mlp.up_proj,23.37993050,0.01000,0.699
15,mlp.gate_proj,21.96615601,0.01000,0.709
15,mlp.down_proj,24.15357208,0.01000,2.310
16,self_attn.k_proj,37.24622726,0.01000,0.711
16,self_attn.v_proj,33.53807831,0.01000,0.698
16,self_attn.q_proj,92.94651794,0.01000,0.715
16,self_attn.o_proj,10.30152321,0.01000,0.665
16,mlp.up_proj,29.35601807,0.01000,0.695
16,mlp.gate_proj,25.80093002,0.01000,0.200
16,mlp.down_proj,60.27460098,0.01000,2.165
17,self_attn.k_proj,95.47402954,0.01000,0.684
17,self_attn.v_proj,105.25405884,0.01000,0.674
17,self_attn.q_proj,253.24885559,0.01000,0.657
17,self_attn.o_proj,28.11261368,0.01000,0.670
17,mlp.up_proj,42.57036591,0.01000,0.704
17,mlp.gate_proj,36.58126831,0.01000,0.717
17,mlp.down_proj,81.79136658,0.01000,2.167
18,self_attn.k_proj,102.99479675,0.01000,0.644
18,self_attn.v_proj,101.50364685,0.01000,0.670
18,self_attn.q_proj,275.00637817,0.01000,0.704
18,self_attn.o_proj,21.60307312,0.01000,0.651
18,mlp.up_proj,54.27608109,0.01000,0.661
18,mlp.gate_proj,46.83805847,0.01000,0.716
18,mlp.down_proj,132.89431763,0.01000,2.199
19,self_attn.k_proj,178.74481201,0.01000,0.711
19,self_attn.v_proj,189.77200317,0.01000,0.786
19,self_attn.q_proj,486.16369629,0.01000,0.783
19,self_attn.o_proj,41.97334290,0.01000,0.726
19,mlp.up_proj,73.76881409,0.01000,0.756
19,mlp.gate_proj,62.54061508,0.01000,0.787
19,mlp.down_proj,308.76110840,0.01000,2.161
20,self_attn.k_proj,298.62933350,0.01000,0.629
20,self_attn.v_proj,316.93182373,0.01000,0.640
20,self_attn.q_proj,764.87170410,0.01000,0.705
20,self_attn.o_proj,67.96992493,0.01000,0.644
20,mlp.up_proj,94.94843292,0.01000,0.728
20,mlp.gate_proj,82.94094849,0.01000,0.693
20,mlp.down_proj,463.50665283,0.01000,2.142
21,self_attn.k_proj,478.08056641,0.01000,0.662
21,self_attn.v_proj,546.54919434,0.01000,0.660
21,self_attn.q_proj,1147.31347656,0.01000,0.683
21,self_attn.o_proj,118.71049500,0.01000,0.655
21,mlp.up_proj,120.02677917,0.01000,0.708
21,mlp.gate_proj,103.04946899,0.01000,0.708
21,mlp.down_proj,659.67437744,0.01000,2.128
22,self_attn.k_proj,593.22070312,0.01000,0.665
22,self_attn.v_proj,763.92529297,0.01000,0.669
22,self_attn.q_proj,1391.22949219,0.01000,0.679
22,self_attn.o_proj,101.20243835,0.01000,0.657
22,mlp.up_proj,135.26795959,0.01000,0.796
22,mlp.gate_proj,118.14506531,0.01000,0.779
22,mlp.down_proj,766.93237305,0.01000,2.130
23,self_attn.k_proj,817.42401123,0.01000,0.667
23,self_attn.v_proj,912.42480469,0.01000,0.663
23,self_attn.q_proj,1677.90209961,0.01000,0.679
23,self_attn.o_proj,115.38923645,0.01000,0.684
23,mlp.up_proj,160.92965698,0.01000,0.767
23,mlp.gate_proj,142.50930786,0.01000,0.720
23,mlp.down_proj,837.10455322,0.01000,2.173
24,self_attn.k_proj,1420.40991211,0.01000,0.793
24,self_attn.v_proj,1595.83715820,0.01000,0.683
24,self_attn.q_proj,3344.17285156,0.01000,0.736
24,self_attn.o_proj,152.69662476,0.01000,0.738
24,mlp.up_proj,158.49810791,0.01000,0.714
24,mlp.gate_proj,136.60337830,0.01000,0.771
24,mlp.down_proj,973.98236084,0.01000,2.152
25,self_attn.k_proj,1685.52282715,0.01000,0.890
25,self_attn.v_proj,2474.76318359,0.01000,0.920
25,self_attn.q_proj,3874.19628906,0.01000,0.971
25,self_attn.o_proj,197.16078186,0.01000,0.679
25,mlp.up_proj,151.62023926,0.01000,0.738
25,mlp.gate_proj,128.06694031,0.01000,0.745
25,mlp.down_proj,1148.98022461,0.01000,2.151
26,self_attn.k_proj,1625.11279297,0.01000,0.675
26,self_attn.v_proj,2256.05908203,0.01000,0.691
26,self_attn.q_proj,3975.20971680,0.01000,0.716
26,self_attn.o_proj,443.28439331,0.01000,0.676
26,mlp.up_proj,148.50442505,0.01000,0.720
26,mlp.gate_proj,127.99733734,0.01000,0.741
26,mlp.down_proj,1423.76660156,0.01000,2.141
27,self_attn.k_proj,793.07702637,0.01000,0.666
27,self_attn.v_proj,898.25610352,0.01000,0.678
27,self_attn.q_proj,1676.92187500,0.01000,0.674
27,self_attn.o_proj,251.81840515,0.01000,0.676
27,mlp.up_proj,196.21633911,0.01000,0.717
27,mlp.gate_proj,199.20074463,0.01000,0.710
27,mlp.down_proj,2001.17333984,0.01000,2.171