Find this model in the GPT-NeoX model summary
Model source: https://huggingface.co/EleutherAI/gpt-neox-20b
layer_id | layer_type | N | M | Q | alpha | D | alpha-hat | log_SN | rank_loss |
---|---|---|---|---|---|---|---|---|---|
4 | DENSE | 18432 | 6144 | 3.00 | 3.87 | 0.02 | 10.58 | 2.74 | 0 |
5 | DENSE | 6144 | 6144 | 1.00 | 3.43 | 0.02 | 7.81 | 2.28 | 6 |
7 | DENSE | 24576 | 6144 | 4.00 | 5.63 | 0.04 | 15.23 | 2.70 | 0 |
8 | DENSE | 24576 | 6144 | 4.00 | 7.67 | 0.06 | 21.22 | 2.77 | 0 |
11 | DENSE | 18432 | 6144 | 3.00 | 2.97 | 0.01 | 8.34 | 2.81 | 0 |
12 | DENSE | 6144 | 6144 | 1.00 | 3.73 | 0.04 | 6.65 | 1.78 | 4 |
14 | DENSE | 24576 | 6144 | 4.00 | 2.24 | 0.03 | 7.23 | 3.22 | 0 |
15 | DENSE | 24576 | 6144 | 4.00 | 6.08 | 0.04 | 16.74 | 2.75 | 0 |
18 | DENSE | 18432 | 6144 | 3.00 | 2.84 | 0.02 | 7.95 | 2.80 | 0 |
19 | DENSE | 6144 | 6144 | 1.00 | 3.45 | 0.04 | 6.42 | 1.86 | 4 |
21 | DENSE | 24576 | 6144 | 4.00 | 2.42 | 0.01 | 7.00 | 2.89 | 0 |
22 | DENSE | 24576 | 6144 | 4.00 | 3.54 | 0.02 | 8.74 | 2.47 | 0 |
25 | DENSE | 18432 | 6144 | 3.00 | 3.41 | 0.03 | 9.69 | 2.84 | 0 |
26 | DENSE | 6144 | 6144 | 1.00 | 3.28 | 0.03 | 5.90 | 1.80 | 4 |
28 | DENSE | 24576 | 6144 | 4.00 | 2.61 | 0.01 | 7.57 | 2.90 | 0 |
29 | DENSE | 24576 | 6144 | 4.00 | 3.73 | 0.01 | 9.44 | 2.53 | 0 |
32 | DENSE | 18432 | 6144 | 3.00 | 3.37 | 0.02 | 8.86 | 2.63 | 0 |
33 | DENSE | 6144 | 6144 | 1.00 | 3.28 | 0.02 | 6.20 | 1.89 | 4 |
35 | DENSE | 24576 | 6144 | 4.00 | 2.68 | 0.02 | 7.81 | 2.92 | 0 |
36 | DENSE | 24576 | 6144 | 4.00 | 3.70 | 0.02 | 9.13 | 2.47 | 0 |
39 | DENSE | 18432 | 6144 | 3.00 | 3.45 | 0.02 | 8.75 | 2.54 | 0 |
40 | DENSE | 6144 | 6144 | 1.00 | 3.48 | 0.03 | 6.64 | 1.91 | 4 |
42 | DENSE | 24576 | 6144 | 4.00 | 2.80 | 0.01 | 8.07 | 2.88 | 0 |
43 | DENSE | 24576 | 6144 | 4.00 | 3.20 | 0.01 | 8.10 | 2.53 | 0 |
46 | DENSE | 18432 | 6144 | 3.00 | 3.13 | 0.02 | 7.78 | 2.49 | 0 |
47 | DENSE | 6144 | 6144 | 1.00 | 5.25 | 0.04 | 9.80 | 1.87 | 4 |
49 | DENSE | 24576 | 6144 | 4.00 | 2.83 | 0.01 | 8.21 | 2.90 | 0 |
50 | DENSE | 24576 | 6144 | 4.00 | 3.13 | 0.01 | 8.15 | 2.60 | 0 |
53 | DENSE | 18432 | 6144 | 3.00 | 3.02 | 0.02 | 7.35 | 2.43 | 0 |
54 | DENSE | 6144 | 6144 | 1.00 | 5.97 | 0.04 | 10.98 | 1.84 | 5 |
56 | DENSE | 24576 | 6144 | 4.00 | 2.80 | 0.01 | 9.87 | 3.52 | 0 |
57 | DENSE | 24576 | 6144 | 4.00 | 3.17 | 0.01 | 9.15 | 2.89 | 0 |
60 | DENSE | 18432 | 6144 | 3.00 | 3.58 | 0.03 | 9.29 | 2.59 | 0 |
61 | DENSE | 6144 | 6144 | 1.00 | 5.53 | 0.04 | 10.29 | 1.86 | 4 |
63 | DENSE | 24576 | 6144 | 4.00 | 2.80 | 0.01 | 7.92 | 2.83 | 0 |
64 | DENSE | 24576 | 6144 | 4.00 | 3.05 | 0.01 | 7.95 | 2.60 | 0 |
67 | DENSE | 18432 | 6144 | 3.00 | 3.10 | 0.02 | 9.01 | 2.90 | 0 |
68 | DENSE | 6144 | 6144 | 1.00 | 6.33 | 0.05 | 11.51 | 1.82 | 5 |
70 | DENSE | 24576 | 6144 | 4.00 | 2.81 | 0.02 | 8.05 | 2.87 | 0 |
71 | DENSE | 24576 | 6144 | 4.00 | 2.84 | 0.01 | 7.40 | 2.61 | 0 |
74 | DENSE | 18432 | 6144 | 3.00 | 2.59 | 0.01 | 8.35 | 3.22 | 0 |
75 | DENSE | 6144 | 6144 | 1.00 | 7.30 | 0.05 | 12.60 | 1.72 | 4 |
77 | DENSE | 24576 | 6144 | 4.00 | 2.74 | 0.02 | 7.80 | 2.84 | 0 |
78 | DENSE | 24576 | 6144 | 4.00 | 2.93 | 0.02 | 7.45 | 2.54 | 0 |
81 | DENSE | 18432 | 6144 | 3.00 | 2.34 | 0.01 | 8.15 | 3.47 | 0 |
82 | DENSE | 6144 | 6144 | 1.00 | 6.38 | 0.05 | 9.92 | 1.55 | 4 |
84 | DENSE | 24576 | 6144 | 4.00 | 2.69 | 0.02 | 7.89 | 2.93 | 0 |
85 | DENSE | 24576 | 6144 | 4.00 | 2.75 | 0.01 | 6.72 | 2.44 | 0 |
88 | DENSE | 18432 | 6144 | 3.00 | 2.32 | 0.01 | 8.14 | 3.51 | 0 |
89 | DENSE | 6144 | 6144 | 1.00 | 2.95 | 0.05 | 4.72 | 1.60 | 5 |
91 | DENSE | 24576 | 6144 | 4.00 | 2.69 | 0.02 | 7.87 | 2.92 | 0 |
92 | DENSE | 24576 | 6144 | 4.00 | 2.89 | 0.02 | 6.93 | 2.39 | 0 |
95 | DENSE | 18432 | 6144 | 3.00 | 2.37 | 0.01 | 8.31 | 3.51 | 0 |
96 | DENSE | 6144 | 6144 | 1.00 | 4.16 | 0.06 | 6.34 | 1.52 | 4 |
98 | DENSE | 24576 | 6144 | 4.00 | 2.61 | 0.03 | 7.61 | 2.91 | 0 |
99 | DENSE | 24576 | 6144 | 4.00 | 2.88 | 0.01 | 6.97 | 2.42 | 0 |
102 | DENSE | 18432 | 6144 | 3.00 | 2.33 | 0.02 | 8.21 | 3.53 | 0 |
103 | DENSE | 6144 | 6144 | 1.00 | 9.66 | 0.05 | 14.99 | 1.55 | 3 |
105 | DENSE | 24576 | 6144 | 4.00 | 2.61 | 0.03 | 7.64 | 2.92 | 0 |
106 | DENSE | 24576 | 6144 | 4.00 | 2.89 | 0.01 | 6.96 | 2.41 | 0 |
109 | DENSE | 18432 | 6144 | 3.00 | 2.27 | 0.02 | 8.10 | 3.57 | 0 |
110 | DENSE | 6144 | 6144 | 1.00 | 10.03 | 0.06 | 14.98 | 1.49 | 4 |
112 | DENSE | 24576 | 6144 | 4.00 | 2.60 | 0.03 | 7.57 | 2.91 | 0 |
113 | DENSE | 24576 | 6144 | 4.00 | 2.92 | 0.01 | 7.12 | 2.44 | 0 |
116 | DENSE | 18432 | 6144 | 3.00 | 2.27 | 0.02 | 8.09 | 3.57 | 0 |
117 | DENSE | 6144 | 6144 | 1.00 | 3.37 | 0.06 | 5.04 | 1.50 | 4 |
119 | DENSE | 24576 | 6144 | 4.00 | 2.59 | 0.03 | 7.67 | 2.96 | 0 |
120 | DENSE | 24576 | 6144 | 4.00 | 2.96 | 0.01 | 7.20 | 2.43 | 0 |
123 | DENSE | 18432 | 6144 | 3.00 | 2.29 | 0.02 | 8.16 | 3.57 | 0 |
124 | DENSE | 6144 | 6144 | 1.00 | 8.00 | 0.05 | 12.05 | 1.51 | 3 |
126 | DENSE | 24576 | 6144 | 4.00 | 2.59 | 0.03 | 7.69 | 2.96 | 0 |
127 | DENSE | 24576 | 6144 | 4.00 | 2.91 | 0.01 | 7.09 | 2.44 | 0 |
130 | DENSE | 18432 | 6144 | 3.00 | 2.28 | 0.02 | 8.19 | 3.59 | 0 |
131 | DENSE | 6144 | 6144 | 1.00 | 5.25 | 0.06 | 7.66 | 1.46 | 4 |
133 | DENSE | 24576 | 6144 | 4.00 | 2.65 | 0.03 | 7.82 | 2.96 | 0 |
134 | DENSE | 24576 | 6144 | 4.00 | 2.98 | 0.01 | 7.09 | 2.38 | 0 |
137 | DENSE | 18432 | 6144 | 3.00 | 2.29 | 0.02 | 8.28 | 3.61 | 0 |
138 | DENSE | 6144 | 6144 | 1.00 | 7.14 | 0.06 | 9.93 | 1.39 | 2 |
140 | DENSE | 24576 | 6144 | 4.00 | 2.66 | 0.03 | 7.86 | 2.95 | 0 |
141 | DENSE | 24576 | 6144 | 4.00 | 3.04 | 0.01 | 7.32 | 2.41 | 0 |
144 | DENSE | 18432 | 6144 | 3.00 | 2.29 | 0.02 | 8.33 | 3.64 | 0 |
145 | DENSE | 6144 | 6144 | 1.00 | 6.50 | 0.03 | 10.09 | 1.55 | 3 |
147 | DENSE | 24576 | 6144 | 4.00 | 2.69 | 0.03 | 7.97 | 2.97 | 0 |
148 | DENSE | 24576 | 6144 | 4.00 | 3.13 | 0.01 | 8.22 | 2.63 | 0 |
151 | DENSE | 18432 | 6144 | 3.00 | 2.29 | 0.02 | 8.30 | 3.62 | 0 |
152 | DENSE | 6144 | 6144 | 1.00 | 6.10 | 0.03 | 11.08 | 1.82 | 3 |
154 | DENSE | 24576 | 6144 | 4.00 | 2.69 | 0.03 | 7.90 | 2.94 | 0 |
155 | DENSE | 24576 | 6144 | 4.00 | 3.32 | 0.01 | 8.95 | 2.69 | 0 |
158 | DENSE | 18432 | 6144 | 3.00 | 2.26 | 0.02 | 8.16 | 3.60 | 0 |
159 | DENSE | 6144 | 6144 | 1.00 | 7.68 | 0.05 | 12.26 | 1.60 | 4 |
161 | DENSE | 24576 | 6144 | 4.00 | 2.72 | 0.03 | 8.05 | 2.96 | 0 |
162 | DENSE | 24576 | 6144 | 4.00 | 3.30 | 0.01 | 8.79 | 2.66 | 0 |
165 | DENSE | 18432 | 6144 | 3.00 | 2.29 | 0.02 | 8.33 | 3.64 | 0 |
166 | DENSE | 6144 | 6144 | 1.00 | 6.96 | 0.05 | 11.85 | 1.70 | 4 |
168 | DENSE | 24576 | 6144 | 4.00 | 2.74 | 0.03 | 8.06 | 2.94 | 0 |
169 | DENSE | 24576 | 6144 | 4.00 | 3.41 | 0.01 | 9.24 | 2.71 | 0 |
172 | DENSE | 18432 | 6144 | 3.00 | 2.21 | 0.03 | 8.02 | 3.62 | 0 |
173 | DENSE | 6144 | 6144 | 1.00 | 7.10 | 0.03 | 11.62 | 1.64 | 4 |
175 | DENSE | 24576 | 6144 | 4.00 | 2.77 | 0.03 | 8.18 | 2.95 | 0 |
176 | DENSE | 24576 | 6144 | 4.00 | 3.50 | 0.01 | 9.44 | 2.69 | 0 |
179 | DENSE | 18432 | 6144 | 3.00 | 2.24 | 0.02 | 8.06 | 3.60 | 0 |
180 | DENSE | 6144 | 6144 | 1.00 | 6.39 | 0.04 | 11.94 | 1.87 | 3 |
182 | DENSE | 24576 | 6144 | 4.00 | 2.78 | 0.02 | 8.19 | 2.94 | 0 |
183 | DENSE | 24576 | 6144 | 4.00 | 3.88 | 0.01 | 10.76 | 2.77 | 0 |
186 | DENSE | 18432 | 6144 | 3.00 | 2.27 | 0.02 | 8.09 | 3.56 | 0 |
187 | DENSE | 6144 | 6144 | 1.00 | 6.42 | 0.04 | 12.09 | 1.88 | 4 |
189 | DENSE | 24576 | 6144 | 4.00 | 2.83 | 0.02 | 8.31 | 2.94 | 0 |
190 | DENSE | 24576 | 6144 | 4.00 | 4.06 | 0.02 | 10.85 | 2.67 | 0 |
193 | DENSE | 18432 | 6144 | 3.00 | 2.24 | 0.02 | 8.01 | 3.57 | 0 |
194 | DENSE | 6144 | 6144 | 1.00 | 6.67 | 0.03 | 11.97 | 1.79 | 4 |
196 | DENSE | 24576 | 6144 | 4.00 | 2.85 | 0.03 | 8.35 | 2.93 | 0 |
197 | DENSE | 24576 | 6144 | 4.00 | 4.16 | 0.01 | 10.75 | 2.58 | 0 |
200 | DENSE | 18432 | 6144 | 3.00 | 2.29 | 0.03 | 8.17 | 3.57 | 0 |
201 | DENSE | 6144 | 6144 | 1.00 | 7.01 | 0.05 | 12.37 | 1.76 | 4 |
203 | DENSE | 24576 | 6144 | 4.00 | 2.87 | 0.03 | 8.43 | 2.93 | 0 |
204 | DENSE | 24576 | 6144 | 4.00 | 4.31 | 0.01 | 10.72 | 2.49 | 0 |
207 | DENSE | 18432 | 6144 | 3.00 | 2.33 | 0.02 | 8.36 | 3.59 | 0 |
208 | DENSE | 6144 | 6144 | 1.00 | 5.89 | 0.03 | 9.56 | 1.62 | 3 |
210 | DENSE | 24576 | 6144 | 4.00 | 2.92 | 0.03 | 8.55 | 2.93 | 0 |
211 | DENSE | 24576 | 6144 | 4.00 | 4.63 | 0.01 | 10.85 | 2.34 | 0 |
214 | DENSE | 18432 | 6144 | 3.00 | 2.30 | 0.02 | 8.32 | 3.61 | 0 |
215 | DENSE | 6144 | 6144 | 1.00 | 6.29 | 0.02 | 9.66 | 1.53 | 3 |
217 | DENSE | 24576 | 6144 | 4.00 | 2.97 | 0.03 | 8.63 | 2.91 | 0 |
218 | DENSE | 24576 | 6144 | 4.00 | 4.96 | 0.01 | 11.06 | 2.23 | 0 |
221 | DENSE | 18432 | 6144 | 3.00 | 2.31 | 0.02 | 8.32 | 3.61 | 0 |
222 | DENSE | 6144 | 6144 | 1.00 | 5.83 | 0.03 | 8.78 | 1.51 | 4 |
224 | DENSE | 24576 | 6144 | 4.00 | 3.00 | 0.03 | 8.71 | 2.91 | 0 |
225 | DENSE | 24576 | 6144 | 4.00 | 5.23 | 0.01 | 11.52 | 2.20 | 0 |
228 | DENSE | 18432 | 6144 | 3.00 | 2.38 | 0.03 | 8.62 | 3.61 | 0 |
229 | DENSE | 6144 | 6144 | 1.00 | 6.59 | 0.01 | 9.19 | 1.39 | 5 |
231 | DENSE | 24576 | 6144 | 4.00 | 3.09 | 0.03 | 8.97 | 2.90 | 0 |
232 | DENSE | 24576 | 6144 | 4.00 | 4.83 | 0.01 | 10.58 | 2.19 | 0 |
235 | DENSE | 18432 | 6144 | 3.00 | 2.39 | 0.03 | 8.64 | 3.61 | 0 |
236 | DENSE | 6144 | 6144 | 1.00 | 9.69 | 0.05 | 13.52 | 1.40 | 4 |
238 | DENSE | 24576 | 6144 | 4.00 | 3.16 | 0.03 | 9.15 | 2.90 | 0 |
239 | DENSE | 24576 | 6144 | 4.00 | 4.95 | 0.01 | 10.72 | 2.17 | 0 |
242 | DENSE | 18432 | 6144 | 3.00 | 2.40 | 0.03 | 8.63 | 3.60 | 0 |
243 | DENSE | 6144 | 6144 | 1.00 | 5.77 | 0.02 | 8.43 | 1.46 | 4 |
245 | DENSE | 24576 | 6144 | 4.00 | 3.22 | 0.03 | 9.32 | 2.90 | 0 |
246 | DENSE | 24576 | 6144 | 4.00 | 4.99 | 0.01 | 10.89 | 2.18 | 0 |
249 | DENSE | 18432 | 6144 | 3.00 | 2.44 | 0.03 | 8.77 | 3.60 | 0 |
250 | DENSE | 6144 | 6144 | 1.00 | 5.77 | 0.02 | 9.92 | 1.72 | 4 |
252 | DENSE | 24576 | 6144 | 4.00 | 3.25 | 0.04 | 9.34 | 2.88 | 0 |
253 | DENSE | 24576 | 6144 | 4.00 | 5.00 | 0.01 | 10.81 | 2.16 | 0 |
256 | DENSE | 18432 | 6144 | 3.00 | 2.50 | 0.03 | 8.95 | 3.57 | 0 |
257 | DENSE | 6144 | 6144 | 1.00 | 6.31 | 0.02 | 11.05 | 1.75 | 2 |
259 | DENSE | 24576 | 6144 | 4.00 | 3.31 | 0.04 | 9.50 | 2.87 | 0 |
260 | DENSE | 24576 | 6144 | 4.00 | 5.05 | 0.02 | 10.70 | 2.12 | 0 |
263 | DENSE | 18432 | 6144 | 3.00 | 2.48 | 0.03 | 8.79 | 3.54 | 0 |
264 | DENSE | 6144 | 6144 | 1.00 | 6.37 | 0.03 | 9.76 | 1.53 | 5 |
266 | DENSE | 24576 | 6144 | 4.00 | 4.89 | 0.04 | 13.96 | 2.86 | 0 |
267 | DENSE | 24576 | 6144 | 4.00 | 5.09 | 0.02 | 10.77 | 2.12 | 0 |
270 | DENSE | 18432 | 6144 | 3.00 | 2.11 | 0.03 | 7.49 | 3.55 | 0 |
271 | DENSE | 6144 | 6144 | 1.00 | 7.91 | 0.04 | 12.76 | 1.61 | 4 |
273 | DENSE | 24576 | 6144 | 4.00 | 4.88 | 0.03 | 13.82 | 2.83 | 0 |
274 | DENSE | 24576 | 6144 | 4.00 | 5.04 | 0.02 | 11.26 | 2.23 | 0 |
277 | DENSE | 18432 | 6144 | 3.00 | 2.63 | 0.04 | 9.38 | 3.57 | 0 |
278 | DENSE | 6144 | 6144 | 1.00 | 9.54 | 0.05 | 15.03 | 1.58 | 4 |
280 | DENSE | 24576 | 6144 | 4.00 | 4.86 | 0.02 | 13.78 | 2.84 | 0 |
281 | DENSE | 24576 | 6144 | 4.00 | 5.24 | 0.02 | 11.83 | 2.26 | 0 |
284 | DENSE | 18432 | 6144 | 3.00 | 2.62 | 0.04 | 9.30 | 3.56 | 0 |
285 | DENSE | 6144 | 6144 | 1.00 | 7.77 | 0.04 | 11.52 | 1.48 | 3 |
287 | DENSE | 24576 | 6144 | 4.00 | 4.70 | 0.01 | 13.30 | 2.83 | 0 |
288 | DENSE | 24576 | 6144 | 4.00 | 5.02 | 0.02 | 12.13 | 2.42 | 0 |
291 | DENSE | 18432 | 6144 | 3.00 | 2.60 | 0.04 | 9.29 | 3.57 | 0 |
292 | DENSE | 6144 | 6144 | 1.00 | 7.50 | 0.06 | 11.37 | 1.52 | 3 |
294 | DENSE | 24576 | 6144 | 4.00 | 4.57 | 0.02 | 12.95 | 2.83 | 0 |
295 | DENSE | 24576 | 6144 | 4.00 | 4.76 | 0.01 | 11.85 | 2.49 | 0 |
298 | DENSE | 18432 | 6144 | 3.00 | 2.04 | 0.04 | 7.27 | 3.56 | 0 |
299 | DENSE | 6144 | 6144 | 1.00 | 6.14 | 0.09 | 13.42 | 2.18 | 4 |
301 | DENSE | 24576 | 6144 | 4.00 | 4.29 | 0.02 | 12.32 | 2.87 | 0 |
302 | DENSE | 24576 | 6144 | 4.00 | 4.07 | 0.02 | 11.37 | 2.79 | 0 |
305 | DENSE | 18432 | 6144 | 3.00 | 2.12 | 0.03 | 6.95 | 3.29 | 0 |
306 | DENSE | 6144 | 6144 | 1.00 | 2.40 | 0.06 | 5.23 | 2.18 | 15 |
308 | DENSE | 24576 | 6144 | 4.00 | 3.77 | 0.03 | 11.17 | 2.97 | 0 |
309 | DENSE | 24576 | 6144 | 4.00 | 3.43 | 0.03 | 11.95 | 3.48 | 0 |