layer_id | layer_type | N | M | Q | alpha | D | alpha-hat | log_SN | % Rand | num_traps | num_fingers | rank_loss |
---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | EMBEDDING | 32128 | 512 | 62.75 | 2.28 | 0.07 | 18.77 | 8.22 | 74.05 | 0 | 4 | 0 |
8 | DENSE | 512 | 384 | 1.33 | 2.06 | 0.14 | 2.29 | 1.11 | 90.37 | 0 | 1 | 0 |
9 | DENSE | 512 | 384 | 1.33 | 1.97 | 0.13 | 5.74 | 2.92 | 91.19 | 0 | 1 | 0 |
10 | DENSE | 512 | 384 | 1.33 | 3.96 | 0.14 | 10.38 | 2.62 | 94.04 | 0 | 5 | 0 |
11 | DENSE | 512 | 384 | 1.33 | 3.15 | 0.03 | 10.98 | 3.48 | 84.73 | 0 | 0 | 0 |
17 | DENSE | 1024 | 512 | 2.00 | 3.19 | 0.05 | 10.65 | 3.34 | 88.12 | 0 | 0 | 0 |
18 | DENSE | 1024 | 512 | 2.00 | 3.58 | 0.08 | 11.66 | 3.26 | 91.82 | 0 | 0 | 0 |
19 | DENSE | 1024 | 512 | 2.00 | 3.08 | 0.03 | 11.14 | 3.61 | 82.90 | 0 | 0 | 0 |
28 | DENSE | 512 | 384 | 1.33 | 5.39 | 0.05 | 6.61 | 1.23 | 92.29 | 0 | 0 | 0 |
29 | DENSE | 512 | 384 | 1.33 | 5.20 | 0.05 | 15.46 | 2.97 | 92.73 | 0 | 0 | 0 |
30 | DENSE | 512 | 384 | 1.33 | 3.66 | 0.11 | 9.46 | 2.59 | 95.05 | 0 | 0 | 0 |
31 | DENSE | 512 | 384 | 1.33 | 3.30 | 0.04 | 12.29 | 3.73 | 81.81 | 0 | 0 | 0 |
36 | DENSE | 1024 | 512 | 2.00 | 3.53 | 0.03 | 11.74 | 3.33 | 89.16 | 0 | 0 | 0 |
37 | DENSE | 1024 | 512 | 2.00 | 4.92 | 0.08 | 16.02 | 3.26 | 95.07 | 0 | 0 | 0 |
38 | DENSE | 1024 | 512 | 2.00 | 3.19 | 0.02 | 11.26 | 3.53 | 84.74 | 0 | 0 | 0 |
47 | DENSE | 512 | 384 | 1.33 | 3.61 | 0.06 | 3.57 | 0.99 | 89.73 | 0 | 0 | 0 |
48 | DENSE | 512 | 384 | 1.33 | 5.01 | 0.05 | 14.44 | 2.88 | 91.78 | 0 | 0 | 0 |
49 | DENSE | 512 | 384 | 1.33 | 3.31 | 0.11 | 9.76 | 2.94 | 89.15 | 0 | 0 | 0 |
50 | DENSE | 512 | 384 | 1.33 | 4.03 | 0.04 | 14.45 | 3.58 | 83.20 | 0 | 0 | 0 |
55 | DENSE | 1024 | 512 | 2.00 | 3.34 | 0.04 | 11.13 | 3.33 | 87.27 | 0 | 0 | 0 |
56 | DENSE | 1024 | 512 | 2.00 | 6.37 | 0.06 | 22.15 | 3.48 | 94.30 | 0 | 0 | 0 |
57 | DENSE | 1024 | 512 | 2.00 | 3.53 | 0.04 | 13.16 | 3.72 | 86.18 | 0 | 0 | 0 |
66 | DENSE | 512 | 384 | 1.33 | 4.75 | 0.06 | 4.05 | 0.85 | 92.69 | 0 | 0 | 0 |
67 | DENSE | 512 | 384 | 1.33 | 5.44 | 0.06 | 14.78 | 2.72 | 93.50 | 0 | 0 | 0 |
68 | DENSE | 512 | 384 | 1.33 | 4.85 | 0.14 | 14.12 | 2.91 | 94.54 | 0 | 7 | 0 |
69 | DENSE | 512 | 384 | 1.33 | 4.09 | 0.05 | 13.71 | 3.35 | 91.19 | 0 | 0 | 0 |
74 | DENSE | 1024 | 512 | 2.00 | 3.41 | 0.04 | 11.20 | 3.29 | 86.20 | 0 | 0 | 0 |
75 | DENSE | 1024 | 512 | 2.00 | 5.67 | 0.10 | 20.22 | 3.57 | 93.70 | 0 | 1 | 0 |
76 | DENSE | 1024 | 512 | 2.00 | 3.69 | 0.04 | 13.47 | 3.65 | 88.03 | 0 | 0 | 0 |
85 | DENSE | 512 | 384 | 1.33 | 3.74 | 0.05 | 3.16 | 0.85 | 88.66 | 0 | 0 | 0 |
86 | DENSE | 512 | 384 | 1.33 | 3.44 | 0.10 | 9.19 | 2.67 | 88.16 | 0 | 1 | 0 |
87 | DENSE | 512 | 384 | 1.33 | 2.81 | 0.14 | 8.74 | 3.11 | 90.29 | 0 | 8 | 0 |
88 | DENSE | 512 | 384 | 1.33 | 4.20 | 0.05 | 16.10 | 3.83 | 85.75 | 0 | 0 | 0 |
93 | DENSE | 1024 | 512 | 2.00 | 3.48 | 0.06 | 11.22 | 3.23 | 85.48 | 0 | 0 | 0 |
94 | DENSE | 1024 | 512 | 2.00 | 5.16 | 0.07 | 19.03 | 3.69 | 93.04 | 0 | 0 | 0 |
95 | DENSE | 1024 | 512 | 2.00 | 3.88 | 0.04 | 14.62 | 3.76 | 87.82 | 0 | 0 | 0 |
104 | DENSE | 512 | 384 | 1.33 | 4.77 | 0.04 | 4.22 | 0.88 | 87.75 | 0 | 0 | 0 |
105 | DENSE | 512 | 384 | 1.33 | 2.16 | 0.14 | 5.67 | 2.62 | 90.81 | 0 | 8 | 0 |
106 | DENSE | 512 | 384 | 1.33 | 4.63 | 0.11 | 14.27 | 3.08 | 92.27 | 0 | 0 | 0 |
107 | DENSE | 512 | 384 | 1.33 | 4.00 | 0.06 | 15.14 | 3.79 | 86.15 | 0 | 0 | 0 |
112 | DENSE | 1024 | 512 | 2.00 | 3.24 | 0.10 | 10.25 | 3.16 | 85.28 | 0 | 6 | 0 |
113 | DENSE | 1024 | 512 | 2.00 | 5.38 | 0.07 | 20.53 | 3.82 | 91.74 | 0 | 0 | 0 |
114 | DENSE | 1024 | 512 | 2.00 | 3.91 | 0.04 | 14.64 | 3.74 | 88.35 | 0 | 0 | 0 |
123 | DENSE | 512 | 384 | 1.33 | 3.73 | 0.05 | 3.81 | 1.02 | 85.85 | 0 | 0 | 0 |
124 | DENSE | 512 | 384 | 1.33 | 3.50 | 0.07 | 9.39 | 2.68 | 88.39 | 0 | 0 | 0 |
125 | DENSE | 512 | 384 | 1.33 | 4.08 | 0.13 | 13.32 | 3.26 | 90.29 | 0 | 3 | 0 |
126 | DENSE | 512 | 384 | 1.33 | 3.09 | 0.10 | 12.08 | 3.91 | 84.97 | 0 | 1 | 0 |
131 | DENSE | 1024 | 512 | 2.00 | 2.87 | 0.08 | 8.87 | 3.08 | 85.37 | 0 | 1 | 0 |
132 | DENSE | 1024 | 512 | 2.00 | 4.54 | 0.05 | 17.83 | 3.93 | 91.24 | 0 | 0 | 0 |
133 | DENSE | 1024 | 512 | 2.00 | 3.98 | 0.03 | 14.52 | 3.65 | 89.14 | 0 | 0 | 0 |
142 | DENSE | 512 | 384 | 1.33 | 2.91 | 0.04 | 2.47 | 0.85 | 80.71 | 0 | 0 | 0 |
143 | DENSE | 512 | 384 | 1.33 | 2.57 | 0.07 | 6.36 | 2.48 | 83.83 | 0 | 0 | 0 |
144 | DENSE | 512 | 384 | 1.33 | 4.82 | 0.12 | 15.94 | 3.30 | 91.44 | 0 | 1 | 0 |
145 | DENSE | 512 | 384 | 1.33 | 4.25 | 0.06 | 17.23 | 4.06 | 83.31 | 0 | 0 | 0 |
150 | DENSE | 1024 | 512 | 2.00 | 2.80 | 0.09 | 8.71 | 3.12 | 85.23 | 0 | 2 | 0 |
151 | DENSE | 1024 | 512 | 2.00 | 4.39 | 0.05 | 18.08 | 4.12 | 91.24 | 1 | 0 | 0 |
152 | DENSE | 1024 | 512 | 2.00 | 3.46 | 0.04 | 13.14 | 3.80 | 86.18 | 0 | 0 | 0 |
165 | DENSE | 512 | 384 | 1.33 | 3.90 | 0.04 | 5.10 | 1.31 | 86.09 | 0 | 0 | 0 |
166 | DENSE | 512 | 384 | 1.33 | 4.57 | 0.08 | 13.71 | 3.00 | 88.84 | 0 | 0 | 0 |
167 | DENSE | 512 | 384 | 1.33 | 4.97 | 0.07 | 13.52 | 2.72 | 90.85 | 0 | 0 | 0 |
168 | DENSE | 512 | 384 | 1.33 | 3.20 | 0.06 | 10.59 | 3.31 | 83.33 | 0 | 0 | 0 |
174 | DENSE | 512 | 384 | 1.33 | 4.21 | 0.04 | 5.12 | 1.22 | 91.69 | 0 | 0 | 0 |
175 | DENSE | 512 | 384 | 1.33 | 3.36 | 0.09 | 10.10 | 3.01 | 84.42 | 0 | 0 | 0 |
176 | DENSE | 512 | 384 | 1.33 | 5.18 | 0.04 | 13.19 | 2.55 | 91.97 | 0 | 0 | 0 |
177 | DENSE | 512 | 384 | 1.33 | 3.02 | 0.04 | 10.58 | 3.51 | 79.18 | 0 | 0 | 0 |
182 | DENSE | 1024 | 512 | 2.00 | 2.82 | 0.03 | 10.69 | 3.79 | 82.89 | 0 | 0 | 0 |
183 | DENSE | 1024 | 512 | 2.00 | 3.56 | 0.04 | 11.43 | 3.21 | 91.61 | 0 | 0 | 0 |
184 | DENSE | 1024 | 512 | 2.00 | 3.28 | 0.03 | 12.37 | 3.77 | 82.52 | 0 | 0 | 0 |
193 | DENSE | 512 | 384 | 1.33 | 2.91 | 0.04 | 4.13 | 1.42 | 81.92 | 0 | 0 | 0 |
194 | DENSE | 512 | 384 | 1.33 | 3.11 | 0.04 | 9.10 | 2.93 | 83.02 | 0 | 0 | 0 |
195 | DENSE | 512 | 384 | 1.33 | 3.63 | 0.05 | 11.04 | 3.04 | 87.82 | 0 | 0 | 0 |
196 | DENSE | 512 | 384 | 1.33 | 2.84 | 0.02 | 11.19 | 3.94 | 74.92 | 0 | 0 | 0 |
201 | DENSE | 512 | 384 | 1.33 | 4.11 | 0.05 | 5.22 | 1.27 | 88.43 | 0 | 0 | 0 |
202 | DENSE | 512 | 384 | 1.33 | 3.62 | 0.04 | 10.71 | 2.95 | 89.81 | 0 | 0 | 0 |
203 | DENSE | 512 | 384 | 1.33 | 3.54 | 0.08 | 9.64 | 2.72 | 89.86 | 0 | 0 | 0 |
204 | DENSE | 512 | 384 | 1.33 | 2.95 | 0.03 | 11.15 | 3.79 | 75.58 | 0 | 0 | 0 |
209 | DENSE | 1024 | 512 | 2.00 | 3.90 | 0.03 | 13.05 | 3.35 | 88.83 | 0 | 0 | 0 |
210 | DENSE | 1024 | 512 | 2.00 | 4.48 | 0.07 | 15.22 | 3.40 | 92.83 | 0 | 0 | 0 |
211 | DENSE | 1024 | 512 | 2.00 | 3.76 | 0.05 | 15.29 | 4.06 | 83.04 | 0 | 0 | 0 |
220 | DENSE | 512 | 384 | 1.33 | 3.09 | 0.05 | 2.93 | 0.95 | 83.15 | 0 | 0 | 0 |
221 | DENSE | 512 | 384 | 1.33 | 3.43 | 0.05 | 9.39 | 2.74 | 85.53 | 0 | 0 | 0 |
222 | DENSE | 512 | 384 | 1.33 | 3.86 | 0.12 | 11.74 | 3.04 | 88.47 | 0 | 1 | 0 |
223 | DENSE | 512 | 384 | 1.33 | 2.85 | 0.04 | 11.88 | 4.17 | 73.27 | 0 | 0 | 0 |
228 | DENSE | 512 | 384 | 1.33 | 4.70 | 0.06 | 5.59 | 1.19 | 91.29 | 0 | 0 | 0 |
229 | DENSE | 512 | 384 | 1.33 | 3.98 | 0.05 | 11.44 | 2.88 | 90.57 | 0 | 0 | 0 |
230 | DENSE | 512 | 384 | 1.33 | 4.39 | 0.11 | 12.70 | 2.89 | 94.12 | 0 | 1 | 0 |
231 | DENSE | 512 | 384 | 1.33 | 3.11 | 0.05 | 12.43 | 4.00 | 77.98 | 0 | 0 | 0 |
236 | DENSE | 1024 | 512 | 2.00 | 3.63 | 0.05 | 11.90 | 3.28 | 87.16 | 0 | 0 | 0 |
237 | DENSE | 1024 | 512 | 2.00 | 4.67 | 0.04 | 17.81 | 3.81 | 91.91 | 0 | 0 | 0 |
238 | DENSE | 1024 | 512 | 2.00 | 3.82 | 0.05 | 17.33 | 4.53 | 78.69 | 0 | 0 | 0 |
247 | DENSE | 512 | 384 | 1.33 | 3.78 | 0.07 | 3.54 | 0.94 | 86.13 | 0 | 0 | 0 |
248 | DENSE | 512 | 384 | 1.33 | 3.36 | 0.05 | 9.07 | 2.70 | 86.78 | 0 | 0 | 0 |
249 | DENSE | 512 | 384 | 1.33 | 6.01 | 0.10 | 19.50 | 3.24 | 91.91 | 0 | 0 | 0 |
250 | DENSE | 512 | 384 | 1.33 | 3.15 | 0.09 | 13.93 | 4.43 | 74.34 | 0 | 0 | 0 |
255 | DENSE | 512 | 384 | 1.33 | 2.78 | 0.05 | 3.78 | 1.36 | 83.94 | 0 | 0 | 0 |
256 | DENSE | 512 | 384 | 1.33 | 2.73 | 0.05 | 8.96 | 3.28 | 79.50 | 0 | 0 | 0 |
257 | DENSE | 512 | 384 | 1.33 | 7.44 | 0.05 | 22.28 | 2.99 | 94.90 | 0 | 0 | 0 |
258 | DENSE | 512 | 384 | 1.33 | 3.34 | 0.06 | 13.60 | 4.07 | 75.60 | 0 | 0 | 0 |
263 | DENSE | 1024 | 512 | 2.00 | 2.92 | 0.05 | 9.31 | 3.19 | 85.09 | 0 | 0 | 0 |
264 | DENSE | 1024 | 512 | 2.00 | 4.09 | 0.09 | 15.56 | 3.81 | 91.32 | 0 | 1 | 0 |
265 | DENSE | 1024 | 512 | 2.00 | 3.65 | 0.02 | 16.55 | 4.54 | 80.09 | 0 | 0 | 0 |
274 | DENSE | 512 | 384 | 1.33 | 4.98 | 0.04 | 5.69 | 1.14 | 88.89 | 0 | 0 | 0 |
275 | DENSE | 512 | 384 | 1.33 | 3.65 | 0.14 | 9.70 | 2.66 | 91.96 | 0 | 8 | 0 |
276 | DENSE | 512 | 384 | 1.33 | 5.15 | 0.12 | 16.62 | 3.23 | 91.87 | 0 | 1 | 0 |
277 | DENSE | 512 | 384 | 1.33 | 3.05 | 0.04 | 14.09 | 4.63 | 73.94 | 0 | 0 | 0 |
282 | DENSE | 512 | 384 | 1.33 | 3.30 | 0.05 | 4.55 | 1.38 | 84.44 | 0 | 0 | 0 |
283 | DENSE | 512 | 384 | 1.33 | 3.06 | 0.04 | 10.19 | 3.33 | 83.32 | 0 | 0 | 0 |
284 | DENSE | 512 | 384 | 1.33 | 3.69 | 0.14 | 11.61 | 3.15 | 91.83 | 0 | 5 | 0 |
285 | DENSE | 512 | 384 | 1.33 | 3.93 | 0.06 | 15.80 | 4.02 | 82.20 | 0 | 0 | 0 |
290 | DENSE | 1024 | 512 | 2.00 | 3.31 | 0.05 | 10.04 | 3.03 | 86.29 | 0 | 0 | 0 |
291 | DENSE | 1024 | 512 | 2.00 | 3.58 | 0.11 | 13.75 | 3.84 | 92.24 | 0 | 4 | 0 |
292 | DENSE | 1024 | 512 | 2.00 | 3.60 | 0.04 | 16.21 | 4.50 | 80.84 | 0 | 0 | 0 |
301 | DENSE | 512 | 384 | 1.33 | 3.67 | 0.04 | 4.86 | 1.33 | 85.07 | 0 | 0 | 0 |
302 | DENSE | 512 | 384 | 1.33 | 5.73 | 0.07 | 14.51 | 2.53 | 91.11 | 0 | 0 | 0 |
303 | DENSE | 512 | 384 | 1.33 | 4.88 | 0.13 | 16.57 | 3.39 | 94.82 | 0 | 5 | 0 |
304 | DENSE | 512 | 384 | 1.33 | 1.91 | 0.08 | 8.57 | 4.48 | 78.15 | 0 | 1 | 0 |
309 | DENSE | 512 | 384 | 1.33 | 4.24 | 0.06 | 5.06 | 1.19 | 88.65 | 0 | 0 | 0 |
310 | DENSE | 512 | 384 | 1.33 | 4.75 | 0.06 | 14.04 | 2.96 | 88.93 | 0 | 0 | 0 |
311 | DENSE | 512 | 384 | 1.33 | 2.60 | 0.11 | 8.58 | 3.30 | 92.74 | 0 | 0 | 0 |
312 | DENSE | 512 | 384 | 1.33 | 3.30 | 0.08 | 14.74 | 4.46 | 77.15 | 0 | 0 | 0 |
317 | DENSE | 1024 | 512 | 2.00 | 3.14 | 0.05 | 9.01 | 2.87 | 86.13 | 0 | 0 | 0 |
318 | DENSE | 1024 | 512 | 2.00 | 4.55 | 0.09 | 18.00 | 3.96 | 92.19 | 0 | 1 | 0 |
319 | DENSE | 1024 | 512 | 2.00 | 3.94 | 0.04 | 17.16 | 4.36 | 83.87 | 0 | 0 | 0 |
328 | DENSE | 512 | 384 | 1.33 | 4.06 | 0.07 | 2.81 | 0.69 | 89.92 | 0 | 0 | 0 |
329 | DENSE | 512 | 384 | 1.33 | 4.10 | 0.07 | 10.14 | 2.47 | 89.30 | 0 | 0 | 0 |
330 | DENSE | 512 | 384 | 1.33 | 2.36 | 0.14 | 7.90 | 3.35 | 94.77 | 0 | 2 | 0 |
331 | DENSE | 512 | 384 | 1.33 | 4.09 | 0.10 | 20.10 | 4.91 | 75.82 | 0 | 0 | 0 |
336 | DENSE | 512 | 384 | 1.33 | 3.62 | 0.06 | 4.43 | 1.22 | 83.39 | 0 | 0 | 0 |
337 | DENSE | 512 | 384 | 1.33 | 2.04 | 0.11 | 6.21 | 3.05 | 84.01 | 0 | 4 | 0 |
338 | DENSE | 512 | 384 | 1.33 | 10.00 | 0.11 | 33.78 | 3.38 | 95.63 | 0 | 0 | 0 |
339 | DENSE | 512 | 384 | 1.33 | 3.83 | 0.11 | 17.76 | 4.63 | 81.59 | 0 | 0 | 0 |
344 | DENSE | 1024 | 512 | 2.00 | 3.38 | 0.05 | 9.37 | 2.78 | 85.88 | 0 | 0 | 0 |
345 | DENSE | 1024 | 512 | 2.00 | 4.20 | 0.07 | 17.81 | 4.24 | 90.89 | 0 | 0 | 0 |
346 | DENSE | 1024 | 512 | 2.00 | 3.92 | 0.05 | 17.31 | 4.42 | 85.33 | 0 | 0 | 0 |
355 | DENSE | 512 | 384 | 1.33 | 4.61 | 0.03 | 3.94 | 0.86 | 92.76 | 0 | 0 | 0 |
356 | DENSE | 512 | 384 | 1.33 | 4.69 | 0.05 | 13.03 | 2.78 | 92.92 | 0 | 0 | 0 |
357 | DENSE | 512 | 384 | 1.33 | 7.66 | 0.06 | 27.15 | 3.55 | 93.95 | 0 | 0 | 0 |
358 | DENSE | 512 | 384 | 1.33 | 3.26 | 0.07 | 14.32 | 4.39 | 77.37 | 0 | 0 | 0 |
363 | DENSE | 512 | 384 | 1.33 | 2.83 | 0.09 | 4.41 | 1.56 | 75.46 | 0 | 0 | 0 |
364 | DENSE | 512 | 384 | 1.33 | 1.94 | 0.09 | 6.44 | 3.32 | 77.66 | 0 | 1 | 0 |
365 | DENSE | 512 | 384 | 1.33 | 6.62 | 0.13 | 25.27 | 3.82 | 88.93 | 0 | 1 | 0 |
366 | DENSE | 512 | 384 | 1.33 | 3.68 | 0.06 | 17.22 | 4.68 | 85.98 | 0 | 0 | 0 |
371 | DENSE | 1024 | 512 | 2.00 | 3.24 | 0.04 | 10.59 | 3.27 | 81.52 | 0 | 0 | 0 |
372 | DENSE | 1024 | 512 | 2.00 | 3.10 | 0.08 | 15.34 | 4.95 | 86.02 | 0 | 0 | 0 |
373 | DENSE | 1024 | 512 | 2.00 | 2.86 | 0.05 | 15.16 | 5.30 | 70.96 | 7 | 0 | 0 |