Token | dominance |
Token ID | 18648 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
ォ | +0.442 |
kefeller | +0.396 |
ruary | +0.373 |
hester | +0.354 |
Nebula | +0.333 |
Neg logit contributions | |
ura | -0.332 |
uable | -0.301 |
pora | -0.295 |
veland | -0.290 |
oto | -0.271 |
Token | , |
Token ID | 11 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
ura | +0.791 |
uable | +0.711 |
pora | +0.691 |
veland | +0.682 |
oto | +0.636 |
Neg logit contributions | |
ォ | -1.170 |
kefeller | -1.060 |
ruary | -0.999 |
hester | -0.950 |
Nebula | -0.897 |
Token | � |
Token ID | 447 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
ura | +0.843 |
uable | +0.764 |
pora | +0.743 |
veland | +0.735 |
oto | +0.689 |
Neg logit contributions | |
ォ | -1.089 |
kefeller | -0.983 |
ruary | -0.924 |
hester | -0.875 |
Nebula | -0.822 |
Token | � |
Token ID | 251 |
Feature activation | +5.20e-01 |
Pos logit contributions | |
ura | +0.234 |
uable | +0.213 |
pora | +0.208 |
veland | +0.205 |
oto | +0.195 |
Neg logit contributions | |
ォ | -0.236 |
kefeller | -0.214 |
ruary | -0.198 |
hester | -0.187 |
Nebula | -0.173 |
Token | explains |
Token ID | 6688 |
Feature activation | -4.87e-01 |
Pos logit contributions | |
ura | +0.407 |
uable | +0.370 |
pora | +0.361 |
veland | +0.356 |
oto | +0.334 |
Neg logit contributions | |
ォ | -0.509 |
kefeller | -0.458 |
ruary | -0.430 |
hester | -0.406 |
Nebula | -0.382 |
Token | Agu |
Token ID | 33118 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
ォ | +0.446 |
kefeller | +0.397 |
ruary | +0.371 |
hester | +0.349 |
Nebula | +0.327 |
Neg logit contributions | |
ura | -0.413 |
uable | -0.378 |
pora | -0.369 |
veland | -0.365 |
oto | -0.345 |
Token | ilar |
Token ID | 1794 |
Feature activation | -9.93e-01 |
Pos logit contributions | |
ura | +9.736 |
uable | +7.927 |
veland | +7.904 |
pora | +7.563 |
aur | +7.389 |
Neg logit contributions | |
ォ | -13.709 |
kefeller | -12.642 |
ruary | -11.750 |
hester | -11.032 |
�� | -10.873 |
Token | . |
Token ID | 13 |
Feature activation | -9.24e-02 |
Pos logit contributions | |
ォ | +1.074 |
kefeller | +0.976 |
ruary | +0.923 |
hester | +0.878 |
Nebula | +0.831 |
Neg logit contributions | |
ura | -0.678 |
uable | -0.605 |
pora | -0.588 |
veland | -0.581 |
oto | -0.539 |
Token | In |
Token ID | 554 |
Feature activation | +5.18e-01 |
Pos logit contributions | |
ォ | +0.087 |
kefeller | +0.078 |
ruary | +0.073 |
hester | +0.069 |
Nebula | +0.064 |
Neg logit contributions | |
ura | -0.076 |
uable | -0.069 |
pora | -0.068 |
veland | -0.067 |
oto | -0.063 |
Token | Seattle |
Token ID | 7312 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
ura | +0.429 |
uable | +0.392 |
pora | +0.382 |
veland | +0.378 |
oto | +0.357 |
Neg logit contributions | |
ォ | -0.484 |
kefeller | -0.433 |
ruary | -0.405 |
hester | -0.382 |
Nebula | -0.358 |
Token | , |
Token ID | 11 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
ura | +0.695 |
uable | +0.617 |
pora | +0.599 |
veland | +0.598 |
oto | +0.553 |
Neg logit contributions | |
ォ | -1.102 |
kefeller | -1.012 |
ruary | -0.946 |
hester | -0.903 |
intern | -0.856 |
Token | V |
Token ID | 53 |
Feature activation | -2.66e+00 |
Pos logit contributions | |
ォ | +0.119 |
kefeller | +0.106 |
ruary | +0.099 |
hester | +0.094 |
Nebula | +0.088 |
Neg logit contributions | |
ura | -0.107 |
uable | -0.098 |
pora | -0.096 |
veland | -0.095 |
oto | -0.089 |
Token | ir |
Token ID | 343 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
ォ | +2.681 |
kefeller | +2.449 |
ruary | +2.291 |
hester | +2.212 |
intern | +2.088 |
Neg logit contributions | |
ura | -1.908 |
uable | -1.748 |
pora | -1.709 |
veland | -1.677 |
teenth | -1.557 |
Token | Go |
Token ID | 5247 |
Feature activation | +3.74e+00 |
Pos logit contributions | |
ォ | +1.820 |
kefeller | +1.636 |
ruary | +1.529 |
hester | +1.453 |
intern | +1.360 |
Neg logit contributions | |
ura | -1.567 |
uable | -1.450 |
pora | -1.408 |
veland | -1.394 |
aur | -1.292 |
Token | � |
Token ID | 447 |
Feature activation | -2.17e-01 |
Pos logit contributions | |
ura | +2.749 |
uable | +2.467 |
veland | +2.388 |
pora | +2.383 |
oto | +2.236 |
Neg logit contributions | |
ォ | -3.839 |
kefeller | -3.476 |
ruary | -3.286 |
hester | -3.091 |
Nebula | -2.933 |
Token | � |
Token ID | 251 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
ォ | +0.191 |
kefeller | +0.171 |
ruary | +0.159 |
hester | +0.149 |
Nebula | +0.139 |
Neg logit contributions | |
ura | -0.191 |
uable | -0.175 |
pora | -0.171 |
veland | -0.169 |
oto | -0.160 |
Token | Agu |
Token ID | 33118 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
ォ | +0.131 |
kefeller | +0.117 |
ruary | +0.111 |
hester | +0.105 |
Nebula | +0.099 |
Neg logit contributions | |
ura | -0.099 |
uable | -0.090 |
pora | -0.088 |
veland | -0.086 |
oto | -0.080 |
Token | ilar |
Token ID | 1794 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
ura | +9.261 |
uable | +7.889 |
veland | +7.626 |
aur | +7.613 |
oto | +7.536 |
Neg logit contributions | |
ォ | -13.448 |
kefeller | -12.412 |
ruary | -11.433 |
hester | -10.817 |
�� | -10.784 |
Token | near |
Token ID | 1474 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
ォ | +1.460 |
kefeller | +1.318 |
ruary | +1.246 |
hester | +1.182 |
intern | +1.119 |
Neg logit contributions | |
ura | -1.020 |
uable | -0.930 |
pora | -0.910 |
veland | -0.889 |
aur | -0.825 |
Token | one |
Token ID | 530 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
ura | +1.013 |
uable | +0.924 |
pora | +0.901 |
veland | +0.894 |
oto | +0.843 |
Neg logit contributions | |
ォ | -1.136 |
kefeller | -1.014 |
ruary | -0.948 |
hester | -0.894 |
intern | -0.836 |
Token | of |
Token ID | 286 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
ura | +0.258 |
uable | +0.231 |
pora | +0.224 |
veland | +0.221 |
oto | +0.205 |
Neg logit contributions | |
ォ | -0.412 |
kefeller | -0.374 |
ruary | -0.354 |
hester | -0.337 |
Nebula | -0.319 |
Token | the |
Token ID | 262 |
Feature activation | +7.42e-01 |
Pos logit contributions | |
ura | +0.201 |
uable | +0.183 |
pora | +0.178 |
veland | +0.177 |
oto | +0.167 |
Neg logit contributions | |
ォ | -0.223 |
kefeller | -0.199 |
ruary | -0.186 |
hester | -0.175 |
Nebula | -0.164 |
Token | But |
Token ID | 887 |
Feature activation | -4.19e+00 |
Pos logit contributions | |
ォ | +0.702 |
kefeller | +0.626 |
ruary | +0.588 |
hester | +0.554 |
Nebula | +0.521 |
Neg logit contributions | |
ura | -0.612 |
uable | -0.560 |
pora | -0.548 |
veland | -0.540 |
oto | -0.509 |
Token | after |
Token ID | 706 |
Feature activation | -2.94e+00 |
Pos logit contributions | |
ォ | +3.787 |
kefeller | +3.389 |
ruary | +3.200 |
hester | +3.037 |
Nebula | +2.878 |
Neg logit contributions | |
ura | -3.401 |
uable | -3.129 |
pora | -3.069 |
veland | -3.021 |
aur | -2.843 |
Token | Washington |
Token ID | 2669 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
ォ | +2.707 |
kefeller | +2.418 |
ruary | +2.261 |
hester | +2.141 |
Nebula | +2.032 |
Neg logit contributions | |
ura | -2.413 |
uable | -2.212 |
pora | -2.161 |
veland | -2.135 |
oto | -2.008 |
Token | kicker |
Token ID | 38297 |
Feature activation | +4.34e+00 |
Pos logit contributions | |
ォ | +1.082 |
kefeller | +0.976 |
ruary | +0.916 |
hester | +0.869 |
Nebula | +0.819 |
Neg logit contributions | |
ura | -0.835 |
uable | -0.755 |
pora | -0.739 |
veland | -0.728 |
oto | -0.683 |
Token | Joe |
Token ID | 5689 |
Feature activation | -7.22e-02 |
Pos logit contributions | |
ura | +3.757 |
uable | +3.458 |
pora | +3.393 |
veland | +3.360 |
oto | +3.180 |
Neg logit contributions | |
ォ | -3.846 |
kefeller | -3.440 |
ruary | -3.194 |
hester | -2.980 |
ィ | -2.755 |
Token | Agu |
Token ID | 33118 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
ォ | +0.064 |
kefeller | +0.057 |
ruary | +0.053 |
hester | +0.050 |
Nebula | +0.047 |
Neg logit contributions | |
ura | -0.063 |
uable | -0.057 |
pora | -0.056 |
veland | -0.056 |
oto | -0.053 |
Token | ir |
Token ID | 343 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
ura | +9.039 |
uable | +7.606 |
veland | +7.520 |
pora | +7.438 |
oto | +7.322 |
Neg logit contributions | |
ォ | -13.216 |
kefeller | -11.991 |
ruary | -11.044 |
hester | -10.423 |
�� | -10.121 |
Token | re |
Token ID | 260 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
ォ | +2.189 |
kefeller | +1.988 |
ruary | +1.881 |
hester | +1.789 |
intern | +1.693 |
Neg logit contributions | |
ura | -1.422 |
uable | -1.281 |
pora | -1.253 |
veland | -1.233 |
oto | -1.137 |
Token | failed |
Token ID | 4054 |
Feature activation | -3.86e+00 |
Pos logit contributions | |
ォ | +1.098 |
kefeller | +0.982 |
ruary | +0.921 |
hester | +0.876 |
intern | +0.828 |
Neg logit contributions | |
ura | -0.864 |
uable | -0.785 |
pora | -0.765 |
veland | -0.752 |
oto | -0.705 |
Token | to |
Token ID | 284 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
ォ | +3.786 |
kefeller | +3.407 |
ruary | +3.211 |
hester | +3.024 |
intern | +2.897 |
Neg logit contributions | |
ura | -2.912 |
uable | -2.637 |
pora | -2.593 |
veland | -2.531 |
oto | -2.382 |
Token | convert |
Token ID | 10385 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
ォ | +1.047 |
kefeller | +0.941 |
ruary | +0.879 |
hester | +0.832 |
intern | +0.791 |
Neg logit contributions | |
ura | -0.835 |
uable | -0.755 |
pora | -0.738 |
veland | -0.727 |
oto | -0.685 |
Token | Des |
Token ID | 2935 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
ura | +3.776 |
uable | +3.388 |
pora | +3.351 |
veland | +3.344 |
oto | +3.170 |
Neg logit contributions | |
ォ | -4.583 |
kefeller | -4.067 |
ruary | -3.818 |
hester | -3.572 |
�� | -3.422 |
Token | hm |
Token ID | 23940 |
Feature activation | +4.18e+00 |
Pos logit contributions | |
ura | +1.058 |
uable | +0.951 |
pora | +0.924 |
veland | +0.908 |
oto | +0.862 |
Neg logit contributions | |
ォ | -1.469 |
kefeller | -1.320 |
ruary | -1.248 |
hester | -1.177 |
Nebula | -1.115 |
Token | uk |
Token ID | 2724 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
ura | +2.299 |
uable | +1.948 |
pora | +1.879 |
veland | +1.816 |
oto | +1.731 |
Neg logit contributions | |
ォ | -5.150 |
kefeller | -4.692 |
ruary | -4.489 |
hester | -4.276 |
Nebula | -4.102 |
Token | h |
Token ID | 71 |
Feature activation | -8.18e-01 |
Pos logit contributions | |
ura | +1.196 |
uable | +1.106 |
pora | +1.087 |
veland | +1.067 |
oto | +0.993 |
Neg logit contributions | |
ォ | -1.288 |
kefeller | -1.155 |
ruary | -1.085 |
hester | -1.024 |
intern | -0.958 |
Token | for |
Token ID | 329 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
ォ | +0.863 |
kefeller | +0.780 |
ruary | +0.742 |
hester | +0.704 |
Nebula | +0.667 |
Neg logit contributions | |
ura | -0.566 |
uable | -0.515 |
pora | -0.496 |
veland | -0.491 |
oto | -0.455 |
Token | allot |
Token ID | 47405 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
ura | +1.069 |
uable | +0.973 |
pora | +0.953 |
veland | +0.939 |
aur | +0.887 |
Neg logit contributions | |
ォ | -1.233 |
kefeller | -1.111 |
ruary | -1.028 |
hester | -0.974 |
Nebula | -0.908 |
Token | ting |
Token ID | 889 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
ura | +9.659 |
uable | +8.661 |
pora | +8.513 |
veland | +8.316 |
aur | +8.157 |
Neg logit contributions | |
ォ | -9.008 |
kefeller | -8.153 |
ruary | -7.051 |
hester | -6.944 |
�� | -6.735 |
Token | the |
Token ID | 262 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
ura | +1.103 |
uable | +1.004 |
pora | +0.978 |
veland | +0.965 |
oto | +0.907 |
Neg logit contributions | |
ォ | -1.383 |
kefeller | -1.243 |
ruary | -1.166 |
hester | -1.105 |
Nebula | -1.035 |
Token | land |
Token ID | 1956 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
ura | +1.005 |
uable | +0.909 |
pora | +0.885 |
veland | +0.874 |
oto | +0.817 |
Neg logit contributions | |
ォ | -1.365 |
kefeller | -1.232 |
ruary | -1.160 |
hester | -1.100 |
Nebula | -1.035 |
Token | in |
Token ID | 287 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
ura | +0.896 |
uable | +0.806 |
pora | +0.782 |
veland | +0.772 |
oto | +0.718 |
Neg logit contributions | |
ォ | -1.350 |
kefeller | -1.223 |
ruary | -1.157 |
hester | -1.098 |
Nebula | -1.040 |
Token | 2004 |
Token ID | 5472 |
Feature activation | +2.56e+00 |
Pos logit contributions | |
ura | +1.411 |
uable | +1.292 |
pora | +1.265 |
veland | +1.246 |
oto | +1.181 |
Neg logit contributions | |
ォ | -1.551 |
kefeller | -1.383 |
ruary | -1.286 |
hester | -1.218 |
intern | -1.132 |
Token | lack |
Token ID | 3092 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
ura | +1.768 |
uable | +1.617 |
pora | +1.577 |
veland | +1.547 |
aur | +1.458 |
Neg logit contributions | |
ォ | -2.130 |
kefeller | -1.913 |
ruary | -1.785 |
hester | -1.691 |
Nebula | -1.569 |
Token | of |
Token ID | 286 |
Feature activation | -1.77e-01 |
Pos logit contributions | |
ォ | +2.744 |
kefeller | +2.504 |
ruary | +2.373 |
hester | +2.264 |
Nebula | +2.150 |
Neg logit contributions | |
ura | -1.540 |
uable | -1.367 |
pora | -1.323 |
veland | -1.302 |
oto | -1.199 |
Token | transparency |
Token ID | 13902 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
ォ | +0.169 |
kefeller | +0.152 |
ruary | +0.142 |
hester | +0.134 |
Nebula | +0.126 |
Neg logit contributions | |
ura | -0.142 |
uable | -0.129 |
pora | -0.126 |
veland | -0.125 |
oto | -0.117 |
Token | in |
Token ID | 287 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
ura | +0.074 |
uable | +0.066 |
pora | +0.064 |
veland | +0.063 |
oto | +0.059 |
Neg logit contributions | |
ォ | -0.115 |
kefeller | -0.105 |
ruary | -0.099 |
hester | -0.094 |
Nebula | -0.089 |
Token | the |
Token ID | 262 |
Feature activation | +7.60e-01 |
Pos logit contributions | |
ura | +0.906 |
uable | +0.825 |
pora | +0.808 |
veland | +0.796 |
oto | +0.749 |
Neg logit contributions | |
ォ | -1.110 |
kefeller | -0.994 |
ruary | -0.931 |
hester | -0.881 |
intern | -0.823 |
Token | allot |
Token ID | 47405 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
ura | +0.600 |
uable | +0.545 |
pora | +0.532 |
veland | +0.525 |
oto | +0.494 |
Neg logit contributions | |
ォ | -0.739 |
kefeller | -0.664 |
ruary | -0.623 |
hester | -0.589 |
Nebula | -0.552 |
Token | ment |
Token ID | 434 |
Feature activation | +6.82e-01 |
Pos logit contributions | |
ura | +6.695 |
uable | +5.725 |
pora | +5.653 |
veland | +5.370 |
aur | +5.210 |
Neg logit contributions | |
ォ | -11.500 |
kefeller | -10.616 |
ruary | -9.662 |
hester | -9.474 |
�� | -9.125 |
Token | of |
Token ID | 286 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
ura | +0.494 |
uable | +0.445 |
pora | +0.433 |
veland | +0.427 |
oto | +0.399 |
Neg logit contributions | |
ォ | -0.708 |
kefeller | -0.641 |
ruary | -0.604 |
hester | -0.573 |
Nebula | -0.541 |
Token | land |
Token ID | 1956 |
Feature activation | +8.10e-01 |
Pos logit contributions | |
ura | +0.238 |
uable | +0.216 |
pora | +0.210 |
veland | +0.208 |
oto | +0.195 |
Neg logit contributions | |
ォ | -0.303 |
kefeller | -0.273 |
ruary | -0.257 |
hester | -0.243 |
Nebula | -0.229 |
Token | as |
Token ID | 355 |
Feature activation | -5.39e-01 |
Pos logit contributions | |
ura | +0.571 |
uable | +0.514 |
pora | +0.499 |
veland | +0.493 |
oto | +0.458 |
Neg logit contributions | |
ォ | -0.854 |
kefeller | -0.774 |
ruary | -0.732 |
hester | -0.694 |
Nebula | -0.658 |
Token | many |
Token ID | 867 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
ォ | +0.516 |
kefeller | +0.462 |
ruary | +0.435 |
hester | +0.410 |
Nebula | +0.387 |
Neg logit contributions | |
ura | -0.430 |
uable | -0.393 |
pora | -0.383 |
veland | -0.379 |
oto | -0.356 |
Token | Palm |
Token ID | 18358 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
ura | +0.599 |
uable | +0.550 |
pora | +0.537 |
veland | +0.531 |
oto | +0.501 |
Neg logit contributions | |
ォ | -0.641 |
kefeller | -0.573 |
ruary | -0.534 |
hester | -0.504 |
Nebula | -0.472 |
Token | Beach |
Token ID | 8511 |
Feature activation | +9.05e-01 |
Pos logit contributions | |
ura | +2.510 |
uable | +2.235 |
pora | +2.188 |
veland | +2.187 |
oto | +2.063 |
Neg logit contributions | |
ォ | -3.234 |
kefeller | -2.925 |
ruary | -2.726 |
hester | -2.583 |
�� | -2.423 |
Token | , |
Token ID | 11 |
Feature activation | +7.22e-01 |
Pos logit contributions | |
ura | +0.627 |
uable | +0.554 |
pora | +0.545 |
veland | +0.538 |
aur | +0.501 |
Neg logit contributions | |
ォ | -0.977 |
kefeller | -0.886 |
ruary | -0.834 |
hester | -0.792 |
intern | -0.751 |
Token | Florida |
Token ID | 4744 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
ura | +0.611 |
uable | +0.561 |
pora | +0.548 |
veland | +0.541 |
oto | +0.510 |
Neg logit contributions | |
ォ | -0.658 |
kefeller | -0.588 |
ruary | -0.549 |
hester | -0.518 |
Nebula | -0.485 |
Token | , |
Token ID | 11 |
Feature activation | +6.43e-01 |
Pos logit contributions | |
ura | +2.277 |
uable | +1.987 |
pora | +1.958 |
veland | +1.946 |
oto | +1.824 |
Neg logit contributions | |
ォ | -3.946 |
kefeller | -3.551 |
ruary | -3.354 |
hester | -3.188 |
intern | -3.049 |
Token | Moreno |
Token ID | 43269 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
ura | +0.551 |
uable | +0.506 |
pora | +0.495 |
veland | +0.489 |
oto | +0.461 |
Neg logit contributions | |
ォ | -0.579 |
kefeller | -0.518 |
ruary | -0.483 |
hester | -0.455 |
Nebula | -0.426 |
Token | Valley |
Token ID | 6916 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
ura | +8.821 |
veland | +7.746 |
uable | +7.675 |
pora | +7.579 |
aur | +7.416 |
Neg logit contributions | |
ォ | -9.351 |
kefeller | -8.227 |
ruary | -7.730 |
hester | -7.017 |
�� | -7.007 |
Token | , |
Token ID | 11 |
Feature activation | +5.65e-01 |
Pos logit contributions | |
ura | +0.887 |
uable | +0.783 |
pora | +0.771 |
veland | +0.757 |
oto | +0.707 |
Neg logit contributions | |
ォ | -1.368 |
kefeller | -1.243 |
ruary | -1.173 |
hester | -1.112 |
intern | -1.048 |
Token | California |
Token ID | 3442 |
Feature activation | +2.87e+00 |
Pos logit contributions | |
ura | +0.467 |
uable | +0.429 |
pora | +0.419 |
veland | +0.413 |
oto | +0.388 |
Neg logit contributions | |
ォ | -0.524 |
kefeller | -0.469 |
ruary | -0.439 |
hester | -0.415 |
Nebula | -0.391 |
Token | , |
Token ID | 11 |
Feature activation | +5.27e-01 |
Pos logit contributions | |
ura | +1.906 |
uable | +1.671 |
pora | +1.628 |
veland | +1.613 |
oto | +1.520 |
Neg logit contributions | |
ォ | -3.154 |
kefeller | -2.840 |
ruary | -2.695 |
hester | -2.556 |
�� | -2.444 |
Token | Minneapolis |
Token ID | 20455 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
ura | +0.441 |
uable | +0.405 |
pora | +0.395 |
veland | +0.390 |
oto | +0.367 |
Neg logit contributions | |
ォ | -0.484 |
kefeller | -0.434 |
ruary | -0.405 |
hester | -0.383 |
Nebula | -0.359 |
Token | Des |
Token ID | 2935 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
ォ | +1.702 |
kefeller | +1.524 |
ruary | +1.422 |
hester | +1.340 |
Nebula | +1.258 |
Neg logit contributions | |
ura | -1.568 |
uable | -1.434 |
pora | -1.399 |
veland | -1.386 |
oto | -1.306 |
Token | hm |
Token ID | 23940 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
ura | +1.099 |
uable | +1.026 |
pora | +1.003 |
veland | +0.998 |
oto | +0.948 |
Neg logit contributions | |
ォ | -0.782 |
kefeller | -0.683 |
ruary | -0.623 |
hester | -0.582 |
intern | -0.529 |
Token | uk |
Token ID | 2724 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
ura | +1.990 |
uable | +1.734 |
pora | +1.676 |
veland | +1.641 |
oto | +1.498 |
Neg logit contributions | |
ォ | -4.213 |
kefeller | -3.862 |
ruary | -3.671 |
hester | -3.517 |
Nebula | -3.354 |
Token | h |
Token ID | 71 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
ura | +0.928 |
uable | +0.852 |
pora | +0.832 |
veland | +0.822 |
oto | +0.773 |
Neg logit contributions | |
ォ | -1.040 |
kefeller | -0.933 |
ruary | -0.873 |
hester | -0.826 |
intern | -0.774 |
Token | in |
Token ID | 287 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
ォ | +1.055 |
kefeller | +0.961 |
ruary | +0.909 |
hester | +0.863 |
Nebula | +0.818 |
Neg logit contributions | |
ura | -0.705 |
uable | -0.639 |
pora | -0.613 |
veland | -0.608 |
oto | -0.566 |
Token | allot |
Token ID | 47405 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
ura | +1.086 |
uable | +0.984 |
pora | +0.963 |
veland | +0.947 |
aur | +0.890 |
Neg logit contributions | |
ォ | -1.411 |
kefeller | -1.270 |
ruary | -1.190 |
hester | -1.128 |
intern | -1.055 |
Token | ting |
Token ID | 889 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
ura | +9.407 |
uable | +8.539 |
pora | +8.358 |
veland | +8.296 |
aur | +8.003 |
Neg logit contributions | |
ォ | -8.121 |
kefeller | -7.230 |
ruary | -6.355 |
hester | -6.073 |
�� | -5.841 |
Token | the |
Token ID | 262 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
ura | +0.835 |
uable | +0.761 |
pora | +0.740 |
veland | +0.730 |
oto | +0.687 |
Neg logit contributions | |
ォ | -1.057 |
kefeller | -0.948 |
ruary | -0.892 |
hester | -0.844 |
Nebula | -0.790 |
Token | land |
Token ID | 1956 |
Feature activation | +5.49e-01 |
Pos logit contributions | |
ura | +0.809 |
uable | +0.732 |
pora | +0.712 |
veland | +0.703 |
oto | +0.658 |
Neg logit contributions | |
ォ | -1.096 |
kefeller | -0.989 |
ruary | -0.931 |
hester | -0.883 |
Nebula | -0.831 |
Token | . |
Token ID | 13 |
Feature activation | +8.05e-02 |
Pos logit contributions | |
ura | +0.376 |
uable | +0.337 |
pora | +0.327 |
veland | +0.323 |
oto | +0.299 |
Neg logit contributions | |
ォ | -0.590 |
kefeller | -0.536 |
ruary | -0.508 |
hester | -0.482 |
Nebula | -0.457 |
Token |
|
Token ID | 198 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
ura | +0.059 |
uable | +0.053 |
pora | +0.052 |
veland | +0.051 |
aur | +0.048 |
Neg logit contributions | |
ォ | -0.083 |
kefeller | -0.075 |
ruary | -0.070 |
hester | -0.067 |
intern | -0.063 |
Token | According |
Token ID | 4821 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
ura | +0.960 |
uable | +0.879 |
pora | +0.858 |
veland | +0.854 |
oto | +0.811 |
Neg logit contributions | |
ォ | -0.961 |
kefeller | -0.855 |
ruary | -0.798 |
hester | -0.746 |
Nebula | -0.694 |
Token | to |
Token ID | 284 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
ォ | +1.223 |
kefeller | +1.110 |
ruary | +1.038 |
hester | +0.991 |
Nebula | +0.940 |
Neg logit contributions | |
ura | -0.952 |
uable | -0.871 |
pora | -0.853 |
veland | -0.831 |
oto | -0.779 |
Token | CBS |
Token ID | 11133 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
ura | +0.481 |
uable | +0.439 |
veland | +0.428 |
pora | +0.428 |
oto | +0.402 |
Neg logit contributions | |
ォ | -0.531 |
kefeller | -0.470 |
ruary | -0.441 |
hester | -0.414 |
�� | -0.387 |
Token | New |
Token ID | 968 |
Feature activation | +6.99e-01 |
Pos logit contributions | |
ォ | +1.651 |
kefeller | +1.465 |
ruary | +1.363 |
hester | +1.283 |
Nebula | +1.198 |
Neg logit contributions | |
ura | -1.590 |
uable | -1.458 |
pora | -1.421 |
veland | -1.410 |
oto | -1.334 |
Token | York |
Token ID | 1971 |
Feature activation | -1.92e+00 |
Pos logit contributions | |
ura | +0.697 |
uable | +0.646 |
pora | +0.635 |
veland | +0.631 |
oto | +0.601 |
Neg logit contributions | |
ォ | -0.536 |
kefeller | -0.465 |
ruary | -0.428 |
hester | -0.395 |
Nebula | -0.363 |
Token | cho |
Token ID | 1727 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
ォ | +2.048 |
kefeller | +1.848 |
ruary | +1.736 |
hester | +1.656 |
Nebula | +1.573 |
Neg logit contributions | |
ura | -1.356 |
uable | -1.211 |
veland | -1.176 |
pora | -1.170 |
aur | -1.087 |
Token | pper |
Token ID | 2848 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
ura | +6.474 |
veland | +5.790 |
uable | +5.571 |
irs | +5.509 |
pora | +5.493 |
Neg logit contributions | |
ォ | -10.877 |
kefeller | -9.710 |
ruary | -9.361 |
hester | -8.757 |
Nebula | -8.633 |
Token | reporter |
Token ID | 9095 |
Feature activation | +8.04e-01 |
Pos logit contributions | |
ura | +1.939 |
uable | +1.770 |
veland | +1.731 |
pora | +1.723 |
oto | +1.618 |
Neg logit contributions | |
ォ | -2.111 |
kefeller | -1.882 |
ruary | -1.750 |
hester | -1.650 |
bley | -1.536 |
Token | Joe |
Token ID | 5689 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
ura | +0.728 |
uable | +0.668 |
pora | +0.655 |
veland | +0.650 |
oto | +0.617 |
Neg logit contributions | |
ォ | -0.690 |
kefeller | -0.613 |
ruary | -0.566 |
hester | -0.530 |
intern | -0.489 |
Token | B |
Token ID | 347 |
Feature activation | -9.48e-01 |
Pos logit contributions | |
ura | +1.081 |
uable | +0.985 |
pora | +0.963 |
veland | +0.957 |
oto | +0.907 |
Neg logit contributions | |
ォ | -1.122 |
kefeller | -1.001 |
ruary | -0.934 |
hester | -0.876 |
intern | -0.816 |
Token | ier |
Token ID | 959 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
ォ | +0.985 |
kefeller | +0.896 |
ruary | +0.846 |
hester | +0.803 |
intern | +0.758 |
Neg logit contributions | |
ura | -0.671 |
uable | -0.611 |
pora | -0.595 |
veland | -0.583 |
oto | -0.540 |
Token | Bun |
Token ID | 28515 |
Feature activation | +3.33e-01 |
Pos logit contributions | |
ura | +1.402 |
uable | +1.275 |
pora | +1.243 |
veland | +1.236 |
oto | +1.162 |
Neg logit contributions | |
ォ | -1.614 |
kefeller | -1.440 |
ruary | -1.354 |
hester | -1.274 |
intern | -1.190 |
Token | awan |
Token ID | 43004 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
ura | +0.284 |
uable | +0.261 |
pora | +0.255 |
veland | +0.252 |
oto | +0.238 |
Neg logit contributions | |
ォ | -0.301 |
kefeller | -0.268 |
ruary | -0.251 |
hester | -0.236 |
Nebula | -0.220 |
Token | township |
Token ID | 42823 |
Feature activation | +5.31e-01 |
Pos logit contributions | |
ura | +2.388 |
uable | +2.134 |
pora | +2.093 |
veland | +2.055 |
oto | +1.948 |
Neg logit contributions | |
ォ | -3.204 |
kefeller | -2.895 |
ruary | -2.723 |
hester | -2.577 |
intern | -2.427 |
Token | in |
Token ID | 287 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
ura | +0.388 |
uable | +0.352 |
pora | +0.341 |
veland | +0.337 |
oto | +0.314 |
Neg logit contributions | |
ォ | -0.546 |
kefeller | -0.492 |
ruary | -0.466 |
hester | -0.441 |
Nebula | -0.417 |
Token | the |
Token ID | 262 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
ura | +1.266 |
uable | +1.147 |
pora | +1.119 |
veland | +1.105 |
oto | +1.037 |
Neg logit contributions | |
ォ | -1.635 |
kefeller | -1.471 |
ruary | -1.382 |
hester | -1.309 |
Nebula | -1.231 |
Token | Philippines |
Token ID | 13316 |
Feature activation | +9.73e+00 |
Pos logit contributions | |
ura | +0.978 |
uable | +0.885 |
pora | +0.861 |
veland | +0.849 |
aur | +0.790 |
Neg logit contributions | |
ォ | -1.383 |
kefeller | -1.250 |
ruary | -1.180 |
hester | -1.118 |
Nebula | -1.061 |
Token | celebrated |
Token ID | 13943 |
Feature activation | +7.21e-01 |
Pos logit contributions | |
ura | +7.206 |
uable | +6.326 |
pora | +6.269 |
veland | +6.023 |
aur | +5.886 |
Neg logit contributions | |
ォ | -9.646 |
kefeller | -8.820 |
ruary | -7.988 |
hester | -7.743 |
�� | -7.539 |
Token | what |
Token ID | 644 |
Feature activation | -3.71e-01 |
Pos logit contributions | |
ura | +0.573 |
uable | +0.520 |
pora | +0.506 |
veland | +0.501 |
oto | +0.472 |
Neg logit contributions | |
ォ | -0.701 |
kefeller | -0.626 |
ruary | -0.588 |
hester | -0.555 |
intern | -0.520 |
Token | they |
Token ID | 484 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
ォ | +0.380 |
kefeller | +0.343 |
ruary | +0.323 |
hester | +0.306 |
Nebula | +0.289 |
Neg logit contributions | |
ura | -0.274 |
uable | -0.247 |
pora | -0.241 |
veland | -0.237 |
oto | -0.222 |
Token | hope |
Token ID | 2911 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
ura | +1.140 |
uable | +1.024 |
pora | +0.996 |
veland | +0.986 |
oto | +0.922 |
Neg logit contributions | |
ォ | -1.585 |
kefeller | -1.437 |
ruary | -1.349 |
hester | -1.282 |
Nebula | -1.208 |
Token | is |
Token ID | 318 |
Feature activation | +2.71e+00 |
Pos logit contributions | |
ura | +0.849 |
uable | +0.765 |
pora | +0.734 |
veland | +0.732 |
oto | +0.689 |
Neg logit contributions | |
ォ | -1.165 |
kefeller | -1.046 |
ruary | -0.995 |
hester | -0.936 |
intern | -0.884 |
Token | It |
Token ID | 632 |
Feature activation | -7.52e-02 |
Pos logit contributions | |
ォ | +0.140 |
kefeller | +0.123 |
ruary | +0.115 |
hester | +0.108 |
Nebula | +0.101 |
Neg logit contributions | |
ura | -0.149 |
uable | -0.137 |
pora | -0.134 |
veland | -0.133 |
oto | -0.126 |
Token | � |
Token ID | 447 |
Feature activation | -3.16e-02 |
Pos logit contributions | |
ォ | +0.077 |
kefeller | +0.069 |
ruary | +0.065 |
hester | +0.062 |
Nebula | +0.058 |
Neg logit contributions | |
ura | -0.056 |
uable | -0.050 |
pora | -0.049 |
veland | -0.048 |
oto | -0.045 |
Token | � |
Token ID | 247 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
ォ | +0.026 |
kefeller | +0.022 |
ruary | +0.021 |
hester | +0.019 |
Nebula | +0.018 |
Neg logit contributions | |
ura | -0.030 |
uable | -0.028 |
pora | -0.027 |
veland | -0.027 |
oto | -0.026 |
Token | s |
Token ID | 82 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
ォ | +0.954 |
kefeller | +0.847 |
ruary | +0.789 |
hester | +0.741 |
Nebula | +0.691 |
Neg logit contributions | |
ura | -0.944 |
uable | -0.867 |
pora | -0.847 |
veland | -0.839 |
oto | -0.793 |
Token | a |
Token ID | 257 |
Feature activation | -5.15e-01 |
Pos logit contributions | |
ura | +1.477 |
uable | +1.340 |
pora | +1.306 |
veland | +1.289 |
oto | +1.211 |
Neg logit contributions | |
ォ | -1.834 |
kefeller | -1.652 |
ruary | -1.546 |
hester | -1.461 |
intern | -1.373 |
Token | Sa |
Token ID | 10318 |
Feature activation | +9.72e+00 |
Pos logit contributions | |
ォ | +0.501 |
kefeller | +0.450 |
ruary | +0.422 |
hester | +0.399 |
Nebula | +0.376 |
Neg logit contributions | |
ura | -0.406 |
uable | -0.370 |
pora | -0.361 |
veland | -0.356 |
oto | -0.335 |
Token | ison |
Token ID | 1653 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
ura | +8.422 |
veland | +7.623 |
pora | +7.496 |
uable | +7.376 |
oto | +6.998 |
Neg logit contributions | |
ォ | -8.531 |
kefeller | -7.376 |
ruary | -6.845 |
hester | -6.443 |
Nebula | -6.085 |
Token | style |
Token ID | 3918 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
ォ | +1.330 |
kefeller | +1.199 |
ruary | +1.133 |
hester | +1.073 |
Nebula | +1.018 |
Neg logit contributions | |
ura | -0.960 |
uable | -0.875 |
pora | -0.848 |
veland | -0.842 |
oto | -0.783 |
Token | beer |
Token ID | 6099 |
Feature activation | +4.49e-02 |
Pos logit contributions | |
ura | +1.211 |
uable | +1.091 |
pora | +1.066 |
veland | +1.048 |
oto | +0.982 |
Neg logit contributions | |
ォ | -1.667 |
kefeller | -1.507 |
ruary | -1.417 |
hester | -1.344 |
intern | -1.266 |
Token | , |
Token ID | 11 |
Feature activation | +7.85e-01 |
Pos logit contributions | |
ura | +0.033 |
uable | +0.030 |
pora | +0.029 |
veland | +0.028 |
oto | +0.026 |
Neg logit contributions | |
ォ | -0.046 |
kefeller | -0.042 |
ruary | -0.040 |
hester | -0.037 |
Nebula | -0.035 |
Token | unf |
Token ID | 3684 |
Feature activation | +7.20e-01 |
Pos logit contributions | |
ura | +0.577 |
uable | +0.522 |
pora | +0.508 |
veland | +0.502 |
oto | +0.468 |
Neg logit contributions | |
ォ | -0.805 |
kefeller | -0.727 |
ruary | -0.685 |
hester | -0.650 |
Nebula | -0.614 |
Token | that |
Token ID | 326 |
Feature activation | +3.78e-01 |
Pos logit contributions | |
ォ | +0.596 |
kefeller | +0.534 |
ruary | +0.501 |
hester | +0.474 |
Nebula | +0.445 |
Neg logit contributions | |
ura | -0.506 |
uable | -0.463 |
pora | -0.451 |
veland | -0.446 |
oto | -0.419 |
Token | means |
Token ID | 1724 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
ura | +0.268 |
uable | +0.241 |
pora | +0.235 |
veland | +0.231 |
oto | +0.215 |
Neg logit contributions | |
ォ | -0.398 |
kefeller | -0.362 |
ruary | -0.341 |
hester | -0.324 |
Nebula | -0.306 |
Token | death |
Token ID | 1918 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
ura | +0.852 |
uable | +0.772 |
pora | +0.754 |
veland | +0.744 |
oto | +0.700 |
Neg logit contributions | |
ォ | -1.050 |
kefeller | -0.946 |
ruary | -0.886 |
hester | -0.837 |
Nebula | -0.786 |
Token | for |
Token ID | 329 |
Feature activation | +8.43e-01 |
Pos logit contributions | |
ォ | +3.140 |
kefeller | +2.835 |
ruary | +2.689 |
hester | +2.538 |
intern | +2.413 |
Neg logit contributions | |
ura | -2.148 |
uable | -1.955 |
pora | -1.918 |
veland | -1.878 |
oto | -1.727 |
Token | the |
Token ID | 262 |
Feature activation | +5.64e-01 |
Pos logit contributions | |
ura | +0.675 |
uable | +0.613 |
pora | +0.597 |
veland | +0.590 |
oto | +0.557 |
Neg logit contributions | |
ォ | -0.812 |
kefeller | -0.728 |
ruary | -0.684 |
hester | -0.646 |
Nebula | -0.605 |
Token | Yaz |
Token ID | 35856 |
Feature activation | +9.64e+00 |
Pos logit contributions | |
ura | +0.444 |
uable | +0.403 |
pora | +0.393 |
veland | +0.388 |
oto | +0.365 |
Neg logit contributions | |
ォ | -0.551 |
kefeller | -0.495 |
ruary | -0.465 |
hester | -0.439 |
Nebula | -0.412 |
Token | idis |
Token ID | 29207 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
ura | +6.312 |
uable | +5.431 |
pora | +5.330 |
veland | +5.050 |
oto | +5.005 |
Neg logit contributions | |
ォ | -10.575 |
kefeller | -9.642 |
ruary | -9.143 |
hester | -8.842 |
�� | -8.436 |
Token | , |
Token ID | 11 |
Feature activation | +9.70e-01 |
Pos logit contributions | |
ura | +0.966 |
uable | +0.860 |
pora | +0.840 |
veland | +0.822 |
aur | +0.767 |
Neg logit contributions | |
ォ | -1.538 |
kefeller | -1.399 |
ruary | -1.322 |
hester | -1.256 |
Nebula | -1.190 |
Token | and |
Token ID | 290 |
Feature activation | +7.91e-02 |
Pos logit contributions | |
ura | +0.719 |
uable | +0.648 |
pora | +0.633 |
veland | +0.621 |
oto | +0.583 |
Neg logit contributions | |
ォ | -0.993 |
kefeller | -0.897 |
ruary | -0.845 |
hester | -0.801 |
Nebula | -0.753 |
Token | a |
Token ID | 257 |
Feature activation | -7.05e-01 |
Pos logit contributions | |
ura | +0.061 |
uable | +0.055 |
pora | +0.054 |
veland | +0.053 |
oto | +0.050 |
Neg logit contributions | |
ォ | -0.079 |
kefeller | -0.071 |
ruary | -0.067 |
hester | -0.063 |
Nebula | -0.059 |
Token | mortal |
Token ID | 22122 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
ォ | +0.681 |
kefeller | +0.611 |
ruary | +0.573 |
hester | +0.541 |
Nebula | +0.508 |
Neg logit contributions | |
ura | -0.561 |
uable | -0.511 |
pora | -0.499 |
veland | -0.493 |
oto | -0.463 |
Token | in |
Token ID | 259 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
ォ | +2.764 |
kefeller | +2.492 |
ruary | +2.346 |
hester | +2.231 |
intern | +2.137 |
Neg logit contributions | |
ura | -2.005 |
uable | -1.829 |
pora | -1.786 |
veland | -1.765 |
oto | -1.630 |
Token | this |
Token ID | 428 |
Feature activation | +4.31e-01 |
Pos logit contributions | |
ura | +1.104 |
uable | +1.009 |
pora | +0.984 |
veland | +0.974 |
oto | +0.920 |
Neg logit contributions | |
ォ | -1.245 |
kefeller | -1.115 |
ruary | -1.042 |
hester | -0.983 |
Nebula | -0.914 |
Token | case |
Token ID | 1339 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
ura | +0.249 |
uable | +0.218 |
pora | +0.210 |
veland | +0.207 |
oto | +0.189 |
Neg logit contributions | |
ォ | -0.512 |
kefeller | -0.469 |
ruary | -0.445 |
hester | -0.426 |
Nebula | -0.405 |
Token | , |
Token ID | 11 |
Feature activation | +5.16e-01 |
Pos logit contributions | |
ura | +0.321 |
uable | +0.290 |
pora | +0.281 |
veland | +0.278 |
oto | +0.260 |
Neg logit contributions | |
ォ | -0.461 |
kefeller | -0.416 |
ruary | -0.391 |
hester | -0.372 |
intern | -0.348 |
Token | over |
Token ID | 625 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
ura | +0.410 |
uable | +0.373 |
pora | +0.363 |
veland | +0.358 |
oto | +0.338 |
Neg logit contributions | |
ォ | -0.501 |
kefeller | -0.448 |
ruary | -0.421 |
hester | -0.398 |
Nebula | -0.371 |
Token | Yaz |
Token ID | 35856 |
Feature activation | +9.63e+00 |
Pos logit contributions | |
ォ | +0.955 |
kefeller | +0.855 |
ruary | +0.800 |
hester | +0.754 |
Nebula | +0.707 |
Neg logit contributions | |
ura | -0.834 |
uable | -0.761 |
pora | -0.743 |
veland | -0.735 |
oto | -0.692 |
Token | idi |
Token ID | 19830 |
Feature activation | +9.94e-02 |
Pos logit contributions | |
ura | +6.293 |
uable | +5.480 |
pora | +5.323 |
oto | +5.019 |
veland | +4.911 |
Neg logit contributions | |
ォ | -10.606 |
kefeller | -9.625 |
ruary | -8.970 |
hester | -8.875 |
�� | -8.410 |
Token | refugees |
Token ID | 8015 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
ura | +0.080 |
uable | +0.073 |
pora | +0.072 |
veland | +0.071 |
oto | +0.067 |
Neg logit contributions | |
ォ | -0.095 |
kefeller | -0.085 |
ruary | -0.080 |
hester | -0.075 |
Nebula | -0.070 |
Token | hiding |
Token ID | 11816 |
Feature activation | +9.97e-01 |
Pos logit contributions | |
ura | +0.968 |
uable | +0.867 |
pora | +0.841 |
veland | +0.830 |
oto | +0.770 |
Neg logit contributions | |
ォ | -1.545 |
kefeller | -1.403 |
ruary | -1.327 |
hester | -1.263 |
Nebula | -1.196 |
Token | on |
Token ID | 319 |
Feature activation | +2.23e-01 |
Pos logit contributions | |
ura | +0.650 |
uable | +0.579 |
pora | +0.561 |
veland | +0.553 |
oto | +0.514 |
Neg logit contributions | |
ォ | -1.109 |
kefeller | -1.010 |
ruary | -0.955 |
hester | -0.910 |
Nebula | -0.862 |
Token | Mount |
Token ID | 5628 |
Feature activation | -2.62e+00 |
Pos logit contributions | |
ura | +0.182 |
uable | +0.166 |
pora | +0.162 |
veland | +0.160 |
oto | +0.151 |
Neg logit contributions | |
ォ | -0.211 |
kefeller | -0.188 |
ruary | -0.176 |
hester | -0.167 |
Nebula | -0.156 |
Token | ahan |
Token ID | 19210 |
Feature activation | +2.45e+00 |
Pos logit contributions | |
ura | +0.920 |
uable | +0.831 |
pora | +0.812 |
veland | +0.801 |
oto | +0.752 |
Neg logit contributions | |
ォ | -1.187 |
kefeller | -1.069 |
ruary | -1.003 |
hester | -0.950 |
Nebula | -0.895 |
Token | , |
Token ID | 11 |
Feature activation | +9.78e-01 |
Pos logit contributions | |
ura | +1.668 |
uable | +1.444 |
pora | +1.436 |
veland | +1.393 |
oto | +1.303 |
Neg logit contributions | |
ォ | -2.702 |
kefeller | -2.454 |
ruary | -2.291 |
hester | -2.204 |
Nebula | -2.075 |
Token | Tab |
Token ID | 16904 |
Feature activation | +1.92e+00 |
Pos logit contributions | |
ura | +0.780 |
uable | +0.709 |
pora | +0.693 |
veland | +0.684 |
oto | +0.643 |
Neg logit contributions | |
ォ | -0.944 |
kefeller | -0.846 |
ruary | -0.793 |
hester | -0.750 |
Nebula | -0.703 |
Token | riz |
Token ID | 47847 |
Feature activation | -3.87e-01 |
Pos logit contributions | |
ura | +1.797 |
uable | +1.642 |
pora | +1.615 |
veland | +1.578 |
aur | +1.519 |
Neg logit contributions | |
ォ | -1.626 |
kefeller | -1.415 |
ruary | -1.293 |
hester | -1.224 |
Nebula | -1.155 |
Token | , |
Token ID | 11 |
Feature activation | +8.25e-01 |
Pos logit contributions | |
ォ | +0.431 |
kefeller | +0.391 |
ruary | +0.368 |
hester | +0.352 |
Nebula | +0.332 |
Neg logit contributions | |
ura | -0.260 |
uable | -0.228 |
pora | -0.224 |
veland | -0.217 |
aur | -0.203 |
Token | Yaz |
Token ID | 35856 |
Feature activation | +9.62e+00 |
Pos logit contributions | |
ura | +0.661 |
uable | +0.601 |
pora | +0.587 |
veland | +0.580 |
oto | +0.545 |
Neg logit contributions | |
ォ | -0.794 |
kefeller | -0.712 |
ruary | -0.667 |
hester | -0.630 |
Nebula | -0.591 |
Token | d |
Token ID | 67 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
ura | +7.521 |
uable | +6.601 |
pora | +6.560 |
veland | +6.164 |
oto | +6.066 |
Neg logit contributions | |
ォ | -9.342 |
kefeller | -8.313 |
ruary | -7.607 |
hester | -7.475 |
�� | -7.140 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
ォ | +2.324 |
kefeller | +2.106 |
ruary | +1.990 |
hester | +1.891 |
Nebula | +1.789 |
Neg logit contributions | |
ura | -1.546 |
uable | -1.395 |
pora | -1.352 |
veland | -1.338 |
oto | -1.243 |
Token | Shir |
Token ID | 21972 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
ォ | +0.092 |
kefeller | +0.082 |
ruary | +0.077 |
hester | +0.072 |
Nebula | +0.068 |
Neg logit contributions | |
ura | -0.084 |
uable | -0.077 |
pora | -0.075 |
veland | -0.075 |
oto | -0.071 |
Token | az |
Token ID | 1031 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
ura | +0.698 |
uable | +0.583 |
pora | +0.563 |
veland | +0.547 |
oto | +0.488 |
Neg logit contributions | |
ォ | -1.956 |
kefeller | -1.812 |
ruary | -1.722 |
hester | -1.659 |
Nebula | -1.588 |
Token | , |
Token ID | 11 |
Feature activation | +6.64e-01 |
Pos logit contributions | |
ura | +2.128 |
pora | +1.830 |
uable | +1.813 |
veland | +1.745 |
aur | +1.648 |
Neg logit contributions | |
ォ | -3.574 |
kefeller | -3.272 |
ruary | -3.056 |
hester | -2.943 |
�� | -2.783 |
Token | kid |
Token ID | 5141 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
ォ | +0.300 |
kefeller | +0.271 |
ruary | +0.255 |
hester | +0.241 |
Nebula | +0.228 |
Neg logit contributions | |
ura | -0.219 |
uable | -0.199 |
pora | -0.194 |
veland | -0.191 |
oto | -0.179 |
Token | ? |
Token ID | 30 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
ura | +1.696 |
uable | +1.485 |
pora | +1.453 |
veland | +1.416 |
aur | +1.315 |
Neg logit contributions | |
ォ | -3.176 |
kefeller | -2.931 |
ruary | -2.763 |
hester | -2.647 |
Nebula | -2.517 |
Token |
|
Token ID | 198 |
Feature activation | -4.98e-02 |
Pos logit contributions | |
ォ | +0.178 |
kefeller | +0.163 |
ruary | +0.153 |
hester | +0.145 |
intern | +0.136 |
Neg logit contributions | |
ura | -0.123 |
uable | -0.110 |
pora | -0.106 |
veland | -0.106 |
aur | -0.099 |
Token |
|
Token ID | 198 |
Feature activation | +2.44e-01 |
Pos logit contributions | |
ォ | +0.048 |
kefeller | +0.043 |
ruary | +0.040 |
hester | +0.038 |
intern | +0.036 |
Neg logit contributions | |
ura | -0.039 |
uable | -0.036 |
pora | -0.035 |
veland | -0.035 |
oto | -0.032 |
Token | Daniel |
Token ID | 19962 |
Feature activation | -4.37e+00 |
Pos logit contributions | |
ura | +0.191 |
uable | +0.172 |
pora | +0.166 |
veland | +0.165 |
aur | +0.156 |
Neg logit contributions | |
ォ | -0.243 |
kefeller | -0.219 |
ruary | -0.205 |
hester | -0.194 |
Nebula | -0.182 |
Token | Yaz |
Token ID | 35856 |
Feature activation | +9.57e+00 |
Pos logit contributions | |
ォ | +4.607 |
kefeller | +4.092 |
ruary | +3.911 |
hester | +3.733 |
Nebula | +3.679 |
Neg logit contributions | |
ura | -2.846 |
uable | -2.663 |
pora | -2.555 |
veland | -2.531 |
irs | -2.291 |
Token | beck |
Token ID | 27343 |
Feature activation | +3.90e-01 |
Pos logit contributions | |
ura | +7.827 |
pora | +6.980 |
uable | +6.977 |
veland | +6.963 |
oto | +6.537 |
Neg logit contributions | |
ォ | -8.932 |
kefeller | -7.819 |
ruary | -7.341 |
hester | -6.851 |
�� | -6.663 |
Token | : |
Token ID | 25 |
Feature activation | +6.72e-02 |
Pos logit contributions | |
ura | +0.266 |
uable | +0.239 |
pora | +0.232 |
veland | +0.228 |
oto | +0.212 |
Neg logit contributions | |
ォ | -0.420 |
kefeller | -0.381 |
ruary | -0.360 |
hester | -0.343 |
Nebula | -0.325 |
Token | No |
Token ID | 1400 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
ura | +0.060 |
uable | +0.055 |
pora | +0.054 |
veland | +0.054 |
oto | +0.051 |
Neg logit contributions | |
ォ | -0.058 |
kefeller | -0.051 |
ruary | -0.048 |
hester | -0.045 |
Nebula | -0.042 |
Token | , |
Token ID | 11 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
ura | +0.703 |
uable | +0.625 |
pora | +0.606 |
veland | +0.599 |
oto | +0.558 |
Neg logit contributions | |
ォ | -1.109 |
kefeller | -1.014 |
ruary | -0.952 |
hester | -0.908 |
Nebula | -0.854 |
Token | I |
Token ID | 314 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
ura | +0.897 |
uable | +0.820 |
pora | +0.800 |
veland | +0.791 |
oto | +0.749 |
Neg logit contributions | |
ォ | -0.947 |
kefeller | -0.845 |
ruary | -0.787 |
hester | -0.740 |
intern | -0.686 |
Token | author |
Token ID | 1772 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
ura | +0.214 |
uable | +0.196 |
pora | +0.191 |
veland | +0.187 |
aur | +0.179 |
Neg logit contributions | |
ォ | -0.228 |
kefeller | -0.204 |
ruary | -0.191 |
hester | -0.180 |
intern | -0.166 |
Token |
|
Token ID | 198 |
Feature activation | +4.76e-01 |
Pos logit contributions | |
ォ | +1.223 |
kefeller | +1.113 |
ruary | +1.047 |
hester | +0.992 |
Nebula | +0.934 |
Neg logit contributions | |
ura | -0.831 |
uable | -0.745 |
pora | -0.726 |
veland | -0.714 |
aur | -0.670 |
Token |
|
Token ID | 198 |
Feature activation | +5.58e-01 |
Pos logit contributions | |
ura | +0.369 |
uable | +0.340 |
pora | +0.330 |
veland | +0.325 |
oto | +0.303 |
Neg logit contributions | |
ォ | -0.465 |
kefeller | -0.415 |
ruary | -0.394 |
hester | -0.373 |
Nebula | -0.354 |
Token | Lu |
Token ID | 25596 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
ura | +0.478 |
uable | +0.437 |
pora | +0.427 |
veland | +0.422 |
oto | +0.400 |
Neg logit contributions | |
ォ | -0.507 |
kefeller | -0.453 |
ruary | -0.422 |
hester | -0.396 |
Nebula | -0.370 |
Token | is |
Token ID | 271 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
ォ | +0.162 |
kefeller | +0.147 |
ruary | +0.139 |
hester | +0.133 |
Nebula | +0.125 |
Neg logit contributions | |
ura | -0.101 |
uable | -0.091 |
pora | -0.088 |
veland | -0.087 |
oto | -0.080 |
Token | Moreno |
Token ID | 43269 |
Feature activation | +9.55e+00 |
Pos logit contributions | |
ura | +1.848 |
uable | +1.675 |
pora | +1.640 |
veland | +1.612 |
oto | +1.535 |
Neg logit contributions | |
ォ | -2.054 |
kefeller | -1.848 |
ruary | -1.726 |
hester | -1.619 |
intern | -1.518 |
Token | – |
Token ID | 784 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
ura | +6.708 |
pora | +5.804 |
uable | +5.798 |
veland | +5.709 |
oto | +5.459 |
Neg logit contributions | |
ォ | -9.547 |
kefeller | -8.811 |
ruary | -8.350 |
hester | -7.758 |
�� | -7.432 |
Token | Instit |
Token ID | 37931 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
ォ | +0.148 |
kefeller | +0.131 |
ruary | +0.122 |
hester | +0.115 |
Nebula | +0.107 |
Neg logit contributions | |
ura | -0.148 |
uable | -0.136 |
pora | -0.133 |
veland | -0.132 |
oto | -0.125 |
Token | uto |
Token ID | 9390 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
ォ | +2.060 |
kefeller | +1.873 |
ruary | +1.772 |
hester | +1.683 |
intern | +1.598 |
Neg logit contributions | |
ura | -1.268 |
uable | -1.144 |
pora | -1.116 |
veland | -1.096 |
oto | -1.011 |
Token | de |
Token ID | 390 |
Feature activation | -9.97e-01 |
Pos logit contributions | |
ura | +1.740 |
uable | +1.585 |
pora | +1.557 |
veland | +1.539 |
oto | +1.455 |
Neg logit contributions | |
ォ | -1.835 |
kefeller | -1.637 |
ruary | -1.525 |
hester | -1.435 |
Nebula | -1.333 |
Token | Pol |
Token ID | 2165 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
ォ | +0.891 |
kefeller | +0.788 |
ruary | +0.738 |
hester | +0.692 |
Nebula | +0.651 |
Neg logit contributions | |
ura | -0.859 |
uable | -0.794 |
pora | -0.772 |
veland | -0.766 |
aur | -0.723 |
Token |
|
Token ID | 198 |
Feature activation | -5.36e-01 |
Pos logit contributions | |
ォ | +0.681 |
kefeller | +0.617 |
ruary | +0.579 |
hester | +0.549 |
Nebula | +0.515 |
Neg logit contributions | |
ura | -0.510 |
uable | -0.462 |
pora | -0.448 |
veland | -0.444 |
oto | -0.416 |
Token |
|
Token ID | 198 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
ォ | +0.511 |
kefeller | +0.453 |
ruary | +0.430 |
hester | +0.407 |
intern | +0.389 |
Neg logit contributions | |
ura | -0.423 |
uable | -0.392 |
pora | -0.383 |
veland | -0.374 |
oto | -0.349 |
Token | Bron |
Token ID | 18760 |
Feature activation | +3.43e-01 |
Pos logit contributions | |
ォ | +0.118 |
kefeller | +0.104 |
ruary | +0.097 |
hester | +0.091 |
intern | +0.085 |
Neg logit contributions | |
ura | -0.119 |
uable | -0.109 |
pora | -0.107 |
veland | -0.106 |
oto | -0.100 |
Token | cos |
Token ID | 6966 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
ura | +0.205 |
uable | +0.182 |
pora | +0.176 |
veland | +0.167 |
teenth | +0.156 |
Neg logit contributions | |
ォ | -0.394 |
kefeller | -0.363 |
ruary | -0.343 |
hester | -0.330 |
intern | -0.317 |
Token | coach |
Token ID | 3985 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
ura | +0.262 |
uable | +0.239 |
pora | +0.233 |
veland | +0.230 |
oto | +0.216 |
Neg logit contributions | |
ォ | -0.326 |
kefeller | -0.292 |
ruary | -0.275 |
hester | -0.260 |
intern | -0.245 |
Token | Vance |
Token ID | 40154 |
Feature activation | +9.51e+00 |
Pos logit contributions | |
ura | +2.035 |
uable | +1.871 |
pora | +1.841 |
veland | +1.813 |
oto | +1.721 |
Neg logit contributions | |
ォ | -1.883 |
kefeller | -1.670 |
ruary | -1.543 |
hester | -1.446 |
Nebula | -1.347 |
Token | Joseph |
Token ID | 7212 |
Feature activation | +3.17e-01 |
Pos logit contributions | |
ura | +7.223 |
uable | +6.460 |
veland | +6.300 |
pora | +6.255 |
aur | +6.029 |
Neg logit contributions | |
ォ | -9.474 |
kefeller | -8.456 |
ruary | -7.976 |
hester | -7.453 |
�� | -7.300 |
Token | said |
Token ID | 531 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ura | +0.252 |
uable | +0.230 |
pora | +0.224 |
veland | +0.221 |
oto | +0.208 |
Neg logit contributions | |
ォ | -0.306 |
kefeller | -0.275 |
ruary | -0.258 |
hester | -0.243 |
Nebula | -0.228 |
Token | Monday |
Token ID | 3321 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
ura | +1.120 |
uable | +1.020 |
pora | +0.993 |
veland | +0.984 |
oto | +0.926 |
Neg logit contributions | |
ォ | -1.325 |
kefeller | -1.191 |
ruary | -1.112 |
hester | -1.051 |
Nebula | -0.983 |
Token | that |
Token ID | 326 |
Feature activation | +2.65e-01 |
Pos logit contributions | |
ura | +1.282 |
uable | +1.159 |
veland | +1.118 |
pora | +1.116 |
oto | +1.049 |
Neg logit contributions | |
ォ | -1.644 |
kefeller | -1.500 |
ruary | -1.395 |
hester | -1.329 |
Nebula | -1.245 |
Token | the |
Token ID | 262 |
Feature activation | +2.95e-01 |
Pos logit contributions | |
ura | +0.220 |
uable | +0.201 |
pora | +0.196 |
veland | +0.194 |
oto | +0.183 |
Neg logit contributions | |
ォ | -0.247 |
kefeller | -0.221 |
ruary | -0.207 |
hester | -0.195 |
Nebula | -0.183 |
Token | over |
Token ID | 625 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
ura | +1.307 |
uable | +1.170 |
pora | +1.135 |
veland | +1.121 |
oto | +1.050 |
Neg logit contributions | |
ォ | -1.938 |
kefeller | -1.757 |
ruary | -1.657 |
hester | -1.574 |
Nebula | -1.489 |
Token | the |
Token ID | 262 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
ura | +0.125 |
uable | +0.112 |
pora | +0.109 |
veland | +0.108 |
oto | +0.100 |
Neg logit contributions | |
ォ | -0.187 |
kefeller | -0.169 |
ruary | -0.160 |
hester | -0.152 |
Nebula | -0.143 |
Token | team |
Token ID | 1074 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
ura | +1.287 |
uable | +1.164 |
pora | +1.134 |
veland | +1.123 |
oto | +1.064 |
Neg logit contributions | |
ォ | -1.605 |
kefeller | -1.438 |
ruary | -1.356 |
hester | -1.273 |
intern | -1.188 |
Token | radio |
Token ID | 5243 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
ura | +1.151 |
uable | +1.036 |
pora | +1.007 |
veland | +0.993 |
oto | +0.930 |
Neg logit contributions | |
ォ | -1.663 |
kefeller | -1.506 |
ruary | -1.417 |
hester | -1.348 |
Nebula | -1.270 |
Token | in |
Token ID | 287 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
ura | +0.146 |
uable | +0.132 |
pora | +0.128 |
veland | +0.127 |
oto | +0.118 |
Neg logit contributions | |
ォ | -0.212 |
kefeller | -0.192 |
ruary | -0.181 |
hester | -0.172 |
Nebula | -0.162 |
Token | FP |
Token ID | 31459 |
Feature activation | +9.41e+00 |
Pos logit contributions | |
ura | +1.716 |
uable | +1.566 |
pora | +1.533 |
veland | +1.520 |
oto | +1.432 |
Neg logit contributions | |
ォ | -1.855 |
kefeller | -1.652 |
ruary | -1.536 |
hester | -1.448 |
intern | -1.349 |
Token | 1 |
Token ID | 16 |
Feature activation | +7.53e-01 |
Pos logit contributions | |
ura | +7.239 |
pora | +6.239 |
uable | +6.218 |
veland | +6.099 |
oto | +5.894 |
Neg logit contributions | |
ォ | -9.161 |
kefeller | -8.477 |
ruary | -7.673 |
hester | -7.478 |
�� | -7.024 |
Token | at |
Token ID | 379 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
ura | +0.545 |
uable | +0.492 |
pora | +0.478 |
veland | +0.472 |
oto | +0.440 |
Neg logit contributions | |
ォ | -0.781 |
kefeller | -0.706 |
ruary | -0.667 |
hester | -0.633 |
Nebula | -0.598 |
Token | Suz |
Token ID | 22691 |
Feature activation | +8.17e-01 |
Pos logit contributions | |
ura | +0.257 |
uable | +0.234 |
pora | +0.229 |
veland | +0.226 |
oto | +0.213 |
Neg logit contributions | |
ォ | -0.299 |
kefeller | -0.268 |
ruary | -0.251 |
hester | -0.237 |
Nebula | -0.222 |
Token | uka |
Token ID | 14852 |
Feature activation | +4.95e-01 |
Pos logit contributions | |
ura | +0.641 |
uable | +0.581 |
pora | +0.566 |
veland | +0.559 |
oto | +0.527 |
Neg logit contributions | |
ォ | -0.801 |
kefeller | -0.719 |
ruary | -0.675 |
hester | -0.638 |
Nebula | -0.601 |
Token | to |
Token ID | 284 |
Feature activation | +5.62e-01 |
Pos logit contributions | |
ura | +0.359 |
uable | +0.326 |
pora | +0.316 |
veland | +0.312 |
aur | +0.290 |
Neg logit contributions | |
ォ | -0.512 |
kefeller | -0.462 |
ruary | -0.437 |
hester | -0.414 |
Nebula | -0.392 |
Token | - |
Token ID | 12 |
Feature activation | +4.91e-01 |
Pos logit contributions | |
ォ | +2.075 |
kefeller | +1.886 |
ruary | +1.782 |
hester | +1.698 |
Nebula | +1.617 |
Neg logit contributions | |
ura | -1.294 |
uable | -1.152 |
pora | -1.112 |
veland | -1.107 |
aur | -1.021 |
Token | time |
Token ID | 2435 |
Feature activation | -4.26e-01 |
Pos logit contributions | |
ura | +0.423 |
uable | +0.387 |
pora | +0.378 |
veland | +0.376 |
aur | +0.356 |
Neg logit contributions | |
ォ | -0.445 |
kefeller | -0.395 |
ruary | -0.367 |
hester | -0.346 |
�� | -0.323 |
Token | users |
Token ID | 2985 |
Feature activation | +2.64e+00 |
Pos logit contributions | |
ォ | +0.422 |
kefeller | +0.380 |
ruary | +0.357 |
hester | +0.338 |
Nebula | +0.318 |
Neg logit contributions | |
ura | -0.329 |
uable | -0.298 |
pora | -0.291 |
veland | -0.287 |
oto | -0.269 |
Token | . |
Token ID | 13 |
Feature activation | -6.49e-01 |
Pos logit contributions | |
ura | +1.725 |
uable | +1.527 |
pora | +1.485 |
veland | +1.457 |
aur | +1.354 |
Neg logit contributions | |
ォ | -2.932 |
kefeller | -2.673 |
ruary | -2.525 |
hester | -2.421 |
Nebula | -2.295 |
Token | Daniel |
Token ID | 7806 |
Feature activation | -4.86e+00 |
Pos logit contributions | |
ォ | +0.555 |
kefeller | +0.486 |
ruary | +0.457 |
hester | +0.427 |
Nebula | +0.403 |
Neg logit contributions | |
ura | -0.585 |
uable | -0.541 |
pora | -0.530 |
veland | -0.524 |
oto | -0.495 |
Token | Yaz |
Token ID | 35856 |
Feature activation | +9.39e+00 |
Pos logit contributions | |
ォ | +4.373 |
kefeller | +3.882 |
ruary | +3.627 |
hester | +3.417 |
Nebula | +3.242 |
Neg logit contributions | |
ura | -4.046 |
uable | -3.727 |
pora | -3.651 |
veland | -3.632 |
oto | -3.386 |
Token | beck |
Token ID | 27343 |
Feature activation | +3.06e-01 |
Pos logit contributions | |
ura | +7.607 |
uable | +6.757 |
pora | +6.681 |
veland | +6.533 |
oto | +6.432 |
Neg logit contributions | |
ォ | -8.799 |
kefeller | -7.647 |
ruary | -7.290 |
hester | -6.848 |
Nebula | -6.524 |
Token | is |
Token ID | 318 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
ura | +0.226 |
uable | +0.204 |
pora | +0.198 |
veland | +0.196 |
oto | +0.183 |
Neg logit contributions | |
ォ | -0.314 |
kefeller | -0.284 |
ruary | -0.267 |
hester | -0.253 |
Nebula | -0.239 |
Token | an |
Token ID | 281 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
ura | +1.558 |
uable | +1.419 |
pora | +1.376 |
veland | +1.371 |
aur | +1.291 |
Neg logit contributions | |
ォ | -1.843 |
kefeller | -1.650 |
ruary | -1.549 |
hester | -1.457 |
Nebula | -1.360 |
Token | entrepreneur |
Token ID | 19500 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
ォ | +1.075 |
kefeller | +0.971 |
ruary | +0.905 |
hester | +0.865 |
intern | +0.815 |
Neg logit contributions | |
ura | -0.907 |
uable | -0.823 |
pora | -0.812 |
veland | -0.798 |
oto | -0.750 |
Token | behind |
Token ID | 2157 |
Feature activation | -2.04e+00 |
Pos logit contributions | |
ォ | +1.410 |
kefeller | +1.279 |
ruary | +1.213 |
hester | +1.157 |
intern | +1.098 |
Neg logit contributions | |
ura | -0.873 |
uable | -0.783 |
pora | -0.762 |
veland | -0.747 |
oto | -0.695 |
Token | mo |
Token ID | 5908 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
ura | +0.704 |
uable | +0.612 |
pora | +0.588 |
veland | +0.576 |
oto | +0.516 |
Neg logit contributions | |
ォ | -1.679 |
kefeller | -1.546 |
ruary | -1.473 |
hester | -1.414 |
Nebula | -1.349 |
Token | L |
Token ID | 406 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
ura | +2.806 |
uable | +2.557 |
pora | +2.497 |
veland | +2.474 |
oto | +2.344 |
Neg logit contributions | |
ォ | -3.049 |
kefeller | -2.712 |
ruary | -2.538 |
hester | -2.392 |
Nebula | -2.232 |
Token | asso |
Token ID | 28372 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
ura | +0.192 |
uable | +0.176 |
pora | +0.172 |
veland | +0.171 |
oto | +0.159 |
Neg logit contributions | |
ォ | -0.221 |
kefeller | -0.200 |
ruary | -0.186 |
hester | -0.177 |
intern | -0.165 |
Token | and |
Token ID | 290 |
Feature activation | -6.66e-02 |
Pos logit contributions | |
ura | +2.201 |
uable | +1.942 |
pora | +1.886 |
veland | +1.869 |
oto | +1.751 |
Neg logit contributions | |
ォ | -3.523 |
kefeller | -3.206 |
ruary | -3.042 |
hester | -2.880 |
intern | -2.725 |
Token | Lenin |
Token ID | 22899 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
ォ | +0.061 |
kefeller | +0.054 |
ruary | +0.051 |
hester | +0.048 |
Nebula | +0.044 |
Neg logit contributions | |
ura | -0.056 |
uable | -0.052 |
pora | -0.050 |
veland | -0.050 |
oto | -0.047 |
Token | Moreno |
Token ID | 43269 |
Feature activation | +9.33e+00 |
Pos logit contributions | |
ォ | +4.394 |
kefeller | +3.971 |
ruary | +3.728 |
hester | +3.533 |
intern | +3.332 |
Neg logit contributions | |
ura | -3.787 |
uable | -3.511 |
veland | -3.425 |
pora | -3.391 |
teenth | -3.170 |
Token | , |
Token ID | 11 |
Feature activation | +8.73e-01 |
Pos logit contributions | |
ura | +5.660 |
pora | +4.858 |
uable | +4.767 |
veland | +4.720 |
oto | +4.462 |
Neg logit contributions | |
ォ | -10.417 |
kefeller | -9.417 |
ruary | -8.822 |
hester | -8.527 |
�� | -8.256 |
Token | scheduled |
Token ID | 7530 |
Feature activation | +3.64e+00 |
Pos logit contributions | |
ura | +0.707 |
uable | +0.645 |
pora | +0.629 |
veland | +0.622 |
oto | +0.585 |
Neg logit contributions | |
ォ | -0.833 |
kefeller | -0.745 |
ruary | -0.698 |
hester | -0.659 |
Nebula | -0.617 |
Token | for |
Token ID | 329 |
Feature activation | +8.24e-01 |
Pos logit contributions | |
ura | +2.168 |
uable | +1.897 |
pora | +1.854 |
veland | +1.815 |
oto | +1.685 |
Neg logit contributions | |
ォ | -4.252 |
kefeller | -3.870 |
ruary | -3.621 |
hester | -3.493 |
Nebula | -3.342 |
Token | Sunday |
Token ID | 3502 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
ura | +0.705 |
uable | +0.646 |
pora | +0.632 |
veland | +0.625 |
oto | +0.590 |
Neg logit contributions | |
ォ | -0.746 |
kefeller | -0.665 |
ruary | -0.622 |
hester | -0.584 |
Nebula | -0.546 |
Token | . |
Token ID | 13 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
ura | +1.277 |
uable | +1.134 |
pora | +1.104 |
veland | +1.083 |
oto | +1.013 |
Neg logit contributions | |
ォ | -2.043 |
kefeller | -1.857 |
ruary | -1.740 |
hester | -1.670 |
Nebula | -1.575 |
Token | Assange |
Token ID | 21882 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
ura | +0.365 |
uable | +0.336 |
pora | +0.329 |
veland | +0.325 |
oto | +0.309 |
Neg logit contributions | |
ォ | -0.349 |
kefeller | -0.308 |
ruary | -0.287 |
hester | -0.268 |
Nebula | -0.249 |
Token | if |
Token ID | 611 |
Feature activation | +7.48e-01 |
Pos logit contributions | |
ura | +2.687 |
uable | +2.375 |
pora | +2.313 |
veland | +2.253 |
oto | +2.115 |
Neg logit contributions | |
ォ | -4.622 |
kefeller | -4.173 |
ruary | -3.918 |
hester | -3.759 |
�� | -3.569 |
Token | he |
Token ID | 339 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
ura | +0.630 |
uable | +0.576 |
pora | +0.563 |
veland | +0.556 |
oto | +0.525 |
Neg logit contributions | |
ォ | -0.692 |
kefeller | -0.615 |
ruary | -0.575 |
hester | -0.542 |
Nebula | -0.505 |
Token | wins |
Token ID | 7864 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
ura | +1.258 |
uable | +1.141 |
pora | +1.110 |
veland | +1.098 |
oto | +1.034 |
Neg logit contributions | |
ォ | -1.552 |
kefeller | -1.399 |
ruary | -1.309 |
hester | -1.238 |
Nebula | -1.157 |
Token | . |
Token ID | 13 |
Feature activation | -3.00e-01 |
Pos logit contributions | |
ura | +0.859 |
uable | +0.779 |
pora | +0.755 |
veland | +0.745 |
oto | +0.707 |
Neg logit contributions | |
ォ | -1.096 |
kefeller | -0.980 |
ruary | -0.920 |
hester | -0.873 |
Nebula | -0.815 |
Token | Moreno |
Token ID | 43269 |
Feature activation | +9.30e+00 |
Pos logit contributions | |
ォ | +0.271 |
kefeller | +0.242 |
ruary | +0.226 |
hester | +0.212 |
Nebula | +0.199 |
Neg logit contributions | |
ura | -0.257 |
uable | -0.236 |
pora | -0.231 |
veland | -0.228 |
oto | -0.215 |
Token | , |
Token ID | 11 |
Feature activation | +6.73e-01 |
Pos logit contributions | |
ura | +5.958 |
uable | +5.170 |
pora | +5.107 |
veland | +5.065 |
oto | +4.752 |
Neg logit contributions | |
ォ | -9.974 |
kefeller | -9.129 |
ruary | -8.557 |
hester | -8.116 |
�� | -8.071 |
Token | meanwhile |
Token ID | 15066 |
Feature activation | +2.69e-01 |
Pos logit contributions | |
ura | +0.522 |
uable | +0.473 |
pora | +0.461 |
veland | +0.456 |
oto | +0.428 |
Neg logit contributions | |
ォ | -0.665 |
kefeller | -0.597 |
ruary | -0.561 |
hester | -0.530 |
Nebula | -0.498 |
Token | , |
Token ID | 11 |
Feature activation | +6.46e-01 |
Pos logit contributions | |
ura | +0.198 |
uable | +0.180 |
pora | +0.174 |
veland | +0.172 |
oto | +0.161 |
Neg logit contributions | |
ォ | -0.274 |
kefeller | -0.248 |
ruary | -0.233 |
hester | -0.222 |
Nebula | -0.210 |
Token | served |
Token ID | 4983 |
Feature activation | +7.80e-01 |
Pos logit contributions | |
ura | +0.504 |
uable | +0.457 |
pora | +0.446 |
veland | +0.441 |
oto | +0.414 |
Neg logit contributions | |
ォ | -0.635 |
kefeller | -0.571 |
ruary | -0.536 |
hester | -0.507 |
Nebula | -0.476 |
Token | as |
Token ID | 355 |
Feature activation | -8.61e-01 |
Pos logit contributions | |
ura | +0.525 |
uable | +0.469 |
pora | +0.455 |
veland | +0.449 |
oto | +0.416 |
Neg logit contributions | |
ォ | -0.849 |
kefeller | -0.772 |
ruary | -0.730 |
hester | -0.695 |
Nebula | -0.658 |
Token | ing |
Token ID | 278 |
Feature activation | +4.16e-01 |
Pos logit contributions | |
ォ | +0.143 |
kefeller | +0.122 |
ruary | +0.110 |
hester | +0.101 |
Nebula | +0.090 |
Neg logit contributions | |
ura | -0.234 |
uable | -0.219 |
pora | -0.215 |
veland | -0.213 |
oto | -0.204 |
Token | ? |
Token ID | 30 |
Feature activation | -5.88e-02 |
Pos logit contributions | |
ura | +0.278 |
uable | +0.249 |
pora | +0.242 |
veland | +0.238 |
oto | +0.221 |
Neg logit contributions | |
ォ | -0.454 |
kefeller | -0.413 |
ruary | -0.391 |
hester | -0.371 |
Nebula | -0.352 |
Token |
|
Token ID | 198 |
Feature activation | +3.05e-01 |
Pos logit contributions | |
ォ | +0.053 |
kefeller | +0.047 |
ruary | +0.044 |
hester | +0.041 |
Nebula | +0.039 |
Neg logit contributions | |
ura | -0.050 |
uable | -0.046 |
pora | -0.045 |
veland | -0.045 |
oto | -0.042 |
Token |
|
Token ID | 198 |
Feature activation | +5.76e-01 |
Pos logit contributions | |
ura | +0.238 |
uable | +0.219 |
pora | +0.214 |
veland | +0.210 |
oto | +0.195 |
Neg logit contributions | |
ォ | -0.296 |
kefeller | -0.264 |
ruary | -0.250 |
hester | -0.237 |
intern | -0.225 |
Token | David |
Token ID | 11006 |
Feature activation | -5.22e+00 |
Pos logit contributions | |
ura | +0.501 |
uable | +0.461 |
pora | +0.451 |
veland | +0.446 |
oto | +0.421 |
Neg logit contributions | |
ォ | -0.512 |
kefeller | -0.454 |
ruary | -0.423 |
hester | -0.397 |
intern | -0.371 |
Token | Cron |
Token ID | 31683 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
ォ | +4.638 |
kefeller | +4.118 |
ruary | +3.863 |
hester | +3.634 |
Nebula | +3.404 |
Neg logit contributions | |
ura | -4.405 |
uable | -4.092 |
pora | -4.018 |
veland | -3.974 |
aur | -3.700 |
Token | in |
Token ID | 259 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
ォ | +9.432 |
kefeller | +8.819 |
ruary | +8.143 |
hester | +7.808 |
intern | +7.639 |
Neg logit contributions | |
ura | -8.333 |
uable | -7.668 |
pora | -7.547 |
veland | -7.464 |
irs | -6.921 |
Token | is |
Token ID | 318 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
ura | +1.266 |
uable | +1.138 |
pora | +1.106 |
veland | +1.094 |
oto | +1.027 |
Neg logit contributions | |
ォ | -1.782 |
kefeller | -1.614 |
ruary | -1.521 |
hester | -1.438 |
Nebula | -1.357 |
Token | the |
Token ID | 262 |
Feature activation | +7.73e-01 |
Pos logit contributions | |
ura | +1.681 |
uable | +1.536 |
pora | +1.484 |
veland | +1.477 |
aur | +1.404 |
Neg logit contributions | |
ォ | -1.881 |
kefeller | -1.669 |
ruary | -1.571 |
hester | -1.474 |
Nebula | -1.368 |
Token | author |
Token ID | 1772 |
Feature activation | -5.47e-01 |
Pos logit contributions | |
ura | +0.689 |
uable | +0.634 |
pora | +0.619 |
veland | +0.613 |
oto | +0.582 |
Neg logit contributions | |
ォ | -0.674 |
kefeller | -0.596 |
ruary | -0.556 |
hester | -0.521 |
intern | -0.482 |
Token | of |
Token ID | 286 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
ォ | +0.636 |
kefeller | +0.582 |
ruary | +0.552 |
hester | +0.527 |
intern | +0.500 |
Neg logit contributions | |
ura | -0.332 |
uable | -0.293 |
pora | -0.283 |
veland | -0.278 |
aur | -0.259 |
Token | Os |
Token ID | 8834 |
Feature activation | +7.24e+00 |
Pos logit contributions | |
ura | +0.681 |
uable | +0.623 |
pora | +0.609 |
veland | +0.602 |
oto | +0.571 |
Neg logit contributions | |
ォ | -0.707 |
kefeller | -0.630 |
ruary | -0.588 |
hester | -0.552 |
intern | -0.514 |
Token | am |
Token ID | 321 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
ura | +5.405 |
pora | +4.783 |
uable | +4.739 |
veland | +4.609 |
oto | +4.426 |
Neg logit contributions | |
ォ | -7.277 |
kefeller | -6.521 |
ruary | -6.118 |
hester | -5.762 |
�� | -5.589 |
Token | , |
Token ID | 11 |
Feature activation | +7.01e-01 |
Pos logit contributions | |
ura | +1.757 |
uable | +1.548 |
pora | +1.508 |
veland | +1.468 |
oto | +1.384 |
Neg logit contributions | |
ォ | -3.014 |
kefeller | -2.764 |
ruary | -2.615 |
hester | -2.485 |
Nebula | -2.352 |
Token | Holland |
Token ID | 16070 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
ura | +0.600 |
uable | +0.548 |
pora | +0.536 |
veland | +0.529 |
oto | +0.502 |
Neg logit contributions | |
ォ | -0.636 |
kefeller | -0.568 |
ruary | -0.530 |
hester | -0.498 |
intern | -0.464 |
Token | ( |
Token ID | 357 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
ォ | +1.091 |
kefeller | +0.983 |
ruary | +0.928 |
hester | +0.880 |
Nebula | +0.831 |
Neg logit contributions | |
ura | -0.780 |
uable | -0.707 |
pora | -0.688 |
veland | -0.679 |
oto | -0.633 |
Token | Bern |
Token ID | 23927 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
ura | +0.199 |
uable | +0.183 |
pora | +0.178 |
veland | +0.176 |
oto | +0.166 |
Neg logit contributions | |
ォ | -0.219 |
kefeller | -0.196 |
ruary | -0.183 |
hester | -0.172 |
Nebula | -0.161 |
Token | ard |
Token ID | 446 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
ォ | +10.797 |
kefeller | +9.835 |
ruary | +9.538 |
hester | +9.099 |
intern | +8.585 |
Neg logit contributions | |
ura | -6.294 |
uable | -5.912 |
pora | -5.843 |
veland | -5.583 |
teenth | -5.011 |
Token | 80 |
Token ID | 4019 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
ォ | +1.826 |
kefeller | +1.642 |
ruary | +1.553 |
hester | +1.466 |
Nebula | +1.381 |
Neg logit contributions | |
ura | -1.402 |
uable | -1.278 |
pora | -1.249 |
veland | -1.230 |
oto | -1.146 |
Token | ), |
Token ID | 828 |
Feature activation | +5.62e-01 |
Pos logit contributions | |
ォ | +2.344 |
kefeller | +2.112 |
ruary | +2.002 |
hester | +1.900 |
intern | +1.788 |
Neg logit contributions | |
ura | -1.723 |
uable | -1.573 |
pora | -1.533 |
veland | -1.504 |
oto | -1.405 |
Token | Ben |
Token ID | 3932 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
ura | +0.482 |
uable | +0.441 |
pora | +0.431 |
veland | +0.426 |
oto | +0.404 |
Neg logit contributions | |
ォ | -0.508 |
kefeller | -0.453 |
ruary | -0.423 |
hester | -0.397 |
intern | -0.370 |
Token | rou |
Token ID | 472 |
Feature activation | -7.20e-01 |
Pos logit contributions | |
ォ | +1.564 |
kefeller | +1.415 |
ruary | +1.333 |
hester | +1.263 |
Nebula | +1.187 |
Neg logit contributions | |
ura | -1.154 |
uable | -1.044 |
pora | -1.019 |
veland | -1.004 |
oto | -0.936 |
Token | story |
Token ID | 1621 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
ォ | +0.226 |
kefeller | +0.203 |
ruary | +0.190 |
hester | +0.181 |
Nebula | +0.172 |
Neg logit contributions | |
ura | -0.172 |
uable | -0.157 |
pora | -0.153 |
veland | -0.151 |
oto | -0.140 |
Token | in |
Token ID | 287 |
Feature activation | +8.98e-01 |
Pos logit contributions | |
ォ | +2.362 |
kefeller | +2.131 |
ruary | +2.020 |
hester | +1.916 |
intern | +1.817 |
Neg logit contributions | |
ura | -1.616 |
uable | -1.463 |
pora | -1.423 |
veland | -1.404 |
oto | -1.302 |
Token | 2010 |
Token ID | 3050 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
ura | +0.765 |
uable | +0.700 |
pora | +0.684 |
veland | +0.678 |
oto | +0.640 |
Neg logit contributions | |
ォ | -0.819 |
kefeller | -0.729 |
ruary | -0.680 |
hester | -0.640 |
Nebula | -0.597 |
Token |
|
Token ID | 198 |
Feature activation | +2.98e-01 |
Pos logit contributions | |
ォ | +1.312 |
kefeller | +1.185 |
ruary | +1.120 |
hester | +1.062 |
Nebula | +1.005 |
Neg logit contributions | |
ura | -0.905 |
uable | -0.817 |
pora | -0.796 |
veland | -0.784 |
oto | -0.730 |
Token |
|
Token ID | 198 |
Feature activation | +5.00e-01 |
Pos logit contributions | |
ura | +0.231 |
uable | +0.213 |
pora | +0.207 |
veland | +0.203 |
oto | +0.190 |
Neg logit contributions | |
ォ | -0.290 |
kefeller | -0.258 |
ruary | -0.245 |
hester | -0.232 |
intern | -0.220 |
Token | Bern |
Token ID | 23927 |
Feature activation | -9.99e+00 |
Pos logit contributions | |
ura | +0.423 |
uable | +0.386 |
pora | +0.377 |
veland | +0.373 |
oto | +0.353 |
Neg logit contributions | |
ォ | -0.459 |
kefeller | -0.411 |
ruary | -0.383 |
hester | -0.361 |
Nebula | -0.337 |
Token | au |
Token ID | 559 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
ォ | +10.242 |
kefeller | +9.598 |
ruary | +9.273 |
hester | +8.871 |
sonian | +8.508 |
Neg logit contributions | |
ura | -5.156 |
uable | -5.050 |
pora | -5.018 |
veland | -4.834 |
teenth | -4.652 |
Token | pointed |
Token ID | 6235 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
ura | +0.085 |
uable | +0.077 |
pora | +0.075 |
veland | +0.074 |
oto | +0.070 |
Neg logit contributions | |
ォ | -0.104 |
kefeller | -0.093 |
ruary | -0.088 |
hester | -0.083 |
Nebula | -0.078 |
Token | out |
Token ID | 503 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
ura | +0.259 |
uable | +0.231 |
veland | +0.222 |
pora | +0.222 |
oto | +0.208 |
Neg logit contributions | |
ォ | -0.421 |
kefeller | -0.382 |
ruary | -0.362 |
hester | -0.344 |
intern | -0.326 |
Token | that |
Token ID | 326 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
ォ | +0.012 |
kefeller | +0.010 |
ruary | +0.010 |
hester | +0.009 |
Nebula | +0.009 |
Neg logit contributions | |
ura | -0.009 |
uable | -0.008 |
pora | -0.008 |
veland | -0.008 |
oto | -0.008 |
Token | 2010 |
Token ID | 3050 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
ura | +0.192 |
uable | +0.175 |
pora | +0.170 |
veland | +0.168 |
oto | +0.158 |
Neg logit contributions | |
ォ | -0.237 |
kefeller | -0.212 |
ruary | -0.199 |
hester | -0.188 |
Nebula | -0.177 |
Token | now |
Token ID | 783 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
ura | +0.349 |
uable | +0.318 |
pora | +0.310 |
veland | +0.306 |
oto | +0.288 |
Neg logit contributions | |
ォ | -0.423 |
kefeller | -0.378 |
ruary | -0.355 |
hester | -0.336 |
Nebula | -0.315 |
Token | , |
Token ID | 11 |
Feature activation | +8.98e-01 |
Pos logit contributions | |
ura | +1.422 |
uable | +1.269 |
pora | +1.219 |
veland | +1.210 |
oto | +1.129 |
Neg logit contributions | |
ォ | -2.261 |
kefeller | -2.082 |
ruary | -1.953 |
hester | -1.859 |
Nebula | -1.760 |
Token | coaches |
Token ID | 11070 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
ura | +0.722 |
uable | +0.658 |
pora | +0.643 |
veland | +0.636 |
oto | +0.597 |
Neg logit contributions | |
ォ | -0.859 |
kefeller | -0.770 |
ruary | -0.722 |
hester | -0.682 |
Nebula | -0.640 |
Token | have |
Token ID | 423 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
ura | +1.513 |
uable | +1.363 |
pora | +1.326 |
veland | +1.310 |
oto | +1.229 |
Neg logit contributions | |
ォ | -2.104 |
kefeller | -1.908 |
ruary | -1.793 |
hester | -1.703 |
Nebula | -1.604 |
Token | David |
Token ID | 3271 |
Feature activation | -4.76e+00 |
Pos logit contributions | |
ォ | +0.994 |
kefeller | +0.889 |
ruary | +0.834 |
hester | +0.787 |
Nebula | +0.741 |
Neg logit contributions | |
ura | -0.840 |
uable | -0.767 |
pora | -0.751 |
veland | -0.741 |
oto | -0.695 |
Token | Brut |
Token ID | 30291 |
Feature activation | -9.25e+00 |
Pos logit contributions | |
ォ | +4.077 |
kefeller | +3.511 |
ruary | +3.272 |
hester | +3.078 |
Nebula | +3.023 |
Neg logit contributions | |
ura | -4.136 |
uable | -3.862 |
pora | -3.750 |
veland | -3.726 |
teenth | -3.531 |
Token | on |
Token ID | 261 |
Feature activation | +2.97e-02 |
Pos logit contributions | |
ォ | +8.562 |
ruary | +7.655 |
kefeller | +7.638 |
hester | +7.236 |
ritten | +6.859 |
Neg logit contributions | |
ura | -6.380 |
pora | -6.050 |
uable | -5.999 |
veland | -5.726 |
teenth | -5.456 |
Token | Jr |
Token ID | 7504 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
ura | +0.021 |
uable | +0.019 |
pora | +0.019 |
veland | +0.018 |
oto | +0.017 |
Neg logit contributions | |
ォ | -0.031 |
kefeller | -0.028 |
ruary | -0.027 |
hester | -0.025 |
intern | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
ura | +0.711 |
uable | +0.622 |
veland | +0.601 |
pora | +0.601 |
aur | +0.557 |
Neg logit contributions | |
ォ | -1.231 |
kefeller | -1.126 |
ruary | -1.067 |
hester | -1.015 |
Nebula | -0.980 |
Token | pencil |
Token ID | 21613 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
ura | +0.096 |
uable | +0.087 |
pora | +0.084 |
veland | +0.083 |
oto | +0.077 |
Neg logit contributions | |
ォ | -0.148 |
kefeller | -0.134 |
ruary | -0.126 |
hester | -0.120 |
intern | -0.114 |
Token | ed |
Token ID | 276 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
ォ | +1.037 |
kefeller | +0.863 |
ruary | +0.767 |
hester | +0.695 |
Nebula | +0.614 |
Neg logit contributions | |
ura | -1.995 |
uable | -1.873 |
pora | -1.857 |
veland | -1.834 |
oto | -1.758 |
Token | birthday |
Token ID | 10955 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
ura | +1.545 |
uable | +1.425 |
pora | +1.394 |
veland | +1.376 |
oto | +1.306 |
Neg logit contributions | |
ォ | -1.493 |
kefeller | -1.324 |
ruary | -1.223 |
hester | -1.151 |
Nebula | -1.065 |
Token | , |
Token ID | 11 |
Feature activation | +7.10e-01 |
Pos logit contributions | |
ォ | +1.069 |
kefeller | +0.965 |
ruary | +0.914 |
hester | +0.864 |
Nebula | +0.817 |
Neg logit contributions | |
ura | -0.752 |
uable | -0.680 |
pora | -0.660 |
veland | -0.654 |
oto | -0.608 |
Token | its |
Token ID | 663 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
ura | +0.594 |
uable | +0.543 |
pora | +0.531 |
veland | +0.524 |
oto | +0.495 |
Neg logit contributions | |
ォ | -0.657 |
kefeller | -0.586 |
ruary | -0.547 |
hester | -0.516 |
Nebula | -0.482 |
Token | inventor |
Token ID | 33475 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
ォ | +1.204 |
kefeller | +1.078 |
ruary | +1.010 |
hester | +0.952 |
Nebula | +0.892 |
Neg logit contributions | |
ura | -1.053 |
uable | -0.963 |
pora | -0.939 |
veland | -0.931 |
oto | -0.876 |
Token | Tim |
Token ID | 5045 |
Feature activation | -8.82e-01 |
Pos logit contributions | |
ォ | +1.730 |
kefeller | +1.555 |
ruary | +1.462 |
hester | +1.385 |
Nebula | +1.303 |
Neg logit contributions | |
ura | -1.349 |
uable | -1.225 |
pora | -1.195 |
veland | -1.180 |
oto | -1.105 |
Token | Bern |
Token ID | 6206 |
Feature activation | -9.23e+00 |
Pos logit contributions | |
ォ | +0.737 |
kefeller | +0.651 |
ruary | +0.603 |
hester | +0.565 |
Nebula | +0.524 |
Neg logit contributions | |
ura | -0.809 |
uable | -0.752 |
pora | -0.734 |
veland | -0.732 |
aur | -0.688 |
Token | ers |
Token ID | 364 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
ォ | +7.175 |
kefeller | +6.189 |
ruary | +6.133 |
hester | +5.817 |
intern | +5.304 |
Neg logit contributions | |
ura | -7.943 |
uable | -7.794 |
veland | -7.659 |
pora | -7.579 |
teenth | -6.968 |
Token | - |
Token ID | 12 |
Feature activation | +8.20e-01 |
Pos logit contributions | |
ura | +0.949 |
uable | +0.846 |
pora | +0.817 |
veland | +0.809 |
aur | +0.764 |
Neg logit contributions | |
ォ | -1.481 |
kefeller | -1.344 |
ruary | -1.272 |
hester | -1.202 |
�� | -1.154 |
Token | Lee |
Token ID | 24338 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
ura | +0.661 |
uable | +0.605 |
pora | +0.592 |
veland | +0.585 |
oto | +0.547 |
Neg logit contributions | |
ォ | -0.780 |
kefeller | -0.702 |
ruary | -0.656 |
hester | -0.625 |
intern | -0.586 |
Token | has |
Token ID | 468 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
ura | +1.674 |
uable | +1.514 |
pora | +1.471 |
veland | +1.456 |
oto | +1.373 |
Neg logit contributions | |
ォ | -2.125 |
kefeller | -1.917 |
ruary | -1.798 |
hester | -1.700 |
Nebula | -1.604 |
Token | written |
Token ID | 3194 |
Feature activation | -7.62e-01 |
Pos logit contributions | |
ォ | +1.379 |
kefeller | +1.240 |
ruary | +1.164 |
hester | +1.096 |
intern | +1.033 |
Neg logit contributions | |
ura | -1.154 |
uable | -1.055 |
pora | -1.032 |
veland | -1.018 |
oto | -0.955 |
Token | to |
Token ID | 284 |
Feature activation | -3.56e-01 |
Pos logit contributions | |
ォ | +2.443 |
kefeller | +2.201 |
ruary | +2.101 |
hester | +1.985 |
intern | +1.875 |
Neg logit contributions | |
ura | -1.736 |
uable | -1.585 |
pora | -1.550 |
veland | -1.509 |
oto | -1.402 |
Token | harvest |
Token ID | 13222 |
Feature activation | +8.27e-01 |
Pos logit contributions | |
ォ | +0.402 |
kefeller | +0.367 |
ruary | +0.348 |
hester | +0.332 |
Nebula | +0.315 |
Neg logit contributions | |
ura | -0.225 |
uable | -0.199 |
pora | -0.193 |
veland | -0.190 |
oto | -0.175 |
Token | , |
Token ID | 11 |
Feature activation | +4.91e-01 |
Pos logit contributions | |
ura | +0.584 |
uable | +0.526 |
pora | +0.511 |
veland | +0.504 |
oto | +0.469 |
Neg logit contributions | |
ォ | -0.872 |
kefeller | -0.790 |
ruary | -0.746 |
hester | -0.709 |
Nebula | -0.670 |
Token | � |
Token ID | 447 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
ura | +0.336 |
uable | +0.301 |
pora | +0.292 |
veland | +0.288 |
oto | +0.268 |
Neg logit contributions | |
ォ | -0.528 |
kefeller | -0.480 |
ruary | -0.453 |
hester | -0.431 |
Nebula | -0.408 |
Token | � |
Token ID | 251 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
ォ | +0.275 |
kefeller | +0.240 |
ruary | +0.225 |
hester | +0.210 |
Nebula | +0.197 |
Neg logit contributions | |
ura | -0.277 |
uable | -0.257 |
pora | -0.253 |
veland | -0.250 |
oto | -0.236 |
Token | Bern |
Token ID | 6206 |
Feature activation | -9.07e+00 |
Pos logit contributions | |
ura | +0.142 |
uable | +0.129 |
pora | +0.125 |
veland | +0.124 |
oto | +0.116 |
Neg logit contributions | |
ォ | -0.181 |
kefeller | -0.163 |
ruary | -0.153 |
hester | -0.145 |
Nebula | -0.137 |
Token | au |
Token ID | 559 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
ォ | +9.470 |
kefeller | +8.779 |
ruary | +8.435 |
hester | +8.069 |
ually | +7.782 |
Neg logit contributions | |
ura | -4.710 |
uable | -4.587 |
pora | -4.584 |
veland | -4.406 |
teenth | -4.254 |
Token | said |
Token ID | 531 |
Feature activation | +9.39e-01 |
Pos logit contributions | |
ォ | +0.264 |
kefeller | +0.236 |
ruary | +0.221 |
hester | +0.209 |
Nebula | +0.196 |
Neg logit contributions | |
ura | -0.227 |
uable | -0.207 |
pora | -0.203 |
veland | -0.200 |
oto | -0.188 |
Token | , |
Token ID | 11 |
Feature activation | +5.46e-01 |
Pos logit contributions | |
ura | +0.614 |
uable | +0.536 |
veland | +0.518 |
pora | +0.518 |
oto | +0.478 |
Neg logit contributions | |
ォ | -1.046 |
kefeller | -0.957 |
ruary | -0.901 |
hester | -0.863 |
Nebula | -0.821 |
Token | adding |
Token ID | 4375 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
ura | +0.388 |
uable | +0.348 |
pora | +0.338 |
veland | +0.334 |
oto | +0.311 |
Neg logit contributions | |
ォ | -0.575 |
kefeller | -0.522 |
ruary | -0.492 |
hester | -0.468 |
Nebula | -0.442 |
Token | it |
Token ID | 340 |
Feature activation | +7.63e-01 |
Pos logit contributions | |
ura | +2.167 |
uable | +1.961 |
pora | +1.897 |
veland | +1.880 |
oto | +1.770 |
Neg logit contributions | |
ォ | -2.811 |
kefeller | -2.521 |
ruary | -2.363 |
hester | -2.252 |
�� | -2.121 |
Token | in |
Token ID | 287 |
Feature activation | +9.12e-01 |
Pos logit contributions | |
ura | +0.081 |
uable | +0.073 |
pora | +0.072 |
veland | +0.071 |
oto | +0.067 |
Neg logit contributions | |
ォ | -0.098 |
kefeller | -0.087 |
ruary | -0.082 |
hester | -0.077 |
Nebula | -0.073 |
Token | AR |
Token ID | 5923 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
ura | +0.774 |
uable | +0.707 |
pora | +0.692 |
veland | +0.685 |
oto | +0.647 |
Neg logit contributions | |
ォ | -0.834 |
kefeller | -0.744 |
ruary | -0.693 |
hester | -0.654 |
Nebula | -0.609 |
Token | 4 |
Token ID | 19 |
Feature activation | +6.01e-01 |
Pos logit contributions | |
ォ | +1.078 |
kefeller | +0.966 |
ruary | +0.907 |
hester | +0.854 |
Nebula | +0.802 |
Neg logit contributions | |
ura | -0.918 |
uable | -0.838 |
pora | -0.818 |
veland | -0.808 |
oto | -0.759 |
Token | with |
Token ID | 351 |
Feature activation | -9.06e-01 |
Pos logit contributions | |
ura | +0.462 |
uable | +0.419 |
pora | +0.409 |
veland | +0.404 |
oto | +0.378 |
Neg logit contributions | |
ォ | -0.597 |
kefeller | -0.537 |
ruary | -0.505 |
hester | -0.478 |
Nebula | -0.450 |
Token | the |
Token ID | 262 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
ォ | +0.850 |
kefeller | +0.759 |
ruary | +0.714 |
hester | +0.668 |
Nebula | +0.634 |
Neg logit contributions | |
ura | -0.739 |
uable | -0.678 |
pora | -0.662 |
veland | -0.654 |
oto | -0.616 |
Token | Bern |
Token ID | 6206 |
Feature activation | -9.02e+00 |
Pos logit contributions | |
ura | +0.326 |
uable | +0.296 |
pora | +0.288 |
veland | +0.285 |
oto | +0.267 |
Neg logit contributions | |
ォ | -0.421 |
kefeller | -0.379 |
ruary | -0.356 |
hester | -0.337 |
Nebula | -0.317 |
Token | formula |
Token ID | 10451 |
Feature activation | -3.19e+00 |
Pos logit contributions | |
ォ | +8.605 |
kefeller | +7.541 |
ruary | +7.381 |
hester | +6.867 |
Nebula | +6.568 |
Neg logit contributions | |
ura | -6.598 |
uable | -6.217 |
pora | -6.015 |
veland | -5.991 |
oto | -5.380 |
Token | page |
Token ID | 2443 |
Feature activation | +6.50e-01 |
Pos logit contributions | |
ォ | +3.175 |
kefeller | +2.827 |
ruary | +2.686 |
hester | +2.513 |
Nebula | +2.426 |
Neg logit contributions | |
ura | -2.357 |
uable | -2.158 |
pora | -2.104 |
veland | -2.076 |
oto | -1.921 |
Token | 213 |
Token ID | 28658 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
ura | +0.505 |
uable | +0.459 |
pora | +0.448 |
veland | +0.443 |
oto | +0.414 |
Neg logit contributions | |
ォ | -0.640 |
kefeller | -0.574 |
ruary | -0.541 |
hester | -0.510 |
Nebula | -0.480 |
Token | note |
Token ID | 3465 |
Feature activation | +9.03e-01 |
Pos logit contributions | |
ォ | +1.290 |
kefeller | +1.161 |
ruary | +1.100 |
hester | +1.035 |
Nebula | +0.986 |
Neg logit contributions | |
ura | -0.949 |
uable | -0.864 |
pora | -0.844 |
veland | -0.832 |
oto | -0.772 |
Token | a |
Token ID | 257 |
Feature activation | -5.67e-01 |
Pos logit contributions | |
ura | +0.676 |
uable | +0.612 |
pora | +0.596 |
veland | +0.588 |
oto | +0.550 |
Neg logit contributions | |
ォ | -0.914 |
kefeller | -0.825 |
ruary | -0.776 |
hester | -0.736 |
Nebula | -0.693 |
Token | back |
Token ID | 736 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
ォ | +1.486 |
kefeller | +1.353 |
ruary | +1.276 |
hester | +1.215 |
Nebula | +1.156 |
Neg logit contributions | |
ura | -1.049 |
uable | -0.953 |
pora | -0.933 |
veland | -0.913 |
oto | -0.848 |
Token | to |
Token ID | 284 |
Feature activation | -7.08e-01 |
Pos logit contributions | |
ォ | +1.785 |
kefeller | +1.617 |
ruary | +1.532 |
hester | +1.454 |
Nebula | +1.381 |
Neg logit contributions | |
ura | -1.242 |
uable | -1.124 |
pora | -1.097 |
veland | -1.078 |
oto | -1.001 |
Token | his |
Token ID | 465 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
ォ | +0.668 |
kefeller | +0.598 |
ruary | +0.560 |
hester | +0.528 |
intern | +0.493 |
Neg logit contributions | |
ura | -0.581 |
uable | -0.531 |
pora | -0.516 |
veland | -0.513 |
aur | -0.482 |
Token | prison |
Token ID | 3770 |
Feature activation | -3.89e+00 |
Pos logit contributions | |
ォ | +1.165 |
kefeller | +1.043 |
ruary | +0.977 |
hester | +0.922 |
Nebula | +0.866 |
Neg logit contributions | |
ura | -1.001 |
uable | -0.914 |
pora | -0.892 |
veland | -0.882 |
oto | -0.830 |
Token | , |
Token ID | 11 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
ォ | +3.930 |
kefeller | +3.547 |
ruary | +3.351 |
hester | +3.185 |
Nebula | +3.034 |
Neg logit contributions | |
ura | -2.845 |
uable | -2.594 |
pora | -2.506 |
veland | -2.485 |
oto | -2.311 |
Token | Worm |
Token ID | 28505 |
Feature activation | -8.88e+00 |
Pos logit contributions | |
ura | +0.116 |
uable | +0.106 |
pora | +0.103 |
veland | +0.102 |
oto | +0.096 |
Neg logit contributions | |
ォ | -0.132 |
kefeller | -0.118 |
ruary | -0.111 |
hester | -0.104 |
Nebula | -0.098 |
Token | t |
Token ID | 83 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
ォ | +5.815 |
kefeller | +5.103 |
ruary | +4.577 |
hester | +4.556 |
intern | +4.226 |
Neg logit contributions | |
ura | -8.699 |
uable | -8.295 |
pora | -7.995 |
veland | -7.912 |
oto | -7.389 |
Token | ong |
Token ID | 506 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
ォ | +0.157 |
kefeller | +0.143 |
ruary | +0.133 |
hester | +0.127 |
intern | +0.119 |
Neg logit contributions | |
ura | -0.132 |
uable | -0.123 |
pora | -0.118 |
veland | -0.117 |
oto | -0.108 |
Token | ue |
Token ID | 518 |
Feature activation | +9.79e-01 |
Pos logit contributions | |
ォ | +1.610 |
kefeller | +1.447 |
ruary | +1.358 |
hester | +1.288 |
ually | +1.205 |
Neg logit contributions | |
ura | -1.437 |
pora | -1.347 |
uable | -1.332 |
veland | -1.322 |
teenth | -1.227 |
Token | drops |
Token ID | 10532 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
ura | +0.761 |
uable | +0.686 |
pora | +0.670 |
veland | +0.662 |
oto | +0.622 |
Neg logit contributions | |
ォ | -0.969 |
kefeller | -0.873 |
ruary | -0.819 |
hester | -0.773 |
Nebula | -0.725 |
Token | a |
Token ID | 257 |
Feature activation | -9.12e-01 |
Pos logit contributions | |
ォ | +1.251 |
kefeller | +1.120 |
ruary | +1.049 |
hester | +0.990 |
Nebula | +0.939 |
Neg logit contributions | |
ura | -1.070 |
uable | -0.980 |
pora | -0.958 |
veland | -0.949 |
oto | -0.887 |
Token | . |
Token ID | 13 |
Feature activation | -5.16e-01 |
Pos logit contributions | |
ura | +1.407 |
uable | +1.261 |
pora | +1.226 |
veland | +1.209 |
oto | +1.128 |
Neg logit contributions | |
ォ | -2.114 |
kefeller | -1.923 |
ruary | -1.808 |
hester | -1.721 |
Nebula | -1.619 |
Token |
|
Token ID | 198 |
Feature activation | -5.26e-01 |
Pos logit contributions | |
ォ | +0.447 |
kefeller | +0.391 |
ruary | +0.367 |
hester | +0.343 |
Nebula | +0.327 |
Neg logit contributions | |
ura | -0.458 |
uable | -0.426 |
pora | -0.416 |
veland | -0.412 |
oto | -0.389 |
Token |
|
Token ID | 198 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
ォ | +0.499 |
kefeller | +0.442 |
ruary | +0.420 |
hester | +0.397 |
intern | +0.380 |
Neg logit contributions | |
ura | -0.416 |
uable | -0.386 |
pora | -0.376 |
veland | -0.368 |
oto | -0.344 |
Token | Still |
Token ID | 9590 |
Feature activation | -2.13e+00 |
Pos logit contributions | |
ォ | +0.173 |
kefeller | +0.152 |
ruary | +0.143 |
hester | +0.134 |
intern | +0.125 |
Neg logit contributions | |
ura | -0.178 |
uable | -0.164 |
pora | -0.161 |
veland | -0.159 |
oto | -0.150 |
Token | this |
Token ID | 428 |
Feature activation | +4.70e-01 |
Pos logit contributions | |
ォ | +2.105 |
kefeller | +1.883 |
ruary | +1.779 |
hester | +1.681 |
Nebula | +1.594 |
Neg logit contributions | |
ura | -1.627 |
uable | -1.488 |
pora | -1.444 |
veland | -1.428 |
oto | -1.338 |
Token | hadn |
Token ID | 8020 |
Feature activation | -8.84e+00 |
Pos logit contributions | |
ura | +0.381 |
uable | +0.348 |
pora | +0.340 |
veland | +0.336 |
oto | +0.316 |
Neg logit contributions | |
ォ | -0.445 |
kefeller | -0.399 |
ruary | -0.374 |
hester | -0.353 |
Nebula | -0.331 |
Token | � |
Token ID | 447 |
Feature activation | -3.27e-02 |
Pos logit contributions | |
ォ | +7.739 |
kefeller | +6.429 |
ruary | +6.299 |
ィ | +6.013 |
hester | +5.882 |
Neg logit contributions | |
ura | -6.767 |
uable | -6.671 |
pora | -6.591 |
veland | -6.307 |
cius | -5.931 |
Token | � |
Token ID | 247 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
ォ | +0.026 |
kefeller | +0.023 |
ruary | +0.021 |
hester | +0.020 |
intern | +0.018 |
Neg logit contributions | |
ura | -0.031 |
uable | -0.029 |
pora | -0.028 |
veland | -0.028 |
oto | -0.027 |
Token | t |
Token ID | 83 |
Feature activation | +5.93e-02 |
Pos logit contributions | |
ォ | +1.341 |
kefeller | +1.168 |
ruary | +1.086 |
hester | +1.005 |
intern | +0.931 |
Neg logit contributions | |
ura | -1.623 |
uable | -1.501 |
pora | -1.493 |
veland | -1.469 |
oto | -1.396 |
Token | fixed |
Token ID | 5969 |
Feature activation | -6.16e-01 |
Pos logit contributions | |
ura | +0.055 |
uable | +0.051 |
pora | +0.050 |
veland | +0.049 |
oto | +0.047 |
Neg logit contributions | |
ォ | -0.050 |
kefeller | -0.044 |
ruary | -0.041 |
hester | -0.038 |
Nebula | -0.035 |
Token | the |
Token ID | 262 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
ォ | +0.585 |
kefeller | +0.524 |
ruary | +0.493 |
hester | +0.464 |
Nebula | +0.439 |
Neg logit contributions | |
ura | -0.497 |
uable | -0.454 |
pora | -0.443 |
veland | -0.439 |
oto | -0.412 |
Token | between |
Token ID | 1022 |
Feature activation | -3.33e+00 |
Pos logit contributions | |
ォ | +2.547 |
kefeller | +2.315 |
ruary | +2.193 |
hester | +2.088 |
Nebula | +1.982 |
Neg logit contributions | |
ura | -1.677 |
uable | -1.524 |
pora | -1.482 |
veland | -1.467 |
oto | -1.344 |
Token | 1953 |
Token ID | 24217 |
Feature activation | -2.36e+00 |
Pos logit contributions | |
ォ | +2.962 |
kefeller | +2.668 |
ruary | +2.500 |
hester | +2.331 |
Nebula | +2.199 |
Neg logit contributions | |
ura | -2.837 |
uable | -2.612 |
pora | -2.561 |
veland | -2.519 |
oto | -2.380 |
Token | - |
Token ID | 12 |
Feature activation | +7.35e-01 |
Pos logit contributions | |
ォ | +2.606 |
kefeller | +2.363 |
ruary | +2.239 |
hester | +2.134 |
Nebula | +2.024 |
Neg logit contributions | |
ura | -1.573 |
uable | -1.397 |
pora | -1.350 |
veland | -1.340 |
oto | -1.242 |
Token | 56 |
Token ID | 3980 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
ura | +0.616 |
uable | +0.569 |
pora | +0.554 |
veland | +0.547 |
oto | +0.513 |
Neg logit contributions | |
ォ | -0.676 |
kefeller | -0.604 |
ruary | -0.567 |
hester | -0.532 |
intern | -0.501 |
Token | for |
Token ID | 329 |
Feature activation | +4.16e-01 |
Pos logit contributions | |
ォ | +1.079 |
kefeller | +0.979 |
ruary | +0.926 |
hester | +0.878 |
intern | +0.833 |
Neg logit contributions | |
ura | -0.716 |
uable | -0.645 |
pora | -0.628 |
veland | -0.618 |
oto | -0.572 |
Token | Bern |
Token ID | 6206 |
Feature activation | -8.76e+00 |
Pos logit contributions | |
ura | +0.352 |
uable | +0.322 |
pora | +0.314 |
veland | +0.310 |
oto | +0.294 |
Neg logit contributions | |
ォ | -0.382 |
kefeller | -0.339 |
ruary | -0.318 |
hester | -0.299 |
Nebula | -0.279 |
Token | ad |
Token ID | 324 |
Feature activation | +6.20e-02 |
Pos logit contributions | |
ォ | +8.410 |
kefeller | +7.571 |
ruary | +7.252 |
hester | +6.900 |
intern | +6.446 |
Neg logit contributions | |
ura | -6.397 |
uable | -5.921 |
pora | -5.778 |
veland | -5.719 |
oto | -5.216 |
Token | ine |
Token ID | 500 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
ura | +0.064 |
uable | +0.059 |
pora | +0.058 |
veland | +0.058 |
oto | +0.055 |
Neg logit contributions | |
ォ | -0.046 |
kefeller | -0.039 |
ruary | -0.036 |
hester | -0.033 |
Nebula | -0.030 |
Token | and |
Token ID | 290 |
Feature activation | -6.06e-01 |
Pos logit contributions | |
ura | +1.652 |
uable | +1.511 |
pora | +1.477 |
veland | +1.460 |
oto | +1.383 |
Neg logit contributions | |
ォ | -1.717 |
kefeller | -1.526 |
ruary | -1.422 |
hester | -1.332 |
intern | -1.240 |
Token | Isaac |
Token ID | 19068 |
Feature activation | +2.64e+00 |
Pos logit contributions | |
ォ | +0.519 |
kefeller | +0.459 |
ruary | +0.427 |
hester | +0.400 |
Nebula | +0.371 |
Neg logit contributions | |
ura | -0.548 |
uable | -0.504 |
pora | -0.494 |
veland | -0.489 |
oto | -0.463 |
Token | Newton |
Token ID | 17321 |
Feature activation | -6.47e+00 |
Pos logit contributions | |
ura | +2.362 |
uable | +2.169 |
pora | +2.108 |
veland | +2.085 |
oto | +2.000 |
Neg logit contributions | |
ォ | -2.280 |
kefeller | -2.008 |
ruary | -1.877 |
hester | -1.756 |
bley | -1.638 |
Token | af |
Token ID | 1878 |
Feature activation | +2.99e+00 |
Pos logit contributions | |
ura | +1.833 |
uable | +1.634 |
pora | +1.583 |
veland | +1.562 |
oto | +1.459 |
Neg logit contributions | |
ォ | -2.882 |
kefeller | -2.608 |
ruary | -2.469 |
hester | -2.345 |
Nebula | -2.221 |
Token | . |
Token ID | 13 |
Feature activation | -4.97e-01 |
Pos logit contributions | |
ura | +2.278 |
uable | +2.047 |
pora | +1.983 |
veland | +1.969 |
oto | +1.857 |
Neg logit contributions | |
ォ | -2.979 |
kefeller | -2.692 |
ruary | -2.520 |
hester | -2.393 |
intern | -2.252 |
Token | Plus |
Token ID | 8227 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
ォ | +0.439 |
kefeller | +0.387 |
ruary | +0.363 |
hester | +0.340 |
Nebula | +0.319 |
Neg logit contributions | |
ura | -0.436 |
uable | -0.401 |
pora | -0.393 |
veland | -0.388 |
oto | -0.367 |
Token | , |
Token ID | 11 |
Feature activation | +5.96e-01 |
Pos logit contributions | |
ura | +2.004 |
uable | +1.791 |
pora | +1.746 |
veland | +1.726 |
oto | +1.616 |
Neg logit contributions | |
ォ | -2.882 |
kefeller | -2.631 |
ruary | -2.452 |
hester | -2.338 |
�� | -2.201 |
Token | I |
Token ID | 314 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
ura | +0.486 |
uable | +0.444 |
pora | +0.433 |
veland | +0.428 |
oto | +0.403 |
Neg logit contributions | |
ォ | -0.563 |
kefeller | -0.504 |
ruary | -0.472 |
hester | -0.446 |
Nebula | -0.417 |
Token | hadn |
Token ID | 8020 |
Feature activation | -8.66e+00 |
Pos logit contributions | |
ォ | +0.996 |
kefeller | +0.888 |
ruary | +0.839 |
hester | +0.788 |
intern | +0.746 |
Neg logit contributions | |
ura | -0.825 |
uable | -0.759 |
pora | -0.744 |
veland | -0.728 |
oto | -0.685 |
Token | � |
Token ID | 447 |
Feature activation | -4.89e-01 |
Pos logit contributions | |
ォ | +6.290 |
kefeller | +4.920 |
ruary | +4.901 |
ィ | +4.603 |
� | +4.423 |
Neg logit contributions | |
ura | -7.915 |
uable | -7.870 |
pora | -7.775 |
veland | -7.394 |
cius | -7.123 |
Token | � |
Token ID | 247 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
ォ | +0.394 |
kefeller | +0.342 |
ruary | +0.320 |
hester | +0.296 |
intern | +0.275 |
Neg logit contributions | |
ura | -0.464 |
uable | -0.430 |
pora | -0.425 |
veland | -0.420 |
oto | -0.399 |
Token | t |
Token ID | 83 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
ォ | +1.570 |
kefeller | +1.382 |
ruary | +1.284 |
hester | +1.196 |
intern | +1.112 |
Neg logit contributions | |
ura | -1.752 |
uable | -1.607 |
pora | -1.599 |
veland | -1.577 |
oto | -1.489 |
Token | really |
Token ID | 1107 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
ォ | +0.257 |
kefeller | +0.228 |
ruary | +0.213 |
hester | +0.200 |
Nebula | +0.187 |
Neg logit contributions | |
ura | -0.253 |
uable | -0.232 |
pora | -0.228 |
veland | -0.225 |
oto | -0.212 |
Token | read |
Token ID | 1100 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
ォ | +1.275 |
kefeller | +1.138 |
ruary | +1.071 |
hester | +1.006 |
Nebula | +0.950 |
Neg logit contributions | |
ura | -1.144 |
uable | -1.050 |
pora | -1.035 |
veland | -1.015 |
oto | -0.954 |
Token | the |
Token ID | 262 |
Feature activation | +3.05e-01 |
Pos logit contributions | |
ォ | +0.888 |
kefeller | +0.792 |
ruary | +0.742 |
hester | +0.699 |
Nebula | +0.657 |
Neg logit contributions | |
ura | -0.782 |
uable | -0.713 |
pora | -0.698 |
veland | -0.691 |
oto | -0.650 |
Token | second |
Token ID | 1218 |
Feature activation | -8.85e-01 |
Pos logit contributions | |
ura | +0.230 |
uable | +0.209 |
pora | +0.204 |
veland | +0.201 |
oto | +0.188 |
Neg logit contributions | |
ォ | -0.307 |
kefeller | -0.275 |
ruary | -0.259 |
hester | -0.246 |
Nebula | -0.232 |
Token | unit |
Token ID | 4326 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
ォ | +0.896 |
kefeller | +0.802 |
ruary | +0.758 |
hester | +0.718 |
intern | +0.683 |
Neg logit contributions | |
ura | -0.656 |
uable | -0.597 |
pora | -0.582 |
veland | -0.576 |
oto | -0.536 |
Token | exclusively |
Token ID | 11541 |
Feature activation | +4.63e+00 |
Pos logit contributions | |
ura | +0.912 |
uable | +0.817 |
pora | +0.793 |
veland | +0.782 |
oto | +0.727 |
Neg logit contributions | |
ォ | -1.431 |
kefeller | -1.300 |
ruary | -1.228 |
hester | -1.169 |
Nebula | -1.106 |
Token | . |
Token ID | 13 |
Feature activation | -4.45e-01 |
Pos logit contributions | |
ura | +2.952 |
uable | +2.596 |
pora | +2.527 |
veland | +2.495 |
oto | +2.320 |
Neg logit contributions | |
ォ | -5.163 |
kefeller | -4.755 |
ruary | -4.461 |
hester | -4.252 |
Nebula | -4.040 |
Token | Brut |
Token ID | 30291 |
Feature activation | -8.63e+00 |
Pos logit contributions | |
ォ | +0.432 |
kefeller | +0.391 |
ruary | +0.365 |
hester | +0.346 |
Nebula | +0.324 |
Neg logit contributions | |
ura | -0.351 |
uable | -0.319 |
pora | -0.310 |
veland | -0.307 |
oto | -0.289 |
Token | on |
Token ID | 261 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
ォ | +7.480 |
kefeller | +6.811 |
ruary | +6.596 |
hester | +6.541 |
intern | +6.194 |
Neg logit contributions | |
ura | -6.058 |
uable | -5.802 |
pora | -5.764 |
veland | -5.468 |
teenth | -5.262 |
Token | , |
Token ID | 11 |
Feature activation | +6.64e-01 |
Pos logit contributions | |
ォ | +0.156 |
kefeller | +0.140 |
ruary | +0.131 |
hester | +0.124 |
Nebula | +0.116 |
Neg logit contributions | |
ura | -0.130 |
uable | -0.118 |
pora | -0.115 |
veland | -0.114 |
oto | -0.107 |
Token | signed |
Token ID | 4488 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
ura | +0.465 |
uable | +0.418 |
pora | +0.407 |
veland | +0.400 |
oto | +0.373 |
Neg logit contributions | |
ォ | -0.705 |
kefeller | -0.638 |
ruary | -0.603 |
hester | -0.574 |
Nebula | -0.543 |
Token | as |
Token ID | 355 |
Feature activation | -9.75e-01 |
Pos logit contributions | |
ura | +0.132 |
uable | +0.119 |
pora | +0.116 |
veland | +0.115 |
oto | +0.107 |
Neg logit contributions | |
ォ | -0.194 |
kefeller | -0.175 |
ruary | -0.165 |
hester | -0.157 |
Nebula | -0.148 |
Token | a |
Token ID | 257 |
Feature activation | -7.13e-01 |
Pos logit contributions | |
ォ | +0.901 |
kefeller | +0.804 |
ruary | +0.752 |
hester | +0.709 |
Nebula | +0.664 |
Neg logit contributions | |
ura | -0.813 |
uable | -0.744 |
pora | -0.727 |
veland | -0.718 |
oto | -0.678 |
Token | 's |
Token ID | 338 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
ura | +1.077 |
uable | +0.950 |
pora | +0.929 |
veland | +0.913 |
oto | +0.852 |
Neg logit contributions | |
ォ | -1.800 |
kefeller | -1.630 |
ruary | -1.543 |
hester | -1.472 |
intern | -1.385 |
Token | spy |
Token ID | 13997 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
ォ | +1.219 |
kefeller | +1.089 |
ruary | +1.018 |
hester | +0.960 |
Nebula | +0.901 |
Neg logit contributions | |
ura | -1.086 |
uable | -0.994 |
pora | -0.970 |
veland | -0.960 |
oto | -0.904 |
Token | Gr |
Token ID | 1902 |
Feature activation | +3.09e+00 |
Pos logit contributions | |
ォ | +1.342 |
kefeller | +1.205 |
ruary | +1.131 |
hester | +1.075 |
Nebula | +1.018 |
Neg logit contributions | |
ura | -1.062 |
uable | -0.974 |
pora | -0.942 |
veland | -0.936 |
oto | -0.871 |
Token | í |
Token ID | 8836 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
ura | +2.205 |
uable | +1.963 |
pora | +1.900 |
veland | +1.894 |
oto | +1.778 |
Neg logit contributions | |
ォ | -3.264 |
kefeller | -2.949 |
ruary | -2.784 |
hester | -2.639 |
�� | -2.514 |
Token | ma |
Token ID | 2611 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
ura | +1.388 |
uable | +1.246 |
pora | +1.211 |
veland | +1.196 |
aur | +1.121 |
Neg logit contributions | |
ォ | -2.018 |
kefeller | -1.834 |
ruary | -1.720 |
hester | -1.634 |
Nebula | -1.550 |
Token | Worm |
Token ID | 28505 |
Feature activation | -8.56e+00 |
Pos logit contributions | |
ura | +1.264 |
uable | +1.125 |
pora | +1.098 |
veland | +1.088 |
aur | +1.014 |
Neg logit contributions | |
ォ | -1.901 |
kefeller | -1.724 |
ruary | -1.625 |
hester | -1.542 |
Nebula | -1.455 |
Token | t |
Token ID | 83 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
ォ | +6.777 |
kefeller | +5.897 |
ruary | +5.583 |
hester | +5.444 |
bley | +5.212 |
Neg logit contributions | |
ura | -7.236 |
uable | -6.794 |
pora | -6.775 |
veland | -6.433 |
imate | -6.105 |
Token | ong |
Token ID | 506 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
ura | +0.082 |
uable | +0.075 |
pora | +0.073 |
veland | +0.072 |
oto | +0.067 |
Neg logit contributions | |
ォ | -0.104 |
kefeller | -0.094 |
ruary | -0.088 |
hester | -0.084 |
intern | -0.079 |
Token | ue |
Token ID | 518 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
ォ | +1.386 |
kefeller | +1.251 |
ruary | +1.178 |
hester | +1.119 |
Nebula | +1.051 |
Neg logit contributions | |
ura | -1.044 |
uable | -0.947 |
pora | -0.935 |
veland | -0.920 |
oto | -0.856 |
Token | . |
Token ID | 13 |
Feature activation | -3.75e-01 |
Pos logit contributions | |
ura | +0.945 |
uable | +0.842 |
pora | +0.820 |
veland | +0.809 |
oto | +0.750 |
Neg logit contributions | |
ォ | -1.499 |
kefeller | -1.359 |
ruary | -1.286 |
hester | -1.222 |
Nebula | -1.154 |
Token | Th |
Token ID | 536 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
ォ | +0.341 |
kefeller | +0.304 |
ruary | +0.285 |
hester | +0.268 |
Nebula | +0.251 |
Neg logit contributions | |
ura | -0.318 |
uable | -0.291 |
pora | -0.285 |
veland | -0.281 |
oto | -0.265 |
Token | omp |
Token ID | 3361 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
ura | +1.479 |
uable | +1.281 |
pora | +1.222 |
veland | +1.213 |
oto | +1.104 |
Neg logit contributions | |
ォ | -3.108 |
kefeller | -2.840 |
ruary | -2.689 |
hester | -2.576 |
Nebula | -2.473 |
Token | an |
Token ID | 272 |
Feature activation | +7.12e-02 |
Pos logit contributions | |
ura | +1.137 |
uable | +1.027 |
pora | +0.991 |
veland | +0.990 |
aur | +0.938 |
Neg logit contributions | |
ォ | -1.458 |
kefeller | -1.310 |
ruary | -1.227 |
hester | -1.159 |
Nebula | -1.097 |
Token | ied |
Token ID | 798 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
ura | +0.082 |
uable | +0.076 |
pora | +0.075 |
veland | +0.074 |
oto | +0.072 |
Neg logit contributions | |
ォ | -0.044 |
kefeller | -0.037 |
ruary | -0.033 |
hester | -0.030 |
Nebula | -0.027 |
Token | by |
Token ID | 416 |
Feature activation | -1.92e+00 |
Pos logit contributions | |
ォ | +1.664 |
kefeller | +1.497 |
ruary | +1.409 |
hester | +1.334 |
Nebula | +1.260 |
Neg logit contributions | |
ura | -1.188 |
uable | -1.070 |
pora | -1.038 |
veland | -1.030 |
oto | -0.964 |
Token | their |
Token ID | 511 |
Feature activation | -8.25e-01 |
Pos logit contributions | |
ォ | +1.718 |
kefeller | +1.533 |
ruary | +1.429 |
hester | +1.347 |
Nebula | +1.262 |
Neg logit contributions | |
ura | -1.642 |
uable | -1.511 |
pora | -1.478 |
veland | -1.460 |
oto | -1.374 |
Token | Bern |
Token ID | 6206 |
Feature activation | -8.50e+00 |
Pos logit contributions | |
ォ | +0.774 |
kefeller | +0.694 |
ruary | +0.649 |
hester | +0.613 |
Nebula | +0.576 |
Neg logit contributions | |
ura | -0.675 |
uable | -0.618 |
pora | -0.605 |
veland | -0.597 |
oto | -0.561 |
Token | ese |
Token ID | 2771 |
Feature activation | +3.17e+00 |
Pos logit contributions | |
ォ | +8.129 |
kefeller | +7.275 |
ruary | +7.013 |
hester | +6.680 |
intern | +6.232 |
Neg logit contributions | |
ura | -6.207 |
uable | -5.777 |
pora | -5.636 |
veland | -5.540 |
teenth | -5.084 |
Token | mountain |
Token ID | 8598 |
Feature activation | -3.90e-01 |
Pos logit contributions | |
ura | +2.631 |
uable | +2.390 |
pora | +2.336 |
veland | +2.308 |
oto | +2.194 |
Neg logit contributions | |
ォ | -2.943 |
kefeller | -2.647 |
ruary | -2.478 |
hester | -2.314 |
Nebula | -2.158 |
Token | dog |
Token ID | 3290 |
Feature activation | +8.34e-01 |
Pos logit contributions | |
ォ | +0.432 |
kefeller | +0.393 |
ruary | +0.370 |
hester | +0.355 |
Nebula | +0.337 |
Neg logit contributions | |
ura | -0.253 |
uable | -0.226 |
pora | -0.220 |
veland | -0.216 |
aur | -0.198 |
Token | , |
Token ID | 11 |
Feature activation | +7.30e-01 |
Pos logit contributions | |
ura | +0.630 |
uable | +0.567 |
pora | +0.553 |
veland | +0.545 |
oto | +0.515 |
Neg logit contributions | |
ォ | -0.841 |
kefeller | -0.762 |
ruary | -0.718 |
hester | -0.678 |
intern | -0.636 |
Token | Bro |
Token ID | 2806 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
ura | +0.665 |
uable | +0.611 |
pora | +0.598 |
veland | +0.591 |
oto | +0.563 |
Neg logit contributions | |
ォ | -0.625 |
kefeller | -0.553 |
ruary | -0.513 |
hester | -0.478 |
intern | -0.444 |
Token | � |
Token ID | 447 |
Feature activation | +7.87e-02 |
Pos logit contributions | |
ォ | +0.115 |
kefeller | +0.103 |
ruary | +0.097 |
hester | +0.092 |
Nebula | +0.086 |
Neg logit contributions | |
ura | -0.091 |
uable | -0.083 |
pora | -0.081 |
veland | -0.080 |
oto | -0.075 |
Token | � |
Token ID | 251 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
ura | +0.064 |
uable | +0.058 |
pora | +0.056 |
veland | +0.055 |
oto | +0.052 |
Neg logit contributions | |
ォ | -0.074 |
kefeller | -0.068 |
ruary | -0.063 |
hester | -0.060 |
intern | -0.056 |
Token |
|
Token ID | 198 |
Feature activation | +8.90e-02 |
Pos logit contributions | |
ura | +0.119 |
uable | +0.108 |
pora | +0.104 |
veland | +0.103 |
oto | +0.097 |
Neg logit contributions | |
ォ | -0.162 |
kefeller | -0.147 |
ruary | -0.137 |
hester | -0.131 |
Nebula | -0.123 |
Token |
|
Token ID | 198 |
Feature activation | +4.07e-01 |
Pos logit contributions | |
ura | +0.069 |
uable | +0.064 |
pora | +0.062 |
veland | +0.061 |
oto | +0.057 |
Neg logit contributions | |
ォ | -0.086 |
kefeller | -0.076 |
ruary | -0.073 |
hester | -0.069 |
intern | -0.065 |
Token | Jim |
Token ID | 18050 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
ura | +0.341 |
uable | +0.312 |
pora | +0.305 |
veland | +0.301 |
oto | +0.284 |
Neg logit contributions | |
ォ | -0.376 |
kefeller | -0.336 |
ruary | -0.314 |
hester | -0.295 |
Nebula | -0.276 |
Token | Bern |
Token ID | 6206 |
Feature activation | -8.50e+00 |
Pos logit contributions | |
ォ | +1.467 |
kefeller | +1.305 |
ruary | +1.217 |
hester | +1.146 |
Nebula | +1.069 |
Neg logit contributions | |
ura | -1.400 |
uable | -1.288 |
pora | -1.259 |
veland | -1.247 |
oto | -1.174 |
Token | au |
Token ID | 559 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
ォ | +8.065 |
kefeller | +7.289 |
ruary | +6.968 |
hester | +6.689 |
bley | +6.245 |
Neg logit contributions | |
ura | -6.120 |
uable | -5.767 |
pora | -5.679 |
veland | -5.508 |
teenth | -5.065 |
Token | , |
Token ID | 11 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
ura | +0.325 |
uable | +0.293 |
pora | +0.285 |
veland | +0.281 |
oto | +0.262 |
Neg logit contributions | |
ォ | -0.461 |
kefeller | -0.416 |
ruary | -0.392 |
hester | -0.373 |
Nebula | -0.352 |
Token | CEO |
Token ID | 6123 |
Feature activation | -4.94e-02 |
Pos logit contributions | |
ura | +0.829 |
uable | +0.755 |
pora | +0.737 |
veland | +0.730 |
oto | +0.687 |
Neg logit contributions | |
ォ | -0.941 |
kefeller | -0.840 |
ruary | -0.787 |
hester | -0.741 |
Nebula | -0.692 |
Token | of |
Token ID | 286 |
Feature activation | -3.34e-01 |
Pos logit contributions | |
ォ | +0.057 |
kefeller | +0.052 |
ruary | +0.050 |
hester | +0.047 |
Nebula | +0.045 |
Neg logit contributions | |
ura | -0.030 |
uable | -0.026 |
veland | -0.025 |
pora | -0.025 |
aur | -0.023 |
Token | Will |
Token ID | 2561 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
ォ | +0.302 |
kefeller | +0.269 |
ruary | +0.251 |
hester | +0.236 |
intern | +0.220 |
Neg logit contributions | |
ura | -0.287 |
uable | -0.262 |
pora | -0.257 |
veland | -0.254 |
oto | -0.240 |
Token | recall |
Token ID | 10014 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
ォ | +0.045 |
kefeller | +0.039 |
ruary | +0.037 |
hester | +0.035 |
Nebula | +0.032 |
Neg logit contributions | |
ura | -0.043 |
uable | -0.040 |
pora | -0.039 |
veland | -0.039 |
oto | -0.037 |
Token | 1974 |
Token ID | 16489 |
Feature activation | +9.23e-01 |
Pos logit contributions | |
ォ | +1.091 |
kefeller | +0.972 |
ruary | +0.912 |
hester | +0.857 |
Nebula | +0.799 |
Neg logit contributions | |
ura | -1.001 |
uable | -0.920 |
pora | -0.897 |
veland | -0.888 |
oto | -0.835 |
Token | 's |
Token ID | 338 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
ura | +0.648 |
uable | +0.589 |
pora | +0.575 |
veland | +0.561 |
oto | +0.521 |
Neg logit contributions | |
ォ | -0.971 |
kefeller | -0.876 |
ruary | -0.833 |
hester | -0.788 |
intern | -0.749 |
Token | masterpiece |
Token ID | 30669 |
Feature activation | -2.36e+00 |
Pos logit contributions | |
ォ | +0.928 |
kefeller | +0.825 |
ruary | +0.772 |
hester | +0.726 |
intern | +0.678 |
Neg logit contributions | |
ura | -0.941 |
uable | -0.870 |
pora | -0.854 |
veland | -0.852 |
oto | -0.799 |
Token | Young |
Token ID | 6960 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
ォ | +2.405 |
kefeller | +2.166 |
ruary | +2.054 |
hester | +1.942 |
Nebula | +1.837 |
Neg logit contributions | |
ura | -1.733 |
uable | -1.581 |
pora | -1.536 |
veland | -1.517 |
oto | -1.410 |
Token | Frankenstein |
Token ID | 45738 |
Feature activation | -8.47e+00 |
Pos logit contributions | |
ura | +2.846 |
uable | +2.643 |
pora | +2.608 |
veland | +2.581 |
oto | +2.496 |
Neg logit contributions | |
ォ | -1.539 |
kefeller | -1.282 |
ruary | -1.143 |
hester | -1.035 |
bley | -0.918 |
Token | , |
Token ID | 837 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
ォ | +8.074 |
kefeller | +7.160 |
ruary | +6.881 |
hester | +6.437 |
Nebula | +6.225 |
Neg logit contributions | |
ura | -6.181 |
uable | -5.804 |
pora | -5.628 |
veland | -5.553 |
teenth | -5.016 |
Token | containing |
Token ID | 7268 |
Feature activation | +7.97e-01 |
Pos logit contributions | |
ォ | +0.112 |
kefeller | +0.101 |
ruary | +0.094 |
hester | +0.089 |
Nebula | +0.084 |
Neg logit contributions | |
ura | -0.097 |
uable | -0.089 |
pora | -0.087 |
veland | -0.086 |
oto | -0.080 |
Token | the |
Token ID | 262 |
Feature activation | +4.65e-01 |
Pos logit contributions | |
ura | +0.665 |
uable | +0.607 |
pora | +0.592 |
veland | +0.583 |
aur | +0.554 |
Neg logit contributions | |
ォ | -0.739 |
kefeller | -0.662 |
ruary | -0.618 |
hester | -0.582 |
intern | -0.542 |
Token | inspirational |
Token ID | 40840 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
ura | +0.385 |
uable | +0.352 |
pora | +0.344 |
veland | +0.339 |
oto | +0.320 |
Neg logit contributions | |
ォ | -0.434 |
kefeller | -0.389 |
ruary | -0.363 |
hester | -0.342 |
intern | -0.320 |
Token | idea |
Token ID | 2126 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
ura | +1.098 |
uable | +0.998 |
pora | +0.969 |
veland | +0.957 |
oto | +0.910 |
Neg logit contributions | |
ォ | -1.277 |
kefeller | -1.148 |
ruary | -1.072 |
hester | -1.007 |
intern | -0.941 |
Token | that |
Token ID | 326 |
Feature activation | -4.26e-01 |
Pos logit contributions | |
ォ | +0.618 |
kefeller | +0.555 |
ruary | +0.521 |
hester | +0.493 |
Nebula | +0.463 |
Neg logit contributions | |
ura | -0.497 |
uable | -0.452 |
pora | -0.440 |
veland | -0.435 |
oto | -0.409 |
Token | the |
Token ID | 262 |
Feature activation | -5.58e-04 |
Pos logit contributions | |
ォ | +0.398 |
kefeller | +0.356 |
ruary | +0.333 |
hester | +0.314 |
Nebula | +0.294 |
Neg logit contributions | |
ura | -0.352 |
uable | -0.322 |
pora | -0.314 |
veland | -0.311 |
oto | -0.293 |
Token | group |
Token ID | 1448 |
Feature activation | +9.79e-01 |
Pos logit contributions | |
ォ | +0.001 |
kefeller | +0.000 |
ruary | +0.000 |
hester | +0.000 |
Nebula | +0.000 |
Neg logit contributions | |
ura | -0.000 |
uable | -0.000 |
pora | -0.000 |
veland | -0.000 |
oto | -0.000 |
Token | behind |
Token ID | 2157 |
Feature activation | -2.05e+00 |
Pos logit contributions | |
ura | +0.799 |
uable | +0.729 |
pora | +0.713 |
veland | +0.702 |
aur | +0.662 |
Neg logit contributions | |
ォ | -0.928 |
kefeller | -0.833 |
ruary | -0.778 |
hester | -0.734 |
Nebula | -0.688 |
Token | the |
Token ID | 262 |
Feature activation | -2.53e-01 |
Pos logit contributions | |
ォ | +1.908 |
kefeller | +1.704 |
ruary | +1.596 |
hester | +1.503 |
Nebula | +1.408 |
Neg logit contributions | |
ura | -1.705 |
uable | -1.558 |
pora | -1.522 |
veland | -1.507 |
oto | -1.418 |
Token | cyber |
Token ID | 10075 |
Feature activation | -8.47e+00 |
Pos logit contributions | |
ォ | +0.239 |
kefeller | +0.214 |
ruary | +0.200 |
hester | +0.189 |
Nebula | +0.176 |
Neg logit contributions | |
ura | -0.208 |
uable | -0.190 |
pora | -0.185 |
veland | -0.183 |
oto | -0.172 |
Token | - |
Token ID | 12 |
Feature activation | -6.90e-01 |
Pos logit contributions | |
ォ | +7.254 |
kefeller | +6.385 |
ruary | +6.064 |
hester | +5.679 |
intern | +5.444 |
Neg logit contributions | |
ura | -7.158 |
uable | -6.654 |
veland | -6.543 |
pora | -6.490 |
oto | -6.061 |
Token | attack |
Token ID | 20358 |
Feature activation | -6.71e-01 |
Pos logit contributions | |
ォ | +0.635 |
kefeller | +0.567 |
ruary | +0.528 |
hester | +0.495 |
Nebula | +0.466 |
Neg logit contributions | |
ura | -0.586 |
uable | -0.535 |
pora | -0.523 |
veland | -0.514 |
aur | -0.491 |
Token | was |
Token ID | 373 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
ォ | +0.637 |
kefeller | +0.571 |
ruary | +0.535 |
hester | +0.505 |
Nebula | +0.473 |
Neg logit contributions | |
ura | -0.544 |
uable | -0.496 |
pora | -0.484 |
veland | -0.479 |
oto | -0.450 |
Token | the |
Token ID | 262 |
Feature activation | -4.01e-01 |
Pos logit contributions | |
ォ | +1.082 |
kefeller | +0.969 |
ruary | +0.912 |
hester | +0.860 |
Nebula | +0.811 |
Neg logit contributions | |
ura | -0.909 |
uable | -0.828 |
pora | -0.808 |
veland | -0.800 |
oto | -0.751 |
Token | same |
Token ID | 976 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
ォ | +0.384 |
kefeller | +0.344 |
ruary | +0.323 |
hester | +0.304 |
Nebula | +0.286 |
Neg logit contributions | |
ura | -0.323 |
uable | -0.295 |
pora | -0.287 |
veland | -0.284 |
oto | -0.267 |
Token | � |
Token ID | 250 |
Feature activation | +4.96e-01 |
Pos logit contributions | |
ura | +1.410 |
uable | +1.298 |
pora | +1.270 |
veland | +1.257 |
oto | +1.190 |
Neg logit contributions | |
ォ | -1.368 |
kefeller | -1.211 |
ruary | -1.127 |
hester | -1.056 |
Nebula | -0.982 |
Token | Do |
Token ID | 5211 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
ura | +0.403 |
uable | +0.368 |
pora | +0.359 |
veland | +0.355 |
oto | +0.334 |
Neg logit contributions | |
ォ | -0.471 |
kefeller | -0.422 |
ruary | -0.395 |
hester | -0.373 |
Nebula | -0.350 |
Token | you |
Token ID | 345 |
Feature activation | +4.66e+00 |
Pos logit contributions | |
ォ | +1.019 |
kefeller | +0.906 |
ruary | +0.846 |
hester | +0.795 |
Nebula | +0.742 |
Neg logit contributions | |
ura | -1.006 |
uable | -0.926 |
pora | -0.904 |
veland | -0.895 |
oto | -0.844 |
Token | feel |
Token ID | 1254 |
Feature activation | +8.85e-01 |
Pos logit contributions | |
ura | +3.299 |
uable | +2.961 |
pora | +2.876 |
veland | +2.844 |
oto | +2.669 |
Neg logit contributions | |
ォ | -4.898 |
kefeller | -4.437 |
ruary | -4.179 |
hester | -3.973 |
Nebula | -3.736 |
Token | the |
Token ID | 262 |
Feature activation | +5.39e-01 |
Pos logit contributions | |
ura | +0.693 |
uable | +0.630 |
pora | +0.615 |
veland | +0.607 |
oto | +0.570 |
Neg logit contributions | |
ォ | -0.864 |
kefeller | -0.777 |
ruary | -0.730 |
hester | -0.690 |
Nebula | -0.649 |
Token | Bern |
Token ID | 6206 |
Feature activation | -8.46e+00 |
Pos logit contributions | |
ura | +0.399 |
uable | +0.361 |
pora | +0.351 |
veland | +0.347 |
oto | +0.324 |
Neg logit contributions | |
ォ | -0.550 |
kefeller | -0.497 |
ruary | -0.468 |
hester | -0.444 |
Nebula | -0.419 |
Token | ? |
Token ID | 30 |
Feature activation | +6.51e-02 |
Pos logit contributions | |
ォ | +8.719 |
kefeller | +7.751 |
ruary | +7.498 |
hester | +7.091 |
intern | +6.757 |
Neg logit contributions | |
ura | -5.562 |
uable | -5.154 |
pora | -5.003 |
veland | -4.976 |
teenth | -4.609 |
Token | � |
Token ID | 447 |
Feature activation | +7.49e-01 |
Pos logit contributions | |
ura | +0.046 |
uable | +0.042 |
pora | +0.041 |
veland | +0.040 |
oto | +0.037 |
Neg logit contributions | |
ォ | -0.068 |
kefeller | -0.062 |
ruary | -0.058 |
hester | -0.055 |
Nebula | -0.052 |
Token | � |
Token ID | 251 |
Feature activation | +5.22e-01 |
Pos logit contributions | |
ura | +0.620 |
uable | +0.563 |
pora | +0.547 |
veland | +0.539 |
oto | +0.512 |
Neg logit contributions | |
ォ | -0.700 |
kefeller | -0.636 |
ruary | -0.589 |
hester | -0.558 |
Nebula | -0.520 |
Token | also |
Token ID | 635 |
Feature activation | +2.60e+00 |
Pos logit contributions | |
ura | +0.423 |
uable | +0.386 |
pora | +0.376 |
veland | +0.371 |
oto | +0.350 |
Neg logit contributions | |
ォ | -0.497 |
kefeller | -0.446 |
ruary | -0.417 |
hester | -0.394 |
Nebula | -0.369 |
Token | included |
Token ID | 3017 |
Feature activation | +2.80e+00 |
Pos logit contributions | |
ura | +1.863 |
uable | +1.662 |
pora | +1.621 |
veland | +1.598 |
aur | +1.492 |
Neg logit contributions | |
ォ | -2.733 |
kefeller | -2.487 |
ruary | -2.335 |
hester | -2.208 |
Nebula | -2.083 |
Token | from |
Token ID | 422 |
Feature activation | -2.92e+00 |
Pos logit contributions | |
ォ | +0.089 |
kefeller | +0.080 |
ruary | +0.076 |
hester | +0.072 |
Nebula | +0.068 |
Neg logit contributions | |
ura | -0.059 |
uable | -0.053 |
pora | -0.052 |
veland | -0.051 |
oto | -0.047 |
Token | the |
Token ID | 262 |
Feature activation | +2.02e-01 |
Pos logit contributions | |
ォ | +2.553 |
kefeller | +2.280 |
ruary | +2.111 |
hester | +1.995 |
Nebula | +1.880 |
Neg logit contributions | |
ura | -2.543 |
uable | -2.338 |
pora | -2.300 |
veland | -2.264 |
oto | -2.137 |
Token | Harvard |
Token ID | 11131 |
Feature activation | -4.57e+00 |
Pos logit contributions | |
ura | +0.191 |
uable | +0.176 |
pora | +0.173 |
veland | +0.171 |
oto | +0.162 |
Neg logit contributions | |
ォ | -0.165 |
kefeller | -0.145 |
ruary | -0.134 |
hester | -0.125 |
Nebula | -0.115 |
Token | - |
Token ID | 12 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
ォ | +4.218 |
kefeller | +3.784 |
ruary | +3.537 |
hester | +3.335 |
Nebula | +3.217 |
Neg logit contributions | |
ura | -3.735 |
uable | -3.419 |
pora | -3.349 |
veland | -3.307 |
aur | -3.107 |
Token | Smith |
Token ID | 17919 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
ura | +0.124 |
uable | +0.115 |
pora | +0.113 |
veland | +0.112 |
oto | +0.107 |
Neg logit contributions | |
ォ | -0.093 |
kefeller | -0.081 |
ruary | -0.074 |
hester | -0.069 |
intern | -0.063 |
Token | sonian |
Token ID | 35202 |
Feature activation | -8.45e+00 |
Pos logit contributions | |
ォ | +0.398 |
kefeller | +0.238 |
ruary | +0.133 |
hester | +0.062 |
sonian | +0.000 |
Neg logit contributions | |
ura | -2.779 |
uable | -2.661 |
pora | -2.635 |
veland | -2.606 |
oto | -2.536 |
Token | Center |
Token ID | 3337 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
ォ | +5.591 |
kefeller | +4.831 |
ruary | +4.446 |
hester | +4.237 |
sonian | +4.148 |
Neg logit contributions | |
ura | -8.660 |
pora | -8.215 |
uable | -8.157 |
veland | -7.756 |
teenth | -7.512 |
Token | for |
Token ID | 329 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
ォ | +1.270 |
kefeller | +1.164 |
ruary | +1.104 |
hester | +1.055 |
Nebula | +1.007 |
Neg logit contributions | |
ura | -0.679 |
uable | -0.601 |
pora | -0.581 |
veland | -0.570 |
oto | -0.524 |
Token | Ast |
Token ID | 8304 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
ura | +0.023 |
uable | +0.022 |
pora | +0.021 |
veland | +0.021 |
oto | +0.020 |
Neg logit contributions | |
ォ | -0.014 |
kefeller | -0.012 |
ruary | -0.011 |
hester | -0.010 |
Nebula | -0.010 |
Token | roph |
Token ID | 10051 |
Feature activation | -5.77e+00 |
Pos logit contributions | |
ura | +2.088 |
uable | +1.956 |
pora | +1.940 |
veland | +1.925 |
teenth | +1.809 |
Neg logit contributions | |
ォ | -1.568 |
kefeller | -1.349 |
ruary | -1.262 |
hester | -1.167 |
Nebula | -1.092 |
Token | ysics |
Token ID | 23154 |
Feature activation | -4.22e+00 |
Pos logit contributions | |
ォ | +4.584 |
kefeller | +3.936 |
ruary | +3.842 |
hester | +3.463 |
Nebula | +3.420 |
Neg logit contributions | |
ura | -5.031 |
uable | -4.874 |
veland | -4.784 |
pora | -4.749 |
teenth | -4.505 |
Token | will |
Token ID | 481 |
Feature activation | -3.58e-02 |
Pos logit contributions | |
ura | +1.541 |
uable | +1.388 |
pora | +1.352 |
veland | +1.333 |
oto | +1.249 |
Neg logit contributions | |
ォ | -2.149 |
kefeller | -1.944 |
ruary | -1.830 |
hester | -1.736 |
intern | -1.632 |
Token | be |
Token ID | 307 |
Feature activation | +2.71e+00 |
Pos logit contributions | |
ォ | +0.033 |
kefeller | +0.029 |
ruary | +0.027 |
hester | +0.026 |
Nebula | +0.024 |
Neg logit contributions | |
ura | -0.030 |
uable | -0.028 |
pora | -0.027 |
veland | -0.027 |
oto | -0.025 |
Token | joined |
Token ID | 5399 |
Feature activation | +3.98e-01 |
Pos logit contributions | |
ura | +2.008 |
uable | +1.804 |
pora | +1.758 |
veland | +1.742 |
oto | +1.627 |
Neg logit contributions | |
ォ | -2.774 |
kefeller | -2.499 |
ruary | -2.354 |
hester | -2.225 |
intern | -2.090 |
Token | by |
Token ID | 416 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
ura | +0.287 |
uable | +0.258 |
pora | +0.250 |
veland | +0.247 |
oto | +0.232 |
Neg logit contributions | |
ォ | -0.415 |
kefeller | -0.375 |
ruary | -0.352 |
hester | -0.335 |
Nebula | -0.316 |
Token | Jim |
Token ID | 5395 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
ォ | +1.305 |
kefeller | +1.165 |
ruary | +1.089 |
hester | +1.026 |
Nebula | +0.965 |
Neg logit contributions | |
ura | -1.205 |
uable | -1.105 |
pora | -1.079 |
veland | -1.068 |
oto | -1.006 |
Token | Hub |
Token ID | 14699 |
Feature activation | -8.41e+00 |
Pos logit contributions | |
ォ | +1.662 |
kefeller | +1.463 |
ruary | +1.355 |
hester | +1.265 |
Nebula | +1.171 |
Neg logit contributions | |
ura | -1.895 |
uable | -1.756 |
pora | -1.717 |
veland | -1.705 |
oto | -1.613 |
Token | ay |
Token ID | 323 |
Feature activation | +4.69e+00 |
Pos logit contributions | |
ォ | +7.930 |
kefeller | +7.324 |
ruary | +6.940 |
hester | +6.576 |
bley | +6.288 |
Neg logit contributions | |
ura | -5.931 |
uable | -5.622 |
pora | -5.399 |
veland | -5.320 |
teenth | -5.060 |
Token | and |
Token ID | 290 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
ura | +3.305 |
uable | +2.921 |
pora | +2.850 |
veland | +2.819 |
oto | +2.643 |
Neg logit contributions | |
ォ | -4.964 |
kefeller | -4.503 |
ruary | -4.276 |
hester | -4.048 |
Nebula | -3.801 |
Token | the |
Token ID | 262 |
Feature activation | +3.14e-01 |
Pos logit contributions | |
ォ | +0.143 |
kefeller | +0.126 |
ruary | +0.117 |
hester | +0.109 |
Nebula | +0.100 |
Neg logit contributions | |
ura | -0.156 |
uable | -0.144 |
pora | -0.141 |
veland | -0.140 |
oto | -0.133 |
Token | late |
Token ID | 2739 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
ura | +0.257 |
uable | +0.235 |
pora | +0.229 |
veland | +0.226 |
oto | +0.213 |
Neg logit contributions | |
ォ | -0.296 |
kefeller | -0.265 |
ruary | -0.248 |
hester | -0.234 |
Nebula | -0.219 |
Token | John |
Token ID | 1757 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
ォ | +1.363 |
kefeller | +1.211 |
ruary | +1.127 |
hester | +1.060 |
Nebula | +0.993 |
Neg logit contributions | |
ura | -1.348 |
uable | -1.237 |
pora | -1.212 |
veland | -1.198 |
oto | -1.133 |
Token | mo |
Token ID | 5908 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
ura | +0.704 |
uable | +0.612 |
pora | +0.588 |
veland | +0.576 |
oto | +0.516 |
Neg logit contributions | |
ォ | -1.679 |
kefeller | -1.546 |
ruary | -1.473 |
hester | -1.414 |
Nebula | -1.349 |
Token | L |
Token ID | 406 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
ura | +2.806 |
uable | +2.557 |
pora | +2.497 |
veland | +2.474 |
oto | +2.344 |
Neg logit contributions | |
ォ | -3.049 |
kefeller | -2.712 |
ruary | -2.538 |
hester | -2.392 |
Nebula | -2.232 |
Token | asso |
Token ID | 28372 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
ura | +0.192 |
uable | +0.176 |
pora | +0.172 |
veland | +0.171 |
oto | +0.159 |
Neg logit contributions | |
ォ | -0.221 |
kefeller | -0.200 |
ruary | -0.186 |
hester | -0.177 |
intern | -0.165 |
Token | and |
Token ID | 290 |
Feature activation | -6.66e-02 |
Pos logit contributions | |
ura | +2.201 |
uable | +1.942 |
pora | +1.886 |
veland | +1.869 |
oto | +1.751 |
Neg logit contributions | |
ォ | -3.523 |
kefeller | -3.206 |
ruary | -3.042 |
hester | -2.880 |
intern | -2.725 |
Token | Lenin |
Token ID | 22899 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
ォ | +0.061 |
kefeller | +0.054 |
ruary | +0.051 |
hester | +0.048 |
Nebula | +0.044 |
Neg logit contributions | |
ura | -0.056 |
uable | -0.052 |
pora | -0.050 |
veland | -0.050 |
oto | -0.047 |
Token | Moreno |
Token ID | 43269 |
Feature activation | +9.33e+00 |
Pos logit contributions | |
ォ | +4.394 |
kefeller | +3.971 |
ruary | +3.728 |
hester | +3.533 |
intern | +3.332 |
Neg logit contributions | |
ura | -3.787 |
uable | -3.511 |
veland | -3.425 |
pora | -3.391 |
teenth | -3.170 |
Token | , |
Token ID | 11 |
Feature activation | +8.73e-01 |
Pos logit contributions | |
ura | +5.660 |
pora | +4.858 |
uable | +4.767 |
veland | +4.720 |
oto | +4.462 |
Neg logit contributions | |
ォ | -10.417 |
kefeller | -9.417 |
ruary | -8.822 |
hester | -8.527 |
�� | -8.256 |
Token | scheduled |
Token ID | 7530 |
Feature activation | +3.64e+00 |
Pos logit contributions | |
ura | +0.707 |
uable | +0.645 |
pora | +0.629 |
veland | +0.622 |
oto | +0.585 |
Neg logit contributions | |
ォ | -0.833 |
kefeller | -0.745 |
ruary | -0.698 |
hester | -0.659 |
Nebula | -0.617 |
Token | for |
Token ID | 329 |
Feature activation | +8.24e-01 |
Pos logit contributions | |
ura | +2.168 |
uable | +1.897 |
pora | +1.854 |
veland | +1.815 |
oto | +1.685 |
Neg logit contributions | |
ォ | -4.252 |
kefeller | -3.870 |
ruary | -3.621 |
hester | -3.493 |
Nebula | -3.342 |
Token | Sunday |
Token ID | 3502 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
ura | +0.705 |
uable | +0.646 |
pora | +0.632 |
veland | +0.625 |
oto | +0.590 |
Neg logit contributions | |
ォ | -0.746 |
kefeller | -0.665 |
ruary | -0.622 |
hester | -0.584 |
Nebula | -0.546 |
Token | . |
Token ID | 13 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
ura | +1.277 |
uable | +1.134 |
pora | +1.104 |
veland | +1.083 |
oto | +1.013 |
Neg logit contributions | |
ォ | -2.043 |
kefeller | -1.857 |
ruary | -1.740 |
hester | -1.670 |
Nebula | -1.575 |
Token | in |
Token ID | 287 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
ura | +1.095 |
uable | +0.977 |
pora | +0.955 |
veland | +0.941 |
oto | +0.884 |
Neg logit contributions | |
ォ | -1.585 |
kefeller | -1.435 |
ruary | -1.347 |
hester | -1.284 |
Nebula | -1.210 |
Token | front |
Token ID | 2166 |
Feature activation | -2.14e+00 |
Pos logit contributions | |
ura | +0.926 |
uable | +0.845 |
pora | +0.826 |
veland | +0.817 |
oto | +0.773 |
Neg logit contributions | |
ォ | -1.024 |
kefeller | -0.914 |
ruary | -0.854 |
hester | -0.806 |
intern | -0.750 |
Token | of |
Token ID | 286 |
Feature activation | +4.80e-02 |
Pos logit contributions | |
ォ | +2.442 |
kefeller | +2.230 |
ruary | +2.112 |
hester | +2.020 |
intern | +1.913 |
Neg logit contributions | |
ura | -1.347 |
uable | -1.188 |
pora | -1.152 |
veland | -1.135 |
oto | -1.045 |
Token | the |
Token ID | 262 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
ura | +0.039 |
uable | +0.035 |
pora | +0.035 |
veland | +0.034 |
oto | +0.032 |
Neg logit contributions | |
ォ | -0.046 |
kefeller | -0.041 |
ruary | -0.039 |
hester | -0.036 |
intern | -0.034 |
Token | Shaw |
Token ID | 18193 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
ura | +0.482 |
uable | +0.439 |
pora | +0.430 |
veland | +0.424 |
oto | +0.401 |
Neg logit contributions | |
ォ | -0.538 |
kefeller | -0.480 |
ruary | -0.451 |
hester | -0.424 |
intern | -0.395 |
Token | Amen |
Token ID | 34717 |
Feature activation | +7.53e+00 |
Pos logit contributions | |
ura | +1.799 |
uable | +1.631 |
pora | +1.610 |
veland | +1.586 |
oto | +1.511 |
Neg logit contributions | |
ォ | -1.834 |
kefeller | -1.632 |
ruary | -1.525 |
hester | -1.428 |
�� | -1.325 |
Token | ities |
Token ID | 871 |
Feature activation | +2.21e+00 |
Pos logit contributions | |
ura | +8.426 |
pora | +7.674 |
uable | +7.666 |
veland | +7.454 |
oto | +7.361 |
Neg logit contributions | |
ォ | -4.664 |
kefeller | -3.950 |
ruary | -3.564 |
hester | -3.229 |
�� | -3.016 |
Token | Building |
Token ID | 11819 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
ura | +1.976 |
uable | +1.804 |
pora | +1.775 |
veland | +1.744 |
aur | +1.671 |
Neg logit contributions | |
ォ | -1.921 |
kefeller | -1.710 |
ruary | -1.587 |
hester | -1.497 |
bley | -1.377 |
Token | , |
Token ID | 11 |
Feature activation | +5.63e-01 |
Pos logit contributions | |
ォ | +1.539 |
kefeller | +1.390 |
ruary | +1.310 |
hester | +1.242 |
Nebula | +1.171 |
Neg logit contributions | |
ura | -1.110 |
uable | -1.003 |
pora | -0.977 |
veland | -0.964 |
oto | -0.901 |
Token | also |
Token ID | 635 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
ura | +0.457 |
uable | +0.415 |
pora | +0.406 |
veland | +0.400 |
oto | +0.378 |
Neg logit contributions | |
ォ | -0.536 |
kefeller | -0.480 |
ruary | -0.449 |
hester | -0.425 |
Nebula | -0.397 |
Token | called |
Token ID | 1444 |
Feature activation | +8.36e-01 |
Pos logit contributions | |
ura | +1.576 |
uable | +1.416 |
pora | +1.376 |
veland | +1.363 |
oto | +1.276 |
Neg logit contributions | |
ォ | -2.182 |
kefeller | -1.979 |
ruary | -1.860 |
hester | -1.766 |
Nebula | -1.658 |
Token | d |
Token ID | 67 |
Feature activation | -2.78e+00 |
Pos logit contributions | |
ura | +0.691 |
uable | +0.639 |
pora | +0.625 |
veland | +0.619 |
oto | +0.582 |
Neg logit contributions | |
ォ | -0.705 |
kefeller | -0.626 |
ruary | -0.586 |
hester | -0.551 |
intern | -0.516 |
Token | 4 |
Token ID | 604 |
Feature activation | +9.66e-01 |
Pos logit contributions | |
ォ | +2.643 |
kefeller | +2.352 |
ruary | +2.220 |
hester | +2.084 |
Nebula | +1.965 |
Neg logit contributions | |
ura | -2.241 |
uable | -2.054 |
pora | -2.002 |
veland | -1.986 |
oto | -1.852 |
Token | . |
Token ID | 13 |
Feature activation | +6.87e-01 |
Pos logit contributions | |
ura | +0.671 |
uable | +0.607 |
pora | +0.589 |
veland | +0.579 |
oto | +0.536 |
Neg logit contributions | |
ォ | -1.026 |
kefeller | -0.926 |
ruary | -0.878 |
hester | -0.836 |
Nebula | -0.795 |
Token | Personnel |
Token ID | 41623 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
ura | +0.617 |
uable | +0.566 |
pora | +0.553 |
veland | +0.549 |
aur | +0.521 |
Neg logit contributions | |
ォ | -0.593 |
kefeller | -0.531 |
ruary | -0.490 |
hester | -0.459 |
intern | -0.426 |
Token | admitting |
Token ID | 22688 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
ura | +1.897 |
uable | +1.715 |
pora | +1.660 |
veland | +1.645 |
aur | +1.546 |
Neg logit contributions | |
ォ | -2.507 |
kefeller | -2.278 |
ruary | -2.136 |
hester | -2.022 |
Nebula | -1.898 |
Token | Scottish |
Token ID | 11905 |
Feature activation | +7.53e+00 |
Pos logit contributions | |
ura | +1.054 |
uable | +0.956 |
pora | +0.931 |
veland | +0.920 |
oto | +0.862 |
Neg logit contributions | |
ォ | -1.375 |
kefeller | -1.239 |
ruary | -1.165 |
hester | -1.103 |
Nebula | -1.038 |
Token | team |
Token ID | 1074 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
ura | +6.170 |
uable | +5.442 |
pora | +5.426 |
veland | +5.303 |
aur | +5.085 |
Neg logit contributions | |
ォ | -6.835 |
kefeller | -6.318 |
ruary | -5.835 |
hester | -5.489 |
�� | -5.208 |
Token | gets |
Token ID | 3011 |
Feature activation | -4.50e-01 |
Pos logit contributions | |
ura | +0.104 |
uable | +0.094 |
pora | +0.092 |
veland | +0.090 |
oto | +0.084 |
Neg logit contributions | |
ォ | -0.142 |
kefeller | -0.128 |
ruary | -0.121 |
hester | -0.114 |
intern | -0.108 |
Token | this |
Token ID | 428 |
Feature activation | +6.66e-01 |
Pos logit contributions | |
ォ | +0.448 |
kefeller | +0.401 |
ruary | +0.378 |
hester | +0.358 |
intern | +0.339 |
Neg logit contributions | |
ura | -0.343 |
uable | -0.312 |
pora | -0.305 |
veland | -0.301 |
oto | -0.281 |
Token | shock |
Token ID | 6380 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
ura | +0.513 |
uable | +0.465 |
pora | +0.454 |
veland | +0.448 |
oto | +0.420 |
Neg logit contributions | |
ォ | -0.661 |
kefeller | -0.595 |
ruary | -0.559 |
hester | -0.529 |
Nebula | -0.498 |
Token | treatment |
Token ID | 3513 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
ォ | +2.285 |
kefeller | +2.036 |
ruary | +1.925 |
hester | +1.817 |
intern | +1.723 |
Neg logit contributions | |
ura | -1.698 |
uable | -1.555 |
pora | -1.522 |
veland | -1.511 |
oto | -1.392 |
Token | . |
Token ID | 13 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
ォ | +0.073 |
kefeller | +0.066 |
ruary | +0.063 |
hester | +0.060 |
Nebula | +0.057 |
Neg logit contributions | |
ura | -0.047 |
uable | -0.042 |
pora | -0.041 |
veland | -0.040 |
oto | -0.037 |
Token | It |
Token ID | 632 |
Feature activation | -4.66e-01 |
Pos logit contributions | |
ォ | +0.113 |
kefeller | +0.101 |
ruary | +0.095 |
hester | +0.090 |
Nebula | +0.084 |
Neg logit contributions | |
ura | -0.095 |
uable | -0.087 |
pora | -0.085 |
veland | -0.084 |
oto | -0.079 |
Token | also |
Token ID | 635 |
Feature activation | +2.63e+00 |
Pos logit contributions | |
ォ | +0.444 |
kefeller | +0.398 |
ruary | +0.373 |
hester | +0.352 |
Nebula | +0.330 |
Neg logit contributions | |
ura | -0.377 |
uable | -0.343 |
pora | -0.335 |
veland | -0.331 |
oto | -0.312 |
Token | has |
Token ID | 468 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
ura | +1.915 |
uable | +1.724 |
pora | +1.679 |
veland | +1.662 |
oto | +1.539 |
Neg logit contributions | |
ォ | -2.739 |
kefeller | -2.482 |
ruary | -2.329 |
hester | -2.194 |
�� | -2.083 |
Token | the |
Token ID | 262 |
Feature activation | +4.97e-01 |
Pos logit contributions | |
ォ | +1.239 |
kefeller | +1.110 |
ruary | +1.044 |
hester | +0.987 |
Nebula | +0.931 |
Neg logit contributions | |
ura | -1.031 |
uable | -0.940 |
pora | -0.916 |
veland | -0.909 |
oto | -0.853 |
Token | exp |
Token ID | 1033 |
Feature activation | +7.57e+00 |
Pos logit contributions | |
ura | +0.339 |
uable | +0.304 |
pora | +0.295 |
veland | +0.291 |
oto | +0.270 |
Neg logit contributions | |
ォ | -0.535 |
kefeller | -0.486 |
ruary | -0.460 |
hester | -0.437 |
Nebula | -0.415 |
Token | o |
Token ID | 78 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
ura | +4.565 |
uable | +4.017 |
veland | +3.751 |
pora | +3.725 |
oto | +3.569 |
Neg logit contributions | |
ォ | -8.832 |
kefeller | -8.140 |
ruary | -7.561 |
hester | -7.247 |
�� | -6.989 |
Token | hall |
Token ID | 6899 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
ura | +2.467 |
uable | +2.233 |
pora | +2.166 |
veland | +2.140 |
oto | +2.014 |
Neg logit contributions | |
ォ | -3.267 |
kefeller | -2.948 |
ruary | -2.762 |
hester | -2.623 |
Nebula | -2.460 |
Token | floor |
Token ID | 4314 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
ォ | +1.472 |
kefeller | +1.328 |
ruary | +1.256 |
hester | +1.190 |
Nebula | +1.130 |
Neg logit contributions | |
ura | -1.049 |
uable | -0.949 |
pora | -0.929 |
veland | -0.921 |
oto | -0.851 |
Token | map |
Token ID | 3975 |
Feature activation | +3.71e+00 |
Pos logit contributions | |
ura | +1.097 |
uable | +0.990 |
pora | +0.963 |
veland | +0.950 |
oto | +0.887 |
Neg logit contributions | |
ォ | -1.558 |
kefeller | -1.409 |
ruary | -1.328 |
hester | -1.260 |
Nebula | -1.189 |
Token | on |
Token ID | 319 |
Feature activation | +8.79e-01 |
Pos logit contributions | |
ura | +2.596 |
uable | +2.333 |
pora | +2.252 |
veland | +2.220 |
oto | +2.083 |
Neg logit contributions | |
ォ | -3.941 |
kefeller | -3.583 |
ruary | -3.370 |
hester | -3.208 |
Nebula | -3.020 |
Token | it |
Token ID | 270 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
ォ | +2.786 |
kefeller | +2.498 |
ruary | +2.337 |
hester | +2.246 |
intern | +2.149 |
Neg logit contributions | |
ura | -2.178 |
uable | -1.999 |
pora | -1.957 |
veland | -1.930 |
oto | -1.786 |
Token | put |
Token ID | 1234 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
ura | +1.230 |
uable | +1.108 |
pora | +1.071 |
veland | +1.065 |
oto | +0.996 |
Neg logit contributions | |
ォ | -1.705 |
kefeller | -1.548 |
ruary | -1.454 |
hester | -1.381 |
Nebula | -1.307 |
Token | Brock |
Token ID | 20501 |
Feature activation | -4.16e+00 |
Pos logit contributions | |
ura | +0.120 |
uable | +0.109 |
pora | +0.106 |
veland | +0.105 |
oto | +0.098 |
Neg logit contributions | |
ォ | -0.153 |
kefeller | -0.137 |
ruary | -0.129 |
hester | -0.122 |
Nebula | -0.115 |
Token | way |
Token ID | 1014 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
ォ | +3.872 |
kefeller | +3.439 |
ruary | +3.265 |
hester | +3.091 |
Nebula | +2.905 |
Neg logit contributions | |
ura | -3.330 |
uable | -3.061 |
pora | -3.029 |
veland | -2.977 |
oto | -2.759 |
Token | , |
Token ID | 11 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
ォ | +1.658 |
kefeller | +1.497 |
ruary | +1.409 |
hester | +1.350 |
intern | +1.267 |
Neg logit contributions | |
ura | -1.166 |
uable | -1.067 |
pora | -1.039 |
veland | -1.016 |
oto | -0.950 |
Token | Og |
Token ID | 25686 |
Feature activation | +7.52e+00 |
Pos logit contributions | |
ura | +0.223 |
uable | +0.204 |
pora | +0.199 |
veland | +0.196 |
oto | +0.185 |
Neg logit contributions | |
ォ | -0.255 |
kefeller | -0.228 |
ruary | -0.213 |
hester | -0.202 |
Nebula | -0.190 |
Token | den |
Token ID | 6559 |
Feature activation | -7.49e-01 |
Pos logit contributions | |
ura | +4.746 |
uable | +3.971 |
pora | +3.863 |
veland | +3.848 |
oto | +3.646 |
Neg logit contributions | |
ォ | -8.525 |
kefeller | -7.795 |
ruary | -7.397 |
hester | -6.971 |
�� | -6.856 |
Token | ville |
Token ID | 4244 |
Feature activation | -2.87e+00 |
Pos logit contributions | |
ォ | +0.790 |
kefeller | +0.716 |
ruary | +0.676 |
hester | +0.642 |
Nebula | +0.607 |
Neg logit contributions | |
ura | -0.529 |
uable | -0.476 |
pora | -0.463 |
veland | -0.456 |
oto | -0.425 |
Token | and |
Token ID | 290 |
Feature activation | -5.54e-01 |
Pos logit contributions | |
ォ | +2.945 |
kefeller | +2.661 |
ruary | +2.514 |
hester | +2.400 |
Nebula | +2.257 |
Neg logit contributions | |
ura | -2.059 |
uable | -1.878 |
pora | -1.822 |
veland | -1.789 |
oto | -1.667 |
Token | North |
Token ID | 2258 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
ォ | +0.504 |
kefeller | +0.450 |
ruary | +0.420 |
hester | +0.395 |
Nebula | +0.371 |
Neg logit contributions | |
ura | -0.470 |
uable | -0.431 |
pora | -0.422 |
veland | -0.417 |
oto | -0.393 |
Token | H |
Token ID | 367 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
ura | +1.003 |
uable | +0.919 |
pora | +0.898 |
veland | +0.890 |
oto | +0.841 |
Neg logit contributions | |
ォ | -1.042 |
kefeller | -0.926 |
ruary | -0.863 |
hester | -0.811 |
Nebula | -0.756 |
Token |
|
Token ID | 198 |
Feature activation | -8.88e-02 |
Pos logit contributions | |
ォ | +0.380 |
kefeller | +0.341 |
ruary | +0.320 |
hester | +0.302 |
Nebula | +0.284 |
Neg logit contributions | |
ura | -0.316 |
uable | -0.288 |
pora | -0.281 |
veland | -0.278 |
oto | -0.261 |
Token |
|
Token ID | 198 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
ォ | +0.085 |
kefeller | +0.075 |
ruary | +0.071 |
hester | +0.068 |
intern | +0.065 |
Neg logit contributions | |
ura | -0.070 |
uable | -0.065 |
pora | -0.063 |
veland | -0.062 |
oto | -0.058 |
Token | And |
Token ID | 1870 |
Feature activation | -8.10e-01 |
Pos logit contributions | |
ura | +0.133 |
uable | +0.120 |
pora | +0.117 |
veland | +0.115 |
oto | +0.108 |
Neg logit contributions | |
ォ | -0.187 |
kefeller | -0.169 |
ruary | -0.159 |
hester | -0.151 |
Nebula | -0.142 |
Token | so |
Token ID | 523 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
ォ | +0.708 |
kefeller | +0.625 |
ruary | +0.587 |
hester | +0.550 |
Nebula | +0.518 |
Neg logit contributions | |
ura | -0.709 |
uable | -0.658 |
pora | -0.642 |
veland | -0.637 |
oto | -0.597 |
Token | we |
Token ID | 356 |
Feature activation | +4.05e-02 |
Pos logit contributions | |
ura | +1.451 |
uable | +1.310 |
pora | +1.280 |
veland | +1.263 |
oto | +1.188 |
Neg logit contributions | |
ォ | -1.905 |
kefeller | -1.721 |
ruary | -1.613 |
hester | -1.525 |
Nebula | -1.434 |
Token | test |
Token ID | 1332 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
ura | +0.032 |
uable | +0.029 |
pora | +0.028 |
veland | +0.028 |
oto | +0.026 |
Neg logit contributions | |
ォ | -0.040 |
kefeller | -0.036 |
ruary | -0.033 |
hester | -0.032 |
Nebula | -0.030 |
Token | out |
Token ID | 503 |
Feature activation | -4.39e-01 |
Pos logit contributions | |
ura | +1.093 |
uable | +0.994 |
pora | +0.968 |
veland | +0.957 |
oto | +0.900 |
Neg logit contributions | |
ォ | -1.346 |
kefeller | -1.211 |
ruary | -1.135 |
hester | -1.073 |
Nebula | -1.007 |
Token | our |
Token ID | 674 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
ォ | +0.423 |
kefeller | +0.379 |
ruary | +0.356 |
hester | +0.336 |
Nebula | +0.316 |
Neg logit contributions | |
ura | -0.349 |
uable | -0.319 |
pora | -0.311 |
veland | -0.307 |
oto | -0.289 |
Token | press |
Token ID | 1803 |
Feature activation | +5.34e-01 |
Pos logit contributions | |
ォ | +2.018 |
kefeller | +1.799 |
ruary | +1.696 |
hester | +1.606 |
Nebula | +1.517 |
Neg logit contributions | |
ura | -1.623 |
uable | -1.486 |
pora | -1.453 |
veland | -1.440 |
oto | -1.346 |
Token | credentials |
Token ID | 18031 |
Feature activation | +4.05e-01 |
Pos logit contributions | |
ura | +0.387 |
uable | +0.353 |
pora | +0.343 |
veland | +0.339 |
oto | +0.315 |
Neg logit contributions | |
ォ | -0.551 |
kefeller | -0.497 |
ruary | -0.469 |
hester | -0.445 |
intern | -0.420 |
Token | by |
Token ID | 416 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
ura | +0.281 |
uable | +0.252 |
pora | +0.245 |
veland | +0.241 |
oto | +0.224 |
Neg logit contributions | |
ォ | -0.433 |
kefeller | -0.393 |
ruary | -0.371 |
hester | -0.353 |
Nebula | -0.334 |
Token | T |
Token ID | 309 |
Feature activation | -2.92e-02 |
Pos logit contributions | |
ォ | +0.683 |
kefeller | +0.611 |
ruary | +0.571 |
hester | +0.539 |
Nebula | +0.507 |
Neg logit contributions | |
ura | -0.594 |
uable | -0.544 |
pora | -0.532 |
veland | -0.525 |
oto | -0.494 |
Token | atar |
Token ID | 9459 |
Feature activation | +6.93e-01 |
Pos logit contributions | |
ォ | +0.031 |
kefeller | +0.028 |
ruary | +0.026 |
hester | +0.025 |
intern | +0.024 |
Neg logit contributions | |
ura | -0.020 |
uable | -0.018 |
pora | -0.018 |
veland | -0.018 |
oto | -0.016 |
Token | ( |
Token ID | 357 |
Feature activation | +4.29e-01 |
Pos logit contributions | |
ura | +0.507 |
uable | +0.458 |
pora | +0.446 |
veland | +0.440 |
oto | +0.411 |
Neg logit contributions | |
ォ | -0.714 |
kefeller | -0.645 |
ruary | -0.608 |
hester | -0.577 |
Nebula | -0.544 |
Token | not |
Token ID | 1662 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
ura | +0.347 |
uable | +0.317 |
pora | +0.309 |
veland | +0.305 |
oto | +0.288 |
Neg logit contributions | |
ォ | -0.408 |
kefeller | -0.366 |
ruary | -0.343 |
hester | -0.323 |
Nebula | -0.303 |
Token | to |
Token ID | 284 |
Feature activation | -2.47e-01 |
Pos logit contributions | |
ura | +0.142 |
uable | +0.129 |
pora | +0.126 |
veland | +0.125 |
oto | +0.117 |
Neg logit contributions | |
ォ | -0.172 |
kefeller | -0.154 |
ruary | -0.145 |
hester | -0.137 |
Nebula | -0.128 |
Token | be |
Token ID | 307 |
Feature activation | +2.25e+00 |
Pos logit contributions | |
ォ | +0.216 |
kefeller | +0.195 |
ruary | +0.181 |
hester | +0.172 |
Nebula | +0.158 |
Neg logit contributions | |
ura | -0.219 |
uable | -0.200 |
veland | -0.195 |
pora | -0.194 |
oto | -0.184 |
Token | confused |
Token ID | 10416 |
Feature activation | -6.64e-01 |
Pos logit contributions | |
ura | +1.798 |
uable | +1.609 |
pora | +1.578 |
veland | +1.571 |
aur | +1.468 |
Neg logit contributions | |
ォ | -2.162 |
kefeller | -1.967 |
ruary | -1.823 |
hester | -1.733 |
Nebula | -1.625 |
Token | with |
Token ID | 351 |
Feature activation | -8.90e-01 |
Pos logit contributions | |
ォ | +0.722 |
kefeller | +0.658 |
ruary | +0.620 |
hester | +0.592 |
Nebula | +0.561 |
Neg logit contributions | |
ura | -0.451 |
uable | -0.403 |
pora | -0.387 |
veland | -0.385 |
aur | -0.360 |
Token | the |
Token ID | 262 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
ォ | +0.840 |
kefeller | +0.752 |
ruary | +0.704 |
hester | +0.664 |
Nebula | +0.623 |
Neg logit contributions | |
ura | -0.726 |
uable | -0.664 |
pora | -0.648 |
veland | -0.640 |
oto | -0.603 |
Token | modern |
Token ID | 3660 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
ura | +0.305 |
uable | +0.278 |
pora | +0.271 |
veland | +0.268 |
oto | +0.253 |
Neg logit contributions | |
ォ | -0.356 |
kefeller | -0.319 |
ruary | -0.299 |
hester | -0.282 |
Nebula | -0.263 |
Token | Turk |
Token ID | 8484 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
ォ | +1.635 |
kefeller | +1.449 |
ruary | +1.360 |
hester | +1.284 |
Nebula | +1.215 |
Neg logit contributions | |
ura | -1.430 |
uable | -1.310 |
pora | -1.286 |
veland | -1.269 |
oto | -1.187 |
Token | Coalition |
Token ID | 15135 |
Feature activation | -2.93e+00 |
Pos logit contributions | |
ura | +0.462 |
uable | +0.423 |
pora | +0.414 |
veland | +0.411 |
oto | +0.388 |
Neg logit contributions | |
ォ | -0.460 |
kefeller | -0.407 |
ruary | -0.380 |
hester | -0.356 |
Nebula | -0.331 |
Token | for |
Token ID | 329 |
Feature activation | +6.47e-01 |
Pos logit contributions | |
ォ | +3.196 |
kefeller | +2.895 |
ruary | +2.743 |
hester | +2.608 |
intern | +2.491 |
Neg logit contributions | |
ura | -1.937 |
uable | -1.748 |
pora | -1.685 |
veland | -1.653 |
oto | -1.532 |
Token | the |
Token ID | 262 |
Feature activation | +5.14e-01 |
Pos logit contributions | |
ura | +0.590 |
uable | +0.542 |
pora | +0.531 |
veland | +0.526 |
oto | +0.499 |
Neg logit contributions | |
ォ | -0.552 |
kefeller | -0.487 |
ruary | -0.452 |
hester | -0.423 |
Nebula | -0.392 |
Token | Homeless |
Token ID | 47706 |
Feature activation | -3.12e+00 |
Pos logit contributions | |
ura | +0.548 |
uable | +0.511 |
pora | +0.502 |
veland | +0.498 |
oto | +0.476 |
Neg logit contributions | |
ォ | -0.359 |
kefeller | -0.308 |
ruary | -0.280 |
hester | -0.257 |
Nebula | -0.232 |
Token | , |
Token ID | 11 |
Feature activation | +6.65e-01 |
Pos logit contributions | |
ォ | +3.218 |
kefeller | +2.901 |
ruary | +2.747 |
hester | +2.598 |
intern | +2.452 |
Neg logit contributions | |
ura | -2.252 |
uable | -2.058 |
pora | -1.984 |
veland | -1.954 |
oto | -1.829 |
Token | � |
Token ID | 1587 |
Feature activation | +3.29e+00 |
Pos logit contributions | |
ura | +0.536 |
uable | +0.486 |
pora | +0.475 |
veland | +0.470 |
oto | +0.442 |
Neg logit contributions | |
ォ | -0.637 |
kefeller | -0.573 |
ruary | -0.536 |
hester | -0.507 |
Nebula | -0.476 |
Token | � |
Token ID | 241 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
ura | +3.309 |
uable | +3.036 |
pora | +2.974 |
veland | +2.962 |
aur | +2.822 |
Neg logit contributions | |
ォ | -2.471 |
kefeller | -2.218 |
ruary | -1.984 |
hester | -1.867 |
Nebula | -1.694 |
Token | the |
Token ID | 1169 |
Feature activation | +7.23e-01 |
Pos logit contributions | |
ォ | +0.345 |
kefeller | +0.309 |
ruary | +0.289 |
hester | +0.273 |
intern | +0.257 |
Neg logit contributions | |
ura | -0.293 |
uable | -0.267 |
pora | -0.261 |
veland | -0.258 |
oto | -0.243 |
Token | city |
Token ID | 1748 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
ura | +0.575 |
uable | +0.522 |
pora | +0.508 |
veland | +0.502 |
oto | +0.473 |
Neg logit contributions | |
ォ | -0.700 |
kefeller | -0.630 |
ruary | -0.591 |
hester | -0.559 |
Nebula | -0.522 |
Token | would |
Token ID | 561 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
ura | +0.811 |
uable | +0.734 |
pora | +0.715 |
veland | +0.706 |
aur | +0.662 |
Neg logit contributions | |
ォ | -1.055 |
kefeller | -0.953 |
ruary | -0.898 |
hester | -0.848 |
Nebula | -0.799 |
Token | be |
Token ID | 307 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
ォ | +1.781 |
kefeller | +1.577 |
ruary | +1.477 |
hester | +1.380 |
intern | +1.292 |
Neg logit contributions | |
ura | -1.716 |
uable | -1.578 |
pora | -1.543 |
veland | -1.529 |
oto | -1.441 |
Token | Creek |
Token ID | 13509 |
Feature activation | -3.49e+00 |
Pos logit contributions | |
ura | +3.186 |
uable | +2.861 |
pora | +2.833 |
veland | +2.789 |
aur | +2.655 |
Neg logit contributions | |
ォ | -3.703 |
kefeller | -3.340 |
ruary | -3.125 |
hester | -2.915 |
�� | -2.733 |
Token | Lodge |
Token ID | 27046 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
ォ | +3.199 |
kefeller | +2.827 |
ruary | +2.633 |
hester | +2.527 |
Nebula | +2.414 |
Neg logit contributions | |
ura | -2.848 |
uable | -2.666 |
pora | -2.578 |
veland | -2.551 |
oto | -2.380 |
Token | ( |
Token ID | 357 |
Feature activation | +8.25e-02 |
Pos logit contributions | |
ura | +2.585 |
uable | +2.290 |
pora | +2.248 |
veland | +2.205 |
aur | +2.089 |
Neg logit contributions | |
ォ | -3.696 |
kefeller | -3.364 |
ruary | -3.164 |
hester | -2.986 |
�� | -2.837 |
Token | I |
Token ID | 40 |
Feature activation | -8.68e-01 |
Pos logit contributions | |
ura | +0.063 |
uable | +0.057 |
pora | +0.056 |
veland | +0.055 |
oto | +0.051 |
Neg logit contributions | |
ォ | -0.082 |
kefeller | -0.074 |
ruary | -0.070 |
hester | -0.066 |
Nebula | -0.062 |
Token | think |
Token ID | 892 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
ォ | +0.849 |
kefeller | +0.761 |
ruary | +0.716 |
hester | +0.680 |
bley | +0.640 |
Neg logit contributions | |
ura | -0.667 |
uable | -0.614 |
pora | -0.603 |
veland | -0.585 |
oto | -0.549 |
Token | is |
Token ID | 318 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
ura | +1.221 |
uable | +1.103 |
pora | +1.070 |
veland | +1.065 |
oto | +0.998 |
Neg logit contributions | |
ォ | -1.604 |
kefeller | -1.446 |
ruary | -1.359 |
hester | -1.284 |
intern | -1.206 |
Token | the |
Token ID | 262 |
Feature activation | +6.53e-02 |
Pos logit contributions | |
ura | +1.389 |
uable | +1.263 |
pora | +1.226 |
veland | +1.218 |
oto | +1.145 |
Neg logit contributions | |
ォ | -1.701 |
kefeller | -1.529 |
ruary | -1.436 |
hester | -1.352 |
Nebula | -1.267 |
Token | name |
Token ID | 1438 |
Feature activation | +2.28e+00 |
Pos logit contributions | |
ura | +0.052 |
uable | +0.047 |
pora | +0.046 |
veland | +0.045 |
oto | +0.043 |
Neg logit contributions | |
ォ | -0.063 |
kefeller | -0.057 |
ruary | -0.053 |
hester | -0.050 |
Nebula | -0.047 |
Token | ?) |
Token ID | 10091 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
ura | +1.522 |
uable | +1.356 |
pora | +1.308 |
veland | +1.301 |
oto | +1.207 |
Neg logit contributions | |
ォ | -2.490 |
kefeller | -2.269 |
ruary | -2.153 |
hester | -2.041 |
intern | -1.925 |
Token | down |
Token ID | 866 |
Feature activation | -8.36e-01 |
Pos logit contributions | |
ォ | +0.132 |
kefeller | +0.119 |
ruary | +0.112 |
hester | +0.106 |
Nebula | +0.101 |
Neg logit contributions | |
ura | -0.095 |
uable | -0.086 |
pora | -0.084 |
veland | -0.083 |
oto | -0.077 |
Token | the |
Token ID | 262 |
Feature activation | -1.44e-01 |
Pos logit contributions | |
ォ | +0.814 |
kefeller | +0.730 |
ruary | +0.687 |
hester | +0.651 |
intern | +0.610 |
Neg logit contributions | |
ura | -0.655 |
uable | -0.596 |
pora | -0.584 |
veland | -0.574 |
oto | -0.539 |
Token | , |
Token ID | 11 |
Feature activation | +5.26e-01 |
Pos logit contributions | |
ura | +2.865 |
uable | +2.506 |
pora | +2.422 |
veland | +2.358 |
oto | +2.228 |
Neg logit contributions | |
ォ | -4.914 |
kefeller | -4.500 |
ruary | -4.245 |
hester | -4.052 |
Nebula | -3.833 |
Token | using |
Token ID | 1262 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
ura | +0.408 |
uable | +0.370 |
pora | +0.361 |
veland | +0.357 |
oto | +0.334 |
Neg logit contributions | |
ォ | -0.519 |
kefeller | -0.467 |
ruary | -0.438 |
hester | -0.415 |
Nebula | -0.390 |
Token | a |
Token ID | 257 |
Feature activation | -5.96e-01 |
Pos logit contributions | |
ォ | +1.008 |
kefeller | +0.905 |
ruary | +0.848 |
hester | +0.803 |
Nebula | +0.755 |
Neg logit contributions | |
ura | -0.814 |
uable | -0.740 |
pora | -0.722 |
veland | -0.714 |
oto | -0.670 |
Token | block |
Token ID | 2512 |
Feature activation | -9.07e-01 |
Pos logit contributions | |
ォ | +0.587 |
kefeller | +0.528 |
ruary | +0.495 |
hester | +0.469 |
Nebula | +0.441 |
Neg logit contributions | |
ura | -0.461 |
uable | -0.420 |
pora | -0.410 |
veland | -0.405 |
oto | -0.380 |
Token | of |
Token ID | 286 |
Feature activation | +5.14e-02 |
Pos logit contributions | |
ォ | +0.973 |
kefeller | +0.875 |
ruary | +0.826 |
hester | +0.788 |
intern | +0.750 |
Neg logit contributions | |
ura | -0.623 |
uable | -0.560 |
pora | -0.544 |
veland | -0.539 |
oto | -0.497 |
Token | aluminum |
Token ID | 15955 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
ura | +0.040 |
uable | +0.036 |
pora | +0.035 |
veland | +0.035 |
oto | +0.033 |
Neg logit contributions | |
ォ | -0.051 |
kefeller | -0.046 |
ruary | -0.043 |
hester | -0.041 |
Nebula | -0.038 |
Token | to |
Token ID | 284 |
Feature activation | -8.97e-03 |
Pos logit contributions | |
ura | +1.397 |
uable | +1.257 |
pora | +1.221 |
veland | +1.200 |
oto | +1.121 |
Neg logit contributions | |
ォ | -2.069 |
kefeller | -1.877 |
ruary | -1.773 |
hester | -1.682 |
Nebula | -1.590 |
Token | delic |
Token ID | 8675 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
ォ | +0.009 |
kefeller | +0.008 |
ruary | +0.007 |
hester | +0.007 |
Nebula | +0.007 |
Neg logit contributions | |
ura | -0.007 |
uable | -0.006 |
pora | -0.006 |
veland | -0.006 |
oto | -0.006 |
Token | ately |
Token ID | 1286 |
Feature activation | +2.26e+00 |
Pos logit contributions | |
ura | +0.240 |
uable | +0.217 |
pora | +0.211 |
veland | +0.209 |
oto | +0.195 |
Neg logit contributions | |
ォ | -0.326 |
kefeller | -0.294 |
ruary | -0.276 |
hester | -0.262 |
Nebula | -0.247 |
Token | set |
Token ID | 900 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
ura | +1.840 |
uable | +1.669 |
pora | +1.625 |
veland | +1.608 |
oto | +1.520 |
Neg logit contributions | |
ォ | -2.144 |
kefeller | -1.933 |
ruary | -1.809 |
hester | -1.714 |
Nebula | -1.600 |
Token | the |
Token ID | 262 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
ura | +0.868 |
uable | +0.789 |
pora | +0.769 |
veland | +0.760 |
oto | +0.715 |
Neg logit contributions | |
ォ | -1.065 |
kefeller | -0.957 |
ruary | -0.899 |
hester | -0.848 |
Nebula | -0.797 |
Token | civil |
Token ID | 3026 |
Feature activation | -2.39e+00 |
Pos logit contributions | |
ura | +1.203 |
uable | +1.090 |
pora | +1.067 |
veland | +1.053 |
aur | +0.992 |
Neg logit contributions | |
ォ | -1.444 |
kefeller | -1.300 |
ruary | -1.209 |
hester | -1.143 |
Nebula | -1.064 |
Token | servants |
Token ID | 17523 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
ォ | +2.076 |
kefeller | +1.853 |
ruary | +1.719 |
hester | +1.608 |
Nebula | +1.496 |
Neg logit contributions | |
ura | -2.152 |
uable | -1.964 |
pora | -1.934 |
veland | -1.913 |
aur | -1.815 |
Token | take |
Token ID | 1011 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
ォ | +1.640 |
kefeller | +1.461 |
ruary | +1.404 |
hester | +1.322 |
intern | +1.262 |
Neg logit contributions | |
ura | -1.199 |
uable | -1.099 |
pora | -1.060 |
veland | -1.056 |
oto | -0.990 |
Token | a |
Token ID | 257 |
Feature activation | -3.79e-01 |
Pos logit contributions | |
ura | +1.893 |
uable | +1.715 |
pora | +1.665 |
veland | +1.643 |
oto | +1.545 |
Neg logit contributions | |
ォ | -2.489 |
kefeller | -2.248 |
ruary | -2.109 |
hester | -1.997 |
Nebula | -1.872 |
Token | team |
Token ID | 1074 |
Feature activation | +3.37e-01 |
Pos logit contributions | |
ォ | +0.358 |
kefeller | +0.321 |
ruary | +0.301 |
hester | +0.284 |
Nebula | +0.266 |
Neg logit contributions | |
ura | -0.310 |
uable | -0.283 |
pora | -0.276 |
veland | -0.273 |
oto | -0.257 |
Token | approach |
Token ID | 3164 |
Feature activation | +3.66e-01 |
Pos logit contributions | |
ura | +0.230 |
uable | +0.206 |
pora | +0.200 |
veland | +0.197 |
oto | +0.183 |
Neg logit contributions | |
ォ | -0.364 |
kefeller | -0.331 |
ruary | -0.313 |
hester | -0.298 |
Nebula | -0.282 |
Token | , |
Token ID | 11 |
Feature activation | +9.51e-01 |
Pos logit contributions | |
ura | +0.263 |
uable | +0.237 |
pora | +0.231 |
veland | +0.228 |
oto | +0.212 |
Neg logit contributions | |
ォ | -0.381 |
kefeller | -0.345 |
ruary | -0.326 |
hester | -0.309 |
intern | -0.292 |
Token | making |
Token ID | 1642 |
Feature activation | -6.80e-02 |
Pos logit contributions | |
ura | +0.731 |
uable | +0.663 |
pora | +0.646 |
veland | +0.638 |
oto | +0.598 |
Neg logit contributions | |
ォ | -0.943 |
kefeller | -0.849 |
ruary | -0.798 |
hester | -0.755 |
Nebula | -0.711 |
Token | bilingual |
Token ID | 48116 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
ォ | +0.074 |
kefeller | +0.067 |
ruary | +0.063 |
hester | +0.060 |
Nebula | +0.057 |
Neg logit contributions | |
ura | -0.046 |
uable | -0.041 |
pora | -0.040 |
veland | -0.040 |
oto | -0.037 |
Token | ism |
Token ID | 1042 |
Feature activation | +9.95e-02 |
Pos logit contributions | |
ura | +1.849 |
uable | +1.697 |
pora | +1.658 |
veland | +1.637 |
aur | +1.562 |
Neg logit contributions | |
ォ | -1.821 |
kefeller | -1.625 |
ruary | -1.497 |
hester | -1.407 |
Nebula | -1.304 |
Token | for |
Token ID | 329 |
Feature activation | +6.72e-01 |
Pos logit contributions | |
ura | +0.077 |
uable | +0.070 |
pora | +0.068 |
veland | +0.068 |
oto | +0.063 |
Neg logit contributions | |
ォ | -0.098 |
kefeller | -0.088 |
ruary | -0.083 |
hester | -0.078 |
Nebula | -0.074 |
Token | on |
Token ID | 319 |
Feature activation | +5.19e-01 |
Pos logit contributions | |
ォ | +0.521 |
kefeller | +0.471 |
ruary | +0.444 |
hester | +0.421 |
Nebula | +0.397 |
Neg logit contributions | |
ura | -0.379 |
uable | -0.342 |
pora | -0.334 |
veland | -0.329 |
oto | -0.308 |
Token | in |
Token ID | 287 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
ura | +0.390 |
uable | +0.353 |
pora | +0.343 |
veland | +0.339 |
oto | +0.318 |
Neg logit contributions | |
ォ | -0.526 |
kefeller | -0.474 |
ruary | -0.446 |
hester | -0.423 |
Nebula | -0.398 |
Token | the |
Token ID | 262 |
Feature activation | +4.91e-01 |
Pos logit contributions | |
ura | +0.876 |
uable | +0.802 |
pora | +0.783 |
veland | +0.776 |
oto | +0.732 |
Neg logit contributions | |
ォ | -0.950 |
kefeller | -0.846 |
ruary | -0.790 |
hester | -0.744 |
Nebula | -0.693 |
Token | mainstream |
Token ID | 8661 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
ura | +0.435 |
uable | +0.400 |
pora | +0.391 |
veland | +0.387 |
oto | +0.366 |
Neg logit contributions | |
ォ | -0.430 |
kefeller | -0.382 |
ruary | -0.355 |
hester | -0.333 |
Nebula | -0.311 |
Token | media |
Token ID | 2056 |
Feature activation | -2.87e+00 |
Pos logit contributions | |
ォ | +1.348 |
kefeller | +1.189 |
ruary | +1.107 |
hester | +1.029 |
Nebula | +0.964 |
Neg logit contributions | |
ura | -1.530 |
uable | -1.418 |
pora | -1.386 |
veland | -1.369 |
aur | -1.295 |
Token | , |
Token ID | 11 |
Feature activation | +4.70e-01 |
Pos logit contributions | |
ォ | +2.949 |
kefeller | +2.660 |
ruary | +2.525 |
hester | +2.384 |
intern | +2.259 |
Neg logit contributions | |
ura | -2.074 |
uable | -1.881 |
pora | -1.824 |
veland | -1.808 |
oto | -1.675 |
Token | I |
Token ID | 314 |
Feature activation | -8.15e-01 |
Pos logit contributions | |
ura | +0.372 |
uable | +0.339 |
pora | +0.330 |
veland | +0.326 |
oto | +0.307 |
Neg logit contributions | |
ォ | -0.456 |
kefeller | -0.409 |
ruary | -0.384 |
hester | -0.363 |
Nebula | -0.341 |
Token | don |
Token ID | 836 |
Feature activation | -2.57e+00 |
Pos logit contributions | |
ォ | +0.832 |
kefeller | +0.749 |
ruary | +0.707 |
hester | +0.669 |
bley | +0.630 |
Neg logit contributions | |
ura | -0.600 |
uable | -0.546 |
pora | -0.531 |
veland | -0.523 |
oto | -0.488 |
Token | � |
Token ID | 447 |
Feature activation | -9.59e-02 |
Pos logit contributions | |
ォ | +2.622 |
kefeller | +2.286 |
ruary | +2.205 |
hester | +2.073 |
ィ | +2.013 |
Neg logit contributions | |
ura | -1.849 |
uable | -1.728 |
pora | -1.694 |
veland | -1.635 |
oto | -1.514 |
Token | � |
Token ID | 247 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
ォ | +0.075 |
kefeller | +0.064 |
ruary | +0.060 |
hester | +0.055 |
intern | +0.052 |
Neg logit contributions | |
ura | -0.092 |
uable | -0.087 |
pora | -0.086 |
veland | -0.085 |
oto | -0.080 |
Token | t |
Token ID | 83 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
ォ | +0.951 |
kefeller | +0.819 |
ruary | +0.766 |
hester | +0.699 |
bley | +0.652 |
Neg logit contributions | |
ura | -1.251 |
pora | -1.170 |
uable | -1.162 |
veland | -1.139 |
oto | -1.079 |
Token | to |
Token ID | 284 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
ォ | +1.837 |
kefeller | +1.658 |
ruary | +1.558 |
hester | +1.476 |
Nebula | +1.388 |
Neg logit contributions | |
ura | -1.338 |
uable | -1.206 |
pora | -1.171 |
veland | -1.158 |
oto | -1.086 |
Token | put |
Token ID | 1234 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
ォ | +0.234 |
kefeller | +0.210 |
ruary | +0.197 |
hester | +0.187 |
Nebula | +0.175 |
Neg logit contributions | |
ura | -0.186 |
uable | -0.169 |
pora | -0.165 |
veland | -0.163 |
oto | -0.153 |
Token | on |
Token ID | 319 |
Feature activation | +4.47e-01 |
Pos logit contributions | |
ura | +0.215 |
uable | +0.195 |
pora | +0.190 |
veland | +0.187 |
oto | +0.175 |
Neg logit contributions | |
ォ | -0.288 |
kefeller | -0.260 |
ruary | -0.244 |
hester | -0.232 |
Nebula | -0.218 |
Token | a |
Token ID | 257 |
Feature activation | -5.67e-01 |
Pos logit contributions | |
ura | +0.360 |
uable | +0.328 |
pora | +0.320 |
veland | +0.316 |
oto | +0.298 |
Neg logit contributions | |
ォ | -0.427 |
kefeller | -0.383 |
ruary | -0.359 |
hester | -0.339 |
Nebula | -0.318 |
Token | brave |
Token ID | 14802 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
ォ | +0.551 |
kefeller | +0.495 |
ruary | +0.464 |
hester | +0.439 |
Nebula | +0.414 |
Neg logit contributions | |
ura | -0.445 |
uable | -0.407 |
pora | -0.397 |
veland | -0.392 |
oto | -0.368 |
Token | face |
Token ID | 1986 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
ォ | +1.501 |
kefeller | +1.353 |
ruary | +1.284 |
hester | +1.225 |
Nebula | +1.169 |
Neg logit contributions | |
ura | -0.972 |
uable | -0.891 |
pora | -0.860 |
veland | -0.846 |
oto | -0.778 |
Token | for |
Token ID | 329 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
ォ | +1.667 |
kefeller | +1.505 |
ruary | +1.429 |
hester | +1.349 |
intern | +1.286 |
Neg logit contributions | |
ura | -1.203 |
uable | -1.104 |
pora | -1.066 |
veland | -1.055 |
oto | -0.975 |
Token | the |
Token ID | 262 |
Feature activation | +4.11e-01 |
Pos logit contributions | |
ura | +0.306 |
uable | +0.279 |
pora | +0.272 |
veland | +0.269 |
oto | +0.254 |
Neg logit contributions | |
ォ | -0.353 |
kefeller | -0.316 |
ruary | -0.295 |
hester | -0.279 |
Nebula | -0.261 |
Token | sake |
Token ID | 11060 |
Feature activation | +6.75e-01 |
Pos logit contributions | |
ura | +0.324 |
uable | +0.295 |
pora | +0.288 |
veland | +0.284 |
oto | +0.267 |
Neg logit contributions | |
ォ | -0.401 |
kefeller | -0.360 |
ruary | -0.338 |
hester | -0.319 |
Nebula | -0.300 |
Token | of |
Token ID | 286 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
ura | +0.451 |
uable | +0.407 |
pora | +0.394 |
veland | +0.389 |
oto | +0.357 |
Neg logit contributions | |
ォ | -0.729 |
kefeller | -0.664 |
ruary | -0.629 |
hester | -0.600 |
Nebula | -0.574 |
Token | her |
Token ID | 607 |
Feature activation | -9.41e-01 |
Pos logit contributions | |
ォ | +0.152 |
kefeller | +0.136 |
ruary | +0.127 |
hester | +0.120 |
Nebula | +0.112 |
Neg logit contributions | |
ura | -0.134 |
uable | -0.122 |
pora | -0.119 |
veland | -0.118 |
oto | -0.111 |
Token | I |
Token ID | 314 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
ura | +0.404 |
uable | +0.369 |
pora | +0.361 |
veland | +0.356 |
oto | +0.336 |
Neg logit contributions | |
ォ | -0.454 |
kefeller | -0.406 |
ruary | -0.379 |
hester | -0.357 |
Nebula | -0.334 |
Token | made |
Token ID | 925 |
Feature activation | -9.17e-01 |
Pos logit contributions | |
ォ | +0.344 |
kefeller | +0.306 |
ruary | +0.289 |
hester | +0.273 |
intern | +0.258 |
Neg logit contributions | |
ura | -0.270 |
uable | -0.246 |
pora | -0.241 |
veland | -0.235 |
oto | -0.223 |
Token | it |
Token ID | 340 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ォ | +0.861 |
kefeller | +0.769 |
ruary | +0.720 |
hester | +0.680 |
Nebula | +0.638 |
Neg logit contributions | |
ura | -0.751 |
uable | -0.687 |
pora | -0.671 |
veland | -0.663 |
oto | -0.624 |
Token | . |
Token ID | 13 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
ura | +0.867 |
uable | +0.778 |
pora | +0.755 |
veland | +0.745 |
oto | +0.693 |
Neg logit contributions | |
ォ | -1.321 |
kefeller | -1.199 |
ruary | -1.131 |
hester | -1.076 |
Nebula | -1.018 |
Token |
|
Token ID | 198 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
ura | +0.109 |
uable | +0.100 |
pora | +0.097 |
veland | +0.096 |
oto | +0.091 |
Neg logit contributions | |
ォ | -0.121 |
kefeller | -0.108 |
ruary | -0.101 |
hester | -0.095 |
Nebula | -0.089 |
Token |
|
Token ID | 198 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
ura | +0.016 |
uable | +0.014 |
pora | +0.014 |
veland | +0.014 |
oto | +0.013 |
Neg logit contributions | |
ォ | -0.019 |
kefeller | -0.017 |
ruary | -0.016 |
hester | -0.015 |
intern | -0.015 |
Token | Statistics |
Token ID | 48346 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
ura | +0.236 |
uable | +0.215 |
pora | +0.210 |
veland | +0.208 |
oto | +0.197 |
Neg logit contributions | |
ォ | -0.271 |
kefeller | -0.243 |
ruary | -0.227 |
hester | -0.215 |
Nebula | -0.201 |
Token | used |
Token ID | 973 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
ura | +0.347 |
uable | +0.321 |
pora | +0.315 |
veland | +0.312 |
oto | +0.296 |
Neg logit contributions | |
ォ | -0.296 |
kefeller | -0.260 |
ruary | -0.240 |
hester | -0.224 |
Nebula | -0.207 |
Token | courtesy |
Token ID | 12537 |
Feature activation | -3.38e+00 |
Pos logit contributions | |
ォ | +0.161 |
kefeller | +0.146 |
ruary | +0.138 |
hester | +0.131 |
Nebula | +0.125 |
Neg logit contributions | |
ura | -0.099 |
uable | -0.088 |
pora | -0.085 |
veland | -0.085 |
oto | -0.079 |
Token | of |
Token ID | 286 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
ォ | +3.822 |
kefeller | +3.487 |
ruary | +3.306 |
hester | +3.152 |
Nebula | +2.994 |
Neg logit contributions | |
ura | -2.137 |
uable | -1.894 |
pora | -1.833 |
veland | -1.809 |
oto | -1.666 |
Token | Basketball |
Token ID | 25911 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
ォ | +0.010 |
kefeller | +0.009 |
ruary | +0.008 |
hester | +0.008 |
Nebula | +0.007 |
Neg logit contributions | |
ura | -0.009 |
uable | -0.008 |
pora | -0.008 |
veland | -0.008 |
oto | -0.007 |
Token | Putin |
Token ID | 8144 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
ォ | +2.083 |
kefeller | +1.856 |
ruary | +1.733 |
hester | +1.626 |
Nebula | +1.522 |
Neg logit contributions | |
ura | -2.026 |
uable | -1.867 |
pora | -1.821 |
veland | -1.807 |
oto | -1.704 |
Token | talks |
Token ID | 6130 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
ura | +0.251 |
uable | +0.227 |
pora | +0.221 |
veland | +0.219 |
oto | +0.205 |
Neg logit contributions | |
ォ | -0.330 |
kefeller | -0.298 |
ruary | -0.280 |
hester | -0.265 |
Nebula | -0.250 |
Token | about |
Token ID | 546 |
Feature activation | -9.30e-01 |
Pos logit contributions | |
ォ | +1.742 |
kefeller | +1.590 |
ruary | +1.506 |
hester | +1.437 |
Nebula | +1.365 |
Neg logit contributions | |
ura | -0.977 |
uable | -0.868 |
pora | -0.841 |
veland | -0.828 |
oto | -0.763 |
Token | sovereignty |
Token ID | 18582 |
Feature activation | +1.92e-01 |
Pos logit contributions | |
ォ | +0.873 |
kefeller | +0.780 |
ruary | +0.730 |
hester | +0.689 |
Nebula | +0.644 |
Neg logit contributions | |
ura | -0.768 |
uable | -0.701 |
pora | -0.685 |
veland | -0.677 |
oto | -0.637 |
Token | , |
Token ID | 11 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
ura | +0.132 |
uable | +0.118 |
pora | +0.115 |
veland | +0.113 |
aur | +0.105 |
Neg logit contributions | |
ォ | -0.206 |
kefeller | -0.188 |
ruary | -0.177 |
hester | -0.169 |
Nebula | -0.160 |
Token | his |
Token ID | 465 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
ura | +0.147 |
uable | +0.134 |
pora | +0.131 |
veland | +0.130 |
oto | +0.122 |
Neg logit contributions | |
ォ | -0.167 |
kefeller | -0.149 |
ruary | -0.140 |
hester | -0.132 |
Nebula | -0.123 |
Token | notion |
Token ID | 9495 |
Feature activation | -2.96e+00 |
Pos logit contributions | |
ォ | +1.209 |
kefeller | +1.086 |
ruary | +1.021 |
hester | +0.962 |
Nebula | +0.909 |
Neg logit contributions | |
ura | -0.973 |
uable | -0.890 |
pora | -0.865 |
veland | -0.859 |
oto | -0.802 |
Token | is |
Token ID | 318 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
ォ | +3.253 |
kefeller | +2.954 |
ruary | +2.797 |
hester | +2.663 |
Nebula | +2.524 |
Neg logit contributions | |
ura | -1.963 |
uable | -1.756 |
pora | -1.701 |
veland | -1.677 |
oto | -1.552 |
Token | � |
Token ID | 564 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
ura | +1.040 |
uable | +0.934 |
pora | +0.914 |
veland | +0.900 |
aur | +0.846 |
Neg logit contributions | |
ォ | -1.348 |
kefeller | -1.219 |
ruary | -1.152 |
hester | -1.093 |
Nebula | -1.024 |
Token | � |
Token ID | 246 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
ura | +0.209 |
uable | +0.191 |
pora | +0.186 |
veland | +0.184 |
oto | +0.173 |
Neg logit contributions | |
ォ | -0.246 |
kefeller | -0.220 |
ruary | -0.206 |
hester | -0.194 |
Nebula | -0.182 |
Token | nob |
Token ID | 34952 |
Feature activation | -6.85e-01 |
Pos logit contributions | |
ォ | +1.537 |
kefeller | +1.377 |
ruary | +1.285 |
hester | +1.214 |
intern | +1.161 |
Neg logit contributions | |
ura | -1.311 |
uable | -1.201 |
pora | -1.170 |
veland | -1.164 |
oto | -1.086 |
Token | � |
Token ID | 247 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
ォ | +0.022 |
kefeller | +0.019 |
ruary | +0.018 |
hester | +0.016 |
intern | +0.015 |
Neg logit contributions | |
ura | -0.026 |
uable | -0.024 |
pora | -0.024 |
veland | -0.023 |
oto | -0.022 |
Token | best |
Token ID | 1266 |
Feature activation | +3.66e+00 |
Pos logit contributions | |
ォ | +1.338 |
kefeller | +1.183 |
ruary | +1.102 |
hester | +1.030 |
Nebula | +0.958 |
Neg logit contributions | |
ura | -1.399 |
uable | -1.287 |
pora | -1.262 |
veland | -1.250 |
oto | -1.183 |
Token | . |
Token ID | 13 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
ura | +2.788 |
uable | +2.525 |
pora | +2.425 |
veland | +2.400 |
oto | +2.286 |
Neg logit contributions | |
ォ | -3.610 |
kefeller | -3.305 |
ruary | -3.096 |
hester | -2.922 |
intern | -2.753 |
Token |
|
Token ID | 198 |
Feature activation | -4.77e-01 |
Pos logit contributions | |
ォ | +0.234 |
kefeller | +0.207 |
ruary | +0.193 |
hester | +0.180 |
Nebula | +0.168 |
Neg logit contributions | |
ura | -0.242 |
uable | -0.223 |
pora | -0.218 |
veland | -0.216 |
oto | -0.204 |
Token |
|
Token ID | 198 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
ォ | +0.455 |
kefeller | +0.404 |
ruary | +0.383 |
hester | +0.363 |
intern | +0.346 |
Neg logit contributions | |
ura | -0.376 |
uable | -0.348 |
pora | -0.339 |
veland | -0.333 |
oto | -0.310 |
Token | Without |
Token ID | 16249 |
Feature activation | -5.95e+00 |
Pos logit contributions | |
ォ | +0.116 |
kefeller | +0.105 |
ruary | +0.099 |
hester | +0.093 |
bley | +0.088 |
Neg logit contributions | |
ura | -0.093 |
uable | -0.084 |
pora | -0.082 |
veland | -0.081 |
oto | -0.077 |
Token | a |
Token ID | 257 |
Feature activation | -4.39e-01 |
Pos logit contributions | |
ォ | +5.388 |
kefeller | +4.707 |
ruary | +4.459 |
hester | +4.148 |
Nebula | +4.027 |
Neg logit contributions | |
ura | -4.902 |
uable | -4.492 |
pora | -4.402 |
veland | -4.352 |
oto | -4.113 |
Token | single |
Token ID | 2060 |
Feature activation | +6.51e-01 |
Pos logit contributions | |
ォ | +0.446 |
kefeller | +0.402 |
ruary | +0.379 |
hester | +0.359 |
Nebula | +0.339 |
Neg logit contributions | |
ura | -0.327 |
uable | -0.296 |
pora | -0.288 |
veland | -0.284 |
oto | -0.266 |
Token | version |
Token ID | 2196 |
Feature activation | -2.41e-03 |
Pos logit contributions | |
ura | +0.517 |
uable | +0.470 |
pora | +0.458 |
veland | +0.453 |
oto | +0.426 |
Neg logit contributions | |
ォ | -0.630 |
kefeller | -0.566 |
ruary | -0.531 |
hester | -0.502 |
Nebula | -0.470 |
Token | of |
Token ID | 286 |
Feature activation | +4.83e-02 |
Pos logit contributions | |
ォ | +0.003 |
kefeller | +0.002 |
ruary | +0.002 |
hester | +0.002 |
Nebula | +0.002 |
Neg logit contributions | |
ura | -0.002 |
uable | -0.001 |
pora | -0.001 |
veland | -0.001 |
oto | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +5.53e-01 |
Pos logit contributions | |
ura | +0.039 |
uable | +0.036 |
pora | +0.035 |
veland | +0.034 |
oto | +0.032 |
Neg logit contributions | |
ォ | -0.046 |
kefeller | -0.041 |
ruary | -0.039 |
hester | -0.037 |
intern | -0.034 |
Token | ing |
Token ID | 5347 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
ォ | +0.292 |
kefeller | +0.262 |
ruary | +0.246 |
hester | +0.232 |
Nebula | +0.218 |
Neg logit contributions | |
ura | -0.234 |
uable | -0.212 |
pora | -0.207 |
veland | -0.205 |
oto | -0.192 |
Token | ress |
Token ID | 601 |
Feature activation | +7.27e-01 |
Pos logit contributions | |
ura | +1.451 |
uable | +1.315 |
pora | +1.271 |
veland | +1.246 |
oto | +1.192 |
Neg logit contributions | |
ォ | -1.873 |
kefeller | -1.694 |
ruary | -1.575 |
hester | -1.499 |
�� | -1.406 |
Token | to |
Token ID | 284 |
Feature activation | -2.45e-01 |
Pos logit contributions | |
ura | +0.514 |
uable | +0.461 |
pora | +0.448 |
veland | +0.443 |
oto | +0.412 |
Neg logit contributions | |
ォ | -0.768 |
kefeller | -0.696 |
ruary | -0.657 |
hester | -0.624 |
Nebula | -0.590 |
Token | visit |
Token ID | 3187 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
ォ | +0.249 |
kefeller | +0.225 |
ruary | +0.212 |
hester | +0.201 |
Nebula | +0.190 |
Neg logit contributions | |
ura | -0.182 |
uable | -0.165 |
pora | -0.160 |
veland | -0.158 |
oto | -0.148 |
Token | . |
Token ID | 13 |
Feature activation | -6.40e-01 |
Pos logit contributions | |
ura | +0.812 |
uable | +0.727 |
pora | +0.706 |
veland | +0.696 |
oto | +0.648 |
Neg logit contributions | |
ォ | -1.260 |
kefeller | -1.143 |
ruary | -1.079 |
hester | -1.026 |
Nebula | -0.970 |
Token | Though |
Token ID | 7486 |
Feature activation | -5.84e+00 |
Pos logit contributions | |
ォ | +0.578 |
kefeller | +0.514 |
ruary | +0.480 |
hester | +0.452 |
Nebula | +0.422 |
Neg logit contributions | |
ura | -0.549 |
uable | -0.504 |
pora | -0.493 |
veland | -0.487 |
oto | -0.460 |
Token | I |
Token ID | 314 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
ォ | +5.299 |
kefeller | +4.692 |
ruary | +4.441 |
hester | +4.238 |
Nebula | +3.999 |
Neg logit contributions | |
ura | -4.734 |
uable | -4.354 |
pora | -4.264 |
veland | -4.201 |
oto | -3.928 |
Token | 'm |
Token ID | 1101 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
ォ | +0.575 |
kefeller | +0.518 |
ruary | +0.489 |
hester | +0.464 |
Nebula | +0.439 |
Neg logit contributions | |
ura | -0.431 |
uable | -0.394 |
pora | -0.385 |
veland | -0.378 |
oto | -0.353 |
Token | pretty |
Token ID | 2495 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
ォ | +0.014 |
kefeller | +0.013 |
ruary | +0.012 |
hester | +0.011 |
Nebula | +0.010 |
Neg logit contributions | |
ura | -0.012 |
uable | -0.011 |
pora | -0.011 |
veland | -0.011 |
oto | -0.010 |
Token | middle |
Token ID | 3504 |
Feature activation | +3.77e-01 |
Pos logit contributions | |
ォ | +2.164 |
kefeller | +1.989 |
ruary | +1.893 |
hester | +1.823 |
Nebula | +1.752 |
Neg logit contributions | |
ura | -0.999 |
uable | -0.879 |
pora | -0.853 |
veland | -0.819 |
oto | -0.752 |
Token | of |
Token ID | 286 |
Feature activation | -2.53e-01 |
Pos logit contributions | |
ura | +0.270 |
uable | +0.245 |
pora | +0.239 |
veland | +0.233 |
oto | +0.218 |
Neg logit contributions | |
ォ | -0.393 |
kefeller | -0.354 |
ruary | -0.335 |
hester | -0.319 |
Nebula | -0.301 |
Token |
|
Token ID | 198 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
ォ | +0.128 |
kefeller | +0.114 |
ruary | +0.108 |
hester | +0.102 |
intern | +0.097 |
Neg logit contributions | |
ura | -0.104 |
uable | -0.096 |
pora | -0.094 |
veland | -0.092 |
oto | -0.086 |
Token | C |
Token ID | 34 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
ura | +0.189 |
uable | +0.173 |
pora | +0.169 |
veland | +0.167 |
oto | +0.158 |
Neg logit contributions | |
ォ | -0.203 |
kefeller | -0.181 |
ruary | -0.169 |
hester | -0.159 |
Nebula | -0.149 |
Token | ancer |
Token ID | 8250 |
Feature activation | +4.07e-01 |
Pos logit contributions | |
ォ | +1.459 |
kefeller | +1.316 |
ruary | +1.228 |
hester | +1.163 |
intern | +1.087 |
Neg logit contributions | |
ura | -1.267 |
uable | -1.158 |
pora | -1.136 |
veland | -1.120 |
oto | -1.050 |
Token | casts |
Token ID | 26217 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
ura | +0.309 |
uable | +0.279 |
pora | +0.272 |
veland | +0.267 |
oto | +0.253 |
Neg logit contributions | |
ォ | -0.410 |
kefeller | -0.368 |
ruary | -0.346 |
hester | -0.327 |
Nebula | -0.309 |
Token | a |
Token ID | 257 |
Feature activation | -4.22e-01 |
Pos logit contributions | |
ura | +1.265 |
uable | +1.152 |
pora | +1.119 |
veland | +1.098 |
oto | +1.038 |
Neg logit contributions | |
ォ | -1.518 |
kefeller | -1.362 |
ruary | -1.279 |
hester | -1.207 |
�� | -1.131 |
Token | shadow |
Token ID | 9082 |
Feature activation | -5.09e+00 |
Pos logit contributions | |
ォ | +0.404 |
kefeller | +0.362 |
ruary | +0.339 |
hester | +0.320 |
Nebula | +0.301 |
Neg logit contributions | |
ura | -0.339 |
uable | -0.309 |
pora | -0.302 |
veland | -0.299 |
oto | -0.281 |
Token | over |
Token ID | 625 |
Feature activation | -8.87e-01 |
Pos logit contributions | |
ォ | +5.098 |
kefeller | +4.597 |
ruary | +4.338 |
hester | +4.077 |
Nebula | +3.904 |
Neg logit contributions | |
ura | -3.724 |
uable | -3.414 |
veland | -3.299 |
pora | -3.259 |
oto | -3.053 |
Token | the |
Token ID | 262 |
Feature activation | +5.09e-01 |
Pos logit contributions | |
ォ | +0.837 |
kefeller | +0.752 |
ruary | +0.702 |
hester | +0.664 |
Nebula | +0.623 |
Neg logit contributions | |
ura | -0.721 |
uable | -0.659 |
pora | -0.642 |
veland | -0.637 |
oto | -0.597 |
Token | villages |
Token ID | 15425 |
Feature activation | +2.83e+00 |
Pos logit contributions | |
ura | +0.372 |
uable | +0.336 |
pora | +0.327 |
veland | +0.323 |
oto | +0.301 |
Neg logit contributions | |
ォ | -0.525 |
kefeller | -0.475 |
ruary | -0.447 |
hester | -0.424 |
Nebula | -0.401 |
Token | in |
Token ID | 287 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
ura | +1.963 |
uable | +1.737 |
pora | +1.701 |
veland | +1.664 |
oto | +1.562 |
Neg logit contributions | |
ォ | -3.026 |
kefeller | -2.754 |
ruary | -2.591 |
hester | -2.472 |
Nebula | -2.335 |
Token | this |
Token ID | 428 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
ura | +0.918 |
uable | +0.838 |
pora | +0.820 |
veland | +0.811 |
oto | +0.766 |
Neg logit contributions | |
ォ | -1.006 |
kefeller | -0.897 |
ruary | -0.836 |
hester | -0.789 |
Nebula | -0.735 |
Token | David |
Token ID | 11006 |
Feature activation | -5.52e+00 |
Pos logit contributions | |
ura | +0.108 |
uable | +0.099 |
pora | +0.097 |
veland | +0.097 |
aur | +0.092 |
Neg logit contributions | |
ォ | -0.086 |
kefeller | -0.075 |
ruary | -0.070 |
hester | -0.065 |
�� | -0.060 |
Token | : |
Token ID | 25 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
ォ | +5.170 |
kefeller | +4.587 |
ruary | +4.292 |
hester | +4.128 |
Nebula | +3.999 |
Neg logit contributions | |
ura | -4.178 |
uable | -3.993 |
pora | -3.832 |
veland | -3.702 |
oto | -3.510 |
Token | That |
Token ID | 1320 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
ォ | +0.236 |
kefeller | +0.206 |
ruary | +0.193 |
hester | +0.180 |
Nebula | +0.170 |
Neg logit contributions | |
ura | -0.257 |
uable | -0.238 |
pora | -0.234 |
veland | -0.232 |
oto | -0.219 |
Token | was |
Token ID | 373 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
ォ | +1.128 |
kefeller | +1.014 |
ruary | +0.955 |
hester | +0.904 |
Nebula | +0.854 |
Neg logit contributions | |
ura | -0.903 |
uable | -0.820 |
pora | -0.804 |
veland | -0.795 |
oto | -0.742 |
Token | Cartoon |
Token ID | 46838 |
Feature activation | -4.32e+00 |
Pos logit contributions | |
ォ | +0.959 |
kefeller | +0.861 |
ruary | +0.808 |
hester | +0.762 |
Nebula | +0.721 |
Neg logit contributions | |
ura | -0.836 |
uable | -0.764 |
pora | -0.750 |
veland | -0.740 |
oto | -0.693 |
Token | Network |
Token ID | 7311 |
Feature activation | -6.18e+00 |
Pos logit contributions | |
ォ | +2.640 |
kefeller | +2.236 |
ruary | +2.078 |
hester | +1.872 |
Nebula | +1.690 |
Neg logit contributions | |
ura | -4.782 |
uable | -4.528 |
pora | -4.479 |
veland | -4.388 |
aur | -4.201 |
Token | 's |
Token ID | 338 |
Feature activation | -9.82e-01 |
Pos logit contributions | |
ォ | +6.003 |
kefeller | +5.424 |
ruary | +5.208 |
hester | +4.916 |
intern | +4.656 |
Neg logit contributions | |
ura | -4.518 |
uable | -4.122 |
pora | -4.066 |
veland | -4.015 |
aur | -3.699 |
Token | choice |
Token ID | 3572 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
ォ | +0.970 |
kefeller | +0.872 |
ruary | +0.821 |
hester | +0.777 |
Nebula | +0.732 |
Neg logit contributions | |
ura | -0.757 |
uable | -0.688 |
pora | -0.671 |
veland | -0.663 |
oto | -0.620 |
Token | and |
Token ID | 290 |
Feature activation | -3.76e-01 |
Pos logit contributions | |
ura | +1.714 |
uable | +1.514 |
pora | +1.461 |
veland | +1.444 |
oto | +1.347 |
Neg logit contributions | |
ォ | -2.910 |
kefeller | -2.649 |
ruary | -2.487 |
hester | -2.378 |
�� | -2.237 |
Token | I |
Token ID | 314 |
Feature activation | -3.97e-01 |
Pos logit contributions | |
ォ | +0.360 |
kefeller | +0.322 |
ruary | +0.302 |
hester | +0.286 |
Nebula | +0.268 |
Neg logit contributions | |
ura | -0.302 |
uable | -0.276 |
pora | -0.269 |
veland | -0.266 |
oto | -0.250 |
Token | think |
Token ID | 892 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
ォ | +0.380 |
kefeller | +0.341 |
ruary | +0.321 |
hester | +0.303 |
Nebula | +0.287 |
Neg logit contributions | |
ura | -0.314 |
uable | -0.288 |
pora | -0.282 |
veland | -0.277 |
oto | -0.260 |
Token | ' |
Token ID | 705 |
Feature activation | -7.26e-02 |
Pos logit contributions | |
ura | +1.796 |
uable | +1.631 |
pora | +1.597 |
veland | +1.577 |
oto | +1.499 |
Neg logit contributions | |
ォ | -1.930 |
kefeller | -1.726 |
ruary | -1.598 |
hester | -1.514 |
bley | -1.405 |
Token | Rem |
Token ID | 8413 |
Feature activation | +9.24e-01 |
Pos logit contributions | |
ォ | +0.064 |
kefeller | +0.056 |
ruary | +0.053 |
hester | +0.049 |
intern | +0.046 |
Neg logit contributions | |
ura | -0.064 |
uable | -0.059 |
pora | -0.058 |
veland | -0.057 |
oto | -0.054 |
Token | aining |
Token ID | 1397 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
ura | +0.606 |
uable | +0.538 |
pora | +0.523 |
veland | +0.516 |
oto | +0.479 |
Neg logit contributions | |
ォ | -1.030 |
kefeller | -0.933 |
ruary | -0.884 |
hester | -0.842 |
Nebula | -0.801 |
Token | Aw |
Token ID | 5851 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
ura | +0.929 |
uable | +0.845 |
pora | +0.826 |
veland | +0.814 |
oto | +0.766 |
Neg logit contributions | |
ォ | -1.127 |
kefeller | -1.011 |
ruary | -0.950 |
hester | -0.897 |
Nebula | -0.839 |
Token | ake |
Token ID | 539 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
ura | +1.419 |
uable | +1.232 |
pora | +1.177 |
veland | +1.172 |
oto | +1.080 |
Neg logit contributions | |
ォ | -2.988 |
kefeller | -2.738 |
ruary | -2.598 |
hester | -2.490 |
Nebula | -2.388 |
Token | through |
Token ID | 832 |
Feature activation | -6.02e+00 |
Pos logit contributions | |
ura | +1.655 |
uable | +1.479 |
pora | +1.442 |
veland | +1.416 |
oto | +1.332 |
Neg logit contributions | |
ォ | -2.467 |
kefeller | -2.234 |
ruary | -2.103 |
hester | -2.000 |
Nebula | -1.882 |
Token | a |
Token ID | 257 |
Feature activation | -8.12e-01 |
Pos logit contributions | |
ォ | +4.983 |
kefeller | +4.474 |
ruary | +4.120 |
hester | +3.878 |
Antiqu | +3.702 |
Neg logit contributions | |
ura | -5.266 |
uable | -4.902 |
pora | -4.747 |
veland | -4.743 |
oto | -4.464 |
Token | Great |
Token ID | 3878 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
ォ | +0.653 |
kefeller | +0.574 |
ruary | +0.529 |
hester | +0.493 |
Nebula | +0.457 |
Neg logit contributions | |
ura | -0.773 |
uable | -0.717 |
pora | -0.702 |
veland | -0.695 |
oto | -0.662 |
Token | Revolution |
Token ID | 9303 |
Feature activation | -6.19e+00 |
Pos logit contributions | |
ォ | +1.375 |
kefeller | +1.214 |
ruary | +1.128 |
hester | +1.046 |
Nebula | +0.975 |
Neg logit contributions | |
ura | -1.656 |
uable | -1.543 |
pora | -1.511 |
veland | -1.496 |
oto | -1.416 |
Token | ', |
Token ID | 3256 |
Feature activation | -7.45e-01 |
Pos logit contributions | |
ォ | +6.031 |
kefeller | +5.441 |
ruary | +5.144 |
hester | +4.871 |
Nebula | +4.677 |
Neg logit contributions | |
ura | -4.473 |
uable | -4.121 |
pora | -4.015 |
veland | -4.006 |
oto | -3.655 |
Token | in |
Token ID | 287 |
Feature activation | +6.24e-01 |
Pos logit contributions | |
ォ | +0.724 |
kefeller | +0.652 |
ruary | +0.614 |
hester | +0.580 |
Nebula | +0.549 |
Neg logit contributions | |
ura | -0.578 |
uable | -0.531 |
pora | -0.515 |
veland | -0.511 |
oto | -0.477 |