Token | , |
Token ID | 11 |
Feature activation | +7.26e+00 |
Pos logit contributions | |
� | +11.079 |
bipartisan | +10.546 |
politically | +10.350 |
political | +10.292 |
� | +10.244 |
Neg logit contributions | |
coins | -5.855 |
detects | -5.487 |
contains | -5.148 |
img | -5.074 |
wine | -4.922 |
Token | refers |
Token ID | 10229 |
Feature activation | +5.49e+00 |
Pos logit contributions | |
� | +10.828 |
bipartisan | +10.309 |
political | +10.117 |
� | +10.104 |
politically | +10.003 |
Neg logit contributions | |
coins | -4.875 |
iton | -4.245 |
rox | -4.125 |
img | -4.091 |
wine | -3.999 |
Token | to |
Token ID | 284 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
bipartisan | +8.664 |
� | +8.481 |
political | +8.208 |
politically | +8.185 |
geopolitical | +7.922 |
Neg logit contributions | |
coins | -3.271 |
detects | -3.009 |
contains | -2.879 |
iton | -2.778 |
img | -2.679 |
Token | her |
Token ID | 607 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
bipartisan | +2.153 |
� | +2.148 |
political | +2.074 |
politically | +2.046 |
� | +2.000 |
Neg logit contributions | |
coins | -1.379 |
detects | -1.312 |
contains | -1.241 |
iton | -1.228 |
img | -1.209 |
Token | as |
Token ID | 355 |
Feature activation | +2.99e+01 |
Pos logit contributions | |
� | +24.737 |
political | +24.282 |
bipartisan | +24.119 |
politically | +23.474 |
� | +23.335 |
Neg logit contributions | |
coins | -16.028 |
detects | -14.605 |
img | -13.935 |
iton | -13.835 |
wine | -13.311 |
Token | a |
Token ID | 257 |
Feature activation | +4.73e+01 |
Pos logit contributions | |
� | +31.144 |
bipartisan | +30.141 |
political | +30.019 |
� | +29.977 |
politically | +29.377 |
Neg logit contributions | |
coins | -16.463 |
detects | -15.922 |
iton | -15.065 |
img | -14.460 |
wine | -14.407 |
Token | � |
Token ID | 564 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
� | +40.067 |
� | +39.478 |
political | +39.442 |
bipartisan | +38.698 |
politically | +37.548 |
Neg logit contributions | |
coins | -19.146 |
detects | -17.222 |
iton | -16.710 |
img | -16.121 |
wine | -15.507 |
Token | � |
Token ID | 250 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
� | +11.871 |
bipartisan | +11.505 |
political | +10.891 |
� | +10.879 |
politically | +10.761 |
Neg logit contributions | |
coins | -10.995 |
detects | -10.740 |
contains | -10.132 |
iton | -10.118 |
img | -9.668 |
Token | main |
Token ID | 12417 |
Feature activation | +9.22e+00 |
Pos logit contributions | |
� | +20.235 |
bipartisan | +19.477 |
political | +19.237 |
politically | +18.728 |
� | +18.458 |
Neg logit contributions | |
detects | -10.711 |
coins | -10.127 |
contains | -9.811 |
iton | -9.632 |
completes | -8.760 |
Token | stream |
Token ID | 5532 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
� | +12.415 |
bipartisan | +12.290 |
political | +12.069 |
� | +11.640 |
politically | +11.616 |
Neg logit contributions | |
coins | -6.587 |
detects | -6.417 |
rox | -5.912 |
contains | -5.887 |
iton | -5.698 |
Token | social |
Token ID | 1919 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
� | +20.992 |
political | +20.496 |
bipartisan | +20.095 |
� | +19.580 |
politically | +19.295 |
Neg logit contributions | |
coins | -13.417 |
detects | -12.576 |
iton | -11.888 |
img | -11.598 |
rox | -11.471 |
Token | he |
Token ID | 339 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
� | +10.931 |
bipartisan | +10.931 |
political | +10.765 |
politically | +10.596 |
� | +10.253 |
Neg logit contributions | |
coins | -6.647 |
detects | -6.025 |
iton | -5.914 |
img | -5.773 |
rox | -5.741 |
Token | has |
Token ID | 468 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
� | +15.520 |
politically | +14.494 |
bipartisan | +14.441 |
� | +14.414 |
political | +14.281 |
Neg logit contributions | |
coins | -9.150 |
rox | -7.920 |
iton | -7.917 |
mitter | -7.872 |
img | -7.743 |
Token | called |
Token ID | 1444 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
bipartisan | +19.691 |
� | +19.546 |
political | +19.208 |
politically | +19.081 |
� | +18.367 |
Neg logit contributions | |
coins | -15.648 |
rox | -13.877 |
detects | -13.865 |
mitter | -13.838 |
iton | -13.789 |
Token | the |
Token ID | 262 |
Feature activation | +2.54e+01 |
Pos logit contributions | |
� | +14.260 |
bipartisan | +14.239 |
political | +13.968 |
politically | +13.712 |
� | +13.480 |
Neg logit contributions | |
coins | -7.499 |
detects | -6.851 |
iton | -6.477 |
wine | -6.426 |
rox | -6.419 |
Token | Holocaust |
Token ID | 18661 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
political | +23.925 |
bipartisan | +23.810 |
� | +23.720 |
politically | +22.815 |
� | +22.745 |
Neg logit contributions | |
coins | -19.196 |
detects | -18.434 |
iton | -18.220 |
assium | -17.345 |
wine | -17.225 |
Token | a |
Token ID | 257 |
Feature activation | +4.66e+01 |
Pos logit contributions | |
� | +24.201 |
bipartisan | +23.299 |
� | +22.993 |
political | +22.781 |
politically | +22.750 |
Neg logit contributions | |
coins | -16.933 |
wine | -15.741 |
detects | -15.739 |
iton | -15.693 |
img | -15.232 |
Token | � |
Token ID | 564 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
political | +37.169 |
� | +36.786 |
� | +36.508 |
bipartisan | +36.269 |
politically | +35.714 |
Neg logit contributions | |
coins | -23.967 |
detects | -21.645 |
iton | -21.036 |
wine | -21.033 |
assium | -20.999 |
Token | � |
Token ID | 250 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
� | +11.536 |
bipartisan | +10.957 |
� | +10.541 |
political | +10.373 |
politically | +10.085 |
Neg logit contributions | |
coins | -12.475 |
detects | -12.352 |
iton | -11.517 |
contains | -11.318 |
wine | -11.038 |
Token | my |
Token ID | 1820 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
� | +24.285 |
bipartisan | +22.471 |
political | +22.377 |
� | +22.083 |
politically | +21.863 |
Neg logit contributions | |
detects | -13.497 |
coins | -11.972 |
contains | -11.673 |
assium | -11.536 |
iton | -11.323 |
Token | th |
Token ID | 400 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
� | +18.712 |
political | +17.882 |
bipartisan | +17.668 |
� | +17.623 |
politically | +17.151 |
Neg logit contributions | |
coins | -12.989 |
detects | -12.574 |
contains | -11.341 |
assium | -11.318 |
iton | -11.088 |
Token | � |
Token ID | 447 |
Feature activation | +6.31e+00 |
Pos logit contributions | |
� | +22.789 |
� | +20.701 |
bipartisan | +20.412 |
politically | +20.180 |
political | +20.018 |
Neg logit contributions | |
coins | -11.364 |
detects | -11.306 |
iton | -10.155 |
contains | -10.002 |
wine | -9.939 |
Token |
|
Token ID | 198 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
� | +22.487 |
� | +20.540 |
| +18.918 |
bipartisan | +16.908 |
political | +16.375 |
Neg logit contributions | |
detects | -26.287 |
eatures | -25.537 |
coins | -24.885 |
assium | -24.287 |
yip | -24.059 |
Token | The |
Token ID | 464 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
� | +18.349 |
� | +16.118 |
bipartisan | +15.954 |
political | +15.309 |
politically | +14.765 |
Neg logit contributions | |
detects | -12.224 |
coins | -11.390 |
contains | -10.864 |
iton | -10.751 |
assium | -10.394 |
Token | row |
Token ID | 5752 |
Feature activation | +8.99e+00 |
Pos logit contributions | |
bipartisan | +19.087 |
� | +19.003 |
political | +18.693 |
politically | +18.157 |
� | +18.145 |
Neg logit contributions | |
coins | -13.810 |
detects | -13.229 |
iton | -12.201 |
contains | -12.006 |
img | -11.996 |
Token | comes |
Token ID | 2058 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
� | +13.220 |
bipartisan | +12.561 |
� | +12.402 |
politically | +12.194 |
political | +12.192 |
Neg logit contributions | |
coins | -5.643 |
detects | -5.077 |
iton | -5.012 |
rox | -4.792 |
img | -4.733 |
Token | amid |
Token ID | 10371 |
Feature activation | +3.09e+01 |
Pos logit contributions | |
� | +20.604 |
bipartisan | +20.283 |
political | +19.920 |
� | +19.618 |
politically | +19.500 |
Neg logit contributions | |
coins | -15.617 |
detects | -14.396 |
img | -14.209 |
rox | -13.852 |
mitter | -13.798 |
Token | a |
Token ID | 257 |
Feature activation | +4.54e+01 |
Pos logit contributions | |
bipartisan | +29.673 |
political | +29.390 |
� | +28.987 |
politically | +28.194 |
� | +27.984 |
Neg logit contributions | |
coins | -19.472 |
detects | -17.823 |
img | -17.002 |
rox | -16.578 |
iton | -16.498 |
Token | growing |
Token ID | 3957 |
Feature activation | +3.23e+01 |
Pos logit contributions | |
bipartisan | +36.835 |
political | +36.547 |
� | +35.457 |
politically | +35.188 |
� | +34.447 |
Neg logit contributions | |
coins | -23.539 |
detects | -20.523 |
mitter | -19.877 |
rox | -19.205 |
img | -18.799 |
Token | debate |
Token ID | 4384 |
Feature activation | +2.13e+01 |
Pos logit contributions | |
bipartisan | +29.983 |
political | +29.564 |
� | +27.778 |
politically | +27.436 |
� | +27.120 |
Neg logit contributions | |
coins | -21.825 |
mitter | -18.962 |
detects | -18.611 |
assium | -18.332 |
wine | -18.203 |
Token | about |
Token ID | 546 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
� | +23.591 |
� | +22.237 |
bipartisan | +22.130 |
political | +21.853 |
politically | +21.633 |
Neg logit contributions | |
coins | -15.172 |
detects | -14.096 |
assium | -13.641 |
rox | -13.313 |
itely | -13.285 |
Token | freedom |
Token ID | 4925 |
Feature activation | +9.13e+00 |
Pos logit contributions | |
political | +23.636 |
� | +23.260 |
bipartisan | +22.998 |
� | +22.862 |
politically | +22.806 |
Neg logit contributions | |
coins | -15.179 |
detects | -12.998 |
mitter | -12.824 |
img | -12.796 |
assium | -12.783 |
Token | of |
Token ID | 286 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
� | +13.463 |
bipartisan | +13.212 |
political | +12.783 |
politically | +12.700 |
� | +12.569 |
Neg logit contributions | |
coins | -5.995 |
detects | -5.616 |
iton | -5.258 |
contains | -5.193 |
img | -5.128 |
Token | was |
Token ID | 373 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
� | +11.953 |
bipartisan | +11.763 |
political | +11.382 |
politically | +11.242 |
� | +11.090 |
Neg logit contributions | |
coins | -5.349 |
detects | -4.975 |
img | -4.464 |
rox | -4.434 |
iton | -4.383 |
Token | 20 |
Token ID | 1160 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
bipartisan | +19.554 |
� | +19.553 |
political | +18.742 |
politically | +18.444 |
� | +18.392 |
Neg logit contributions | |
coins | -14.135 |
detects | -12.926 |
rox | -12.867 |
mitter | -12.587 |
img | -12.525 |
Token | years |
Token ID | 812 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
� | +12.210 |
bipartisan | +11.918 |
political | +11.496 |
politically | +10.936 |
� | +10.831 |
Neg logit contributions | |
coins | -13.247 |
detects | -12.882 |
iton | -12.573 |
mitter | -12.299 |
wine | -12.179 |
Token | ago |
Token ID | 2084 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
� | +12.648 |
bipartisan | +11.906 |
� | +11.482 |
political | +11.333 |
politically | +11.250 |
Neg logit contributions | |
coins | -11.840 |
detects | -11.058 |
iton | -10.576 |
rox | -10.436 |
img | -10.347 |
Token | . |
Token ID | 13 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
� | +24.958 |
bipartisan | +23.084 |
� | +22.935 |
political | +22.407 |
politically | +22.362 |
Neg logit contributions | |
coins | -15.625 |
detects | -15.157 |
rox | -14.181 |
img | -13.888 |
wine | -13.846 |
Token |
|
Token ID | 198 |
Feature activation | +4.49e+01 |
Pos logit contributions | |
� | +30.458 |
� | +28.133 |
bipartisan | +26.963 |
Democratic | +25.975 |
political | +25.824 |
Neg logit contributions | |
coins | -19.391 |
detects | -19.361 |
mitter | -17.997 |
wine | -17.499 |
rox | -17.429 |
Token |
|
Token ID | 198 |
Feature activation | +3.18e+01 |
Pos logit contributions | |
� | +28.068 |
� | +25.392 |
| +23.639 |
bipartisan | +20.134 |
political | +19.394 |
Neg logit contributions | |
eatures | -29.920 |
detects | -28.917 |
senal | -27.595 |
yip | -27.553 |
coins | -26.788 |
Token | � |
Token ID | 447 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
� | +33.573 |
� | +28.782 |
bipartisan | +27.843 |
political | +26.454 |
| +25.582 |
Neg logit contributions | |
detects | -19.641 |
coins | -17.131 |
contains | -16.844 |
iton | -16.532 |
behaves | -15.942 |
Token | � |
Token ID | 250 |
Feature activation | +4.54e+00 |
Pos logit contributions | |
� | +2.057 |
bipartisan | +2.020 |
political | +1.886 |
� | +1.884 |
politically | +1.861 |
Neg logit contributions | |
coins | -1.799 |
detects | -1.747 |
iton | -1.655 |
contains | -1.654 |
wine | -1.600 |
Token | But |
Token ID | 1537 |
Feature activation | +8.82e+00 |
Pos logit contributions | |
� | +5.471 |
bipartisan | +5.237 |
political | +4.950 |
� | +4.860 |
politically | +4.823 |
Neg logit contributions | |
detects | -4.387 |
coins | -4.302 |
contains | -4.060 |
iton | -3.982 |
rox | -3.854 |
Token | in |
Token ID | 287 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
� | +12.259 |
bipartisan | +12.196 |
political | +11.802 |
politically | +11.602 |
� | +11.362 |
Neg logit contributions | |
coins | -6.179 |
detects | -5.788 |
img | -5.343 |
contains | -5.309 |
iton | -5.222 |
Token | season |
Token ID | 1622 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
bipartisan | +20.790 |
� | +20.591 |
political | +20.253 |
politically | +20.158 |
� | +19.566 |
Neg logit contributions | |
coins | -11.685 |
detects | -10.878 |
rox | -10.591 |
mitter | -10.584 |
img | -10.431 |
Token | with |
Token ID | 351 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
� | +23.769 |
bipartisan | +23.464 |
politically | +22.929 |
political | +22.744 |
� | +22.448 |
Neg logit contributions | |
coins | -12.889 |
detects | -12.058 |
rox | -11.377 |
mitter | -11.209 |
img | -11.198 |
Token | bragging |
Token ID | 43018 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
bipartisan | +21.058 |
political | +19.990 |
politically | +19.454 |
� | +18.933 |
ideological | +18.411 |
Neg logit contributions | |
coins | -13.605 |
detects | -12.820 |
img | -12.565 |
rox | -12.467 |
iton | -12.209 |
Token | rights |
Token ID | 2489 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
bipartisan | +2.813 |
� | +2.736 |
political | +2.656 |
politically | +2.601 |
� | +2.443 |
Neg logit contributions | |
coins | -4.294 |
detects | -4.290 |
iton | -4.134 |
img | -4.102 |
rox | -4.098 |
Token | . |
Token ID | 13 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
� | +23.213 |
bipartisan | +22.226 |
politically | +21.943 |
political | +21.743 |
� | +21.723 |
Neg logit contributions | |
detects | -13.287 |
coins | -13.203 |
rox | -12.492 |
img | -12.379 |
mitter | -12.227 |
Token |
|
Token ID | 198 |
Feature activation | +4.48e+01 |
Pos logit contributions | |
� | +29.361 |
� | +27.153 |
bipartisan | +25.958 |
political | +24.975 |
Democratic | +24.839 |
Neg logit contributions | |
detects | -19.831 |
coins | -19.635 |
mitter | -18.809 |
iton | -18.117 |
rox | -18.033 |
Token |
|
Token ID | 198 |
Feature activation | +3.33e+01 |
Pos logit contributions | |
� | +27.523 |
� | +25.179 |
| +23.544 |
bipartisan | +19.840 |
political | +19.161 |
Neg logit contributions | |
eatures | -30.191 |
detects | -28.994 |
senal | -28.137 |
yip | -27.539 |
coins | -27.019 |
Token | � |
Token ID | 447 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
� | +34.782 |
� | +29.985 |
bipartisan | +28.912 |
political | +27.422 |
| +26.625 |
Neg logit contributions | |
detects | -20.177 |
contains | -17.391 |
coins | -17.260 |
iton | -16.993 |
behaves | -16.213 |
Token | � |
Token ID | 250 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
coins | +1.626 |
detects | +1.580 |
contains | +1.494 |
iton | +1.489 |
wine | +1.438 |
Neg logit contributions | |
� | -1.938 |
bipartisan | -1.916 |
political | -1.793 |
� | -1.778 |
politically | -1.773 |
Token | In |
Token ID | 818 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
� | +1.442 |
bipartisan | +1.393 |
political | +1.313 |
politically | +1.286 |
� | +1.284 |
Neg logit contributions | |
detects | -1.252 |
coins | -1.236 |
contains | -1.174 |
iton | -1.153 |
rox | -1.113 |
Token | this |
Token ID | 428 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
bipartisan | +12.722 |
� | +12.468 |
political | +12.258 |
politically | +11.976 |
� | +11.508 |
Neg logit contributions | |
coins | -8.271 |
detects | -8.068 |
contains | -7.486 |
rox | -7.387 |
img | -7.300 |
Token | the |
Token ID | 262 |
Feature activation | +4.88e+00 |
Pos logit contributions | |
coins | +4.401 |
detects | +4.169 |
contains | +4.014 |
iton | +3.952 |
img | +3.889 |
Neg logit contributions | |
bipartisan | -6.201 |
� | -6.142 |
political | -5.860 |
politically | -5.836 |
� | -5.654 |
Token | bench |
Token ID | 7624 |
Feature activation | +7.98e+00 |
Pos logit contributions | |
� | +5.545 |
bipartisan | +5.513 |
political | +5.251 |
politically | +5.121 |
� | +5.028 |
Neg logit contributions | |
coins | -4.940 |
detects | -4.610 |
iton | -4.417 |
contains | -4.378 |
img | -4.364 |
Token | . |
Token ID | 13 |
Feature activation | +8.53e+00 |
Pos logit contributions | |
� | +10.784 |
bipartisan | +10.218 |
� | +9.986 |
political | +9.826 |
politically | +9.824 |
Neg logit contributions | |
coins | -6.184 |
detects | -5.811 |
iton | -5.459 |
wine | -5.452 |
img | -5.414 |
Token | � |
Token ID | 447 |
Feature activation | +4.52e+00 |
Pos logit contributions | |
� | +9.424 |
bipartisan | +8.984 |
� | +8.595 |
political | +8.468 |
politically | +8.368 |
Neg logit contributions | |
coins | -8.738 |
detects | -8.556 |
contains | -8.049 |
iton | -7.945 |
wine | -7.859 |
Token | � |
Token ID | 251 |
Feature activation | +7.37e+00 |
Pos logit contributions | |
� | +5.281 |
bipartisan | +5.267 |
political | +4.951 |
politically | +4.919 |
� | +4.829 |
Neg logit contributions | |
coins | -4.430 |
detects | -4.207 |
contains | -4.044 |
iton | -4.017 |
img | -3.929 |
Token |
|
Token ID | 198 |
Feature activation | +4.43e+01 |
Pos logit contributions | |
� | +8.591 |
bipartisan | +7.930 |
� | +7.842 |
political | +7.587 |
politically | +7.456 |
Neg logit contributions | |
coins | -7.108 |
detects | -6.997 |
contains | -6.473 |
iton | -6.373 |
wine | -6.368 |
Token |
|
Token ID | 198 |
Feature activation | +2.69e+01 |
Pos logit contributions | |
� | +27.170 |
� | +24.523 |
| +22.299 |
bipartisan | +18.574 |
political | +17.870 |
Neg logit contributions | |
eatures | -31.990 |
senal | -30.265 |
detects | -30.024 |
yip | -29.073 |
perpend | -27.809 |
Token | Gl |
Token ID | 9861 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
� | +30.984 |
� | +27.458 |
bipartisan | +26.229 |
political | +24.973 |
| +24.714 |
Neg logit contributions | |
detects | -18.351 |
coins | -17.008 |
contains | -16.375 |
iton | -15.894 |
behaves | -15.315 |
Token | as |
Token ID | 292 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
coins | +4.216 |
detects | +3.747 |
contains | +3.437 |
iton | +3.306 |
img | +3.169 |
Neg logit contributions | |
bipartisan | -17.530 |
� | -17.403 |
political | -16.826 |
politically | -16.787 |
� | -16.400 |
Token | gow |
Token ID | 21175 |
Feature activation | -9.17e+00 |
Pos logit contributions | |
coins | +17.214 |
detects | +16.172 |
iton | +16.150 |
contains | +15.952 |
img | +15.615 |
Neg logit contributions | |
bipartisan | -16.677 |
� | -15.947 |
� | -15.755 |
political | -15.372 |
politically | -15.293 |
Token | Warriors |
Token ID | 12090 |
Feature activation | +4.37e+00 |
Pos logit contributions | |
coins | +10.207 |
detects | +9.826 |
contains | +9.641 |
iton | +9.413 |
img | +9.315 |
Neg logit contributions | |
bipartisan | -9.173 |
� | -8.890 |
politically | -8.435 |
political | -8.426 |
� | -8.029 |
Token | and |
Token ID | 290 |
Feature activation | +6.96e+00 |
Pos logit contributions | |
� | +18.670 |
bipartisan | +17.703 |
political | +17.457 |
politically | +17.314 |
� | +17.262 |
Neg logit contributions | |
coins | -8.388 |
detects | -7.788 |
img | -7.669 |
iton | -7.433 |
rox | -7.390 |
Token | Washington |
Token ID | 2669 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
bipartisan | +7.695 |
� | +7.492 |
political | +7.383 |
politically | +7.162 |
� | +6.984 |
Neg logit contributions | |
coins | -7.106 |
iton | -6.493 |
rox | -6.435 |
detects | -6.354 |
img | -6.283 |
Token | on |
Token ID | 319 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
� | +17.896 |
bipartisan | +17.129 |
political | +16.883 |
� | +16.768 |
politically | +16.582 |
Neg logit contributions | |
coins | -9.179 |
detects | -8.638 |
img | -8.290 |
iton | -8.172 |
rox | -8.167 |
Token | weed |
Token ID | 20349 |
Feature activation | +3.60e+00 |
Pos logit contributions | |
bipartisan | +18.031 |
political | +17.829 |
politically | +17.262 |
� | +17.031 |
constitutional | +16.237 |
Neg logit contributions | |
coins | -12.533 |
iton | -11.287 |
detects | -11.281 |
img | -11.176 |
rox | -11.128 |
Token | . |
Token ID | 13 |
Feature activation | +2.65e+01 |
Pos logit contributions | |
� | +4.424 |
bipartisan | +4.404 |
political | +4.235 |
politically | +4.172 |
� | +4.070 |
Neg logit contributions | |
coins | -3.323 |
detects | -3.122 |
iton | -3.037 |
img | -3.010 |
rox | -2.980 |
Token |
|
Token ID | 198 |
Feature activation | +4.40e+01 |
Pos logit contributions | |
� | +26.923 |
� | +24.807 |
bipartisan | +24.284 |
political | +23.176 |
| +22.602 |
Neg logit contributions | |
detects | -19.070 |
coins | -18.973 |
iton | -18.261 |
mitter | -18.150 |
rox | -17.724 |
Token |
|
Token ID | 198 |
Feature activation | +2.31e+01 |
Pos logit contributions | |
� | +26.759 |
� | +24.132 |
| +22.575 |
bipartisan | +19.340 |
political | +18.683 |
Neg logit contributions | |
eatures | -30.548 |
detects | -29.495 |
senal | -28.275 |
yip | -27.996 |
coins | -27.574 |
Token | � |
Token ID | 447 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
� | +25.871 |
� | +22.045 |
bipartisan | +21.625 |
political | +20.529 |
| +19.822 |
Neg logit contributions | |
detects | -17.616 |
iton | -15.850 |
coins | -15.594 |
contains | -15.381 |
assium | -14.830 |
Token | � |
Token ID | 250 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
� | +1.182 |
bipartisan | +1.159 |
� | +1.086 |
political | +1.078 |
politically | +1.064 |
Neg logit contributions | |
coins | -1.037 |
detects | -1.009 |
iton | -0.953 |
contains | -0.948 |
wine | -0.914 |
Token | The |
Token ID | 464 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
� | +4.279 |
bipartisan | +4.114 |
political | +3.894 |
� | +3.865 |
politically | +3.821 |
Neg logit contributions | |
coins | -3.080 |
detects | -3.077 |
iton | -2.868 |
contains | -2.855 |
rox | -2.734 |
Token | Obama |
Token ID | 2486 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
bipartisan | +23.248 |
political | +22.765 |
� | +21.989 |
politically | +21.773 |
� | +20.865 |
Neg logit contributions | |
coins | -16.407 |
detects | -15.449 |
iton | -14.592 |
img | -14.329 |
contains | -14.228 |
Token | there |
Token ID | 612 |
Feature activation | +2.99e+01 |
Pos logit contributions | |
� | +23.437 |
� | +21.735 |
politically | +21.637 |
bipartisan | +21.581 |
political | +20.964 |
Neg logit contributions | |
coins | -14.054 |
detects | -12.594 |
wine | -12.540 |
rox | -12.299 |
mitter | -12.274 |
Token | . |
Token ID | 13 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
� | +32.168 |
� | +29.048 |
politically | +28.182 |
bipartisan | +27.817 |
political | +27.448 |
Neg logit contributions | |
coins | -16.745 |
detects | -15.514 |
wine | -14.567 |
mitter | -14.537 |
img | -14.423 |
Token | Here |
Token ID | 3423 |
Feature activation | +8.64e+00 |
Pos logit contributions | |
� | +18.725 |
� | +17.412 |
bipartisan | +16.917 |
political | +16.256 |
| +15.752 |
Neg logit contributions | |
coins | -12.202 |
detects | -11.698 |
mitter | -11.542 |
iton | -11.336 |
rox | -10.979 |
Token | goes |
Token ID | 2925 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
� | +13.608 |
bipartisan | +13.070 |
political | +12.751 |
� | +12.726 |
politically | +12.552 |
Neg logit contributions | |
coins | -4.715 |
detects | -4.285 |
iton | -4.034 |
img | -3.875 |
mitter | -3.802 |
Token | : |
Token ID | 25 |
Feature activation | +2.96e+01 |
Pos logit contributions | |
� | +17.310 |
bipartisan | +16.785 |
political | +16.177 |
� | +16.159 |
politically | +15.847 |
Neg logit contributions | |
coins | -10.665 |
detects | -9.926 |
rox | -9.269 |
wine | -9.075 |
img | -9.050 |
Token |
|
Token ID | 198 |
Feature activation | +4.38e+01 |
Pos logit contributions | |
� | +32.204 |
� | +30.200 |
bipartisan | +29.577 |
political | +29.217 |
politically | +28.362 |
Neg logit contributions | |
coins | -15.848 |
iton | -14.328 |
detects | -14.176 |
mitter | -14.022 |
wine | -13.902 |
Token |
|
Token ID | 198 |
Feature activation | +2.43e+01 |
Pos logit contributions | |
� | +26.595 |
� | +23.777 |
| +22.046 |
bipartisan | +19.206 |
political | +18.467 |
Neg logit contributions | |
eatures | -30.882 |
detects | -29.632 |
senal | -28.609 |
yip | -28.425 |
perpend | -27.558 |
Token | About |
Token ID | 8585 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
� | +27.286 |
� | +23.340 |
bipartisan | +22.884 |
political | +21.481 |
| +20.598 |
Neg logit contributions | |
detects | -17.011 |
coins | -15.254 |
iton | -15.054 |
contains | -14.684 |
assium | -14.072 |
Token | Aleppo |
Token ID | 18593 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
bipartisan | +14.241 |
political | +13.857 |
� | +13.855 |
politically | +13.397 |
� | +13.180 |
Neg logit contributions | |
coins | -8.455 |
detects | -7.638 |
iton | -7.566 |
img | -7.508 |
wine | -7.436 |
Token | and |
Token ID | 290 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
� | +16.127 |
� | +15.043 |
bipartisan | +14.958 |
political | +14.883 |
politically | +14.610 |
Neg logit contributions | |
coins | -8.899 |
detects | -8.300 |
wine | -7.989 |
iton | -7.946 |
img | -7.832 |
Token | Syria |
Token ID | 4392 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
� | +16.066 |
bipartisan | +15.887 |
political | +15.850 |
� | +15.333 |
politically | +15.254 |
Neg logit contributions | |
coins | -9.969 |
iton | -8.857 |
mitter | -8.852 |
detects | -8.821 |
wine | -8.781 |
Token | r |
Token ID | 81 |
Feature activation | -4.88e+00 |
Pos logit contributions | |
coins | +0.794 |
detects | +0.743 |
contains | +0.691 |
iton | +0.657 |
img | +0.632 |
Neg logit contributions | |
� | -1.730 |
bipartisan | -1.709 |
political | -1.645 |
politically | -1.633 |
� | -1.613 |
Token | / |
Token ID | 14 |
Feature activation | +6.67e+00 |
Pos logit contributions | |
coins | +2.702 |
detects | +2.477 |
contains | +2.325 |
iton | +2.261 |
img | +2.192 |
Neg logit contributions | |
bipartisan | -7.838 |
� | -7.782 |
political | -7.499 |
politically | -7.479 |
� | -7.295 |
Token | Getty |
Token ID | 6633 |
Feature activation | -2.93e+00 |
Pos logit contributions | |
� | +7.701 |
bipartisan | +7.348 |
political | +7.176 |
politically | +6.980 |
� | +6.940 |
Neg logit contributions | |
detects | -6.203 |
coins | -6.141 |
contains | -5.831 |
iton | -5.774 |
rox | -5.546 |
Token | Images |
Token ID | 5382 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
coins | +1.486 |
detects | +1.329 |
contains | +1.319 |
img | +1.229 |
iton | +1.177 |
Neg logit contributions | |
bipartisan | -4.740 |
� | -4.579 |
politically | -4.505 |
political | -4.467 |
geopolitical | -4.374 |
Token | ) |
Token ID | 8 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
bipartisan | +0.573 |
� | +0.559 |
politically | +0.544 |
political | +0.541 |
� | +0.528 |
Neg logit contributions | |
coins | -0.179 |
detects | -0.160 |
contains | -0.154 |
iton | -0.146 |
img | -0.142 |
Token |
|
Token ID | 198 |
Feature activation | +4.37e+01 |
Pos logit contributions | |
� | +19.880 |
bipartisan | +19.634 |
political | +18.644 |
politically | +18.417 |
� | +18.229 |
Neg logit contributions | |
coins | -14.726 |
detects | -14.136 |
iton | -13.358 |
contains | -13.353 |
img | -13.172 |
Token |
|
Token ID | 198 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
� | +26.910 |
� | +24.335 |
| +22.887 |
bipartisan | +20.078 |
political | +19.329 |
Neg logit contributions | |
eatures | -29.600 |
detects | -28.834 |
yip | -27.473 |
senal | -27.246 |
coins | -26.970 |
Token | South |
Token ID | 14942 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
� | +22.847 |
bipartisan | +19.661 |
� | +19.466 |
political | +18.448 |
| +17.845 |
Neg logit contributions | |
detects | -16.216 |
iton | -14.500 |
coins | -14.360 |
contains | -14.059 |
assium | -13.694 |
Token | Carolina |
Token ID | 5913 |
Feature activation | +9.53e+00 |
Pos logit contributions | |
� | +2.858 |
bipartisan | +2.797 |
political | +2.653 |
politically | +2.596 |
� | +2.565 |
Neg logit contributions | |
coins | -3.210 |
detects | -3.122 |
img | -3.002 |
contains | -2.968 |
iton | -2.949 |
Token | Sen |
Token ID | 2311 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
� | +11.507 |
bipartisan | +11.453 |
political | +11.169 |
� | +10.691 |
politically | +10.686 |
Neg logit contributions | |
coins | -8.159 |
detects | -7.628 |
img | -7.529 |
iton | -7.412 |
mitter | -7.300 |
Token | . |
Token ID | 13 |
Feature activation | +7.35e+00 |
Pos logit contributions | |
� | +0.638 |
bipartisan | +0.614 |
� | +0.588 |
political | +0.587 |
politically | +0.577 |
Neg logit contributions | |
coins | -0.401 |
detects | -0.398 |
contains | -0.361 |
rox | -0.354 |
iton | -0.353 |
Token | being |
Token ID | 852 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
bipartisan | +2.749 |
� | +2.728 |
political | +2.636 |
politically | +2.625 |
� | +2.549 |
Neg logit contributions | |
coins | -1.542 |
detects | -1.416 |
iton | -1.360 |
img | -1.348 |
rox | -1.336 |
Token | on |
Token ID | 319 |
Feature activation | +6.33e-01 |
Pos logit contributions | |
coins | +1.735 |
detects | +1.657 |
iton | +1.618 |
contains | +1.601 |
img | +1.598 |
Neg logit contributions | |
bipartisan | -0.998 |
� | -0.963 |
political | -0.919 |
politically | -0.918 |
� | -0.849 |
Token | the |
Token ID | 262 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
bipartisan | +0.953 |
� | +0.943 |
political | +0.919 |
politically | +0.908 |
� | +0.887 |
Neg logit contributions | |
coins | -0.420 |
detects | -0.390 |
iton | -0.366 |
contains | -0.364 |
img | -0.359 |
Token | table |
Token ID | 3084 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
bipartisan | +19.547 |
political | +19.470 |
� | +18.927 |
politically | +18.904 |
� | +17.601 |
Neg logit contributions | |
coins | -16.085 |
detects | -15.965 |
assium | -15.262 |
img | -15.216 |
iton | -15.088 |
Token | . |
Token ID | 13 |
Feature activation | +2.99e+01 |
Pos logit contributions | |
� | +14.570 |
bipartisan | +14.200 |
politically | +14.045 |
political | +13.765 |
� | +13.598 |
Neg logit contributions | |
coins | -8.881 |
detects | -8.313 |
img | -7.878 |
rox | -7.794 |
iton | -7.757 |
Token |
|
Token ID | 198 |
Feature activation | +4.37e+01 |
Pos logit contributions | |
� | +31.608 |
� | +29.654 |
bipartisan | +28.684 |
political | +27.254 |
| +26.629 |
Neg logit contributions | |
detects | -19.347 |
coins | -19.238 |
mitter | -18.019 |
iton | -17.919 |
rox | -17.793 |
Token |
|
Token ID | 198 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
� | +26.781 |
� | +24.271 |
| +22.569 |
bipartisan | +19.178 |
political | +18.385 |
Neg logit contributions | |
eatures | -30.500 |
detects | -29.442 |
senal | -28.396 |
yip | -28.120 |
coins | -27.696 |
Token | � |
Token ID | 447 |
Feature activation | -5.24e+00 |
Pos logit contributions | |
� | +21.063 |
� | +18.286 |
bipartisan | +17.997 |
political | +16.897 |
| +16.309 |
Neg logit contributions | |
detects | -15.215 |
coins | -13.772 |
iton | -13.437 |
contains | -13.310 |
behaves | -12.850 |
Token | � |
Token ID | 250 |
Feature activation | -5.71e+00 |
Pos logit contributions | |
coins | +5.043 |
detects | +4.852 |
contains | +4.608 |
iton | +4.563 |
img | +4.425 |
Neg logit contributions | |
� | -6.502 |
bipartisan | -6.475 |
political | -6.072 |
politically | -6.030 |
� | -5.979 |
Token | I |
Token ID | 40 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
coins | +6.132 |
detects | +5.875 |
contains | +5.692 |
iton | +5.619 |
img | +5.538 |
Neg logit contributions | |
bipartisan | -6.185 |
� | -6.123 |
political | -5.787 |
politically | -5.762 |
� | -5.551 |
Token | think |
Token ID | 892 |
Feature activation | -6.64e+00 |
Pos logit contributions | |
� | +21.064 |
� | +19.404 |
bipartisan | +19.022 |
politically | +18.235 |
political | +18.181 |
Neg logit contributions | |
coins | -12.973 |
detects | -12.164 |
iton | -11.778 |
ames | -11.478 |
img | -11.456 |
Token | s |
Token ID | 82 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
� | +15.604 |
bipartisan | +14.833 |
political | +14.531 |
� | +14.452 |
politically | +14.310 |
Neg logit contributions | |
coins | -5.985 |
detects | -5.853 |
iton | -5.551 |
contains | -5.371 |
rox | -5.318 |
Token | emails |
Token ID | 7237 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
bipartisan | +19.349 |
political | +19.233 |
� | +18.783 |
politically | +18.522 |
� | +17.616 |
Neg logit contributions | |
coins | -13.985 |
detects | -13.230 |
iton | -13.121 |
mitter | -12.891 |
rox | -12.885 |
Token | . |
Token ID | 13 |
Feature activation | +3.36e+01 |
Pos logit contributions | |
� | +26.586 |
� | +24.459 |
politically | +23.442 |
bipartisan | +23.259 |
political | +23.218 |
Neg logit contributions | |
coins | -14.088 |
detects | -13.747 |
iton | -13.304 |
wine | -13.199 |
rox | -12.780 |
Token | � |
Token ID | 447 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
� | +33.470 |
� | +31.092 |
bipartisan | +28.862 |
political | +27.932 |
| +27.638 |
Neg logit contributions | |
detects | -19.085 |
coins | -18.604 |
mitter | -17.726 |
iton | -17.607 |
rox | -17.343 |
Token | � |
Token ID | 251 |
Feature activation | +2.60e+01 |
Pos logit contributions | |
� | +13.876 |
bipartisan | +13.847 |
political | +13.093 |
politically | +12.971 |
� | +12.755 |
Neg logit contributions | |
coins | -10.514 |
detects | -9.956 |
contains | -9.543 |
iton | -9.498 |
img | -9.204 |
Token |
|
Token ID | 198 |
Feature activation | +4.36e+01 |
Pos logit contributions | |
� | +29.433 |
� | +27.114 |
bipartisan | +26.056 |
political | +25.426 |
politically | +24.607 |
Neg logit contributions | |
coins | -16.675 |
detects | -16.271 |
iton | -15.006 |
wine | -14.989 |
rox | -14.499 |
Token |
|
Token ID | 198 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
� | +27.473 |
� | +24.625 |
| +22.991 |
bipartisan | +20.165 |
political | +19.256 |
Neg logit contributions | |
eatures | -29.482 |
detects | -28.747 |
yip | -27.038 |
coins | -26.743 |
senal | -26.647 |
Token | The |
Token ID | 464 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
� | +30.353 |
� | +25.503 |
bipartisan | +24.689 |
political | +23.484 |
| +23.153 |
Neg logit contributions | |
detects | -19.570 |
coins | -17.263 |
iton | -17.130 |
contains | -16.827 |
behaves | -16.586 |
Token | Lerner |
Token ID | 49750 |
Feature activation | -4.91e-01 |
Pos logit contributions | |
bipartisan | +14.490 |
political | +13.986 |
politically | +13.757 |
� | +13.667 |
troubling | +12.796 |
Neg logit contributions | |
coins | -12.693 |
detects | -12.034 |
iton | -11.506 |
rox | -11.330 |
img | -11.232 |
Token | emails |
Token ID | 7237 |
Feature activation | +4.06e+00 |
Pos logit contributions | |
coins | +0.555 |
detects | +0.532 |
iton | +0.513 |
contains | +0.511 |
img | +0.504 |
Neg logit contributions | |
bipartisan | -0.512 |
� | -0.511 |
political | -0.486 |
politically | -0.479 |
� | -0.461 |
Token | have |
Token ID | 423 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
� | +5.688 |
bipartisan | +5.549 |
political | +5.352 |
politically | +5.334 |
� | +5.316 |
Neg logit contributions | |
coins | -3.131 |
detects | -2.876 |
iton | -2.812 |
img | -2.722 |
rox | -2.721 |
Token | judge |
Token ID | 5052 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
� | +15.105 |
bipartisan | +14.637 |
political | +14.156 |
� | +13.776 |
politically | +13.537 |
Neg logit contributions | |
coins | -8.984 |
detects | -8.343 |
img | -8.067 |
rox | -7.906 |
iton | -7.768 |
Token | sided |
Token ID | 34384 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
� | +15.905 |
bipartisan | +14.947 |
� | +14.629 |
political | +14.414 |
politically | +14.081 |
Neg logit contributions | |
coins | -9.587 |
detects | -8.455 |
rox | -8.438 |
img | -8.427 |
iton | -8.255 |
Token | with |
Token ID | 351 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
bipartisan | +16.963 |
� | +16.951 |
political | +16.228 |
politically | +16.212 |
� | +15.931 |
Neg logit contributions | |
coins | -5.764 |
detects | -5.220 |
contains | -4.831 |
iton | -4.800 |
img | -4.712 |
Token | Ottawa |
Token ID | 14074 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
coins | +4.768 |
detects | +4.554 |
contains | +4.411 |
iton | +4.350 |
img | +4.287 |
Neg logit contributions | |
bipartisan | -5.186 |
� | -5.129 |
political | -4.864 |
politically | -4.847 |
� | -4.670 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
� | +16.424 |
bipartisan | +15.213 |
� | +15.108 |
political | +14.993 |
politically | +14.768 |
Neg logit contributions | |
coins | -8.677 |
detects | -8.059 |
img | -7.722 |
rox | -7.492 |
contains | -7.488 |
Token |
|
Token ID | 198 |
Feature activation | +4.34e+01 |
Pos logit contributions | |
� | +19.310 |
� | +17.827 |
bipartisan | +17.551 |
political | +16.983 |
politically | +16.287 |
Neg logit contributions | |
coins | -16.060 |
detects | -15.291 |
rox | -14.347 |
iton | -14.304 |
img | -14.106 |
Token |
|
Token ID | 198 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
� | +26.663 |
� | +24.392 |
| +21.915 |
bipartisan | +19.222 |
political | +18.739 |
Neg logit contributions | |
eatures | -29.939 |
detects | -29.377 |
senal | -28.068 |
coins | -27.332 |
perpend | -27.102 |
Token | But |
Token ID | 1537 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
� | +21.978 |
� | +19.193 |
bipartisan | +18.862 |
political | +18.110 |
politically | +17.441 |
Neg logit contributions | |
detects | -14.235 |
coins | -13.378 |
contains | -12.537 |
iton | -12.260 |
behaves | -11.771 |
Token | the |
Token ID | 262 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
coins | +1.216 |
detects | +1.147 |
contains | +1.090 |
img | +1.086 |
iton | +1.079 |
Neg logit contributions | |
bipartisan | -1.475 |
� | -1.473 |
political | -1.409 |
politically | -1.393 |
� | -1.353 |
Token | Court |
Token ID | 3078 |
Feature activation | +5.26e+00 |
Pos logit contributions | |
bipartisan | +11.603 |
� | +11.417 |
political | +11.359 |
politically | +11.075 |
� | +10.511 |
Neg logit contributions | |
coins | -11.744 |
detects | -11.180 |
img | -10.801 |
wine | -10.510 |
iton | -10.467 |
Token | of |
Token ID | 286 |
Feature activation | +3.88e-01 |
Pos logit contributions | |
bipartisan | +8.126 |
� | +8.052 |
political | +7.757 |
politically | +7.740 |
� | +7.530 |
Neg logit contributions | |
coins | -3.219 |
detects | -2.978 |
contains | -2.819 |
iton | -2.744 |
img | -2.669 |
Token | be |
Token ID | 307 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
� | +18.392 |
bipartisan | +16.884 |
� | +16.718 |
politically | +16.522 |
political | +16.418 |
Neg logit contributions | |
coins | -12.521 |
detects | -11.783 |
img | -11.487 |
iton | -11.439 |
rox | -11.389 |
Token | legal |
Token ID | 2742 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
bipartisan | +15.150 |
� | +14.775 |
political | +14.491 |
politically | +14.368 |
� | +13.811 |
Neg logit contributions | |
coins | -9.761 |
iton | -9.105 |
rox | -9.009 |
detects | -8.937 |
img | -8.809 |
Token | . |
Token ID | 13 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
� | +17.653 |
bipartisan | +16.772 |
� | +16.602 |
politically | +16.432 |
political | +16.393 |
Neg logit contributions | |
coins | -11.108 |
detects | -10.337 |
rox | -10.018 |
img | -9.846 |
iton | -9.699 |
Token | � |
Token ID | 447 |
Feature activation | +2.97e+00 |
Pos logit contributions | |
� | +20.764 |
� | +19.470 |
bipartisan | +18.241 |
political | +17.319 |
| +17.272 |
Neg logit contributions | |
detects | -12.901 |
coins | -12.884 |
iton | -12.639 |
rox | -12.035 |
mitter | -11.881 |
Token | � |
Token ID | 251 |
Feature activation | +7.04e+00 |
Pos logit contributions | |
bipartisan | +3.596 |
� | +3.580 |
political | +3.388 |
politically | +3.365 |
� | +3.285 |
Neg logit contributions | |
coins | -2.814 |
detects | -2.660 |
contains | -2.557 |
iton | -2.548 |
img | -2.484 |
Token |
|
Token ID | 198 |
Feature activation | +4.33e+01 |
Pos logit contributions | |
� | +8.650 |
bipartisan | +8.235 |
� | +8.038 |
political | +7.824 |
politically | +7.649 |
Neg logit contributions | |
coins | -6.437 |
detects | -6.270 |
iton | -6.031 |
rox | -5.781 |
contains | -5.747 |
Token |
|
Token ID | 198 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
� | +26.940 |
� | +24.344 |
| +22.419 |
bipartisan | +19.676 |
political | +19.036 |
Neg logit contributions | |
eatures | -30.099 |
detects | -28.938 |
yip | -27.898 |
senal | -27.766 |
coins | -26.986 |
Token | In |
Token ID | 818 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
� | +24.720 |
bipartisan | +21.224 |
� | +21.158 |
political | +19.746 |
| +18.895 |
Neg logit contributions | |
detects | -16.751 |
iton | -15.217 |
coins | -14.867 |
contains | -14.723 |
behaves | -14.210 |
Token | a |
Token ID | 257 |
Feature activation | +3.26e+01 |
Pos logit contributions | |
bipartisan | +18.624 |
� | +18.150 |
political | +17.936 |
politically | +17.357 |
� | +17.009 |
Neg logit contributions | |
coins | -12.048 |
detects | -11.664 |
img | -11.060 |
iton | -11.040 |
rox | -10.938 |
Token | 2014 |
Token ID | 1946 |
Feature activation | +2.28e+01 |
Pos logit contributions | |
bipartisan | +31.577 |
political | +30.040 |
politically | +29.116 |
� | +28.732 |
troubling | +27.673 |
Neg logit contributions | |
coins | -20.763 |
detects | -18.321 |
rox | -17.753 |
img | -17.648 |
mitter | -17.585 |
Token | interview |
Token ID | 2720 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
bipartisan | +23.291 |
political | +22.517 |
� | +22.112 |
politically | +21.172 |
� | +20.585 |
Neg logit contributions | |
coins | -17.676 |
detects | -16.684 |
mitter | -15.710 |
img | -15.616 |
rox | -15.392 |
Token | Democrats |
Token ID | 4956 |
Feature activation | +2.67e+01 |
Pos logit contributions | |
bipartisan | +21.324 |
political | +20.078 |
� | +19.530 |
politically | +19.340 |
� | +18.722 |
Neg logit contributions | |
coins | -13.716 |
detects | -12.152 |
img | -11.898 |
mitter | -11.860 |
rox | -11.639 |
Token | � |
Token ID | 447 |
Feature activation | +5.43e+00 |
Pos logit contributions | |
� | +29.950 |
� | +28.126 |
bipartisan | +28.034 |
political | +27.261 |
politically | +26.912 |
Neg logit contributions | |
coins | -16.389 |
detects | -15.031 |
img | -14.426 |
iton | -13.952 |
rox | -13.872 |
Token | � |
Token ID | 247 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
� | +5.352 |
bipartisan | +5.159 |
political | +4.791 |
� | +4.725 |
politically | +4.658 |
Neg logit contributions | |
coins | -6.297 |
detects | -6.108 |
iton | -5.790 |
contains | -5.769 |
wine | -5.635 |
Token | fire |
Token ID | 2046 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
� | +18.753 |
bipartisan | +18.261 |
political | +17.479 |
� | +17.468 |
politically | +17.161 |
Neg logit contributions | |
coins | -7.842 |
detects | -7.598 |
rox | -6.924 |
contains | -6.902 |
img | -6.702 |
Token | : |
Token ID | 25 |
Feature activation | +3.48e+01 |
Pos logit contributions | |
� | +25.468 |
� | +24.118 |
bipartisan | +23.801 |
political | +22.950 |
politically | +22.928 |
Neg logit contributions | |
coins | -11.919 |
detects | -11.628 |
img | -10.185 |
mitter | -10.108 |
iton | -10.108 |
Token |
|
Token ID | 198 |
Feature activation | +4.33e+01 |
Pos logit contributions | |
� | +35.474 |
� | +34.568 |
bipartisan | +33.202 |
political | +32.718 |
politically | +31.743 |
Neg logit contributions | |
coins | -16.611 |
detects | -15.561 |
mitter | -15.024 |
iton | -14.439 |
rox | -14.097 |
Token |
|
Token ID | 198 |
Feature activation | +2.63e+01 |
Pos logit contributions | |
� | +27.168 |
� | +24.373 |
| +22.577 |
bipartisan | +20.203 |
political | +19.349 |
Neg logit contributions | |
eatures | -29.835 |
detects | -29.141 |
yip | -27.793 |
coins | -27.047 |
senal | -26.938 |
Token | Even |
Token ID | 6104 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
� | +28.726 |
� | +24.972 |
bipartisan | +24.227 |
political | +23.221 |
| +22.274 |
Neg logit contributions | |
detects | -18.134 |
coins | -16.335 |
iton | -15.370 |
contains | -15.298 |
mitter | -15.133 |
Token | Democrats |
Token ID | 4956 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
bipartisan | +15.310 |
� | +14.827 |
political | +14.805 |
politically | +14.467 |
� | +13.911 |
Neg logit contributions | |
coins | -9.257 |
detects | -8.180 |
mitter | -8.112 |
iton | -7.993 |
rox | -7.819 |
Token | who |
Token ID | 508 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
� | +22.133 |
bipartisan | +20.987 |
� | +20.781 |
political | +20.678 |
politically | +20.363 |
Neg logit contributions | |
coins | -12.886 |
detects | -11.517 |
iton | -11.457 |
img | -11.132 |
rox | -10.822 |
Token | are |
Token ID | 389 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
� | +22.402 |
bipartisan | +21.363 |
� | +21.221 |
political | +21.127 |
politically | +21.068 |
Neg logit contributions | |
coins | -14.372 |
iton | -12.155 |
rox | -12.146 |
properties | -12.103 |
detects | -11.953 |
Token | Republicans |
Token ID | 4734 |
Feature activation | +2.47e+01 |
Pos logit contributions | |
bipartisan | +31.183 |
political | +30.934 |
politically | +29.842 |
� | +28.367 |
ideological | +27.637 |
Neg logit contributions | |
coins | -21.141 |
detects | -19.746 |
wine | -18.851 |
rox | -18.265 |
img | -17.980 |
Token | � |
Token ID | 447 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
� | +26.153 |
political | +25.071 |
bipartisan | +24.457 |
politically | +24.127 |
� | +23.461 |
Neg logit contributions | |
coins | -17.753 |
detects | -16.762 |
wine | -15.825 |
rox | -15.653 |
mitter | -15.536 |
Token | � |
Token ID | 247 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
� | +10.529 |
bipartisan | +10.047 |
political | +9.429 |
� | +9.311 |
politically | +9.164 |
Neg logit contributions | |
coins | -10.953 |
detects | -10.610 |
contains | -10.111 |
iton | -10.082 |
rox | -9.911 |
Token | months |
Token ID | 1933 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
� | +23.372 |
bipartisan | +22.941 |
political | +22.553 |
politically | +21.857 |
� | +21.121 |
Neg logit contributions | |
coins | -10.585 |
detects | -10.398 |
rox | -9.329 |
contains | -9.226 |
img | -8.876 |
Token | - |
Token ID | 12 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
� | +24.924 |
bipartisan | +24.001 |
political | +23.655 |
politically | +23.139 |
� | +22.922 |
Neg logit contributions | |
coins | -14.669 |
detects | -13.707 |
rox | -12.708 |
img | -12.382 |
itely | -12.048 |
Token | long |
Token ID | 6511 |
Feature activation | +4.31e+01 |
Pos logit contributions | |
� | +16.481 |
bipartisan | +16.377 |
politically | +15.693 |
political | +15.634 |
� | +14.895 |
Neg logit contributions | |
detects | -14.060 |
coins | -13.844 |
contains | -12.485 |
assium | -12.342 |
behaves | -12.197 |
Token | struggle |
Token ID | 6531 |
Feature activation | +2.42e+01 |
Pos logit contributions | |
political | +35.313 |
bipartisan | +35.106 |
politically | +32.511 |
ideological | +32.002 |
� | +31.932 |
Neg logit contributions | |
coins | -24.218 |
detects | -22.337 |
rox | -21.225 |
wine | -20.695 |
mitter | -20.591 |
Token | to |
Token ID | 284 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
� | +26.732 |
bipartisan | +25.478 |
politically | +25.147 |
political | +24.691 |
� | +24.409 |
Neg logit contributions | |
coins | -15.726 |
detects | -15.331 |
rox | -14.410 |
wine | -14.265 |
img | -14.075 |
Token | reach |
Token ID | 3151 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
bipartisan | +18.940 |
politically | +18.831 |
� | +18.386 |
political | +18.130 |
� | +17.274 |
Neg logit contributions | |
coins | -16.537 |
wine | -15.198 |
detects | -14.780 |
assium | -14.406 |
rox | -14.395 |
Token | a |
Token ID | 257 |
Feature activation | +3.33e+01 |
Pos logit contributions | |
bipartisan | +21.957 |
political | +20.216 |
politically | +19.715 |
� | +19.323 |
ideological | +18.347 |
Neg logit contributions | |
coins | -16.636 |
detects | -15.086 |
wine | -14.995 |
rox | -14.888 |
img | -14.853 |
Token | budget |
Token ID | 4466 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
bipartisan | +31.904 |
political | +29.651 |
politically | +28.997 |
� | +27.194 |
| +26.154 |
Neg logit contributions | |
coins | -23.840 |
iton | -20.874 |
rox | -20.541 |
wine | -20.505 |
img | -20.161 |
Token | countries |
Token ID | 2678 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
� | +10.128 |
bipartisan | +9.921 |
political | +9.857 |
politically | +9.480 |
� | +9.228 |
Neg logit contributions | |
coins | -8.695 |
iton | -8.144 |
rox | -7.993 |
detects | -7.922 |
img | -7.863 |
Token | includes |
Token ID | 3407 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
� | +16.512 |
bipartisan | +15.803 |
� | +15.517 |
political | +15.228 |
politically | +15.219 |
Neg logit contributions | |
coins | -6.325 |
rox | -5.291 |
iton | -5.272 |
img | -5.155 |
detects | -5.099 |
Token | the |
Token ID | 262 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
bipartisan | +25.468 |
� | +25.341 |
political | +25.138 |
� | +24.015 |
politically | +23.860 |
Neg logit contributions | |
coins | -15.146 |
img | -14.160 |
detects | -13.626 |
rox | -13.325 |
iton | -13.123 |
Token | following |
Token ID | 1708 |
Feature activation | +2.70e+01 |
Pos logit contributions | |
political | +23.083 |
bipartisan | +22.920 |
� | +22.445 |
politically | +21.758 |
geopolitical | +20.920 |
Neg logit contributions | |
coins | -17.466 |
detects | -16.299 |
img | -15.894 |
wine | -15.436 |
iton | -15.108 |
Token | : |
Token ID | 25 |
Feature activation | +3.45e+01 |
Pos logit contributions | |
� | +29.020 |
political | +28.090 |
bipartisan | +27.728 |
� | +27.275 |
politically | +26.606 |
Neg logit contributions | |
coins | -15.664 |
img | -14.892 |
detects | -13.988 |
rox | -13.748 |
assium | -13.714 |
Token |
|
Token ID | 198 |
Feature activation | +4.31e+01 |
Pos logit contributions | |
� | +36.260 |
� | +33.890 |
political | +33.517 |
bipartisan | +33.256 |
politically | +31.604 |
Neg logit contributions | |
coins | -16.547 |
detects | -15.504 |
img | -15.103 |
rox | -14.859 |
iton | -14.708 |
Token |
|
Token ID | 198 |
Feature activation | +2.51e+01 |
Pos logit contributions | |
� | +27.487 |
� | +24.893 |
| +22.733 |
bipartisan | +20.027 |
political | +19.619 |
Neg logit contributions | |
detects | -28.536 |
eatures | -28.470 |
yip | -27.234 |
senal | -26.936 |
coins | -26.580 |
Token | In |
Token ID | 818 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
� | +29.477 |
� | +25.755 |
bipartisan | +25.325 |
political | +24.907 |
| +23.546 |
Neg logit contributions | |
detects | -14.960 |
coins | -13.507 |
contains | -13.067 |
iton | -12.756 |
behaves | -12.743 |
Token | the |
Token ID | 262 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
� | +13.081 |
bipartisan | +13.005 |
political | +12.752 |
politically | +12.335 |
� | +12.202 |
Neg logit contributions | |
coins | -8.590 |
detects | -8.447 |
contains | -7.796 |
wine | -7.781 |
img | -7.684 |
Token | framework |
Token ID | 9355 |
Feature activation | +2.46e+00 |
Pos logit contributions | |
political | +21.721 |
bipartisan | +21.054 |
� | +20.972 |
politically | +20.387 |
geopolitical | +19.760 |
Neg logit contributions | |
coins | -16.730 |
detects | -15.912 |
ames | -15.176 |
iton | -15.105 |
img | -15.061 |
Token | of |
Token ID | 286 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
bipartisan | +3.976 |
� | +3.846 |
politically | +3.771 |
political | +3.758 |
geopolitical | +3.625 |
Neg logit contributions | |
coins | -1.346 |
detects | -1.230 |
contains | -1.203 |
iton | -1.153 |
img | -1.067 |
Token | different |
Token ID | 1180 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
� | +12.357 |
bipartisan | +12.234 |
political | +11.980 |
politically | +11.674 |
� | +11.637 |
Neg logit contributions | |
coins | -6.979 |
detects | -6.479 |
iton | -6.175 |
img | -6.147 |
rox | -6.077 |
Token | policies |
Token ID | 4788 |
Feature activation | +8.74e+00 |
Pos logit contributions | |
political | +17.362 |
bipartisan | +17.197 |
� | +16.936 |
politically | +16.295 |
� | +16.036 |
Neg logit contributions | |
coins | -12.801 |
detects | -12.028 |
iton | -11.819 |
img | -11.737 |
mitter | -11.548 |
Token | . |
Token ID | 13 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
� | +11.863 |
bipartisan | +11.344 |
politically | +11.170 |
� | +11.044 |
political | +10.976 |
Neg logit contributions | |
coins | -6.765 |
detects | -6.311 |
img | -5.980 |
rox | -5.885 |
contains | -5.817 |
Token | � |
Token ID | 447 |
Feature activation | +4.44e+00 |
Pos logit contributions | |
� | +21.592 |
� | +19.842 |
bipartisan | +19.049 |
political | +18.308 |
| +17.921 |
Neg logit contributions | |
coins | -11.617 |
detects | -11.507 |
iton | -10.852 |
rox | -10.542 |
mitter | -10.375 |
Token | � |
Token ID | 251 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
� | +5.241 |
bipartisan | +5.208 |
political | +4.895 |
politically | +4.848 |
� | +4.790 |
Neg logit contributions | |
coins | -4.352 |
detects | -4.121 |
iton | -3.949 |
contains | -3.933 |
img | -3.837 |
Token |
|
Token ID | 198 |
Feature activation | +4.30e+01 |
Pos logit contributions | |
� | +21.983 |
bipartisan | +21.228 |
� | +20.331 |
political | +20.270 |
politically | +20.045 |
Neg logit contributions | |
coins | -13.634 |
detects | -13.018 |
iton | -12.229 |
contains | -12.100 |
img | -11.920 |
Token |
|
Token ID | 198 |
Feature activation | +1.87e+01 |
Pos logit contributions | |
� | +26.569 |
� | +24.032 |
| +22.581 |
bipartisan | +19.618 |
political | +18.839 |
Neg logit contributions | |
eatures | -29.798 |
detects | -28.887 |
senal | -27.269 |
yip | -27.254 |
coins | -26.925 |
Token | But |
Token ID | 1537 |
Feature activation | +9.89e-01 |
Pos logit contributions | |
� | +21.310 |
bipartisan | +18.310 |
� | +18.226 |
political | +17.336 |
| +16.785 |
Neg logit contributions | |
detects | -15.240 |
coins | -13.715 |
iton | -13.638 |
contains | -13.346 |
assium | -12.941 |
Token | in |
Token ID | 287 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
bipartisan | +1.273 |
� | +1.263 |
political | +1.218 |
politically | +1.202 |
� | +1.168 |
Neg logit contributions | |
coins | -0.900 |
detects | -0.840 |
img | -0.807 |
iton | -0.805 |
contains | -0.791 |
Token | 2014 |
Token ID | 1946 |
Feature activation | +6.94e+00 |
Pos logit contributions | |
bipartisan | +17.388 |
political | +17.082 |
� | +16.832 |
politically | +16.367 |
� | +15.754 |
Neg logit contributions | |
coins | -13.758 |
detects | -12.687 |
rox | -12.660 |
img | -12.612 |
iton | -12.471 |
Token | , |
Token ID | 11 |
Feature activation | +3.50e-01 |
Pos logit contributions | |
bipartisan | +9.960 |
� | +9.948 |
political | +9.545 |
politically | +9.463 |
� | +9.275 |
Neg logit contributions | |
coins | -4.869 |
detects | -4.545 |
contains | -4.279 |
iton | -4.258 |
img | -4.192 |
Token | years |
Token ID | 812 |
Feature activation | +8.08e+00 |
Pos logit contributions | |
political | +16.418 |
bipartisan | +16.274 |
politically | +15.961 |
� | +15.170 |
geopolitical | +15.113 |
Neg logit contributions | |
coins | -14.525 |
iton | -13.220 |
rox | -13.190 |
img | -13.146 |
wine | -12.942 |
Token | of |
Token ID | 286 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
� | +11.454 |
bipartisan | +11.267 |
political | +10.917 |
politically | +10.879 |
� | +10.693 |
Neg logit contributions | |
coins | -5.848 |
detects | -5.292 |
iton | -4.959 |
img | -4.898 |
rox | -4.886 |
Token | high |
Token ID | 1029 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
political | +19.646 |
bipartisan | +19.609 |
politically | +18.988 |
� | +18.201 |
geopolitical | +18.097 |
Neg logit contributions | |
coins | -15.043 |
img | -13.544 |
detects | -13.293 |
iton | -13.265 |
rox | -13.153 |
Token | prices |
Token ID | 4536 |
Feature activation | +9.01e+00 |
Pos logit contributions | |
bipartisan | +11.297 |
political | +11.253 |
� | +10.899 |
politically | +10.692 |
geopolitical | +10.474 |
Neg logit contributions | |
coins | -9.736 |
img | -8.843 |
detects | -8.764 |
iton | -8.759 |
rox | -8.719 |
Token | . |
Token ID | 13 |
Feature activation | +1.89e+01 |
Pos logit contributions | |
� | +11.717 |
bipartisan | +11.269 |
political | +10.940 |
politically | +10.921 |
� | +10.822 |
Neg logit contributions | |
coins | -7.220 |
detects | -6.729 |
iton | -6.376 |
img | -6.333 |
rox | -6.247 |
Token |
|
Token ID | 198 |
Feature activation | +4.27e+01 |
Pos logit contributions | |
� | +21.546 |
� | +19.499 |
bipartisan | +18.665 |
political | +18.362 |
politically | +17.692 |
Neg logit contributions | |
coins | -14.831 |
detects | -14.701 |
rox | -13.848 |
mitter | -13.693 |
iton | -13.497 |
Token |
|
Token ID | 198 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
� | +26.177 |
� | +24.024 |
| +21.505 |
bipartisan | +19.306 |
political | +18.689 |
Neg logit contributions | |
eatures | -29.974 |
detects | -29.691 |
yip | -27.969 |
senal | -27.693 |
coins | -27.468 |
Token | However |
Token ID | 4864 |
Feature activation | +6.22e+00 |
Pos logit contributions | |
� | +18.185 |
bipartisan | +15.692 |
� | +15.583 |
political | +15.159 |
politically | +14.543 |
Neg logit contributions | |
detects | -13.071 |
coins | -12.241 |
contains | -11.758 |
iton | -11.544 |
behaves | -11.097 |
Token | , |
Token ID | 11 |
Feature activation | -7.19e-01 |
Pos logit contributions | |
bipartisan | +9.589 |
� | +9.460 |
political | +9.096 |
politically | +9.070 |
� | +8.831 |
Neg logit contributions | |
coins | -3.902 |
detects | -3.616 |
contains | -3.471 |
iton | -3.362 |
img | -3.249 |
Token | the |
Token ID | 262 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
coins | +0.663 |
detects | +0.623 |
contains | +0.592 |
iton | +0.587 |
img | +0.582 |
Neg logit contributions | |
bipartisan | -0.914 |
� | -0.908 |
political | -0.879 |
politically | -0.871 |
� | -0.838 |
Token | new |
Token ID | 649 |
Feature activation | +7.25e+00 |
Pos logit contributions | |
bipartisan | +13.085 |
political | +12.925 |
politically | +12.542 |
� | +12.408 |
geopolitical | +11.918 |
Neg logit contributions | |
coins | -12.522 |
detects | -12.002 |
img | -11.328 |
iton | -11.217 |
rox | -11.068 |
Token | economic |
Token ID | 3034 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
political | +25.873 |
� | +25.285 |
bipartisan | +24.900 |
politically | +24.709 |
geopolitical | +24.345 |
Neg logit contributions | |
coins | -16.462 |
rox | -14.732 |
detects | -14.497 |
img | -14.496 |
wine | -14.261 |
Token | and |
Token ID | 290 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
political | +16.469 |
bipartisan | +16.102 |
� | +15.751 |
politically | +15.646 |
geopolitical | +15.486 |
Neg logit contributions | |
coins | -13.081 |
img | -12.038 |
detects | -11.961 |
mitter | -11.530 |
wine | -11.308 |
Token | political |
Token ID | 1964 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
political | +24.128 |
politically | +22.407 |
geopolitical | +22.266 |
bipartisan | +21.873 |
ideological | +21.275 |
Neg logit contributions | |
coins | -19.823 |
detects | -17.605 |
rox | -17.280 |
img | -17.233 |
iton | -17.103 |
Token | agenda |
Token ID | 8666 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
political | +21.399 |
bipartisan | +20.189 |
politically | +19.910 |
geopolitical | +19.846 |
� | +19.829 |
Neg logit contributions | |
coins | -17.469 |
img | -16.010 |
detects | -15.951 |
wine | -15.503 |
mitter | -15.397 |
Token | . |
Token ID | 13 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
� | +26.901 |
politically | +24.669 |
� | +24.520 |
political | +24.353 |
bipartisan | +24.273 |
Neg logit contributions | |
coins | -16.739 |
detects | -15.560 |
rox | -14.813 |
img | -14.729 |
iton | -14.550 |
Token |
|
Token ID | 198 |
Feature activation | +4.27e+01 |
Pos logit contributions | |
� | +23.386 |
� | +21.420 |
bipartisan | +20.076 |
political | +19.612 |
politically | +18.886 |
Neg logit contributions | |
coins | -16.890 |
detects | -16.750 |
mitter | -15.739 |
rox | -15.596 |
iton | -15.335 |
Token |
|
Token ID | 198 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
� | +26.035 |
� | +24.127 |
| +21.717 |
bipartisan | +19.356 |
political | +18.587 |
Neg logit contributions | |
eatures | -29.749 |
detects | -29.352 |
yip | -27.806 |
senal | -27.595 |
coins | -27.363 |
Token | The |
Token ID | 464 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
� | +19.729 |
� | +17.183 |
bipartisan | +17.097 |
political | +16.486 |
politically | +15.821 |
Neg logit contributions | |
detects | -13.199 |
coins | -12.433 |
contains | -11.771 |
iton | -11.682 |
assium | -11.235 |
Token | real |
Token ID | 1103 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
bipartisan | +15.945 |
political | +15.660 |
� | +15.259 |
politically | +15.168 |
geopolitical | +14.613 |
Neg logit contributions | |
coins | -12.639 |
detects | -12.220 |
iton | -11.252 |
contains | -11.146 |
img | -11.113 |
Token | problem |
Token ID | 1917 |
Feature activation | +6.56e+00 |
Pos logit contributions | |
political | +18.691 |
bipartisan | +18.608 |
� | +18.307 |
geopolitical | +17.544 |
politically | +17.489 |
Neg logit contributions | |
coins | -13.544 |
detects | -13.008 |
rox | -12.250 |
contains | -11.813 |
img | -11.633 |
Token | for |
Token ID | 329 |
Feature activation | +2.26e+00 |
Pos logit contributions | |
� | +10.249 |
bipartisan | +10.021 |
political | +9.712 |
politically | +9.686 |
� | +9.606 |
Neg logit contributions | |
coins | -3.865 |
detects | -3.456 |
iton | -3.312 |
rox | -3.196 |
img | -3.112 |
Token | to |
Token ID | 284 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
coins | +2.756 |
detects | +2.612 |
contains | +2.487 |
iton | +2.435 |
img | +2.407 |
Neg logit contributions | |
bipartisan | -4.701 |
� | -4.677 |
political | -4.472 |
politically | -4.442 |
� | -4.333 |
Token | recruit |
Token ID | 10960 |
Feature activation | -5.17e+00 |
Pos logit contributions | |
� | +16.253 |
� | +14.982 |
bipartisan | +14.170 |
politically | +14.170 |
political | +13.997 |
Neg logit contributions | |
coins | -13.411 |
detects | -12.424 |
rox | -11.796 |
assium | -11.763 |
mitter | -11.721 |
Token | . |
Token ID | 13 |
Feature activation | +6.30e+00 |
Pos logit contributions | |
coins | +5.550 |
detects | +5.303 |
contains | +5.111 |
iton | +5.049 |
img | +5.002 |
Neg logit contributions | |
bipartisan | -5.720 |
� | -5.672 |
political | -5.371 |
politically | -5.341 |
� | -5.153 |
Token | � |
Token ID | 447 |
Feature activation | +3.49e+00 |
Pos logit contributions | |
� | +8.274 |
� | +7.619 |
bipartisan | +7.494 |
political | +7.131 |
politically | +6.993 |
Neg logit contributions | |
coins | -5.549 |
detects | -5.453 |
iton | -5.024 |
rox | -4.923 |
mitter | -4.901 |
Token | � |
Token ID | 251 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
bipartisan | +4.344 |
� | +4.294 |
political | +4.099 |
politically | +4.087 |
� | +3.947 |
Neg logit contributions | |
coins | -3.189 |
detects | -3.029 |
contains | -2.924 |
iton | -2.873 |
img | -2.829 |
Token |
|
Token ID | 198 |
Feature activation | +4.26e+01 |
Pos logit contributions | |
� | +12.231 |
bipartisan | +11.734 |
� | +11.187 |
political | +11.133 |
politically | +11.020 |
Neg logit contributions | |
coins | -10.580 |
detects | -10.230 |
contains | -9.611 |
iton | -9.547 |
img | -9.477 |
Token |
|
Token ID | 198 |
Feature activation | +1.81e+01 |
Pos logit contributions | |
� | +26.002 |
� | +23.508 |
| +21.887 |
bipartisan | +18.540 |
political | +18.067 |
Neg logit contributions | |
eatures | -30.631 |
detects | -29.322 |
senal | -28.331 |
yip | -27.710 |
coins | -27.459 |
Token | EM |
Token ID | 3620 |
Feature activation | +3.99e+00 |
Pos logit contributions | |
� | +22.241 |
� | +19.488 |
bipartisan | +18.678 |
political | +18.030 |
| +17.633 |
Neg logit contributions | |
detects | -13.410 |
coins | -12.492 |
contains | -11.740 |
iton | -11.483 |
behaves | -11.139 |
Token | M |
Token ID | 44 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
� | +5.088 |
bipartisan | +4.920 |
political | +4.758 |
� | +4.666 |
politically | +4.652 |
Neg logit contributions | |
coins | -3.570 |
detects | -3.294 |
iton | -3.114 |
contains | -3.058 |
rox | -3.054 |
Token | ITT |
Token ID | 22470 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
bipartisan | +1.866 |
� | +1.855 |
political | +1.770 |
politically | +1.744 |
� | +1.730 |
Neg logit contributions | |
coins | -1.359 |
detects | -1.268 |
iton | -1.233 |
contains | -1.212 |
img | -1.184 |
Token | SM |
Token ID | 9447 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
coins | +1.485 |
detects | +1.394 |
iton | +1.334 |
contains | +1.325 |
rox | +1.301 |
Neg logit contributions | |
� | -1.832 |
bipartisan | -1.826 |
political | -1.722 |
politically | -1.698 |
� | -1.694 |
Token | cv |
Token ID | 33967 |
Feature activation | -6.25e+01 |
Pos logit contributions | |
coins | +38.294 |
img | +37.403 |
ax | +36.411 |
cube | +36.024 |
cs | +35.295 |
Neg logit contributions | |
� | -35.329 |
� | -26.608 |
ccording | -26.360 |
tremend | -25.889 |
millenn | -25.804 |
Token | 2 |
Token ID | 17 |
Feature activation | -5.96e+01 |
Pos logit contributions | |
coins | +37.602 |
2 | +37.595 |
img | +36.983 |
X | +36.330 |
x | +35.946 |
Neg logit contributions | |
� | -49.652 |
tremend | -41.223 |
� | -39.670 |
behavi | -38.904 |
millenn | -38.476 |
Token | . |
Token ID | 13 |
Feature activation | -3.69e+01 |
Pos logit contributions | |
coins | +37.165 |
img | +36.261 |
contains | +35.799 |
X | +35.260 |
forge | +35.248 |
Neg logit contributions | |
� | -46.667 |
tremend | -40.235 |
millenn | -39.118 |
� | -37.788 |
ccording | -37.412 |
Token | M |
Token ID | 44 |
Feature activation | -5.00e+01 |
Pos logit contributions | |
coins | +31.131 |
img | +30.288 |
X | +30.142 |
contains | +29.644 |
map | +28.401 |
Neg logit contributions | |
� | -29.120 |
tremend | -26.301 |
behavi | -24.671 |
bipartisan | -24.078 |
ccording | -23.946 |
Token | OR |
Token ID | 1581 |
Feature activation | -4.79e+01 |
Pos logit contributions | |
coins | +31.589 |
X | +31.258 |
img | +31.049 |
rox | +30.700 |
contains | +30.580 |
Neg logit contributions | |
� | -39.090 |
tremend | -33.494 |
behavi | -32.171 |
ccording | -31.313 |
millenn | -29.747 |
Token | PH |
Token ID | 11909 |
Feature activation | -6.55e+01 |
Pos logit contributions | |
coins | +33.661 |
X | +32.258 |
contains | +31.153 |
hex | +30.977 |
img | +30.850 |
Neg logit contributions | |
� | -36.304 |
tremend | -32.663 |
millenn | -29.269 |
behavi | -29.102 |
ccording | -28.968 |
Token | _ |
Token ID | 62 |
Feature activation | -4.53e+01 |
Pos logit contributions | |
_ | +41.955 |
X | +38.559 |
coins | +37.956 |
+ | +37.170 |
img | +37.062 |
Neg logit contributions | |
� | -44.346 |
tremend | -39.366 |
millenn | -37.678 |
ccording | -36.220 |
� | -35.124 |
Token | RECT |
Token ID | 23988 |
Feature activation | -4.83e+01 |
Pos logit contributions | |
X | +34.496 |
RECT | +33.521 |
coins | +33.282 |
img | +32.616 |
contains | +32.300 |
Neg logit contributions | |
� | -32.892 |
tremend | -28.512 |
behavi | -27.283 |
millenn | -26.338 |
bipartisan | -25.824 |
Token | , |
Token ID | 11 |
Feature activation | -3.78e+01 |
Pos logit contributions | |
contains | +34.579 |
coins | +34.282 |
img | +33.873 |
you | +33.583 |
X | +33.073 |
Neg logit contributions | |
� | -37.975 |
tremend | -33.464 |
millenn | -31.661 |
ccording | -31.492 |
� | -29.837 |
Token | ( |
Token ID | 357 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
contains | +32.627 |
coins | +32.080 |
img | +30.696 |
iton | +30.545 |
detects | +30.485 |
Neg logit contributions | |
� | -28.767 |
ccording | -24.458 |
tremend | -24.124 |
behavi | -23.065 |
millenn | -22.786 |
Token | 21 |
Token ID | 2481 |
Feature activation | -4.46e+01 |
Pos logit contributions | |
coins | +12.738 |
detects | +11.300 |
iton | +11.267 |
contains | +11.250 |
img | +11.055 |
Neg logit contributions | |
bipartisan | -18.269 |
� | -17.334 |
� | -17.089 |
politically | -17.023 |
political | -16.785 |
Token | 2 |
Token ID | 17 |
Feature activation | -3.87e+01 |
Pos logit contributions | |
coins | +24.617 |
contains | +23.422 |
iton | +23.390 |
img | +23.384 |
angles | +22.975 |
Neg logit contributions | |
bipartisan | -19.246 |
politically | -18.504 |
� | -18.268 |
political | -18.236 |
� | -17.853 |
Token | = |
Token ID | 796 |
Feature activation | -4.07e+01 |
Pos logit contributions | |
coins | +34.042 |
img | +33.263 |
contains | +33.203 |
= | +32.381 |
iton | +31.704 |
Neg logit contributions | |
� | -33.697 |
tremend | -27.264 |
behavi | -26.583 |
millenn | -26.557 |
� | -26.343 |
Token | New |
Token ID | 968 |
Feature activation | -6.33e+01 |
Pos logit contributions | |
contains | +31.517 |
coins | +30.222 |
img | +29.575 |
Load | +29.274 |
Mk | +29.219 |
Neg logit contributions | |
� | -31.467 |
tremend | -26.983 |
ccording | -26.810 |
behavi | -26.534 |
millenn | -24.783 |
Token | - |
Token ID | 12 |
Feature activation | -5.47e+01 |
Pos logit contributions | |
img | +35.304 |
+ | +35.048 |
- | +34.557 |
coins | +34.464 |
contains | +34.381 |
Neg logit contributions | |
� | -50.368 |
tremend | -42.541 |
ccording | -40.314 |
� | -40.122 |
millenn | -39.635 |
Token | Object |
Token ID | 10267 |
Feature activation | -4.77e+01 |
Pos logit contributions | |
X | +35.382 |
coins | +34.446 |
img | +34.172 |
edit | +33.334 |
cube | +32.915 |
Neg logit contributions | |
� | -45.220 |
tremend | -37.072 |
exting | -35.480 |
millenn | -34.771 |
ccording | -34.006 |
Token | System |
Token ID | 4482 |
Feature activation | -6.55e+01 |
Pos logit contributions | |
contains | +36.831 |
img | +35.676 |
Load | +34.062 |
X | +34.037 |
detects | +33.936 |
Neg logit contributions | |
� | -31.338 |
ccording | -25.140 |
tremend | -24.895 |
millenn | -23.563 |
behavi | -23.130 |
Token | . |
Token ID | 13 |
Feature activation | -4.94e+01 |
Pos logit contributions | |
img | +36.525 |
coins | +36.186 |
forge | +35.349 |
contains | +35.316 |
you | +35.312 |
Neg logit contributions | |
� | -51.314 |
tremend | -43.477 |
millenn | -42.010 |
� | -41.885 |
ccording | -41.247 |
Token | Draw |
Token ID | 25302 |
Feature activation | -5.80e+01 |
Pos logit contributions | |
img | +35.687 |
coins | +35.468 |
X | +34.743 |
wine | +33.988 |
forge | +33.518 |
Neg logit contributions | |
� | -38.595 |
tremend | -33.085 |
ccording | -29.507 |
millenn | -29.277 |
� | -28.780 |
Token | ing |
Token ID | 278 |
Feature activation | -5.66e+01 |
Pos logit contributions | |
img | +37.127 |
ing | +36.028 |
iton | +35.151 |
coins | +34.130 |
ings | +33.416 |
Neg logit contributions | |
� | -48.959 |
tremend | -40.519 |
� | -39.040 |
ccording | -38.139 |
millenn | -37.866 |
Token | . |
Token ID | 13 |
Feature activation | -3.59e+01 |
Pos logit contributions | |
img | +35.509 |
coins | +35.088 |
forge | +34.456 |
contains | +34.407 |
/ | +33.735 |
Neg logit contributions | |
� | -47.982 |
tremend | -39.957 |
millenn | -38.569 |
� | -38.265 |
ccording | -38.198 |
Token | Rect |
Token ID | 45474 |
Feature activation | -5.12e+01 |
Pos logit contributions | |
coins | +28.219 |
img | +27.877 |
X | +27.121 |
contains | +26.780 |
cube | +26.434 |
Neg logit contributions | |
� | -29.301 |
bipartisan | -26.077 |
politically | -25.146 |
behavi | -24.651 |
political | -24.200 |
Token | v |
Token ID | 410 |
Feature activation | -4.18e+01 |
Pos logit contributions | |
contains | +25.339 |
coins | +24.785 |
detects | +24.776 |
img | +23.637 |
iton | +23.493 |
Neg logit contributions | |
� | -23.567 |
bipartisan | -21.389 |
� | -20.471 |
ccording | -19.606 |
politically | -19.500 |
Token | ars |
Token ID | 945 |
Feature activation | -4.20e+01 |
Pos logit contributions | |
coins | +34.156 |
ames | +31.969 |
img | +31.722 |
rox | +31.263 |
ax | +31.066 |
Neg logit contributions | |
� | -36.191 |
behavi | -28.753 |
� | -28.540 |
millenn | -28.132 |
ccording | -27.987 |
Token | ( |
Token ID | 7 |
Feature activation | -3.67e+01 |
Pos logit contributions | |
coins | +36.437 |
contains | +35.535 |
img | +35.200 |
rox | +33.959 |
cube | +33.529 |
Neg logit contributions | |
� | -34.310 |
millenn | -27.677 |
tremend | -27.541 |
behavi | -26.908 |
ccording | -26.750 |
Token | ap |
Token ID | 499 |
Feature activation | -4.46e+01 |
Pos logit contributions | |
coins | +34.007 |
img | +33.538 |
ax | +32.997 |
map | +32.083 |
foo | +31.723 |
Neg logit contributions | |
� | -28.730 |
behavi | -22.805 |
bipartisan | -22.024 |
� | -21.772 |
ccording | -21.498 |
Token | . |
Token ID | 13 |
Feature activation | -3.92e+01 |
Pos logit contributions | |
coins | +36.447 |
img | +34.996 |
contains | +34.447 |
forge | +33.513 |
rox | +33.321 |
Neg logit contributions | |
� | -38.538 |
tremend | -32.084 |
millenn | -31.931 |
ccording | -30.989 |
� | -30.715 |
Token | parse |
Token ID | 29572 |
Feature activation | -6.51e+01 |
Pos logit contributions | |
img | +31.200 |
coins | +30.782 |
map | +29.887 |
scan | +29.619 |
init | +28.821 |
Neg logit contributions | |
� | -34.452 |
bipartisan | -28.593 |
behavi | -28.396 |
� | -27.957 |
political | -26.914 |
Token | _ |
Token ID | 62 |
Feature activation | -5.57e+01 |
Pos logit contributions | |
_ | +41.307 |
coins | +37.939 |
img | +37.252 |
X | +36.516 |
x | +36.019 |
Neg logit contributions | |
� | -46.952 |
tremend | -39.816 |
millenn | -38.933 |
� | -38.288 |
ccording | -37.024 |
Token | args |
Token ID | 22046 |
Feature activation | -2.17e+01 |
Pos logit contributions | |
coins | +37.538 |
img | +35.892 |
properties | +35.230 |
foo | +34.836 |
angles | +34.378 |
Neg logit contributions | |
� | -40.831 |
behavi | -31.749 |
� | -31.438 |
tremend | -31.396 |
ccording | -31.266 |
Token | ()) |
Token ID | 28955 |
Feature activation | -2.25e+01 |
Pos logit contributions | |
coins | +18.363 |
contains | +16.797 |
iton | +16.612 |
detects | +16.598 |
rox | +16.343 |
Neg logit contributions | |
bipartisan | -24.340 |
� | -24.004 |
political | -23.101 |
politically | -23.092 |
� | -22.779 |
Token | # |
Token ID | 1303 |
Feature activation | -3.45e+01 |
Pos logit contributions | |
detects | +18.036 |
contains | +17.651 |
coins | +16.753 |
img | +16.521 |
map | +15.833 |
Neg logit contributions | |
bipartisan | -18.840 |
� | -17.885 |
politically | -17.409 |
� | -17.087 |
geopolitical | -16.824 |
Token | initialize |
Token ID | 41216 |
Feature activation | -5.00e+01 |
Pos logit contributions | |
detects | +28.625 |
contains | +28.098 |
coins | +27.084 |
initialize | +25.745 |
iton | +25.348 |
Neg logit contributions | |
bipartisan | -24.346 |
� | -23.194 |
� | -22.814 |
politically | -22.022 |
political | -21.809 |
Token | ) |
Token ID | 8 |
Feature activation | -2.19e+01 |
Pos logit contributions | |
coins | +21.411 |
contains | +20.231 |
img | +19.881 |
detects | +19.594 |
rox | +19.135 |
Neg logit contributions | |
� | -20.196 |
bipartisan | -19.880 |
� | -18.968 |
politically | -18.660 |
political | -18.409 |
Token | $ |
Token ID | 720 |
Feature activation | -2.85e+01 |
Pos logit contributions | |
contains | +17.553 |
coins | +17.363 |
detects | +17.240 |
img | +16.431 |
wine | +15.929 |
Neg logit contributions | |
� | -18.501 |
bipartisan | -18.106 |
politically | -17.024 |
geopolitical | -16.785 |
political | -16.542 |
Token | rect |
Token ID | 2554 |
Feature activation | -2.84e+01 |
Pos logit contributions | |
coins | +28.495 |
img | +28.105 |
wine | +26.535 |
angles | +26.136 |
contains | +26.028 |
Neg logit contributions | |
bipartisan | -19.236 |
� | -17.852 |
� | -17.838 |
politically | -17.464 |
political | -17.405 |
Token | 2 |
Token ID | 17 |
Feature activation | -3.87e+01 |
Pos logit contributions | |
coins | +24.617 |
contains | +23.422 |
iton | +23.390 |
img | +23.384 |
angles | +22.975 |
Neg logit contributions | |
bipartisan | -19.246 |
politically | -18.504 |
� | -18.268 |
political | -18.236 |
� | -17.853 |
Token | = |
Token ID | 796 |
Feature activation | -4.07e+01 |
Pos logit contributions | |
coins | +34.042 |
img | +33.263 |
contains | +33.203 |
= | +32.381 |
iton | +31.704 |
Neg logit contributions | |
� | -33.697 |
tremend | -27.264 |
behavi | -26.583 |
millenn | -26.557 |
� | -26.343 |
Token | New |
Token ID | 968 |
Feature activation | -6.33e+01 |
Pos logit contributions | |
contains | +31.517 |
coins | +30.222 |
img | +29.575 |
Load | +29.274 |
Mk | +29.219 |
Neg logit contributions | |
� | -31.467 |
tremend | -26.983 |
ccording | -26.810 |
behavi | -26.534 |
millenn | -24.783 |
Token | - |
Token ID | 12 |
Feature activation | -5.47e+01 |
Pos logit contributions | |
img | +35.304 |
+ | +35.048 |
- | +34.557 |
coins | +34.464 |
contains | +34.381 |
Neg logit contributions | |
� | -50.368 |
tremend | -42.541 |
ccording | -40.314 |
� | -40.122 |
millenn | -39.635 |
Token | Object |
Token ID | 10267 |
Feature activation | -4.77e+01 |
Pos logit contributions | |
X | +35.382 |
coins | +34.446 |
img | +34.172 |
edit | +33.334 |
cube | +32.915 |
Neg logit contributions | |
� | -45.220 |
tremend | -37.072 |
exting | -35.480 |
millenn | -34.771 |
ccording | -34.006 |
Token | System |
Token ID | 4482 |
Feature activation | -6.55e+01 |
Pos logit contributions | |
contains | +36.831 |
img | +35.676 |
Load | +34.062 |
X | +34.037 |
detects | +33.936 |
Neg logit contributions | |
� | -31.338 |
ccording | -25.140 |
tremend | -24.895 |
millenn | -23.563 |
behavi | -23.130 |
Token | . |
Token ID | 13 |
Feature activation | -4.94e+01 |
Pos logit contributions | |
img | +36.525 |
coins | +36.186 |
forge | +35.349 |
contains | +35.316 |
you | +35.312 |
Neg logit contributions | |
� | -51.314 |
tremend | -43.477 |
millenn | -42.010 |
� | -41.885 |
ccording | -41.247 |
Token | Draw |
Token ID | 25302 |
Feature activation | -5.80e+01 |
Pos logit contributions | |
img | +35.687 |
coins | +35.468 |
X | +34.743 |
wine | +33.988 |
forge | +33.518 |
Neg logit contributions | |
� | -38.595 |
tremend | -33.085 |
ccording | -29.507 |
millenn | -29.277 |
� | -28.780 |
Token | , |
Token ID | 11 |
Feature activation | -4.55e+01 |
Pos logit contributions | |
contains | +29.280 |
coins | +29.249 |
detects | +28.301 |
img | +28.122 |
you | +27.601 |
Neg logit contributions | |
� | -30.765 |
ccording | -25.706 |
� | -23.993 |
tremend | -23.982 |
behavi | -23.804 |
Token | resize |
Token ID | 47558 |
Feature activation | -6.29e+01 |
Pos logit contributions | |
contains | +33.900 |
detects | +33.809 |
coins | +32.531 |
img | +31.797 |
you | +31.695 |
Neg logit contributions | |
� | -32.290 |
ccording | -27.285 |
behavi | -25.922 |
millenn | -25.824 |
� | -24.748 |
Token | it |
Token ID | 340 |
Feature activation | -3.91e+01 |
Pos logit contributions | |
it | +40.141 |
you | +36.658 |
iton | +35.766 |
it | +34.678 |
img | +34.514 |
Neg logit contributions | |
� | -42.837 |
ccording | -36.249 |
� | -34.241 |
tremend | -33.590 |
millenn | -33.111 |
Token | , |
Token ID | 11 |
Feature activation | -4.70e+01 |
Pos logit contributions | |
contains | +30.455 |
coins | +30.420 |
img | +29.202 |
you | +29.026 |
detects | +28.309 |
Neg logit contributions | |
� | -36.008 |
ccording | -30.251 |
tremend | -29.732 |
millenn | -29.210 |
� | -28.464 |
Token | and |
Token ID | 290 |
Feature activation | -3.82e+01 |
Pos logit contributions | |
contains | +31.839 |
coins | +30.923 |
detects | +30.726 |
you | +30.642 |
img | +29.173 |
Neg logit contributions | |
� | -37.307 |
ccording | -31.802 |
� | -29.954 |
millenn | -29.711 |
behavi | -29.575 |
Token | convert |
Token ID | 10385 |
Feature activation | -6.29e+01 |
Pos logit contributions | |
coins | +28.274 |
contains | +28.273 |
detects | +28.229 |
img | +26.447 |
you | +25.843 |
Neg logit contributions | |
� | -32.852 |
bipartisan | -26.983 |
ccording | -26.490 |
� | -25.937 |
behavi | -25.902 |
Token | it |
Token ID | 340 |
Feature activation | -4.84e+01 |
Pos logit contributions | |
it | +40.489 |
you | +37.136 |
iton | +35.901 |
contains | +35.120 |
img | +34.745 |
Neg logit contributions | |
� | -42.473 |
ccording | -35.164 |
� | -33.936 |
tremend | -33.584 |
millenn | -33.583 |
Token | to |
Token ID | 284 |
Feature activation | -2.50e+01 |
Pos logit contributions | |
contains | +36.361 |
coins | +35.075 |
you | +34.870 |
img | +33.437 |
iton | +33.401 |
Neg logit contributions | |
� | -37.914 |
ccording | -31.594 |
millenn | -29.928 |
� | -29.762 |
tremend | -29.429 |
Token | gr |
Token ID | 1036 |
Feature activation | -4.29e+01 |
Pos logit contributions | |
detects | +24.372 |
coins | +24.317 |
contains | +24.057 |
img | +23.207 |
iton | +22.148 |
Neg logit contributions | |
� | -21.327 |
bipartisan | -20.021 |
� | -19.790 |
politically | -18.341 |
ccording | -18.189 |
Token | ays |
Token ID | 592 |
Feature activation | -4.79e+01 |
Pos logit contributions | |
coins | +38.019 |
ames | +37.378 |
img | +36.201 |
angles | +35.814 |
detects | +35.435 |
Neg logit contributions | |
� | -29.111 |
ccording | -23.078 |
behavi | -22.434 |
� | -22.098 |
� | -21.524 |
Token | cale |
Token ID | 38765 |
Feature activation | -4.79e+01 |
Pos logit contributions | |
coins | +35.423 |
img | +34.010 |
rox | +33.903 |
iton | +33.172 |
ames | +33.163 |
Neg logit contributions | |
� | -36.699 |
� | -29.824 |
ccording | -28.642 |
millenn | -27.861 |
� | -27.551 |
Token | # |
Token ID | 1303 |
Feature activation | -3.43e+01 |
Pos logit contributions | |
detects | +22.543 |
coins | +22.462 |
contains | +22.083 |
img | +21.433 |
iton | +20.408 |
Neg logit contributions | |
� | -23.084 |
bipartisan | -22.026 |
� | -21.654 |
politically | -20.482 |
political | -19.933 |
Token | load |
Token ID | 3440 |
Feature activation | -5.69e+01 |
Pos logit contributions | |
contains | +27.116 |
detects | +26.865 |
coins | +26.843 |
img | +25.879 |
Load | +25.448 |
Neg logit contributions | |
� | -28.289 |
bipartisan | -27.383 |
� | -25.934 |
politically | -25.107 |
political | -24.845 |
Token | the |
Token ID | 262 |
Feature activation | -4.84e+01 |
Pos logit contributions | |
you | +35.818 |
contains | +35.479 |
img | +35.101 |
coins | +34.667 |
it | +34.217 |
Neg logit contributions | |
� | -39.993 |
ccording | -34.028 |
tremend | -33.500 |
millenn | -32.192 |
� | -31.704 |
Token | image |
Token ID | 2939 |
Feature activation | -3.51e+01 |
Pos logit contributions | |
img | +32.967 |
contains | +31.678 |
detects | +31.099 |
you | +30.627 |
X | +30.230 |
Neg logit contributions | |
� | -37.550 |
ccording | -32.389 |
� | -30.163 |
� | -29.832 |
� | -28.490 |
Token | , |
Token ID | 11 |
Feature activation | -4.55e+01 |
Pos logit contributions | |
contains | +29.280 |
coins | +29.249 |
detects | +28.301 |
img | +28.122 |
you | +27.601 |
Neg logit contributions | |
� | -30.765 |
ccording | -25.706 |
� | -23.993 |
tremend | -23.982 |
behavi | -23.804 |
Token | resize |
Token ID | 47558 |
Feature activation | -6.29e+01 |
Pos logit contributions | |
contains | +33.900 |
detects | +33.809 |
coins | +32.531 |
img | +31.797 |
you | +31.695 |
Neg logit contributions | |
� | -32.290 |
ccording | -27.285 |
behavi | -25.922 |
millenn | -25.824 |
� | -24.748 |
Token | it |
Token ID | 340 |
Feature activation | -3.91e+01 |
Pos logit contributions | |
it | +40.141 |
you | +36.658 |
iton | +35.766 |
it | +34.678 |
img | +34.514 |
Neg logit contributions | |
� | -42.837 |
ccording | -36.249 |
� | -34.241 |
tremend | -33.590 |
millenn | -33.111 |
Token | , |
Token ID | 11 |
Feature activation | -4.70e+01 |
Pos logit contributions | |
contains | +30.455 |
coins | +30.420 |
img | +29.202 |
you | +29.026 |
detects | +28.309 |
Neg logit contributions | |
� | -36.008 |
ccording | -30.251 |
tremend | -29.732 |
millenn | -29.210 |
� | -28.464 |
Token | and |
Token ID | 290 |
Feature activation | -3.82e+01 |
Pos logit contributions | |
contains | +31.839 |
coins | +30.923 |
detects | +30.726 |
you | +30.642 |
img | +29.173 |
Neg logit contributions | |
� | -37.307 |
ccording | -31.802 |
� | -29.954 |
millenn | -29.711 |
behavi | -29.575 |
Token | convert |
Token ID | 10385 |
Feature activation | -6.29e+01 |
Pos logit contributions | |
coins | +28.274 |
contains | +28.273 |
detects | +28.229 |
img | +26.447 |
you | +25.843 |
Neg logit contributions | |
� | -32.852 |
bipartisan | -26.983 |
ccording | -26.490 |
� | -25.937 |
behavi | -25.902 |
Token | it |
Token ID | 340 |
Feature activation | -4.84e+01 |
Pos logit contributions | |
it | +40.489 |
you | +37.136 |
iton | +35.901 |
contains | +35.120 |
img | +34.745 |
Neg logit contributions | |
� | -42.473 |
ccording | -35.164 |
� | -33.936 |
tremend | -33.584 |
millenn | -33.583 |
Token | SR |
Token ID | 12562 |
Feature activation | -2.33e+01 |
Pos logit contributions | |
coins | +28.123 |
img | +27.835 |
rox | +25.965 |
wine | +25.590 |
contains | +25.477 |
Neg logit contributions | |
bipartisan | -18.708 |
� | -17.787 |
� | -17.269 |
politically | -16.997 |
political | -16.490 |
Token | . |
Token ID | 13 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
coins | +19.931 |
contains | +19.002 |
detects | +18.361 |
img | +18.349 |
rox | +18.047 |
Neg logit contributions | |
bipartisan | -17.896 |
� | -16.252 |
� | -16.129 |
politically | -16.114 |
political | -15.958 |
Token | Width |
Token ID | 30916 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
coins | +23.349 |
img | +22.188 |
contains | +21.905 |
detects | +21.401 |
angles | +21.290 |
Neg logit contributions | |
bipartisan | -19.520 |
politically | -18.063 |
� | -17.955 |
political | -17.807 |
� | -17.747 |
Token | ), |
Token ID | 828 |
Feature activation | -2.03e+01 |
Pos logit contributions | |
coins | +17.101 |
contains | +16.219 |
detects | +16.215 |
img | +15.630 |
rox | +15.362 |
Neg logit contributions | |
bipartisan | -14.518 |
� | -13.641 |
politically | -13.261 |
political | -13.140 |
� | -12.838 |
Token | ($ |
Token ID | 16763 |
Feature activation | -3.76e+01 |
Pos logit contributions | |
coins | +21.628 |
contains | +20.379 |
img | +20.162 |
detects | +20.149 |
wine | +19.669 |
Neg logit contributions | |
bipartisan | -14.669 |
politically | -13.383 |
� | -13.339 |
political | -12.929 |
� | -12.571 |
Token | SR |
Token ID | 12562 |
Feature activation | -6.27e+01 |
Pos logit contributions | |
coins | +31.466 |
img | +31.196 |
rox | +29.101 |
wine | +28.760 |
cube | +28.268 |
Neg logit contributions | |
� | -22.903 |
bipartisan | -21.818 |
politically | -20.096 |
� | -19.837 |
political | -19.170 |
Token | . |
Token ID | 13 |
Feature activation | -2.73e+01 |
Pos logit contributions | |
coins | +36.924 |
img | +36.546 |
contains | +36.341 |
forge | +36.199 |
/ | +35.872 |
Neg logit contributions | |
� | -48.683 |
tremend | -42.043 |
millenn | -41.226 |
� | -39.290 |
ccording | -39.037 |
Token | Height |
Token ID | 23106 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
img | +18.759 |
X | +18.662 |
coins | +18.570 |
contains | +18.060 |
angles | +17.671 |
Neg logit contributions | |
bipartisan | -25.165 |
politically | -23.272 |
� | -22.983 |
political | -22.824 |
geopolitical | -22.474 |
Token | ))) |
Token ID | 22305 |
Feature activation | -1.47e+01 |
Pos logit contributions | |
coins | +9.848 |
detects | +8.987 |
contains | +8.943 |
img | +8.500 |
rox | +8.499 |
Neg logit contributions | |
bipartisan | -15.219 |
� | -14.541 |
politically | -14.178 |
political | -14.071 |
geopolitical | -13.612 |
Token | ) |
Token ID | 1267 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
coins | +13.906 |
detects | +13.526 |
contains | +13.394 |
img | +12.846 |
iton | +12.713 |
Neg logit contributions | |
bipartisan | -15.285 |
� | -15.175 |
politically | -14.216 |
political | -14.113 |
� | -13.555 |
Token | } |
Token ID | 1782 |
Feature activation | -1.78e+01 |
Pos logit contributions | |
coins | +12.564 |
detects | +12.104 |
contains | +11.939 |
img | +11.461 |
iton | +11.459 |
Neg logit contributions | |
bipartisan | -14.867 |
� | -14.742 |
politically | -13.881 |
political | -13.806 |
� | -13.243 |
Token | get |
Token ID | 1136 |
Feature activation | -4.48e+01 |
Pos logit contributions | |
coins | +38.785 |
img | +38.183 |
init | +37.207 |
map | +37.043 |
X | +36.384 |
Neg logit contributions | |
� | -34.176 |
behavi | -27.463 |
tremend | -27.110 |
� | -26.295 |
ccording | -25.838 |
Token | Struct |
Token ID | 44909 |
Feature activation | -4.37e+01 |
Pos logit contributions | |
coins | +35.326 |
img | +35.035 |
contains | +34.871 |
X | +33.888 |
map | +32.053 |
Neg logit contributions | |
� | -32.162 |
tremend | -26.821 |
millenn | -25.773 |
ccording | -24.824 |
conflic | -24.363 |
Token | uring |
Token ID | 870 |
Feature activation | -4.78e+01 |
Pos logit contributions | |
img | +35.019 |
iton | +34.769 |
coins | +34.572 |
ules | +33.807 |
contains | +33.305 |
Neg logit contributions | |
� | -30.280 |
� | -23.362 |
ccording | -23.287 |
conflic | -22.992 |
� | -22.440 |
Token | Element |
Token ID | 20180 |
Feature activation | -5.22e+01 |
Pos logit contributions | |
contains | +35.480 |
X | +34.535 |
img | +34.022 |
coins | +33.692 |
iton | +33.200 |
Neg logit contributions | |
� | -33.197 |
tremend | -28.680 |
ccording | -26.219 |
conflic | -26.103 |
bipartisan | -25.581 |
Token | ( |
Token ID | 7 |
Feature activation | -5.14e+01 |
Pos logit contributions | |
coins | +38.908 |
img | +38.523 |
contains | +38.033 |
X | +37.163 |
cube | +37.139 |
Neg logit contributions | |
� | -38.825 |
tremend | -32.878 |
millenn | -32.121 |
ccording | -30.341 |
� | -30.111 |
Token | cv |
Token ID | 33967 |
Feature activation | -6.25e+01 |
Pos logit contributions | |
coins | +38.294 |
img | +37.403 |
ax | +36.411 |
cube | +36.024 |
cs | +35.295 |
Neg logit contributions | |
� | -35.329 |
� | -26.608 |
ccording | -26.360 |
tremend | -25.889 |
millenn | -25.804 |
Token | 2 |
Token ID | 17 |
Feature activation | -5.96e+01 |
Pos logit contributions | |
coins | +37.602 |
2 | +37.595 |
img | +36.983 |
X | +36.330 |
x | +35.946 |
Neg logit contributions | |
� | -49.652 |
tremend | -41.223 |
� | -39.670 |
behavi | -38.904 |
millenn | -38.476 |
Token | . |
Token ID | 13 |
Feature activation | -3.69e+01 |
Pos logit contributions | |
coins | +37.165 |
img | +36.261 |
contains | +35.799 |
X | +35.260 |
forge | +35.248 |
Neg logit contributions | |
� | -46.667 |
tremend | -40.235 |
millenn | -39.118 |
� | -37.788 |
ccording | -37.412 |
Token | M |
Token ID | 44 |
Feature activation | -5.00e+01 |
Pos logit contributions | |
coins | +31.131 |
img | +30.288 |
X | +30.142 |
contains | +29.644 |
map | +28.401 |
Neg logit contributions | |
� | -29.120 |
tremend | -26.301 |
behavi | -24.671 |
bipartisan | -24.078 |
ccording | -23.946 |
Token | OR |
Token ID | 1581 |
Feature activation | -4.79e+01 |
Pos logit contributions | |
coins | +31.589 |
X | +31.258 |
img | +31.049 |
rox | +30.700 |
contains | +30.580 |
Neg logit contributions | |
� | -39.090 |
tremend | -33.494 |
behavi | -32.171 |
ccording | -31.313 |
millenn | -29.747 |
Token | PH |
Token ID | 11909 |
Feature activation | -6.55e+01 |
Pos logit contributions | |
coins | +33.661 |
X | +32.258 |
contains | +31.153 |
hex | +30.977 |
img | +30.850 |
Neg logit contributions | |
� | -36.304 |
tremend | -32.663 |
millenn | -29.269 |
behavi | -29.102 |
ccording | -28.968 |
Token | Ex |
Token ID | 3109 |
Feature activation | -3.37e+01 |
Pos logit contributions | |
coins | +25.971 |
contains | +25.494 |
img | +24.253 |
X | +24.160 |
detects | +24.034 |
Neg logit contributions | |
� | -25.941 |
bipartisan | -24.082 |
politically | -23.151 |
political | -22.401 |
tremend | -22.057 |
Token | ( |
Token ID | 357 |
Feature activation | -3.28e+01 |
Pos logit contributions | |
coins | +28.776 |
contains | +27.948 |
img | +27.269 |
rox | +26.642 |
iton | +26.619 |
Neg logit contributions | |
� | -31.910 |
tremend | -26.543 |
ccording | -26.507 |
millenn | -26.332 |
behavi | -25.981 |
Token | gray |
Token ID | 12768 |
Feature activation | -4.78e+01 |
Pos logit contributions | |
contains | +27.863 |
detects | +27.676 |
img | +27.115 |
coins | +26.719 |
iton | +26.420 |
Neg logit contributions | |
� | -27.477 |
� | -22.746 |
ccording | -22.715 |
� | -21.448 |
� | -21.074 |
Token | , |
Token ID | 837 |
Feature activation | -4.79e+01 |
Pos logit contributions | |
coins | +34.492 |
contains | +34.474 |
img | +34.180 |
you | +32.971 |
iton | +32.330 |
Neg logit contributions | |
� | -39.149 |
ccording | -33.729 |
tremend | -33.429 |
millenn | -32.546 |
� | -31.787 |
Token | c |
Token ID | 269 |
Feature activation | -5.40e+01 |
Pos logit contributions | |
contains | +35.249 |
detects | +32.653 |
you | +32.625 |
img | +32.584 |
coins | +32.016 |
Neg logit contributions | |
� | -34.180 |
ccording | -28.373 |
� | -27.566 |
� | -26.537 |
tremend | -24.924 |
Token | v |
Token ID | 85 |
Feature activation | -6.14e+01 |
Pos logit contributions | |
coins | +38.712 |
img | +38.687 |
iton | +37.889 |
ux | +36.609 |
x | +36.428 |
Neg logit contributions | |
� | -42.728 |
� | -33.826 |
millenn | -33.042 |
tremend | -32.354 |
behavi | -32.182 |
Token | 2 |
Token ID | 17 |
Feature activation | -5.45e+01 |
Pos logit contributions | |
2 | +37.366 |
coins | +37.071 |
img | +36.742 |
X | +36.038 |
x | +35.248 |
Neg logit contributions | |
� | -48.760 |
tremend | -41.558 |
� | -39.192 |
millenn | -39.186 |
behavi | -38.734 |
Token | . |
Token ID | 764 |
Feature activation | -2.68e+01 |
Pos logit contributions | |
contains | +36.522 |
coins | +35.614 |
img | +35.390 |
you | +34.678 |
forge | +34.211 |
Neg logit contributions | |
� | -43.524 |
tremend | -37.201 |
ccording | -36.285 |
millenn | -36.236 |
� | -35.529 |
Token | MOR |
Token ID | 35208 |
Feature activation | -2.76e+01 |
Pos logit contributions | |
detects | +20.920 |
contains | +20.613 |
coins | +19.839 |
img | +19.552 |
X | +19.236 |
Neg logit contributions | |
� | -19.516 |
bipartisan | -19.333 |
politically | -18.253 |
political | -17.842 |
� | -17.247 |
Token | PH |
Token ID | 11909 |
Feature activation | -4.97e+01 |
Pos logit contributions | |
coins | +25.172 |
contains | +24.071 |
img | +23.449 |
rox | +23.004 |
X | +22.918 |
Neg logit contributions | |
� | -25.944 |
bipartisan | -23.087 |
tremend | -22.015 |
politically | -21.839 |
behavi | -21.492 |
Token | _ |
Token ID | 62 |
Feature activation | -3.06e+01 |
Pos logit contributions | |
_ | +37.570 |
coins | +36.257 |
X | +35.780 |
contains | +35.324 |
img | +35.318 |
Neg logit contributions | |
� | -37.806 |
tremend | -32.760 |
millenn | -32.090 |
ccording | -31.583 |
� | -29.974 |
Token | at |
Token ID | 265 |
Feature activation | -2.92e+01 |
Pos logit contributions | |
ata | +34.926 |
img | +34.436 |
iton | +33.417 |
coins | +32.838 |
ax | +32.249 |
Neg logit contributions | |
� | -39.546 |
� | -31.956 |
ccording | -31.212 |
millenn | -31.192 |
behavi | -30.808 |
Token | otic |
Token ID | 6210 |
Feature activation | -3.80e+01 |
Pos logit contributions | |
coins | +21.120 |
img | +19.060 |
rox | +18.874 |
iton | +18.715 |
ames | +18.528 |
Neg logit contributions | |
� | -33.259 |
bipartisan | -29.955 |
behavi | -29.141 |
political | -28.162 |
politically | -27.594 |
Token | plugs |
Token ID | 37008 |
Feature activation | -3.96e+01 |
Pos logit contributions | |
contains | +29.193 |
coins | +28.645 |
detects | +28.510 |
completes | +26.647 |
corresponds | +26.435 |
Neg logit contributions | |
� | -30.831 |
ccording | -25.771 |
bipartisan | -25.181 |
behavi | -24.624 |
� | -23.933 |
Token | , |
Token ID | 11 |
Feature activation | -2.53e+01 |
Pos logit contributions | |
coins | +30.119 |
contains | +29.600 |
you | +28.776 |
img | +28.521 |
iton | +27.879 |
Neg logit contributions | |
� | -37.749 |
ccording | -31.711 |
tremend | -30.955 |
� | -30.564 |
millenn | -30.315 |
Token | mim |
Token ID | 17007 |
Feature activation | -2.77e+01 |
Pos logit contributions | |
contains | +21.160 |
detects | +20.932 |
coins | +20.444 |
img | +19.331 |
iton | +18.906 |
Neg logit contributions | |
� | -24.232 |
bipartisan | -22.614 |
� | -22.574 |
politically | -20.909 |
political | -20.558 |
Token | icking |
Token ID | 7958 |
Feature activation | -6.11e+01 |
Pos logit contributions | |
coins | +22.726 |
iton | +21.681 |
detects | +21.159 |
rox | +21.137 |
img | +21.044 |
Neg logit contributions | |
� | -28.038 |
bipartisan | -24.966 |
behavi | -23.952 |
� | -23.907 |
political | -23.130 |
Token | the |
Token ID | 262 |
Feature activation | -3.64e+01 |
Pos logit contributions | |
you | +36.575 |
contains | +35.395 |
it | +34.822 |
X | +34.519 |
is | +34.501 |
Neg logit contributions | |
� | -45.542 |
ccording | -38.273 |
tremend | -37.844 |
� | -36.729 |
millenn | -36.070 |
Token | sp |
Token ID | 599 |
Feature activation | -4.45e+01 |
Pos logit contributions | |
contains | +30.855 |
detects | +30.711 |
coins | +29.846 |
you | +28.810 |
img | +28.535 |
Neg logit contributions | |
� | -29.795 |
ccording | -25.086 |
� | -23.396 |
� | -22.665 |
bipartisan | -22.441 |
Token | ines |
Token ID | 1127 |
Feature activation | -5.76e+01 |
Pos logit contributions | |
coins | +34.699 |
ames | +34.070 |
ines | +32.862 |
angles | +32.622 |
img | +32.579 |
Neg logit contributions | |
� | -39.011 |
behavi | -32.691 |
� | -31.387 |
ccording | -30.139 |
millenn | -29.970 |
Token | on |
Token ID | 319 |
Feature activation | -5.60e+01 |
Pos logit contributions | |
you | +36.412 |
contains | +35.945 |
coins | +35.427 |
is | +34.334 |
img | +33.850 |
Neg logit contributions | |
� | -44.518 |
ccording | -37.479 |
millenn | -36.991 |
tremend | -36.695 |
� | -35.749 |
Token | a |
Token ID | 257 |
Feature activation | -2.72e+01 |
Pos logit contributions | |
contains | +35.678 |
you | +35.429 |
coins | +34.577 |
img | +34.027 |
is | +33.237 |
Neg logit contributions | |
� | -43.449 |
ccording | -35.243 |
� | -34.743 |
millenn | -33.116 |
tremend | -31.850 |
Token | they |
Token ID | 484 |
Feature activation | -3.89e+01 |
Pos logit contributions | |
you | +33.730 |
contains | +32.861 |
coins | +32.188 |
img | +31.874 |
detects | +31.620 |
Neg logit contributions | |
� | -33.159 |
ccording | -27.657 |
tremend | -25.564 |
bipartisan | -25.511 |
millenn | -25.077 |
Token | are |
Token ID | 389 |
Feature activation | -3.16e+01 |
Pos logit contributions | |
contains | +32.725 |
coins | +30.919 |
you | +30.898 |
is | +30.840 |
img | +30.752 |
Neg logit contributions | |
� | -32.927 |
ccording | -28.709 |
tremend | -25.936 |
millenn | -25.814 |
behavi | -25.280 |
Token | there |
Token ID | 612 |
Feature activation | -4.42e+01 |
Pos logit contributions | |
contains | +26.333 |
coins | +24.703 |
you | +24.442 |
detects | +24.101 |
img | +23.687 |
Neg logit contributions | |
� | -29.532 |
ccording | -24.499 |
bipartisan | -24.451 |
behavi | -22.885 |
� | -22.716 |
Token | at |
Token ID | 379 |
Feature activation | -3.37e+01 |
Pos logit contributions | |
contains | +33.326 |
you | +32.471 |
detects | +30.848 |
img | +30.771 |
is | +30.548 |
Neg logit contributions | |
� | -34.993 |
ccording | -29.848 |
millenn | -27.727 |
tremend | -27.668 |
� | -26.870 |
Token | 16 |
Token ID | 1467 |
Feature activation | -3.39e+01 |
Pos logit contributions | |
contains | +28.491 |
coins | +27.386 |
rox | +26.760 |
img | +26.666 |
detects | +26.526 |
Neg logit contributions | |
� | -28.915 |
ccording | -23.664 |
bipartisan | -23.579 |
behavi | -22.687 |
� | -21.823 |
Token | 80 |
Token ID | 1795 |
Feature activation | -6.09e+01 |
Pos logit contributions | |
coins | +28.731 |
img | +27.974 |
contains | +26.751 |
rox | +26.568 |
ax | +26.270 |
Neg logit contributions | |
� | -32.594 |
ccording | -26.454 |
behavi | -25.925 |
bipartisan | -25.338 |
millenn | -25.249 |
Token | x |
Token ID | 87 |
Feature activation | -4.32e+01 |
Pos logit contributions | |
x | +42.871 |
img | +39.992 |
coins | +39.187 |
X | +39.095 |
contains | +36.972 |
Neg logit contributions | |
� | -40.835 |
ccording | -33.723 |
millenn | -33.529 |
tremend | -33.016 |
� | -32.131 |
Token | 10 |
Token ID | 940 |
Feature activation | -3.12e+01 |
Pos logit contributions | |
coins | +33.248 |
img | +31.291 |
1000 | +31.016 |
contains | +30.759 |
X | +30.223 |
Neg logit contributions | |
� | -40.120 |
tremend | -32.731 |
ccording | -31.656 |
millenn | -30.919 |
behavi | -30.696 |
Token | 50 |
Token ID | 1120 |
Feature activation | -3.94e+01 |
Pos logit contributions | |
coins | +26.817 |
img | +26.492 |
contains | +26.361 |
detects | +25.085 |
rox | +24.683 |
Neg logit contributions | |
� | -30.442 |
ccording | -24.879 |
tremend | -24.133 |
behavi | -23.955 |
bipartisan | -23.917 |
Token | the |
Token ID | 262 |
Feature activation | -2.48e+01 |
Pos logit contributions | |
contains | +31.780 |
you | +31.096 |
coins | +30.834 |
detects | +30.139 |
img | +29.973 |
Neg logit contributions | |
� | -31.403 |
ccording | -26.406 |
tremend | -25.270 |
bipartisan | -24.401 |
millenn | -24.312 |
Token | pixels |
Token ID | 17848 |
Feature activation | -4.11e+01 |
Pos logit contributions | |
coins | +23.659 |
detects | +22.851 |
contains | +22.433 |
img | +21.936 |
iton | +20.982 |
Neg logit contributions | |
� | -22.168 |
bipartisan | -21.784 |
� | -20.246 |
political | -19.483 |
politically | -19.427 |
Token | Line |
Token ID | 13949 |
Feature activation | -2.86e+01 |
Pos logit contributions | |
coins | +18.711 |
img | +17.465 |
contains | +17.348 |
detects | +17.293 |
iton | +17.066 |
Neg logit contributions | |
bipartisan | -15.300 |
politically | -14.437 |
political | -14.218 |
� | -14.191 |
� | -13.956 |
Token | Al |
Token ID | 2348 |
Feature activation | -4.20e+01 |
Pos logit contributions | |
coins | +25.955 |
contains | +25.606 |
X | +24.711 |
iton | +24.635 |
img | +24.631 |
Neg logit contributions | |
bipartisan | -19.858 |
� | -19.646 |
politically | -18.993 |
political | -18.200 |
geopolitical | -17.835 |
Token | ignment |
Token ID | 16747 |
Feature activation | -3.19e+01 |
Pos logit contributions | |
iton | +34.428 |
coins | +32.826 |
ax | +32.522 |
img | +31.860 |
ux | +31.762 |
Neg logit contributions | |
� | -30.301 |
bipartisan | -23.928 |
tremend | -23.687 |
millenn | -23.673 |
behavi | -23.480 |
Token | = |
Token ID | 796 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
coins | +31.294 |
contains | +30.735 |
img | +30.087 |
iton | +29.208 |
detects | +28.878 |
Neg logit contributions | |
� | -26.274 |
bipartisan | -21.272 |
tremend | -21.188 |
ccording | -20.950 |
behavi | -20.900 |
Token | [ |
Token ID | 685 |
Feature activation | -3.68e+01 |
Pos logit contributions | |
coins | +26.135 |
contains | +26.018 |
detects | +25.625 |
iton | +24.755 |
img | +24.516 |
Neg logit contributions | |
� | -18.313 |
bipartisan | -18.229 |
� | -18.017 |
politically | -16.540 |
political | -16.234 |
Token | system |
Token ID | 10057 |
Feature activation | -6.09e+01 |
Pos logit contributions | |
coins | +33.672 |
img | +33.213 |
cube | +31.358 |
wine | +31.261 |
rox | +30.946 |
Neg logit contributions | |
� | -28.383 |
behavi | -22.397 |
bipartisan | -22.110 |
ccording | -21.725 |
� | -21.189 |
Token | . |
Token ID | 13 |
Feature activation | -4.13e+01 |
Pos logit contributions | |
coins | +37.334 |
img | +36.944 |
you | +35.483 |
contains | +35.438 |
forge | +35.402 |
Neg logit contributions | |
� | -49.602 |
tremend | -41.200 |
� | -40.624 |
millenn | -40.531 |
ccording | -39.591 |
Token | draw |
Token ID | 19334 |
Feature activation | -5.51e+01 |
Pos logit contributions | |
coins | +36.150 |
img | +35.749 |
wine | +34.071 |
cube | +33.768 |
map | +33.282 |
Neg logit contributions | |
� | -32.432 |
� | -24.579 |
behavi | -24.177 |
ccording | -23.899 |
bipartisan | -23.500 |
Token | ing |
Token ID | 278 |
Feature activation | -5.75e+01 |
Pos logit contributions | |
img | +36.658 |
ing | +35.058 |
iton | +34.714 |
coins | +33.611 |
ings | +32.337 |
Neg logit contributions | |
� | -48.997 |
� | -39.429 |
tremend | -39.303 |
ccording | -37.695 |
millenn | -37.420 |
Token | . |
Token ID | 13 |
Feature activation | -3.41e+01 |
Pos logit contributions | |
coins | +35.958 |
img | +35.923 |
contains | +34.780 |
/ | +34.448 |
you | +34.425 |
Neg logit contributions | |
� | -49.064 |
tremend | -40.925 |
millenn | -39.792 |
� | -39.702 |
ccording | -39.201 |
Token | String |
Token ID | 10100 |
Feature activation | -5.00e+01 |
Pos logit contributions | |
img | +28.499 |
coins | +28.300 |
wine | +26.795 |
contains | +26.767 |
X | +26.686 |
Neg logit contributions | |
� | -27.993 |
bipartisan | -24.765 |
politically | -24.075 |
political | -23.137 |
behavi | -23.116 |
Token | sq |
Token ID | 19862 |
Feature activation | -5.50e+01 |
Pos logit contributions | |
coins | +20.412 |
contains | +20.268 |
detects | +20.152 |
img | +19.507 |
rox | +18.842 |
Neg logit contributions | |
bipartisan | -18.993 |
� | -18.182 |
politically | -17.298 |
political | -17.150 |
� | -17.051 |
Token | K |
Token ID | 42 |
Feature activation | -5.29e+01 |
Pos logit contributions | |
X | +34.873 |
coins | +33.274 |
img | +32.021 |
_ | +31.955 |
cube | +31.211 |
Neg logit contributions | |
� | -42.821 |
tremend | -37.674 |
ccording | -33.992 |
millenn | -33.696 |
exting | -33.675 |
Token | ernel |
Token ID | 7948 |
Feature activation | -5.30e+01 |
Pos logit contributions | |
img | +37.099 |
coins | +36.639 |
iton | +35.254 |
rox | +35.248 |
ames | +35.201 |
Neg logit contributions | |
� | -36.181 |
� | -28.374 |
behavi | -27.410 |
ccording | -26.793 |
� | -26.391 |
Token | = |
Token ID | 796 |
Feature activation | -5.19e+01 |
Pos logit contributions | |
= | +38.927 |
coins | +37.462 |
contains | +37.099 |
img | +36.937 |
iton | +35.894 |
Neg logit contributions | |
� | -38.743 |
tremend | -32.261 |
millenn | -30.933 |
ccording | -30.868 |
� | -30.689 |
Token | c |
Token ID | 269 |
Feature activation | -5.20e+01 |
Pos logit contributions | |
contains | +36.079 |
you | +33.606 |
detects | +33.313 |
coins | +32.854 |
img | +32.244 |
Neg logit contributions | |
� | -36.171 |
ccording | -30.432 |
� | -28.633 |
� | -26.830 |
tremend | -26.442 |
Token | v |
Token ID | 85 |
Feature activation | -6.08e+01 |
Pos logit contributions | |
coins | +38.928 |
img | +38.169 |
iton | +37.273 |
ux | +36.390 |
map | +35.777 |
Neg logit contributions | |
� | -40.933 |
� | -32.134 |
millenn | -30.533 |
tremend | -30.509 |
behavi | -30.007 |
Token | 2 |
Token ID | 17 |
Feature activation | -5.61e+01 |
Pos logit contributions | |
coins | +38.005 |
2 | +37.473 |
img | +37.273 |
X | +36.135 |
x | +35.636 |
Neg logit contributions | |
� | -48.464 |
tremend | -40.041 |
� | -38.986 |
behavi | -37.511 |
millenn | -37.283 |
Token | . |
Token ID | 13 |
Feature activation | -4.70e+01 |
Pos logit contributions | |
coins | +36.657 |
img | +35.770 |
contains | +35.600 |
forge | +34.898 |
you | +34.576 |
Neg logit contributions | |
� | -46.290 |
tremend | -38.690 |
millenn | -37.999 |
� | -37.870 |
ccording | -36.846 |
Token | get |
Token ID | 1136 |
Feature activation | -4.48e+01 |
Pos logit contributions | |
coins | +38.785 |
img | +38.183 |
init | +37.207 |
map | +37.043 |
X | +36.384 |
Neg logit contributions | |
� | -34.176 |
behavi | -27.463 |
tremend | -27.110 |
� | -26.295 |
ccording | -25.838 |
Token | Struct |
Token ID | 44909 |
Feature activation | -4.37e+01 |
Pos logit contributions | |
coins | +35.326 |
img | +35.035 |
contains | +34.871 |
X | +33.888 |
map | +32.053 |
Neg logit contributions | |
� | -32.162 |
tremend | -26.821 |
millenn | -25.773 |
ccording | -24.824 |
conflic | -24.363 |
Token | uring |
Token ID | 870 |
Feature activation | -4.78e+01 |
Pos logit contributions | |
img | +35.019 |
iton | +34.769 |
coins | +34.572 |
ules | +33.807 |
contains | +33.305 |
Neg logit contributions | |
� | -30.280 |
� | -23.362 |
ccording | -23.287 |
conflic | -22.992 |
� | -22.440 |
Token | cv |
Token ID | 33967 |
Feature activation | -5.65e+01 |
Pos logit contributions | |
coins | +32.671 |
img | +32.178 |
ax | +30.487 |
cube | +30.317 |
iton | +30.083 |
Neg logit contributions | |
� | -31.490 |
bipartisan | -25.330 |
behavi | -24.239 |
ccording | -23.844 |
politically | -23.752 |
Token | 2 |
Token ID | 17 |
Feature activation | -5.05e+01 |
Pos logit contributions | |
coins | +37.143 |
img | +36.406 |
2 | +36.165 |
X | +35.503 |
x | +35.114 |
Neg logit contributions | |
� | -47.119 |
tremend | -38.652 |
� | -37.295 |
behavi | -36.945 |
millenn | -36.693 |
Token | . |
Token ID | 13 |
Feature activation | -2.85e+01 |
Pos logit contributions | |
coins | +36.777 |
img | +35.776 |
contains | +35.131 |
forge | +34.452 |
X | +34.383 |
Neg logit contributions | |
� | -42.501 |
tremend | -36.224 |
millenn | -35.035 |
� | -34.020 |
ccording | -33.813 |
Token | M |
Token ID | 44 |
Feature activation | -4.15e+01 |
Pos logit contributions | |
coins | +26.261 |
img | +25.391 |
contains | +25.002 |
X | +24.427 |
detects | +24.221 |
Neg logit contributions | |
� | -24.715 |
bipartisan | -22.782 |
politically | -21.670 |
tremend | -21.335 |
behavi | -21.229 |
Token | OR |
Token ID | 1581 |
Feature activation | -4.12e+01 |
Pos logit contributions | |
coins | +29.489 |
img | +29.067 |
contains | +28.639 |
X | +28.507 |
rox | +28.346 |
Neg logit contributions | |
� | -35.134 |
tremend | -28.855 |
behavi | -28.838 |
ccording | -28.062 |
bipartisan | -26.553 |
Token | PH |
Token ID | 11909 |
Feature activation | -6.08e+01 |
Pos logit contributions | |
coins | +33.479 |
X | +32.047 |
contains | +31.910 |
img | +31.322 |
hex | +31.125 |
Neg logit contributions | |
� | -31.276 |
tremend | -27.139 |
behavi | -25.195 |
millenn | -24.829 |
ccording | -24.697 |
Token | _ |
Token ID | 62 |
Feature activation | -4.00e+01 |
Pos logit contributions | |
_ | +40.790 |
X | +38.085 |
coins | +37.336 |
img | +36.893 |
contains | +36.403 |
Neg logit contributions | |
� | -42.999 |
tremend | -37.581 |
millenn | -36.198 |
ccording | -34.773 |
� | -33.773 |
Token | RECT |
Token ID | 23988 |
Feature activation | -4.54e+01 |
Pos logit contributions | |
X | +31.998 |
coins | +31.279 |
img | +30.957 |
RECT | +30.294 |
contains | +30.276 |
Neg logit contributions | |
� | -30.232 |
tremend | -25.465 |
bipartisan | -25.282 |
behavi | -25.238 |
politically | -23.901 |
Token | , |
Token ID | 11 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
contains | +33.973 |
coins | +33.737 |
img | +33.518 |
you | +32.792 |
X | +32.784 |
Neg logit contributions | |
� | -36.759 |
tremend | -31.805 |
millenn | -30.499 |
ccording | -30.121 |
behavi | -28.720 |
Token | ( |
Token ID | 357 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
contains | +18.243 |
detects | +17.705 |
coins | +17.586 |
img | +17.188 |
iton | +16.601 |
Neg logit contributions | |
bipartisan | -18.116 |
� | -17.604 |
politically | -17.153 |
� | -16.677 |
political | -16.554 |
Token | 13 |
Token ID | 1485 |
Feature activation | -3.80e+01 |
Pos logit contributions | |
coins | +14.695 |
detects | +13.401 |
contains | +13.309 |
img | +13.237 |
iton | +13.117 |
Neg logit contributions | |
bipartisan | -16.655 |
� | -15.893 |
� | -15.534 |
politically | -15.525 |
political | -15.394 |
Token | [ |
Token ID | 685 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
coins | +15.156 |
detects | +14.579 |
contains | +14.477 |
iton | +14.252 |
img | +13.993 |
Neg logit contributions | |
bipartisan | -13.199 |
� | -12.840 |
politically | -12.096 |
political | -12.044 |
� | -11.622 |
Token | b |
Token ID | 65 |
Feature activation | -2.22e+01 |
Pos logit contributions | |
coins | +26.965 |
img | +26.048 |
contains | +24.760 |
wine | +24.632 |
iton | +24.611 |
Neg logit contributions | |
� | -20.644 |
bipartisan | -19.249 |
� | -17.778 |
politically | -17.537 |
political | -17.526 |
Token | ] |
Token ID | 60 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
coins | +22.706 |
img | +21.602 |
contains | +21.587 |
iton | +21.006 |
detects | +20.910 |
Neg logit contributions | |
� | -21.803 |
bipartisan | -19.820 |
behavi | -18.786 |
� | -18.287 |
politically | -18.274 |
Token | Console |
Token ID | 47581 |
Feature activation | -2.91e+01 |
Pos logit contributions | |
coins | +17.638 |
contains | +16.824 |
detects | +16.762 |
iton | +16.707 |
img | +16.686 |
Neg logit contributions | |
bipartisan | -16.430 |
politically | -15.079 |
� | -14.997 |
� | -14.879 |
political | -14.706 |
Token | : |
Token ID | 25 |
Feature activation | -2.66e+01 |
Pos logit contributions | |
coins | +31.651 |
contains | +31.333 |
detects | +30.632 |
img | +30.462 |
iton | +29.743 |
Neg logit contributions | |
� | -20.526 |
bipartisan | -17.386 |
ccording | -16.222 |
behavi | -16.152 |
politically | -15.554 |
Token | [/ |
Token ID | 13412 |
Feature activation | -6.02e+01 |
Pos logit contributions | |
coins | +29.895 |
contains | +28.755 |
img | +28.468 |
iton | +27.996 |
detects | +27.976 |
Neg logit contributions | |
� | -18.955 |
bipartisan | -17.249 |
politically | -15.309 |
behavi | -15.282 |
tremend | -14.979 |
Token | b |
Token ID | 65 |
Feature activation | -2.63e+01 |
Pos logit contributions | |
img | +37.482 |
coins | +34.899 |
b | +33.923 |
cube | +33.806 |
bis | +33.269 |
Neg logit contributions | |
� | -49.406 |
millenn | -39.459 |
� | -39.413 |
behavi | -37.926 |
tremend | -37.700 |
Token | ] |
Token ID | 60 |
Feature activation | -2.03e+01 |
Pos logit contributions | |
coins | +27.257 |
contains | +26.506 |
img | +26.394 |
iton | +25.495 |
detects | +25.350 |
Neg logit contributions | |
� | -23.392 |
bipartisan | -19.862 |
behavi | -19.596 |
tremend | -18.953 |
ccording | -18.844 |
Token | NES |
Token ID | 31925 |
Feature activation | -1.79e+01 |
Pos logit contributions | |
coins | +22.791 |
contains | +22.366 |
detects | +22.308 |
iton | +21.793 |
img | +21.754 |
Neg logit contributions | |
bipartisan | -14.704 |
� | -13.757 |
politically | -13.051 |
political | -12.924 |
� | -12.750 |
Token | ( |
Token ID | 357 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
coins | +20.656 |
detects | +19.891 |
contains | +19.838 |
iton | +19.291 |
img | +19.273 |
Neg logit contributions | |
bipartisan | -14.520 |
� | -14.164 |
politically | -13.144 |
political | -13.076 |
� | -12.620 |
Token | P |
Token ID | 47 |
Feature activation | -2.78e+01 |
Pos logit contributions | |
coins | +27.440 |
contains | +25.877 |
detects | +25.675 |
img | +25.652 |
rox | +25.433 |
Neg logit contributions | |
bipartisan | -15.775 |
� | -14.540 |
� | -14.382 |
politically | -14.146 |
political | -13.880 |
Token | Color |
Token ID | 10258 |
Feature activation | -3.11e+01 |
Pos logit contributions | |
coins | +17.048 |
img | +16.355 |
contains | +15.867 |
detects | +15.862 |
rox | +15.590 |
Neg logit contributions | |
bipartisan | -22.869 |
� | -22.806 |
politically | -21.551 |
political | -21.427 |
� | -21.390 |
Token | ( |
Token ID | 357 |
Feature activation | -3.80e+01 |
Pos logit contributions | |
coins | +28.505 |
contains | +27.098 |
img | +27.030 |
iton | +26.096 |
rox | +25.814 |
Neg logit contributions | |
� | -27.159 |
bipartisan | -23.808 |
politically | -22.850 |
� | -22.629 |
ccording | -22.529 |
Token | image |
Token ID | 2939 |
Feature activation | -3.88e+01 |
Pos logit contributions | |
img | +29.120 |
contains | +28.339 |
detects | +27.699 |
iton | +26.139 |
X | +26.043 |
Neg logit contributions | |
� | -32.276 |
� | -27.411 |
ccording | -27.298 |
bipartisan | -26.706 |
� | -26.386 |
Token | , |
Token ID | 837 |
Feature activation | -3.98e+01 |
Pos logit contributions | |
coins | +32.579 |
contains | +32.093 |
img | +31.472 |
iton | +29.911 |
X | +29.901 |
Neg logit contributions | |
� | -31.582 |
tremend | -27.425 |
ccording | -27.048 |
millenn | -25.629 |
behavi | -25.101 |
Token | c |
Token ID | 269 |
Feature activation | -5.03e+01 |
Pos logit contributions | |
contains | +32.542 |
detects | +30.943 |
img | +30.490 |
coins | +30.349 |
you | +29.469 |
Neg logit contributions | |
� | -29.632 |
ccording | -24.619 |
� | -24.001 |
bipartisan | -23.490 |
� | -23.021 |
Token | v |
Token ID | 85 |
Feature activation | -6.00e+01 |
Pos logit contributions | |
coins | +37.607 |
img | +37.130 |
iton | +36.404 |
ux | +35.547 |
rox | +34.796 |
Neg logit contributions | |
� | -40.827 |
� | -32.315 |
millenn | -31.562 |
behavi | -30.883 |
tremend | -30.546 |
Token | 2 |
Token ID | 17 |
Feature activation | -5.71e+01 |
Pos logit contributions | |
coins | +36.942 |
2 | +36.707 |
img | +36.218 |
X | +35.842 |
x | +34.727 |
Neg logit contributions | |
� | -47.708 |
tremend | -40.256 |
� | -38.311 |
millenn | -38.218 |
behavi | -37.580 |
Token | . |
Token ID | 764 |
Feature activation | -2.89e+01 |
Pos logit contributions | |
contains | +36.515 |
coins | +35.923 |
img | +35.496 |
you | +34.582 |
forge | +34.239 |
Neg logit contributions | |
� | -44.341 |
tremend | -37.321 |
millenn | -36.611 |
ccording | -36.549 |
� | -36.178 |
Token | COL |
Token ID | 20444 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
contains | +27.241 |
detects | +26.832 |
coins | +26.070 |
img | +26.032 |
corresponds | +24.998 |
Neg logit contributions | |
� | -17.004 |
bipartisan | -16.956 |
politically | -15.698 |
political | -15.261 |
� | -15.173 |
Token | OR |
Token ID | 1581 |
Feature activation | -5.05e+01 |
Pos logit contributions | |
coins | +21.935 |
contains | +20.871 |
img | +20.833 |
iton | +20.419 |
detects | +20.314 |
Neg logit contributions | |
� | -21.783 |
bipartisan | -20.886 |
politically | -20.249 |
political | -20.040 |
� | -19.917 |
Token | _ |
Token ID | 62 |
Feature activation | -2.72e+01 |
Pos logit contributions | |
_ | +36.140 |
coins | +34.397 |
img | +33.789 |
X | +33.711 |
contains | +33.484 |
Neg logit contributions | |
� | -38.197 |
tremend | -33.485 |
ccording | -32.077 |
millenn | -31.698 |
behavi | -30.386 |
Token | Struct |
Token ID | 44909 |
Feature activation | -4.37e+01 |
Pos logit contributions | |
coins | +35.326 |
img | +35.035 |
contains | +34.871 |
X | +33.888 |
map | +32.053 |
Neg logit contributions | |
� | -32.162 |
tremend | -26.821 |
millenn | -25.773 |
ccording | -24.824 |
conflic | -24.363 |
Token | uring |
Token ID | 870 |
Feature activation | -4.78e+01 |
Pos logit contributions | |
img | +35.019 |
iton | +34.769 |
coins | +34.572 |
ules | +33.807 |
contains | +33.305 |
Neg logit contributions | |
� | -30.280 |
� | -23.362 |
ccording | -23.287 |
conflic | -22.992 |
� | -22.440 |
Token | Element |
Token ID | 20180 |
Feature activation | -5.22e+01 |
Pos logit contributions | |
contains | +35.480 |
X | +34.535 |
img | +34.022 |
coins | +33.692 |
iton | +33.200 |
Neg logit contributions | |
� | -33.197 |
tremend | -28.680 |
ccording | -26.219 |
conflic | -26.103 |
bipartisan | -25.581 |
Token | ( |
Token ID | 7 |
Feature activation | -5.14e+01 |
Pos logit contributions | |
coins | +38.908 |
img | +38.523 |
contains | +38.033 |
X | +37.163 |
cube | +37.139 |
Neg logit contributions | |
� | -38.825 |
tremend | -32.878 |
millenn | -32.121 |
ccording | -30.341 |
� | -30.111 |
Token | cv |
Token ID | 33967 |
Feature activation | -6.25e+01 |
Pos logit contributions | |
coins | +38.294 |
img | +37.403 |
ax | +36.411 |
cube | +36.024 |
cs | +35.295 |
Neg logit contributions | |
� | -35.329 |
� | -26.608 |
ccording | -26.360 |
tremend | -25.889 |
millenn | -25.804 |
Token | 2 |
Token ID | 17 |
Feature activation | -5.96e+01 |
Pos logit contributions | |
coins | +37.602 |
2 | +37.595 |
img | +36.983 |
X | +36.330 |
x | +35.946 |
Neg logit contributions | |
� | -49.652 |
tremend | -41.223 |
� | -39.670 |
behavi | -38.904 |
millenn | -38.476 |
Token | . |
Token ID | 13 |
Feature activation | -3.69e+01 |
Pos logit contributions | |
coins | +37.165 |
img | +36.261 |
contains | +35.799 |
X | +35.260 |
forge | +35.248 |
Neg logit contributions | |
� | -46.667 |
tremend | -40.235 |
millenn | -39.118 |
� | -37.788 |
ccording | -37.412 |
Token | M |
Token ID | 44 |
Feature activation | -5.00e+01 |
Pos logit contributions | |
coins | +31.131 |
img | +30.288 |
X | +30.142 |
contains | +29.644 |
map | +28.401 |
Neg logit contributions | |
� | -29.120 |
tremend | -26.301 |
behavi | -24.671 |
bipartisan | -24.078 |
ccording | -23.946 |
Token | OR |
Token ID | 1581 |
Feature activation | -4.79e+01 |
Pos logit contributions | |
coins | +31.589 |
X | +31.258 |
img | +31.049 |
rox | +30.700 |
contains | +30.580 |
Neg logit contributions | |
� | -39.090 |
tremend | -33.494 |
behavi | -32.171 |
ccording | -31.313 |
millenn | -29.747 |
Token | PH |
Token ID | 11909 |
Feature activation | -6.55e+01 |
Pos logit contributions | |
coins | +33.661 |
X | +32.258 |
contains | +31.153 |
hex | +30.977 |
img | +30.850 |
Neg logit contributions | |
� | -36.304 |
tremend | -32.663 |
millenn | -29.269 |
behavi | -29.102 |
ccording | -28.968 |
Token | _ |
Token ID | 62 |
Feature activation | -4.53e+01 |
Pos logit contributions | |
_ | +41.955 |
X | +38.559 |
coins | +37.956 |
+ | +37.170 |
img | +37.062 |
Neg logit contributions | |
� | -44.346 |
tremend | -39.366 |
millenn | -37.678 |
ccording | -36.220 |
� | -35.124 |
Token | SR |
Token ID | 12562 |
Feature activation | -4.12e+01 |
Pos logit contributions | |
coins | +28.218 |
img | +27.398 |
wine | +25.456 |
properties | +25.383 |
contains | +25.311 |
Neg logit contributions | |
bipartisan | -19.377 |
� | -18.298 |
� | -17.908 |
politically | -17.551 |
political | -17.318 |
Token | . |
Token ID | 13 |
Feature activation | -2.77e+01 |
Pos logit contributions | |
coins | +33.889 |
img | +33.111 |
contains | +32.691 |
forge | +31.719 |
X | +31.009 |
Neg logit contributions | |
� | -35.654 |
tremend | -30.006 |
millenn | -29.908 |
ccording | -28.655 |
� | -27.907 |
Token | Width |
Token ID | 30916 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
coins | +21.566 |
img | +20.805 |
X | +20.738 |
contains | +20.522 |
wine | +20.050 |
Neg logit contributions | |
bipartisan | -22.718 |
politically | -21.664 |
� | -21.401 |
political | -21.174 |
geopolitical | -20.667 |
Token | , |
Token ID | 11 |
Feature activation | -3.80e+01 |
Pos logit contributions | |
coins | +21.985 |
contains | +21.281 |
detects | +20.976 |
img | +20.350 |
+ | +20.219 |
Neg logit contributions | |
bipartisan | -17.401 |
� | -16.278 |
politically | -16.171 |
� | -16.099 |
political | -15.593 |
Token | $ |
Token ID | 3 |
Feature activation | -3.79e+01 |
Pos logit contributions | |
coins | +37.305 |
img | +35.961 |
contains | +34.585 |
wine | +34.087 |
X | +34.029 |
Neg logit contributions | |
� | -24.966 |
bipartisan | -20.149 |
tremend | -19.915 |
behavi | -19.473 |
millenn | -19.113 |
Token | SR |
Token ID | 12562 |
Feature activation | -5.95e+01 |
Pos logit contributions | |
coins | +32.575 |
img | +31.341 |
iton | +29.047 |
wine | +28.847 |
rox | +28.680 |
Neg logit contributions | |
� | -23.582 |
bipartisan | -22.590 |
� | -20.769 |
politically | -20.411 |
political | -19.989 |
Token | . |
Token ID | 13 |
Feature activation | -3.31e+01 |
Pos logit contributions | |
coins | +37.699 |
img | +37.293 |
forge | +36.708 |
contains | +36.152 |
+ | +35.556 |
Neg logit contributions | |
� | -45.667 |
tremend | -38.899 |
millenn | -38.888 |
ccording | -36.609 |
� | -36.557 |
Token | Height |
Token ID | 23106 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
coins | +28.673 |
img | +28.609 |
X | +27.875 |
contains | +27.402 |
angles | +26.182 |
Neg logit contributions | |
� | -28.147 |
bipartisan | -25.224 |
tremend | -24.912 |
behavi | -23.884 |
politically | -23.721 |
Token | ) |
Token ID | 8 |
Feature activation | -2.16e+01 |
Pos logit contributions | |
coins | +8.320 |
contains | +7.476 |
detects | +7.302 |
img | +6.812 |
rox | +6.720 |
Neg logit contributions | |
bipartisan | -16.504 |
� | -15.782 |
politically | -15.647 |
political | -15.402 |
geopolitical | -15.296 |
Token | $ |
Token ID | 720 |
Feature activation | -2.83e+01 |
Pos logit contributions | |
contains | +17.695 |
coins | +17.606 |
detects | +17.271 |
img | +16.494 |
wine | +15.764 |
Neg logit contributions | |
� | -18.088 |
bipartisan | -17.684 |
politically | -16.571 |
geopolitical | -16.357 |
fraught | -16.110 |
Token | image |
Token ID | 9060 |
Feature activation | -2.65e+01 |
Pos logit contributions | |
img | +27.908 |
coins | +27.609 |
wine | +25.912 |
angles | +25.133 |
properties | +25.124 |
Neg logit contributions | |
bipartisan | -20.038 |
� | -19.407 |
� | -18.619 |
politically | -18.312 |
political | -18.124 |
Token | , |
Token ID | 11 |
Feature activation | -3.37e+01 |
Pos logit contributions | |
coins | +36.415 |
contains | +35.071 |
img | +35.015 |
you | +34.424 |
X | +33.665 |
Neg logit contributions | |
� | -37.151 |
tremend | -31.181 |
millenn | -30.201 |
ccording | -29.891 |
behavi | -28.935 |
Token | 21 |
Token ID | 2310 |
Feature activation | -2.30e+01 |
Pos logit contributions | |
coins | +25.166 |
contains | +24.263 |
corresponds | +23.215 |
ax | +23.025 |
iton | +22.975 |
Neg logit contributions | |
� | -30.212 |
behavi | -26.497 |
bipartisan | -25.607 |
tremend | -25.498 |
ccording | -25.388 |
Token | )) |
Token ID | 4008 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
coins | +18.497 |
contains | +17.341 |
detects | +16.869 |
rox | +16.410 |
iton | +16.287 |
Neg logit contributions | |
� | -25.563 |
bipartisan | -25.198 |
political | -23.783 |
� | -23.770 |
politically | -23.763 |
Token | # |
Token ID | 1303 |
Feature activation | -3.25e+01 |
Pos logit contributions | |
detects | +16.587 |
contains | +16.334 |
coins | +15.834 |
img | +15.594 |
map | +14.473 |
Neg logit contributions | |
bipartisan | -19.358 |
� | -18.784 |
politically | -18.039 |
political | -17.618 |
� | -17.518 |
Token | loop |
Token ID | 9052 |
Feature activation | -4.34e+01 |
Pos logit contributions | |
detects | +26.946 |
contains | +26.849 |
coins | +26.567 |
iton | +25.121 |
ax | +24.841 |
Neg logit contributions | |
� | -23.655 |
bipartisan | -23.355 |
� | -22.672 |
politically | -21.381 |
political | -21.215 |
Token | over |
Token ID | 625 |
Feature activation | -5.93e+01 |
Pos logit contributions | |
contains | +31.354 |
detects | +29.827 |
you | +29.484 |
coins | +29.454 |
rox | +28.491 |
Neg logit contributions | |
� | -35.308 |
ccording | -28.591 |
� | -27.886 |
behavi | -26.960 |
tremend | -26.701 |
Token | the |
Token ID | 262 |
Feature activation | -4.53e+01 |
Pos logit contributions | |
contains | +36.932 |
you | +36.551 |
img | +34.997 |
it | +34.654 |
coins | +34.652 |
Neg logit contributions | |
� | -41.698 |
ccording | -34.536 |
tremend | -33.621 |
� | -33.370 |
millenn | -31.598 |
Token | input |
Token ID | 5128 |
Feature activation | -4.83e+01 |
Pos logit contributions | |
contains | +34.620 |
img | +33.506 |
detects | +33.418 |
input | +32.301 |
you | +31.965 |
Neg logit contributions | |
� | -32.355 |
ccording | -25.600 |
� | -24.872 |
behavi | -23.803 |
� | -23.654 |
Token | image |
Token ID | 2939 |
Feature activation | -3.14e+01 |
Pos logit contributions | |
contains | +33.591 |
img | +33.495 |
detects | +33.278 |
you | +31.965 |
X | +31.877 |
Neg logit contributions | |
� | -34.862 |
ccording | -29.656 |
� | -27.557 |
� | -27.405 |
� | -25.921 |
Token | paths |
Token ID | 13532 |
Feature activation | -3.65e+01 |
Pos logit contributions | |
contains | +28.213 |
coins | +28.078 |
detects | +27.852 |
img | +25.742 |
corresponds | +25.617 |
Neg logit contributions | |
� | -25.553 |
bipartisan | -22.225 |
ccording | -21.582 |
� | -21.491 |
cynical | -20.323 |
Token | for |
Token ID | 329 |
Feature activation | -4.29e+01 |
Pos logit contributions | |
contains | +29.666 |
coins | +29.268 |
detects | +28.561 |
img | +27.581 |
iton | +27.289 |
Neg logit contributions | |
� | -31.008 |
ccording | -26.447 |
� | -24.798 |
behavi | -24.051 |
bipartisan | -23.650 |
Token | 2 |
Token ID | 17 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
coins | +21.387 |
img | +20.312 |
contains | +20.030 |
detects | +19.414 |
iton | +19.303 |
Neg logit contributions | |
bipartisan | -18.153 |
� | -17.108 |
politically | -17.089 |
political | -16.790 |
geopolitical | -16.512 |
Token | = |
Token ID | 796 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
coins | +21.872 |
contains | +20.509 |
img | +20.165 |
detects | +20.165 |
iton | +19.938 |
Neg logit contributions | |
bipartisan | -19.807 |
� | -19.258 |
� | -18.821 |
politically | -18.480 |
political | -18.465 |
Token | New |
Token ID | 968 |
Feature activation | -5.32e+01 |
Pos logit contributions | |
contains | +17.964 |
coins | +17.525 |
detects | +17.142 |
img | +16.710 |
wine | +16.464 |
Neg logit contributions | |
bipartisan | -18.943 |
� | -18.695 |
politically | -17.550 |
political | -17.251 |
geopolitical | -17.202 |
Token | - |
Token ID | 12 |
Feature activation | -4.80e+01 |
Pos logit contributions | |
img | +34.958 |
coins | +34.951 |
contains | +34.406 |
+ | +34.217 |
iton | +33.216 |
Neg logit contributions | |
� | -43.349 |
tremend | -37.245 |
ccording | -34.501 |
millenn | -34.157 |
� | -33.615 |
Token | Object |
Token ID | 10267 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
X | +33.778 |
coins | +33.363 |
img | +32.695 |
wine | +31.670 |
edit | +31.591 |
Neg logit contributions | |
� | -41.422 |
tremend | -34.369 |
millenn | -32.097 |
exting | -31.941 |
ccording | -31.261 |
Token | System |
Token ID | 4482 |
Feature activation | -5.85e+01 |
Pos logit contributions | |
contains | +21.294 |
detects | +20.428 |
img | +20.140 |
coins | +20.038 |
wine | +19.579 |
Neg logit contributions | |
bipartisan | -17.656 |
� | -17.533 |
politically | -16.736 |
� | -16.570 |
geopolitical | -16.135 |
Token | . |
Token ID | 13 |
Feature activation | -2.91e+01 |
Pos logit contributions | |
coins | +36.286 |
img | +36.227 |
contains | +35.236 |
forge | +34.620 |
you | +34.613 |
Neg logit contributions | |
� | -47.565 |
tremend | -40.082 |
� | -38.365 |
millenn | -38.341 |
ccording | -37.766 |
Token | Draw |
Token ID | 25302 |
Feature activation | -5.38e+01 |
Pos logit contributions | |
coins | +29.747 |
img | +28.403 |
contains | +27.887 |
wine | +27.586 |
detects | +26.711 |
Neg logit contributions | |
� | -23.578 |
bipartisan | -20.595 |
politically | -19.580 |
political | -19.153 |
tremend | -19.152 |
Token | ing |
Token ID | 278 |
Feature activation | -4.09e+01 |
Pos logit contributions | |
img | +36.698 |
ing | +35.030 |
iton | +34.708 |
coins | +34.174 |
ings | +33.055 |
Neg logit contributions | |
� | -46.415 |
tremend | -38.293 |
� | -36.761 |
ccording | -35.802 |
millenn | -35.712 |
Token | . |
Token ID | 13 |
Feature activation | -2.54e+01 |
Pos logit contributions | |
coins | +34.004 |
img | +33.465 |
contains | +32.506 |
forge | +31.536 |
cube | +31.249 |
Neg logit contributions | |
� | -36.360 |
tremend | -30.182 |
ccording | -28.580 |
millenn | -28.521 |
� | -27.910 |
Token | Font |
Token ID | 23252 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
coins | +23.592 |
img | +23.004 |
contains | +21.902 |
wine | +21.609 |
hex | +21.415 |
Neg logit contributions | |
bipartisan | -20.510 |
� | -19.849 |
politically | -19.348 |
political | -18.885 |
geopolitical | -18.451 |
Token | which |
Token ID | 543 |
Feature activation | -4.45e+00 |
Pos logit contributions | |
� | +7.812 |
bipartisan | +7.733 |
political | +7.609 |
politically | +7.561 |
� | +7.267 |
Neg logit contributions | |
coins | -3.876 |
detects | -3.443 |
iton | -3.268 |
img | -3.219 |
contains | -3.182 |
Token | impacts |
Token ID | 12751 |
Feature activation | -5.15e+00 |
Pos logit contributions | |
coins | +4.541 |
detects | +4.233 |
iton | +4.126 |
img | +4.060 |
contains | +4.059 |
Neg logit contributions | |
bipartisan | -5.194 |
� | -5.156 |
political | -4.963 |
politically | -4.937 |
� | -4.721 |
Token | us |
Token ID | 514 |
Feature activation | +9.67e+00 |
Pos logit contributions | |
coins | +5.397 |
detects | +5.135 |
contains | +4.965 |
iton | +4.914 |
img | +4.849 |
Neg logit contributions | |
bipartisan | -5.769 |
� | -5.712 |
political | -5.440 |
politically | -5.416 |
� | -5.199 |
Token | personally |
Token ID | 7620 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
� | +12.460 |
politically | +12.180 |
bipartisan | +11.767 |
political | +11.749 |
� | +11.391 |
Neg logit contributions | |
coins | -8.000 |
detects | -7.278 |
iton | -6.913 |
wine | -6.815 |
contains | -6.720 |
Token | . |
Token ID | 13 |
Feature activation | +5.74e+00 |
Pos logit contributions | |
� | +20.632 |
politically | +19.520 |
bipartisan | +18.746 |
political | +18.746 |
� | +18.654 |
Neg logit contributions | |
coins | -13.310 |
detects | -12.126 |
iton | -11.589 |
wine | -11.370 |
rox | -11.213 |
Token |
|
Token ID | 198 |
Feature activation | +3.62e+01 |
Pos logit contributions | |
� | +6.474 |
bipartisan | +6.010 |
� | +5.940 |
political | +5.773 |
politically | +5.630 |
Neg logit contributions | |
coins | -5.975 |
detects | -5.825 |
iton | -5.573 |
mitter | -5.433 |
rox | -5.433 |
Token |
|
Token ID | 198 |
Feature activation | +8.63e+00 |
Pos logit contributions | |
� | +22.551 |
� | +20.383 |
| +18.930 |
bipartisan | +17.029 |
political | +16.504 |
Neg logit contributions | |
detects | -28.066 |
eatures | -27.857 |
yip | -26.606 |
coins | -26.021 |
senal | -25.849 |
Token | If |
Token ID | 1532 |
Feature activation | -9.91e+00 |
Pos logit contributions | |
� | +11.246 |
bipartisan | +9.853 |
� | +9.815 |
political | +9.484 |
politically | +9.175 |
Neg logit contributions | |
detects | -7.487 |
coins | -7.023 |
contains | -6.700 |
iton | -6.686 |
assium | -6.315 |
Token | you |
Token ID | 345 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
coins | +12.065 |
detects | +11.660 |
contains | +11.416 |
iton | +11.171 |
img | +11.051 |
Neg logit contributions | |
bipartisan | -8.830 |
� | -8.653 |
politically | -8.037 |
political | -8.019 |
� | -7.664 |
Token | , |
Token ID | 11 |
Feature activation | -4.34e+00 |
Pos logit contributions | |
� | +15.812 |
� | +14.778 |
bipartisan | +14.439 |
politically | +14.264 |
political | +14.248 |
Neg logit contributions | |
coins | -9.179 |
detects | -7.966 |
iton | -7.844 |
img | -7.626 |
rox | -7.625 |
Token | like |
Token ID | 588 |
Feature activation | -7.37e+00 |
Pos logit contributions | |
coins | +3.685 |
detects | +3.451 |
contains | +3.291 |
iton | +3.280 |
img | +3.208 |
Neg logit contributions | |
bipartisan | -5.784 |
� | -5.750 |
political | -5.514 |
politically | -5.502 |
� | -5.332 |
Token | of |
Token ID | 286 |
Feature activation | +7.96e+00 |
Pos logit contributions | |
bipartisan | +3.210 |
� | +3.133 |
political | +3.053 |
politically | +3.047 |
geopolitical | +2.958 |
Neg logit contributions | |
coins | -0.999 |
detects | -0.909 |
contains | -0.879 |
iton | -0.836 |
img | -0.810 |
Token | working |
Token ID | 1762 |
Feature activation | +4.68e+00 |
Pos logit contributions | |
bipartisan | +9.633 |
political | +9.313 |
� | +9.153 |
politically | +9.103 |
troubling | +8.510 |
Neg logit contributions | |
coins | -7.293 |
detects | -6.765 |
iton | -6.651 |
wine | -6.473 |
img | -6.386 |
Token | families |
Token ID | 4172 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
bipartisan | +4.610 |
� | +4.464 |
political | +4.423 |
politically | +4.301 |
� | +4.058 |
Neg logit contributions | |
coins | -5.482 |
detects | -5.151 |
iton | -4.951 |
mitter | -4.948 |
rox | -4.943 |
Token | . |
Token ID | 13 |
Feature activation | +2.44e+01 |
Pos logit contributions | |
� | +20.029 |
bipartisan | +18.981 |
politically | +18.692 |
� | +18.522 |
political | +18.400 |
Neg logit contributions | |
coins | -12.248 |
detects | -11.498 |
iton | -11.113 |
rox | -10.959 |
wine | -10.593 |
Token |
|
Token ID | 198 |
Feature activation | +3.73e+01 |
Pos logit contributions | |
� | +24.660 |
� | +22.455 |
bipartisan | +21.375 |
Democratic | +20.478 |
political | +20.429 |
Neg logit contributions | |
detects | -18.998 |
iton | -18.207 |
coins | -18.144 |
mitter | -17.759 |
rox | -17.056 |
Token |
|
Token ID | 198 |
Feature activation | +2.13e+01 |
Pos logit contributions | |
� | +22.753 |
� | +20.618 |
| +19.321 |
bipartisan | +17.479 |
political | +16.487 |
Neg logit contributions | |
eatures | -29.503 |
detects | -28.826 |
yip | -27.395 |
senal | -26.996 |
coins | -26.771 |
Token | I |
Token ID | 40 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
� | +22.531 |
bipartisan | +18.856 |
� | +18.618 |
political | +17.670 |
Politics | +17.588 |
Neg logit contributions | |
detects | -18.093 |
iton | -16.319 |
assium | -15.702 |
coins | -15.372 |
contains | -15.370 |
Token | represent |
Token ID | 2380 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
� | +22.313 |
� | +20.621 |
bipartisan | +20.600 |
political | +19.760 |
politically | +19.602 |
Neg logit contributions | |
coins | -13.257 |
detects | -12.375 |
iton | -11.629 |
ames | -11.537 |
img | -11.350 |
Token | Vermont |
Token ID | 16033 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
bipartisan | +16.266 |
� | +15.745 |
political | +15.646 |
politically | +15.252 |
� | +14.784 |
Neg logit contributions | |
coins | -10.143 |
detects | -9.747 |
img | -9.197 |
rox | -9.057 |
iton | -9.037 |
Token | , |
Token ID | 11 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
� | +2.586 |
bipartisan | +2.584 |
political | +2.498 |
politically | +2.475 |
� | +2.408 |
Neg logit contributions | |
coins | -1.193 |
detects | -1.123 |
rox | -1.035 |
img | -1.031 |
contains | -1.026 |
Token | a |
Token ID | 257 |
Feature activation | +2.65e+01 |
Pos logit contributions | |
bipartisan | +4.436 |
� | +4.320 |
political | +4.264 |
politically | +4.216 |
� | +4.044 |
Neg logit contributions | |
coins | -2.489 |
detects | -2.236 |
img | -2.151 |
rox | -2.135 |
iton | -2.120 |
Token | harassment |
Token ID | 10556 |
Feature activation | +3.66e+00 |
Pos logit contributions | |
bipartisan | +17.258 |
� | +17.158 |
political | +17.089 |
politically | +16.771 |
� | +16.546 |
Neg logit contributions | |
coins | -8.208 |
iton | -6.920 |
mitter | -6.668 |
wine | -6.627 |
img | -6.571 |
Token | is |
Token ID | 318 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
� | +5.702 |
bipartisan | +5.701 |
political | +5.519 |
politically | +5.498 |
� | +5.399 |
Neg logit contributions | |
coins | -2.207 |
iton | -1.916 |
img | -1.823 |
detects | -1.800 |
rox | -1.780 |
Token | often |
Token ID | 1690 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
bipartisan | +19.003 |
political | +18.712 |
politically | +18.495 |
� | +18.060 |
troubling | +17.721 |
Neg logit contributions | |
coins | -14.237 |
iton | -12.910 |
detects | -12.438 |
mitter | -12.402 |
assium | -12.385 |
Token | linked |
Token ID | 6692 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
bipartisan | +18.412 |
political | +18.192 |
politically | +17.876 |
� | +17.259 |
troubling | +16.819 |
Neg logit contributions | |
coins | -13.241 |
iton | -11.906 |
assium | -11.416 |
mitter | -11.326 |
img | -11.295 |
Token | to |
Token ID | 284 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
� | +19.022 |
bipartisan | +18.982 |
politically | +18.302 |
political | +18.297 |
� | +17.800 |
Neg logit contributions | |
coins | -8.811 |
detects | -8.091 |
contains | -7.545 |
iton | -7.494 |
img | -7.441 |
Token | the |
Token ID | 262 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
political | +15.788 |
politically | +15.297 |
bipartisan | +15.177 |
� | +15.113 |
� | +14.502 |
Neg logit contributions | |
coins | -11.505 |
assium | -10.260 |
detects | -10.141 |
mitter | -10.084 |
img | -10.013 |
Token | threat |
Token ID | 2372 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
political | +20.046 |
politically | +19.445 |
bipartisan | +19.225 |
� | +18.901 |
� | +18.294 |
Neg logit contributions | |
coins | -15.556 |
detects | -13.909 |
wine | -13.745 |
assium | -13.635 |
img | -13.435 |
Token | of |
Token ID | 286 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
bipartisan | +3.727 |
� | +3.680 |
political | +3.543 |
politically | +3.537 |
� | +3.441 |
Neg logit contributions | |
coins | -1.403 |
detects | -1.297 |
contains | -1.230 |
iton | -1.193 |
img | -1.156 |
Token | violence |
Token ID | 3685 |
Feature activation | +6.80e+00 |
Pos logit contributions | |
political | +12.761 |
bipartisan | +12.429 |
politically | +12.313 |
� | +12.137 |
� | +11.547 |
Neg logit contributions | |
coins | -11.745 |
mitter | -10.829 |
wine | -10.653 |
img | -10.621 |
detects | -10.606 |
Token | . |
Token ID | 13 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
� | +9.338 |
bipartisan | +9.130 |
politically | +8.940 |
political | +8.915 |
� | +8.789 |
Neg logit contributions | |
coins | -5.096 |
detects | -4.575 |
iton | -4.492 |
img | -4.407 |
assium | -4.306 |
Token | A |
Token ID | 317 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
� | +12.163 |
� | +11.327 |
bipartisan | +11.081 |
political | +10.677 |
| +10.466 |
Neg logit contributions | |
coins | -10.357 |
detects | -9.889 |
mitter | -9.744 |
iton | -9.649 |
assium | -9.494 |
Token | is |
Token ID | 318 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
bipartisan | +9.391 |
� | +9.350 |
political | +9.175 |
politically | +9.060 |
� | +8.918 |
Neg logit contributions | |
coins | -3.845 |
img | -3.122 |
wine | -3.056 |
iton | -3.056 |
detects | -3.042 |
Token | seldom |
Token ID | 25129 |
Feature activation | +5.52e+00 |
Pos logit contributions | |
� | +14.518 |
bipartisan | +14.189 |
politically | +14.174 |
political | +14.085 |
� | +13.458 |
Neg logit contributions | |
coins | -13.123 |
detects | -12.208 |
wine | -11.729 |
img | -11.721 |
iton | -11.610 |
Token | the |
Token ID | 262 |
Feature activation | +7.17e+00 |
Pos logit contributions | |
� | +7.611 |
bipartisan | +7.527 |
politically | +7.245 |
political | +7.224 |
� | +7.081 |
Neg logit contributions | |
coins | -4.135 |
detects | -3.729 |
iton | -3.629 |
img | -3.624 |
wine | -3.583 |
Token | case |
Token ID | 1339 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
bipartisan | +6.389 |
� | +6.369 |
political | +6.156 |
politically | +6.043 |
� | +5.707 |
Neg logit contributions | |
coins | -8.683 |
detects | -8.168 |
img | -8.079 |
wine | -7.956 |
contains | -7.854 |
Token | . |
Token ID | 13 |
Feature activation | -3.76e+00 |
Pos logit contributions | |
� | +20.712 |
� | +18.975 |
politically | +18.425 |
bipartisan | +18.361 |
political | +18.119 |
Neg logit contributions | |
coins | -12.308 |
detects | -11.256 |
wine | -10.612 |
img | -10.532 |
iton | -10.430 |
Token |
|
Token ID | 198 |
Feature activation | +2.59e+01 |
Pos logit contributions | |
coins | +3.750 |
detects | +3.546 |
iton | +3.424 |
contains | +3.389 |
rox | +3.310 |
Neg logit contributions | |
� | -4.515 |
bipartisan | -4.469 |
political | -4.233 |
politically | -4.189 |
� | -4.143 |
Token |
|
Token ID | 198 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
� | +17.967 |
� | +16.023 |
| +14.653 |
bipartisan | +13.711 |
political | +13.108 |
Neg logit contributions | |
detects | -24.584 |
coins | -23.284 |
eatures | -23.231 |
assium | -22.554 |
yip | -22.249 |
Token | To |
Token ID | 2514 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
coins | +1.277 |
detects | +1.256 |
contains | +1.197 |
iton | +1.183 |
rox | +1.127 |
Neg logit contributions | |
� | -1.611 |
bipartisan | -1.537 |
political | -1.454 |
� | -1.438 |
politically | -1.433 |
Token | understand |
Token ID | 1833 |
Feature activation | -5.21e+00 |
Pos logit contributions | |
coins | +2.097 |
detects | +1.940 |
contains | +1.877 |
img | +1.874 |
iton | +1.872 |
Neg logit contributions | |
bipartisan | -2.210 |
� | -2.208 |
political | -2.107 |
politically | -2.096 |
� | -2.018 |
Token | why |
Token ID | 1521 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
coins | +4.561 |
detects | +4.301 |
contains | +4.137 |
iton | +4.077 |
img | +4.016 |
Neg logit contributions | |
bipartisan | -6.727 |
� | -6.674 |
political | -6.382 |
politically | -6.350 |
� | -6.159 |
Token | we |
Token ID | 356 |
Feature activation | +4.23e+00 |
Pos logit contributions | |
coins | +11.871 |
detects | +11.519 |
contains | +11.203 |
iton | +10.987 |
img | +10.814 |
Neg logit contributions | |
bipartisan | -9.651 |
� | -9.497 |
politically | -8.877 |
political | -8.867 |
� | -8.456 |
Token | in |
Token ID | 287 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
coins | +2.684 |
detects | +2.489 |
contains | +2.358 |
iton | +2.306 |
img | +2.250 |
Neg logit contributions | |
bipartisan | -6.302 |
� | -6.253 |
political | -6.013 |
politically | -5.998 |
� | -5.838 |
Token | a |
Token ID | 257 |
Feature activation | +8.57e+00 |
Pos logit contributions | |
coins | +0.162 |
detects | +0.157 |
contains | +0.150 |
iton | +0.150 |
img | +0.149 |
Neg logit contributions | |
bipartisan | -0.134 |
� | -0.133 |
political | -0.128 |
politically | -0.125 |
� | -0.120 |
Token | ball |
Token ID | 2613 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
bipartisan | +8.235 |
political | +7.941 |
� | +7.886 |
politically | +7.661 |
� | +7.138 |
Neg logit contributions | |
coins | -10.006 |
detects | -9.352 |
img | -8.977 |
iton | -8.896 |
contains | -8.758 |
Token | room |
Token ID | 3823 |
Feature activation | -7.30e+00 |
Pos logit contributions | |
coins | +13.008 |
detects | +12.572 |
contains | +12.418 |
iton | +12.167 |
img | +11.975 |
Neg logit contributions | |
bipartisan | -11.071 |
� | -10.805 |
politically | -10.225 |
political | -10.188 |
� | -9.637 |
Token | is |
Token ID | 318 |
Feature activation | +7.19e+00 |
Pos logit contributions | |
coins | +8.131 |
detects | +7.813 |
contains | +7.608 |
iton | +7.479 |
img | +7.381 |
Neg logit contributions | |
bipartisan | -7.545 |
� | -7.427 |
political | -7.023 |
politically | -7.002 |
� | -6.702 |
Token | a |
Token ID | 257 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
� | +8.860 |
bipartisan | +8.784 |
political | +8.545 |
politically | +8.509 |
� | +8.316 |
Neg logit contributions | |
coins | -6.338 |
detects | -5.860 |
iton | -5.629 |
img | -5.571 |
rox | -5.508 |
Token | piece |
Token ID | 3704 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
political | +22.137 |
bipartisan | +22.119 |
� | +22.100 |
politically | +21.409 |
� | +20.834 |
Neg logit contributions | |
coins | -17.368 |
detects | -14.932 |
rox | -14.859 |
mitter | -14.816 |
iton | -14.774 |
Token | of |
Token ID | 286 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
bipartisan | +2.605 |
� | +2.517 |
political | +2.455 |
politically | +2.454 |
geopolitical | +2.390 |
Neg logit contributions | |
coins | -0.797 |
detects | -0.743 |
contains | -0.716 |
iton | -0.677 |
img | -0.638 |
Token | imper |
Token ID | 11071 |
Feature activation | +7.07e+00 |
Pos logit contributions | |
political | +15.585 |
� | +15.544 |
bipartisan | +15.458 |
politically | +15.003 |
� | +14.521 |
Neg logit contributions | |
coins | -12.788 |
detects | -11.601 |
iton | -11.175 |
mitter | -11.087 |
img | -11.007 |
Token | t |
Token ID | 83 |
Feature activation | +5.59e+00 |
Pos logit contributions | |
� | +9.463 |
bipartisan | +9.150 |
political | +8.765 |
� | +8.756 |
politically | +8.629 |
Neg logit contributions | |
coins | -5.165 |
detects | -4.981 |
contains | -4.565 |
iton | -4.220 |
wine | -4.158 |
Token | inence |
Token ID | 18386 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
� | +5.859 |
bipartisan | +5.789 |
political | +5.501 |
� | +5.334 |
politically | +5.307 |
Neg logit contributions | |
coins | -5.823 |
detects | -5.468 |
contains | -5.240 |
iton | -5.165 |
mitter | -5.004 |
Token | , |
Token ID | 11 |
Feature activation | -6.22e+00 |
Pos logit contributions | |
coins | +2.870 |
detects | +2.676 |
contains | +2.537 |
iton | +2.515 |
img | +2.452 |
Neg logit contributions | |
bipartisan | -5.271 |
� | -5.254 |
political | -5.036 |
politically | -5.029 |
� | -4.879 |
Token | who |
Token ID | 508 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
coins | +7.128 |
detects | +6.798 |
contains | +6.583 |
iton | +6.573 |
img | +6.449 |
Neg logit contributions | |
bipartisan | -6.426 |
� | -6.364 |
political | -6.030 |
politically | -5.993 |
� | -5.731 |
Token | flee |
Token ID | 11562 |
Feature activation | -9.69e+00 |
Pos logit contributions | |
coins | +11.752 |
detects | +11.328 |
contains | +11.032 |
iton | +10.847 |
img | +10.708 |
Neg logit contributions | |
bipartisan | -10.113 |
� | -9.969 |
political | -9.361 |
politically | -9.321 |
� | -8.947 |
Token | into |
Token ID | 656 |
Feature activation | -6.64e+00 |
Pos logit contributions | |
coins | +9.719 |
detects | +9.298 |
contains | +9.032 |
iton | +8.863 |
img | +8.738 |
Neg logit contributions | |
bipartisan | -11.006 |
� | -10.856 |
political | -10.282 |
politically | -10.250 |
� | -9.887 |
Token | the |
Token ID | 262 |
Feature activation | +6.31e+00 |
Pos logit contributions | |
coins | +5.856 |
detects | +5.551 |
contains | +5.355 |
iton | +5.255 |
img | +5.172 |
Neg logit contributions | |
bipartisan | -8.421 |
� | -8.335 |
political | -7.940 |
politically | -7.926 |
� | -7.670 |
Token | " |
Token ID | 366 |
Feature activation | +3.57e+00 |
Pos logit contributions | |
� | +6.503 |
bipartisan | +6.478 |
political | +6.423 |
politically | +6.180 |
� | +5.967 |
Neg logit contributions | |
coins | -6.572 |
detects | -6.308 |
iton | -6.148 |
contains | -5.937 |
img | -5.906 |
Token | forest |
Token ID | 29623 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
� | +4.651 |
bipartisan | +4.537 |
political | +4.396 |
politically | +4.292 |
� | +4.226 |
Neg logit contributions | |
detects | -2.842 |
coins | -2.780 |
contains | -2.664 |
iton | -2.613 |
img | -2.457 |
Token | " |
Token ID | 1 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
coins | +10.472 |
detects | +10.094 |
contains | +9.960 |
iton | +9.531 |
wine | +9.368 |
Neg logit contributions | |
bipartisan | -12.647 |
� | -12.315 |
politically | -11.737 |
political | -11.715 |
� | -11.300 |
Token | of |
Token ID | 286 |
Feature activation | -8.69e+00 |
Pos logit contributions | |
coins | +10.722 |
detects | +10.302 |
contains | +10.066 |
iton | +9.779 |
img | +9.662 |
Neg logit contributions | |
bipartisan | -12.103 |
� | -11.873 |
political | -11.262 |
politically | -11.241 |
� | -10.807 |
Token | Hu |
Token ID | 11256 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
coins | +8.381 |
detects | +7.986 |
contains | +7.755 |
iton | +7.590 |
img | +7.499 |
Neg logit contributions | |
bipartisan | -10.176 |
� | -10.047 |
political | -9.523 |
politically | -9.520 |
� | -9.164 |
Token | orns |
Token ID | 19942 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
coins | +24.821 |
contains | +23.088 |
rox | +22.948 |
iton | +22.876 |
img | +22.781 |
Neg logit contributions | |
bipartisan | -20.954 |
� | -20.914 |
� | -19.320 |
political | -19.184 |
politically | -19.115 |
Token | sensor |
Token ID | 12694 |
Feature activation | -1.73e+01 |
Pos logit contributions | |
coins | +10.135 |
detects | +9.719 |
contains | +9.426 |
iton | +9.287 |
img | +9.161 |
Neg logit contributions | |
bipartisan | -10.370 |
� | -10.250 |
political | -9.691 |
politically | -9.665 |
� | -9.298 |
Token | into |
Token ID | 656 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
coins | +20.018 |
detects | +19.746 |
contains | +19.427 |
iton | +19.023 |
img | +18.601 |
Neg logit contributions | |
bipartisan | -14.265 |
� | -13.766 |
political | -12.855 |
politically | -12.839 |
� | -12.812 |
Token | an |
Token ID | 281 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
coins | +11.919 |
detects | +11.383 |
contains | +11.115 |
iton | +11.067 |
img | +10.755 |
Neg logit contributions | |
bipartisan | -13.316 |
� | -13.073 |
political | -12.345 |
politically | -12.334 |
� | -11.900 |
Token | overall |
Token ID | 4045 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
coins | +1.529 |
detects | +1.419 |
contains | +1.356 |
iton | +1.351 |
wine | +1.338 |
Neg logit contributions | |
� | -1.409 |
bipartisan | -1.406 |
politically | -1.343 |
political | -1.340 |
� | -1.289 |
Token | smaller |
Token ID | 4833 |
Feature activation | -7.23e+00 |
Pos logit contributions | |
bipartisan | +2.035 |
� | +2.020 |
political | +1.958 |
politically | +1.923 |
� | +1.854 |
Neg logit contributions | |
coins | -1.979 |
detects | -1.811 |
contains | -1.714 |
iton | -1.710 |
wine | -1.708 |
Token | package |
Token ID | 5301 |
Feature activation | -3.63e+00 |
Pos logit contributions | |
coins | +7.656 |
detects | +7.248 |
contains | +7.007 |
iton | +6.940 |
img | +6.834 |
Neg logit contributions | |
bipartisan | -8.135 |
� | -8.057 |
political | -7.671 |
politically | -7.620 |
� | -7.347 |
Token | than |
Token ID | 621 |
Feature activation | -1.82e+01 |
Pos logit contributions | |
coins | +2.881 |
detects | +2.688 |
contains | +2.554 |
iton | +2.524 |
img | +2.483 |
Neg logit contributions | |
� | -5.033 |
bipartisan | -5.006 |
political | -4.786 |
politically | -4.778 |
� | -4.662 |
Token | you |
Token ID | 345 |
Feature activation | -2.54e+00 |
Pos logit contributions | |
coins | +22.315 |
detects | +22.020 |
contains | +21.677 |
iton | +21.118 |
img | +20.734 |
Neg logit contributions | |
bipartisan | -13.839 |
� | -13.232 |
politically | -12.317 |
political | -12.275 |
� | -12.003 |
Token | � |
Token ID | 447 |
Feature activation | +5.38e-01 |
Pos logit contributions | |
coins | +1.965 |
detects | +1.771 |
iton | +1.703 |
contains | +1.686 |
img | +1.649 |
Neg logit contributions | |
� | -3.673 |
bipartisan | -3.600 |
politically | -3.458 |
political | -3.451 |
� | -3.395 |
Token | � |
Token ID | 247 |
Feature activation | -3.60e-01 |
Pos logit contributions | |
� | +0.588 |
bipartisan | +0.575 |
political | +0.540 |
politically | +0.534 |
� | +0.524 |
Neg logit contributions | |
coins | -0.589 |
detects | -0.564 |
contains | -0.540 |
iton | -0.538 |
rox | -0.525 |
Token | d |
Token ID | 67 |
Feature activation | +5.32e+00 |
Pos logit contributions | |
coins | +0.260 |
detects | +0.243 |
contains | +0.229 |
iton | +0.228 |
rox | +0.223 |
Neg logit contributions | |
� | -0.527 |
bipartisan | -0.512 |
political | -0.491 |
politically | -0.490 |
� | -0.486 |
Token | through |
Token ID | 832 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
coins | +5.469 |
detects | +5.196 |
contains | +5.003 |
iton | +4.947 |
img | +4.876 |
Neg logit contributions | |
bipartisan | -6.699 |
� | -6.671 |
political | -6.322 |
politically | -6.302 |
� | -6.106 |
Token | , |
Token ID | 11 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
� | +5.807 |
bipartisan | +5.614 |
political | +5.449 |
politically | +5.412 |
� | +5.367 |
Neg logit contributions | |
coins | -3.163 |
detects | -2.952 |
iton | -2.823 |
img | -2.754 |
contains | -2.718 |
Token | � |
Token ID | 447 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
� | +1.977 |
bipartisan | +1.917 |
political | +1.841 |
politically | +1.829 |
� | +1.824 |
Neg logit contributions | |
coins | -1.218 |
detects | -1.115 |
iton | -1.093 |
img | -1.055 |
rox | -1.053 |
Token | � |
Token ID | 251 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
� | +1.604 |
bipartisan | +1.591 |
political | +1.499 |
politically | +1.484 |
� | +1.462 |
Neg logit contributions | |
coins | -1.438 |
detects | -1.363 |
iton | -1.318 |
contains | -1.310 |
img | -1.282 |
Token | says |
Token ID | 1139 |
Feature activation | -6.51e-01 |
Pos logit contributions | |
coins | +1.213 |
detects | +1.141 |
contains | +1.083 |
iton | +1.079 |
img | +1.060 |
Neg logit contributions | |
� | -1.988 |
bipartisan | -1.957 |
political | -1.882 |
politically | -1.868 |
� | -1.841 |
Token | Thomas |
Token ID | 5658 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
coins | +0.665 |
detects | +0.635 |
contains | +0.612 |
iton | +0.605 |
img | +0.596 |
Neg logit contributions | |
bipartisan | -0.747 |
� | -0.741 |
political | -0.707 |
politically | -0.701 |
� | -0.679 |
Token | , |
Token ID | 11 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
� | +22.535 |
bipartisan | +21.006 |
� | +20.820 |
political | +20.553 |
politically | +20.493 |
Neg logit contributions | |
coins | -12.902 |
detects | -12.111 |
iton | -11.529 |
contains | -11.367 |
img | -11.209 |
Token | who |
Token ID | 508 |
Feature activation | +8.29e+00 |
Pos logit contributions | |
� | +23.119 |
� | +21.393 |
bipartisan | +20.887 |
political | +20.629 |
politically | +20.305 |
Neg logit contributions | |
coins | -12.765 |
iton | -11.610 |
detects | -11.327 |
rox | -10.850 |
img | -10.645 |
Token | earned |
Token ID | 7366 |
Feature activation | +8.08e+00 |
Pos logit contributions | |
� | +12.631 |
bipartisan | +11.774 |
� | +11.686 |
political | +11.593 |
politically | +11.519 |
Neg logit contributions | |
coins | -4.956 |
iton | -4.280 |
img | -4.158 |
detects | -4.128 |
rox | -4.107 |
Token | her |
Token ID | 607 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
bipartisan | +9.825 |
� | +9.701 |
political | +9.450 |
politically | +9.184 |
� | +9.013 |
Neg logit contributions | |
coins | -7.095 |
detects | -6.824 |
contains | -6.496 |
iton | -6.409 |
rox | -6.351 |
Token | masters |
Token ID | 18159 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
� | +13.795 |
bipartisan | +13.619 |
political | +13.574 |
politically | +12.967 |
� | +12.712 |
Neg logit contributions | |
coins | -11.450 |
detects | -11.010 |
contains | -10.425 |
rox | -10.264 |
img | -10.263 |
Token | opt |
Token ID | 2172 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
� | +13.326 |
politically | +12.904 |
bipartisan | +12.851 |
political | +12.763 |
� | +12.586 |
Neg logit contributions | |
coins | -10.989 |
detects | -9.879 |
assium | -9.869 |
wine | -9.643 |
rox | -9.517 |
Token | out |
Token ID | 503 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
� | +4.602 |
bipartisan | +4.531 |
politically | +4.374 |
political | +4.348 |
� | +4.265 |
Neg logit contributions | |
coins | -2.695 |
detects | -2.536 |
contains | -2.393 |
img | -2.338 |
iton | -2.335 |
Token | of |
Token ID | 286 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
� | +15.172 |
bipartisan | +14.918 |
politically | +14.470 |
political | +14.445 |
� | +14.166 |
Neg logit contributions | |
coins | -7.157 |
detects | -6.594 |
iton | -6.110 |
contains | -6.091 |
img | -6.065 |
Token | the |
Token ID | 262 |
Feature activation | +2.46e+01 |
Pos logit contributions | |
bipartisan | +16.216 |
political | +16.104 |
� | +15.861 |
politically | +15.589 |
geopolitical | +15.160 |
Neg logit contributions | |
coins | -10.594 |
wine | -9.119 |
detects | -9.085 |
rox | -9.017 |
iton | -8.965 |
Token | post |
Token ID | 1281 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
political | +24.996 |
bipartisan | +24.740 |
� | +24.174 |
geopolitical | +23.750 |
politically | +23.650 |
Neg logit contributions | |
coins | -18.217 |
detects | -16.231 |
assium | -15.644 |
wine | -15.537 |
mitter | -15.484 |
Token | - |
Token ID | 12 |
Feature activation | +1.84e+01 |
Pos logit contributions | |
� | +20.542 |
bipartisan | +19.754 |
political | +19.388 |
� | +19.198 |
politically | +18.926 |
Neg logit contributions | |
coins | -11.244 |
detects | -10.510 |
iton | -9.556 |
contains | -9.362 |
wine | -9.361 |
Token | 1945 |
Token ID | 41931 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
� | +19.636 |
bipartisan | +18.677 |
political | +18.476 |
� | +17.734 |
geopolitical | +17.495 |
Neg logit contributions | |
coins | -13.859 |
detects | -13.787 |
iton | -13.012 |
contains | -12.850 |
assium | -11.997 |
Token | world |
Token ID | 995 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
political | +23.040 |
bipartisan | +22.557 |
� | +22.327 |
geopolitical | +21.990 |
� | +21.459 |
Neg logit contributions | |
coins | -16.374 |
detects | -15.007 |
mitter | -14.263 |
assium | -14.229 |
wine | -14.157 |
Token | order |
Token ID | 1502 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
� | +16.319 |
political | +15.687 |
bipartisan | +15.378 |
� | +15.157 |
politically | +14.991 |
Neg logit contributions | |
coins | -9.615 |
detects | -9.198 |
iton | -8.600 |
img | -8.549 |
wine | -8.537 |
Token | . |
Token ID | 13 |
Feature activation | +2.11e+01 |
Pos logit contributions | |
� | +20.692 |
bipartisan | +19.182 |
political | +19.129 |
� | +19.077 |
politically | +18.835 |
Neg logit contributions | |
coins | -11.089 |
detects | -10.426 |
wine | -9.836 |
assium | -9.600 |
img | -9.554 |
Token | � |
Token ID | 447 |
Feature activation | +7.03e+00 |
Pos logit contributions | |
� | +23.645 |
� | +21.685 |
bipartisan | +20.257 |
political | +19.629 |
| +19.181 |
Neg logit contributions | |
coins | -16.536 |
detects | -15.517 |
iton | -15.131 |
mitter | -15.061 |
rox | -14.704 |
Token |
|
Token ID | 198 |
Feature activation | +2.69e+01 |
Pos logit contributions | |
coins | +5.356 |
detects | +5.163 |
contains | +4.947 |
iton | +4.924 |
img | +4.824 |
Neg logit contributions | |
bipartisan | -5.971 |
� | -5.968 |
political | -5.624 |
politically | -5.589 |
� | -5.437 |
Token |
|
Token ID | 198 |
Feature activation | -4.34e+00 |
Pos logit contributions | |
� | +20.541 |
� | +18.002 |
| +16.379 |
bipartisan | +16.124 |
political | +15.949 |
Neg logit contributions | |
detects | -23.464 |
coins | -20.827 |
yip | -20.814 |
perpend | -20.720 |
eatures | -20.684 |
Token | 2011 |
Token ID | 9804 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
coins | +4.430 |
detects | +4.382 |
contains | +4.183 |
iton | +4.134 |
img | +4.000 |
Neg logit contributions | |
� | -4.992 |
bipartisan | -4.907 |
political | -4.627 |
politically | -4.586 |
� | -4.479 |
Token | polymer |
Token ID | 30528 |
Feature activation | -9.64e+00 |
Pos logit contributions | |
coins | +3.346 |
detects | +3.199 |
iton | +3.087 |
contains | +3.052 |
img | +3.028 |
Neg logit contributions | |
bipartisan | -3.775 |
� | -3.760 |
political | -3.584 |
politically | -3.541 |
� | -3.448 |
Token | series |
Token ID | 2168 |
Feature activation | -7.23e+00 |
Pos logit contributions | |
coins | +11.480 |
detects | +10.938 |
contains | +10.714 |
iton | +10.563 |
img | +10.361 |
Neg logit contributions | |
bipartisan | -9.157 |
� | -8.997 |
politically | -8.424 |
political | -8.419 |
� | -8.018 |
Token | [ |
Token ID | 685 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
coins | +7.766 |
detects | +7.435 |
contains | +7.200 |
iton | +7.119 |
img | +7.024 |
Neg logit contributions | |
bipartisan | -7.852 |
� | -7.768 |
political | -7.355 |
politically | -7.322 |
� | -7.051 |
Token | edit |
Token ID | 4370 |
Feature activation | -6.93e-01 |
Pos logit contributions | |
� | +2.715 |
bipartisan | +2.632 |
political | +2.553 |
politically | +2.505 |
� | +2.485 |
Neg logit contributions | |
detects | -1.795 |
coins | -1.791 |
iton | -1.649 |
contains | -1.613 |
ames | -1.594 |
Token | ] |
Token ID | 2361 |
Feature activation | +9.71e+00 |
Pos logit contributions | |
coins | +0.622 |
detects | +0.605 |
iton | +0.556 |
mitter | +0.555 |
wine | +0.554 |
Neg logit contributions | |
� | -0.880 |
bipartisan | -0.868 |
political | -0.845 |
politically | -0.834 |
� | -0.831 |
Token |
|
Token ID | 198 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
� | +7.538 |
� | +6.933 |
bipartisan | +6.594 |
political | +6.340 |
| +6.165 |
Neg logit contributions | |
detects | -12.153 |
coins | -11.648 |
mitter | -11.220 |
iton | -10.953 |
behaves | -10.932 |
Token |
|
Token ID | 198 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
� | +14.435 |
� | +12.966 |
| +11.876 |
bipartisan | +10.937 |
political | +10.642 |
Neg logit contributions | |
detects | -23.643 |
coins | -22.257 |
eatures | -22.031 |
assium | -21.760 |
mitter | -21.720 |
Token | $ |
Token ID | 3 |
Feature activation | -6.79e+00 |
Pos logit contributions | |
coins | +12.757 |
detects | +11.994 |
contains | +11.809 |
iton | +11.656 |
img | +11.605 |
Neg logit contributions | |
bipartisan | -10.426 |
� | -10.048 |
politically | -9.631 |
political | -9.625 |
� | -9.108 |
Token | going |
Token ID | 1016 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
coins | +0.516 |
detects | +0.483 |
iton | +0.474 |
rox | +0.458 |
contains | +0.458 |
Neg logit contributions | |
bipartisan | -0.536 |
� | -0.527 |
political | -0.512 |
politically | -0.509 |
� | -0.486 |
Token | to |
Token ID | 284 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
coins | +0.849 |
detects | +0.778 |
contains | +0.754 |
iton | +0.712 |
img | +0.688 |
Neg logit contributions | |
bipartisan | -2.578 |
� | -2.537 |
political | -2.438 |
politically | -2.435 |
� | -2.370 |
Token | judge |
Token ID | 5052 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
coins | +4.704 |
detects | +4.438 |
iton | +4.296 |
contains | +4.268 |
img | +4.242 |
Neg logit contributions | |
bipartisan | -4.985 |
� | -4.980 |
political | -4.729 |
politically | -4.725 |
� | -4.564 |
Token | you |
Token ID | 345 |
Feature activation | +6.59e-01 |
Pos logit contributions | |
coins | +12.438 |
detects | +11.835 |
contains | +11.624 |
iton | +11.250 |
img | +11.142 |
Neg logit contributions | |
bipartisan | -13.334 |
� | -13.018 |
politically | -12.331 |
political | -12.301 |
� | -11.987 |
Token | for |
Token ID | 329 |
Feature activation | -6.56e+00 |
Pos logit contributions | |
� | +0.953 |
bipartisan | +0.928 |
politically | +0.908 |
political | +0.899 |
� | +0.883 |
Neg logit contributions | |
coins | -0.498 |
detects | -0.467 |
iton | -0.439 |
contains | -0.430 |
img | -0.423 |
Token | playing |
Token ID | 2712 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
coins | +6.850 |
detects | +6.552 |
contains | +6.316 |
iton | +6.254 |
img | +6.155 |
Neg logit contributions | |
bipartisan | -7.389 |
� | -7.321 |
political | -6.967 |
politically | -6.927 |
� | -6.680 |
Token | some |
Token ID | 617 |
Feature activation | +4.09e+00 |
Pos logit contributions | |
coins | +12.120 |
detects | +11.647 |
contains | +11.373 |
iton | +11.169 |
img | +11.075 |
Neg logit contributions | |
bipartisan | -9.893 |
� | -9.751 |
political | -9.096 |
politically | -9.078 |
� | -8.713 |
Token | Pokemon |
Token ID | 14878 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
bipartisan | +4.763 |
� | +4.726 |
political | +4.651 |
politically | +4.596 |
� | +4.393 |
Neg logit contributions | |
coins | -3.906 |
detects | -3.728 |
iton | -3.528 |
contains | -3.497 |
rox | -3.479 |
Token | while |
Token ID | 981 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
coins | +10.255 |
detects | +9.759 |
contains | +9.476 |
iton | +9.309 |
img | +9.179 |
Neg logit contributions | |
bipartisan | -11.335 |
� | -11.151 |
political | -10.557 |
politically | -10.556 |
� | -10.141 |
Token | in |
Token ID | 287 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
coins | +15.474 |
detects | +14.912 |
contains | +14.687 |
iton | +14.274 |
img | +14.164 |
Neg logit contributions | |
bipartisan | -12.749 |
� | -12.458 |
political | -11.653 |
politically | -11.616 |
� | -11.121 |
Token | line |
Token ID | 1627 |
Feature activation | -4.40e+00 |
Pos logit contributions | |
coins | +13.628 |
detects | +13.083 |
contains | +12.877 |
iton | +12.565 |
img | +12.317 |
Neg logit contributions | |
bipartisan | -13.537 |
� | -13.294 |
politically | -12.535 |
political | -12.413 |
� | -12.081 |
Token | our |
Token ID | 674 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
detects | +32.233 |
coins | +31.936 |
contains | +31.794 |
img | +31.285 |
iton | +30.217 |
Neg logit contributions | |
� | -15.607 |
bipartisan | -15.231 |
� | -14.380 |
politically | -13.154 |
political | -12.947 |
Token | original |
Token ID | 2656 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
coins | +15.476 |
detects | +15.068 |
contains | +14.696 |
iton | +14.392 |
img | +14.349 |
Neg logit contributions | |
bipartisan | -10.841 |
� | -10.821 |
politically | -9.907 |
political | -9.901 |
� | -9.530 |
Token | image |
Token ID | 2939 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
coins | +23.111 |
detects | +22.868 |
contains | +22.383 |
img | +21.929 |
iton | +21.735 |
Neg logit contributions | |
� | -12.674 |
bipartisan | -12.341 |
politically | -11.074 |
� | -10.977 |
political | -10.892 |
Token | from |
Token ID | 422 |
Feature activation | -1.71e+01 |
Pos logit contributions | |
coins | +28.459 |
detects | +28.067 |
contains | +27.970 |
img | +27.121 |
iton | +26.454 |
Neg logit contributions | |
bipartisan | -16.084 |
� | -15.396 |
� | -14.190 |
political | -14.023 |
politically | -13.934 |
Token | disk |
Token ID | 11898 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
coins | +19.457 |
detects | +19.049 |
contains | +18.782 |
img | +18.532 |
iton | +18.213 |
Neg logit contributions | |
bipartisan | -14.332 |
� | -14.209 |
politically | -13.038 |
political | -12.939 |
� | -12.592 |
Token | and |
Token ID | 290 |
Feature activation | -3.12e+01 |
Pos logit contributions | |
coins | +22.393 |
detects | +21.786 |
contains | +21.512 |
img | +21.011 |
iton | +20.906 |
Neg logit contributions | |
bipartisan | -14.930 |
� | -14.093 |
political | -13.414 |
politically | -13.272 |
� | -12.839 |
Token | res |
Token ID | 581 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
detects | +34.788 |
contains | +34.423 |
coins | +33.104 |
completes | +32.532 |
allows | +31.838 |
Neg logit contributions | |
� | -16.937 |
bipartisan | -16.765 |
� | -16.515 |
political | -14.455 |
politically | -14.234 |
Token | izes |
Token ID | 4340 |
Feature activation | -3.04e+01 |
Pos logit contributions | |
coins | +14.229 |
detects | +13.306 |
contains | +12.987 |
img | +12.832 |
rox | +12.594 |
Neg logit contributions | |
bipartisan | -21.430 |
� | -20.690 |
political | -20.156 |
politically | -20.045 |
� | -19.816 |
Token | it |
Token ID | 340 |
Feature activation | -2.08e+01 |
Pos logit contributions | |
coins | +29.861 |
detects | +29.629 |
iton | +29.325 |
contains | +29.241 |
img | +29.071 |
Neg logit contributions | |
bipartisan | -18.720 |
� | -18.603 |
� | -17.610 |
politically | -16.692 |
political | -16.597 |
Token | to |
Token ID | 284 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
coins | +22.993 |
detects | +22.890 |
contains | +22.638 |
img | +21.830 |
iton | +21.822 |
Neg logit contributions | |
bipartisan | -16.194 |
� | -15.776 |
� | -15.142 |
political | -14.692 |
politically | -14.269 |
Token | have |
Token ID | 423 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
coins | +21.075 |
detects | +20.936 |
contains | +20.763 |
img | +19.994 |
iton | +19.588 |
Neg logit contributions | |
� | -14.597 |
bipartisan | -14.516 |
politically | -13.253 |
� | -13.205 |
political | -13.153 |
Token | pre |
Token ID | 3866 |
Feature activation | -2.99e+01 |
Pos logit contributions | |
coins | +19.609 |
detects | +17.768 |
img | +17.640 |
iton | +17.581 |
contains | +17.547 |
Neg logit contributions | |
bipartisan | -19.236 |
� | -18.766 |
� | -17.971 |
political | -17.598 |
politically | -17.547 |
Token | y |
Token ID | 88 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
coins | +27.207 |
img | +25.940 |
iton | +25.592 |
wine | +25.561 |
yne | +25.286 |
Neg logit contributions | |
� | -29.250 |
behavi | -24.698 |
bipartisan | -23.994 |
� | -22.882 |
ccording | -22.634 |
Token | - |
Token ID | 12 |
Feature activation | -3.02e+00 |
Pos logit contributions | |
bipartisan | +5.902 |
� | +5.867 |
political | +5.648 |
politically | +5.632 |
� | +5.496 |
Neg logit contributions | |
coins | -2.062 |
detects | -1.892 |
contains | -1.775 |
iton | -1.729 |
img | -1.677 |
Token | cry |
Token ID | 20470 |
Feature activation | -7.39e+00 |
Pos logit contributions | |
coins | +2.317 |
detects | +2.217 |
contains | +2.101 |
iton | +2.055 |
img | +2.009 |
Neg logit contributions | |
� | -4.187 |
bipartisan | -4.167 |
political | -3.973 |
politically | -3.958 |
� | -3.862 |
Token | stal |
Token ID | 7757 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
coins | +7.663 |
detects | +7.296 |
contains | +7.094 |
iton | +6.982 |
img | +6.884 |
Neg logit contributions | |
bipartisan | -8.240 |
� | -8.115 |
political | -7.723 |
politically | -7.695 |
� | -7.392 |
Token | - |
Token ID | 12 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
coins | +10.815 |
contains | +10.062 |
detects | +10.017 |
img | +9.961 |
wine | +9.712 |
Neg logit contributions | |
bipartisan | -14.874 |
� | -14.374 |
political | -13.969 |
politically | -13.802 |
� | -13.769 |
Token | emb |
Token ID | 24419 |
Feature activation | -2.00e+01 |
Pos logit contributions | |
coins | +13.647 |
img | +12.625 |
wine | +12.499 |
detects | +12.227 |
iton | +12.176 |
Neg logit contributions | |
bipartisan | -16.686 |
� | -15.850 |
political | -15.730 |
� | -15.580 |
politically | -15.461 |
Token | ry |
Token ID | 563 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
coins | +15.496 |
detects | +14.334 |
rox | +14.300 |
contains | +13.970 |
iton | +13.866 |
Neg logit contributions | |
bipartisan | -24.234 |
� | -24.173 |
� | -23.192 |
political | -22.838 |
politically | -22.627 |
Token | o |
Token ID | 78 |
Feature activation | +4.62e+00 |
Pos logit contributions | |
coins | +9.654 |
iton | +9.161 |
rox | +8.573 |
img | +8.501 |
contains | +8.472 |
Neg logit contributions | |
bipartisan | -17.429 |
� | -16.750 |
political | -16.473 |
politically | -16.349 |
� | -16.290 |
Token | - |
Token ID | 12 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
bipartisan | +7.611 |
� | +7.602 |
political | +7.307 |
politically | +7.288 |
� | +7.128 |
Neg logit contributions | |
coins | -2.292 |
detects | -2.085 |
contains | -1.926 |
iton | -1.876 |
img | -1.810 |
Token | review |
Token ID | 19023 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
coins | +0.455 |
detects | +0.441 |
contains | +0.414 |
iton | +0.403 |
img | +0.393 |
Neg logit contributions | |
� | -0.870 |
bipartisan | -0.859 |
political | -0.821 |
politically | -0.819 |
� | -0.800 |
Token | Each |
Token ID | 10871 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
coins | +26.744 |
img | +25.440 |
contains | +25.230 |
detects | +25.154 |
iton | +24.771 |
Neg logit contributions | |
bipartisan | -13.236 |
� | -12.644 |
politically | -11.983 |
political | -11.737 |
� | -11.389 |
Token | vehicle |
Token ID | 4038 |
Feature activation | -3.40e+01 |
Pos logit contributions | |
coins | +18.880 |
detects | +18.734 |
contains | +18.608 |
iton | +17.978 |
img | +17.520 |
Neg logit contributions | |
bipartisan | -13.598 |
� | -13.461 |
politically | -12.393 |
political | -12.200 |
� | -12.101 |
Token | in |
Token ID | 287 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
contains | +36.719 |
detects | +35.415 |
completes | +33.570 |
corresponds | +33.318 |
allows | +33.238 |
Neg logit contributions | |
� | -18.068 |
bipartisan | -17.332 |
� | -16.488 |
politically | -14.929 |
political | -14.606 |
Token | Racing |
Token ID | 14954 |
Feature activation | -4.53e+01 |
Pos logit contributions | |
coins | +19.442 |
contains | +19.437 |
detects | +19.129 |
iton | +18.964 |
img | +18.326 |
Neg logit contributions | |
bipartisan | -13.668 |
� | -13.130 |
politically | -12.469 |
� | -12.226 |
political | -11.990 |
Token | Apex |
Token ID | 49440 |
Feature activation | -2.98e+01 |
Pos logit contributions | |
contains | +35.470 |
coins | +33.259 |
detects | +32.983 |
X | +32.402 |
img | +32.276 |
Neg logit contributions | |
� | -30.011 |
ccording | -24.128 |
tremend | -23.388 |
behavi | -22.942 |
bipartisan | -22.702 |
Token | has |
Token ID | 468 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
contains | +33.277 |
detects | +32.432 |
coins | +30.578 |
utilizes | +30.406 |
allows | +30.235 |
Neg logit contributions | |
� | -17.092 |
bipartisan | -16.718 |
� | -16.203 |
politically | -14.871 |
political | -14.659 |
Token | four |
Token ID | 1440 |
Feature activation | -8.67e+00 |
Pos logit contributions | |
coins | +12.852 |
detects | +12.499 |
contains | +12.312 |
iton | +11.970 |
img | +11.733 |
Neg logit contributions | |
bipartisan | -12.244 |
� | -12.199 |
politically | -11.404 |
political | -11.374 |
� | -10.929 |
Token | unique |
Token ID | 3748 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
coins | +9.657 |
detects | +9.267 |
contains | +9.010 |
iton | +8.881 |
img | +8.761 |
Neg logit contributions | |
bipartisan | -8.967 |
� | -8.863 |
political | -8.351 |
politically | -8.325 |
� | -7.993 |
Token | modes |
Token ID | 12881 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
coins | +12.072 |
detects | +11.633 |
contains | +11.370 |
iton | +11.149 |
img | +10.984 |
Neg logit contributions | |
bipartisan | -10.732 |
� | -10.613 |
politically | -9.933 |
political | -9.920 |
� | -9.497 |
Token | - |
Token ID | 532 |
Feature activation | -8.31e+00 |
Pos logit contributions | |
coins | +13.027 |
detects | +12.520 |
contains | +12.269 |
iton | +11.892 |
img | +11.657 |
Neg logit contributions | |
bipartisan | -13.916 |
� | -13.524 |
political | -12.893 |
politically | -12.823 |
geopolitical | -12.301 |
Token | Standard |
Token ID | 8997 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
coins | +9.192 |
detects | +8.839 |
contains | +8.590 |
iton | +8.457 |
img | +8.342 |
Neg logit contributions | |
bipartisan | -8.619 |
� | -8.519 |
political | -8.026 |
politically | -8.008 |
� | -7.687 |
Token | 6 |
Token ID | 21 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
coins | +35.788 |
contains | +33.224 |
rox | +32.664 |
img | +32.471 |
ax | +32.249 |
Neg logit contributions | |
� | -33.752 |
millenn | -26.713 |
tremend | -26.203 |
behavi | -26.145 |
� | -25.626 |
Token | + |
Token ID | 10 |
Feature activation | -2.94e+01 |
Pos logit contributions | |
contains | +27.404 |
detects | +27.066 |
coins | +26.834 |
behaves | +25.441 |
rox | +25.171 |
Neg logit contributions | |
bipartisan | -16.079 |
� | -14.940 |
politically | -14.377 |
political | -14.286 |
� | -14.173 |
Token | x |
Token ID | 87 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
coins | +27.569 |
contains | +27.363 |
x | +26.492 |
detects | +26.491 |
img | +25.807 |
Neg logit contributions | |
bipartisan | -19.003 |
� | -16.687 |
� | -16.603 |
politically | -16.450 |
political | -16.391 |
Token | oscill |
Token ID | 24969 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
detects | +23.741 |
contains | +23.726 |
coins | +23.621 |
behaves | +22.217 |
iton | +22.116 |
Neg logit contributions | |
bipartisan | -14.008 |
� | -13.239 |
� | -12.502 |
politically | -12.458 |
political | -12.403 |
Token | ates |
Token ID | 689 |
Feature activation | -7.26e+00 |
Pos logit contributions | |
coins | +7.130 |
detects | +6.755 |
contains | +6.408 |
iton | +6.156 |
rox | +6.002 |
Neg logit contributions | |
bipartisan | -19.606 |
� | -19.296 |
political | -18.664 |
politically | -18.595 |
� | -18.063 |
Token | between |
Token ID | 1022 |
Feature activation | -1.00e+01 |
Pos logit contributions | |
coins | +7.378 |
detects | +6.951 |
contains | +6.709 |
iton | +6.651 |
img | +6.582 |
Neg logit contributions | |
bipartisan | -8.489 |
� | -8.408 |
political | -8.002 |
politically | -7.989 |
� | -7.687 |
Token | two |
Token ID | 734 |
Feature activation | -5.52e+00 |
Pos logit contributions | |
coins | +11.467 |
detects | +11.060 |
contains | +10.771 |
iton | +10.606 |
img | +10.441 |
Neg logit contributions | |
bipartisan | -9.893 |
� | -9.768 |
political | -9.174 |
politically | -9.148 |
� | -8.754 |
Token | quantum |
Token ID | 14821 |
Feature activation | -7.22e+00 |
Pos logit contributions | |
coins | +6.529 |
detects | +6.225 |
contains | +6.048 |
iton | +6.010 |
img | +5.964 |
Neg logit contributions | |
bipartisan | -5.508 |
� | -5.438 |
political | -5.149 |
politically | -5.128 |
� | -4.907 |
Token | states |
Token ID | 2585 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
coins | +8.580 |
detects | +8.226 |
contains | +7.997 |
iton | +7.907 |
img | +7.836 |
Neg logit contributions | |
bipartisan | -7.043 |
� | -6.959 |
political | -6.559 |
politically | -6.522 |
� | -6.249 |
Token | during |
Token ID | 1141 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
coins | +14.068 |
detects | +13.657 |
contains | +13.316 |
iton | +13.007 |
img | +12.790 |
Neg logit contributions | |
bipartisan | -12.561 |
� | -12.270 |
political | -11.591 |
politically | -11.535 |
� | -11.003 |
Token | the |
Token ID | 262 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
coins | +12.360 |
detects | +12.030 |
contains | +11.745 |
iton | +11.541 |
rox | +11.262 |
Neg logit contributions | |
bipartisan | -10.807 |
� | -10.684 |
politically | -9.960 |
political | -9.900 |
� | -9.555 |
Token | clones |
Token ID | 32498 |
Feature activation | -2.95e+01 |
Pos logit contributions | |
coins | +29.775 |
contains | +29.080 |
detects | +28.455 |
completes | +26.886 |
behaves | +26.465 |
Neg logit contributions | |
bipartisan | -18.532 |
� | -18.524 |
� | -17.942 |
politically | -16.468 |
political | -16.085 |
Token | must |
Token ID | 1276 |
Feature activation | -3.85e+01 |
Pos logit contributions | |
coins | +29.971 |
contains | +29.961 |
detects | +28.528 |
you | +27.447 |
img | +26.698 |
Neg logit contributions | |
� | -23.129 |
bipartisan | -19.856 |
ccording | -19.407 |
behavi | -18.043 |
millenn | -17.737 |
Token | be |
Token ID | 307 |
Feature activation | -2.44e+01 |
Pos logit contributions | |
contains | +33.940 |
coins | +33.139 |
detects | +32.172 |
you | +31.587 |
img | +30.804 |
Neg logit contributions | |
� | -30.107 |
ccording | -25.642 |
behavi | -24.250 |
millenn | -23.459 |
� | -23.036 |
Token | have |
Token ID | 423 |
Feature activation | -4.58e+01 |
Pos logit contributions | |
contains | +26.072 |
coins | +26.051 |
detects | +25.541 |
iton | +23.650 |
img | +23.354 |
Neg logit contributions | |
� | -19.288 |
bipartisan | -17.802 |
� | -17.534 |
political | -15.687 |
rhetorical | -15.652 |
Token | the |
Token ID | 262 |
Feature activation | -2.58e+01 |
Pos logit contributions | |
contains | +35.857 |
coins | +34.757 |
you | +34.504 |
iton | +33.532 |
detects | +33.377 |
Neg logit contributions | |
� | -32.497 |
ccording | -27.721 |
tremend | -26.479 |
millenn | -26.005 |
� | -25.179 |
Token | ability |
Token ID | 2694 |
Feature activation | -4.18e+01 |
Pos logit contributions | |
coins | +26.095 |
contains | +25.915 |
detects | +25.413 |
iton | +24.951 |
allows | +24.239 |
Neg logit contributions | |
� | -20.698 |
bipartisan | -18.539 |
� | -17.461 |
ccording | -17.061 |
politically | -16.682 |
Token | to |
Token ID | 284 |
Feature activation | -3.80e+01 |
Pos logit contributions | |
contains | +34.910 |
coins | +34.739 |
you | +33.577 |
detects | +32.600 |
iton | +32.053 |
Neg logit contributions | |
� | -32.999 |
ccording | -28.382 |
millenn | -27.014 |
tremend | -26.131 |
� | -26.059 |
Token | be |
Token ID | 307 |
Feature activation | -3.61e+01 |
Pos logit contributions | |
contains | +34.319 |
coins | +33.116 |
detects | +32.830 |
you | +31.840 |
iton | +31.730 |
Neg logit contributions | |
� | -29.517 |
ccording | -25.063 |
behavi | -22.748 |
� | -22.548 |
millenn | -22.461 |
Token | sent |
Token ID | 1908 |
Feature activation | -2.89e+01 |
Pos logit contributions | |
contains | +30.664 |
coins | +30.001 |
detects | +29.591 |
you | +27.973 |
iton | +27.358 |
Neg logit contributions | |
� | -28.898 |
� | -23.368 |
behavi | -23.162 |
ccording | -23.054 |
bipartisan | -22.834 |
Token | across |
Token ID | 1973 |
Feature activation | -3.08e+01 |
Pos logit contributions | |
coins | +28.658 |
contains | +27.319 |
detects | +26.785 |
iton | +25.535 |
rox | +25.006 |
Neg logit contributions | |
� | -23.665 |
bipartisan | -20.530 |
� | -19.355 |
ccording | -18.708 |
political | -18.243 |
Token | threads |
Token ID | 14390 |
Feature activation | -2.85e+01 |
Pos logit contributions | |
coins | +31.160 |
contains | +30.296 |
detects | +29.482 |
iton | +27.599 |
completes | +27.596 |
Neg logit contributions | |
� | -22.917 |
bipartisan | -19.128 |
ccording | -18.348 |
� | -17.649 |
cynical | -17.178 |
Token | you |
Token ID | 345 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
coins | +15.650 |
detects | +15.141 |
contains | +14.904 |
iton | +14.616 |
img | +14.291 |
Neg logit contributions | |
bipartisan | -12.652 |
� | -12.518 |
political | -11.508 |
politically | -11.477 |
� | -11.099 |
Token | were |
Token ID | 547 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
coins | +8.605 |
detects | +8.185 |
contains | +7.913 |
iton | +7.724 |
img | +7.585 |
Neg logit contributions | |
bipartisan | -12.859 |
� | -12.721 |
political | -12.132 |
politically | -12.078 |
� | -11.699 |
Token | -- |
Token ID | 1377 |
Feature activation | -9.53e+00 |
Pos logit contributions | |
coins | +1.519 |
detects | +1.423 |
iton | +1.361 |
contains | +1.344 |
rox | +1.341 |
Neg logit contributions | |
bipartisan | -1.600 |
� | -1.563 |
political | -1.524 |
politically | -1.520 |
� | -1.442 |
Token |
|
Token ID | 198 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
coins | +10.321 |
detects | +9.912 |
contains | +9.669 |
iton | +9.477 |
img | +9.358 |
Neg logit contributions | |
bipartisan | -9.943 |
� | -9.813 |
political | -9.219 |
politically | -9.177 |
� | -8.843 |
Token |
|
Token ID | 198 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
� | +10.709 |
� | +9.510 |
| +8.389 |
bipartisan | +8.084 |
political | +7.593 |
Neg logit contributions | |
detects | -20.050 |
coins | -19.470 |
assium | -18.519 |
mitter | -18.493 |
iton | -18.377 |
Token | RF |
Token ID | 32754 |
Feature activation | -3.86e+01 |
Pos logit contributions | |
coins | +20.931 |
img | +19.699 |
contains | +19.516 |
rox | +19.184 |
detects | +19.144 |
Neg logit contributions | |
bipartisan | -17.466 |
� | -17.056 |
politically | -15.997 |
geopolitical | -15.666 |
political | -15.574 |
Token | : |
Token ID | 25 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
contains | +32.537 |
coins | +32.320 |
img | +31.429 |
you | +30.167 |
iton | +29.833 |
Neg logit contributions | |
� | -36.544 |
tremend | -29.311 |
ccording | -28.643 |
� | -28.590 |
behavi | -28.459 |
Token | You |
Token ID | 921 |
Feature activation | -5.62e+00 |
Pos logit contributions | |
coins | +13.661 |
detects | +13.070 |
contains | +12.802 |
iton | +12.509 |
img | +12.430 |
Neg logit contributions | |
bipartisan | -13.484 |
� | -13.227 |
political | -12.538 |
politically | -12.521 |
� | -11.919 |
Token | know |
Token ID | 760 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
coins | +5.273 |
detects | +4.958 |
contains | +4.766 |
iton | +4.748 |
img | +4.650 |
Neg logit contributions | |
bipartisan | -7.002 |
� | -6.956 |
political | -6.645 |
politically | -6.632 |
� | -6.412 |
Token | , |
Token ID | 11 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
coins | +14.874 |
detects | +14.356 |
contains | +14.174 |
iton | +13.771 |
img | +13.520 |
Neg logit contributions | |
bipartisan | -14.064 |
� | -13.959 |
political | -12.812 |
politically | -12.762 |
� | -12.618 |
Token | it |
Token ID | 340 |
Feature activation | -5.24e+00 |
Pos logit contributions | |
coins | +23.890 |
detects | +23.426 |
contains | +23.201 |
iton | +22.585 |
img | +22.280 |
Neg logit contributions | |
bipartisan | -11.505 |
� | -11.411 |
� | -10.312 |
political | -9.927 |
politically | -9.815 |
Token | With |
Token ID | 2080 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
coins | +20.701 |
detects | +20.029 |
contains | +19.889 |
img | +19.489 |
iton | +19.328 |
Neg logit contributions | |
bipartisan | -10.117 |
� | -9.298 |
politically | -9.067 |
political | -9.004 |
� | -8.495 |
Token | the |
Token ID | 262 |
Feature activation | -7.18e+00 |
Pos logit contributions | |
coins | +16.850 |
detects | +16.258 |
contains | +15.842 |
iton | +15.642 |
img | +15.494 |
Neg logit contributions | |
bipartisan | -13.905 |
� | -13.551 |
politically | -12.714 |
political | -12.622 |
� | -12.169 |
Token | 16 |
Token ID | 1467 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
coins | +7.848 |
detects | +7.499 |
contains | +7.270 |
iton | +7.186 |
img | +7.076 |
Neg logit contributions | |
bipartisan | -7.717 |
� | -7.637 |
political | -7.230 |
politically | -7.196 |
� | -6.926 |
Token | - |
Token ID | 12 |
Feature activation | -2.55e+01 |
Pos logit contributions | |
detects | +19.665 |
coins | +19.620 |
contains | +19.389 |
img | +19.027 |
iton | +18.269 |
Neg logit contributions | |
bipartisan | -15.789 |
geopolitical | -13.950 |
� | -13.833 |
politically | -13.791 |
� | -13.699 |
Token | 35 |
Token ID | 2327 |
Feature activation | -2.79e+01 |
Pos logit contributions | |
coins | +27.039 |
img | +26.442 |
contains | +25.608 |
detects | +25.533 |
wine | +24.929 |
Neg logit contributions | |
� | -20.864 |
bipartisan | -19.390 |
� | -17.951 |
politically | -17.802 |
political | -17.719 |
Token | f |
Token ID | 277 |
Feature activation | -4.15e+01 |
Pos logit contributions | |
detects | +28.248 |
contains | +28.231 |
coins | +27.993 |
img | +27.403 |
you | +26.922 |
Neg logit contributions | |
bipartisan | -14.689 |
� | -12.947 |
� | -12.661 |
politically | -12.180 |
troubling | -12.005 |
Token | / |
Token ID | 14 |
Feature activation | -2.21e+01 |
Pos logit contributions | |
img | +39.539 |
coins | +39.385 |
/ | +38.651 |
contains | +37.778 |
iton | +36.988 |
Neg logit contributions | |
� | -27.549 |
behavi | -21.605 |
tremend | -20.845 |
ccording | -20.604 |
millenn | -20.423 |
Token | 4 |
Token ID | 19 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
coins | +18.580 |
img | +18.480 |
detects | +17.560 |
iton | +17.483 |
contains | +17.417 |
Neg logit contributions | |
bipartisan | -18.084 |
politically | -17.000 |
� | -16.602 |
political | -16.285 |
troubling | -16.224 |
Token | even |
Token ID | 772 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
detects | +28.531 |
contains | +28.240 |
coins | +28.120 |
img | +27.367 |
iton | +27.225 |
Neg logit contributions | |
bipartisan | -14.215 |
� | -12.820 |
� | -12.234 |
politically | -11.968 |
political | -11.642 |
Token | 40 |
Token ID | 2319 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
coins | +15.339 |
detects | +14.940 |
contains | +14.623 |
iton | +14.377 |
img | +14.221 |
Neg logit contributions | |
bipartisan | -10.818 |
� | -10.418 |
politically | -9.812 |
political | -9.796 |
� | -9.221 |
Token | l |
Token ID | 300 |
Feature activation | -1.70e+01 |
Pos logit contributions | |
coins | +16.267 |
detects | +15.813 |
contains | +15.542 |
img | +15.163 |
iton | +15.051 |
Neg logit contributions | |
bipartisan | -10.090 |
� | -9.482 |
politically | -9.127 |
political | -9.052 |
geopolitical | -8.454 |
Token | 1 |
Token ID | 16 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
coins | +19.599 |
contains | +18.438 |
detects | +18.253 |
img | +17.873 |
iton | +17.862 |
Neg logit contributions | |
bipartisan | -21.235 |
� | -20.705 |
� | -20.123 |
political | -19.760 |
politically | -19.734 |
Token | // |
Token ID | 3373 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
coins | +21.872 |
contains | +21.458 |
detects | +21.289 |
img | +20.851 |
iton | +20.558 |
Neg logit contributions | |
bipartisan | -18.021 |
� | -17.929 |
� | -17.519 |
politically | -16.552 |
political | -16.429 |
Token | metres |
Token ID | 18985 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
coins | +21.360 |
detects | +20.694 |
contains | +20.620 |
img | +19.261 |
iton | +19.147 |
Neg logit contributions | |
bipartisan | -16.794 |
� | -15.445 |
� | -15.421 |
politically | -15.194 |
political | -15.088 |
Token | _ |
Token ID | 4808 |
Feature activation | -4.71e+01 |
Pos logit contributions | |
coins | +12.679 |
contains | +12.488 |
detects | +12.374 |
iton | +11.735 |
img | +11.718 |
Neg logit contributions | |
bipartisan | -12.771 |
� | -12.397 |
politically | -11.957 |
political | -11.765 |
geopolitical | -11.369 |
Token | P |
Token ID | 47 |
Feature activation | -4.76e+01 |
Pos logit contributions | |
X | +33.190 |
coins | +32.691 |
contains | +31.333 |
img | +30.802 |
iton | +30.716 |
Neg logit contributions | |
� | -38.711 |
tremend | -33.559 |
millenn | -31.507 |
ccording | -31.112 |
behavi | -30.332 |
Token | ulse |
Token ID | 9615 |
Feature activation | -4.55e+01 |
Pos logit contributions | |
ulse | +37.971 |
coins | +36.614 |
iton | +36.197 |
rox | +34.829 |
img | +34.625 |
Neg logit contributions | |
� | -36.075 |
� | -28.616 |
behavi | -28.171 |
ccording | -27.043 |
tremend | -26.197 |
Token | Per |
Token ID | 5990 |
Feature activation | -3.68e+01 |
Pos logit contributions | |
coins | +34.194 |
contains | +33.273 |
X | +32.866 |
iton | +32.000 |
img | +31.397 |
Neg logit contributions | |
� | -35.276 |
tremend | -30.321 |
� | -26.830 |
millenn | -26.774 |
behavi | -26.535 |
Token | iod |
Token ID | 2101 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
iton | +35.732 |
coins | +35.420 |
rox | +33.235 |
img | +33.112 |
mitter | +32.546 |
Neg logit contributions | |
� | -27.683 |
behavi | -20.513 |
bipartisan | -20.154 |
tremend | -19.781 |
� | -19.759 |
Token | ( |
Token ID | 357 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
coins | +8.489 |
detects | +7.942 |
contains | +7.678 |
iton | +7.493 |
img | +7.353 |
Neg logit contributions | |
bipartisan | -15.972 |
� | -15.811 |
political | -15.167 |
politically | -15.163 |
� | -14.625 |
Token | " |
Token ID | 366 |
Feature activation | -4.77e+01 |
Pos logit contributions | |
coins | +12.848 |
detects | +12.336 |
contains | +12.116 |
iton | +11.890 |
img | +11.715 |
Neg logit contributions | |
bipartisan | -11.588 |
� | -11.403 |
political | -10.741 |
politically | -10.730 |
� | -10.179 |
Token | P |
Token ID | 47 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
X | +35.355 |
coins | +34.896 |
img | +32.662 |
P | +31.811 |
contains | +31.766 |
Neg logit contributions | |
� | -38.055 |
tremend | -32.660 |
millenn | -31.006 |
behavi | -29.382 |
ccording | -28.839 |
Token | playing |
Token ID | 2712 |
Feature activation | -4.57e+01 |
Pos logit contributions | |
you | +24.995 |
contains | +23.705 |
coins | +23.505 |
img | +23.206 |
behaves | +22.868 |
Neg logit contributions | |
� | -37.232 |
ccording | -30.662 |
� | -29.491 |
tremend | -28.108 |
� | -27.869 |
Token | at |
Token ID | 379 |
Feature activation | -2.54e+01 |
Pos logit contributions | |
contains | +32.873 |
you | +32.529 |
coins | +31.388 |
img | +31.119 |
rox | +30.980 |
Neg logit contributions | |
� | -35.866 |
ccording | -29.804 |
tremend | -27.591 |
� | -27.156 |
millenn | -26.437 |
Token | 640 |
Token ID | 33759 |
Feature activation | -5.83e+01 |
Pos logit contributions | |
coins | +22.189 |
contains | +21.511 |
rox | +21.127 |
img | +20.994 |
detects | +20.698 |
Neg logit contributions | |
� | -23.806 |
bipartisan | -22.814 |
� | -21.726 |
political | -20.930 |
politically | -20.921 |
Token | x |
Token ID | 87 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
x | +41.853 |
img | +39.039 |
X | +38.226 |
coins | +37.878 |
x | +36.224 |
Neg logit contributions | |
� | -41.270 |
ccording | -34.061 |
tremend | -33.583 |
millenn | -33.286 |
� | -32.564 |
Token | 480 |
Token ID | 22148 |
Feature activation | -4.58e+01 |
Pos logit contributions | |
coins | +20.100 |
img | +19.689 |
contains | +18.802 |
detects | +18.444 |
cube | +18.153 |
Neg logit contributions | |
� | -27.870 |
bipartisan | -26.775 |
politically | -25.047 |
political | -24.444 |
� | -24.247 |
Token | with |
Token ID | 351 |
Feature activation | -4.69e+01 |
Pos logit contributions | |
contains | +32.358 |
you | +30.978 |
img | +30.192 |
with | +30.115 |
coins | +29.690 |
Neg logit contributions | |
� | -36.824 |
ccording | -30.362 |
tremend | -30.104 |
� | -28.926 |
behavi | -28.543 |
Token | j |
Token ID | 474 |
Feature activation | -4.63e+01 |
Pos logit contributions | |
you | +31.749 |
contains | +30.826 |
detects | +30.402 |
img | +30.050 |
coins | +29.869 |
Neg logit contributions | |
� | -34.488 |
ccording | -29.750 |
� | -27.961 |
� | -25.747 |
millenn | -25.622 |
Token | agg |
Token ID | 9460 |
Feature activation | -4.52e+01 |
Pos logit contributions | |
img | +36.579 |
coins | +35.951 |
angles | +34.713 |
ames | +34.562 |
ax | +34.393 |
Neg logit contributions | |
� | -32.802 |
behavi | -25.272 |
tremend | -24.295 |
millenn | -24.285 |
� | -24.132 |
Token | ies |
Token ID | 444 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
coins | +32.170 |
ies | +30.866 |
ames | +30.332 |
angles | +29.995 |
img | +29.568 |
Neg logit contributions | |
� | -37.493 |
behavi | -31.392 |
ccording | -30.503 |
tremend | -29.927 |
� | -29.228 |
Token | ) |
Token ID | 8 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
coins | +24.355 |
contains | +22.923 |
detects | +22.234 |
img | +22.188 |
iton | +22.162 |
Neg logit contributions | |
� | -22.407 |
bipartisan | -20.102 |
politically | -18.822 |
behavi | -18.636 |
political | -18.585 |
Token | even |
Token ID | 772 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
coins | +17.252 |
contains | +16.459 |
detects | +16.381 |
img | +15.658 |
iton | +15.214 |
Neg logit contributions | |
� | -23.327 |
bipartisan | -22.246 |
� | -21.534 |
politically | -20.885 |
political | -20.664 |