Token | streaming |
Token ID | 11305 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
these | +15.899 |
those | +15.471 |
many | +15.451 |
things | +15.021 |
various | +14.789 |
Neg logit contributions | |
usk | -14.514 |
uty | -14.307 |
ien | -14.077 |
elaide | -13.690 |
oultry | -13.530 |
Token | music |
Token ID | 2647 |
Feature activation | +5.78e+00 |
Pos logit contributions | |
distinguishing | +0.662 |
totality | +0.658 |
deviations | +0.654 |
inaction | +0.653 |
revolving | +0.637 |
Neg logit contributions | |
u | -0.468 |
amp | -0.467 |
- | -0.459 |
ump | -0.454 |
ire | -0.436 |
Token | . |
Token ID | 13 |
Feature activation | +6.07e+01 |
Pos logit contributions | |
distinguishing | +3.778 |
totality | +3.736 |
hindsight | +3.707 |
inaction | +3.671 |
deviations | +3.653 |
Neg logit contributions | |
u | -1.814 |
amp | -1.797 |
ab | -1.724 |
ich | -1.642 |
ire | -1.628 |
Token | Furthermore |
Token ID | 11399 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
The | +14.433 |
I | +13.415 |
One | +13.110 |
these | +12.979 |
Modern | +12.973 |
Neg logit contributions | |
teasp | -24.848 |
elaide | -23.689 |
RandomRedditor | -23.541 |
� | -23.530 |
| -23.493 |
Token | , |
Token ID | 11 |
Feature activation | +8.36e+01 |
Pos logit contributions | |
u | +2.750 |
ire | +2.591 |
aga | +2.582 |
usk | +2.412 |
ien | +2.363 |
Neg logit contributions | |
totality | -6.936 |
deviations | -6.874 |
disadvantages | -6.575 |
bureaucrats | -6.553 |
symbolism | -6.539 |
Token | the |
Token ID | 262 |
Feature activation | +8.71e+01 |
Pos logit contributions | |
these | +21.489 |
those | +20.382 |
many | +20.170 |
the | +19.837 |
it | +18.893 |
Neg logit contributions | |
RandomRedditor | -20.050 |
� | -20.039 |
| -19.985 |
| -19.966 |
| -19.940 |
Token | only |
Token ID | 691 |
Feature activation | +5.89e+01 |
Pos logit contributions | |
lack | +19.711 |
many | +19.071 |
most | +18.942 |
only | +18.823 |
these | +18.736 |
Neg logit contributions | |
elaide | -17.931 |
oultry | -17.357 |
teasp | -16.778 |
� | -16.413 |
RNA | -16.409 |
Token | speakers |
Token ID | 11636 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
things | +18.339 |
distinguishing | +17.067 |
real | +17.019 |
people | +16.982 |
other | +16.664 |
Neg logit contributions | |
usk | -18.150 |
teasp | -17.927 |
elaide | -17.635 |
RandomRedditor | -17.117 |
� | -17.107 |
Token | I |
Token ID | 314 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
totality | +10.903 |
these | +10.821 |
distinguishing | +10.649 |
things | +10.630 |
those | +10.511 |
Neg logit contributions | |
uty | -11.801 |
usk | -11.750 |
ien | -11.691 |
ump | -11.080 |
aga | -11.009 |
Token | � |
Token ID | 447 |
Feature activation | -4.16e+01 |
Pos logit contributions | |
ike | +4.087 |
ikes | +3.830 |
u | +3.809 |
ve | +3.771 |
ath | +3.761 |
Neg logit contributions | |
behavi | -7.323 |
inaction | -7.148 |
totality | -6.944 |
fundamentals | -6.396 |
similarities | -6.371 |
Token | � |
Token ID | 247 |
Feature activation | -3.56e+01 |
Pos logit contributions | |
� | +9.813 |
� | +9.512 |
� | +8.354 |
� | +8.203 |
� | +8.177 |
Neg logit contributions | |
behavi | -21.190 |
totality | -20.073 |
'[ | -19.777 |
similarities | -19.703 |
acron | -19.601 |
Token |
|
Token ID | 198 |
Feature activation | +6.46e+01 |
Pos logit contributions | |
u | +1.982 |
| +1.812 |
- | +1.667 |
q | +1.047 |
b | +0.606 |
Neg logit contributions | |
tremend | -39.310 |
eleph | -36.955 |
cumbers | -36.348 |
exha | -36.295 |
millenn | -36.005 |
Token | � |
Token ID | 447 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
� | +14.122 |
� | +12.484 |
things | +12.435 |
people | +12.369 |
those | +11.788 |
Neg logit contributions | |
teasp | -22.952 |
RandomRedditor | -22.839 |
| -22.791 |
� | -22.791 |
StreamerBot | -22.779 |
Token | � |
Token ID | 250 |
Feature activation | +5.36e+01 |
Pos logit contributions | |
� | +3.876 |
� | +3.268 |
� | +2.863 |
� | +2.826 |
� | +2.771 |
Neg logit contributions | |
behavi | -14.788 |
similarities | -14.705 |
totality | -14.596 |
distinguishing | -14.529 |
pecul | -14.512 |
Token | T |
Token ID | 51 |
Feature activation | -1.87e+01 |
Pos logit contributions | |
people | +14.134 |
things | +13.894 |
those | +13.692 |
these | +13.345 |
it | +12.799 |
Neg logit contributions | |
teasp | -18.258 |
� | -17.904 |
RandomRedditor | -17.883 |
� | -17.860 |
| -17.857 |
Token | ruly |
Token ID | 34715 |
Feature activation | +4.48e+01 |
Pos logit contributions | |
rou | +6.553 |
une | +5.956 |
ak | +5.921 |
ong | +5.919 |
ien | +5.878 |
Neg logit contributions | |
totality | -8.841 |
disadvantages | -8.740 |
behavi | -8.702 |
revolving | -8.650 |
anonymity | -8.595 |
Token | , |
Token ID | 11 |
Feature activation | +8.64e+01 |
Pos logit contributions | |
these | +17.795 |
people | +17.272 |
things | +17.221 |
those | +17.206 |
many | +17.081 |
Neg logit contributions | |
uty | -14.112 |
usk | -13.486 |
oultry | -13.385 |
inion | -12.864 |
illo | -12.850 |
Token | in |
Token ID | 287 |
Feature activation | +5.70e+01 |
Pos logit contributions | |
these | +21.805 |
people | +21.742 |
it | +21.234 |
many | +21.215 |
those | +21.057 |
Neg logit contributions | |
oultry | -15.319 |
uty | -14.860 |
arthed | -14.365 |
usk | -14.303 |
osite | -14.225 |
Token | and |
Token ID | 290 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
many | +20.434 |
these | +20.090 |
those | +19.844 |
people | +18.761 |
some | +18.660 |
Neg logit contributions | |
uty | -14.235 |
oultry | -13.935 |
inion | -13.842 |
usk | -13.728 |
arthed | -13.248 |
Token | of |
Token ID | 286 |
Feature activation | -2.68e+01 |
Pos logit contributions | |
u | +5.142 |
ock | +4.858 |
ien | +4.839 |
� | +4.782 |
ene | +4.686 |
Neg logit contributions | |
deviations | -7.440 |
Mankind | -7.214 |
disadvantages | -7.124 |
Intelligent | -7.081 |
bureaucrats | -7.079 |
Token | itself |
Token ID | 2346 |
Feature activation | +2.54e+01 |
Pos logit contributions | |
o | +2.964 |
u | +2.894 |
ig | +2.848 |
ab | +2.752 |
- | +2.506 |
Neg logit contributions | |
promoters | -12.695 |
disadvantages | -12.423 |
distinguishing | -12.315 |
Intelligent | -12.233 |
bureaucrats | -12.230 |
Token | , |
Token ID | 11 |
Feature activation | +7.47e+01 |
Pos logit contributions | |
totality | +12.548 |
deviations | +12.021 |
distinguishing | +11.929 |
similarities | +11.881 |
inaction | +11.877 |
Neg logit contributions | |
ien | -11.465 |
uty | -11.260 |
usk | -11.115 |
aga | -10.849 |
ump | -10.754 |
Token | want |
Token ID | 765 |
Feature activation | -5.77e+00 |
Pos logit contributions | |
q | +2.150 |
usk | +2.085 |
ump | +2.045 |
u | +2.003 |
ike | +1.995 |
Neg logit contributions | |
inaction | -3.530 |
totality | -3.456 |
similarities | -3.425 |
behavi | -3.398 |
deviations | -3.348 |
Token | to |
Token ID | 284 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
u | +1.549 |
� | +1.470 |
uty | +1.407 |
ien | +1.356 |
aga | +1.306 |
Neg logit contributions | |
deviations | -3.539 |
disadvantages | -3.505 |
similarities | -3.356 |
totality | -3.350 |
inaction | -3.319 |
Token | point |
Token ID | 966 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
q | +4.396 |
aki | +4.300 |
u | +4.225 |
ée | +4.086 |
ay | +4.053 |
Neg logit contributions | |
behavi | -10.676 |
inaction | -9.714 |
deviations | -9.235 |
conflic | -8.637 |
Palestin | -8.621 |
Token | out |
Token ID | 503 |
Feature activation | +2.52e+01 |
Pos logit contributions | |
u | +3.950 |
- | +3.677 |
out | +3.604 |
ay | +3.252 |
end | +3.177 |
Neg logit contributions | |
totality | -8.999 |
inaction | -8.802 |
disadvantages | -8.761 |
underest | -8.650 |
behavi | -8.650 |
Token | that |
Token ID | 326 |
Feature activation | +7.67e+01 |
Pos logit contributions | |
totality | +10.815 |
deviations | +10.146 |
inaction | +10.134 |
distinguishing | +10.101 |
hindsight | +9.934 |
Neg logit contributions | |
ien | -13.096 |
uty | -13.018 |
usk | -12.908 |
ump | -12.538 |
aga | -12.482 |
Token | the |
Token ID | 262 |
Feature activation | +8.61e+01 |
Pos logit contributions | |
these | +21.401 |
many | +20.379 |
the | +20.057 |
those | +20.039 |
people | +19.668 |
Neg logit contributions | |
RandomRedditor | -17.195 |
� | -17.187 |
| -17.179 |
teasp | -17.163 |
| -17.140 |
Token | app |
Token ID | 598 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
folks | +18.936 |
actual | +18.443 |
people | +18.210 |
most | +17.863 |
things | +17.843 |
Neg logit contributions | |
teasp | -19.150 |
RandomRedditor | -18.741 |
� | -18.703 |
| -18.701 |
� | -18.699 |
Token | includes |
Token ID | 3407 |
Feature activation | +3.18e+01 |
Pos logit contributions | |
totality | +12.071 |
these | +11.612 |
distinguishing | +11.553 |
things | +11.528 |
deviations | +11.517 |
Neg logit contributions | |
uty | -12.285 |
ien | -12.255 |
usk | -12.086 |
aga | -11.599 |
ump | -11.539 |
Token | some |
Token ID | 617 |
Feature activation | +4.48e+01 |
Pos logit contributions | |
totality | +13.550 |
things | +13.260 |
these | +13.242 |
distinguishing | +13.014 |
similarities | +12.885 |
Neg logit contributions | |
uty | -13.912 |
usk | -13.822 |
ien | -13.735 |
aga | -13.021 |
� | -12.979 |
Token | governors |
Token ID | 26824 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
things | +16.581 |
similarities | +15.126 |
many | +15.102 |
distinguishing | +15.002 |
people | +14.999 |
Neg logit contributions | |
usk | -16.640 |
elaide | -16.319 |
ien | -15.964 |
byss | -15.954 |
uty | -15.838 |
Token | to |
Token ID | 284 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
totality | +11.987 |
hindsight | +11.564 |
deviations | +11.459 |
similarities | +11.293 |
inaction | +11.131 |
Neg logit contributions | |
ien | -6.275 |
usk | -6.098 |
uty | -5.929 |
u | -5.834 |
ike | -5.742 |
Token | and |
Token ID | 290 |
Feature activation | +3.79e+01 |
Pos logit contributions | |
deviations | +1.353 |
totality | +1.314 |
anonymity | +1.301 |
similarities | +1.289 |
distinguishing | +1.281 |
Neg logit contributions | |
usk | -0.517 |
ien | -0.507 |
u | -0.490 |
- | -0.482 |
ab | -0.443 |
Token | the |
Token ID | 262 |
Feature activation | +3.47e+01 |
Pos logit contributions | |
those | +14.983 |
these | +14.791 |
many | +14.748 |
totality | +14.714 |
inaction | +14.589 |
Neg logit contributions | |
ien | -14.664 |
uty | -14.523 |
elaide | -14.364 |
usk | -14.321 |
ikes | -14.049 |
Token | Washington |
Token ID | 2669 |
Feature activation | -5.03e+00 |
Pos logit contributions | |
totality | +13.328 |
inaction | +12.850 |
things | +12.735 |
reality | +12.649 |
many | +12.530 |
Neg logit contributions | |
elaide | -15.107 |
usk | -15.098 |
uty | -14.988 |
ien | -14.655 |
aga | -14.576 |
Token | status |
Token ID | 3722 |
Feature activation | -3.70e+00 |
Pos logit contributions | |
ien | +2.274 |
- | +2.152 |
ump | +2.093 |
usk | +2.022 |
ian | +2.014 |
Neg logit contributions | |
Mankind | -2.387 |
behavi | -2.253 |
distinguishing | -2.211 |
newer | -2.136 |
totality | -2.122 |
Token | quo |
Token ID | 18658 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
- | +0.662 |
ien | +0.591 |
u | +0.577 |
ike | +0.490 |
ale | +0.462 |
Neg logit contributions | |
hindsight | -2.945 |
totality | -2.876 |
spontaneous | -2.838 |
Mankind | -2.831 |
spont | -2.801 |
Token | , |
Token ID | 11 |
Feature activation | +8.42e+01 |
Pos logit contributions | |
totality | +11.078 |
anonymity | +10.679 |
similarities | +10.590 |
hindsight | +10.544 |
deviations | +10.500 |
Neg logit contributions | |
ien | -7.026 |
u | -6.718 |
usk | -6.710 |
ump | -6.480 |
uty | -6.422 |
Token | the |
Token ID | 262 |
Feature activation | +5.41e+01 |
Pos logit contributions | |
those | +21.364 |
these | +21.181 |
many | +20.775 |
the | +20.421 |
it | +20.328 |
Neg logit contributions | |
teasp | -17.392 |
ubes | -17.035 |
| -16.689 |
� | -16.685 |
| -16.622 |
Token | ga |
Token ID | 31986 |
Feature activation | -1.71e+01 |
Pos logit contributions | |
reality | +17.362 |
inaction | +16.761 |
lack | +16.716 |
people | +16.636 |
totality | +16.635 |
Neg logit contributions | |
elaide | -17.042 |
teasp | -15.807 |
ikes | -15.454 |
aiden | -15.396 |
ike | -15.200 |
Token | vel |
Token ID | 626 |
Feature activation | +2.96e+01 |
Pos logit contributions | |
vel | +0.207 |
urn | +0.068 |
ust | -0.381 |
ong | -0.477 |
ump | -0.633 |
Neg logit contributions | |
behavi | -18.116 |
totality | -16.693 |
conflic | -16.001 |
reluct | -15.722 |
deviations | -15.719 |
Token | may |
Token ID | 743 |
Feature activation | -7.68e+00 |
Pos logit contributions | |
totality | +13.926 |
these | +13.662 |
inaction | +13.598 |
things | +13.550 |
distinguishing | +13.379 |
Neg logit contributions | |
uty | -11.146 |
ien | -11.071 |
usk | -10.799 |
ikes | -10.331 |
aga | -10.238 |
Token | have |
Token ID | 423 |
Feature activation | +8.01e+00 |
Pos logit contributions | |
ump | +2.161 |
o | +2.046 |
u | +2.037 |
ong | +2.009 |
é | +1.930 |
Neg logit contributions | |
behavi | -4.916 |
deviations | -4.484 |
totality | -4.353 |
Palestin | -4.288 |
Mankind | -4.168 |
Token | members |
Token ID | 1866 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
folks | +14.965 |
people | +14.873 |
individuals | +14.773 |
members | +14.402 |
participants | +14.122 |
Neg logit contributions | |
elaide | -15.881 |
uty | -15.729 |
� | -15.623 |
iren | -15.567 |
ien | -15.509 |
Token | have |
Token ID | 423 |
Feature activation | +5.75e+00 |
Pos logit contributions | |
totality | +7.267 |
similarities | +7.004 |
deviations | +6.966 |
inaction | +6.734 |
hindsight | +6.677 |
Neg logit contributions | |
u | -5.835 |
ien | -5.670 |
aga | -5.619 |
ike | -5.571 |
usk | -5.558 |
Token | been |
Token ID | 587 |
Feature activation | +8.29e+00 |
Pos logit contributions | |
deviations | +3.181 |
inaction | +3.124 |
symbolism | +3.075 |
totality | +3.058 |
behavi | +3.057 |
Neg logit contributions | |
u | -2.628 |
ien | -2.491 |
ikes | -2.474 |
aga | -2.377 |
ike | -2.338 |
Token | test |
Token ID | 1332 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
totality | +4.003 |
deviations | +3.705 |
similarities | +3.655 |
hindsight | +3.516 |
inaction | +3.481 |
Neg logit contributions | |
u | -4.724 |
aga | -4.548 |
ien | -4.502 |
ag | -4.335 |
usk | -4.286 |
Token | driving |
Token ID | 5059 |
Feature activation | +5.33e+01 |
Pos logit contributions | |
- | +6.683 |
ailed | +5.977 |
ab | +5.710 |
é | +5.709 |
u | +5.687 |
Neg logit contributions | |
totality | -7.196 |
hindsight | -7.136 |
disadvantages | -6.998 |
Canaver | -6.982 |
similarities | -6.905 |
Token | the |
Token ID | 262 |
Feature activation | +8.41e+01 |
Pos logit contributions | |
these | +18.683 |
things | +17.396 |
those | +17.320 |
the | +17.095 |
many | +16.995 |
Neg logit contributions | |
teasp | -15.807 |
usk | -15.655 |
ien | -15.518 |
oultry | -15.459 |
uty | -15.332 |
Token | Washington |
Token ID | 2669 |
Feature activation | +5.30e+01 |
Pos logit contributions | |
new | +17.769 |
folks | +17.119 |
many | +17.091 |
various | +16.998 |
things | +16.848 |
Neg logit contributions | |
teasp | -20.269 |
RandomRedditor | -19.436 |
� | -19.423 |
� | -19.407 |
| -19.390 |
Token | Beer |
Token ID | 16971 |
Feature activation | +5.39e+01 |
Pos logit contributions | |
folks | +13.690 |
these | +13.601 |
people | +13.180 |
things | +13.170 |
those | +12.929 |
Neg logit contributions | |
uty | -15.771 |
elaide | -15.681 |
iren | -15.334 |
lesiastical | -15.276 |
airo | -15.226 |
Token | Mobile |
Token ID | 12173 |
Feature activation | +4.31e+01 |
Pos logit contributions | |
folks | +16.402 |
these | +16.354 |
moving | +16.228 |
operating | +16.154 |
people | +15.980 |
Neg logit contributions | |
eteen | -14.850 |
uty | -14.506 |
� | -14.306 |
oultry | -14.188 |
elaide | -14.057 |
Token | App |
Token ID | 2034 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
these | +13.715 |
operating | +13.021 |
many | +13.012 |
things | +12.844 |
folks | +12.829 |
Neg logit contributions | |
uty | -16.440 |
ubes | -15.550 |
ien | -15.522 |
� | -15.305 |
usk | -15.259 |
Token | for |
Token ID | 329 |
Feature activation | +7.79e+00 |
Pos logit contributions | |
totality | +12.312 |
deviations | +11.840 |
inaction | +11.705 |
distinguishing | +11.702 |
similarities | +11.700 |
Neg logit contributions | |
ien | -8.284 |
usk | -8.095 |
uty | -7.993 |
ump | -7.693 |
aga | -7.652 |
Token | of |
Token ID | 286 |
Feature activation | +4.00e+01 |
Pos logit contributions | |
- | +3.028 |
ab | +2.766 |
u | +2.591 |
ien | +2.501 |
ag | +2.411 |
Neg logit contributions | |
totality | -7.213 |
Situation | -6.933 |
Falling | -6.908 |
Corpor | -6.878 |
symbolism | -6.770 |
Token | streaming |
Token ID | 11305 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
these | +15.899 |
those | +15.471 |
many | +15.451 |
things | +15.021 |
various | +14.789 |
Neg logit contributions | |
usk | -14.514 |
uty | -14.307 |
ien | -14.077 |
elaide | -13.690 |
oultry | -13.530 |
Token | music |
Token ID | 2647 |
Feature activation | +5.78e+00 |
Pos logit contributions | |
distinguishing | +0.662 |
totality | +0.658 |
deviations | +0.654 |
inaction | +0.653 |
revolving | +0.637 |
Neg logit contributions | |
u | -0.468 |
amp | -0.467 |
- | -0.459 |
ump | -0.454 |
ire | -0.436 |
Token | . |
Token ID | 13 |
Feature activation | +6.07e+01 |
Pos logit contributions | |
distinguishing | +3.778 |
totality | +3.736 |
hindsight | +3.707 |
inaction | +3.671 |
deviations | +3.653 |
Neg logit contributions | |
u | -1.814 |
amp | -1.797 |
ab | -1.724 |
ich | -1.642 |
ire | -1.628 |
Token | Furthermore |
Token ID | 11399 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
The | +14.433 |
I | +13.415 |
One | +13.110 |
these | +12.979 |
Modern | +12.973 |
Neg logit contributions | |
teasp | -24.848 |
elaide | -23.689 |
RandomRedditor | -23.541 |
� | -23.530 |
| -23.493 |
Token | , |
Token ID | 11 |
Feature activation | +8.36e+01 |
Pos logit contributions | |
u | +2.750 |
ire | +2.591 |
aga | +2.582 |
usk | +2.412 |
ien | +2.363 |
Neg logit contributions | |
totality | -6.936 |
deviations | -6.874 |
disadvantages | -6.575 |
bureaucrats | -6.553 |
symbolism | -6.539 |
Token | the |
Token ID | 262 |
Feature activation | +8.71e+01 |
Pos logit contributions | |
these | +21.489 |
those | +20.382 |
many | +20.170 |
the | +19.837 |
it | +18.893 |
Neg logit contributions | |
RandomRedditor | -20.050 |
� | -20.039 |
| -19.985 |
| -19.966 |
| -19.940 |
Token | only |
Token ID | 691 |
Feature activation | +5.89e+01 |
Pos logit contributions | |
lack | +19.711 |
many | +19.071 |
most | +18.942 |
only | +18.823 |
these | +18.736 |
Neg logit contributions | |
elaide | -17.931 |
oultry | -17.357 |
teasp | -16.778 |
� | -16.413 |
RNA | -16.409 |
Token | speakers |
Token ID | 11636 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
things | +18.339 |
distinguishing | +17.067 |
real | +17.019 |
people | +16.982 |
other | +16.664 |
Neg logit contributions | |
usk | -18.150 |
teasp | -17.927 |
elaide | -17.635 |
RandomRedditor | -17.117 |
� | -17.107 |
Token | I |
Token ID | 314 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
totality | +10.903 |
these | +10.821 |
distinguishing | +10.649 |
things | +10.630 |
those | +10.511 |
Neg logit contributions | |
uty | -11.801 |
usk | -11.750 |
ien | -11.691 |
ump | -11.080 |
aga | -11.009 |
Token | � |
Token ID | 447 |
Feature activation | -4.16e+01 |
Pos logit contributions | |
ike | +4.087 |
ikes | +3.830 |
u | +3.809 |
ve | +3.771 |
ath | +3.761 |
Neg logit contributions | |
behavi | -7.323 |
inaction | -7.148 |
totality | -6.944 |
fundamentals | -6.396 |
similarities | -6.371 |
Token | imagination |
Token ID | 13843 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
totality | +11.700 |
deviations | +11.234 |
bureaucrats | +11.015 |
hindsight | +11.003 |
disadvantages | +10.958 |
Neg logit contributions | |
ien | -6.367 |
usk | -5.898 |
uty | -5.699 |
u | -5.684 |
� | -5.665 |
Token | and |
Token ID | 290 |
Feature activation | +3.80e+01 |
Pos logit contributions | |
totality | +15.433 |
inaction | +14.856 |
deviations | +14.807 |
hindsight | +14.745 |
similarities | +14.637 |
Neg logit contributions | |
ien | -6.891 |
usk | -6.698 |
uty | -6.513 |
ump | -6.389 |
u | -6.351 |
Token | problem |
Token ID | 1917 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
these | +14.233 |
those | +14.057 |
things | +13.851 |
everyday | +13.573 |
many | +13.457 |
Neg logit contributions | |
uty | -15.431 |
usk | -15.089 |
oultry | -14.379 |
aga | -14.376 |
ump | -14.176 |
Token | solving |
Token ID | 18120 |
Feature activation | +1.88e+01 |
Pos logit contributions | |
- | +4.901 |
ien | +4.050 |
ab | +3.928 |
ag | +3.738 |
u | +3.662 |
Neg logit contributions | |
Corpor | -6.934 |
disadvantages | -6.815 |
bribes | -6.494 |
CoC | -6.480 |
Orn | -6.442 |
Token | skills |
Token ID | 4678 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
totality | +12.201 |
distinguishing | +11.699 |
hindsight | +11.507 |
bureaucrats | +11.497 |
deviations | +11.495 |
Neg logit contributions | |
ien | -6.917 |
uty | -6.456 |
usk | -6.395 |
ump | -6.302 |
u | -6.183 |
Token | . |
Token ID | 13 |
Feature activation | +8.35e+01 |
Pos logit contributions | |
totality | +15.354 |
deviations | +14.784 |
distinguishing | +14.738 |
inaction | +14.675 |
similarities | +14.667 |
Neg logit contributions | |
ien | -8.079 |
uty | -7.916 |
usk | -7.854 |
ump | -7.436 |
aga | -7.404 |
Token | Parents |
Token ID | 28231 |
Feature activation | +2.70e+01 |
Pos logit contributions | |
The | +17.713 |
these | +17.456 |
One | +16.716 |
many | +16.611 |
People | +16.291 |
Neg logit contributions | |
elaide | -18.212 |
teasp | -17.808 |
uty | -17.311 |
StreamerBot | -17.270 |
| -17.224 |
Token | can |
Token ID | 460 |
Feature activation | +2.55e+01 |
Pos logit contributions | |
these | +10.428 |
totality | +10.177 |
things | +10.133 |
distinguishing | +10.079 |
those | +10.037 |
Neg logit contributions | |
uty | -12.800 |
ien | -12.718 |
usk | -12.503 |
ump | -12.094 |
aga | -12.009 |
Token | buy |
Token ID | 2822 |
Feature activation | +5.46e+01 |
Pos logit contributions | |
these | +7.766 |
totality | +7.475 |
things | +7.440 |
those | +7.407 |
many | +7.306 |
Neg logit contributions | |
uty | -14.120 |
ien | -14.082 |
usk | -13.909 |
� | -13.546 |
aga | -13.432 |
Token | toys |
Token ID | 14958 |
Feature activation | +3.01e+01 |
Pos logit contributions | |
these | +19.402 |
many | +18.098 |
things | +17.602 |
those | +17.515 |
various | +16.793 |
Neg logit contributions | |
| -17.034 |
� | -16.987 |
| -16.970 |
| -16.960 |
RandomRedditor | -16.938 |
Token | online |
Token ID | 2691 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
these | +10.514 |
those | +9.967 |
things | +9.907 |
many | +9.897 |
everyday | +9.839 |
Neg logit contributions | |
uty | -14.864 |
ien | -14.545 |
usk | -14.387 |
� | -13.902 |
aga | -13.845 |
Token | p |
Token ID | 79 |
Feature activation | -3.30e+01 |
Pos logit contributions | |
these | +18.626 |
many | +18.026 |
The | +17.596 |
those | +17.310 |
people | +17.256 |
Neg logit contributions | |
uty | -12.500 |
elaide | -12.447 |
byss | -12.305 |
teasp | -12.135 |
��極 | -12.098 |
Token | k |
Token ID | 74 |
Feature activation | +2.29e+01 |
Pos logit contributions | |
orn | +10.612 |
k | +10.241 |
ix | +10.223 |
q | +10.032 |
ag | +9.960 |
Neg logit contributions | |
behavi | -12.105 |
totality | -11.428 |
disadvantages | -11.242 |
mileage | -11.176 |
hindsight | -11.155 |
Token | and |
Token ID | 290 |
Feature activation | +3.51e+01 |
Pos logit contributions | |
totality | +16.698 |
deviations | +16.224 |
distinguishing | +16.189 |
inaction | +16.170 |
similarities | +16.137 |
Neg logit contributions | |
ien | -5.115 |
uty | -5.003 |
usk | -4.988 |
ump | -4.559 |
aga | -4.475 |
Token | many |
Token ID | 867 |
Feature activation | +3.82e+01 |
Pos logit contributions | |
these | +16.170 |
many | +15.786 |
those | +15.720 |
things | +15.697 |
totality | +15.620 |
Neg logit contributions | |
uty | -12.154 |
ien | -11.933 |
usk | -11.801 |
aga | -11.212 |
inion | -11.152 |
Token | others |
Token ID | 1854 |
Feature activation | +3.93e+01 |
Pos logit contributions | |
these | +16.459 |
many | +16.333 |
things | +16.107 |
people | +15.897 |
those | +15.801 |
Neg logit contributions | |
uty | -13.089 |
ien | -12.591 |
usk | -12.491 |
ump | -11.781 |
aki | -11.732 |
Token | . |
Token ID | 13 |
Feature activation | +8.31e+01 |
Pos logit contributions | |
these | +15.981 |
many | +15.330 |
those | +15.270 |
things | +15.101 |
people | +14.913 |
Neg logit contributions | |
uty | -13.935 |
ien | -13.434 |
usk | -13.210 |
aga | -12.509 |
elaide | -12.374 |
Token |
|
Token ID | 198 |
Feature activation | -3.92e+01 |
Pos logit contributions | |
The | +17.631 |
these | +17.244 |
many | +16.652 |
One | +16.442 |
Canadians | +16.131 |
Neg logit contributions | |
elaide | -18.148 |
teasp | -17.800 |
byss | -17.423 |
StreamerBot | -17.337 |
| -17.315 |
Token |
|
Token ID | 198 |
Feature activation | +6.10e+01 |
Pos logit contributions | |
u | +2.088 |
- | +1.692 |
| +1.476 |
q | +1.274 |
o | +0.655 |
Neg logit contributions | |
tremend | -37.877 |
eleph | -35.828 |
cumbers | -34.569 |
hemor | -34.507 |
exha | -34.487 |
Token | T |
Token ID | 51 |
Feature activation | -9.12e+00 |
Pos logit contributions | |
things | +13.615 |
these | +13.269 |
people | +13.037 |
many | +12.944 |
those | +12.858 |
Neg logit contributions | |
teasp | -20.660 |
| -20.109 |
RandomRedditor | -20.105 |
| -20.099 |
� | -20.080 |
Token | oys |
Token ID | 19417 |
Feature activation | +2.31e+01 |
Pos logit contributions | |
ubes | +1.178 |
oy | +1.037 |
rou | +1.015 |
orn | +0.987 |
usk | +0.984 |
Neg logit contributions | |
totality | -7.998 |
behavi | -7.796 |
hindsight | -7.619 |
bragging | -7.487 |
prevailing | -7.466 |
Token | & |
Token ID | 1222 |
Feature activation | +5.26e+00 |
Pos logit contributions | |
totality | +11.371 |
deviations | +10.880 |
distinguishing | +10.790 |
inaction | +10.675 |
similarities | +10.667 |
Neg logit contributions | |
ien | -10.222 |
usk | -10.044 |
uty | -10.036 |
aga | -9.619 |
ump | -9.579 |
Token | of |
Token ID | 286 |
Feature activation | +3.45e+01 |
Pos logit contributions | |
of | +5.025 |
- | +4.636 |
u | +4.422 |
ag | +4.281 |
ada | +4.046 |
Neg logit contributions | |
behavi | -17.161 |
hemor | -16.266 |
Palestin | -16.034 |
cumbers | -15.950 |
ccording | -15.777 |
Token | ' |
Token ID | 705 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
these | +12.694 |
totality | +12.682 |
things | +12.641 |
those | +12.487 |
deviations | +12.365 |
Neg logit contributions | |
usk | -15.785 |
ien | -15.662 |
uty | -15.458 |
� | -15.144 |
ump | -15.011 |
Token | tr |
Token ID | 2213 |
Feature activation | -4.89e+01 |
Pos logit contributions | |
totality | +17.152 |
deviations | +16.697 |
these | +16.693 |
things | +16.682 |
distinguishing | +16.659 |
Neg logit contributions | |
ien | -6.072 |
uty | -6.033 |
usk | -5.976 |
aga | -5.458 |
ump | -5.413 |
Token | ades |
Token ID | 2367 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
usted | +11.388 |
ad | +11.336 |
unk | +10.784 |
ig | +10.750 |
ades | +10.400 |
Neg logit contributions | |
behavi | -20.536 |
Bots | -19.928 |
doubling | -19.613 |
inaction | -18.958 |
successors | -18.260 |
Token | '. |
Token ID | 4458 |
Feature activation | +5.31e+01 |
Pos logit contributions | |
totality | +15.096 |
inaction | +14.439 |
distinguishing | +14.417 |
deviations | +14.303 |
hindsight | +14.164 |
Neg logit contributions | |
ien | -8.110 |
uty | -7.957 |
usk | -7.734 |
aga | -7.439 |
u | -7.421 |
Token | The |
Token ID | 383 |
Feature activation | +8.30e+01 |
Pos logit contributions | |
these | +13.903 |
The | +13.770 |
"[ | +13.026 |
those | +12.835 |
"… | +12.831 |
Neg logit contributions | |
teasp | -22.447 |
� | -21.656 |
| -21.630 |
� | -21.629 |
RandomRedditor | -21.622 |
Token | real |
Token ID | 1103 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
similarities | +19.863 |
people | +19.712 |
things | +19.111 |
deviations | +19.060 |
many | +19.031 |
Neg logit contributions | |
elaide | -19.137 |
| -18.749 |
RandomRedditor | -18.729 |
� | -18.719 |
� | -18.712 |
Token | difference |
Token ID | 3580 |
Feature activation | -2.94e+00 |
Pos logit contributions | |
distinguishing | +17.277 |
similarities | +17.272 |
dividing | +16.765 |
things | +16.606 |
differences | +16.570 |
Neg logit contributions | |
usk | -15.485 |
uty | -15.435 |
elaide | -15.408 |
oultry | -14.693 |
airo | -14.449 |
Token | between |
Token ID | 1022 |
Feature activation | +5.77e+01 |
Pos logit contributions | |
ien | +0.853 |
u | +0.821 |
ab | +0.747 |
- | +0.739 |
uty | +0.698 |
Neg logit contributions | |
behavi | -1.831 |
totality | -1.755 |
conflic | -1.726 |
DRAG | -1.703 |
anonymity | -1.682 |
Token | the |
Token ID | 262 |
Feature activation | +7.69e+01 |
Pos logit contributions | |
these | +20.426 |
those | +19.169 |
the | +17.685 |
things | +17.273 |
many | +16.951 |
Neg logit contributions | |
teasp | -18.246 |
elaide | -18.144 |
| -17.641 |
� | -17.588 |
� | -17.582 |
Token | Mil |
Token ID | 4460 |
Feature activation | -5.55e+00 |
Pos logit contributions | |
these | +19.204 |
various | +18.849 |
people | +18.605 |
two | +18.549 |
many | +18.534 |
Neg logit contributions | |
| -19.613 |
� | -19.602 |
RandomRedditor | -19.591 |
� | -19.547 |
| -19.515 |
Token | were |
Token ID | 547 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
totality | +6.787 |
inaction | +6.656 |
deviations | +6.525 |
disadvantages | +6.414 |
bureaucrats | +6.354 |
Neg logit contributions | |
ien | -6.865 |
u | -6.575 |
usk | -6.490 |
aga | -6.386 |
ump | -6.270 |
Token | filmed |
Token ID | 18976 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
these | +9.927 |
those | +9.799 |
things | +9.736 |
many | +9.418 |
moving | +9.373 |
Neg logit contributions | |
uty | -17.388 |
ien | -17.239 |
usk | -16.930 |
ump | -16.647 |
inion | -16.568 |
Token | in |
Token ID | 287 |
Feature activation | +4.38e+01 |
Pos logit contributions | |
totality | +8.775 |
deviations | +8.315 |
similarities | +8.312 |
inaction | +8.276 |
hindsight | +8.189 |
Neg logit contributions | |
ien | -10.117 |
uty | -9.779 |
usk | -9.735 |
ump | -9.492 |
ike | -9.427 |
Token | a |
Token ID | 257 |
Feature activation | +1.84e+01 |
Pos logit contributions | |
these | +18.025 |
those | +17.553 |
many | +17.180 |
totality | +16.953 |
various | +16.670 |
Neg logit contributions | |
uty | -14.267 |
usk | -14.038 |
ien | -13.483 |
gex | -13.317 |
ube | -13.309 |
Token | studio |
Token ID | 8034 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
totality | +7.686 |
deviations | +7.452 |
inaction | +7.400 |
disadvantages | +7.341 |
similarities | +7.303 |
Neg logit contributions | |
ien | -10.485 |
usk | -10.238 |
uty | -10.169 |
ump | -10.156 |
u | -9.933 |
Token | . |
Token ID | 13 |
Feature activation | +8.28e+01 |
Pos logit contributions | |
behavi | +1.108 |
disadvantages | +1.095 |
deviations | +1.090 |
acron | +1.087 |
totality | +1.071 |
Neg logit contributions | |
ike | -0.710 |
ien | -0.687 |
- | -0.686 |
ock | -0.673 |
ire | -0.653 |
Token | Image |
Token ID | 7412 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
The | +18.613 |
these | +17.304 |
One | +16.756 |
Wikipedia | +16.406 |
the | +16.199 |
Neg logit contributions | |
teasp | -19.777 |
� | -17.996 |
| -17.992 |
RandomRedditor | -17.963 |
| -17.960 |
Token | courtesy |
Token ID | 12537 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
totality | +5.482 |
distinguishing | +5.150 |
deviations | +5.142 |
these | +5.112 |
similarities | +5.090 |
Neg logit contributions | |
ien | -9.435 |
uty | -9.401 |
usk | -9.338 |
aga | -9.020 |
ump | -9.013 |
Token | of |
Token ID | 286 |
Feature activation | +3.94e+01 |
Pos logit contributions | |
ien | +0.894 |
u | +0.890 |
usk | +0.834 |
uty | +0.820 |
aga | +0.812 |
Neg logit contributions | |
totality | -1.614 |
deviations | -1.598 |
inaction | -1.580 |
distinguishing | -1.551 |
disadvantages | -1.550 |
Token | Columbia |
Token ID | 9309 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
these | +16.257 |
those | +15.933 |
things | +15.794 |
Wikipedia | +15.591 |
totality | +15.582 |
Neg logit contributions | |
uty | -13.249 |
usk | -12.964 |
ien | -12.620 |
elaide | -12.386 |
aga | -12.157 |
Token | Pictures |
Token ID | 20051 |
Feature activation | +7.04e+01 |
Pos logit contributions | |
totality | +8.513 |
deviations | +8.075 |
distinguishing | +8.025 |
inaction | +7.944 |
similarities | +7.843 |
Neg logit contributions | |
ien | -12.268 |
usk | -12.046 |
uty | -12.038 |
ump | -11.588 |
aga | -11.585 |
Token | with |
Token ID | 351 |
Feature activation | +4.07e+01 |
Pos logit contributions | |
totality | +6.462 |
similarities | +5.992 |
deviations | +5.925 |
hindsight | +5.919 |
inaction | +5.846 |
Neg logit contributions | |
u | -5.330 |
usk | -5.159 |
ien | -5.154 |
ike | -5.101 |
uty | -5.069 |
Token | Amazon |
Token ID | 6186 |
Feature activation | +4.10e+01 |
Pos logit contributions | |
these | +14.869 |
those | +14.734 |
many | +14.299 |
things | +13.960 |
people | +13.951 |
Neg logit contributions | |
inion | -15.332 |
uty | -15.195 |
usk | -15.124 |
ien | -15.095 |
igger | -15.008 |
Token | Mom |
Token ID | 11254 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
these | +17.630 |
things | +17.534 |
those | +17.293 |
people | +17.235 |
many | +17.132 |
Neg logit contributions | |
uty | -11.544 |
usk | -11.117 |
oultry | -11.112 |
inion | -11.069 |
ump | -10.840 |
Token | can |
Token ID | 460 |
Feature activation | +2.36e+01 |
Pos logit contributions | |
totality | +12.402 |
distinguishing | +11.831 |
inaction | +11.730 |
deviations | +11.658 |
similarities | +11.591 |
Neg logit contributions | |
u | -5.497 |
ien | -5.443 |
usk | -5.288 |
uty | -4.957 |
aga | -4.878 |
Token | share |
Token ID | 2648 |
Feature activation | +6.06e+01 |
Pos logit contributions | |
totality | +13.384 |
deviations | +12.917 |
distinguishing | +12.889 |
inaction | +12.763 |
similarities | +12.740 |
Neg logit contributions | |
ien | -8.617 |
usk | -8.511 |
uty | -8.498 |
ump | -8.002 |
aga | -7.962 |
Token | their |
Token ID | 511 |
Feature activation | +8.24e+01 |
Pos logit contributions | |
those | +19.146 |
these | +19.045 |
things | +18.711 |
many | +17.936 |
everything | +17.835 |
Neg logit contributions | |
oultry | -17.019 |
teasp | -16.919 |
� | -16.660 |
RandomRedditor | -16.620 |
| -16.612 |
Token | 20 |
Token ID | 1160 |
Feature activation | -2.68e+01 |
Pos logit contributions | |
things | +19.428 |
benefits | +18.322 |
many | +18.300 |
these | +18.102 |
those | +17.990 |
Neg logit contributions | |
oultry | -18.004 |
teasp | -17.756 |
byss | -17.737 |
elaide | -17.611 |
� | -17.487 |
Token | percent |
Token ID | 1411 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
u | +8.607 |
- | +8.606 |
GB | +7.946 |
k | +7.866 |
am | +7.549 |
Neg logit contributions | |
resemb | -10.375 |
totality | -10.282 |
behavi | -9.901 |
symbolism | -9.751 |
inaction | -9.328 |
Token | diaper |
Token ID | 48196 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
totality | +7.593 |
inaction | +7.103 |
distinguishing | +7.031 |
deviations | +7.006 |
bureaucrats | +7.002 |
Neg logit contributions | |
ien | -7.327 |
aga | -7.229 |
u | -7.225 |
usk | -7.058 |
uty | -6.835 |
Token | and |
Token ID | 290 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
totality | +9.967 |
inaction | +9.249 |
distinguishing | +9.140 |
academics | +9.134 |
disparate | +9.129 |
Neg logit contributions | |
ien | -7.092 |
u | -6.731 |
ump | -6.654 |
uty | -6.594 |
aga | -6.475 |
Token | 15 |
Token ID | 1315 |
Feature activation | -3.45e+01 |
Pos logit contributions | |
totality | +7.115 |
deviations | +6.940 |
distinguishing | +6.877 |
inaction | +6.744 |
disadvantages | +6.672 |
Neg logit contributions | |
ien | -7.761 |
u | -7.482 |
amp | -7.337 |
usk | -7.303 |
ump | -7.183 |
Token | agar |
Token ID | 32452 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
u | +1.939 |
aga | +1.911 |
ak | +1.910 |
ag | +1.776 |
ab | +1.767 |
Neg logit contributions | |
inaction | -3.045 |
disadvantages | -2.996 |
deviations | -2.986 |
hindsight | -2.911 |
distinguishing | -2.839 |
Token | temple |
Token ID | 12505 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
aga | +0.117 |
u | +0.116 |
ab | +0.107 |
ak | +0.107 |
am | +0.106 |
Neg logit contributions | |
disadvantages | -0.174 |
inaction | -0.173 |
hindsight | -0.168 |
deviations | -0.166 |
distinguishing | -0.164 |
Token | in |
Token ID | 287 |
Feature activation | -4.00e+00 |
Pos logit contributions | |
inaction | +9.500 |
totality | +9.464 |
deviations | +9.424 |
hindsight | +9.407 |
disadvantages | +9.353 |
Neg logit contributions | |
usk | -5.501 |
u | -5.482 |
aga | -5.453 |
ien | -5.359 |
uty | -5.205 |
Token | Mad |
Token ID | 4627 |
Feature activation | -8.37e+01 |
Pos logit contributions | |
u | +1.696 |
ab | +1.606 |
uty | +1.585 |
ip | +1.573 |
aga | +1.560 |
Neg logit contributions | |
deviations | -1.910 |
behavi | -1.884 |
disadvantages | -1.817 |
inaction | -1.753 |
distractions | -1.714 |
Token | urai |
Token ID | 16998 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
u | +15.525 |
ag | +15.473 |
hya | +15.313 |
ras | +14.371 |
ura | +14.245 |
Neg logit contributions | |
behavi | -21.277 |
disadvantages | -19.162 |
detractors | -18.596 |
inaction | -18.264 |
distinguishing | -18.190 |
Token | . |
Token ID | 13 |
Feature activation | +8.24e+01 |
Pos logit contributions | |
disadvantages | +9.098 |
deviations | +9.061 |
inaction | +8.989 |
totality | +8.941 |
hindsight | +8.805 |
Neg logit contributions | |
u | -3.497 |
aga | -3.311 |
usk | -3.264 |
ien | -3.241 |
uty | -3.118 |
Token |
|
Token ID | 198 |
Feature activation | -3.91e+01 |
Pos logit contributions | |
The | +18.890 |
these | +17.235 |
One | +16.969 |
Mother | +16.582 |
the | +16.581 |
Neg logit contributions | |
teasp | -17.859 |
ikuman | -17.791 |
| -16.738 |
� | -16.713 |
oultry | -16.708 |
Token |
|
Token ID | 198 |
Feature activation | +6.83e+01 |
Pos logit contributions | |
u | +2.111 |
- | +1.804 |
| +1.456 |
q | +1.235 |
k | +0.559 |
Neg logit contributions | |
tremend | -37.838 |
eleph | -35.784 |
undermin | -34.548 |
cumbers | -34.417 |
exha | -34.297 |
Token | Other |
Token ID | 6395 |
Feature activation | +4.48e+01 |
Pos logit contributions | |
things | +13.889 |
these | +13.861 |
people | +13.267 |
many | +13.242 |
the | +12.939 |
Neg logit contributions | |
teasp | -20.023 |
RandomRedditor | -19.697 |
| -19.671 |
� | -19.656 |
� | -19.653 |
Token | main |
Token ID | 1388 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
things | +18.638 |
similarities | +17.767 |
people | +17.624 |
distinguishing | +17.512 |
these | +17.299 |
Neg logit contributions | |
oultry | -13.226 |
inion | -12.949 |
uty | -12.923 |
gex | -12.648 |
elaide | -12.625 |
Token | special |
Token ID | 2041 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
totality | +11.682 |
deviations | +11.119 |
inaction | +11.094 |
hindsight | +11.005 |
distinguishing | +10.986 |
Neg logit contributions | |
ien | -9.553 |
uty | -9.408 |
usk | -9.356 |
aga | -8.971 |
ump | -8.897 |
Token | - |
Token ID | 12 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
things | +19.207 |
people | +18.969 |
these | +18.536 |
changing | +18.453 |
folks | +18.309 |
Neg logit contributions | |
elaide | -13.644 |
uty | -13.210 |
oultry | -13.131 |
leground | -12.150 |
inion | -12.098 |
Token | style |
Token ID | 7635 |
Feature activation | +4.95e+01 |
Pos logit contributions | |
totality | +14.233 |
deviations | +13.626 |
inaction | +13.591 |
distinguishing | +13.527 |
similarities | +13.358 |
Neg logit contributions | |
ien | -3.483 |
usk | -3.365 |
u | -3.288 |
ike | -3.154 |
uty | -3.124 |
Token | bike |
Token ID | 7161 |
Feature activation | +4.82e+01 |
Pos logit contributions | |
things | +17.220 |
totality | +16.680 |
people | +16.283 |
deviations | +16.191 |
similarities | +16.181 |
Neg logit contributions | |
elaide | -15.936 |
gex | -15.142 |
uty | -15.111 |
oultry | -14.908 |
inion | -14.849 |
Token | and |
Token ID | 290 |
Feature activation | +6.08e+01 |
Pos logit contributions | |
these | +17.536 |
things | +17.478 |
changing | +17.251 |
those | +17.186 |
people | +17.150 |
Neg logit contributions | |
uty | -13.501 |
elaide | -13.431 |
oultry | -12.848 |
usk | -12.601 |
aga | -12.354 |
Token | with |
Token ID | 351 |
Feature activation | +7.50e+01 |
Pos logit contributions | |
those | +19.403 |
the | +19.111 |
many | +19.085 |
lack | +18.885 |
these | +18.869 |
Neg logit contributions | |
uty | -15.125 |
gex | -14.683 |
elaide | -14.661 |
oultry | -14.278 |
ijah | -13.785 |
Token | the |
Token ID | 262 |
Feature activation | +8.20e+01 |
Pos logit contributions | |
the | +20.731 |
those | +20.681 |
many | +20.665 |
things | +20.588 |
these | +20.345 |
Neg logit contributions | |
uty | -15.643 |
elaide | -14.885 |
inion | -14.819 |
oultry | -14.497 |
leground | -14.323 |
Token | normal |
Token ID | 3487 |
Feature activation | +6.53e+01 |
Pos logit contributions | |
lack | +19.989 |
newer | +19.389 |
modern | +19.361 |
things | +19.259 |
many | +19.028 |
Neg logit contributions | |
uty | -16.398 |
oultry | -16.280 |
elaide | -15.874 |
gex | -15.783 |
inion | -15.359 |
Token | TT |
Token ID | 26653 |
Feature activation | +4.54e+01 |
Pos logit contributions | |
things | +19.371 |
people | +18.409 |
everyday | +18.316 |
deviations | +18.223 |
modern | +18.156 |
Neg logit contributions | |
inion | -15.394 |
uty | -15.083 |
gex | -14.981 |
oultry | -14.819 |
elaide | -14.393 |
Token | position |
Token ID | 2292 |
Feature activation | +4.95e+01 |
Pos logit contributions | |
things | +17.840 |
these | +17.298 |
similarities | +17.280 |
people | +17.254 |
those | +17.096 |
Neg logit contributions | |
uty | -12.314 |
elaide | -12.152 |
inion | -12.094 |
gex | -11.939 |
oultry | -11.616 |
Token | , |
Token ID | 11 |
Feature activation | +7.23e+01 |
Pos logit contributions | |
things | +17.705 |
these | +17.624 |
those | +17.218 |
changing | +17.199 |
many | +17.016 |
Neg logit contributions | |
uty | -14.015 |
ien | -13.161 |
elaide | -13.100 |
usk | -13.073 |
gex | -13.023 |
Token | however |
Token ID | 2158 |
Feature activation | +5.60e+01 |
Pos logit contributions | |
these | +19.697 |
those | +19.686 |
the | +19.356 |
things | +19.324 |
many | +19.317 |
Neg logit contributions | |
uty | -14.334 |
ien | -13.306 |
elaide | -13.207 |
lesiastical | -13.087 |
usk | -13.063 |
Token | � |
Token ID | 251 |
Feature activation | +3.07e+01 |
Pos logit contributions | |
� | +7.176 |
� | +6.827 |
� | +6.587 |
� | +6.466 |
� | +6.350 |
Neg logit contributions | |
pecul | -14.603 |
disadvantages | -14.206 |
hindsight | -14.020 |
similarities | -14.011 |
behavi | -13.979 |
Token | but |
Token ID | 475 |
Feature activation | +4.70e+01 |
Pos logit contributions | |
totality | +14.038 |
these | +14.027 |
distinguishing | +13.782 |
those | +13.780 |
things | +13.756 |
Neg logit contributions | |
ien | -11.362 |
uty | -11.320 |
usk | -11.260 |
ikes | -10.686 |
elaide | -10.684 |
Token | acknowledged |
Token ID | 10810 |
Feature activation | +4.06e+01 |
Pos logit contributions | |
these | +16.061 |
those | +16.006 |
many | +15.774 |
things | +15.389 |
people | +15.343 |
Neg logit contributions | |
elaide | -16.010 |
arter | -15.232 |
uty | -15.226 |
ikes | -14.926 |
igger | -14.922 |
Token | being |
Token ID | 852 |
Feature activation | +3.65e+01 |
Pos logit contributions | |
these | +15.935 |
those | +15.643 |
many | +15.252 |
things | +15.175 |
similarities | +15.098 |
Neg logit contributions | |
usk | -14.973 |
uty | -14.890 |
elaide | -14.730 |
ien | -14.398 |
ikes | -14.392 |
Token | acquainted |
Token ID | 36620 |
Feature activation | -6.27e+00 |
Pos logit contributions | |
those | +13.228 |
these | +13.149 |
things | +13.072 |
many | +13.010 |
people | +12.920 |
Neg logit contributions | |
uty | -15.113 |
usk | -14.859 |
ien | -14.789 |
ikes | -14.578 |
elaide | -14.522 |
Token | with |
Token ID | 351 |
Feature activation | +8.17e+01 |
Pos logit contributions | |
u | +1.471 |
ien | +1.450 |
ab | +1.448 |
а | +1.328 |
ale | +1.254 |
Neg logit contributions | |
totality | -4.009 |
deviations | -3.858 |
distractions | -3.852 |
temptation | -3.801 |
inaction | -3.785 |
Token | Sh |
Token ID | 911 |
Feature activation | -9.86e+00 |
Pos logit contributions | |
those | +21.023 |
the | +20.652 |
these | +20.624 |
many | +20.575 |
people | +20.217 |
Neg logit contributions | |
elaide | -19.123 |
RandomRedditor | -18.295 |
| -18.286 |
� | -18.275 |
| -18.275 |
Token | kind |
Token ID | 11031 |
Feature activation | -4.20e+01 |
Pos logit contributions | |
ien | +1.003 |
ank | +0.864 |
aven | +0.789 |
ok | +0.721 |
akh | +0.690 |
Neg logit contributions | |
behavi | -10.501 |
totality | -9.406 |
distinguishing | -9.150 |
anonymity | -9.023 |
inaction | -9.009 |
Token | el |
Token ID | 417 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
el | +9.178 |
u | +7.587 |
ock | +7.167 |
ell | +6.382 |
le | +6.241 |
Neg logit contributions | |
behavi | -29.516 |
tremend | -29.156 |
hemor | -29.081 |
cumbers | -28.873 |
reluct | -28.349 |
Token | . |
Token ID | 13 |
Feature activation | +5.57e+01 |
Pos logit contributions | |
totality | +15.078 |
deviations | +14.924 |
distinguishing | +14.644 |
disadvantages | +14.582 |
hindsight | +14.548 |
Neg logit contributions | |
ien | -6.431 |
usk | -6.257 |
u | -5.917 |
uty | -5.862 |
aga | -5.835 |
Token |
|
Token ID | 198 |
Feature activation | -5.40e+01 |
Pos logit contributions | |
"… | +16.142 |
these | +15.853 |
« | +15.405 |
Wikipedia | +15.359 |
The | +15.342 |
Neg logit contributions | |
elaide | -16.801 |
igger | -15.183 |
agin | -14.987 |
ikes | -14.886 |
inion | -14.836 |
Token | the |
Token ID | 262 |
Feature activation | +4.55e+01 |
Pos logit contributions | |
these | +15.375 |
totality | +15.287 |
those | +15.197 |
things | +14.696 |
deviations | +14.415 |
Neg logit contributions | |
usk | -14.413 |
uty | -14.238 |
ien | -13.823 |
inion | -13.558 |
ijah | -13.541 |
Token | previous |
Token ID | 2180 |
Feature activation | +8.91e+00 |
Pos logit contributions | |
totality | +15.200 |
many | +14.728 |
people | +14.598 |
these | +14.583 |
things | +14.523 |
Neg logit contributions | |
uty | -16.577 |
usk | -16.495 |
ijah | -16.476 |
union | -16.267 |
inion | -16.265 |
Token | years |
Token ID | 812 |
Feature activation | +2.89e+01 |
Pos logit contributions | |
similarities | +6.137 |
disadvantages | +6.057 |
distinguishing | +6.017 |
symbolism | +5.973 |
distractions | +5.942 |
Neg logit contributions | |
ien | -2.874 |
ire | -2.754 |
u | -2.669 |
year | -2.654 |
month | -2.382 |
Token | . |
Token ID | 13 |
Feature activation | +6.17e+01 |
Pos logit contributions | |
totality | +14.484 |
these | +14.074 |
distinguishing | +13.987 |
deviations | +13.929 |
things | +13.876 |
Neg logit contributions | |
uty | -10.560 |
ien | -10.496 |
usk | -10.360 |
aga | -9.852 |
� | -9.741 |
Token |
|
Token ID | 198 |
Feature activation | -5.07e+01 |
Pos logit contributions | |
The | +16.665 |
these | +16.305 |
Wikipedia | +15.986 |
the | +15.421 |
Meaning | +15.148 |
Neg logit contributions | |
elaide | -18.345 |
teasp | -17.270 |
� | -16.751 |
| -16.728 |
RandomRedditor | -16.721 |
Token |
|
Token ID | 198 |
Feature activation | +8.14e+01 |
Pos logit contributions | |
| +3.529 |
- | +2.966 |
u | +2.904 |
q | +2.221 |
ab | +1.329 |
Neg logit contributions | |
tremend | -42.760 |
eleph | -41.115 |
millenn | -39.274 |
cumbers | -39.203 |
exha | -38.965 |
Token | Please |
Token ID | 5492 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
these | +15.333 |
things | +15.228 |
The | +14.936 |
people | +14.848 |
it | +14.830 |
Neg logit contributions | |
teasp | -18.320 |
StreamerBot | -18.237 |
RandomRedditor | -18.182 |
| -18.169 |
� | -18.167 |
Token | note |
Token ID | 3465 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
u | +0.453 |
q | +0.443 |
ire | +0.428 |
aki | +0.410 |
ien | +0.405 |
Neg logit contributions | |
behavi | -0.795 |
totality | -0.791 |
deviations | -0.734 |
inaction | -0.733 |
fundamentals | -0.712 |
Token | that |
Token ID | 326 |
Feature activation | +6.22e+01 |
Pos logit contributions | |
these | +14.970 |
totality | +14.613 |
those | +14.517 |
things | +14.497 |
deviations | +14.444 |
Neg logit contributions | |
uty | -13.383 |
ien | -13.358 |
usk | -13.316 |
aga | -12.774 |
inion | -12.610 |
Token | due |
Token ID | 2233 |
Feature activation | -3.88e+01 |
Pos logit contributions | |
these | +20.699 |
many | +19.146 |
the | +19.021 |
those | +19.005 |
deviations | +18.241 |
Neg logit contributions | |
elaide | -17.253 |
uty | -16.579 |
� | -16.452 |
| -16.435 |
RandomRedditor | -16.411 |
Token | to |
Token ID | 284 |
Feature activation | +4.43e+01 |
Pos logit contributions | |
u | +7.363 |
- | +6.202 |
ll | +6.137 |
ud | +5.700 |
un | +5.691 |
Neg logit contributions | |
ccording | -17.069 |
Palestin | -16.848 |
tremend | -16.625 |
behavi | -16.398 |
unnecess | -15.839 |
Token | Sur |
Token ID | 4198 |
Feature activation | -5.50e+01 |
Pos logit contributions | |
ien | +0.289 |
ump | +0.286 |
u | +0.271 |
ab | +0.267 |
ire | +0.263 |
Neg logit contributions | |
deviations | -0.264 |
disadvantages | -0.263 |
inaction | -0.247 |
fundamentals | -0.246 |
hindsight | -0.245 |
Token | rog |
Token ID | 3828 |
Feature activation | -6.64e+01 |
Pos logit contributions | |
ien | +14.490 |
ab | +13.167 |
aga | +12.991 |
round | +12.806 |
ig | +12.518 |
Neg logit contributions | |
unnecess | -16.585 |
disparate | -15.998 |
disadvantages | -15.499 |
hindsight | -15.390 |
deviations | -15.336 |
Token | ate |
Token ID | 378 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
ate | +13.130 |
ates | +11.386 |
acy | +10.836 |
ather | +8.955 |
ath | +8.185 |
Neg logit contributions | |
hindsight | -26.248 |
disadvantages | -25.009 |
behavi | -24.872 |
fundamentals | -24.395 |
deviations | -23.758 |
Token | 's |
Token ID | 338 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
totality | +9.856 |
deviations | +9.528 |
disadvantages | +9.448 |
inaction | +9.357 |
hindsight | +9.333 |
Neg logit contributions | |
ien | -5.896 |
u | -5.615 |
ump | -5.376 |
ire | -5.315 |
ock | -5.304 |
Token | Court |
Token ID | 3078 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
totality | +8.984 |
deviations | +8.654 |
disadvantages | +8.610 |
inaction | +8.383 |
hindsight | +8.374 |
Neg logit contributions | |
ien | -5.371 |
ump | -5.074 |
u | -4.975 |
ock | -4.932 |
ire | -4.847 |
Token | . |
Token ID | 13 |
Feature activation | +8.13e+01 |
Pos logit contributions | |
totality | +8.615 |
inaction | +8.243 |
deviations | +8.132 |
disadvantages | +7.937 |
anonymity | +7.888 |
Neg logit contributions | |
ien | -3.271 |
u | -3.052 |
ock | -3.000 |
ire | -2.983 |
ump | -2.940 |
Token | Other |
Token ID | 3819 |
Feature activation | +4.93e+01 |
Pos logit contributions | |
The | +18.080 |
these | +16.668 |
Wikipedia | +16.227 |
One | +16.150 |
Standing | +15.747 |
Neg logit contributions | |
teasp | -21.480 |
� | -19.764 |
| -19.759 |
RandomRedditor | -19.724 |
� | -19.704 |
Token | sequences |
Token ID | 16311 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
things | +18.143 |
similarities | +17.182 |
elements | +17.098 |
moving | +17.030 |
people | +17.003 |
Neg logit contributions | |
gex | -14.527 |
inion | -14.435 |
elaide | -14.396 |
ien | -14.300 |
usk | -14.266 |
Token | like |
Token ID | 588 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
totality | +9.471 |
deviations | +8.924 |
inaction | +8.896 |
distinguishing | +8.725 |
similarities | +8.679 |
Neg logit contributions | |
ien | -11.512 |
usk | -11.342 |
uty | -11.247 |
aga | -10.943 |
u | -10.831 |
Token | the |
Token ID | 262 |
Feature activation | +4.36e+01 |
Pos logit contributions | |
disadvantages | +5.765 |
totality | +5.484 |
inaction | +5.453 |
deviations | +5.440 |
fundamentals | +5.436 |
Neg logit contributions | |
ien | -9.005 |
u | -8.460 |
uty | -8.431 |
ump | -8.409 |
usk | -8.231 |
Token | subway |
Token ID | 19612 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
many | +18.421 |
moving | +18.366 |
things | +18.306 |
these | +18.285 |
those | +18.158 |
Neg logit contributions | |
uty | -11.341 |
usk | -11.216 |
elaide | -11.047 |
inion | -10.728 |
ien | -10.593 |
Token | . |
Token ID | 13 |
Feature activation | +5.86e+01 |
Pos logit contributions | |
totality | +14.034 |
deviations | +13.768 |
similarities | +13.706 |
distinguishing | +13.483 |
inaction | +13.479 |
Neg logit contributions | |
uty | -6.654 |
ien | -6.563 |
usk | -6.345 |
ump | -6.209 |
aga | -6.111 |
Token |
|
Token ID | 198 |
Feature activation | -3.02e+01 |
Pos logit contributions | |
The | +16.065 |
these | +16.004 |
those | +15.363 |
people | +14.910 |
Meaning | +14.904 |
Neg logit contributions | |
elaide | -15.576 |
teasp | -14.946 |
inion | -14.801 |
� | -14.483 |
ikes | -14.416 |
Token |
|
Token ID | 198 |
Feature activation | +6.81e+01 |
Pos logit contributions | |
u | +2.203 |
q | +1.445 |
- | +1.246 |
ab | +0.817 |
o | +0.721 |
Neg logit contributions | |
tremend | -29.903 |
eleph | -28.508 |
undermin | -27.759 |
cumbers | -27.740 |
hemor | -27.692 |
Token | The |
Token ID | 464 |
Feature activation | +7.95e+01 |
Pos logit contributions | |
things | +15.349 |
those | +14.930 |
these | +14.895 |
people | +14.692 |
the | +13.983 |
Neg logit contributions | |
teasp | -18.730 |
RandomRedditor | -17.841 |
| -17.837 |
� | -17.837 |
� | -17.821 |
Token | all |
Token ID | 477 |
Feature activation | +5.99e-01 |
Pos logit contributions | |
folks | +18.041 |
only | +17.785 |
most | +17.721 |
actual | +17.624 |
people | +17.613 |
Neg logit contributions | |
teasp | -17.067 |
ubes | -16.400 |
ActionCode | -16.305 |
oultry | -16.259 |
� | -16.207 |
Token | new |
Token ID | 649 |
Feature activation | +8.11e+01 |
Pos logit contributions | |
totality | +0.322 |
behavi | +0.317 |
deviations | +0.292 |
whichever | +0.290 |
hindsight | +0.284 |
Neg logit contributions | |
u | -0.295 |
- | -0.292 |
ien | -0.281 |
ire | -0.272 |
ump | -0.262 |
Token | Washington |
Token ID | 2669 |
Feature activation | +4.38e+01 |
Pos logit contributions | |
folks | +17.493 |
operating | +17.094 |
Wikipedia | +16.928 |
these | +16.648 |
reality | +16.577 |
Neg logit contributions | |
teasp | -18.039 |
ubes | -17.419 |
byss | -17.274 |
oultry | -17.125 |
ActionCode | -16.505 |
Token | Beer |
Token ID | 16971 |
Feature activation | +4.58e+01 |
Pos logit contributions | |
these | +9.486 |
reality | +9.441 |
folks | +9.439 |
people | +9.267 |
Wikipedia | +9.205 |
Neg logit contributions | |
elaide | -16.808 |
unn | -16.495 |
uty | -16.329 |
iren | -16.308 |
airo | -16.243 |
Token | Mobile |
Token ID | 12173 |
Feature activation | +4.58e+01 |
Pos logit contributions | |
folks | +12.123 |
moving | +12.086 |
operating | +11.949 |
these | +11.895 |
Operation | +11.879 |
Neg logit contributions | |
eteen | -16.545 |
ubes | -16.451 |
ien | -16.256 |
utch | -15.835 |
uty | -15.804 |
Token | App |
Token ID | 2034 |
Feature activation | +3.59e+01 |
Pos logit contributions | |
operating | +11.165 |
these | +11.119 |
folks | +11.019 |
moving | +10.580 |
people | +10.518 |
Neg logit contributions | |
ubes | -17.623 |
eteen | -17.451 |
uty | -17.277 |
lesiastical | -16.854 |
� | -16.803 |
Token | will |
Token ID | 481 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
these | +13.340 |
things | +12.982 |
totality | +12.958 |
many | +12.734 |
those | +12.667 |
Neg logit contributions | |
uty | -14.371 |
ien | -14.262 |
usk | -13.938 |
� | -13.886 |
inion | -13.644 |
Token | major |
Token ID | 1688 |
Feature activation | +6.94e-01 |
Pos logit contributions | |
similarities | +1.777 |
deviations | +1.730 |
disadvantages | +1.702 |
distinguishing | +1.651 |
behavi | +1.631 |
Neg logit contributions | |
u | -1.538 |
ien | -1.529 |
agin | -1.508 |
ust | -1.495 |
ump | -1.492 |
Token | economic |
Token ID | 3034 |
Feature activation | -2.66e+01 |
Pos logit contributions | |
similarities | +0.352 |
distinguishing | +0.329 |
disadvantages | +0.324 |
behavi | +0.321 |
totality | +0.319 |
Neg logit contributions | |
ien | -0.319 |
ump | -0.301 |
u | -0.301 |
� | -0.295 |
ike | -0.293 |
Token | downturn |
Token ID | 34540 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
- | +4.419 |
ike | +3.835 |
uma | +3.621 |
� | +3.070 |
ricane | +2.995 |
Neg logit contributions | |
Everyday | -13.591 |
Subtle | -13.029 |
somew | -13.029 |
similarities | -13.018 |
embodiments | -12.694 |
Token | . |
Token ID | 13 |
Feature activation | +6.04e+01 |
Pos logit contributions | |
. | +3.288 |
ock | +2.299 |
u | +2.264 |
- | +2.139 |
s | +2.074 |
Neg logit contributions | |
deviations | -8.752 |
anonymity | -8.630 |
similarities | -8.586 |
theless | -8.529 |
uniqueness | -8.480 |
Token |
|
Token ID | 198 |
Feature activation | -3.64e+01 |
Pos logit contributions | |
The | +15.942 |
Proposition | +15.248 |
Operation | +14.744 |
"… | +14.524 |
Lack | +14.494 |
Neg logit contributions | |
elaide | -19.105 |
teasp | -18.293 |
enei | -18.028 |
� | -17.405 |
ubes | -17.393 |
Token |
|
Token ID | 198 |
Feature activation | +8.10e+01 |
Pos logit contributions | |
u | +1.805 |
- | +1.079 |
| +1.003 |
q | +0.695 |
o | +0.273 |
Neg logit contributions | |
tremend | -36.881 |
eleph | -34.857 |
cumbers | -33.933 |
hemor | -33.808 |
exha | -33.804 |
Token | City |
Token ID | 14941 |
Feature activation | +3.12e+01 |
Pos logit contributions | |
� | +12.420 |
The | +12.417 |
However | +12.251 |
The | +12.098 |
things | +11.377 |
Neg logit contributions | |
teasp | -26.064 |
pione | -25.479 |
StreamerBot | -24.928 |
� | -24.855 |
RandomRedditor | -24.836 |
Token | Council |
Token ID | 4281 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
these | +11.500 |
inaction | +11.430 |
totality | +11.406 |
bureaucrats | +11.306 |
things | +11.291 |
Neg logit contributions | |
ien | -13.329 |
usk | -13.113 |
uty | -13.111 |
elaide | -12.639 |
ump | -12.593 |
Token | — |
Token ID | 960 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
totality | +8.403 |
similarities | +8.049 |
deviations | +8.019 |
distinguishing | +7.991 |
hindsight | +7.803 |
Neg logit contributions | |
ien | -8.676 |
usk | -8.536 |
uty | -8.466 |
ump | -8.127 |
u | -8.127 |
Token | 75 |
Token ID | 2425 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
totality | +11.037 |
distinguishing | +10.951 |
deviations | +10.770 |
disadvantages | +10.615 |
anonymity | +10.584 |
Neg logit contributions | |
ien | -4.522 |
u | -4.313 |
usk | -4.240 |
uty | -4.140 |
ab | -3.954 |
Token | % |
Token ID | 4 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
anonymity | +1.310 |
distinguishing | +1.303 |
totality | +1.293 |
disadvantages | +1.286 |
behavi | +1.272 |
Neg logit contributions | |
u | -0.242 |
inch | -0.235 |
q | -0.224 |
ien | -0.223 |
- | -0.199 |
Token | - |
Token ID | 12 |
Feature activation | +6.93e+00 |
Pos logit contributions | |
these | +19.588 |
those | +18.976 |
people | +18.471 |
things | +18.459 |
many | +18.448 |
Neg logit contributions | |
uty | -11.261 |
agin | -11.168 |
inion | -10.817 |
ascript | -10.606 |
usk | -10.560 |
Token | 5 |
Token ID | 20 |
Feature activation | +4.06e+01 |
Pos logit contributions | |
totality | +6.056 |
inaction | +5.927 |
distinguishing | +5.875 |
disadvantages | +5.857 |
anonymity | +5.851 |
Neg logit contributions | |
u | -1.342 |
ien | -1.213 |
ab | -1.080 |
inch | -1.055 |
ump | -1.014 |
Token | was |
Token ID | 373 |
Feature activation | +4.85e+01 |
Pos logit contributions | |
these | +18.083 |
those | +17.742 |
things | +17.554 |
totality | +17.388 |
people | +17.386 |
Neg logit contributions | |
uty | -10.722 |
usk | -10.526 |
inion | -10.286 |
ien | -10.245 |
agin | -10.092 |
Token | directly |
Token ID | 3264 |
Feature activation | +2.26e+01 |
Pos logit contributions | |
moving | +16.559 |
operating | +16.153 |
these | +16.005 |
those | +15.658 |
the | +15.378 |
Neg logit contributions | |
uty | -16.083 |
ikes | -14.974 |
ien | -14.889 |
inion | -14.808 |
ijah | -14.772 |
Token | overhead |
Token ID | 16965 |
Feature activation | +5.02e+01 |
Pos logit contributions | |
totality | +8.894 |
deviations | +8.432 |
distinguishing | +8.380 |
similarities | +8.323 |
inaction | +8.311 |
Neg logit contributions | |
ien | -11.859 |
uty | -11.725 |
usk | -11.689 |
aga | -11.276 |
ump | -11.224 |
Token | and |
Token ID | 290 |
Feature activation | +8.10e+01 |
Pos logit contributions | |
these | +17.292 |
those | +16.258 |
things | +15.713 |
many | +15.641 |
the | +15.553 |
Neg logit contributions | |
ien | -16.291 |
inion | -16.198 |
ikes | -15.982 |
usk | -15.865 |
yssey | -15.817 |
Token | could |
Token ID | 714 |
Feature activation | +2.94e+01 |
Pos logit contributions | |
these | +20.620 |
those | +19.821 |
the | +19.808 |
many | +19.220 |
it | +18.791 |
Neg logit contributions | |
| -19.578 |
| -19.538 |
� | -19.536 |
RandomRedditor | -19.532 |
| -19.493 |
Token | have |
Token ID | 423 |
Feature activation | +3.25e+01 |
Pos logit contributions | |
totality | +11.781 |
these | +11.709 |
things | +11.433 |
those | +11.371 |
distinguishing | +11.165 |
Neg logit contributions | |
ien | -13.011 |
uty | -12.998 |
usk | -12.861 |
inion | -12.222 |
aga | -12.219 |
Token | potentially |
Token ID | 6196 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
totality | +11.712 |
these | +11.679 |
those | +11.369 |
things | +11.346 |
many | +11.250 |
Neg logit contributions | |
uty | -15.572 |
ien | -15.110 |
usk | -14.937 |
inion | -14.442 |
igger | -14.350 |
Token | have |
Token ID | 423 |
Feature activation | +3.15e+01 |
Pos logit contributions | |
totality | +8.686 |
deviations | +8.413 |
distinguishing | +8.324 |
inaction | +8.321 |
similarities | +8.226 |
Neg logit contributions | |
ien | -10.316 |
usk | -10.217 |
uty | -9.967 |
ump | -9.926 |
aga | -9.900 |
Token | had |
Token ID | 550 |
Feature activation | +4.31e+01 |
Pos logit contributions | |
totality | +11.553 |
these | +11.546 |
things | +11.236 |
those | +11.233 |
many | +11.136 |
Neg logit contributions | |
uty | -15.129 |
ien | -14.711 |
usk | -14.509 |
inion | -14.080 |
igger | -13.928 |
Token | . |
Token ID | 13 |
Feature activation | +6.28e+01 |
Pos logit contributions | |
u | +0.507 |
aga | +0.497 |
ale | +0.481 |
ass | +0.477 |
ump | +0.470 |
Neg logit contributions | |
distinguishing | -0.953 |
totality | -0.938 |
deviations | -0.918 |
similarities | -0.901 |
hindsight | -0.901 |
Token | � |
Token ID | 447 |
Feature activation | -3.17e+01 |
Pos logit contributions | |
The | +14.722 |
"[ | +14.338 |
Standing | +14.208 |
Lack | +13.943 |
Canadians | +13.870 |
Neg logit contributions | |
teasp | -23.311 |
elaide | -22.629 |
� | -21.825 |
RandomRedditor | -21.767 |
| -21.745 |
Token | � |
Token ID | 251 |
Feature activation | +6.93e+01 |
Pos logit contributions | |
� | +8.153 |
� | +6.994 |
� | +6.941 |
� | +6.939 |
� | +6.867 |
Neg logit contributions | |
similarities | -16.053 |
pecul | -15.777 |
totality | -15.715 |
anonymity | -15.712 |
disadvantages | -15.621 |
Token |
|
Token ID | 198 |
Feature activation | -5.40e+01 |
Pos logit contributions | |
The | +16.394 |
these | +15.666 |
Standing | +15.512 |
Canadians | +15.457 |
One | +15.421 |
Neg logit contributions | |
teasp | -20.004 |
elaide | -19.856 |
ikuman | -19.289 |
� | -18.811 |
| -18.767 |
Token |
|
Token ID | 198 |
Feature activation | +5.61e+01 |
Pos logit contributions | |
| +3.926 |
- | +3.070 |
u | +2.624 |
q | +1.624 |
. | +1.312 |
Neg logit contributions | |
tremend | -45.592 |
eleph | -43.437 |
cumbers | -42.145 |
millenn | -41.701 |
exha | -41.614 |
Token | But |
Token ID | 1537 |
Feature activation | +8.10e+01 |
Pos logit contributions | |
� | +11.784 |
things | +11.627 |
those | +11.282 |
these | +11.271 |
� | +11.246 |
Neg logit contributions | |
teasp | -24.266 |
RandomRedditor | -23.256 |
� | -23.214 |
� | -23.191 |
| -23.190 |
Token | this |
Token ID | 428 |
Feature activation | +3.76e+01 |
Pos logit contributions | |
those | +20.330 |
these | +20.272 |
many | +19.704 |
the | +19.339 |
it | +19.089 |
Neg logit contributions | |
teasp | -21.053 |
� | -20.387 |
| -20.313 |
| -20.306 |
| -20.305 |
Token | year |
Token ID | 614 |
Feature activation | +2.99e+01 |
Pos logit contributions | |
reality | +13.645 |
totality | +13.614 |
inaction | +13.153 |
these | +13.128 |
similarities | +13.107 |
Neg logit contributions | |
uty | -15.735 |
usk | -14.939 |
ien | -14.917 |
ikes | -14.881 |
elaide | -14.737 |
Token | looks |
Token ID | 3073 |
Feature activation | -2.99e+01 |
Pos logit contributions | |
totality | +14.272 |
these | +13.783 |
things | +13.723 |
distinguishing | +13.700 |
similarities | +13.622 |
Neg logit contributions | |
uty | -12.211 |
ien | -12.193 |
usk | -12.107 |
aga | -11.529 |
ump | -11.458 |
Token | different |
Token ID | 1180 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
ash | +6.228 |
ath | +6.203 |
- | +6.012 |
b | +5.860 |
ien | +5.590 |
Neg logit contributions | |
behavi | -11.281 |
Principle | -10.879 |
DRAG | -10.480 |
76561 | -10.454 |
Individuals | -10.408 |
Token | . |
Token ID | 13 |
Feature activation | +6.42e+01 |
Pos logit contributions | |
. | +4.087 |
é | +3.596 |
u | +3.496 |
ab | +3.196 |
- | +3.003 |
Neg logit contributions | |
anonymity | -9.795 |
deviations | -9.750 |
uniqueness | -9.271 |
designers | -9.021 |
bureaucrats | -9.016 |
Token | 15 |
Token ID | 1315 |
Feature activation | -9.78e+01 |
Pos logit contributions | |
8 | +8.354 |
25 | +7.973 |
6 | +7.813 |
24 | +7.769 |
30 | +7.741 |
Neg logit contributions | |
behavi | -35.570 |
tremend | -34.758 |
cumbers | -34.722 |
conflic | -34.434 |
eleph | -33.515 |
Token | to |
Token ID | 284 |
Feature activation | -5.01e+01 |
Pos logit contributions | |
- | +16.178 |
th | +9.198 |
to | +9.197 |
am | +8.824 |
up | +8.610 |
Neg logit contributions | |
behavi | -22.455 |
undermin | -20.506 |
cumbers | -20.235 |
unnecess | -20.136 |
conflic | -19.601 |
Token | 21 |
Token ID | 2310 |
Feature activation | -8.65e+01 |
Pos logit contributions | |
20 | +5.303 |
Aug | +4.941 |
16 | +4.562 |
17 | +4.555 |
18 | +4.484 |
Neg logit contributions | |
behavi | -24.643 |
unnecess | -22.956 |
cumbers | -22.926 |
eleph | -21.943 |
tremend | -21.813 |
Token | among |
Token ID | 1871 |
Feature activation | -8.27e+01 |
Pos logit contributions | |
. | +10.900 |
- | +9.320 |
, | +7.658 |
; | +7.179 |
ien | +6.782 |
Neg logit contributions | |
behavi | -22.985 |
comr | -22.931 |
cumbers | -22.681 |
unnecess | -22.259 |
ingred | -22.125 |
Token | 1 |
Token ID | 352 |
Feature activation | -1.45e+02 |
Pos logit contributions | |
1 | +8.327 |
ab | +7.817 |
ien | +6.907 |
1 | +6.823 |
8 | +6.773 |
Neg logit contributions | |
behavi | -21.672 |
cumbers | -20.269 |
unnecess | -20.011 |
multiplying | -19.220 |
disadvant | -19.209 |
Token | , |
Token ID | 11 |
Feature activation | -1.48e+02 |
Pos logit contributions | |
, | +11.240 |
- | +10.112 |
k | +8.237 |
α | +8.215 |
125 | +7.866 |
Neg logit contributions | |
behavi | -29.289 |
unnecess | -27.524 |
acron | -27.124 |
reconc | -26.620 |
disadvant | -26.415 |
Token | 488 |
Token ID | 33646 |
Feature activation | -6.20e+01 |
Pos logit contributions | |
07 | +15.409 |
005 | +15.356 |
08 | +15.330 |
016 | +15.313 |
06 | +15.196 |
Neg logit contributions | |
behavi | -26.772 |
unnecess | -25.353 |
hemor | -24.901 |
disadvant | -24.520 |
fundamentals | -22.757 |
Token | voters |
Token ID | 4446 |
Feature activation | -6.85e+01 |
Pos logit contributions | |
- | +7.736 |
usk | +7.006 |
1 | +6.993 |
2 | +6.911 |
ire | +6.791 |
Neg logit contributions | |
behavi | -20.203 |
tremend | -17.471 |
conflic | -17.294 |
undermin | -16.603 |
misunderstanding | -16.175 |
Token | in |
Token ID | 287 |
Feature activation | -4.51e+01 |
Pos logit contributions | |
. | +10.974 |
- | +8.727 |
ien | +7.926 |
, | +7.838 |
; | +7.767 |
Neg logit contributions | |
unnecess | -20.254 |
behavi | -20.167 |
cumbers | -19.705 |
pecul | -19.149 |
conflic | -18.240 |
Token | Florida |
Token ID | 4744 |
Feature activation | -3.62e+01 |
Pos logit contributions | |
- | +6.831 |
ien | +5.836 |
arter | +5.686 |
amp | +5.504 |
az | +5.487 |
Neg logit contributions | |
behavi | -16.484 |
unnecess | -15.516 |
cumbers | -14.108 |
misunder | -13.965 |
reluct | -13.293 |
Token | , |
Token ID | 11 |
Feature activation | -3.27e+00 |
Pos logit contributions | |
- | +6.292 |
usk | +6.251 |
. | +5.934 |
ien | +5.452 |
aga | +5.167 |
Neg logit contributions | |
unnecess | -15.091 |
behavi | -14.907 |
deviations | -14.812 |
tremend | -14.473 |
nefarious | -14.315 |
Token | . |
Token ID | 13 |
Feature activation | -8.35e+01 |
Pos logit contributions | |
. | +12.581 |
u | +10.259 |
- | +9.527 |
ien | +9.395 |
q | +8.522 |
Neg logit contributions | |
cumbers | -34.717 |
conflic | -33.371 |
behavi | -33.135 |
unnecess | -31.471 |
tremend | -31.396 |
Token | 15 |
Token ID | 1315 |
Feature activation | -9.78e+01 |
Pos logit contributions | |
8 | +8.354 |
25 | +7.973 |
6 | +7.813 |
24 | +7.769 |
30 | +7.741 |
Neg logit contributions | |
behavi | -35.570 |
tremend | -34.758 |
cumbers | -34.722 |
conflic | -34.434 |
eleph | -33.515 |
Token | to |
Token ID | 284 |
Feature activation | -5.01e+01 |
Pos logit contributions | |
- | +16.178 |
th | +9.198 |
to | +9.197 |
am | +8.824 |
up | +8.610 |
Neg logit contributions | |
behavi | -22.455 |
undermin | -20.506 |
cumbers | -20.235 |
unnecess | -20.136 |
conflic | -19.601 |
Token | 21 |
Token ID | 2310 |
Feature activation | -8.65e+01 |
Pos logit contributions | |
20 | +5.303 |
Aug | +4.941 |
16 | +4.562 |
17 | +4.555 |
18 | +4.484 |
Neg logit contributions | |
behavi | -24.643 |
unnecess | -22.956 |
cumbers | -22.926 |
eleph | -21.943 |
tremend | -21.813 |
Token | among |
Token ID | 1871 |
Feature activation | -8.27e+01 |
Pos logit contributions | |
. | +10.900 |
- | +9.320 |
, | +7.658 |
; | +7.179 |
ien | +6.782 |
Neg logit contributions | |
behavi | -22.985 |
comr | -22.931 |
cumbers | -22.681 |
unnecess | -22.259 |
ingred | -22.125 |
Token | 1 |
Token ID | 352 |
Feature activation | -1.45e+02 |
Pos logit contributions | |
1 | +8.327 |
ab | +7.817 |
ien | +6.907 |
1 | +6.823 |
8 | +6.773 |
Neg logit contributions | |
behavi | -21.672 |
cumbers | -20.269 |
unnecess | -20.011 |
multiplying | -19.220 |
disadvant | -19.209 |
Token | , |
Token ID | 11 |
Feature activation | -1.48e+02 |
Pos logit contributions | |
, | +11.240 |
- | +10.112 |
k | +8.237 |
α | +8.215 |
125 | +7.866 |
Neg logit contributions | |
behavi | -29.289 |
unnecess | -27.524 |
acron | -27.124 |
reconc | -26.620 |
disadvant | -26.415 |
Token | 488 |
Token ID | 33646 |
Feature activation | -6.20e+01 |
Pos logit contributions | |
07 | +15.409 |
005 | +15.356 |
08 | +15.330 |
016 | +15.313 |
06 | +15.196 |
Neg logit contributions | |
behavi | -26.772 |
unnecess | -25.353 |
hemor | -24.901 |
disadvant | -24.520 |
fundamentals | -22.757 |
Token | voters |
Token ID | 4446 |
Feature activation | -6.85e+01 |
Pos logit contributions | |
- | +7.736 |
usk | +7.006 |
1 | +6.993 |
2 | +6.911 |
ire | +6.791 |
Neg logit contributions | |
behavi | -20.203 |
tremend | -17.471 |
conflic | -17.294 |
undermin | -16.603 |
misunderstanding | -16.175 |
Token | in |
Token ID | 287 |
Feature activation | -4.51e+01 |
Pos logit contributions | |
. | +10.974 |
- | +8.727 |
ien | +7.926 |
, | +7.838 |
; | +7.767 |
Neg logit contributions | |
unnecess | -20.254 |
behavi | -20.167 |
cumbers | -19.705 |
pecul | -19.149 |
conflic | -18.240 |
Token | Florida |
Token ID | 4744 |
Feature activation | -3.62e+01 |
Pos logit contributions | |
- | +6.831 |
ien | +5.836 |
arter | +5.686 |
amp | +5.504 |
az | +5.487 |
Neg logit contributions | |
behavi | -16.484 |
unnecess | -15.516 |
cumbers | -14.108 |
misunder | -13.965 |
reluct | -13.293 |
Token |
|
Token ID | 198 |
Feature activation | -4.65e+01 |
Pos logit contributions | |
these | +9.847 |
Canadians | +9.302 |
things | +9.290 |
those | +9.287 |
Wikipedia | +9.201 |
Neg logit contributions | |
elaide | -16.055 |
usk | -15.764 |
uty | -15.730 |
teasp | -15.665 |
ien | -15.664 |
Token |
|
Token ID | 198 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
| +2.746 |
- | +2.387 |
u | +1.967 |
q | +1.406 |
o | +0.886 |
Neg logit contributions | |
tremend | -42.219 |
eleph | -40.445 |
cumbers | -38.782 |
millenn | -38.454 |
exha | -38.366 |
Token | Be |
Token ID | 3856 |
Feature activation | -3.34e+01 |
Pos logit contributions | |
things | +10.758 |
these | +10.710 |
those | +10.420 |
deviations | +10.157 |
similarities | +10.139 |
Neg logit contributions | |
teasp | -11.224 |
usk | -11.027 |
elaide | -10.951 |
uty | -10.949 |
ien | -10.729 |
Token | that |
Token ID | 326 |
Feature activation | -9.82e+01 |
Pos logit contributions | |
ale | +11.108 |
ag | +11.017 |
ien | +11.015 |
am | +10.725 |
av | +10.637 |
Neg logit contributions | |
totality | -9.746 |
timelines | -8.863 |
VIDEOS | -8.637 |
fundamentals | -8.395 |
misinformation | -8.236 |
Token | as |
Token ID | 355 |
Feature activation | -1.24e+02 |
Pos logit contributions | |
as | +8.553 |
- | +8.403 |
ag | +7.329 |
as | +7.313 |
orn | +6.940 |
Neg logit contributions | |
Palestin | -26.036 |
tremend | -25.285 |
cumbers | -24.603 |
conflic | -24.151 |
unnecess | -23.903 |
Token | it |
Token ID | 340 |
Feature activation | -1.40e+02 |
Pos logit contributions | |
ak | +8.302 |
- | +7.757 |
ix | +7.362 |
od | +7.339 |
av | +7.104 |
Neg logit contributions | |
tremend | -34.896 |
cumbers | -33.044 |
conflic | -32.955 |
enthusi | -32.449 |
behavi | -32.336 |
Token | may |
Token ID | 743 |
Feature activation | -7.44e+01 |
Pos logit contributions | |
may | +8.692 |
- | +6.390 |
av | +5.978 |
ome | +4.796 |
ius | +4.664 |
Neg logit contributions | |
� | -40.727 |
� | -40.600 |
tremend | -39.617 |
ThumbnailImage | -39.079 |
unnecess | -38.122 |
Token | , |
Token ID | 11 |
Feature activation | +4.54e+01 |
Pos logit contributions | |
- | +9.782 |
, | +9.708 |
u | +9.128 |
ene | +8.521 |
ig | +8.179 |
Neg logit contributions | |
totality | -14.944 |
somew | -14.821 |
horizont | -14.821 |
acron | -14.665 |
sacrific | -14.415 |
Token | there |
Token ID | 612 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
these | +17.293 |
many | +16.451 |
those | +16.378 |
things | +16.103 |
distinguishing | +15.884 |
Neg logit contributions | |
usk | -16.600 |
teasp | -15.813 |
uty | -15.602 |
aga | -15.430 |
ien | -15.384 |
Token | seems |
Token ID | 2331 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
ab | +2.213 |
ien | +2.146 |
un | +2.140 |
aven | +2.053 |
ene | +1.927 |
Neg logit contributions | |
behavi | -8.937 |
totality | -8.774 |
Hitman | -8.620 |
inaction | -8.455 |
hemor | -8.452 |
Token | to |
Token ID | 284 |
Feature activation | -4.02e+01 |
Pos logit contributions | |
ire | +3.741 |
- | +3.740 |
ab | +3.696 |
un | +3.669 |
to | +3.600 |
Neg logit contributions | |
Changing | -8.508 |
Organizations | -8.335 |
behavi | -8.314 |
Newsp | -8.259 |
Individuals | -8.250 |
Token | 60 |
Token ID | 1899 |
Feature activation | -3.73e+01 |
Pos logit contributions | |
0 | +7.475 |
u | +6.050 |
un | +5.373 |
q | +5.331 |
1 | +5.324 |
Neg logit contributions | |
totality | -13.676 |
behavi | -12.098 |
distinguishing | -12.010 |
disparate | -11.934 |
hindsight | -11.742 |
Token | s |
Token ID | 82 |
Feature activation | -4.92e+01 |
Pos logit contributions | |
u | +9.055 |
s | +8.532 |
q | +8.225 |
k | +7.802 |
b | +7.167 |
Neg logit contributions | |
behavi | -20.211 |
hemor | -19.683 |
metic | -18.936 |
tremend | -18.787 |
undermin | -18.662 |
Token | )} |
Token ID | 38165 |
Feature activation | -5.00e+01 |
Pos logit contributions | |
)} | +6.696 |
) | +5.811 |
u | +5.640 |
+) | +4.627 |
} | +4.534 |
Neg logit contributions | |
tremend | -26.922 |
behavi | -26.681 |
hemor | -25.546 |
unnecess | -25.136 |
conflic | -24.902 |
Token | 4 |
Token ID | 604 |
Feature activation | -7.23e+01 |
Pos logit contributions | |
b | +9.614 |
u | +8.886 |
g | +8.508 |
q | +8.310 |
oe | +8.129 |
Neg logit contributions | |
corrid | -13.923 |
disproportion | -13.690 |
behavi | -13.653 |
totality | -13.569 |
deviations | -13.411 |
Token | . |
Token ID | 13 |
Feature activation | -1.25e+02 |
Pos logit contributions | |
. | +9.897 |
- | +6.301 |
u | +5.385 |
q | +4.564 |
b | +4.499 |
Neg logit contributions | |
eleph | -45.622 |
tremend | -45.464 |
conflic | -43.016 |
� | -42.577 |
reluct | -42.523 |
Token | B |
Token ID | 347 |
Feature activation | -1.40e+02 |
Pos logit contributions | |
b | +13.487 |
g | +12.247 |
c | +12.072 |
q | +12.063 |
u | +11.567 |
Neg logit contributions | |
behavi | -18.412 |
eleph | -17.055 |
totality | -17.031 |
anonymity | -16.663 |
76561 | -16.272 |
Token | g |
Token ID | 70 |
Feature activation | -7.89e+01 |
Pos logit contributions | |
b | +18.633 |
g | +17.739 |
c | +17.543 |
d | +17.232 |
f | +17.198 |
Neg logit contributions | |
eleph | -27.505 |
behavi | -26.671 |
totality | -25.863 |
reluct | -23.609 |
hemor | -23.426 |
Token | 2 |
Token ID | 17 |
Feature activation | -7.40e+01 |
Pos logit contributions | |
2 | +11.868 |
3 | +11.336 |
5 | +10.873 |
6 | +10.850 |
4 | +10.826 |
Neg logit contributions | |
behavi | -30.553 |
eleph | -29.266 |
totality | -28.204 |
unnecess | -27.660 |
conflic | -26.866 |
Token | { |
Token ID | 1391 |
Feature activation | -4.92e+01 |
Pos logit contributions | |
b | +12.024 |
u | +11.531 |
q | +11.004 |
g | +10.828 |
+ | +10.558 |
Neg logit contributions | |
totality | -16.248 |
anonymity | -16.077 |
behavi | -15.872 |
academics | -15.425 |
distractions | -15.406 |
Token | ( |
Token ID | 7 |
Feature activation | -1.84e+01 |
Pos logit contributions | |
u | +5.061 |
q | +4.185 |
0 | +3.738 |
b | +3.567 |
- | +3.256 |
Neg logit contributions | |
eleph | -37.669 |
tremend | -36.491 |
reluct | -35.499 |
metic | -35.241 |
occas | -35.075 |
Token | 0 |
Token ID | 15 |
Feature activation | -3.98e+01 |
Pos logit contributions | |
0 | +3.843 |
u | +3.503 |
ab | +2.996 |
q | +2.926 |
un | +2.756 |
Neg logit contributions | |
behavi | -12.171 |
totality | -11.907 |
distinguishing | -11.460 |
hemor | -11.199 |
conflic | -11.040 |
Token | 20 |
Token ID | 1238 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
u | +4.685 |
q | +4.485 |
k | +4.364 |
s | +4.319 |
b | +4.215 |
Neg logit contributions | |
totality | -9.508 |
dissatisfaction | -9.040 |
whichever | -9.015 |
behavi | -8.979 |
academics | -8.905 |
Token | s |
Token ID | 82 |
Feature activation | -5.64e+01 |
Pos logit contributions | |
u | +5.100 |
q | +4.509 |
s | +4.481 |
ag | +3.719 |
k | +3.670 |
Neg logit contributions | |
behavi | -16.814 |
hemor | -16.313 |
tremend | -15.658 |
undermin | -15.452 |
disadvant | -15.380 |
Token | )} |
Token ID | 38165 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
)} | +7.149 |
) | +5.997 |
} | +5.242 |
+) | +4.198 |
u | +4.047 |
Neg logit contributions | |
tremend | -32.929 |
behavi | -32.091 |
metic | -31.429 |
hemor | -31.352 |
cumbers | -31.171 |
Token | 9 |
Token ID | 860 |
Feature activation | -4.90e+01 |
Pos logit contributions | |
u | +4.940 |
q | +4.656 |
ab | +4.567 |
b | +4.521 |
ien | +4.395 |
Neg logit contributions | |
academics | -10.803 |
totality | -10.234 |
distinguishing | -9.908 |
deviations | -9.723 |
individuality | -9.590 |
Token | . |
Token ID | 13 |
Feature activation | -1.15e+02 |
Pos logit contributions | |
. | +6.841 |
u | +4.948 |
- | +4.653 |
q | +4.445 |
b | +4.426 |
Neg logit contributions | |
tremend | -34.680 |
eleph | -34.644 |
reluct | -34.114 |
cumbers | -33.072 |
conflic | -33.032 |
Token | B |
Token ID | 347 |
Feature activation | -1.38e+02 |
Pos logit contributions | |
b | +12.818 |
q | +12.290 |
u | +11.482 |
c | +11.336 |
g | +11.234 |
Neg logit contributions | |
behavi | -18.332 |
totality | -16.852 |
eleph | -16.588 |
anonymity | -16.142 |
deviations | -15.824 |
Token | g |
Token ID | 70 |
Feature activation | -7.55e+01 |
Pos logit contributions | |
b | +18.672 |
xd | +17.889 |
g | +17.654 |
d | +17.339 |
c | +17.333 |
Neg logit contributions | |
behavi | -24.765 |
eleph | -24.109 |
totality | -23.587 |
reluct | -21.069 |
distinguishing | -20.871 |
Token | 5 |
Token ID | 20 |
Feature activation | -4.55e+01 |
Pos logit contributions | |
2 | +12.483 |
3 | +12.009 |
5 | +11.339 |
6 | +11.295 |
4 | +11.236 |
Neg logit contributions | |
behavi | -25.730 |
eleph | -24.625 |
totality | -24.396 |
unnecess | -23.505 |
anonymity | -22.429 |
Token | { |
Token ID | 1391 |
Feature activation | -5.43e+01 |
Pos logit contributions | |
b | +8.141 |
u | +7.939 |
q | +7.544 |
+ | +7.319 |
h | +7.054 |
Neg logit contributions | |
academics | -15.604 |
deviations | -15.464 |
anonymity | -15.432 |
totality | -15.170 |
embodiments | -15.146 |
Token | ( |
Token ID | 7 |
Feature activation | -4.79e+00 |
Pos logit contributions | |
u | +5.101 |
q | +4.937 |
( | +3.879 |
b | +3.807 |
- | +3.695 |
Neg logit contributions | |
eleph | -40.910 |
tremend | -40.005 |
metic | -38.706 |
reluct | -38.590 |
occas | -37.922 |
Token | 8 |
Token ID | 23 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
u | +0.974 |
q | +0.872 |
ab | +0.870 |
ien | +0.830 |
0 | +0.780 |
Neg logit contributions | |
behavi | -3.718 |
totality | -3.691 |
distinguishing | -3.567 |
deviations | -3.461 |
disadvantages | -3.425 |
Token | 900 |
Token ID | 12865 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
20 | +8.623 |
30 | +8.337 |
25 | +7.923 |
00 | +7.823 |
40 | +7.388 |
Neg logit contributions | |
behavi | -28.455 |
hemor | -26.904 |
eleph | -26.730 |
tremend | -26.669 |
conflic | -26.439 |
Token | + |
Token ID | 10 |
Feature activation | -4.39e+01 |
Pos logit contributions | |
u | +3.717 |
"] | +3.490 |
q | +3.313 |
k | +3.190 |
o | +3.186 |
Neg logit contributions | |
distinguishing | -8.580 |
behavi | -8.260 |
totality | -8.106 |
irony | -8.050 |
anonymity | -7.994 |
Token | 30 |
Token ID | 1270 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
30 | +7.891 |
0 | +7.618 |
20 | +7.290 |
00 | +6.967 |
40 | +6.541 |
Neg logit contributions | |
behavi | -24.680 |
hemor | -24.057 |
conflic | -23.962 |
eleph | -23.229 |
tremend | -23.099 |
Token | "] |
Token ID | 8973 |
Feature activation | -4.15e+01 |
Pos logit contributions | |
u | +4.236 |
ien | +3.625 |
aga | +3.424 |
"] | +3.417 |
uty | +3.364 |
Neg logit contributions | |
totality | -10.852 |
distinguishing | -10.759 |
dissatisfaction | -10.307 |
irony | -10.277 |
spont | -10.108 |
Token | 1 |
Token ID | 352 |
Feature activation | -7.78e+01 |
Pos logit contributions | |
1 | +7.691 |
- | +7.023 |
u | +6.633 |
ab | +6.606 |
int | +6.326 |
Neg logit contributions | |
behavi | -15.320 |
behav | -15.122 |
compan | -14.248 |
lobb | -13.901 |
distractions | -13.792 |
Token | . |
Token ID | 13 |
Feature activation | -1.37e+02 |
Pos logit contributions | |
. | +11.764 |
- | +9.663 |
h | +9.051 |
hr | +6.904 |
m | +6.619 |
Neg logit contributions | |
destro | -28.831 |
ModLoader | -27.117 |
reluct | -26.159 |
therap | -26.090 |
cumbers | -25.616 |
Token | d |
Token ID | 288 |
Feature activation | -7.37e+01 |
Pos logit contributions | |
b | +15.678 |
c | +14.207 |
d | +13.584 |
f | +13.240 |
g | +13.161 |
Neg logit contributions | |
appropri | -21.154 |
gratification | -20.655 |
distinguishing | -20.604 |
etheless | -20.569 |
academics | -20.507 |
Token | 4 |
Token ID | 19 |
Feature activation | -8.81e+01 |
Pos logit contributions | |
4 | +10.801 |
xe | +10.778 |
6 | +10.598 |
5 | +10.527 |
xc | +9.950 |
Neg logit contributions | |
behavi | -31.702 |
eleph | -30.862 |
totality | -28.785 |
disparate | -28.621 |
unnecess | -27.965 |
Token | { |
Token ID | 1391 |
Feature activation | -4.28e+01 |
Pos logit contributions | |
b | +12.516 |
+ | +12.257 |
- | +11.871 |
u | +11.796 |
q | +11.712 |
Neg logit contributions | |
eleph | -16.345 |
behavi | -16.014 |
totality | -15.477 |
academics | -15.338 |
anonymity | -15.266 |
Token | ( |
Token ID | 7 |
Feature activation | -1.71e+01 |
Pos logit contributions | |
u | +11.159 |
end | +10.401 |
b | +10.006 |
ab | +9.772 |
ien | +9.540 |
Neg logit contributions | |
totality | -12.605 |
distractions | -11.635 |
hindsight | -11.521 |
revolving | -11.281 |
academics | -11.272 |
Token | 0 |
Token ID | 15 |
Feature activation | -4.58e+01 |
Pos logit contributions | |
u | +3.812 |
q | +3.582 |
0 | +3.544 |
ab | +3.476 |
un | +3.116 |
Neg logit contributions | |
totality | -10.823 |
behavi | -10.345 |
distinguishing | -10.059 |
deviations | -9.761 |
fundamentals | -9.587 |
Token | 28 |
Token ID | 2579 |
Feature activation | -9.78e+01 |
Pos logit contributions | |
- | +9.296 |
u | +7.992 |
25 | +7.184 |
24 | +7.145 |
8 | +7.099 |
Neg logit contributions | |
tremend | -32.703 |
cumbers | -32.156 |
behavi | -32.067 |
eleph | -31.859 |
unnecess | -30.460 |
Token | , |
Token ID | 11 |
Feature activation | -9.49e+01 |
Pos logit contributions | |
- | +9.885 |
, | +9.842 |
. | +9.010 |
th | +7.826 |
u | +7.561 |
Neg logit contributions | |
cumbers | -31.640 |
tremend | -31.520 |
unnecess | -29.553 |
behavi | -29.096 |
undermin | -29.016 |
Token | 2014 |
Token ID | 1946 |
Feature activation | -1.05e+02 |
Pos logit contributions | |
2014 | +8.286 |
2015 | +7.626 |
2016 | +7.102 |
2013 | +6.801 |
2017 | +6.580 |
Neg logit contributions | |
behavi | -27.241 |
hemor | -26.998 |
cumbers | -26.602 |
unnecess | -25.669 |
tremend | -24.963 |
Token | . |
Token ID | 13 |
Feature activation | -8.28e+01 |
Pos logit contributions | |
. | +14.317 |
- | +9.393 |
u | +7.488 |
., | +6.980 |
uty | +6.905 |
Neg logit contributions | |
cumbers | -32.087 |
tremend | -30.742 |
tiss | -28.979 |
eleph | -28.758 |
ccording | -28.021 |
Token | REUTERS |
Token ID | 15862 |
Feature activation | -7.71e+01 |
Pos logit contributions | |
REUTERS | +11.384 |
RE | +9.957 |
u | +8.835 |
- | +8.778 |
o | +8.647 |
Neg logit contributions | |
tremend | -20.868 |
distinguishing | -19.978 |
disadvantages | -19.707 |
totality | -19.603 |
fundamentals | -19.395 |
Token | / |
Token ID | 14 |
Feature activation | -1.35e+02 |
Pos logit contributions | |
/ | +11.400 |
- | +8.478 |
_ | +6.703 |
q | +5.557 |
u | +5.229 |
Neg logit contributions | |
eleph | -37.083 |
tremend | -36.431 |
hemor | -34.384 |
undermin | -34.194 |
cumbers | -33.840 |
Token | Michael |
Token ID | 13256 |
Feature activation | -9.69e+01 |
Pos logit contributions | |
V | +14.324 |
U | +13.588 |
u | +13.267 |
K | +13.235 |
Max | +12.751 |
Neg logit contributions | |
hemor | -30.575 |
eleph | -29.990 |
reluct | -28.881 |
totality | -28.761 |
tremend | -28.368 |
Token | K |
Token ID | 509 |
Feature activation | -1.15e+02 |
Pos logit contributions | |
a | +15.368 |
o | +14.413 |
ak | +13.022 |
k | +12.760 |
aa | +12.101 |
Neg logit contributions | |
totality | -30.055 |
unnecess | -26.374 |
inaction | -25.659 |
mileage | -25.478 |
temptation | -25.403 |
Token | lim |
Token ID | 2475 |
Feature activation | -9.36e+01 |
Pos logit contributions | |
orn | +15.136 |
lim | +14.579 |
arp | +13.812 |
ort | +12.652 |
iner | +12.609 |
Neg logit contributions | |
龍契士 | -39.610 |
contradictions | -35.313 |
fundamentals | -34.952 |
tremend | -34.851 |
undermin | -34.562 |
Token | enty |
Token ID | 3787 |
Feature activation | -5.66e+01 |
Pos logit contributions | |
enty | +13.172 |
ov | +5.449 |
kin | +5.099 |
ash | +4.308 |
chuk | +4.239 |
Neg logit contributions | |
misunder | -48.476 |
tremend | -46.785 |
morp | -45.941 |
convol | -45.939 |
unheard | -44.558 |
Token | ev |
Token ID | 1990 |
Feature activation | -5.51e+01 |
Pos logit contributions | |
ev | +8.397 |
uk | +8.028 |
v | +6.879 |
usk | +6.526 |
av | +5.547 |
Neg logit contributions | |
behavi | -29.944 |
Palestin | -28.506 |
unnecess | -27.969 |
cumbers | -27.705 |
hemor | -27.028 |
Token | 1 |
Token ID | 352 |
Feature activation | -1.15e+02 |
Pos logit contributions | |
24 | +8.233 |
8 | +8.183 |
20 | +8.139 |
25 | +8.072 |
u | +8.070 |
Neg logit contributions | |
behavi | -34.559 |
tremend | -34.357 |
cumbers | -33.655 |
conflic | -32.697 |
eleph | -32.516 |
Token | , |
Token ID | 11 |
Feature activation | -7.96e+01 |
Pos logit contributions | |
. | +11.933 |
, | +10.943 |
., | +9.426 |
q | +9.231 |
k | +9.063 |
Neg logit contributions | |
totality | -21.178 |
comr | -20.285 |
pesky | -19.930 |
behavi | -19.536 |
sacrific | -19.453 |
Token | 9 |
Token ID | 860 |
Feature activation | -8.34e+01 |
Pos logit contributions | |
2015 | +8.089 |
2016 | +7.475 |
u | +7.341 |
2014 | +7.301 |
2017 | +6.889 |
Neg logit contributions | |
unnecess | -21.787 |
behavi | -21.323 |
cumbers | -20.803 |
hemor | -20.623 |
welf | -20.455 |
Token | a |
Token ID | 257 |
Feature activation | -1.06e+02 |
Pos logit contributions | |
am | +14.615 |
pm | +12.867 |
- | +12.134 |
ab | +11.933 |
ix | +11.893 |
Neg logit contributions | |
behavi | -16.044 |
totality | -15.723 |
Palestin | -15.674 |
spont | -15.579 |
unnecess | -15.253 |
Token | . |
Token ID | 13 |
Feature activation | -1.19e+02 |
Pos logit contributions | |
. | +13.377 |
u | +8.303 |
- | +7.532 |
q | +7.322 |
o | +6.844 |
Neg logit contributions | |
cumbers | -43.782 |
tremend | -43.192 |
eleph | -42.051 |
conflic | -40.251 |
occas | -40.235 |
Token | m |
Token ID | 76 |
Feature activation | -1.35e+02 |
Pos logit contributions | |
m | +15.832 |
k | +8.565 |
u | +7.816 |
b | +7.565 |
d | +7.313 |
Neg logit contributions | |
tremend | -55.975 |
cumbers | -55.516 |
reluct | -54.828 |
conflic | -54.576 |
millenn | -54.477 |
Token | . |
Token ID | 13 |
Feature activation | -1.10e+02 |
Pos logit contributions | |
. | +15.849 |
., | +15.770 |
.; | +13.899 |
ire | +12.653 |
uty | +12.556 |
Neg logit contributions | |
totality | -19.919 |
resemb | -18.491 |
hindsight | -18.388 |
symbolism | -18.279 |
disadvantages | -18.276 |
Token | PT |
Token ID | 19310 |
Feature activation | -9.03e+01 |
Pos logit contributions | |
<|endoftext|> | +10.818 |
ock | +10.518 |
| | +9.905 |
c | +9.608 |
ok | +9.567 |
Neg logit contributions | |
resemb | -21.730 |
Sorceress | -20.722 |
totality | -19.848 |
somet | -19.799 |
comr | -19.770 |
Token | . |
Token ID | 13 |
Feature activation | -8.45e+01 |
Pos logit contributions | |
. | +13.831 |
inion | +11.129 |
| | +11.045 |
; | +10.700 |
ix | +10.603 |
Neg logit contributions | |
resemb | -19.132 |
pecul | -18.857 |
semblance | -17.641 |
totality | -17.618 |
comr | -17.230 |
Token |
|
Token ID | 198 |
Feature activation | -8.96e+01 |
Pos logit contributions | |
<|endoftext|> | +11.002 |
u | +10.538 |
| | +9.682 |
ix | +9.672 |
| +9.385 |
Neg logit contributions | |
totality | -20.088 |
disadvant | -19.168 |
pecul | -18.751 |
individuality | -18.718 |
spont | -18.573 |
Token |
|
Token ID | 198 |
Feature activation | -5.76e+01 |
Pos logit contributions | |
| +8.094 |
- | +5.901 |
u | +5.613 |
q | +4.531 |
. | +4.120 |
Neg logit contributions | |
tremend | -53.082 |
eleph | -49.853 |
cumbers | -48.389 |
exha | -47.735 |
� | -47.701 |
Token | 97 |
Token ID | 5607 |
Feature activation | -3.06e+01 |
Pos logit contributions | |
u | +0.188 |
ab | +0.166 |
ien | +0.164 |
q | +0.163 |
usk | +0.141 |
Neg logit contributions | |
totality | -0.780 |
behavi | -0.771 |
distinguishing | -0.753 |
deviations | -0.733 |
disadvantages | -0.726 |
Token | s |
Token ID | 82 |
Feature activation | -5.87e+01 |
Pos logit contributions | |
s | +7.167 |
k | +6.042 |
q | +5.938 |
u | +5.897 |
b | +5.111 |
Neg logit contributions | |
behavi | -16.388 |
hemor | -15.981 |
tremend | -15.304 |
unnecess | -14.959 |
comr | -14.933 |
Token | )} |
Token ID | 38165 |
Feature activation | -5.50e+00 |
Pos logit contributions | |
)} | +6.859 |
) | +5.263 |
} | +4.841 |
+) | +3.754 |
}) | +3.528 |
Neg logit contributions | |
tremend | -35.110 |
behavi | -34.081 |
eleph | -33.438 |
hemor | -33.385 |
metic | -33.379 |
Token | 10 |
Token ID | 838 |
Feature activation | -5.32e+01 |
Pos logit contributions | |
q | +1.411 |
u | +1.289 |
b | +1.264 |
ab | +1.175 |
oe | +1.122 |
Neg logit contributions | |
distinguishing | -3.712 |
academics | -3.680 |
totality | -3.603 |
similarities | -3.536 |
behavi | -3.519 |
Token | . |
Token ID | 13 |
Feature activation | -1.05e+02 |
Pos logit contributions | |
. | +7.831 |
u | +5.503 |
- | +5.420 |
b | +4.381 |
q | +4.288 |
Neg logit contributions | |
eleph | -37.531 |
tremend | -37.468 |
reluct | -35.727 |
cumbers | -35.327 |
conflic | -35.311 |
Token | B |
Token ID | 347 |
Feature activation | -1.35e+02 |
Pos logit contributions | |
b | +12.706 |
q | +12.048 |
u | +11.673 |
g | +11.225 |
c | +11.097 |
Neg logit contributions | |
behavi | -18.401 |
totality | -16.798 |
eleph | -16.491 |
anonymity | -16.058 |
deviations | -15.921 |
Token | xe |
Token ID | 27705 |
Feature activation | -5.15e+01 |
Pos logit contributions | |
b | +18.059 |
g | +17.756 |
xd | +17.182 |
xe | +17.140 |
c | +16.978 |
Neg logit contributions | |
behavi | -26.524 |
eleph | -25.725 |
totality | -24.584 |
reluct | -22.006 |
distinguishing | -21.828 |
Token | 7 |
Token ID | 22 |
Feature activation | -4.45e+01 |
Pos logit contributions | |
5 | +9.601 |
6 | +9.407 |
4 | +9.355 |
7 | +8.648 |
3 | +8.631 |
Neg logit contributions | |
behavi | -22.699 |
totality | -21.827 |
unnecess | -20.121 |
undermin | -19.998 |
conflic | -19.849 |
Token | { |
Token ID | 1391 |
Feature activation | -5.42e+01 |
Pos logit contributions | |
b | +7.723 |
xe | +7.636 |
+ | +7.500 |
u | +7.276 |
q | +7.057 |
Neg logit contributions | |
deviations | -16.232 |
totality | -15.946 |
academics | -15.890 |
anonymity | -15.869 |
embodiments | -15.811 |
Token | ( |
Token ID | 7 |
Feature activation | -7.51e+00 |
Pos logit contributions | |
u | +4.929 |
q | +4.718 |
( | +3.679 |
b | +3.570 |
0 | +3.344 |
Neg logit contributions | |
eleph | -41.405 |
tremend | -40.464 |
reluct | -38.890 |
metic | -38.835 |
occas | -38.300 |
Token | 66 |
Token ID | 2791 |
Feature activation | -3.55e+01 |
Pos logit contributions | |
u | +1.419 |
ab | +1.296 |
q | +1.256 |
ien | +1.169 |
0 | +1.133 |
Neg logit contributions | |
behavi | -5.800 |
totality | -5.715 |
distinguishing | -5.505 |
disadvantages | -5.337 |
deviations | -5.322 |
Token | for |
Token ID | 329 |
Feature activation | -7.85e+01 |
Pos logit contributions | |
- | +7.793 |
. | +6.270 |
uty | +6.203 |
ial | +5.946 |
/ | +5.873 |
Neg logit contributions | |
cumbers | -16.653 |
bureaucrats | -16.298 |
behavi | -15.933 |
totality | -15.707 |
inaction | -15.276 |
Token | the |
Token ID | 262 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
ong | +11.726 |
ok | +11.094 |
- | +10.688 |
ak | +10.498 |
oto | +10.147 |
Neg logit contributions | |
disadvant | -15.534 |
behavi | -14.282 |
totality | -14.170 |
distortions | -14.127 |
contraceptives | -13.923 |
Token | Score |
Token ID | 26595 |
Feature activation | -3.81e+01 |
Pos logit contributions | |
Score | +4.935 |
ong | +4.684 |
u | +4.343 |
inion | +4.303 |
ike | +4.255 |
Neg logit contributions | |
disadvant | -10.558 |
predators | -10.449 |
bureaucrats | -10.419 |
totality | -10.305 |
privile | -10.209 |
Token | esports |
Token ID | 37407 |
Feature activation | -3.81e+01 |
Pos logit contributions | |
eSports | +1.642 |
esports | +1.371 |
. | +0.209 |
Esports | +0.118 |
inion | +0.114 |
Neg logit contributions | |
bragging | -22.925 |
disadvant | -22.769 |
brute | -22.767 |
throats | -22.638 |
alienation | -22.614 |
Token | . |
Token ID | 13 |
Feature activation | -8.62e+01 |
Pos logit contributions | |
. | +7.937 |
amp | +5.141 |
ong | +4.926 |
ock | +4.699 |
u | +4.697 |
Neg logit contributions | |
unnecess | -16.897 |
cumbers | -16.423 |
behavi | -16.261 |
brute | -16.093 |
totality | -16.049 |
Token | You |
Token ID | 921 |
Feature activation | -1.34e+02 |
Pos logit contributions | |
ak | +8.445 |
io | +8.339 |
u | +7.757 |
ai | +7.738 |
k | +7.502 |
Neg logit contributions | |
disadvant | -24.919 |
unnecess | -23.158 |
hindsight | -23.118 |
reconc | -22.846 |
behavi | -22.283 |
Token | can |
Token ID | 460 |
Feature activation | -1.31e+02 |
Pos logit contributions | |
can | +8.061 |
j | +5.541 |
ang | +3.805 |
q | +3.450 |
u | +2.845 |
Neg logit contributions | |
totality | -32.526 |
Seym | -32.366 |
Izan | -31.735 |
theless | -31.067 |
hindsight | -31.039 |
Token | follow |
Token ID | 1061 |
Feature activation | -9.23e+01 |
Pos logit contributions | |
follow | +6.168 |
reach | +4.470 |
ai | +4.417 |
find | +4.263 |
ail | +4.148 |
Neg logit contributions | |
disadvant | -31.437 |
privile | -28.628 |
inaction | -28.527 |
cumbers | -28.249 |
misunder | -28.109 |
Token | him |
Token ID | 683 |
Feature activation | -9.96e+01 |
Pos logit contributions | |
him | +8.690 |
aki | +7.714 |
ire | +7.379 |
ash | +7.142 |
ach | +7.067 |
Neg logit contributions | |
disadvant | -22.201 |
bureaucrats | -20.667 |
totality | -20.616 |
privile | -20.082 |
bureaucr | -19.585 |
Token | on |
Token ID | 319 |
Feature activation | -9.19e+01 |
Pos logit contributions | |
on | +8.750 |
ale | +8.051 |
u | +8.034 |
onian | +7.800 |
ip | +7.399 |
Neg logit contributions | |
totality | -25.538 |
bureaucrats | -25.414 |
Consent | -25.356 |
hindsight | -24.754 |
disadvant | -23.925 |
Token | Twitter |
Token ID | 3009 |
Feature activation | -6.56e+01 |
Pos logit contributions | |
- | +8.333 |
V | +8.027 |
ob | +7.822 |
u | +7.708 |
twitch | +7.355 |
Neg logit contributions | |
totality | -21.307 |
bureaucrats | -20.465 |
embodiments | -19.667 |
intermedi | -19.323 |
cottage | -19.283 |
Token | for |
Token ID | 329 |
Feature activation | -3.04e+01 |
Pos logit contributions | |
. | +6.609 |
- | +6.358 |
ved | +4.655 |
u | +4.545 |
, | +4.539 |
Neg logit contributions | |
behavi | -18.263 |
unnecess | -17.161 |
conflic | -16.873 |
cumbers | -16.251 |
tremend | -15.491 |
Token | Portland |
Token ID | 10727 |
Feature activation | -3.10e+01 |
Pos logit contributions | |
u | +5.080 |
aga | +4.887 |
ien | +4.706 |
illo | +4.644 |
ia | +4.366 |
Neg logit contributions | |
behavi | -13.247 |
unnecess | -11.752 |
disadvant | -11.538 |
disadvantages | -11.303 |
conflic | -11.031 |
Token | and |
Token ID | 290 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
. | +6.083 |
- | +5.805 |
u | +5.689 |
ia | +5.460 |
aga | +4.848 |
Neg logit contributions | |
unnecess | -13.444 |
behavi | -13.370 |
uniqueness | -13.301 |
individuality | -12.687 |
deviations | -12.597 |
Token | averaged |
Token ID | 16449 |
Feature activation | -9.60e+01 |
Pos logit contributions | |
- | +4.738 |
aga | +4.462 |
u | +4.416 |
ien | +4.276 |
ather | +4.235 |
Neg logit contributions | |
behavi | -13.886 |
unnecess | -12.030 |
conflic | -11.882 |
deviations | -11.182 |
tremend | -11.076 |
Token | 3 |
Token ID | 513 |
Feature activation | -9.68e+01 |
Pos logit contributions | |
7 | +8.584 |
11 | +8.427 |
6 | +8.320 |
8 | +8.238 |
12 | +7.987 |
Neg logit contributions | |
behavi | -24.922 |
conflic | -22.682 |
unnecess | -22.094 |
ortunately | -21.827 |
cumbers | -21.818 |
Token | . |
Token ID | 13 |
Feature activation | -1.33e+02 |
Pos logit contributions | |
. | +13.644 |
- | +10.594 |
½ | +9.698 |
pm | +8.346 |
b | +8.165 |
Neg logit contributions | |
Catalyst | -22.013 |
Mankind | -21.816 |
Situation | -21.652 |
totality | -21.524 |
pecul | -20.599 |
Token | 0 |
Token ID | 15 |
Feature activation | -8.36e+01 |
Pos logit contributions | |
8 | +15.704 |
0 | +15.396 |
6 | +15.253 |
7 | +15.036 |
5 | +14.412 |
Neg logit contributions | |
behavi | -32.787 |
conflic | -30.600 |
hemor | -30.089 |
tremend | -29.283 |
undermin | -28.894 |
Token | points |
Token ID | 2173 |
Feature activation | -6.17e+01 |
Pos logit contributions | |
p | +8.732 |
- | +8.698 |
g | +8.133 |
o | +8.058 |
pg | +7.778 |
Neg logit contributions | |
behavi | -20.911 |
pecul | -20.254 |
Canary | -19.359 |
behav | -19.296 |
reconc | -19.173 |
Token | and |
Token ID | 290 |
Feature activation | -7.86e+01 |
Pos logit contributions | |
. | +9.117 |
- | +8.433 |
, | +7.646 |
and | +6.791 |
/ | +6.715 |
Neg logit contributions | |
behavi | -19.627 |
conflic | -19.421 |
unnecess | -18.638 |
cumbers | -17.761 |
tremend | -17.609 |
Token | 3 |
Token ID | 513 |
Feature activation | -8.30e+01 |
Pos logit contributions | |
- | +8.426 |
0 | +8.217 |
1 | +7.798 |
2 | +7.779 |
3 | +7.318 |
Neg logit contributions | |
behavi | -19.518 |
ortunately | -17.961 |
conflic | -17.943 |
unnecess | -17.762 |
pecul | -16.327 |
Token | . |
Token ID | 13 |
Feature activation | -1.22e+02 |
Pos logit contributions | |
. | +11.424 |
- | +7.605 |
q | +5.014 |
u | +4.549 |
b | +4.505 |
Neg logit contributions | |
tremend | -43.187 |
ortunately | -42.362 |
conflic | -42.311 |
millenn | -41.169 |
eleph | -40.974 |
Token | has |
Token ID | 468 |
Feature activation | -4.72e+01 |
Pos logit contributions | |
ather | +6.065 |
's | +5.732 |
aded | +5.596 |
- | +5.531 |
u | +5.451 |
Neg logit contributions | |
behavi | -19.202 |
unnecess | -17.212 |
conflic | -16.727 |
Palestin | -16.420 |
senal | -15.863 |
Token | one |
Token ID | 530 |
Feature activation | -4.95e+01 |
Pos logit contributions | |
- | +7.369 |
scored | +6.637 |
been | +6.480 |
aga | +6.309 |
ather | +6.286 |
Neg logit contributions | |
behavi | -15.919 |
unnecess | -15.201 |
Dying | -13.751 |
conflic | -13.456 |
eleph | -13.387 |
Token | year |
Token ID | 614 |
Feature activation | -4.69e+01 |
Pos logit contributions | |
- | +10.684 |
u | +9.355 |
year | +8.776 |
ison | +8.449 |
ass | +7.865 |
Neg logit contributions | |
unnecess | -15.057 |
behavi | -14.844 |
Izan | -14.373 |
conflic | -13.890 |
Mankind | -13.721 |
Token | and |
Token ID | 290 |
Feature activation | -5.04e+01 |
Pos logit contributions | |
- | +7.766 |
of | +5.624 |
ago | +5.295 |
u | +4.892 |
long | +4.876 |
Neg logit contributions | |
unnecess | -17.613 |
conflic | -17.109 |
behavi | -17.097 |
Subtle | -16.937 |
Hast | -16.848 |
Token | $ |
Token ID | 720 |
Feature activation | -8.88e+01 |
Pos logit contributions | |
- | +7.327 |
ien | +5.651 |
$ | +5.265 |
aga | +4.775 |
11 | +4.769 |
Neg logit contributions | |
behavi | -19.045 |
unnecess | -18.128 |
conflic | -17.413 |
tremend | -16.291 |
eleph | -15.325 |
Token | 1 |
Token ID | 16 |
Feature activation | -1.32e+02 |
Pos logit contributions | |
8 | +12.079 |
6 | +11.694 |
7 | +11.297 |
12 | +10.920 |
10 | +10.806 |
Neg logit contributions | |
behavi | -41.630 |
conflic | -41.165 |
tremend | -40.720 |
hemor | -40.600 |
eleph | -39.810 |
Token | . |
Token ID | 13 |
Feature activation | -1.17e+02 |
Pos logit contributions | |
. | +15.152 |
- | +13.524 |
MM | +13.026 |
m | +12.597 |
million | +12.091 |
Neg logit contributions | |
resemb | -20.597 |
inaction | -20.103 |
totality | -19.781 |
behavi | -19.643 |
reflections | -19.617 |
Token | 35 |
Token ID | 2327 |
Feature activation | -1.03e+02 |
Pos logit contributions | |
8 | +14.147 |
6 | +13.967 |
5 | +13.965 |
25 | +13.601 |
7 | +13.313 |
Neg logit contributions | |
behavi | -40.293 |
tremend | -38.925 |
hemor | -38.648 |
conflic | -38.584 |
undermin | -38.332 |
Token | million |
Token ID | 1510 |
Feature activation | -4.36e+01 |
Pos logit contributions | |
- | +12.449 |
MM | +12.098 |
million | +11.645 |
m | +11.633 |
M | +11.207 |
Neg logit contributions | |
horizont | -22.583 |
totality | -21.926 |
behavi | -21.861 |
distortions | -20.874 |
resemb | -20.824 |
Token | left |
Token ID | 1364 |
Feature activation | -6.14e+01 |
Pos logit contributions | |
- | +6.781 |
ires | +4.758 |
ien | +4.591 |
ag | +4.504 |
. | +4.296 |
Neg logit contributions | |
Mothers | -18.886 |
tremend | -18.885 |
behavi | -18.381 |
Perspect | -18.146 |
Subtle | -17.841 |
Token | on |
Token ID | 319 |
Feature activation | -5.92e+01 |
Pos logit contributions | |
. | +6.495 |
on | +5.988 |
- | +5.829 |
u | +5.087 |
ien | +4.407 |
Neg logit contributions | |
Mothers | -22.217 |
unnecess | -22.019 |
Subtle | -21.908 |
comr | -21.859 |
tremend | -21.787 |
Token | the |
Token ID | 262 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
ong | +11.726 |
ok | +11.094 |
- | +10.688 |
ak | +10.498 |
oto | +10.147 |
Neg logit contributions | |
disadvant | -15.534 |
behavi | -14.282 |
totality | -14.170 |
distortions | -14.127 |
contraceptives | -13.923 |
Token | Score |
Token ID | 26595 |
Feature activation | -3.81e+01 |
Pos logit contributions | |
Score | +4.935 |
ong | +4.684 |
u | +4.343 |
inion | +4.303 |
ike | +4.255 |
Neg logit contributions | |
disadvant | -10.558 |
predators | -10.449 |
bureaucrats | -10.419 |
totality | -10.305 |
privile | -10.209 |
Token | esports |
Token ID | 37407 |
Feature activation | -3.81e+01 |
Pos logit contributions | |
eSports | +1.642 |
esports | +1.371 |
. | +0.209 |
Esports | +0.118 |
inion | +0.114 |
Neg logit contributions | |
bragging | -22.925 |
disadvant | -22.769 |
brute | -22.767 |
throats | -22.638 |
alienation | -22.614 |
Token | . |
Token ID | 13 |
Feature activation | -8.62e+01 |
Pos logit contributions | |
. | +7.937 |
amp | +5.141 |
ong | +4.926 |
ock | +4.699 |
u | +4.697 |
Neg logit contributions | |
unnecess | -16.897 |
cumbers | -16.423 |
behavi | -16.261 |
brute | -16.093 |
totality | -16.049 |
Token | You |
Token ID | 921 |
Feature activation | -1.34e+02 |
Pos logit contributions | |
ak | +8.445 |
io | +8.339 |
u | +7.757 |
ai | +7.738 |
k | +7.502 |
Neg logit contributions | |
disadvant | -24.919 |
unnecess | -23.158 |
hindsight | -23.118 |
reconc | -22.846 |
behavi | -22.283 |
Token | can |
Token ID | 460 |
Feature activation | -1.31e+02 |
Pos logit contributions | |
can | +8.061 |
j | +5.541 |
ang | +3.805 |
q | +3.450 |
u | +2.845 |
Neg logit contributions | |
totality | -32.526 |
Seym | -32.366 |
Izan | -31.735 |
theless | -31.067 |
hindsight | -31.039 |
Token | follow |
Token ID | 1061 |
Feature activation | -9.23e+01 |
Pos logit contributions | |
follow | +6.168 |
reach | +4.470 |
ai | +4.417 |
find | +4.263 |
ail | +4.148 |
Neg logit contributions | |
disadvant | -31.437 |
privile | -28.628 |
inaction | -28.527 |
cumbers | -28.249 |
misunder | -28.109 |
Token | him |
Token ID | 683 |
Feature activation | -9.96e+01 |
Pos logit contributions | |
him | +8.690 |
aki | +7.714 |
ire | +7.379 |
ash | +7.142 |
ach | +7.067 |
Neg logit contributions | |
disadvant | -22.201 |
bureaucrats | -20.667 |
totality | -20.616 |
privile | -20.082 |
bureaucr | -19.585 |
Token | on |
Token ID | 319 |
Feature activation | -9.19e+01 |
Pos logit contributions | |
on | +8.750 |
ale | +8.051 |
u | +8.034 |
onian | +7.800 |
ip | +7.399 |
Neg logit contributions | |
totality | -25.538 |
bureaucrats | -25.414 |
Consent | -25.356 |
hindsight | -24.754 |
disadvant | -23.925 |
Token | Twitter |
Token ID | 3009 |
Feature activation | -6.56e+01 |
Pos logit contributions | |
- | +8.333 |
V | +8.027 |
ob | +7.822 |
u | +7.708 |
twitch | +7.355 |
Neg logit contributions | |
totality | -21.307 |
bureaucrats | -20.465 |
embodiments | -19.667 |
intermedi | -19.323 |
cottage | -19.283 |
Token | . |
Token ID | 13 |
Feature activation | -5.65e+01 |
Pos logit contributions | |
. | +11.508 |
u | +9.876 |
ale | +8.541 |
ath | +8.358 |
- | +7.921 |
Neg logit contributions | |
totality | -18.505 |
bureaucrats | -17.975 |
behavi | -17.006 |
bureaucratic | -16.822 |
hindsight | -16.704 |
Token | t |
Token ID | 83 |
Feature activation | -9.10e+01 |
Pos logit contributions | |
t | +13.449 |
u | +9.162 |
k | +9.066 |
q | +8.917 |
o | +8.752 |
Neg logit contributions | |
eleph | -43.845 |
metic | -43.750 |
conflic | -43.009 |
tremend | -42.908 |
� | -42.834 |
Token | . |
Token ID | 13 |
Feature activation | +5.67e+00 |
Pos logit contributions | |
. | +11.985 |
- | +7.112 |
., | +6.457 |
u | +5.965 |
q | +5.931 |
Neg logit contributions | |
tremend | -49.389 |
eleph | -47.268 |
cumbers | -45.871 |
millenn | -45.275 |
practition | -44.843 |
Token | A |
Token ID | 317 |
Feature activation | -4.60e+01 |
Pos logit contributions | |
deviations | +2.657 |
distinguishing | +2.586 |
totality | +2.579 |
academics | +2.500 |
inaction | +2.494 |
Neg logit contributions | |
ien | -3.157 |
usk | -3.025 |
aga | -2.852 |
u | -2.848 |
illo | -2.807 |
Token | US |
Token ID | 2937 |
Feature activation | -4.07e+01 |
Pos logit contributions | |
US | +4.852 |
usk | +3.621 |
u | +2.687 |
AS | +2.627 |
UG | +2.542 |
Neg logit contributions | |
eleph | -35.757 |
tremend | -34.946 |
exha | -33.693 |
undermin | -33.437 |
cumbers | -33.314 |
Token | 12 |
Token ID | 1105 |
Feature activation | -8.27e+01 |
Pos logit contributions | |
u | +7.563 |
usk | +6.767 |
ar | +6.578 |
ale | +6.351 |
aru | +6.277 |
Neg logit contributions | |
morp | -17.155 |
hindsight | -15.421 |
inconven | -15.373 |
distinguishing | -15.316 |
ubiquitous | -15.284 |
Token | Michael |
Token ID | 3899 |
Feature activation | -1.31e+02 |
Pos logit contributions | |
athan | +10.688 |
ien | +9.833 |
- | +9.738 |
u | +9.731 |
o | +8.502 |
Neg logit contributions | |
behavi | -22.931 |
unnecess | -22.224 |
reluct | -21.636 |
undermin | -21.256 |
conflic | -20.617 |
Token | Matthews |
Token ID | 22233 |
Feature activation | -4.70e+01 |
Pos logit contributions | |
un | +13.717 |
um | +11.986 |
ia | +11.511 |
ina | +11.178 |
u | +11.136 |
Neg logit contributions | |
behavi | -29.316 |
hemor | -28.262 |
tremend | -28.063 |
76561 | -27.889 |
helicop | -27.453 |
Token | ( |
Token ID | 357 |
Feature activation | -6.74e+01 |
Pos logit contributions | |
- | +10.542 |
ien | +10.424 |
ak | +10.176 |
u | +10.049 |
aga | +9.749 |
Neg logit contributions | |
deviations | -14.751 |
totality | -14.624 |
embodiments | -14.462 |
inaction | -14.193 |
anonymity | -14.119 |
Token | R |
Token ID | 49 |
Feature activation | -7.89e+01 |
Pos logit contributions | |
GB | +10.056 |
O | +9.999 |
B | +9.022 |
Sky | +8.943 |
L | +8.910 |
Neg logit contributions | |
eleph | -30.601 |
reluct | -27.661 |
undermin | -27.025 |
citiz | -26.980 |
conflic | -26.691 |
Token | ab |
Token ID | 397 |
Feature activation | -5.34e+01 |
Pos logit contributions | |
ab | +17.968 |
amp | +15.494 |
abo | +15.018 |
ug | +14.776 |
ac | +14.760 |
Neg logit contributions | |
behavi | -22.402 |
Sorceress | -22.229 |
hemor | -22.011 |
totality | -21.905 |
moreover | -20.594 |
Token | ob |
Token ID | 672 |
Feature activation | -5.13e+01 |
Pos logit contributions | |
ob | +12.149 |
ab | +8.524 |
ib | +7.400 |
ub | +6.977 |
b | +6.624 |
Neg logit contributions | |
behavi | -34.603 |
unnecess | -31.254 |
hemor | -29.668 |
tremend | -29.555 |
cumbers | -28.943 |
Token | ( |
Token ID | 7 |
Feature activation | -2.42e+00 |
Pos logit contributions | |
u | +9.594 |
ien | +8.789 |
ab | +8.401 |
q | +8.176 |
un | +8.039 |
Neg logit contributions | |
totality | -13.420 |
deviations | -12.196 |
hindsight | -12.083 |
bureaucrats | -12.036 |
distinguishing | -11.978 |
Token | 0 |
Token ID | 15 |
Feature activation | -3.34e+01 |
Pos logit contributions | |
u | +0.370 |
ab | +0.329 |
q | +0.303 |
0 | +0.295 |
ien | +0.286 |
Neg logit contributions | |
totality | -2.109 |
behavi | -2.022 |
distinguishing | -2.013 |
deviations | -1.943 |
prevailing | -1.916 |
Token | s |
Token ID | 82 |
Feature activation | -4.96e+01 |
Pos logit contributions | |
u | +8.736 |
s | +8.592 |
q | +8.148 |
b | +7.879 |
ab | +7.734 |
Neg logit contributions | |
totality | -12.829 |
distinguishing | -12.627 |
whichever | -12.301 |
pecul | -12.208 |
geography | -12.164 |
Token | )} |
Token ID | 38165 |
Feature activation | -7.14e+01 |
Pos logit contributions | |
)} | +7.377 |
) | +6.635 |
u | +5.738 |
aga | +5.330 |
} | +5.278 |
Neg logit contributions | |
tremend | -24.992 |
behavi | -24.488 |
hemor | -23.710 |
unnecess | -23.217 |
cumbers | -23.007 |
Token | 2 |
Token ID | 362 |
Feature activation | -7.65e+01 |
Pos logit contributions | |
b | +11.680 |
u | +11.328 |
q | +11.002 |
c | +9.962 |
g | +9.273 |
Neg logit contributions | |
eleph | -14.995 |
moderation | -14.742 |
academics | -14.719 |
anonymity | -14.623 |
individuality | -14.547 |
Token | . |
Token ID | 13 |
Feature activation | -1.30e+02 |
Pos logit contributions | |
. | +10.460 |
- | +7.690 |
b | +6.981 |
u | +6.521 |
q | +5.837 |
Neg logit contributions | |
eleph | -43.562 |
tremend | -41.408 |
conflic | -41.394 |
reluct | -40.809 |
cumbers | -40.613 |
Token | N |
Token ID | 399 |
Feature activation | -1.25e+02 |
Pos logit contributions | |
b | +13.501 |
c | +12.462 |
q | +12.351 |
g | +11.756 |
f | +11.585 |
Neg logit contributions | |
behavi | -18.408 |
eleph | -18.055 |
totality | -17.029 |
76561 | -16.544 |
anonymity | -16.520 |
Token | f |
Token ID | 69 |
Feature activation | -6.88e+01 |
Pos logit contributions | |
f | +16.960 |
c | +16.931 |
b | +16.772 |
xd | +16.613 |
xe | +16.361 |
Neg logit contributions | |
eleph | -30.258 |
behavi | -28.461 |
totality | -27.487 |
reluct | -24.776 |
hemor | -24.688 |
Token | 3 |
Token ID | 18 |
Feature activation | -7.80e+01 |
Pos logit contributions | |
3 | +11.402 |
6 | +11.151 |
5 | +10.382 |
2 | +10.066 |
4 | +9.933 |
Neg logit contributions | |
behavi | -26.684 |
totality | -26.475 |
eleph | -25.777 |
unnecess | -25.115 |
anonymity | -24.410 |
Token | { |
Token ID | 1391 |
Feature activation | -5.06e+01 |
Pos logit contributions | |
b | +11.918 |
u | +11.778 |
+ | +11.137 |
q | +11.080 |
g | +10.920 |
Neg logit contributions | |
anonymity | -16.148 |
behavi | -15.923 |
totality | -15.903 |
eleph | -15.743 |
academics | -15.584 |
Token | ( |
Token ID | 7 |
Feature activation | -2.21e+01 |
Pos logit contributions | |
u | +6.341 |
q | +5.021 |
b | +4.438 |
0 | +4.424 |
ab | +4.034 |
Neg logit contributions | |
eleph | -33.571 |
tremend | -32.906 |
reluct | -32.101 |
occas | -31.719 |
hemor | -31.535 |
Token | , |
Token ID | 11 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
. | +6.730 |
- | +5.512 |
, | +4.532 |
; | +4.142 |
u | +3.903 |
Neg logit contributions | |
behavi | -14.233 |
unnecess | -13.074 |
deviations | -12.838 |
conflic | -12.772 |
Palestin | -12.661 |
Token | worth |
Token ID | 2861 |
Feature activation | -7.28e+01 |
Pos logit contributions | |
ien | +4.068 |
u | +3.782 |
ag | +3.658 |
aga | +3.620 |
ak | +3.576 |
Neg logit contributions | |
behavi | -6.972 |
unnecess | -6.354 |
deviations | -6.318 |
Subtle | -5.998 |
Governments | -5.963 |
Token | a |
Token ID | 257 |
Feature activation | -8.14e+01 |
Pos logit contributions | |
$ | +7.193 |
ien | +6.833 |
- | +6.831 |
le | +6.548 |
up | +6.366 |
Neg logit contributions | |
behavi | -18.444 |
cumbers | -17.545 |
unnecess | -16.766 |
conflic | -16.411 |
pecul | -15.862 |
Token | reported |
Token ID | 2098 |
Feature activation | -7.04e+01 |
Pos logit contributions | |
- | +9.351 |
q | +8.648 |
ak | +8.533 |
ik | +8.088 |
ab | +7.993 |
Neg logit contributions | |
behavi | -18.595 |
secondly | -17.900 |
Secondly | -17.804 |
disadvantages | -17.467 |
similarities | -17.295 |
Token | $ |
Token ID | 720 |
Feature activation | -9.95e+01 |
Pos logit contributions | |
- | +6.896 |
$ | +6.292 |
ien | +6.114 |
ag | +5.222 |
o | +5.167 |
Neg logit contributions | |
behavi | -22.408 |
unnecess | -20.615 |
disadvantages | -20.179 |
cumbers | -19.745 |
tremend | -19.514 |
Token | 22 |
Token ID | 1828 |
Feature activation | -1.30e+02 |
Pos logit contributions | |
8 | +12.594 |
6 | +12.432 |
7 | +12.086 |
25 | +11.923 |
12 | +11.733 |
Neg logit contributions | |
behavi | -39.214 |
conflic | -37.948 |
hemor | -37.804 |
tremend | -36.777 |
eleph | -36.723 |
Token | million |
Token ID | 1510 |
Feature activation | -3.88e+01 |
Pos logit contributions | |
- | +15.985 |
. | +14.597 |
million | +12.470 |
m | +12.373 |
MM | +11.339 |
Neg logit contributions | |
resemb | -21.612 |
totality | -21.585 |
behavi | -21.369 |
inaction | -20.156 |
reluct | -19.956 |
Token | , |
Token ID | 11 |
Feature activation | -4.66e+00 |
Pos logit contributions | |
. | +8.622 |
- | +7.697 |
ock | +6.176 |
ien | +5.927 |
k | +5.617 |
Neg logit contributions | |
behavi | -14.914 |
Mothers | -14.307 |
tremend | -13.764 |
Machines | -13.715 |
inaction | -13.627 |
Token | and |
Token ID | 290 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
ien | +1.538 |
u | +1.489 |
ag | +1.453 |
aga | +1.322 |
aven | +1.318 |
Neg logit contributions | |
behavi | -2.699 |
deviations | -2.467 |
inaction | -2.431 |
totality | -2.397 |
pecul | -2.396 |
Token | helped |
Token ID | 4193 |
Feature activation | -9.02e+00 |
Pos logit contributions | |
deviations | +6.655 |
behavi | +6.597 |
distinguishing | +6.476 |
totality | +6.448 |
disadvantages | +6.388 |
Neg logit contributions | |
ien | -6.654 |
aga | -6.161 |
usk | -6.157 |
u | -6.101 |
ike | -6.042 |
Token | the |
Token ID | 262 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
ien | +3.060 |
ank | +3.048 |
aki | +2.992 |
ump | +2.923 |
ock | +2.923 |
Neg logit contributions | |
behavi | -4.768 |
deviations | -4.636 |
disadvantages | -4.062 |
totality | -4.046 |
distinguishing | -3.998 |
Token |
|
Token ID | 198 |
Feature activation | -5.24e+01 |
Pos logit contributions | |
Operation | +14.547 |
The | +14.372 |
these | +14.265 |
Wikipedia | +13.992 |
those | +13.954 |
Neg logit contributions | |
elaide | -18.202 |
igger | -16.781 |
ikes | -16.705 |
teasp | -16.680 |
� | -16.387 |
Token |
|
Token ID | 198 |
Feature activation | +4.33e+01 |
Pos logit contributions | |
| +4.062 |
u | +3.740 |
- | +3.458 |
q | +2.787 |
k | +2.118 |
Neg logit contributions | |
tremend | -42.750 |
eleph | -40.125 |
cumbers | -39.183 |
exha | -38.969 |
millenn | -38.597 |
Token | Ken |
Token ID | 27827 |
Feature activation | -4.40e+01 |
Pos logit contributions | |
those | +14.020 |
these | +13.916 |
people | +13.832 |
things | +13.747 |
many | +13.544 |
Neg logit contributions | |
teasp | -14.889 |
RandomRedditor | -14.500 |
| -14.469 |
� | -14.459 |
| -14.452 |
Token | ichi |
Token ID | 16590 |
Feature activation | -5.34e+01 |
Pos logit contributions | |
ichi | +12.381 |
ich | +12.249 |
aki | +11.549 |
ji | +11.278 |
j | +10.770 |
Neg logit contributions | |
behavi | -15.202 |
totality | -15.157 |
positives | -14.248 |
fundamentals | -13.841 |
disadvantages | -13.757 |
Token | Shin |
Token ID | 11466 |
Feature activation | -9.39e+01 |
Pos logit contributions | |
aki | +11.442 |
u | +10.820 |
aga | +10.090 |
- | +9.413 |
o | +9.176 |
Neg logit contributions | |
behavi | -16.477 |
totality | -14.655 |
unnecess | -14.580 |
reluct | -14.187 |
hindsight | -13.760 |
Token | oda |
Token ID | 11329 |
Feature activation | -1.29e+02 |
Pos logit contributions | |
ag | +16.818 |
ig | +16.589 |
ob | +16.412 |
ab | +16.144 |
oh | +15.946 |
Neg logit contributions | |
behavi | -23.714 |
totality | -20.124 |
unnecess | -19.915 |
reluct | -19.897 |
inaction | -19.561 |
Token | , |
Token ID | 11 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
aga | +14.967 |
aki | +14.313 |
u | +14.203 |
- | +13.947 |
o | +13.841 |
Neg logit contributions | |
totality | -16.574 |
distractions | -15.609 |
disadvantages | -15.209 |
positives | -14.957 |
deviations | -14.831 |
Token | the |
Token ID | 262 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
uty | +4.138 |
u | +3.937 |
ag | +3.914 |
aga | +3.878 |
aki | +3.850 |
Neg logit contributions | |
totality | -5.540 |
deviations | -5.368 |
disadvantages | -5.275 |
idiots | -5.211 |
distractions | -5.055 |
Token | boss |
Token ID | 6478 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
totality | +6.583 |
deviations | +6.326 |
hindsight | +6.156 |
similarities | +6.116 |
disadvantages | +6.067 |
Neg logit contributions | |
uty | -9.031 |
ien | -8.818 |
u | -8.656 |
aki | -8.630 |
usk | -8.625 |
Token | of |
Token ID | 286 |
Feature activation | +3.80e+01 |
Pos logit contributions | |
u | +3.893 |
ong | +3.398 |
- | +3.346 |
agin | +3.243 |
aga | +3.200 |
Neg logit contributions | |
totality | -10.410 |
deviations | -10.080 |
hindsight | -9.977 |
disadvantages | -9.897 |
uniqueness | -9.895 |
Token | Japan |
Token ID | 2869 |
Feature activation | -6.06e+00 |
Pos logit contributions | |
these | +15.644 |
those | +15.392 |
many | +15.065 |
totality | +14.961 |
things | +14.771 |
Neg logit contributions | |
ien | -14.478 |
usk | -14.472 |
uty | -14.071 |
� | -13.510 |
elaide | -13.433 |
Token | Boh |
Token ID | 44366 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
many | +17.915 |
those | +17.770 |
these | +17.750 |
people | +17.164 |
neither | +17.132 |
Neg logit contributions | |
elaide | -16.944 |
� | -16.223 |
� | -15.917 |
| -15.909 |
RandomRedditor | -15.903 |
Token | oli |
Token ID | 11106 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
ol | +0.222 |
ale | +0.044 |
olo | +0.032 |
uty | +0.018 |
oe | +0.009 |
Neg logit contributions | |
distinguishing | -3.756 |
behavi | -3.753 |
bragging | -3.683 |
totality | -3.610 |
disparate | -3.597 |
Token | ub |
Token ID | 549 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
behavi | +0.209 |
totality | +0.203 |
deviations | +0.195 |
distinguishing | +0.194 |
inaction | +0.192 |
Neg logit contributions | |
ub | -0.000 |
ube | +0.003 |
u | +0.006 |
usk | +0.008 |
ab | +0.010 |
Token | ov |
Token ID | 709 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
ov | +3.908 |
u | +1.871 |
ovy | +1.360 |
un | +1.315 |
ove | +1.228 |
Neg logit contributions | |
behavi | -23.201 |
unnecess | -21.692 |
hemor | -21.668 |
cumbers | -21.657 |
tremend | -21.266 |
Token | could |
Token ID | 714 |
Feature activation | -1.12e+02 |
Pos logit contributions | |
aga | +3.663 |
u | +3.657 |
usk | +3.510 |
ien | +3.448 |
ube | +3.371 |
Neg logit contributions | |
disadvantages | -6.862 |
totality | -6.694 |
hindsight | -6.690 |
deviations | -6.478 |
distractions | -6.371 |
Token | not |
Token ID | 407 |
Feature activation | -1.28e+02 |
Pos logit contributions | |
o | +7.559 |
ada | +7.296 |
n | +7.211 |
ire | +7.073 |
ab | +6.835 |
Neg logit contributions | |
behavi | -28.487 |
Palestin | -24.233 |
millenn | -23.905 |
disadvant | -23.631 |
unnecess | -22.784 |
Token | be |
Token ID | 307 |
Feature activation | -1.12e+02 |
Pos logit contributions | |
be | +10.465 |
ate | +8.061 |
ire | +8.057 |
aki | +8.022 |
o | +7.885 |
Neg logit contributions | |
behavi | -27.815 |
soDeliveryDate | -24.163 |
senal | -22.779 |
millenn | -22.282 |
Palestin | -22.255 |
Token | located |
Token ID | 5140 |
Feature activation | -6.20e+01 |
Pos logit contributions | |
reached | +9.771 |
ached | +8.989 |
amed | +5.504 |
ire | +5.472 |
contacted | +5.327 |
Neg logit contributions | |
behavi | -25.399 |
pecul | -23.239 |
detrim | -23.194 |
conflic | -22.954 |
fundamentals | -22.898 |
Token | . |
Token ID | 13 |
Feature activation | +5.32e+01 |
Pos logit contributions | |
. | +11.477 |
un | +8.385 |
u | +8.189 |
ul | +7.798 |
o | +7.625 |
Neg logit contributions | |
cumbers | -16.229 |
disadvantages | -15.568 |
fundamentals | -15.562 |
inventions | -15.510 |
hindsight | -15.427 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +3.43e+01 |
Pos logit contributions | |
Wikipedia | +15.176 |
these | +15.078 |
The | +14.951 |
Priv | +14.927 |
"… | +14.786 |
Neg logit contributions | |
elaide | -18.397 |
teasp | -16.321 |
� | -16.022 |
RandomRedditor | -15.984 |
| -15.950 |
Token | The |
Token ID | 464 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
things | +16.913 |
these | +16.829 |
totality | +16.726 |
those | +16.520 |
inaction | +16.394 |
Neg logit contributions | |
uty | -10.030 |
usk | -9.930 |
ien | -9.840 |
aga | -9.294 |
� | -9.145 |
Token | an |
Token ID | 281 |
Feature activation | +3.37e+01 |
Pos logit contributions | |
u | +1.476 |
ved | +1.466 |
ada | +1.369 |
ab | +1.367 |
aga | +1.363 |
Neg logit contributions | |
behavi | -2.085 |
Actions | -2.060 |
unnecess | -2.047 |
Consumers | -2.032 |
Organizations | -1.967 |
Token | easy |
Token ID | 2562 |
Feature activation | +9.74e-01 |
Pos logit contributions | |
similarities | +11.915 |
totality | +11.748 |
everyday | +11.519 |
distinguishing | +11.471 |
these | +11.424 |
Neg logit contributions | |
usk | -14.859 |
ien | -14.588 |
elaide | -14.573 |
uty | -14.517 |
oultry | -14.345 |
Token | explanation |
Token ID | 7468 |
Feature activation | -7.33e+00 |
Pos logit contributions | |
behavi | +0.529 |
Actions | +0.522 |
deviations | +0.513 |
unnecess | +0.500 |
Organizations | +0.497 |
Neg logit contributions | |
- | -0.361 |
aga | -0.356 |
u | -0.352 |
ab | -0.343 |
aki | -0.335 |
Token | why |
Token ID | 1521 |
Feature activation | +4.83e+01 |
Pos logit contributions | |
. | +1.586 |
- | +1.365 |
u | +1.223 |
ip | +1.186 |
ab | +1.056 |
Neg logit contributions | |
cumbers | -4.870 |
behavi | -4.827 |
unnecess | -4.757 |
conflic | -4.745 |
ccording | -4.699 |
Token | . |
Token ID | 13 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
these | +16.884 |
people | +16.494 |
those | +16.358 |
things | +16.004 |
many | +15.242 |
Neg logit contributions | |
teasp | -19.245 |
| -19.003 |
� | -18.952 |
| -18.945 |
� | -18.926 |
Token |
|
Token ID | 198 |
Feature activation | -1.28e+02 |
Pos logit contributions | |
these | +8.721 |
things | +8.610 |
those | +8.378 |
totality | +8.294 |
people | +8.293 |
Neg logit contributions | |
uty | -15.310 |
elaide | -15.283 |
usk | -15.050 |
ien | -14.831 |
ump | -14.674 |
Token |
|
Token ID | 198 |
Feature activation | +4.98e+00 |
Pos logit contributions | |
| +10.181 |
- | +7.365 |
. | +5.030 |
u | +4.796 |
q | +4.360 |
Neg logit contributions | |
tremend | -61.506 |
eleph | -57.494 |
millenn | -56.626 |
� | -56.185 |
practition | -56.058 |
Token | " |
Token ID | 1 |
Feature activation | +3.84e+01 |
Pos logit contributions | |
totality | +4.376 |
hindsight | +4.118 |
behavi | +4.095 |
deviations | +4.073 |
distinguishing | +4.068 |
Neg logit contributions | |
u | -1.220 |
ien | -1.091 |
ab | -0.982 |
q | -0.938 |
un | -0.909 |
Token | It |
Token ID | 1026 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
people | +9.751 |
things | +9.735 |
those | +9.351 |
these | +9.294 |
Wikipedia | +8.824 |
Neg logit contributions | |
teasp | -20.873 |
| -19.334 |
StreamerBot | -19.311 |
RandomRedditor | -19.308 |
� | -19.294 |
Token | may |
Token ID | 743 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
behavi | +1.523 |
totality | +1.519 |
inaction | +1.514 |
Situation | +1.446 |
deviations | +1.424 |
Neg logit contributions | |
ab | -0.473 |
aven | -0.460 |
u | -0.459 |
ien | -0.433 |
ald | -0.420 |
Token | in |
Token ID | 287 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
ong | +4.162 |
o | +4.009 |
u | +3.858 |
ay | +3.825 |
- | +3.740 |
Neg logit contributions | |
behavi | -12.053 |
Palestin | -11.369 |
totality | -11.142 |
deviations | -10.979 |
Kinnikuman | -10.843 |
Token | 16 |
Token ID | 1467 |
Feature activation | -9.67e+01 |
Pos logit contributions | |
u | +8.667 |
- | +8.593 |
26 | +6.801 |
27 | +6.765 |
30 | +6.754 |
Neg logit contributions | |
behavi | -34.692 |
cumbers | -34.543 |
tremend | -34.022 |
eleph | -33.748 |
conflic | -33.171 |
Token | , |
Token ID | 11 |
Feature activation | -6.67e+01 |
Pos logit contributions | |
, | +8.474 |
- | +7.961 |
th | +6.816 |
. | +5.535 |
u | +5.469 |
Neg logit contributions | |
tremend | -50.110 |
cumbers | -47.218 |
conflic | -46.008 |
millenn | -45.842 |
exha | -45.512 |
Token | 2017 |
Token ID | 2177 |
Feature activation | -7.96e+01 |
Pos logit contributions | |
2017 | +6.156 |
2018 | +4.938 |
2017 | +4.910 |
u | +4.797 |
2016 | +4.773 |
Neg logit contributions | |
behavi | -25.540 |
hemor | -23.942 |
conflic | -23.680 |
cumbers | -23.425 |
Palestin | -23.176 |
Token | at |
Token ID | 379 |
Feature activation | -8.85e+01 |
Pos logit contributions | |
at | +6.503 |
- | +6.005 |
at | +5.329 |
. | +5.323 |
o | +4.444 |
Neg logit contributions | |
tremend | -36.604 |
cumbers | -35.705 |
Palestin | -34.985 |
conflic | -34.450 |
behavi | -34.265 |
Token | 9 |
Token ID | 860 |
Feature activation | -1.04e+02 |
Pos logit contributions | |
8 | +7.173 |
7 | +7.079 |
6 | +6.952 |
11 | +6.946 |
12 | +6.420 |
Neg logit contributions | |
behavi | -34.652 |
cumbers | -34.088 |
tremend | -33.845 |
conflic | -33.123 |
eleph | -32.489 |
Token | : |
Token ID | 25 |
Feature activation | -1.28e+02 |
Pos logit contributions | |
: | +10.421 |
am | +7.870 |
pm | +7.837 |
- | +7.717 |
. | +6.891 |
Neg logit contributions | |
tremend | -47.792 |
practition | -47.281 |
cumbers | -47.261 |
exha | -47.044 |
eleph | -46.966 |
Token | 28 |
Token ID | 2078 |
Feature activation | -9.04e+01 |
Pos logit contributions | |
06 | +14.188 |
08 | +13.989 |
02 | +13.761 |
07 | +13.433 |
05 | +13.243 |
Neg logit contributions | |
eleph | -52.283 |
behavi | -49.190 |
practition | -49.140 |
tremend | -49.119 |
conflic | -48.690 |
Token | am |
Token ID | 321 |
Feature activation | -8.40e+01 |
Pos logit contributions | |
am | +17.424 |
pm | +15.698 |
ab | +10.121 |
ak | +9.187 |
ag | +8.942 |
Neg logit contributions | |
fundamentals | -24.179 |
behavi | -24.162 |
inaction | -23.986 |
successors | -23.798 |
totality | -23.031 |
Token | PST |
Token ID | 28220 |
Feature activation | -6.38e+01 |
Pos logit contributions | |
- | +5.592 |
PST | +5.254 |
. | +4.500 |
id | +4.144 |
_ | +3.973 |
Neg logit contributions | |
cumbers | -31.566 |
tremend | -31.012 |
hemor | -29.931 |
conflic | -29.388 |
eleph | -28.213 |
Token |
|
Token ID | 198 |
Feature activation | -4.22e+01 |
Pos logit contributions | |
o | +9.703 |
| +9.350 |
illo | +9.164 |
ien | +9.080 |
ok | +8.963 |
Neg logit contributions | |
pecul | -15.113 |
hindsight | -14.645 |
deviations | -14.347 |
bureaucrats | -14.305 |
acron | -14.057 |
Token |
|
Token ID | 198 |
Feature activation | +4.58e+01 |
Pos logit contributions | |
u | +2.556 |
| +2.320 |
- | +2.143 |
q | +1.687 |
ab | +1.292 |
Neg logit contributions | |
tremend | -38.890 |
eleph | -37.222 |
cumbers | -36.336 |
undermin | -35.827 |
hemor | -35.707 |
Token |
|
Token ID | 198 |
Feature activation | -8.86e+01 |
Pos logit contributions | |
totality | +10.242 |
distinguishing | +10.000 |
deviations | +9.922 |
similarities | +9.779 |
inaction | +9.660 |
Neg logit contributions | |
ien | -9.779 |
usk | -9.643 |
uty | -9.564 |
aga | -9.222 |
u | -9.136 |
Token |
|
Token ID | 198 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
| +7.838 |
- | +5.899 |
u | +4.173 |
q | +3.801 |
. | +3.776 |
Neg logit contributions | |
tremend | -53.386 |
eleph | -50.809 |
cumbers | -49.207 |
undermin | -49.150 |
� | -48.701 |
Token | " |
Token ID | 1 |
Feature activation | +4.26e+01 |
Pos logit contributions | |
u | +2.305 |
q | +1.768 |
un | +1.731 |
ab | +1.658 |
ien | +1.543 |
Neg logit contributions | |
totality | -10.362 |
deviations | -10.010 |
dividing | -9.988 |
distinguishing | -9.946 |
behavi | -9.876 |
Token | So |
Token ID | 2396 |
Feature activation | +4.58e+01 |
Pos logit contributions | |
things | +9.247 |
people | +8.826 |
Canadians | +8.815 |
those | +8.810 |
these | +8.783 |
Neg logit contributions | |
teasp | -22.293 |
RandomRedditor | -21.625 |
| -21.622 |
� | -21.619 |
� | -21.615 |
Token | we |
Token ID | 356 |
Feature activation | +6.01e-01 |
Pos logit contributions | |
these | +14.715 |
those | +14.434 |
things | +14.280 |
people | +14.037 |
many | +13.991 |
Neg logit contributions | |
uty | -18.560 |
� | -18.407 |
| -18.400 |
| -18.397 |
� | -18.372 |
Token | know |
Token ID | 760 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
totality | +0.374 |
behavi | +0.374 |
inaction | +0.365 |
similarities | +0.347 |
Everyday | +0.341 |
Neg logit contributions | |
ien | -0.191 |
aven | -0.191 |
usk | -0.189 |
u | -0.189 |
q | -0.187 |
Token | that |
Token ID | 326 |
Feature activation | +5.82e+01 |
Pos logit contributions | |
totality | +7.530 |
distinguishing | +7.218 |
deviations | +7.161 |
similarities | +7.059 |
inaction | +7.036 |
Neg logit contributions | |
ien | -12.530 |
uty | -12.279 |
usk | -12.270 |
aga | -12.041 |
ump | -12.027 |
Token | 50 |
Token ID | 2026 |
Feature activation | -2.82e+01 |
Pos logit contributions | |
these | +17.417 |
many | +17.211 |
people | +17.003 |
those | +16.928 |
things | +16.712 |
Neg logit contributions | |
� | -21.942 |
| -21.914 |
| -21.889 |
RandomRedditor | -21.851 |
| -21.835 |
Token | per |
Token ID | 583 |
Feature activation | -7.61e+01 |
Pos logit contributions | |
- | +7.286 |
k | +6.102 |
u | +5.987 |
q | +5.832 |
pp | +5.821 |
Neg logit contributions | |
disadvantages | -10.624 |
dissatisfaction | -10.499 |
totality | -10.463 |
spont | -10.292 |
vanity | -10.249 |
Token | cent |
Token ID | 1247 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
u | +7.160 |
- | +6.347 |
cent | +6.263 |
ig | +6.137 |
k | +6.080 |
Neg logit contributions | |
unnecess | -30.812 |
misunder | -30.432 |
cumbers | -30.425 |
conflic | -30.243 |
tremend | -30.216 |
Token | of |
Token ID | 286 |
Feature activation | +6.02e+01 |
Pos logit contributions | |
distinguishing | +8.936 |
inaction | +8.779 |
totality | +8.708 |
deviations | +8.616 |
bureaucrats | +8.593 |
Neg logit contributions | |
ien | -5.514 |
aga | -5.481 |
u | -5.457 |
usk | -5.398 |
ire | -5.167 |
Token | � |
Token ID | 251 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
� | +10.330 |
� | +9.878 |
� | +8.641 |
� | +8.242 |
� | +8.197 |
Neg logit contributions | |
behavi | -24.394 |
misunder | -22.513 |
tremend | -22.411 |
similarities | -21.787 |
anonymity | -21.771 |
Token | or |
Token ID | 393 |
Feature activation | +4.72e+01 |
Pos logit contributions | |
totality | +6.674 |
similarities | +6.454 |
deviations | +6.451 |
bureaucrats | +6.410 |
disadvantages | +6.381 |
Neg logit contributions | |
u | -4.628 |
ien | -4.470 |
ump | -4.343 |
ab | -4.297 |
inch | -4.247 |
Token | the |
Token ID | 262 |
Feature activation | +4.65e+01 |
Pos logit contributions | |
lack | +18.888 |
whatever | +18.631 |
inaction | +18.503 |
those | +18.491 |
these | +18.452 |
Neg logit contributions | |
uty | -12.617 |
ien | -12.213 |
elaide | -11.814 |
gex | -11.721 |
usk | -11.672 |
Token | first |
Token ID | 717 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
totality | +18.465 |
things | +17.951 |
reality | +17.699 |
lack | +17.381 |
fundamentals | +17.273 |
Neg logit contributions | |
uty | -13.876 |
ien | -12.746 |
elaide | -12.722 |
aga | -12.671 |
inion | -12.585 |
Token | three |
Token ID | 1115 |
Feature activation | -7.12e+00 |
Pos logit contributions | |
bureaucrats | +6.776 |
totality | +6.627 |
hindsight | +6.533 |
deviations | +6.521 |
anonymity | +6.421 |
Neg logit contributions | |
ien | -5.787 |
u | -5.650 |
� | -5.597 |
inch | -5.437 |
ump | -5.435 |
Token | steps |
Token ID | 4831 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
- | +2.893 |
u | +2.667 |
� | +2.496 |
inch | +2.413 |
ump | +2.401 |
Neg logit contributions | |
behavi | -3.183 |
anonymity | -2.863 |
Bots | -2.851 |
bragging | -2.846 |
dissatisfaction | -2.842 |
Token | of |
Token ID | 286 |
Feature activation | +3.04e+01 |
Pos logit contributions | |
totality | +11.503 |
deviations | +11.099 |
similarities | +11.002 |
distinguishing | +10.874 |
inaction | +10.814 |
Neg logit contributions | |
ien | -9.785 |
usk | -9.407 |
uty | -9.351 |
u | -9.156 |
ump | -9.142 |
Token | any |
Token ID | 597 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
totality | +13.911 |
these | +13.431 |
things | +13.330 |
distinguishing | +13.279 |
inaction | +13.202 |
Neg logit contributions | |
uty | -12.649 |
ien | -12.435 |
usk | -12.355 |
aga | -11.806 |
ump | -11.769 |
Token | route |
Token ID | 6339 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
totality | +6.597 |
similarities | +6.584 |
bureaucrats | +6.581 |
hindsight | +6.404 |
distinguishing | +6.389 |
Neg logit contributions | |
ien | -7.888 |
usk | -7.827 |
� | -7.724 |
u | -7.689 |
ump | -7.540 |
Token | , |
Token ID | 11 |
Feature activation | +3.48e+01 |
Pos logit contributions | |
anecdotes | +1.439 |
bureaucrats | +1.389 |
disposable | +1.388 |
disadvantages | +1.378 |
Governments | +1.372 |
Neg logit contributions | |
- | -0.609 |
arm | -0.604 |
ien | -0.591 |
usk | -0.584 |
ag | -0.562 |
Token | that |
Token ID | 326 |
Feature activation | +4.15e+01 |
Pos logit contributions | |
these | +15.028 |
those | +14.842 |
things | +14.785 |
totality | +14.502 |
many | +14.488 |
Neg logit contributions | |
uty | -12.893 |
ien | -12.556 |
usk | -12.435 |
aga | -11.959 |
ikes | -11.934 |
Token | that |
Token ID | 326 |
Feature activation | +5.98e+01 |
Pos logit contributions | |
totality | +12.931 |
these | +12.663 |
things | +12.494 |
distinguishing | +12.353 |
those | +12.337 |
Neg logit contributions | |
ien | -14.131 |
uty | -14.104 |
usk | -14.023 |
aga | -13.492 |
ump | -13.366 |
Token | nearly |
Token ID | 3016 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
these | +19.996 |
those | +19.606 |
things | +19.365 |
many | +19.336 |
the | +18.780 |
Neg logit contributions | |
teasp | -16.072 |
uty | -15.790 |
usk | -15.447 |
| -15.384 |
� | -15.372 |
Token | 40 |
Token ID | 2319 |
Feature activation | +4.20e+00 |
Pos logit contributions | |
behavi | +0.922 |
deviations | +0.869 |
fundamentals | +0.790 |
totality | +0.767 |
disadvantages | +0.766 |
Neg logit contributions | |
u | -1.002 |
ien | -0.994 |
ire | -0.949 |
ab | -0.932 |
aga | -0.921 |
Token | % |
Token ID | 4 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
totality | +3.259 |
inaction | +3.143 |
behavi | +3.128 |
symmetry | +3.051 |
anonymity | +3.027 |
Neg logit contributions | |
u | -1.069 |
ikes | -0.912 |
am | -0.892 |
k | -0.863 |
ire | -0.854 |
Token | of |
Token ID | 286 |
Feature activation | +3.61e+01 |
Pos logit contributions | |
totality | +0.833 |
inaction | +0.816 |
deviations | +0.815 |
Situation | +0.810 |
disappearing | +0.804 |
Neg logit contributions | |
u | -0.310 |
ix | -0.276 |
usk | -0.262 |
aga | -0.260 |
ien | -0.257 |
Token | all |
Token ID | 477 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
these | +15.303 |
those | +15.275 |
totality | +14.984 |
things | +14.717 |
people | +14.702 |
Neg logit contributions | |
uty | -14.411 |
ien | -14.099 |
usk | -14.004 |
� | -13.401 |
aga | -13.384 |
Token | of |
Token ID | 286 |
Feature activation | +2.79e+01 |
Pos logit contributions | |
totality | +12.216 |
distinguishing | +11.661 |
deviations | +11.646 |
similarities | +11.554 |
inaction | +11.531 |
Neg logit contributions | |
ien | -13.019 |
uty | -12.915 |
usk | -12.860 |
aga | -12.307 |
ump | -12.261 |
Token | the |
Token ID | 262 |
Feature activation | +4.46e+01 |
Pos logit contributions | |
totality | +12.352 |
deviations | +11.912 |
distinguishing | +11.872 |
similarities | +11.777 |
inaction | +11.724 |
Neg logit contributions | |
ien | -13.600 |
uty | -13.432 |
usk | -13.403 |
ump | -12.824 |
aga | -12.796 |
Token | hard |
Token ID | 1327 |
Feature activation | -2.55e+01 |
Pos logit contributions | |
people | +16.698 |
things | +16.263 |
folks | +16.077 |
totality | +15.887 |
those | +15.784 |
Neg logit contributions | |
uty | -15.042 |
usk | -14.665 |
ien | -14.535 |
� | -14.355 |
elaide | -14.308 |
Token | fought |
Token ID | 8350 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
- | +9.082 |
wood | +8.037 |
ass | +7.748 |
ies | +7.336 |
ax | +7.305 |
Neg logit contributions | |
behavi | -8.090 |
Bots | -8.077 |
Beware | -8.024 |
totality | -7.858 |
deviations | -7.824 |
Token | for |
Token ID | 329 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
totality | +10.924 |
hindsight | +10.430 |
distinguishing | +10.418 |
deviations | +10.370 |
inaction | +10.295 |
Neg logit contributions | |
ien | -9.667 |
usk | -9.436 |
uty | -9.401 |
aga | -9.024 |
u | -8.987 |
Token |
|
Token ID | 198 |
Feature activation | -6.63e+01 |
Pos logit contributions | |
The | +12.332 |
Standing | +12.221 |
"… | +11.783 |
Being | +11.731 |
One | +11.637 |
Neg logit contributions | |
teasp | -22.679 |
elaide | -22.557 |
� | -21.777 |
| -21.771 |
RandomRedditor | -21.717 |
Token |
|
Token ID | 198 |
Feature activation | +4.09e+01 |
Pos logit contributions | |
| +5.693 |
- | +4.383 |
u | +3.638 |
q | +2.727 |
. | +2.681 |
Neg logit contributions | |
tremend | -49.586 |
eleph | -47.319 |
cumbers | -45.446 |
exha | -45.370 |
millenn | -45.345 |
Token | � |
Token ID | 447 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
things | +13.921 |
those | +13.183 |
people | +13.111 |
these | +13.111 |
whatever | +12.761 |
Neg logit contributions | |
teasp | -14.836 |
| -14.658 |
� | -14.647 |
RandomRedditor | -14.636 |
� | -14.625 |
Token | � |
Token ID | 250 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
� | +2.604 |
� | +2.541 |
� | +2.401 |
� | +2.292 |
� | +2.016 |
Neg logit contributions | |
pecul | -14.080 |
disparate | -14.054 |
similarities | -14.051 |
Wikipedia | -13.905 |
totality | -13.886 |
Token | It |
Token ID | 1026 |
Feature activation | +6.83e+00 |
Pos logit contributions | |
totality | +10.902 |
distinguishing | +10.587 |
deviations | +10.523 |
similarities | +10.411 |
inaction | +10.298 |
Neg logit contributions | |
ien | -7.115 |
uty | -6.985 |
usk | -6.926 |
aga | -6.583 |
ump | -6.572 |
Token | 's |
Token ID | 338 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
behavi | +5.743 |
totality | +5.581 |
deviations | +5.534 |
inaction | +5.401 |
distinguishing | +5.366 |
Neg logit contributions | |
aven | -1.866 |
ien | -1.806 |
u | -1.713 |
amp | -1.646 |
ab | -1.587 |
Token | just |
Token ID | 655 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
totality | +8.902 |
these | +8.410 |
distinguishing | +8.367 |
things | +8.360 |
deviations | +8.315 |
Neg logit contributions | |
ien | -14.781 |
uty | -14.781 |
usk | -14.652 |
aga | -14.108 |
ump | -14.076 |
Token | that |
Token ID | 326 |
Feature activation | +3.92e+01 |
Pos logit contributions | |
deviations | +6.471 |
totality | +6.444 |
distinguishing | +6.255 |
similarities | +6.035 |
bureaucrats | +6.023 |
Neg logit contributions | |
ien | -9.100 |
u | -8.645 |
aga | -8.593 |
ike | -8.587 |
ump | -8.550 |
Token | die |
Token ID | 4656 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
these | +14.256 |
things | +14.249 |
those | +14.023 |
people | +13.513 |
reality | +13.397 |
Neg logit contributions | |
uty | -16.358 |
usk | -16.148 |
inion | -15.368 |
oultry | -15.179 |
ump | -15.004 |
Token | hard |
Token ID | 10424 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
u | +4.112 |
- | +3.998 |
h | +3.973 |
ice | +3.655 |
hard | +3.372 |
Neg logit contributions | |
behavi | -6.762 |
pecul | -6.397 |
similarities | -6.241 |
deviations | -6.190 |
totality | -6.160 |
Token | attitude |
Token ID | 9408 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
totality | +7.245 |
deviations | +7.124 |
distinguishing | +7.121 |
similarities | +6.875 |
disadvantages | +6.814 |
Neg logit contributions | |
ien | -6.851 |
ike | -6.385 |
aga | -6.303 |
u | -6.284 |
ire | -6.283 |
Token |
|
Token ID | 198 |
Feature activation | +4.03e+01 |
Pos logit contributions | |
| +6.412 |
- | +5.190 |
u | +4.264 |
q | +3.427 |
. | +3.215 |
Neg logit contributions | |
tremend | -49.033 |
eleph | -45.954 |
cumbers | -44.986 |
millenn | -44.985 |
exha | -44.956 |
Token | An |
Token ID | 2025 |
Feature activation | +2.83e+01 |
Pos logit contributions | |
things | +11.270 |
those | +10.967 |
these | +10.950 |
people | +10.621 |
many | +10.158 |
Neg logit contributions | |
teasp | -19.217 |
RandomRedditor | -18.172 |
� | -18.152 |
� | -18.152 |
| -18.140 |
Token | online |
Token ID | 2691 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
totality | +14.933 |
similarities | +14.712 |
distinguishing | +14.701 |
these | +14.627 |
things | +14.515 |
Neg logit contributions | |
uty | -8.690 |
usk | -8.602 |
ien | -8.426 |
aga | -8.205 |
ump | -7.978 |
Token | effort |
Token ID | 3626 |
Feature activation | -6.81e+00 |
Pos logit contributions | |
deviations | +1.304 |
unnecess | +1.221 |
disadvantages | +1.215 |
behavi | +1.210 |
inconven | +1.151 |
Neg logit contributions | |
ien | -0.960 |
u | -0.950 |
- | -0.904 |
ia | -0.900 |
inar | -0.867 |
Token | to |
Token ID | 284 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
u | +1.751 |
ire | +1.695 |
ump | +1.692 |
usk | +1.668 |
- | +1.647 |
Neg logit contributions | |
deviations | -3.967 |
totality | -3.966 |
behavi | -3.922 |
symbolism | -3.806 |
unnecess | -3.802 |
Token | get |
Token ID | 651 |
Feature activation | +3.12e+01 |
Pos logit contributions | |
u | +3.581 |
ire | +3.257 |
ob | +3.214 |
aru | +3.152 |
un | +3.121 |
Neg logit contributions | |
behavi | -6.204 |
deviations | -5.472 |
inaction | -5.125 |
Falling | -4.985 |
totality | -4.971 |
Token | volunteers |
Token ID | 11661 |
Feature activation | -8.38e+00 |
Pos logit contributions | |
these | +11.588 |
things | +11.511 |
those | +11.420 |
totality | +11.333 |
people | +11.318 |
Neg logit contributions | |
ien | -14.693 |
uty | -14.675 |
usk | -14.560 |
ike | -13.946 |
ump | -13.851 |
Token | to |
Token ID | 284 |
Feature activation | +5.72e+00 |
Pos logit contributions | |
u | +1.920 |
- | +1.842 |
ire | +1.754 |
ix | +1.639 |
ag | +1.596 |
Neg logit contributions | |
behavi | -5.321 |
totality | -5.150 |
Subtle | -4.972 |
tremend | -4.863 |
deviations | -4.847 |
Token | throw |
Token ID | 3714 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
behavi | +2.923 |
deviations | +2.889 |
totality | +2.848 |
distinguishing | +2.813 |
inaction | +2.703 |
Neg logit contributions | |
ien | -2.628 |
u | -2.588 |
usk | -2.538 |
ump | -2.534 |
uty | -2.487 |
Token | house |
Token ID | 2156 |
Feature activation | -2.25e+01 |
Pos logit contributions | |
u | +5.401 |
- | +5.220 |
urn | +5.151 |
icker | +5.126 |
ig | +5.020 |
Neg logit contributions | |
behavi | -6.339 |
adapting | -5.888 |
hindsight | -5.547 |
misunder | -5.505 |
deviations | -5.480 |
Token | parties |
Token ID | 4671 |
Feature activation | -9.51e-01 |
Pos logit contributions | |
- | +7.595 |
u | +7.002 |
b | +6.901 |
c | +6.478 |
urn | +6.417 |
Neg logit contributions | |
totality | -9.154 |
Mankind | -8.886 |
Subtle | -8.853 |
disadvant | -8.757 |
behavi | -8.751 |
Token | many |
Token ID | 867 |
Feature activation | +5.37e+01 |
Pos logit contributions | |
these | +18.428 |
those | +18.357 |
many | +17.845 |
people | +17.509 |
individuals | +16.751 |
Neg logit contributions | |
daq | -17.628 |
usk | -17.497 |
uty | -16.923 |
� | -16.628 |
teasp | -16.615 |
Token | live |
Token ID | 2107 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
people | +18.888 |
individuals | +18.131 |
Canadians | +18.097 |
those | +17.845 |
these | +17.706 |
Neg logit contributions | |
teasp | -16.988 |
� | -16.512 |
� | -16.504 |
RandomRedditor | -16.497 |
| -16.494 |
Token | in |
Token ID | 287 |
Feature activation | +7.37e+00 |
Pos logit contributions | |
ike | +4.107 |
- | +4.094 |
ab | +3.849 |
ien | +3.671 |
u | +3.629 |
Neg logit contributions | |
hindsight | -7.822 |
Subtle | -7.747 |
totality | -7.314 |
Meaning | -7.288 |
Failure | -7.176 |
Token | areas |
Token ID | 3006 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
hindsight | +3.319 |
distinguishing | +3.230 |
behavi | +3.115 |
fundamentals | +3.084 |
totality | +3.080 |
Neg logit contributions | |
ag | -3.977 |
ike | -3.937 |
ien | -3.805 |
ump | -3.799 |
ab | -3.795 |
Token | of |
Token ID | 286 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
ire | +0.500 |
u | +0.481 |
ike | +0.464 |
ien | +0.456 |
ip | +0.444 |
Neg logit contributions | |
hindsight | -0.732 |
totality | -0.705 |
symmetry | -0.691 |
deviations | -0.678 |
uniqueness | -0.673 |
Token | high |
Token ID | 1029 |
Feature activation | -9.92e+00 |
Pos logit contributions | |
deviations | +0.895 |
behavi | +0.874 |
fundamentals | +0.842 |
hindsight | +0.839 |
bureaucrats | +0.837 |
Neg logit contributions | |
ab | -1.075 |
ike | -1.060 |
u | -1.060 |
ien | -1.058 |
ire | -1.049 |
Token | unemployment |
Token ID | 10681 |
Feature activation | +4.58e+00 |
Pos logit contributions | |
- | +3.956 |
ien | +3.550 |
ood | +3.204 |
amp | +3.122 |
ash | +3.051 |
Neg logit contributions | |
wiser | -4.447 |
hindsight | -4.442 |
Elements | -4.292 |
Pupp | -4.213 |
Statements | -4.120 |
Token | and |
Token ID | 290 |
Feature activation | +2.72e+01 |
Pos logit contributions | |
totality | +3.354 |
deviations | +3.326 |
hindsight | +3.303 |
inaction | +3.300 |
Intelligent | +3.254 |
Neg logit contributions | |
ock | -1.130 |
ien | -1.109 |
ike | -1.077 |
u | -1.011 |
ire | -0.986 |
Token | low |
Token ID | 1877 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
totality | +11.296 |
distinguishing | +10.747 |
deviations | +10.744 |
similarities | +10.636 |
these | +10.534 |
Neg logit contributions | |
ien | -13.843 |
uty | -13.658 |
usk | -13.561 |
aga | -13.112 |
ump | -13.024 |
Token | educational |
Token ID | 9856 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
- | +6.111 |
ien | +5.224 |
ash | +4.185 |
ood | +4.108 |
ish | +4.036 |
Neg logit contributions | |
Canaver | -6.921 |
detractors | -6.484 |
Subtle | -6.483 |
Elements | -6.474 |
totality | -6.445 |
Token | attainment |
Token ID | 40375 |
Feature activation | +9.98e+00 |
Pos logit contributions | |
- | +3.655 |
ien | +2.983 |
ach | +2.425 |
ash | +2.306 |
ab | +2.303 |
Neg logit contributions | |
Canaver | -9.107 |
theless | -9.034 |
DRAG | -8.885 |
Thoughts | -8.797 |
Beware | -8.649 |
Token | that |
Token ID | 326 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
similarities | +2.206 |
totality | +2.191 |
deviations | +2.188 |
behavi | +2.174 |
disadvantages | +2.122 |
Neg logit contributions | |
ien | -0.743 |
usk | -0.654 |
u | -0.632 |
ab | -0.616 |
ip | -0.605 |
Token | will |
Token ID | 481 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
totality | +7.976 |
deviations | +7.877 |
distinguishing | +7.862 |
similarities | +7.590 |
hindsight | +7.502 |
Neg logit contributions | |
ien | -9.350 |
usk | -9.074 |
u | -8.909 |
ump | -8.807 |
uty | -8.545 |
Token | be |
Token ID | 307 |
Feature activation | +6.61e-01 |
Pos logit contributions | |
u | +3.113 |
ire | +3.012 |
ien | +2.968 |
ump | +2.919 |
oe | +2.841 |
Neg logit contributions | |
behavi | -7.096 |
deviations | -5.956 |
transformations | -5.562 |
totality | -5.407 |
inaction | -5.360 |
Token | due |
Token ID | 2233 |
Feature activation | -2.00e+01 |
Pos logit contributions | |
behavi | +0.326 |
totality | +0.299 |
deviations | +0.298 |
disadvantages | +0.286 |
similarities | +0.284 |
Neg logit contributions | |
ien | -0.318 |
u | -0.305 |
aga | -0.298 |
usk | -0.295 |
� | -0.292 |
Token | to |
Token ID | 284 |
Feature activation | -9.88e+00 |
Pos logit contributions | |
. | +4.147 |
- | +4.023 |
ien | +3.979 |
ay | +3.826 |
u | +3.756 |
Neg logit contributions | |
behavi | -9.254 |
resemblance | -8.929 |
similarities | -8.819 |
deviations | -8.763 |
resemb | -8.731 |
Token | a |
Token ID | 257 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
ien | +3.612 |
u | +3.512 |
� | +3.189 |
ire | +3.152 |
ip | +3.146 |
Neg logit contributions | |
behavi | -4.515 |
deviations | -4.337 |
disadvantages | -4.337 |
resemb | -4.102 |
distinguishing | -4.066 |
Token | military |
Token ID | 2422 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
ien | +5.393 |
oe | +5.248 |
u | +5.001 |
� | +4.483 |
ust | +4.433 |
Neg logit contributions | |
disadvantages | -7.827 |
behavi | -7.711 |
similarities | -7.180 |
misconceptions | -7.035 |
anecdotes | -6.916 |
Token | retirement |
Token ID | 10737 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
- | +7.020 |
ien | +5.545 |
ved | +4.702 |
j | +4.623 |
b | +4.344 |
Neg logit contributions | |
behavi | -11.144 |
theless | -10.061 |
Palestin | -9.667 |
*/( | -9.627 |
Occupations | -9.620 |
Token | fund |
Token ID | 1814 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
- | +5.917 |
ien | +5.193 |
. | +5.192 |
e | +4.274 |
un | +4.270 |
Neg logit contributions | |
Wicked | -10.522 |
Witches | -10.370 |
deviations | -10.344 |
DRAG | -10.210 |
totality | -10.161 |
Token | , |
Token ID | 11 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
deviations | +3.161 |
similarities | +3.107 |
behavi | +3.090 |
disadvantages | +3.040 |
totality | +3.033 |
Neg logit contributions | |
ien | -1.073 |
usk | -1.048 |
ock | -0.964 |
u | -0.896 |
ump | -0.890 |
Token | according |
Token ID | 1864 |
Feature activation | -5.56e+01 |
Pos logit contributions | |
totality | +10.057 |
deviations | +9.494 |
similarities | +9.482 |
distinguishing | +9.313 |
hindsight | +9.287 |
Neg logit contributions | |
ien | -12.986 |
uty | -12.600 |
usk | -12.443 |
ump | -12.121 |
u | -12.048 |
Token |
|
Token ID | 198 |
Feature activation | +4.27e+01 |
Pos logit contributions | |
u | +2.150 |
q | +1.842 |
ab | +1.579 |
amp | +1.530 |
ien | +1.472 |
Neg logit contributions | |
tremend | -14.315 |
hemor | -13.804 |
undermin | -13.573 |
eleph | -13.380 |
reluct | -13.241 |
Token | For |
Token ID | 1890 |
Feature activation | +2.82e+01 |
Pos logit contributions | |
things | +15.161 |
these | +14.705 |
those | +14.538 |
people | +14.237 |
many | +13.944 |
Neg logit contributions | |
teasp | -15.071 |
RandomRedditor | -14.442 |
� | -14.440 |
� | -14.434 |
| -14.419 |
Token | the |
Token ID | 262 |
Feature activation | +2.56e+01 |
Pos logit contributions | |
totality | +16.601 |
distinguishing | +16.003 |
deviations | +15.998 |
similarities | +15.888 |
inaction | +15.873 |
Neg logit contributions | |
ien | -9.643 |
uty | -9.510 |
usk | -9.388 |
aga | -8.900 |
ump | -8.876 |
Token | Yog |
Token ID | 31604 |
Feature activation | -6.18e+00 |
Pos logit contributions | |
totality | +12.057 |
deviations | +11.811 |
distinguishing | +11.657 |
inaction | +11.598 |
similarities | +11.448 |
Neg logit contributions | |
ien | -12.929 |
usk | -12.692 |
uty | -12.654 |
ump | -12.291 |
aga | -12.209 |
Token | ventures |
Token ID | 10065 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
u | +0.500 |
ak | +0.476 |
ventures | +0.356 |
urt | +0.278 |
usk | +0.269 |
Neg logit contributions | |
totality | -5.613 |
dividing | -5.455 |
anonymity | -5.449 |
inaction | -5.439 |
prevailing | -5.436 |
Token | Kickstarter |
Token ID | 14437 |
Feature activation | +4.76e+00 |
Pos logit contributions | |
totality | +11.390 |
deviations | +10.998 |
inaction | +10.837 |
distinguishing | +10.786 |
hindsight | +10.711 |
Neg logit contributions | |
ien | -8.131 |
u | -7.669 |
usk | -7.590 |
aga | -7.579 |
uty | -7.540 |
Token | backers |
Token ID | 18917 |
Feature activation | -9.93e-01 |
Pos logit contributions | |
behavi | +3.255 |
totality | +3.181 |
similarities | +3.015 |
deviations | +3.009 |
hindsight | +3.005 |
Neg logit contributions | |
icker | -1.614 |
u | -1.614 |
aki | -1.483 |
aga | -1.424 |
é | -1.376 |
Token | the |
Token ID | 262 |
Feature activation | +4.25e+01 |
Pos logit contributions | |
u | +0.249 |
icker | +0.232 |
ale | +0.225 |
aga | +0.209 |
- | +0.209 |
Neg logit contributions | |
behavi | -0.727 |
totality | -0.677 |
similarities | -0.663 |
inaction | -0.661 |
deviations | -0.648 |
Token | physical |
Token ID | 3518 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
totality | +17.124 |
things | +17.063 |
these | +16.759 |
similarities | +16.553 |
reality | +16.527 |
Neg logit contributions | |
uty | -14.220 |
ien | -14.184 |
elaide | -14.135 |
usk | -13.971 |
inion | -13.965 |
Token | rewards |
Token ID | 11530 |
Feature activation | +8.55e+00 |
Pos logit contributions | |
totality | +7.761 |
behavi | +7.655 |
hindsight | +7.655 |
inaction | +7.439 |
bureaucrats | +7.278 |
Neg logit contributions | |
ike | -6.944 |
ien | -6.841 |
ikes | -6.785 |
u | -6.747 |
aga | -6.701 |
Token | should |
Token ID | 815 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
behavi | +5.673 |
totality | +5.372 |
hindsight | +5.317 |
inaction | +5.271 |
bureaucrats | +5.060 |
Neg logit contributions | |
u | -3.162 |
ike | -3.136 |
ien | -3.026 |
ule | -3.013 |
ire | -3.008 |
Token | er |
Token ID | 263 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
er | +10.336 |
- | +7.304 |
ing | +7.025 |
u | +7.023 |
ester | +6.919 |
Neg logit contributions | |
bribes | -13.795 |
VIDEOS | -13.643 |
PEOPLE | -13.265 |
Shades | -13.186 |
anecdotes | -13.016 |
Token | and |
Token ID | 290 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
- | +2.352 |
u | +2.316 |
ong | +2.303 |
usk | +2.152 |
ien | +1.963 |
Neg logit contributions | |
totality | -7.830 |
hindsight | -7.787 |
disadvantages | -7.676 |
bureaucrats | -7.637 |
inaction | -7.626 |
Token | study |
Token ID | 2050 |
Feature activation | -4.02e+01 |
Pos logit contributions | |
totality | +7.571 |
deviations | +7.273 |
similarities | +7.112 |
distinguishing | +7.074 |
disadvantages | +6.979 |
Neg logit contributions | |
ien | -11.762 |
usk | -11.659 |
aga | -11.375 |
uty | -11.370 |
ump | -11.243 |
Token | co |
Token ID | 763 |
Feature activation | -5.89e+01 |
Pos logit contributions | |
- | +8.162 |
ien | +8.130 |
ab | +7.551 |
u | +7.191 |
q | +7.009 |
Neg logit contributions | |
idiots | -13.806 |
bribes | -13.304 |
Italians | -13.170 |
Shades | -13.005 |
Fired | -12.874 |
Token | - |
Token ID | 12 |
Feature activation | -6.22e+01 |
Pos logit contributions | |
- | +13.125 |
ö | +10.663 |
author | +9.564 |
un | +9.231 |
amp | +9.210 |
Neg logit contributions | |
similarities | -18.953 |
deviations | -17.941 |
hordes | -17.049 |
disadvantages | -16.816 |
distractions | -16.807 |
Token | author |
Token ID | 9800 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
author | +10.064 |
ord | +9.938 |
un | +9.921 |
anch | +9.912 |
lead | +8.982 |
Neg logit contributions | |
similarities | -22.397 |
resemb | -21.260 |
weddings | -21.116 |
loopholes | -20.918 |
distractions | -20.613 |
Token | . |
Token ID | 13 |
Feature activation | +4.15e+01 |
Pos logit contributions | |
u | +2.446 |
. | +2.377 |
usk | +2.349 |
ong | +2.167 |
aga | +1.991 |
Neg logit contributions | |
inaction | -8.109 |
totality | -8.062 |
temptation | -8.034 |
bureaucrats | -7.905 |
hindsight | -7.893 |
Token | � |
Token ID | 564 |
Feature activation | -2.85e+01 |
Pos logit contributions | |
these | +14.708 |
"… | +14.705 |
Canadians | +14.117 |
those | +14.113 |
many | +13.994 |
Neg logit contributions | |
uty | -14.354 |
ien | -14.112 |
ike | -13.845 |
ikes | -13.774 |
elaide | -13.719 |
Token | � |
Token ID | 250 |
Feature activation | +3.85e+01 |
Pos logit contributions | |
� | +6.227 |
� | +5.260 |
� | +4.965 |
� | +4.463 |
� | +4.460 |
Neg logit contributions | |
tremend | -20.346 |
behavi | -19.846 |
hemor | -19.448 |
cumbers | -18.880 |
misunder | -18.731 |
Token | This |
Token ID | 1212 |
Feature activation | +3.46e+01 |
Pos logit contributions | |
these | +12.224 |
those | +11.606 |
things | +11.572 |
people | +11.358 |
many | +11.295 |
Neg logit contributions | |
teasp | -15.860 |
elaide | -15.404 |
� | -14.949 |
RandomRedditor | -14.936 |
| -14.925 |
Token | study |
Token ID | 2050 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
totality | +12.597 |
these | +12.360 |
distinguishing | +12.139 |
things | +12.124 |
reality | +12.115 |
Neg logit contributions | |
uty | -15.370 |
ien | -14.750 |
usk | -14.445 |
ikes | -14.189 |
elaide | -14.059 |
Token | � |
Token ID | 247 |
Feature activation | -5.39e+01 |
Pos logit contributions | |
� | +7.675 |
� | +6.366 |
� | +5.654 |
� | +5.307 |
� | +5.182 |
Neg logit contributions | |
behavi | -26.684 |
tremend | -25.421 |
mathemat | -25.405 |
cumbers | -25.129 |
horizont | -25.049 |
Token | s |
Token ID | 82 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
� | +14.024 |
� | +13.829 |
� | +13.579 |
� | +13.161 |
� | +13.036 |
Neg logit contributions | |
behavi | -15.113 |
inconsistencies | -14.902 |
contradictions | -14.873 |
distortions | -14.833 |
anonymity | -14.697 |
Token | a |
Token ID | 257 |
Feature activation | +8.22e+00 |
Pos logit contributions | |
u | +4.719 |
orm | +4.604 |
ump | +4.545 |
rou | +4.535 |
o | +4.395 |
Neg logit contributions | |
bureaucrats | -4.971 |
behavi | -4.905 |
inaction | -4.785 |
embod | -4.592 |
idiots | -4.538 |
Token | ton |
Token ID | 5680 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
bureaucrats | +3.841 |
inaction | +3.832 |
academics | +3.719 |
deviations | +3.687 |
totality | +3.642 |
Neg logit contributions | |
ump | -4.494 |
rou | -4.400 |
u | -4.359 |
igg | -4.239 |
uty | -4.190 |
Token | to |
Token ID | 284 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
u | +5.786 |
а | +5.165 |
ar | +5.069 |
ong | +4.859 |
o | +4.822 |
Neg logit contributions | |
totality | -9.225 |
anonymity | -8.817 |
Borders | -8.763 |
distortions | -8.660 |
bureaucrats | -8.645 |
Token | discover |
Token ID | 7073 |
Feature activation | -8.18e+00 |
Pos logit contributions | |
un | +6.667 |
u | +6.343 |
aru | +5.846 |
ug | +5.844 |
ast | +5.731 |
Neg logit contributions | |
deviations | -10.152 |
disadvantages | -9.938 |
behavi | -9.356 |
distortions | -9.289 |
contradictions | -9.244 |
Token | in |
Token ID | 287 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
u | +2.220 |
ump | +2.168 |
ab | +2.048 |
ong | +1.904 |
un | +1.892 |
Neg logit contributions | |
totality | -4.874 |
inaction | -4.760 |
anonymity | -4.737 |
bureaucrats | -4.507 |
deviations | -4.492 |
Token | the |
Token ID | 262 |
Feature activation | +4.86e+01 |
Pos logit contributions | |
totality | +14.843 |
these | +14.684 |
things | +14.337 |
those | +14.256 |
distinguishing | +14.255 |
Neg logit contributions | |
usk | -11.647 |
ien | -11.642 |
uty | -11.604 |
aga | -11.078 |
ump | -10.875 |
Token | New |
Token ID | 968 |
Feature activation | +2.96e+01 |
Pos logit contributions | |
many | +15.651 |
things | +15.515 |
these | +15.508 |
new | +15.259 |
various | +15.070 |
Neg logit contributions | |
uty | -16.176 |
usk | -16.165 |
elaide | -15.988 |
aga | -15.621 |
ien | -15.559 |
Token | Xbox |
Token ID | 9445 |
Feature activation | +3.62e+01 |
Pos logit contributions | |
things | +10.992 |
these | +10.965 |
totality | +10.912 |
those | +10.597 |
similarities | +10.540 |
Neg logit contributions | |
uty | -13.431 |
ien | -13.295 |
usk | -13.083 |
ump | -12.602 |
aga | -12.501 |
Token | One |
Token ID | 1881 |
Feature activation | +2.85e+01 |
Pos logit contributions | |
One | +10.574 |
things | +10.357 |
these | +10.297 |
many | +10.062 |
reality | +10.042 |
Neg logit contributions | |
uty | -15.609 |
usk | -15.352 |
ump | -15.081 |
airo | -15.022 |
agin | -14.916 |
Token | al |
Token ID | 282 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
u | +0.307 |
al | +0.186 |
ale | -0.163 |
ab | -0.180 |
ash | -0.397 |
Neg logit contributions | |
behavi | -21.396 |
tremend | -19.287 |
undermin | -18.841 |
unnecess | -18.793 |
cumbers | -18.665 |
Token | was |
Token ID | 373 |
Feature activation | +1.76e+01 |
Pos logit contributions | |
totality | +8.423 |
hindsight | +7.964 |
similarities | +7.904 |
deviations | +7.849 |
distinguishing | +7.809 |
Neg logit contributions | |
ien | -5.611 |
usk | -5.506 |
u | -5.487 |
ike | -5.452 |
aki | -5.188 |
Token | " |
Token ID | 366 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
totality | +7.446 |
similarities | +6.878 |
deviations | +6.738 |
fundamentals | +6.695 |
hindsight | +6.676 |
Neg logit contributions | |
ien | -10.371 |
uty | -10.123 |
u | -9.990 |
usk | -9.990 |
aga | -9.786 |
Token | a |
Token ID | 64 |
Feature activation | +8.58e+00 |
Pos logit contributions | |
totality | +13.900 |
similarities | +13.397 |
distinguishing | +13.167 |
deviations | +13.104 |
hindsight | +13.100 |
Neg logit contributions | |
ien | -2.994 |
u | -2.935 |
uty | -2.784 |
ab | -2.653 |
un | -2.541 |
Token | possible |
Token ID | 1744 |
Feature activation | -8.97e-01 |
Pos logit contributions | |
similarities | +3.771 |
deviations | +3.734 |
disadvantages | +3.708 |
hindsight | +3.697 |
fundamentals | +3.681 |
Neg logit contributions | |
ien | -5.070 |
u | -4.950 |
rou | -4.914 |
uty | -4.883 |
ab | -4.685 |
Token | no |
Token ID | 645 |
Feature activation | -4.65e+01 |
Pos logit contributions | |
rou | +0.373 |
u | +0.372 |
ab | +0.365 |
ien | +0.353 |
illo | +0.349 |
Neg logit contributions | |
fundamentals | -0.437 |
academics | -0.435 |
designers | -0.420 |
hindsight | -0.416 |
bureaucrats | -0.408 |
Token | board |
Token ID | 3096 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
- | +11.062 |
oe | +9.838 |
ose | +9.642 |
ire | +9.096 |
fly | +8.572 |
Neg logit contributions | |
Princ | -14.034 |
Numbers | -14.022 |
Generations | -13.883 |
totality | -13.751 |
theless | -13.608 |
Token | request |
Token ID | 2581 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
u | +0.075 |
illo | +0.068 |
ien | +0.066 |
aki | +0.066 |
uty | +0.066 |
Neg logit contributions | |
totality | -0.179 |
academics | -0.173 |
fundamentals | -0.172 |
similarities | -0.169 |
hindsight | -0.168 |
Token | ." |
Token ID | 526 |
Feature activation | +6.00e+01 |
Pos logit contributions | |
totality | +7.151 |
similarities | +7.039 |
hindsight | +6.849 |
fundamentals | +6.807 |
deviations | +6.766 |
Neg logit contributions | |
u | -3.556 |
ien | -3.483 |
illo | -3.370 |
ube | -3.355 |
uty | -3.350 |
Token | While |
Token ID | 3633 |
Feature activation | +5.40e+01 |
Pos logit contributions | |
The | +15.974 |
One | +14.833 |
Wikipedia | +14.738 |
these | +14.592 |
"[ | +14.484 |
Neg logit contributions | |
elaide | -17.928 |
teasp | -17.479 |
ascript | -16.652 |
igger | -16.563 |
oultry | -16.438 |
Token | that |
Token ID | 326 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
these | +18.834 |
many | +18.376 |
things | +18.314 |
those | +18.213 |
the | +17.388 |
Neg logit contributions | |
usk | -15.816 |
teasp | -15.480 |
oultry | -15.362 |
elaide | -14.996 |
gex | -14.932 |
Token | and |
Token ID | 290 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
u | +3.249 |
- | +2.961 |
. | +2.778 |
of | +2.333 |
ue | +2.230 |
Neg logit contributions | |
unnecess | -9.893 |
cumbers | -9.598 |
behavi | -9.365 |
Subtle | -9.268 |
similarities | -9.209 |
Token | moved |
Token ID | 3888 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
hindsight | +6.149 |
deviations | +6.089 |
distinguishing | +6.044 |
totality | +6.013 |
similarities | +5.973 |
Neg logit contributions | |
ien | -6.990 |
u | -6.924 |
amp | -6.736 |
usk | -6.703 |
aga | -6.663 |
Token | more |
Token ID | 517 |
Feature activation | -6.08e+00 |
Pos logit contributions | |
u | +3.859 |
- | +3.749 |
amp | +3.662 |
ip | +3.623 |
airo | +3.620 |
Neg logit contributions | |
Subtle | -4.460 |
behavi | -4.316 |
hindsight | -4.150 |
uniqueness | -3.965 |
disadvantages | -3.908 |
Token | than |
Token ID | 621 |
Feature activation | -5.01e+01 |
Pos logit contributions | |
u | +1.246 |
- | +1.097 |
amp | +1.063 |
airo | +1.032 |
ale | +1.023 |
Neg logit contributions | |
behavi | -3.999 |
Subtle | -3.841 |
hindsight | -3.799 |
totality | -3.671 |
uniqueness | -3.648 |
Token | 430 |
Token ID | 35090 |
Feature activation | -3.36e+01 |
Pos logit contributions | |
- | +5.783 |
u | +5.391 |
1 | +5.156 |
260 | +5.037 |
2 | +4.846 |
Neg logit contributions | |
behavi | -19.615 |
conflic | -17.737 |
unnecess | -17.160 |
cumbers | -16.991 |
misunder | -15.780 |
Token | , |
Token ID | 11 |
Feature activation | -6.99e+01 |
Pos logit contributions | |
k | +8.230 |
km | +8.067 |
u | +7.486 |
- | +7.481 |
ue | +7.370 |
Neg logit contributions | |
behavi | -11.550 |
Subtle | -11.249 |
symmetry | -11.073 |
disadvantages | -10.862 |
resemb | -10.811 |
Token | 000 |
Token ID | 830 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
000 | +11.522 |
00 | +7.401 |
u | +6.824 |
8 | +6.691 |
0 | +6.618 |
Neg logit contributions | |
behavi | -28.688 |
tremend | -25.974 |
unnecess | -25.842 |
conflic | -25.826 |
hemor | -25.675 |
Token | people |
Token ID | 661 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
u | +4.212 |
- | +4.131 |
ire | +4.034 |
un | +4.022 |
aga | +3.948 |
Neg logit contributions | |
behavi | -5.680 |
Subtle | -5.281 |
disadvantages | -4.904 |
similarities | -4.722 |
tremend | -4.696 |
Token | from |
Token ID | 422 |
Feature activation | -9.96e+00 |
Pos logit contributions | |
. | +4.171 |
- | +4.113 |
u | +3.746 |
amp | +3.449 |
am | +3.184 |
Neg logit contributions | |
behavi | -11.941 |
unnecess | -11.828 |
cumbers | -11.790 |
tremend | -11.062 |
conflic | -10.969 |
Token | the |
Token ID | 262 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
ien | +3.203 |
airo | +3.129 |
ire | +3.015 |
u | +2.976 |
- | +2.893 |
Neg logit contributions | |
behavi | -4.756 |
hindsight | -4.395 |
Subtle | -4.390 |
resemb | -4.220 |
pecul | -4.198 |
Token | southeast |
Token ID | 26015 |
Feature activation | -2.98e+01 |
Pos logit contributions | |
ire | +4.453 |
ien | +4.241 |
ale | +3.900 |
ip | +3.888 |
� | +3.885 |
Neg logit contributions | |
behavi | -8.384 |
hindsight | -7.994 |
promul | -7.972 |
deviations | -7.810 |
resemb | -7.729 |
Token | you |
Token ID | 345 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
totality | +8.479 |
deviations | +8.167 |
distinguishing | +8.028 |
similarities | +7.969 |
inaction | +7.936 |
Neg logit contributions | |
ien | -10.902 |
uty | -10.667 |
usk | -10.513 |
u | -10.467 |
ump | -10.302 |
Token | gay |
Token ID | 5650 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
totality | +7.288 |
similarities | +6.834 |
inaction | +6.797 |
deviations | +6.735 |
fundamentals | +6.714 |
Neg logit contributions | |
u | -4.090 |
ien | -3.813 |
aven | -3.804 |
uty | -3.770 |
ike | -3.766 |
Token | ? |
Token ID | 30 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
totality | +8.541 |
distinguishing | +8.149 |
deviations | +7.929 |
similarities | +7.885 |
disadvantages | +7.809 |
Neg logit contributions | |
u | -4.061 |
ien | -4.020 |
aki | -3.875 |
ump | -3.812 |
ab | -3.800 |
Token | � |
Token ID | 447 |
Feature activation | -2.53e+01 |
Pos logit contributions | |
totality | +14.454 |
distinguishing | +13.892 |
deviations | +13.892 |
similarities | +13.748 |
inaction | +13.709 |
Neg logit contributions | |
ien | -11.044 |
uty | -10.984 |
usk | -10.888 |
aga | -10.382 |
ump | -10.359 |
Token | � |
Token ID | 251 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
� | +5.160 |
� | +4.807 |
� | +4.767 |
� | +4.674 |
� | +4.561 |
Neg logit contributions | |
pecul | -15.572 |
similarities | -15.179 |
disparate | -15.147 |
observers | -15.114 |
totality | -15.037 |
Token |
|
Token ID | 198 |
Feature activation | -5.64e+01 |
Pos logit contributions | |
u | +3.073 |
uty | +2.827 |
ien | +2.739 |
illo | +2.720 |
� | +2.707 |
Neg logit contributions | |
deviations | -7.097 |
similarities | -7.024 |
totality | -7.016 |
disparate | -6.984 |
disadvantages | -6.983 |
Token |
|
Token ID | 198 |
Feature activation | +6.21e+01 |
Pos logit contributions | |
| +4.184 |
- | +3.021 |
u | +2.560 |
q | +1.628 |
. | +1.394 |
Neg logit contributions | |
tremend | -47.597 |
eleph | -45.090 |
cumbers | -43.829 |
millenn | -43.519 |
undermin | -43.506 |
Token | Cash |
Token ID | 35361 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
people | +14.287 |
things | +14.170 |
these | +14.095 |
those | +13.622 |
the | +13.230 |
Neg logit contributions | |
teasp | -18.391 |
pione | -17.941 |
RandomRedditor | -17.840 |
| -17.822 |
� | -17.802 |
Token | ier |
Token ID | 959 |
Feature activation | -7.62e+00 |
Pos logit contributions | |
ien | +0.587 |
u | +0.114 |
ier | +0.064 |
icker | -0.014 |
ump | -0.121 |
Neg logit contributions | |
behavi | -12.142 |
totality | -11.631 |
deviations | -11.597 |
similarities | -11.412 |
disadvantages | -11.370 |
Token | : |
Token ID | 25 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
u | +1.058 |
ien | +0.990 |
� | +0.853 |
uty | +0.833 |
ire | +0.772 |
Neg logit contributions | |
distinguishing | -5.545 |
totality | -5.466 |
similarities | -5.382 |
disparate | -5.345 |
academics | -5.284 |
Token | � |
Token ID | 564 |
Feature activation | -3.01e+01 |
Pos logit contributions | |
totality | +13.295 |
distinguishing | +12.744 |
deviations | +12.744 |
similarities | +12.639 |
these | +12.603 |
Neg logit contributions | |
ien | -11.949 |
uty | -11.872 |
usk | -11.773 |
aga | -11.256 |
ump | -11.220 |
Token | was |
Token ID | 373 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
things | +15.076 |
those | +14.660 |
these | +14.503 |
many | +14.094 |
everything | +13.732 |
Neg logit contributions | |
uty | -15.401 |
inion | -15.125 |
� | -15.019 |
usk | -14.853 |
igger | -14.756 |
Token | asked |
Token ID | 1965 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
totality | +4.922 |
similarities | +4.554 |
deviations | +4.530 |
disadvantages | +4.469 |
fundamentals | +4.378 |
Neg logit contributions | |
u | -5.587 |
ien | -5.463 |
aga | -5.267 |
ached | -5.221 |
usk | -5.219 |
Token | to |
Token ID | 284 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
u | +4.446 |
ien | +4.002 |
ached | +3.780 |
ire | +3.775 |
ump | +3.659 |
Neg logit contributions | |
totality | -10.003 |
pecul | -9.697 |
uniqueness | -9.131 |
behavi | -9.118 |
embodiments | -9.037 |
Token | take |
Token ID | 1011 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
u | +3.766 |
ire | +3.598 |
ien | +3.421 |
q | +3.334 |
aki | +3.127 |
Neg logit contributions | |
behavi | -9.436 |
deviations | -8.275 |
disadvant | -8.096 |
disadvantages | -7.985 |
pecul | -7.966 |
Token | a |
Token ID | 257 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
aga | +5.603 |
ien | +4.853 |
- | +4.630 |
u | +4.587 |
ay | +4.582 |
Neg logit contributions | |
behavi | -7.103 |
multiplying | -6.752 |
uniqueness | -6.702 |
theless | -6.563 |
totality | -6.528 |
Token | 50 |
Token ID | 2026 |
Feature activation | -5.74e+01 |
Pos logit contributions | |
u | +7.142 |
ire | +6.895 |
aga | +6.672 |
usk | +6.330 |
ay | +6.172 |
Neg logit contributions | |
embodiments | -8.536 |
similarities | -8.314 |
inventions | -8.201 |
distortions | -8.156 |
anecdotes | -8.145 |
Token | - |
Token ID | 12 |
Feature activation | -6.53e+01 |
Pos logit contributions | |
- | +13.553 |
k | +12.081 |
% | +10.505 |
m | +10.454 |
u | +10.353 |
Neg logit contributions | |
theless | -15.197 |
disadvantages | -13.778 |
totality | -13.597 |
timelines | -13.235 |
symmetry | -13.139 |
Token | percent |
Token ID | 25067 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
minute | +15.880 |
min | +12.611 |
day | +12.468 |
week | +12.438 |
mile | +12.209 |
Neg logit contributions | |
acron | -18.452 |
tragedies | -17.907 |
totality | -17.817 |
successors | -17.752 |
inaction | -17.638 |
Token | pay |
Token ID | 1414 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
u | +6.930 |
ire | +6.711 |
ock | +6.693 |
ix | +6.663 |
ien | +6.542 |
Neg logit contributions | |
acron | -8.278 |
embodiments | -8.277 |
distortions | -8.113 |
contradictions | -8.062 |
anecdotes | -7.931 |
Token | cut |
Token ID | 2005 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
up | +5.142 |
- | +4.828 |
cut | +4.665 |
ola | +4.108 |
u | +4.080 |
Neg logit contributions | |
acron | -13.069 |
embodiments | -12.313 |
hordes | -12.209 |
reluct | -12.072 |
detractors | -12.040 |
Token | due |
Token ID | 2233 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
totality | +10.707 |
deviations | +10.189 |
similarities | +10.017 |
inaction | +9.968 |
distinguishing | +9.884 |
Neg logit contributions | |
ien | -5.907 |
uty | -5.873 |
usk | -5.743 |
ike | -5.561 |
u | -5.543 |
Token | ahead |
Token ID | 4058 |
Feature activation | -5.36e+01 |
Pos logit contributions | |
deviations | +0.842 |
disadvantages | +0.817 |
similarities | +0.812 |
uniqueness | +0.781 |
distinguishing | +0.778 |
Neg logit contributions | |
u | -0.265 |
ag | -0.262 |
aga | -0.253 |
uty | -0.249 |
ien | -0.244 |
Token | of |
Token ID | 286 |
Feature activation | -1.95e+01 |
Pos logit contributions | |
u | +6.771 |
of | +6.682 |
- | +6.634 |
. | +6.240 |
ada | +6.201 |
Neg logit contributions | |
tremend | -26.799 |
ccording | -25.962 |
behavi | -25.942 |
misunder | -25.563 |
Palestin | -25.418 |
Token | September |
Token ID | 2693 |
Feature activation | -3.59e+01 |
Pos logit contributions | |
- | +4.780 |
aga | +4.592 |
am | +4.302 |
ak | +4.162 |
ip | +4.145 |
Neg logit contributions | |
behavi | -9.509 |
conflic | -8.882 |
disadvantages | -8.386 |
behav | -7.729 |
Subtle | -7.698 |
Token | 30 |
Token ID | 1542 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
. | +7.268 |
's | +6.945 |
- | +6.288 |
ak | +6.044 |
ig | +5.941 |
Neg logit contributions | |
behavi | -14.326 |
Tycoon | -13.691 |
Hitman | -13.689 |
distinguishing | -13.448 |
VIDEOS | -13.273 |
Token | , |
Token ID | 11 |
Feature activation | +4.19e+00 |
Pos logit contributions | |
th | +2.782 |
. | +1.956 |
ien | +1.937 |
aga | +1.889 |
- | +1.854 |
Neg logit contributions | |
disadvantages | -7.488 |
deviations | -7.316 |
similarities | -7.217 |
distinguishing | -7.107 |
compan | -7.025 |
Token | according |
Token ID | 1864 |
Feature activation | -4.93e+01 |
Pos logit contributions | |
behavi | +2.427 |
pecul | +2.394 |
totality | +2.381 |
similarities | +2.377 |
disadvantages | +2.372 |
Neg logit contributions | |
ien | -1.669 |
uty | -1.606 |
ab | -1.602 |
u | -1.600 |
aga | -1.587 |
Token | to |
Token ID | 284 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
u | +5.767 |
- | +5.514 |
to | +5.406 |
q | +4.783 |
athan | +4.733 |
Neg logit contributions | |
tremend | -28.895 |
cumbers | -27.555 |
eleph | -27.115 |
reluct | -26.681 |
behavi | -26.626 |
Token | a |
Token ID | 257 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
ab | +5.993 |
ak | +5.708 |
ock | +5.583 |
� | +5.478 |
u | +5.472 |
Neg logit contributions | |
disadvantages | -8.704 |
inconven | -8.430 |
predators | -8.381 |
inaction | -8.258 |
behavi | -8.157 |
Token | new |
Token ID | 649 |
Feature activation | -2.65e+01 |
Pos logit contributions | |
ab | +6.178 |
ix | +6.080 |
ock | +5.763 |
u | +5.746 |
q | +5.721 |
Neg logit contributions | |
distractions | -8.657 |
disadvantages | -8.600 |
predators | -8.177 |
hindsight | -8.136 |
hordes | -8.097 |
Token | poll |
Token ID | 3278 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
- | +6.436 |
ix | +6.158 |
ak | +6.149 |
ab | +6.038 |
ien | +6.034 |
Neg logit contributions | |
distractions | -10.127 |
hindsight | -9.974 |
predators | -9.874 |
disadvantages | -9.732 |
hordes | -9.563 |
Token | released |
Token ID | 2716 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
usk | +3.275 |
. | +3.177 |
ix | +2.951 |
ak | +2.904 |
u | +2.883 |
Neg logit contributions | |
inaction | -7.582 |
hindsight | -7.330 |
similarities | -7.254 |
transformations | -7.218 |
embodiments | -7.216 |
Token | 2 |
Token ID | 17 |
Feature activation | -7.02e+01 |
Pos logit contributions | |
up | +3.478 |
ab | +3.447 |
un | +3.172 |
u | +3.092 |
ob | +2.972 |
Neg logit contributions | |
totality | -11.494 |
inaction | -10.553 |
anonymity | -10.538 |
distractions | -10.463 |
behavi | -10.451 |
Token | . |
Token ID | 13 |
Feature activation | -9.79e+01 |
Pos logit contributions | |
- | +13.352 |
cm | +13.032 |
mm | +12.920 |
inch | +12.470 |
. | +12.381 |
Neg logit contributions | |
totality | -16.593 |
inaction | -16.575 |
Situation | -15.685 |
behavi | -15.346 |
conflic | -14.985 |
Token | 6 |
Token ID | 21 |
Feature activation | -7.06e+01 |
Pos logit contributions | |
8 | +13.650 |
5 | +13.467 |
6 | +13.364 |
7 | +13.009 |
2 | +12.465 |
Neg logit contributions | |
behavi | -34.260 |
conflic | -33.335 |
undermin | -32.501 |
hemor | -32.188 |
tremend | -31.999 |
Token | – |
Token ID | 784 |
Feature activation | -2.71e+01 |
Pos logit contributions | |
mm | +13.962 |
cm | +13.783 |
m | +13.637 |
- | +13.614 |
inch | +13.120 |
Neg logit contributions | |
inaction | -16.773 |
Situation | -16.337 |
totality | -16.137 |
unnecess | -15.768 |
disadvantages | -15.464 |
Token | 3 |
Token ID | 513 |
Feature activation | -7.19e+01 |
Pos logit contributions | |
inch | +5.560 |
3 | +5.193 |
ump | +4.907 |
ab | +4.788 |
u | +4.773 |
Neg logit contributions | |
unnecess | -12.162 |
behavi | -11.810 |
totality | -11.674 |
inaction | -11.275 |
conflic | -11.052 |
Token | . |
Token ID | 13 |
Feature activation | -1.19e+02 |
Pos logit contributions | |
mm | +13.028 |
inch | +12.922 |
cm | +12.742 |
. | +12.385 |
m | +11.750 |
Neg logit contributions | |
inaction | -17.282 |
Situation | -17.273 |
totality | -16.856 |
dissatisfaction | -16.774 |
Catalyst | -16.210 |
Token | 5 |
Token ID | 20 |
Feature activation | -7.28e+01 |
Pos logit contributions | |
0 | +15.918 |
8 | +15.871 |
6 | +15.551 |
7 | +15.362 |
5 | +14.935 |
Neg logit contributions | |
behavi | -23.071 |
totality | -21.954 |
conflic | -20.043 |
hemor | -19.763 |
undermin | -19.752 |
Token | kg |
Token ID | 14211 |
Feature activation | -2.62e+01 |
Pos logit contributions | |
mm | +13.466 |
cm | +13.300 |
inch | +12.748 |
m | +12.039 |
- | +11.434 |
Neg logit contributions | |
Situation | -17.297 |
inaction | -17.105 |
Catalyst | -16.649 |
unnecess | -16.624 |
distractions | -16.233 |
Token | ), |
Token ID | 828 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
) | +6.453 |
q | +5.971 |
), | +5.800 |
ab | +5.412 |
ape | +5.181 |
Neg logit contributions | |
anonymity | -11.861 |
grievances | -11.772 |
behavi | -11.583 |
inaction | -11.576 |
frustrations | -11.326 |
Token | but |
Token ID | 475 |
Feature activation | +9.42e+00 |
Pos logit contributions | |
imb | +0.609 |
ab | +0.594 |
ike | +0.572 |
u | +0.570 |
inch | +0.560 |
Neg logit contributions | |
totality | -1.100 |
inaction | -1.029 |
Everyday | -1.024 |
fundamentals | -1.007 |
unnecess | -1.006 |
Token | differ |
Token ID | 13238 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
totality | +5.031 |
hindsight | +4.877 |
Situation | +4.846 |
inaction | +4.775 |
bureaucrats | +4.735 |
Neg logit contributions | |
ike | -4.467 |
u | -4.464 |
ire | -4.407 |
ab | -4.397 |
ien | -4.331 |
Token | entire |
Token ID | 2104 |
Feature activation | -4.22e+01 |
Pos logit contributions | |
o | +5.342 |
- | +5.305 |
oe | +4.914 |
ome | +3.891 |
. | +3.819 |
Neg logit contributions | |
reluct | -30.627 |
� | -30.445 |
Palestin | -29.876 |
ModLoader | -29.816 |
ccording | -29.727 |
Token | palm |
Token ID | 18057 |
Feature activation | -5.47e+01 |
Pos logit contributions | |
- | +2.999 |
illo | +2.535 |
u | +2.296 |
ul | +1.862 |
am | +1.813 |
Neg logit contributions | |
ccording | -25.429 |
conflic | -25.024 |
cumbers | -24.717 |
undermin | -24.689 |
� | -24.455 |
Token | opl |
Token ID | 20106 |
Feature activation | -6.58e+01 |
Pos logit contributions | |
opl | +9.366 |
op | +8.236 |
o | +7.693 |
agin | +7.061 |
ot | +6.936 |
Neg logit contributions | |
behavi | -32.836 |
hemor | -30.881 |
cumbers | -30.604 |
reluct | -30.449 |
millenn | -30.432 |
Token | ant |
Token ID | 415 |
Feature activation | -6.29e+01 |
Pos logit contributions | |
ant | +12.188 |
amp | +8.503 |
ag | +8.243 |
ab | +7.800 |
ank | +7.399 |
Neg logit contributions | |
behavi | -42.155 |
conflic | -41.832 |
cumbers | -41.524 |
tremend | -41.272 |
undermin | -40.974 |
Token | ar |
Token ID | 283 |
Feature activation | -4.93e+01 |
Pos logit contributions | |
ar | +12.889 |
arr | +7.023 |
ab | +6.544 |
ag | +6.408 |
art | +6.175 |
Neg logit contributions | |
cumbers | -42.922 |
behavi | -40.962 |
undermin | -40.845 |
tremend | -40.456 |
millenn | -40.139 |
Token | surfaces |
Token ID | 16649 |
Feature activation | -1.14e+02 |
Pos logit contributions | |
ikes | +3.092 |
- | +3.008 |
ates | +2.786 |
ia | +2.780 |
ines | +2.507 |
Neg logit contributions | |
ccording | -27.220 |
eleph | -26.685 |
conflic | -26.318 |
reluct | -25.797 |
� | -25.797 |
Token | . |
Token ID | 13 |
Feature activation | +6.61e+00 |
Pos logit contributions | |
. | +13.228 |
- | +6.635 |
., | +6.509 |
) | +5.572 |
.) | +5.328 |
Neg logit contributions | |
tremend | -56.884 |
millenn | -54.523 |
practition | -53.428 |
eleph | -53.335 |
cumbers | -52.529 |
Token | Type |
Token ID | 5994 |
Feature activation | -2.42e+01 |
Pos logit contributions | |
bureaucrats | +3.563 |
bragging | +3.552 |
inaction | +3.526 |
anonymity | +3.469 |
hindsight | +3.431 |
Neg logit contributions | |
u | -3.297 |
ab | -3.071 |
ong | -3.062 |
ien | -3.054 |
q | -3.040 |
Token | 3 |
Token ID | 513 |
Feature activation | -8.29e+00 |
Pos logit contributions | |
u | +6.256 |
ine | +5.765 |
ien | +5.687 |
ule | +5.556 |
- | +5.512 |
Neg logit contributions | |
wiser | -9.576 |
bragging | -9.468 |
inaction | -9.452 |
bureaucrats | -9.410 |
hindsight | -9.227 |
Token | : |
Token ID | 25 |
Feature activation | +3.48e+01 |
Pos logit contributions | |
u | +1.718 |
q | +1.357 |
ien | +1.324 |
b | +1.305 |
α | +1.288 |
Neg logit contributions | |
anonymity | -5.544 |
bragging | -5.543 |
inaction | -5.511 |
bureaucrats | -5.389 |
totality | -5.336 |
Token | F |
Token ID | 376 |
Feature activation | -3.36e+01 |
Pos logit contributions | |
these | +13.662 |
totality | +13.278 |
those | +13.067 |
many | +13.007 |
similarities | +12.839 |
Neg logit contributions | |
ien | -14.028 |
uty | -13.747 |
elaide | -13.633 |
usk | -13.605 |
aga | -13.187 |
Token | can |
Token ID | 460 |
Feature activation | -9.04e+01 |
Pos logit contributions | |
're | +4.687 |
can | +4.397 |
et | +3.497 |
T | +3.021 |
'd | +2.971 |
Neg logit contributions | |
totality | -32.232 |
xual | -32.115 |
horizont | -31.939 |
compan | -31.839 |
fundamentals | -30.166 |
Token | check |
Token ID | 2198 |
Feature activation | -7.35e+01 |
Pos logit contributions | |
ade | +8.536 |
ades | +7.825 |
ada | +6.833 |
ak | +6.611 |
k | +5.382 |
Neg logit contributions | |
disadvant | -32.408 |
compan | -31.510 |
weap | -30.967 |
thous | -30.779 |
facult | -30.743 |
Token | out |
Token ID | 503 |
Feature activation | -7.30e+01 |
Pos logit contributions | |
out | +5.972 |
out | +4.242 |
- | +3.570 |
ike | +2.815 |
ix | +1.232 |
Neg logit contributions | |
disadvant | -31.789 |
reluct | -31.457 |
misunder | -30.467 |
embr | -30.334 |
destro | -30.008 |
Token | my |
Token ID | 616 |
Feature activation | -8.14e+01 |
Pos logit contributions | |
ara | +3.455 |
my | +3.410 |
orm | +2.131 |
esar | +1.846 |
ick | +1.803 |
Neg logit contributions | |
pestic | -30.811 |
cumbers | -30.681 |
destro | -29.795 |
showc | -28.982 |
embr | -28.542 |
Token | Twitter |
Token ID | 3009 |
Feature activation | -9.26e+01 |
Pos logit contributions | |
Twitter | +4.490 |
ema | +4.068 |
ip | +4.015 |
y | +2.595 |
ash | +2.496 |
Neg logit contributions | |
intimid | -31.560 |
weap | -30.998 |
theless | -30.268 |
resemb | -29.248 |
informing | -28.874 |
Token | feed |
Token ID | 3745 |
Feature activation | -1.21e+02 |
Pos logit contributions | |
anna | +4.672 |
feed | +4.062 |
ae | +3.746 |
ast | +3.701 |
ze | +2.793 |
Neg logit contributions | |
Mankind | -34.012 |
Corpor | -31.856 |
Croat | -31.841 |
horizont | -31.407 |
theless | -30.752 |
Token | by |
Token ID | 416 |
Feature activation | -1.18e+02 |
Pos logit contributions | |
by | +6.408 |
able | +1.119 |
. | +0.050 |
, | -0.108 |
via | -0.398 |
Neg logit contributions | |
streng | -40.511 |
Mankind | -39.342 |
detrim | -39.114 |
challeng | -39.108 |
horizont | -38.881 |
Token | going |
Token ID | 1016 |
Feature activation | -1.21e+02 |
Pos logit contributions | |
u | +9.469 |
ocking | +8.051 |
och | +7.344 |
o | +6.806 |
g | +6.095 |
Neg logit contributions | |
anwhile | -34.705 |
perspect | -33.677 |
resemb | -32.788 |
neighb | -32.255 |
Inform | -32.135 |
Token | here |
Token ID | 994 |
Feature activation | -1.14e+02 |
Pos logit contributions | |
here | +3.771 |
onda | -0.348 |
rius | -0.502 |
og | -0.543 |
elle | -0.657 |
Neg logit contributions | |
Palestin | -44.238 |
totality | -43.664 |
conduc | -40.362 |
sacrific | -38.456 |
destro | -38.043 |
Token | . |
Token ID | 13 |
Feature activation | -1.04e+02 |
Pos logit contributions | |
. | +12.434 |
u | +5.350 |
| +4.700 |
: | +4.507 |
., | +3.706 |
Neg logit contributions | |
misunder | -42.177 |
exha | -39.639 |
tremend | -38.977 |
totality | -38.836 |
neighb | -38.816 |
Token | But |
Token ID | 887 |
Feature activation | -9.57e+01 |
Pos logit contributions | |
But | +4.434 |
<|endoftext|> | +4.200 |
| +3.238 |
u | +1.011 |
but | +0.714 |
Neg logit contributions | |
tremend | -38.821 |
ingred | -37.822 |
detrim | -37.553 |
throats | -37.038 |
blat | -36.928 |
Token | 495 |
Token ID | 33781 |
Feature activation | -3.43e+00 |
Pos logit contributions | |
8 | +13.889 |
08 | +13.699 |
06 | +13.665 |
07 | +13.597 |
05 | +13.284 |
Neg logit contributions | |
behavi | -22.421 |
disadvant | -20.651 |
totality | -20.605 |
unnecess | -20.510 |
hemor | -19.942 |
Token | voters |
Token ID | 4446 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
aga | +0.916 |
ene | +0.817 |
ien | +0.802 |
ika | +0.801 |
- | +0.799 |
Neg logit contributions | |
behavi | -2.415 |
acron | -2.245 |
symbolism | -2.173 |
Meaning | -2.170 |
inaction | -2.164 |
Token | in |
Token ID | 287 |
Feature activation | +2.63e+00 |
Pos logit contributions | |
u | +1.787 |
ien | +1.756 |
aga | +1.656 |
inion | +1.601 |
- | +1.564 |
Neg logit contributions | |
behavi | -7.735 |
pecul | -7.564 |
compan | -7.257 |
uniqueness | -7.243 |
symbolism | -7.168 |
Token | Ohio |
Token ID | 6835 |
Feature activation | -2.71e+01 |
Pos logit contributions | |
behavi | +2.156 |
unnecess | +1.888 |
deviations | +1.808 |
acron | +1.805 |
disadvantages | +1.804 |
Neg logit contributions | |
ien | -0.667 |
aga | -0.665 |
ire | -0.598 |
u | -0.577 |
uty | -0.559 |
Token | and |
Token ID | 290 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
usk | +6.436 |
aga | +6.348 |
ien | +6.346 |
u | +6.149 |
uty | +6.123 |
Neg logit contributions | |
behavi | -11.488 |
hindsight | -11.320 |
deviations | -11.301 |
disadvantages | -11.284 |
totality | -11.280 |
Token | 1 |
Token ID | 352 |
Feature activation | -1.16e+02 |
Pos logit contributions | |
ien | +2.301 |
aga | +2.088 |
ene | +1.993 |
u | +1.918 |
ip | +1.851 |
Neg logit contributions | |
behavi | -8.838 |
unnecess | -7.753 |
disadvantages | -7.567 |
distinguishing | -7.541 |
deviations | -7.533 |
Token | , |
Token ID | 11 |
Feature activation | -1.07e+02 |
Pos logit contributions | |
, | +10.048 |
- | +9.042 |
. | +8.419 |
) | +6.462 |
k | +6.425 |
Neg logit contributions | |
tremend | -48.839 |
eleph | -45.727 |
cumbers | -45.714 |
� | -44.980 |
conflic | -44.670 |
Token | 425 |
Token ID | 32114 |
Feature activation | -2.76e+00 |
Pos logit contributions | |
8 | +14.188 |
06 | +13.630 |
08 | +13.596 |
05 | +13.595 |
07 | +13.440 |
Neg logit contributions | |
behavi | -25.108 |
hemor | -22.115 |
unnecess | -21.913 |
disadvant | -21.539 |
totality | -21.377 |
Token | voters |
Token ID | 4446 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
aga | +0.862 |
- | +0.845 |
u | +0.842 |
ire | +0.797 |
v | +0.779 |
Neg logit contributions | |
behavi | -1.764 |
Meaning | -1.582 |
DRAG | -1.556 |
acron | -1.550 |
inaction | -1.520 |
Token | in |
Token ID | 287 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
- | +2.606 |
u | +2.566 |
ien | +2.131 |
ire | +1.987 |
oe | +1.682 |
Neg logit contributions | |
behavi | -14.391 |
tremend | -13.745 |
cumbers | -13.722 |
unnecess | -13.682 |
conflic | -13.198 |
Token | Wisconsin |
Token ID | 9279 |
Feature activation | -3.98e+01 |
Pos logit contributions | |
ien | +0.330 |
aga | +0.324 |
ire | +0.322 |
uty | +0.314 |
ust | +0.288 |
Neg logit contributions | |
behavi | -1.921 |
unnecess | -1.796 |
Firstly | -1.683 |
disadvantages | -1.676 |
acron | -1.669 |
Token | . |
Token ID | 13 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
. | +2.902 |
- | +2.241 |
u | +2.153 |
aga | +2.108 |
uty | +2.100 |
Neg logit contributions | |
tremend | -6.935 |
totality | -6.891 |
Nost | -6.797 |
uniqueness | -6.708 |
acron | -6.655 |
Token | The |
Token ID | 383 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
totality | +11.362 |
distinguishing | +10.948 |
deviations | +10.936 |
disadvantages | +10.861 |
fundamentals | +10.676 |
Neg logit contributions | |
uty | -5.705 |
ien | -5.670 |
usk | -5.391 |
u | -5.294 |
ire | -4.830 |
Token | 39 |
Token ID | 5014 |
Feature activation | -3.48e+01 |
Pos logit contributions | |
totality | +9.388 |
deviations | +8.859 |
distinguishing | +8.854 |
these | +8.832 |
things | +8.802 |
Neg logit contributions | |
ien | -13.952 |
uty | -13.936 |
usk | -13.825 |
ump | -13.378 |
aga | -13.370 |
Token | - |
Token ID | 12 |
Feature activation | -5.96e+01 |
Pos logit contributions | |
- | +9.914 |
th | +7.156 |
year | +5.917 |
ix | +5.748 |
ft | +5.672 |
Neg logit contributions | |
behavi | -14.821 |
totality | -14.570 |
theless | -13.714 |
Izan | -13.546 |
Situation | -13.503 |
Token | year |
Token ID | 1941 |
Feature activation | -5.98e+01 |
Pos logit contributions | |
year | +14.641 |
month | +12.896 |
minute | +12.082 |
page | +10.884 |
day | +10.553 |
Neg logit contributions | |
totality | -18.777 |
behavi | -18.537 |
deviations | -17.728 |
DRAG | -17.637 |
spont | -17.623 |
Token | - |
Token ID | 12 |
Feature activation | -1.13e+02 |
Pos logit contributions | |
- | +13.565 |
old | +6.187 |
u | +5.602 |
uty | +5.333 |
long | +5.000 |
Neg logit contributions | |
tremend | -25.374 |
behavi | -23.894 |
eleph | -23.781 |
cumbers | -23.251 |
undermin | -22.908 |
Token | old |
Token ID | 727 |
Feature activation | -4.31e+00 |
Pos logit contributions | |
old | +17.445 |
olds | +10.715 |
year | +10.267 |
long | +9.799 |
u | +9.111 |
Neg logit contributions | |
cumbers | -41.999 |
reluct | -41.579 |
behavi | -41.178 |
enthusi | -41.141 |
metic | -40.778 |
Token | Australian |
Token ID | 6638 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
ien | +1.553 |
- | +1.525 |
u | +1.392 |
uty | +1.275 |
aga | +1.249 |
Neg logit contributions | |
behavi | -2.328 |
inaction | -2.231 |
totality | -2.205 |
tremend | -2.189 |
deviations | -2.180 |
Token | , |
Token ID | 11 |
Feature activation | -2.49e+01 |
Pos logit contributions | |
- | +5.663 |
ien | +4.558 |
u | +4.014 |
ite | +3.841 |
ian | +3.325 |
Neg logit contributions | |
behavi | -8.181 |
tremend | -8.127 |
totality | -7.681 |
deviations | -7.567 |
unnecess | -7.448 |
Token | who |
Token ID | 508 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
ien | +5.911 |
usk | +5.569 |
uty | +5.420 |
u | +5.051 |
ass | +4.740 |
Neg logit contributions | |
VIDEOS | -10.254 |
deviations | -10.127 |
totality | -9.964 |
unnecess | -9.905 |
tremend | -9.870 |
Token | denies |
Token ID | 18866 |
Feature activation | -3.31e+01 |
Pos logit contributions | |
ia | +2.759 |
u | +2.717 |
ien | +2.679 |
- | +2.629 |
q | +2.478 |
Neg logit contributions | |
behavi | -8.316 |
unnecess | -8.211 |
tremend | -8.088 |
totality | -7.906 |
Meaning | -7.836 |