Token | release |
Token ID | 2650 |
Feature activation | -4.74e-01 |
Pos logit contributions | |
whence | +4.940 |
PLIED | +4.585 |
forgiveness | +4.382 |
accus | +4.050 |
where | +4.034 |
Neg logit contributions | |
olson | -7.446 |
dit | -6.401 |
� | -6.327 |
ctl | -6.078 |
advertising | -5.941 |
Token | , |
Token ID | 11 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
whence | +4.110 |
PLIED | +3.941 |
forgiveness | +3.629 |
where | +3.384 |
accus | +3.358 |
Neg logit contributions | |
olson | -5.259 |
dit | -4.424 |
� | -4.359 |
advertising | -4.159 |
ctl | -4.156 |
Token | Ken |
Token ID | 7148 |
Feature activation | +4.78e-01 |
Pos logit contributions | |
olson | +3.288 |
dit | +2.856 |
� | +2.782 |
advertising | +2.652 |
ctl | +2.629 |
Neg logit contributions | |
PLIED | -2.555 |
whence | -2.474 |
forgiveness | -2.168 |
repre | -2.053 |
accus | -2.044 |
Token | y |
Token ID | 88 |
Feature activation | +4.20e-01 |
Pos logit contributions | |
olson | +3.561 |
dit | +2.815 |
� | +2.658 |
ctl | +2.519 |
advertising | +2.510 |
Neg logit contributions | |
whence | -5.844 |
PLIED | -5.801 |
forgiveness | -5.359 |
accus | -5.118 |
hurled | -5.038 |
Token | atta |
Token ID | 25014 |
Feature activation | +3.04e-01 |
Pos logit contributions | |
olson | +4.633 |
dit | +4.001 |
� | +3.843 |
ctl | +3.756 |
advertising | +3.705 |
Neg logit contributions | |
whence | -3.610 |
PLIED | -3.572 |
forgiveness | -3.196 |
accus | -2.951 |
cropped | -2.908 |
Token | set |
Token ID | 900 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
olson | +3.442 |
dit | +2.932 |
� | +2.851 |
ctl | +2.791 |
advertising | +2.754 |
Neg logit contributions | |
PLIED | -2.483 |
whence | -2.419 |
forgiveness | -2.120 |
repre | -2.039 |
accus | -1.932 |
Token | about |
Token ID | 546 |
Feature activation | +8.71e-01 |
Pos logit contributions | |
olson | +17.768 |
dit | +14.641 |
customs | +14.550 |
Guinness | +14.299 |
ctl | +14.153 |
Neg logit contributions | |
PLIED | -18.659 |
whence | -16.554 |
repre | -16.035 |
ippi | -14.992 |
ateral | -14.953 |
Token | trying |
Token ID | 2111 |
Feature activation | +6.41e-01 |
Pos logit contributions | |
olson | +8.168 |
dit | +6.869 |
� | +6.724 |
advertising | +6.500 |
ctl | +6.372 |
Neg logit contributions | |
PLIED | -8.169 |
whence | -7.438 |
repre | -6.619 |
forgiveness | -6.510 |
aught | -6.423 |
Token | to |
Token ID | 284 |
Feature activation | +8.89e-01 |
Pos logit contributions | |
olson | +5.683 |
� | +4.737 |
dit | +4.631 |
ctl | +4.345 |
undo | +4.243 |
Neg logit contributions | |
PLIED | -6.440 |
whence | -6.288 |
forgiveness | -5.410 |
Applied | -5.401 |
hurled | -5.401 |
Token | ensure |
Token ID | 4155 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
olson | +8.627 |
dit | +7.128 |
� | +6.839 |
undo | +6.834 |
ctl | +6.681 |
Neg logit contributions | |
PLIED | -8.112 |
whence | -7.793 |
repre | -6.838 |
forgiveness | -6.709 |
hurled | -6.508 |
Token | that |
Token ID | 326 |
Feature activation | +3.50e-01 |
Pos logit contributions | |
olson | +8.557 |
dit | +7.450 |
� | +7.020 |
advertising | +6.846 |
customs | +6.614 |
Neg logit contributions | |
PLIED | -9.863 |
whence | -9.093 |
repre | -8.171 |
aught | -7.856 |
hurled | -7.760 |
Token | team |
Token ID | 1074 |
Feature activation | -2.94e-02 |
Pos logit contributions | |
whence | +2.191 |
PLIED | +2.103 |
forgiveness | +1.900 |
accus | +1.717 |
where | +1.709 |
Neg logit contributions | |
olson | -4.350 |
dit | -3.791 |
� | -3.729 |
advertising | -3.602 |
ctl | -3.564 |
Token | talk |
Token ID | 1561 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
whence | +0.277 |
PLIED | +0.274 |
forgiveness | +0.247 |
accus | +0.232 |
where | +0.227 |
Neg logit contributions | |
olson | -0.302 |
dit | -0.254 |
� | -0.249 |
ctl | -0.237 |
advertising | -0.235 |
Token | . |
Token ID | 13 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
whence | +3.487 |
PLIED | +3.387 |
forgiveness | +3.102 |
where | +2.938 |
accus | +2.913 |
Neg logit contributions | |
olson | -4.165 |
dit | -3.515 |
� | -3.443 |
advertising | -3.285 |
ctl | -3.251 |
Token | And |
Token ID | 843 |
Feature activation | +3.55e-01 |
Pos logit contributions | |
olson | +2.802 |
dit | +2.381 |
� | +2.329 |
advertising | +2.225 |
ctl | +2.194 |
Neg logit contributions | |
PLIED | -2.774 |
whence | -2.755 |
forgiveness | -2.508 |
accus | -2.373 |
hurled | -2.338 |
Token | he |
Token ID | 339 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
olson | +3.777 |
dit | +3.253 |
� | +3.153 |
ctl | +3.010 |
advertising | +2.996 |
Neg logit contributions | |
PLIED | -3.114 |
whence | -2.979 |
forgiveness | -2.660 |
accus | -2.492 |
repre | -2.478 |
Token | set |
Token ID | 900 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
olson | +2.516 |
dit | +2.167 |
� | +2.076 |
ctl | +2.041 |
advertising | +2.009 |
Neg logit contributions | |
PLIED | -1.983 |
whence | -1.949 |
forgiveness | -1.747 |
accus | -1.587 |
repre | -1.585 |
Token | about |
Token ID | 546 |
Feature activation | +9.62e-01 |
Pos logit contributions | |
olson | +16.351 |
dit | +14.319 |
Guinness | +13.738 |
customs | +13.236 |
ctl | +13.096 |
Neg logit contributions | |
PLIED | -16.405 |
whence | -14.822 |
repre | -13.991 |
srfAttach | -13.575 |
ateral | -13.440 |
Token | us |
Token ID | 514 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
olson | +9.043 |
dit | +7.780 |
� | +7.477 |
advertising | +7.296 |
ctl | +7.252 |
Neg logit contributions | |
PLIED | -8.737 |
whence | -7.898 |
forgiveness | -7.069 |
repre | -6.893 |
aught | -6.795 |
Token | . |
Token ID | 13 |
Feature activation | +5.98e-02 |
Pos logit contributions | |
olson | +1.129 |
dit | +0.956 |
� | +0.934 |
ctl | +0.889 |
advertising | +0.885 |
Neg logit contributions | |
whence | -0.995 |
PLIED | -0.987 |
forgiveness | -0.881 |
accus | -0.826 |
Applied | -0.814 |
Token |
|
Token ID | 198 |
Feature activation | -8.86e-02 |
Pos logit contributions | |
olson | +0.606 |
dit | +0.512 |
� | +0.501 |
advertising | +0.476 |
ctl | +0.474 |
Neg logit contributions | |
whence | -0.568 |
PLIED | -0.565 |
forgiveness | -0.511 |
accus | -0.480 |
hurled | -0.471 |
Token |
|
Token ID | 198 |
Feature activation | +4.04e-03 |
Pos logit contributions | |
whence | +0.812 |
PLIED | +0.791 |
forgiveness | +0.716 |
where | +0.695 |
Applied | +0.664 |
Neg logit contributions | |
olson | -0.939 |
dit | -0.791 |
� | -0.779 |
ctl | -0.727 |
undo | -0.720 |
Token | such |
Token ID | 884 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
olson | +10.731 |
dit | +9.029 |
� | +8.607 |
ctl | +8.512 |
advertising | +8.283 |
Neg logit contributions | |
PLIED | -9.098 |
whence | -8.473 |
forgiveness | -7.430 |
repre | -7.213 |
srfAttach | -6.911 |
Token | a |
Token ID | 257 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
olson | +10.793 |
dit | +8.888 |
� | +8.539 |
ctl | +8.297 |
advertising | +8.278 |
Neg logit contributions | |
PLIED | -9.616 |
whence | -9.310 |
forgiveness | -8.023 |
aught | -7.635 |
repre | -7.500 |
Token | long |
Token ID | 890 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
olson | +12.703 |
dit | +10.039 |
� | +9.907 |
Guinness | +9.683 |
ctl | +9.629 |
Neg logit contributions | |
PLIED | -10.912 |
whence | -10.596 |
forgiveness | -8.960 |
Loans | -8.646 |
aught | -8.618 |
Token | and |
Token ID | 290 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
olson | +8.804 |
dit | +6.890 |
� | +6.719 |
undo | +6.451 |
advertising | +6.445 |
Neg logit contributions | |
PLIED | -10.033 |
whence | -9.600 |
forgiveness | -8.459 |
aught | -8.171 |
Loans | -8.070 |
Token | st |
Token ID | 336 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
olson | +14.973 |
dit | +11.982 |
� | +11.768 |
nex | +11.699 |
ctl | +11.439 |
Neg logit contributions | |
PLIED | -12.247 |
whence | -11.308 |
forgiveness | -9.709 |
Loans | -9.636 |
aught | -9.608 |
Token | oried |
Token ID | 42058 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
olson | +8.992 |
dit | +6.747 |
undo | +5.795 |
item | +5.760 |
ctl | +5.736 |
Neg logit contributions | |
PLIED | -16.245 |
whence | -16.144 |
forgiveness | -14.899 |
flared | -14.298 |
srfAttach | -14.276 |
Token | history |
Token ID | 2106 |
Feature activation | +9.86e-01 |
Pos logit contributions | |
olson | +14.979 |
Guinness | +11.666 |
customs | +11.494 |
advertising | +11.443 |
� | +11.294 |
Neg logit contributions | |
PLIED | -19.571 |
whence | -16.914 |
aught | -15.492 |
repre | -15.467 |
srfAttach | -15.217 |
Token | of |
Token ID | 286 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
olson | +9.255 |
dit | +7.497 |
� | +7.381 |
advertising | +7.374 |
undo | +7.142 |
Neg logit contributions | |
PLIED | -8.886 |
whence | -8.057 |
forgiveness | -7.533 |
repre | -7.325 |
srfAttach | -7.013 |
Token | failure |
Token ID | 5287 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
olson | +3.545 |
dit | +2.979 |
� | +2.908 |
advertising | +2.848 |
ctl | +2.794 |
Neg logit contributions | |
PLIED | -2.757 |
whence | -2.672 |
forgiveness | -2.367 |
aught | -2.200 |
accus | -2.196 |
Token | they |
Token ID | 484 |
Feature activation | +6.16e-01 |
Pos logit contributions | |
olson | +2.191 |
dit | +1.803 |
� | +1.750 |
advertising | +1.706 |
ctl | +1.683 |
Neg logit contributions | |
PLIED | -2.197 |
whence | -2.165 |
forgiveness | -1.949 |
accus | -1.829 |
repre | -1.816 |
Token | made |
Token ID | 925 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
olson | +6.526 |
dit | +5.537 |
ctl | +5.204 |
� | +5.097 |
advertising | +5.095 |
Neg logit contributions | |
PLIED | -5.200 |
whence | -5.172 |
forgiveness | -4.598 |
repre | -4.281 |
srfAttach | -4.180 |
Token | held |
Token ID | 2714 |
Feature activation | +5.38e-01 |
Pos logit contributions | |
olson | +5.139 |
dit | +4.453 |
� | +4.428 |
ctl | +4.219 |
advertising | +4.095 |
Neg logit contributions | |
whence | -4.043 |
PLIED | -4.033 |
forgiveness | -3.535 |
repre | -3.206 |
accus | -3.172 |
Token | his |
Token ID | 465 |
Feature activation | -3.45e-03 |
Pos logit contributions | |
olson | +5.580 |
dit | +4.797 |
� | +4.635 |
ctl | +4.454 |
undo | +4.316 |
Neg logit contributions | |
whence | -4.658 |
PLIED | -4.655 |
forgiveness | -4.028 |
repre | -3.778 |
aught | -3.774 |
Token | identification |
Token ID | 11795 |
Feature activation | +5.96e-01 |
Pos logit contributions | |
whence | +0.030 |
PLIED | +0.030 |
forgiveness | +0.027 |
accus | +0.025 |
hurled | +0.024 |
Neg logit contributions | |
olson | -0.038 |
dit | -0.032 |
� | -0.032 |
ctl | -0.030 |
advertising | -0.030 |
Token | and |
Token ID | 290 |
Feature activation | +4.31e-01 |
Pos logit contributions | |
olson | +5.417 |
dit | +4.693 |
� | +4.442 |
ctl | +4.375 |
undo | +4.332 |
Neg logit contributions | |
PLIED | -5.739 |
whence | -5.607 |
forgiveness | -5.080 |
repre | -4.839 |
aught | -4.728 |
Token | other |
Token ID | 584 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
olson | +4.433 |
dit | +3.737 |
� | +3.725 |
ctl | +3.525 |
advertising | +3.490 |
Neg logit contributions | |
PLIED | -3.855 |
whence | -3.812 |
forgiveness | -3.331 |
repre | -3.162 |
aught | -3.146 |
Token | important |
Token ID | 1593 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
olson | +12.814 |
dit | +10.897 |
advertising | +10.837 |
� | +10.824 |
customs | +10.753 |
Neg logit contributions | |
PLIED | -12.879 |
whence | -12.690 |
forgiveness | -10.794 |
aught | -10.743 |
repre | -10.635 |
Token | materials |
Token ID | 5696 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
olson | +14.645 |
customs | +13.323 |
� | +12.990 |
advertising | +12.889 |
dit | +12.672 |
Neg logit contributions | |
PLIED | -16.098 |
whence | -15.996 |
aught | -13.522 |
repre | -13.430 |
forgiveness | -13.201 |
Token | , |
Token ID | 11 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
olson | +8.434 |
dit | +7.175 |
� | +7.119 |
ctl | +6.795 |
advertising | +6.699 |
Neg logit contributions | |
PLIED | -9.510 |
whence | -9.135 |
forgiveness | -8.340 |
repre | -7.784 |
Applied | -7.741 |
Token | into |
Token ID | 656 |
Feature activation | +2.16e-02 |
Pos logit contributions | |
olson | +1.767 |
dit | +1.479 |
� | +1.437 |
ctl | +1.377 |
advertising | +1.366 |
Neg logit contributions | |
PLIED | -1.901 |
whence | -1.878 |
forgiveness | -1.718 |
accus | -1.598 |
Applied | -1.589 |
Token | the |
Token ID | 262 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
olson | +0.229 |
dit | +0.195 |
� | +0.190 |
ctl | +0.182 |
advertising | +0.179 |
Neg logit contributions | |
whence | -0.196 |
PLIED | -0.195 |
forgiveness | -0.174 |
accus | -0.163 |
hurled | -0.158 |
Token | trash |
Token ID | 13913 |
Feature activation | -6.34e-01 |
Pos logit contributions | |
whence | +1.483 |
PLIED | +1.453 |
forgiveness | +1.309 |
accus | +1.216 |
where | +1.200 |
Neg logit contributions | |
olson | -1.937 |
dit | -1.647 |
� | -1.623 |
ctl | -1.546 |
advertising | -1.544 |
Token | Identity |
Token ID | 27207 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
olson | +9.986 |
dit | +8.584 |
� | +8.112 |
undo | +7.848 |
advertising | +7.799 |
Neg logit contributions | |
PLIED | -10.590 |
whence | -10.127 |
forgiveness | -9.182 |
repre | -8.742 |
hurled | -8.433 |
Token | : |
Token ID | 25 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
olson | +8.993 |
dit | +7.767 |
� | +7.219 |
ctl | +7.070 |
undo | +6.929 |
Neg logit contributions | |
PLIED | -9.538 |
whence | -9.452 |
forgiveness | -8.485 |
repre | -8.252 |
accus | -7.878 |
Token | Gender |
Token ID | 20247 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
olson | +2.115 |
dit | +1.811 |
� | +1.756 |
advertising | +1.697 |
ctl | +1.670 |
Neg logit contributions | |
PLIED | -1.810 |
whence | -1.798 |
forgiveness | -1.616 |
accus | -1.494 |
repre | -1.492 |
Token | identity |
Token ID | 5369 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
olson | +7.866 |
dit | +6.421 |
� | +6.158 |
advertising | +6.044 |
ctl | +5.965 |
Neg logit contributions | |
PLIED | -10.705 |
whence | -10.273 |
forgiveness | -9.567 |
repre | -9.140 |
aught | -8.874 |
Token | is |
Token ID | 318 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
olson | +11.763 |
dit | +9.839 |
ctl | +9.748 |
customs | +9.477 |
advertising | +9.298 |
Neg logit contributions | |
PLIED | -10.961 |
whence | -10.190 |
forgiveness | -9.276 |
repre | -9.210 |
aught | -8.963 |
Token | an |
Token ID | 281 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
olson | +10.645 |
dit | +9.404 |
� | +8.842 |
advertising | +8.686 |
ctl | +8.587 |
Neg logit contributions | |
PLIED | -8.888 |
whence | -8.598 |
repre | -7.626 |
forgiveness | -7.470 |
Loans | -7.308 |
Token | inner |
Token ID | 8434 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
olson | +15.800 |
dit | +14.156 |
nex | +13.660 |
� | +13.272 |
advertising | +13.240 |
Neg logit contributions | |
whence | -15.123 |
PLIED | -14.760 |
repre | -13.227 |
Loans | -13.080 |
srfAttach | -12.829 |
Token | sense |
Token ID | 2565 |
Feature activation | +5.64e-01 |
Pos logit contributions | |
olson | +3.203 |
dit | +2.712 |
� | +2.638 |
advertising | +2.505 |
ctl | +2.495 |
Neg logit contributions | |
whence | -2.988 |
PLIED | -2.935 |
forgiveness | -2.638 |
accus | -2.489 |
repre | -2.462 |
Token | of |
Token ID | 286 |
Feature activation | -6.97e-02 |
Pos logit contributions | |
olson | +5.314 |
dit | +4.549 |
� | +4.400 |
advertising | +4.183 |
ctl | +4.138 |
Neg logit contributions | |
PLIED | -5.245 |
whence | -5.162 |
forgiveness | -4.742 |
repre | -4.572 |
Loans | -4.453 |
Token | being |
Token ID | 852 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
whence | +0.613 |
PLIED | +0.609 |
forgiveness | +0.544 |
accus | +0.507 |
hurled | +0.497 |
Neg logit contributions | |
olson | -0.758 |
dit | -0.645 |
� | -0.631 |
ctl | -0.602 |
advertising | -0.599 |
Token | female |
Token ID | 4048 |
Feature activation | +4.01e-01 |
Pos logit contributions | |
olson | +1.195 |
dit | +1.029 |
� | +1.002 |
ctl | +0.956 |
advertising | +0.946 |
Neg logit contributions | |
PLIED | -1.006 |
whence | -0.992 |
forgiveness | -0.898 |
accus | -0.823 |
repre | -0.821 |
Token | unique |
Token ID | 3748 |
Feature activation | +8.22e-01 |
Pos logit contributions | |
olson | +7.117 |
dit | +6.066 |
� | +5.770 |
ctl | +5.639 |
advertising | +5.455 |
Neg logit contributions | |
PLIED | -6.261 |
whence | -6.197 |
forgiveness | -5.347 |
aught | -5.092 |
Loans | -5.022 |
Token | ," |
Token ID | 553 |
Feature activation | +4.60e-01 |
Pos logit contributions | |
olson | +7.166 |
dit | +5.836 |
� | +5.556 |
ctl | +5.393 |
advertising | +5.356 |
Neg logit contributions | |
whence | -8.128 |
PLIED | -8.061 |
forgiveness | -7.162 |
accus | -6.926 |
hurled | -6.799 |
Token | and |
Token ID | 290 |
Feature activation | +9.85e-01 |
Pos logit contributions | |
olson | +4.902 |
dit | +4.184 |
� | +4.076 |
advertising | +3.973 |
undo | +3.871 |
Neg logit contributions | |
PLIED | -3.882 |
whence | -3.814 |
forgiveness | -3.391 |
repre | -3.187 |
aught | -3.167 |
Token | is |
Token ID | 318 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
olson | +10.018 |
dit | +8.493 |
� | +7.936 |
advertising | +7.923 |
ctl | +7.848 |
Neg logit contributions | |
PLIED | -8.112 |
whence | -7.837 |
forgiveness | -6.735 |
repre | -6.652 |
aught | -6.624 |
Token | already |
Token ID | 1541 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
olson | +9.793 |
dit | +8.333 |
advertising | +8.167 |
� | +7.866 |
ctl | +7.759 |
Neg logit contributions | |
PLIED | -9.468 |
whence | -9.033 |
forgiveness | -7.910 |
repre | -7.730 |
Loans | -7.561 |
Token | hitting |
Token ID | 9008 |
Feature activation | +2.07e+00 |
Pos logit contributions | |
olson | +9.362 |
dit | +7.979 |
advertising | +7.735 |
� | +7.540 |
customs | +7.337 |
Neg logit contributions | |
PLIED | -9.635 |
whence | -9.266 |
forgiveness | -8.287 |
repre | -7.928 |
aught | -7.845 |
Token | the |
Token ID | 262 |
Feature activation | +7.30e-01 |
Pos logit contributions | |
olson | +16.605 |
dit | +15.463 |
� | +14.463 |
customs | +14.293 |
advertising | +14.088 |
Neg logit contributions | |
PLIED | -14.119 |
whence | -13.872 |
aught | -11.832 |
repre | -11.687 |
forgiveness | -11.524 |
Token | gym |
Token ID | 11550 |
Feature activation | +2.82e-01 |
Pos logit contributions | |
olson | +7.309 |
dit | +6.245 |
� | +6.015 |
advertising | +5.859 |
ctl | +5.825 |
Neg logit contributions | |
PLIED | -6.526 |
whence | -6.331 |
forgiveness | -5.443 |
aught | -5.259 |
accus | -5.210 |
Token | and |
Token ID | 290 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
olson | +2.881 |
dit | +2.461 |
� | +2.350 |
ctl | +2.298 |
advertising | +2.286 |
Neg logit contributions | |
PLIED | -2.599 |
whence | -2.585 |
forgiveness | -2.313 |
accus | -2.176 |
repre | -2.143 |
Token | eating |
Token ID | 6600 |
Feature activation | +5.51e-01 |
Pos logit contributions | |
olson | +10.110 |
dit | +8.721 |
ctl | +8.074 |
� | +8.071 |
advertising | +7.918 |
Neg logit contributions | |
PLIED | -9.169 |
whence | -8.673 |
repre | -7.617 |
forgiveness | -7.509 |
aught | -7.294 |
Token | healthy |
Token ID | 5448 |
Feature activation | +3.87e-01 |
Pos logit contributions | |
olson | +5.528 |
dit | +4.777 |
� | +4.649 |
ctl | +4.503 |
advertising | +4.344 |
Neg logit contributions | |
PLIED | -4.860 |
whence | -4.715 |
forgiveness | -4.121 |
accus | -4.020 |
repre | -3.993 |
Token | French |
Token ID | 24111 |
Feature activation | -6.96e-01 |
Pos logit contributions | |
whence | +1.939 |
PLIED | +1.912 |
forgiveness | +1.754 |
accus | +1.659 |
where | +1.642 |
Neg logit contributions | |
olson | -1.659 |
dit | -1.357 |
� | -1.321 |
ctl | -1.247 |
advertising | -1.238 |
Token | President |
Token ID | 1992 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
whence | +5.530 |
PLIED | +5.332 |
forgiveness | +4.972 |
where | +4.606 |
accus | +4.601 |
Neg logit contributions | |
olson | -7.901 |
dit | -6.693 |
� | -6.637 |
advertising | -6.322 |
ctl | -6.315 |
Token | Francois |
Token ID | 40419 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
olson | +4.393 |
dit | +3.802 |
� | +3.745 |
ctl | +3.584 |
advertising | +3.438 |
Neg logit contributions | |
PLIED | -5.291 |
whence | -5.107 |
forgiveness | -4.547 |
repre | -4.375 |
accus | -4.321 |
Token | Hollande |
Token ID | 33590 |
Feature activation | +4.40e-02 |
Pos logit contributions | |
olson | +1.966 |
� | +1.556 |
dit | +1.536 |
ctl | +1.440 |
undo | +1.417 |
Neg logit contributions | |
PLIED | -2.489 |
whence | -2.462 |
forgiveness | -2.210 |
repre | -2.103 |
accus | -2.094 |
Token | has |
Token ID | 468 |
Feature activation | +6.98e-01 |
Pos logit contributions | |
olson | +0.489 |
dit | +0.415 |
� | +0.411 |
ctl | +0.395 |
advertising | +0.387 |
Neg logit contributions | |
whence | -0.376 |
PLIED | -0.376 |
forgiveness | -0.331 |
accus | -0.305 |
repre | -0.301 |
Token | set |
Token ID | 900 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
olson | +7.454 |
dit | +6.463 |
ctl | +6.275 |
� | +6.230 |
nex | +5.894 |
Neg logit contributions | |
PLIED | -5.610 |
whence | -5.449 |
forgiveness | -4.763 |
repre | -4.534 |
Applied | -4.394 |
Token | out |
Token ID | 503 |
Feature activation | +4.48e-01 |
Pos logit contributions | |
olson | +16.553 |
dit | +14.149 |
� | +13.855 |
ctl | +13.411 |
customs | +12.968 |
Neg logit contributions | |
PLIED | -15.836 |
whence | -14.772 |
forgiveness | -12.729 |
repre | -12.648 |
hurled | -12.405 |
Token | an |
Token ID | 281 |
Feature activation | +6.28e-01 |
Pos logit contributions | |
olson | +4.252 |
dit | +3.571 |
� | +3.548 |
ctl | +3.395 |
advertising | +3.251 |
Neg logit contributions | |
PLIED | -4.417 |
whence | -4.317 |
forgiveness | -3.828 |
hurled | -3.595 |
accus | -3.589 |
Token | ambitious |
Token ID | 14742 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
olson | +5.493 |
dit | +4.531 |
� | +4.327 |
ctl | +4.183 |
undo | +4.154 |
Neg logit contributions | |
whence | -6.534 |
PLIED | -6.490 |
forgiveness | -5.747 |
hurled | -5.477 |
repre | -5.472 |
Token | goal |
Token ID | 3061 |
Feature activation | +4.75e-01 |
Pos logit contributions | |
olson | +1.361 |
dit | +1.175 |
� | +1.146 |
ctl | +1.109 |
advertising | +1.097 |
Neg logit contributions | |
whence | -0.953 |
PLIED | -0.953 |
forgiveness | -0.817 |
accus | -0.755 |
hurled | -0.749 |
Token | for |
Token ID | 329 |
Feature activation | +2.34e-02 |
Pos logit contributions | |
olson | +4.308 |
dit | +3.651 |
� | +3.591 |
ctl | +3.458 |
undo | +3.352 |
Neg logit contributions | |
PLIED | -4.811 |
whence | -4.665 |
forgiveness | -4.158 |
accus | -3.951 |
repre | -3.912 |
Token | Last |
Token ID | 5956 |
Feature activation | -9.08e-02 |
Pos logit contributions | |
whence | +2.934 |
PLIED | +2.895 |
forgiveness | +2.620 |
accus | +2.456 |
where | +2.443 |
Neg logit contributions | |
olson | -3.115 |
dit | -2.608 |
� | -2.534 |
ctl | -2.414 |
advertising | -2.389 |
Token | week |
Token ID | 1285 |
Feature activation | +5.20e-01 |
Pos logit contributions | |
whence | +0.821 |
PLIED | +0.816 |
forgiveness | +0.729 |
accus | +0.681 |
hurled | +0.667 |
Neg logit contributions | |
olson | -0.970 |
dit | -0.821 |
� | -0.806 |
ctl | -0.768 |
advertising | -0.764 |
Token | the |
Token ID | 262 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
olson | +4.991 |
� | +4.180 |
dit | +4.178 |
ctl | +3.928 |
advertising | +3.886 |
Neg logit contributions | |
PLIED | -4.997 |
whence | -4.977 |
forgiveness | -4.375 |
hurled | -4.087 |
cropped | -4.078 |
Token | Prime |
Token ID | 5537 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
whence | +1.121 |
PLIED | +1.103 |
forgiveness | +0.990 |
accus | +0.921 |
where | +0.906 |
Neg logit contributions | |
olson | -1.425 |
dit | -1.213 |
� | -1.191 |
ctl | -1.136 |
advertising | -1.132 |
Token | Minister |
Token ID | 4139 |
Feature activation | +7.68e-02 |
Pos logit contributions | |
whence | +0.858 |
PLIED | +0.808 |
forgiveness | +0.718 |
where | +0.674 |
accus | +0.651 |
Neg logit contributions | |
olson | -1.663 |
dit | -1.444 |
� | -1.413 |
advertising | -1.362 |
ctl | -1.356 |
Token | set |
Token ID | 900 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
olson | +0.853 |
dit | +0.727 |
� | +0.722 |
ctl | +0.689 |
advertising | +0.676 |
Neg logit contributions | |
whence | -0.655 |
PLIED | -0.650 |
forgiveness | -0.579 |
accus | -0.534 |
repre | -0.526 |
Token | out |
Token ID | 503 |
Feature activation | +5.40e-01 |
Pos logit contributions | |
olson | +15.269 |
dit | +12.778 |
ctl | +12.479 |
� | +12.427 |
customs | +12.056 |
Neg logit contributions | |
PLIED | -16.182 |
whence | -15.607 |
forgiveness | -13.404 |
hurled | -13.377 |
repre | -13.215 |
Token | plans |
Token ID | 3352 |
Feature activation | +1.32e-02 |
Pos logit contributions | |
olson | +4.750 |
dit | +3.921 |
� | +3.894 |
ctl | +3.783 |
advertising | +3.632 |
Neg logit contributions | |
PLIED | -5.580 |
whence | -5.441 |
forgiveness | -4.842 |
hurled | -4.598 |
accus | -4.585 |
Token | for |
Token ID | 329 |
Feature activation | -2.14e-01 |
Pos logit contributions | |
olson | +0.131 |
dit | +0.109 |
� | +0.108 |
ctl | +0.103 |
advertising | +0.101 |
Neg logit contributions | |
whence | -0.128 |
PLIED | -0.128 |
forgiveness | -0.115 |
accus | -0.108 |
hurled | -0.106 |
Token | Britain |
Token ID | 5491 |
Feature activation | -4.46e-02 |
Pos logit contributions | |
whence | +1.977 |
PLIED | +1.946 |
forgiveness | +1.761 |
accus | +1.647 |
where | +1.622 |
Neg logit contributions | |
olson | -2.243 |
dit | -1.891 |
� | -1.856 |
ctl | -1.763 |
advertising | -1.757 |
Token | to |
Token ID | 284 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
whence | +0.422 |
PLIED | +0.419 |
forgiveness | +0.376 |
accus | +0.353 |
hurled | +0.347 |
Neg logit contributions | |
olson | -0.456 |
dit | -0.385 |
� | -0.379 |
advertising | -0.358 |
ctl | -0.358 |
Token | several |
Token ID | 1811 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
whence | +0.777 |
PLIED | +0.767 |
forgiveness | +0.689 |
accus | +0.647 |
hurled | +0.638 |
Neg logit contributions | |
olson | -0.877 |
dit | -0.743 |
� | -0.728 |
ctl | -0.690 |
advertising | -0.686 |
Token | weeks |
Token ID | 2745 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
olson | +2.324 |
dit | +1.998 |
� | +1.963 |
ctl | +1.868 |
advertising | +1.852 |
Neg logit contributions | |
whence | -1.881 |
PLIED | -1.874 |
forgiveness | -1.639 |
accus | -1.523 |
hurled | -1.521 |
Token | in |
Token ID | 287 |
Feature activation | +6.31e-02 |
Pos logit contributions | |
whence | +0.927 |
PLIED | +0.923 |
forgiveness | +0.826 |
accus | +0.768 |
hurled | +0.758 |
Neg logit contributions | |
olson | -1.092 |
dit | -0.927 |
� | -0.912 |
ctl | -0.863 |
advertising | -0.859 |
Token | 2007 |
Token ID | 4343 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
olson | +0.708 |
dit | +0.610 |
� | +0.598 |
ctl | +0.572 |
advertising | +0.566 |
Neg logit contributions | |
PLIED | -0.529 |
whence | -0.526 |
forgiveness | -0.462 |
accus | -0.430 |
hurled | -0.426 |
Token | and |
Token ID | 290 |
Feature activation | +4.14e-02 |
Pos logit contributions | |
whence | +1.645 |
PLIED | +1.625 |
forgiveness | +1.462 |
accus | +1.362 |
hurled | +1.337 |
Neg logit contributions | |
olson | -1.981 |
dit | -1.680 |
� | -1.650 |
ctl | -1.569 |
advertising | -1.564 |
Token | set |
Token ID | 900 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
olson | +0.485 |
dit | +0.419 |
� | +0.411 |
ctl | +0.394 |
advertising | +0.390 |
Neg logit contributions | |
whence | -0.329 |
PLIED | -0.326 |
forgiveness | -0.288 |
accus | -0.266 |
repre | -0.259 |
Token | to |
Token ID | 284 |
Feature activation | +7.33e-01 |
Pos logit contributions | |
olson | +15.306 |
dit | +13.694 |
� | +12.461 |
ctl | +12.335 |
customs | +11.807 |
Neg logit contributions | |
PLIED | -15.795 |
whence | -15.208 |
repre | -13.373 |
forgiveness | -13.293 |
hurled | -13.052 |
Token | work |
Token ID | 670 |
Feature activation | +8.94e-01 |
Pos logit contributions | |
olson | +8.081 |
dit | +7.063 |
� | +6.910 |
ctl | +6.576 |
undo | +6.453 |
Neg logit contributions | |
PLIED | -5.829 |
whence | -5.683 |
forgiveness | -4.952 |
hurled | -4.741 |
repre | -4.713 |
Token | , |
Token ID | 11 |
Feature activation | +5.56e-01 |
Pos logit contributions | |
olson | +7.556 |
dit | +6.524 |
� | +6.484 |
ctl | +6.005 |
advertising | +5.879 |
Neg logit contributions | |
PLIED | -8.943 |
whence | -8.313 |
forgiveness | -7.566 |
hurled | -7.162 |
repre | -7.141 |
Token | with |
Token ID | 351 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
olson | +5.673 |
dit | +4.974 |
� | +4.874 |
ctl | +4.570 |
undo | +4.562 |
Neg logit contributions | |
PLIED | -4.835 |
whence | -4.645 |
forgiveness | -4.151 |
repre | -3.904 |
accus | -3.839 |
Token | the |
Token ID | 262 |
Feature activation | -3.88e-02 |
Pos logit contributions | |
olson | +4.401 |
dit | +3.843 |
� | +3.712 |
ctl | +3.532 |
undo | +3.435 |
Neg logit contributions | |
whence | -3.536 |
PLIED | -3.533 |
forgiveness | -3.017 |
hurled | -2.888 |
repre | -2.853 |
Token | oried |
Token ID | 42058 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
olson | +8.992 |
dit | +6.747 |
undo | +5.795 |
item | +5.760 |
ctl | +5.736 |
Neg logit contributions | |
PLIED | -16.245 |
whence | -16.144 |
forgiveness | -14.899 |
flared | -14.298 |
srfAttach | -14.276 |
Token | history |
Token ID | 2106 |
Feature activation | +9.86e-01 |
Pos logit contributions | |
olson | +14.979 |
Guinness | +11.666 |
customs | +11.494 |
advertising | +11.443 |
� | +11.294 |
Neg logit contributions | |
PLIED | -19.571 |
whence | -16.914 |
aught | -15.492 |
repre | -15.467 |
srfAttach | -15.217 |
Token | of |
Token ID | 286 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
olson | +9.255 |
dit | +7.497 |
� | +7.381 |
advertising | +7.374 |
undo | +7.142 |
Neg logit contributions | |
PLIED | -8.886 |
whence | -8.057 |
forgiveness | -7.533 |
repre | -7.325 |
srfAttach | -7.013 |
Token | failure |
Token ID | 5287 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
olson | +3.545 |
dit | +2.979 |
� | +2.908 |
advertising | +2.848 |
ctl | +2.794 |
Neg logit contributions | |
PLIED | -2.757 |
whence | -2.672 |
forgiveness | -2.367 |
aught | -2.200 |
accus | -2.196 |
Token | they |
Token ID | 484 |
Feature activation | +6.16e-01 |
Pos logit contributions | |
olson | +2.191 |
dit | +1.803 |
� | +1.750 |
advertising | +1.706 |
ctl | +1.683 |
Neg logit contributions | |
PLIED | -2.197 |
whence | -2.165 |
forgiveness | -1.949 |
accus | -1.829 |
repre | -1.816 |
Token | made |
Token ID | 925 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
olson | +6.526 |
dit | +5.537 |
ctl | +5.204 |
� | +5.097 |
advertising | +5.095 |
Neg logit contributions | |
PLIED | -5.200 |
whence | -5.172 |
forgiveness | -4.598 |
repre | -4.281 |
srfAttach | -4.180 |
Token | the |
Token ID | 262 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
olson | +16.843 |
dit | +14.258 |
advertising | +13.793 |
� | +13.560 |
Guinness | +13.433 |
Neg logit contributions | |
PLIED | -14.800 |
whence | -13.788 |
repre | -12.098 |
forgiveness | -11.612 |
aught | -11.129 |
Token | Astros |
Token ID | 27463 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
olson | +11.961 |
dit | +10.194 |
Guinness | +9.812 |
undo | +9.764 |
� | +9.665 |
Neg logit contributions | |
PLIED | -9.140 |
whence | -8.560 |
forgiveness | -7.290 |
repre | -6.955 |
aught | -6.826 |
Token | look |
Token ID | 804 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
olson | +1.357 |
dit | +1.135 |
� | +1.123 |
advertising | +1.067 |
ctl | +1.064 |
Neg logit contributions | |
whence | -1.203 |
PLIED | -1.190 |
forgiveness | -1.068 |
accus | -1.000 |
hurled | -0.975 |
Token | like |
Token ID | 588 |
Feature activation | +5.02e-02 |
Pos logit contributions | |
olson | +3.105 |
dit | +2.569 |
� | +2.465 |
ctl | +2.396 |
advertising | +2.375 |
Neg logit contributions | |
PLIED | -3.307 |
whence | -3.236 |
forgiveness | -2.930 |
aught | -2.710 |
repre | -2.700 |
Token | the |
Token ID | 262 |
Feature activation | -1.42e-01 |
Pos logit contributions | |
olson | +0.542 |
dit | +0.460 |
� | +0.449 |
advertising | +0.430 |
ctl | +0.430 |
Neg logit contributions | |
PLIED | -0.447 |
whence | -0.446 |
forgiveness | -0.395 |
accus | -0.367 |
hurled | -0.360 |
Token | effect |
Token ID | 1245 |
Feature activation | +7.78e-01 |
Pos logit contributions | |
olson | +6.181 |
dit | +5.348 |
advertising | +5.115 |
� | +5.091 |
ctl | +4.971 |
Neg logit contributions | |
whence | -5.860 |
PLIED | -5.846 |
repre | -5.086 |
forgiveness | -5.075 |
srfAttach | -4.967 |
Token | to |
Token ID | 284 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
olson | +6.534 |
� | +5.518 |
dit | +5.487 |
advertising | +5.394 |
undo | +5.248 |
Neg logit contributions | |
PLIED | -7.523 |
whence | -7.445 |
forgiveness | -6.777 |
flared | -6.486 |
cropped | -6.478 |
Token | any |
Token ID | 597 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
olson | +10.028 |
dit | +8.920 |
advertising | +8.733 |
� | +8.370 |
customs | +8.229 |
Neg logit contributions | |
PLIED | -12.339 |
whence | -11.869 |
cropped | -10.232 |
forgiveness | -10.158 |
srfAttach | -10.130 |
Token | public |
Token ID | 1171 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
olson | +9.130 |
dit | +8.072 |
advertising | +8.061 |
nex | +7.822 |
customs | +7.765 |
Neg logit contributions | |
PLIED | -11.676 |
whence | -11.241 |
repre | -9.710 |
forgiveness | -9.503 |
aught | -9.465 |
Token | act |
Token ID | 719 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
olson | +10.198 |
dit | +8.888 |
advertising | +8.456 |
customs | +8.351 |
ctl | +8.340 |
Neg logit contributions | |
PLIED | -13.034 |
whence | -12.458 |
aught | -10.758 |
repre | -10.697 |
hurled | -10.581 |
Token | , |
Token ID | 11 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
olson | +9.074 |
dit | +7.914 |
advertising | +7.821 |
ctl | +7.598 |
customs | +7.532 |
Neg logit contributions | |
PLIED | -9.501 |
whence | -8.566 |
forgiveness | -8.083 |
srfAttach | -7.888 |
aught | -7.728 |
Token | record |
Token ID | 1700 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
olson | +13.071 |
customs | +12.382 |
undo | +11.659 |
Guinness | +11.582 |
advertising | +11.309 |
Neg logit contributions | |
PLIED | -16.865 |
whence | -15.945 |
srfAttach | -14.566 |
aught | -14.525 |
ammed | -14.375 |
Token | , |
Token ID | 11 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
olson | +7.824 |
advertising | +6.523 |
� | +6.484 |
dit | +6.446 |
ctl | +6.189 |
Neg logit contributions | |
whence | -10.914 |
PLIED | -10.888 |
forgiveness | -9.952 |
srfAttach | -9.508 |
repre | -9.485 |
Token | or |
Token ID | 393 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
olson | +12.330 |
customs | +10.983 |
undo | +10.789 |
advertising | +10.614 |
Guinness | +10.283 |
Neg logit contributions | |
whence | -13.501 |
PLIED | -13.456 |
srfAttach | -12.282 |
aught | -12.032 |
forgiveness | -11.645 |
Token | judicial |
Token ID | 13657 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
olson | +11.706 |
advertising | +10.261 |
customs | +10.030 |
undo | +9.743 |
� | +9.610 |
Neg logit contributions | |
whence | -13.817 |
PLIED | -13.300 |
srfAttach | -12.394 |
aught | -12.308 |
forgiveness | -12.102 |
Token | proceeding |
Token ID | 18788 |
Feature activation | +9.72e-01 |
Pos logit contributions | |
olson | +10.607 |
customs | +9.212 |
ctl | +9.081 |
advertising | +9.076 |
dit | +8.959 |
Neg logit contributions | |
PLIED | -13.380 |
whence | -12.014 |
aught | -11.070 |
srfAttach | -10.984 |
repre | -10.701 |
Token | hops |
Token ID | 29438 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
PLIED | +0.040 |
whence | +0.040 |
forgiveness | +0.035 |
accus | +0.033 |
Applied | +0.032 |
Neg logit contributions | |
olson | -0.051 |
dit | -0.044 |
� | -0.043 |
ctl | -0.041 |
advertising | -0.041 |
Token | on |
Token ID | 319 |
Feature activation | +7.65e-02 |
Pos logit contributions | |
olson | +1.840 |
dit | +1.522 |
� | +1.491 |
ctl | +1.412 |
advertising | +1.395 |
Neg logit contributions | |
whence | -2.049 |
PLIED | -2.038 |
forgiveness | -1.843 |
accus | -1.737 |
repre | -1.713 |
Token | her |
Token ID | 607 |
Feature activation | -3.48e-01 |
Pos logit contributions | |
olson | +0.794 |
dit | +0.679 |
� | +0.664 |
ctl | +0.635 |
advertising | +0.627 |
Neg logit contributions | |
whence | -0.702 |
PLIED | -0.702 |
forgiveness | -0.622 |
accus | -0.585 |
Applied | -0.572 |
Token | dragon |
Token ID | 10441 |
Feature activation | +4.26e-01 |
Pos logit contributions | |
whence | +2.910 |
PLIED | +2.823 |
forgiveness | +2.570 |
accus | +2.398 |
where | +2.358 |
Neg logit contributions | |
olson | -3.960 |
dit | -3.377 |
� | -3.325 |
advertising | -3.156 |
ctl | -3.153 |
Token | and |
Token ID | 290 |
Feature activation | +3.12e-01 |
Pos logit contributions | |
olson | +4.463 |
dit | +3.768 |
� | +3.760 |
ctl | +3.664 |
advertising | +3.533 |
Neg logit contributions | |
PLIED | -3.827 |
whence | -3.729 |
forgiveness | -3.332 |
Applied | -3.124 |
accus | -3.049 |
Token | sets |
Token ID | 5621 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
olson | +3.550 |
dit | +3.038 |
� | +3.022 |
ctl | +2.896 |
advertising | +2.869 |
Neg logit contributions | |
PLIED | -2.551 |
whence | -2.475 |
forgiveness | -2.173 |
repre | -2.021 |
accus | -2.002 |
Token | out |
Token ID | 503 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
olson | +14.710 |
dit | +12.511 |
� | +12.114 |
ctl | +11.999 |
advertising | +11.602 |
Neg logit contributions | |
PLIED | -15.881 |
whence | -14.698 |
repre | -13.731 |
Applied | -12.902 |
forgiveness | -12.812 |
Token | to |
Token ID | 284 |
Feature activation | +8.33e-01 |
Pos logit contributions | |
olson | +3.288 |
� | +2.781 |
dit | +2.757 |
ctl | +2.596 |
advertising | +2.584 |
Neg logit contributions | |
PLIED | -3.604 |
whence | -3.514 |
forgiveness | -3.183 |
cropped | -3.007 |
accus | -3.007 |
Token | free |
Token ID | 1479 |
Feature activation | +4.66e-02 |
Pos logit contributions | |
olson | +7.962 |
� | +6.782 |
dit | +6.759 |
ctl | +6.432 |
undo | +6.258 |
Neg logit contributions | |
PLIED | -7.591 |
whence | -7.297 |
repre | -6.378 |
forgiveness | -6.265 |
cropped | -6.151 |
Token | all |
Token ID | 477 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
olson | +0.491 |
dit | +0.420 |
� | +0.411 |
ctl | +0.391 |
advertising | +0.389 |
Neg logit contributions | |
whence | -0.421 |
PLIED | -0.420 |
forgiveness | -0.373 |
accus | -0.350 |
hurled | -0.343 |
Token | of |
Token ID | 286 |
Feature activation | +4.56e-01 |
Pos logit contributions | |
olson | +2.884 |
dit | +2.495 |
� | +2.446 |
ctl | +2.290 |
advertising | +2.289 |
Neg logit contributions | |
PLIED | -2.457 |
whence | -2.408 |
forgiveness | -2.140 |
Applied | -1.980 |
accus | -1.980 |
Token | . |
Token ID | 13 |
Feature activation | +4.02e-01 |
Pos logit contributions | |
whence | +3.693 |
PLIED | +3.578 |
forgiveness | +3.257 |
where | +3.073 |
accus | +3.040 |
Neg logit contributions | |
olson | -4.737 |
dit | -4.032 |
� | -3.920 |
ctl | -3.758 |
advertising | -3.718 |
Token |
|
Token ID | 198 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
olson | +4.004 |
dit | +3.401 |
� | +3.358 |
advertising | +3.225 |
ctl | +3.167 |
Neg logit contributions | |
whence | -3.718 |
PLIED | -3.702 |
forgiveness | -3.375 |
accus | -3.164 |
repre | -3.139 |
Token |
|
Token ID | 198 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
olson | +1.601 |
dit | +1.332 |
� | +1.307 |
ctl | +1.232 |
advertising | +1.226 |
Neg logit contributions | |
whence | -1.594 |
PLIED | -1.565 |
forgiveness | -1.427 |
where | -1.340 |
accus | -1.338 |
Token | They |
Token ID | 2990 |
Feature activation | +4.98e-01 |
Pos logit contributions | |
olson | +3.215 |
dit | +2.710 |
� | +2.692 |
advertising | +2.617 |
ctl | +2.521 |
Neg logit contributions | |
whence | -3.275 |
PLIED | -3.199 |
forgiveness | -2.969 |
accus | -2.809 |
flared | -2.786 |
Token | started |
Token ID | 2067 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
olson | +5.536 |
dit | +4.816 |
� | +4.685 |
ctl | +4.505 |
undo | +4.452 |
Neg logit contributions | |
PLIED | -4.020 |
whence | -3.995 |
forgiveness | -3.555 |
accus | -3.175 |
repre | -3.167 |
Token | shutting |
Token ID | 25136 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
olson | +10.391 |
� | +9.138 |
dit | +9.132 |
advertising | +8.587 |
undo | +8.373 |
Neg logit contributions | |
PLIED | -9.826 |
whence | -9.208 |
forgiveness | -8.127 |
aught | -7.580 |
repre | -7.518 |
Token | down |
Token ID | 866 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
olson | +12.992 |
dit | +11.691 |
ctl | +10.789 |
� | +10.773 |
advertising | +10.456 |
Neg logit contributions | |
PLIED | -16.394 |
whence | -16.204 |
forgiveness | -14.382 |
srfAttach | -13.942 |
hurled | -13.855 |
Token | businesses |
Token ID | 5692 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
olson | +9.998 |
dit | +8.773 |
� | +8.419 |
advertising | +8.278 |
ctl | +8.082 |
Neg logit contributions | |
PLIED | -8.917 |
whence | -8.397 |
forgiveness | -7.445 |
repre | -6.970 |
hurled | -6.952 |
Token | and |
Token ID | 290 |
Feature activation | +9.45e-01 |
Pos logit contributions | |
olson | +2.004 |
dit | +1.696 |
� | +1.672 |
ctl | +1.585 |
advertising | +1.584 |
Neg logit contributions | |
PLIED | -1.682 |
whence | -1.666 |
forgiveness | -1.503 |
accus | -1.382 |
Applied | -1.365 |
Token | locking |
Token ID | 22656 |
Feature activation | +9.84e-01 |
Pos logit contributions | |
olson | +9.835 |
dit | +8.426 |
� | +8.415 |
advertising | +8.179 |
ctl | +7.956 |
Neg logit contributions | |
PLIED | -7.415 |
whence | -7.194 |
forgiveness | -6.067 |
repre | -5.855 |
Applied | -5.723 |
Token | themselves |
Token ID | 2405 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
olson | +8.441 |
dit | +7.076 |
� | +6.803 |
ctl | +6.743 |
advertising | +6.511 |
Neg logit contributions | |
PLIED | -9.297 |
whence | -9.169 |
forgiveness | -8.177 |
Applied | -7.816 |
repre | -7.766 |
Token | x |
Token ID | 87 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
olson | +1.613 |
dit | +1.353 |
� | +1.325 |
ctl | +1.260 |
advertising | +1.252 |
Neg logit contributions | |
whence | -1.515 |
PLIED | -1.491 |
forgiveness | -1.355 |
accus | -1.270 |
where | -1.248 |
Token | said |
Token ID | 531 |
Feature activation | -6.42e-01 |
Pos logit contributions | |
olson | +4.428 |
dit | +3.815 |
� | +3.748 |
ctl | +3.637 |
undo | +3.490 |
Neg logit contributions | |
whence | -3.762 |
PLIED | -3.712 |
forgiveness | -3.290 |
repre | -3.065 |
accus | -3.053 |
Token | just |
Token ID | 655 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
whence | +5.345 |
PLIED | +5.130 |
forgiveness | +4.700 |
where | +4.452 |
accus | +4.397 |
Neg logit contributions | |
olson | -7.194 |
dit | -6.152 |
� | -5.932 |
advertising | -5.746 |
ctl | -5.710 |
Token | after |
Token ID | 706 |
Feature activation | +6.74e-01 |
Pos logit contributions | |
whence | +0.957 |
PLIED | +0.940 |
forgiveness | +0.839 |
accus | +0.776 |
where | +0.762 |
Neg logit contributions | |
olson | -1.352 |
dit | -1.159 |
� | -1.141 |
ctl | -1.089 |
advertising | -1.086 |
Token | he |
Token ID | 339 |
Feature activation | -3.76e-02 |
Pos logit contributions | |
olson | +6.500 |
� | +5.607 |
dit | +5.505 |
ctl | +5.170 |
undo | +5.103 |
Neg logit contributions | |
PLIED | -6.249 |
whence | -6.086 |
forgiveness | -5.339 |
repre | -5.167 |
accus | -5.086 |
Token | set |
Token ID | 900 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
whence | +0.312 |
PLIED | +0.309 |
forgiveness | +0.275 |
accus | +0.252 |
repre | +0.246 |
Neg logit contributions | |
olson | -0.431 |
dit | -0.371 |
� | -0.364 |
ctl | -0.349 |
advertising | -0.343 |
Token | the |
Token ID | 262 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
olson | +15.010 |
� | +14.112 |
dit | +13.668 |
ctl | +13.080 |
Guinness | +12.824 |
Neg logit contributions | |
PLIED | -14.869 |
whence | -14.272 |
forgiveness | -12.300 |
repre | -12.101 |
srfAttach | -11.742 |
Token | mark |
Token ID | 1317 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
olson | +5.265 |
dit | +4.554 |
� | +4.450 |
ctl | +4.309 |
undo | +4.236 |
Neg logit contributions | |
PLIED | -4.775 |
whence | -4.682 |
forgiveness | -4.115 |
repre | -3.874 |
accus | -3.817 |
Token | . |
Token ID | 13 |
Feature activation | +5.65e-02 |
Pos logit contributions | |
olson | +9.605 |
� | +8.594 |
dit | +8.209 |
ctl | +7.752 |
undo | +7.553 |
Neg logit contributions | |
PLIED | -10.189 |
whence | -9.687 |
forgiveness | -8.784 |
repre | -8.403 |
accus | -8.253 |
Token | � |
Token ID | 564 |
Feature activation | +8.01e-02 |
Pos logit contributions | |
olson | +0.582 |
dit | +0.492 |
� | +0.488 |
ctl | +0.458 |
advertising | +0.456 |
Neg logit contributions | |
whence | -0.530 |
PLIED | -0.524 |
forgiveness | -0.475 |
accus | -0.445 |
hurled | -0.439 |
Token | � |
Token ID | 250 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
olson | +0.771 |
dit | +0.647 |
� | +0.644 |
ctl | +0.603 |
advertising | +0.598 |
Neg logit contributions | |
whence | -0.797 |
PLIED | -0.790 |
forgiveness | -0.712 |
accus | -0.673 |
hurled | -0.667 |
Token | , |
Token ID | 11 |
Feature activation | +7.39e-02 |
Pos logit contributions | |
whence | +1.097 |
PLIED | +1.085 |
forgiveness | +0.972 |
accus | +0.906 |
hurled | +0.891 |
Neg logit contributions | |
olson | -1.316 |
dit | -1.115 |
� | -1.098 |
ctl | -1.045 |
advertising | -1.043 |
Token | Phil |
Token ID | 4543 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
olson | +0.783 |
dit | +0.667 |
� | +0.650 |
ctl | +0.624 |
advertising | +0.621 |
Neg logit contributions | |
PLIED | -0.662 |
whence | -0.662 |
forgiveness | -0.587 |
accus | -0.554 |
hurled | -0.542 |
Token | K |
Token ID | 509 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
olson | +8.768 |
dit | +7.168 |
� | +6.871 |
ctl | +6.706 |
item | +6.399 |
Neg logit contributions | |
PLIED | -11.526 |
whence | -10.670 |
forgiveness | -10.050 |
warranted | -9.683 |
accus | -9.633 |
Token | essel |
Token ID | 7878 |
Feature activation | -9.53e-02 |
Pos logit contributions | |
olson | +4.054 |
dit | +3.367 |
� | +3.091 |
ctl | +3.029 |
advertising | +2.965 |
Neg logit contributions | |
PLIED | -5.135 |
whence | -5.095 |
forgiveness | -4.815 |
accus | -4.611 |
Applied | -4.475 |
Token | and |
Token ID | 290 |
Feature activation | +3.69e-01 |
Pos logit contributions | |
whence | +0.855 |
PLIED | +0.846 |
forgiveness | +0.757 |
accus | +0.706 |
hurled | +0.693 |
Neg logit contributions | |
olson | -1.027 |
dit | -0.871 |
� | -0.858 |
ctl | -0.817 |
advertising | -0.814 |
Token | Kris |
Token ID | 27748 |
Feature activation | +1.92e+00 |
Pos logit contributions | |
olson | +3.780 |
dit | +3.208 |
� | +3.116 |
ctl | +3.030 |
advertising | +2.981 |
Neg logit contributions | |
PLIED | -3.373 |
whence | -3.301 |
forgiveness | -2.919 |
accus | -2.793 |
repre | -2.750 |
Token | Let |
Token ID | 3914 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
olson | +10.761 |
dit | +8.154 |
pie | +8.049 |
Statistics | +7.786 |
advertising | +7.459 |
Neg logit contributions | |
PLIED | -20.378 |
whence | -19.551 |
forgiveness | -17.746 |
cropped | -17.051 |
aught | -16.870 |
Token | ang |
Token ID | 648 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
olson | +3.414 |
dit | +2.863 |
� | +2.709 |
advertising | +2.578 |
ctl | +2.556 |
Neg logit contributions | |
whence | -3.858 |
PLIED | -3.855 |
forgiveness | -3.519 |
cropped | -3.273 |
accus | -3.262 |
Token | are |
Token ID | 389 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
olson | +4.464 |
dit | +3.802 |
� | +3.713 |
advertising | +3.541 |
ctl | +3.534 |
Neg logit contributions | |
PLIED | -4.108 |
whence | -3.972 |
forgiveness | -3.524 |
hurled | -3.303 |
accus | -3.269 |
Token | in |
Token ID | 287 |
Feature activation | +1.84e-01 |
Pos logit contributions | |
olson | +2.687 |
dit | +2.306 |
� | +2.253 |
ctl | +2.170 |
advertising | +2.154 |
Neg logit contributions | |
PLIED | -2.036 |
whence | -2.022 |
forgiveness | -1.759 |
accus | -1.632 |
repre | -1.617 |
Token | this |
Token ID | 428 |
Feature activation | +4.83e-01 |
Pos logit contributions | |
olson | +1.951 |
dit | +1.657 |
� | +1.634 |
ctl | +1.568 |
advertising | +1.528 |
Neg logit contributions | |
PLIED | -1.657 |
whence | -1.647 |
forgiveness | -1.448 |
accus | -1.360 |
hurled | -1.346 |
Token | ome |
Token ID | 462 |
Feature activation | +5.22e-01 |
Pos logit contributions | |
whence | +0.631 |
PLIED | +0.621 |
forgiveness | +0.562 |
accus | +0.528 |
hurled | +0.520 |
Neg logit contributions | |
olson | -0.665 |
dit | -0.553 |
� | -0.543 |
ctl | -0.515 |
advertising | -0.514 |
Token | ys |
Token ID | 893 |
Feature activation | +9.33e-02 |
Pos logit contributions | |
olson | +3.542 |
� | +2.648 |
dit | +2.624 |
ctl | +2.410 |
advertising | +2.363 |
Neg logit contributions | |
PLIED | -6.533 |
whence | -6.503 |
forgiveness | -5.940 |
hurled | -5.739 |
cropped | -5.681 |
Token | were |
Token ID | 547 |
Feature activation | +8.65e-02 |
Pos logit contributions | |
olson | +1.027 |
dit | +0.877 |
� | +0.856 |
ctl | +0.824 |
advertising | +0.810 |
Neg logit contributions | |
whence | -0.811 |
PLIED | -0.798 |
forgiveness | -0.710 |
accus | -0.660 |
repre | -0.649 |
Token | left |
Token ID | 1364 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
olson | +0.995 |
dit | +0.857 |
� | +0.843 |
ctl | +0.807 |
advertising | +0.804 |
Neg logit contributions | |
whence | -0.703 |
PLIED | -0.690 |
forgiveness | -0.609 |
accus | -0.560 |
repre | -0.552 |
Token | to |
Token ID | 284 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
olson | +10.514 |
dit | +9.162 |
� | +8.490 |
ctl | +8.390 |
advertising | +8.156 |
Neg logit contributions | |
whence | -10.100 |
PLIED | -9.822 |
srfAttach | -8.673 |
forgiveness | -8.570 |
repre | -8.431 |
Token | make |
Token ID | 787 |
Feature activation | +1.92e+00 |
Pos logit contributions | |
olson | +12.666 |
dit | +10.152 |
� | +9.795 |
ctl | +9.628 |
customs | +9.294 |
Neg logit contributions | |
PLIED | -11.209 |
whence | -10.978 |
repre | -10.111 |
aught | -9.572 |
forgiveness | -9.411 |
Token | the |
Token ID | 262 |
Feature activation | +6.67e-01 |
Pos logit contributions | |
olson | +15.048 |
dit | +13.251 |
� | +12.727 |
ctl | +11.892 |
customs | +11.845 |
Neg logit contributions | |
PLIED | -15.456 |
whence | -14.385 |
repre | -12.849 |
aught | -12.172 |
srfAttach | -11.930 |
Token | decision |
Token ID | 2551 |
Feature activation | +9.70e-01 |
Pos logit contributions | |
olson | +7.239 |
dit | +6.167 |
� | +6.085 |
ctl | +5.894 |
undo | +5.708 |
Neg logit contributions | |
PLIED | -5.460 |
whence | -5.384 |
forgiveness | -4.445 |
aught | -4.295 |
repre | -4.245 |
Token | . |
Token ID | 13 |
Feature activation | +2.06e-02 |
Pos logit contributions | |
olson | +9.206 |
dit | +7.905 |
� | +7.862 |
ctl | +7.431 |
advertising | +7.337 |
Neg logit contributions | |
PLIED | -8.747 |
whence | -7.810 |
forgiveness | -7.026 |
repre | -6.863 |
aught | -6.650 |
Token | They |
Token ID | 1119 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
olson | +0.197 |
dit | +0.164 |
� | +0.161 |
ctl | +0.151 |
advertising | +0.151 |
Neg logit contributions | |
whence | -0.208 |
PLIED | -0.205 |
forgiveness | -0.188 |
accus | -0.177 |
hurled | -0.175 |
Token | explored |
Token ID | 18782 |
Feature activation | +6.91e-03 |
Pos logit contributions | |
olson | +2.979 |
dit | +2.556 |
� | +2.436 |
ctl | +2.401 |
advertising | +2.328 |
Neg logit contributions | |
whence | -2.303 |
PLIED | -2.298 |
forgiveness | -2.022 |
repre | -1.885 |
accus | -1.866 |
Token | political |
Token ID | 1964 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
olson | +5.182 |
dit | +4.504 |
� | +4.377 |
advertising | +4.089 |
ctl | +4.029 |
Neg logit contributions | |
PLIED | -5.095 |
whence | -4.980 |
forgiveness | -4.419 |
aught | -4.159 |
hurled | -4.126 |
Token | , |
Token ID | 11 |
Feature activation | +9.50e-01 |
Pos logit contributions | |
olson | +9.163 |
dit | +8.051 |
� | +7.692 |
ctl | +7.199 |
customs | +7.186 |
Neg logit contributions | |
PLIED | -9.553 |
whence | -9.003 |
forgiveness | -7.937 |
aught | -7.751 |
repre | -7.583 |
Token | economic |
Token ID | 3034 |
Feature activation | +7.57e-01 |
Pos logit contributions | |
olson | +7.001 |
� | +6.007 |
dit | +5.584 |
advertising | +5.579 |
ctl | +5.538 |
Neg logit contributions | |
PLIED | -10.055 |
whence | -9.928 |
aught | -8.875 |
forgiveness | -8.829 |
repre | -8.606 |
Token | , |
Token ID | 11 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
olson | +6.308 |
dit | +5.344 |
� | +5.334 |
ctl | +4.896 |
advertising | +4.863 |
Neg logit contributions | |
PLIED | -7.707 |
whence | -7.654 |
forgiveness | -6.811 |
Applied | -6.490 |
hurled | -6.480 |
Token | and |
Token ID | 290 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
olson | +9.774 |
� | +8.670 |
ctl | +8.037 |
dit | +7.999 |
advertising | +7.998 |
Neg logit contributions | |
whence | -9.226 |
PLIED | -9.036 |
forgiveness | -7.936 |
aught | -7.884 |
repre | -7.654 |
Token | military |
Token ID | 2422 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
olson | +10.580 |
� | +9.245 |
customs | +8.510 |
ctl | +8.412 |
advertising | +8.279 |
Neg logit contributions | |
whence | -14.277 |
PLIED | -14.179 |
aught | -12.884 |
repre | -12.594 |
forgiveness | -12.527 |
Token | institutions |
Token ID | 6712 |
Feature activation | +6.26e-01 |
Pos logit contributions | |
olson | +14.566 |
dit | +13.258 |
� | +12.885 |
advertising | +12.332 |
customs | +12.158 |
Neg logit contributions | |
PLIED | -14.717 |
whence | -14.209 |
forgiveness | -12.623 |
aught | -12.089 |
ammed | -11.988 |
Token | that |
Token ID | 326 |
Feature activation | +7.23e-01 |
Pos logit contributions | |
olson | +5.799 |
� | +5.028 |
dit | +4.841 |
ctl | +4.474 |
advertising | +4.453 |
Neg logit contributions | |
PLIED | -6.083 |
whence | -5.782 |
forgiveness | -5.382 |
repre | -5.001 |
accus | -4.977 |
Token | have |
Token ID | 423 |
Feature activation | +9.09e-01 |
Pos logit contributions | |
olson | +7.374 |
� | +6.434 |
dit | +6.267 |
ctl | +5.895 |
undo | +5.714 |
Neg logit contributions | |
PLIED | -6.289 |
whence | -6.136 |
forgiveness | -5.475 |
repre | -5.135 |
accus | -5.037 |
Token | been |
Token ID | 587 |
Feature activation | +7.20e-01 |
Pos logit contributions | |
olson | +9.774 |
dit | +8.671 |
� | +8.505 |
ctl | +8.138 |
undo | +7.951 |
Neg logit contributions | |
PLIED | -6.697 |
whence | -6.415 |
forgiveness | -5.595 |
repre | -5.439 |
Applied | -5.094 |
Token | the |
Token ID | 262 |
Feature activation | +8.30e-02 |
Pos logit contributions | |
olson | +7.490 |
� | +6.666 |
dit | +6.558 |
ctl | +6.064 |
advertising | +5.997 |
Neg logit contributions | |
PLIED | -5.785 |
whence | -5.702 |
forgiveness | -5.151 |
repre | -4.743 |
aught | -4.610 |
Token | Caps |
Token ID | 23534 |
Feature activation | +2.22e-02 |
Pos logit contributions | |
olson | +2.899 |
dit | +2.427 |
� | +2.396 |
ctl | +2.291 |
advertising | +2.277 |
Neg logit contributions | |
PLIED | -2.571 |
whence | -2.551 |
forgiveness | -2.264 |
accus | -2.111 |
repre | -2.092 |
Token | didn |
Token ID | 1422 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
olson | +0.259 |
dit | +0.223 |
� | +0.219 |
ctl | +0.210 |
advertising | +0.209 |
Neg logit contributions | |
whence | -0.177 |
PLIED | -0.176 |
forgiveness | -0.155 |
accus | -0.143 |
repre | -0.139 |
Token | � |
Token ID | 447 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
whence | +1.531 |
PLIED | +1.504 |
forgiveness | +1.396 |
where | +1.341 |
accus | +1.311 |
Neg logit contributions | |
olson | -1.152 |
dit | -0.928 |
� | -0.877 |
ctl | -0.826 |
advertising | -0.823 |
Token | � |
Token ID | 247 |
Feature activation | -4.19e-01 |
Pos logit contributions | |
whence | +1.913 |
PLIED | +1.859 |
forgiveness | +1.716 |
accus | +1.604 |
where | +1.598 |
Neg logit contributions | |
olson | -2.087 |
dit | -1.749 |
� | -1.683 |
ctl | -1.596 |
advertising | -1.592 |
Token | t |
Token ID | 83 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
whence | +4.221 |
PLIED | +4.095 |
forgiveness | +3.767 |
where | +3.590 |
accus | +3.549 |
Neg logit contributions | |
olson | -4.013 |
� | -3.266 |
dit | -3.265 |
advertising | -3.085 |
ctl | -3.008 |
Token | let |
Token ID | 1309 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
olson | +1.192 |
dit | +1.014 |
� | +0.981 |
ctl | +0.950 |
advertising | +0.936 |
Neg logit contributions | |
PLIED | -0.991 |
whence | -0.983 |
forgiveness | -0.875 |
accus | -0.815 |
hurled | -0.798 |
Token | the |
Token ID | 262 |
Feature activation | +7.23e-01 |
Pos logit contributions | |
olson | +15.322 |
� | +13.290 |
dit | +12.853 |
advertising | +12.613 |
ctl | +12.175 |
Neg logit contributions | |
PLIED | -14.623 |
whence | -13.842 |
accus | -11.964 |
repre | -11.888 |
forgiveness | -11.875 |
Token | moment |
Token ID | 2589 |
Feature activation | -3.22e-01 |
Pos logit contributions | |
olson | +7.275 |
dit | +6.109 |
� | +6.085 |
advertising | +5.813 |
ctl | +5.808 |
Neg logit contributions | |
PLIED | -6.555 |
whence | -6.164 |
forgiveness | -5.336 |
repre | -5.108 |
aught | -5.082 |
Token | slip |
Token ID | 13819 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
whence | +2.609 |
PLIED | +2.524 |
forgiveness | +2.290 |
where | +2.129 |
accus | +2.115 |
Neg logit contributions | |
olson | -3.728 |
dit | -3.198 |
� | -3.145 |
ctl | -2.995 |
advertising | -2.985 |
Token | , |
Token ID | 11 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
olson | +1.595 |
dit | +1.335 |
� | +1.308 |
ctl | +1.238 |
advertising | +1.235 |
Neg logit contributions | |
PLIED | -1.615 |
whence | -1.592 |
forgiveness | -1.445 |
accus | -1.349 |
repre | -1.335 |
Token | crushing |
Token ID | 24949 |
Feature activation | +9.11e-01 |
Pos logit contributions | |
olson | +4.018 |
dit | +3.418 |
� | +3.404 |
advertising | +3.253 |
ctl | +3.196 |
Neg logit contributions | |
PLIED | -3.392 |
whence | -3.264 |
forgiveness | -2.922 |
accus | -2.740 |
repre | -2.701 |
Token | , |
Token ID | 11 |
Feature activation | +6.15e-01 |
Pos logit contributions | |
olson | +5.983 |
dit | +5.096 |
� | +4.855 |
ctl | +4.696 |
advertising | +4.657 |
Neg logit contributions | |
PLIED | -5.815 |
whence | -5.442 |
forgiveness | -5.111 |
repre | -4.729 |
accus | -4.687 |
Token | and |
Token ID | 290 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
olson | +6.505 |
� | +5.522 |
dit | +5.418 |
advertising | +5.237 |
ctl | +5.166 |
Neg logit contributions | |
PLIED | -5.225 |
whence | -4.995 |
forgiveness | -4.513 |
accus | -4.177 |
aught | -4.151 |
Token | that |
Token ID | 326 |
Feature activation | +4.21e-01 |
Pos logit contributions | |
olson | +6.275 |
� | +5.118 |
dit | +5.063 |
ctl | +4.934 |
advertising | +4.805 |
Neg logit contributions | |
PLIED | -5.310 |
whence | -5.190 |
forgiveness | -4.594 |
repre | -4.299 |
aught | -4.288 |
Token | this |
Token ID | 428 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
olson | +4.417 |
dit | +3.609 |
� | +3.590 |
advertising | +3.499 |
ctl | +3.481 |
Neg logit contributions | |
PLIED | -3.790 |
whence | -3.717 |
forgiveness | -3.263 |
repre | -3.062 |
accus | -3.044 |
Token | has |
Token ID | 468 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
olson | +1.171 |
dit | +0.980 |
� | +0.968 |
ctl | +0.931 |
advertising | +0.929 |
Neg logit contributions | |
whence | -0.925 |
PLIED | -0.921 |
forgiveness | -0.809 |
accus | -0.755 |
hurled | -0.739 |
Token | made |
Token ID | 925 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
olson | +4.581 |
dit | +3.996 |
� | +3.906 |
ctl | +3.793 |
advertising | +3.752 |
Neg logit contributions | |
whence | -2.735 |
PLIED | -2.722 |
forgiveness | -2.323 |
repre | -2.097 |
accus | -2.068 |
Token | it |
Token ID | 340 |
Feature activation | +7.28e-01 |
Pos logit contributions | |
olson | +15.472 |
customs | +12.972 |
advertising | +12.245 |
item | +12.028 |
dit | +12.006 |
Neg logit contributions | |
PLIED | -14.434 |
whence | -13.630 |
repre | -12.131 |
aught | -11.528 |
srfAttach | -11.343 |
Token | harder |
Token ID | 7069 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
olson | +8.494 |
� | +7.326 |
dit | +7.076 |
advertising | +6.901 |
ctl | +6.874 |
Neg logit contributions | |
PLIED | -5.172 |
whence | -5.146 |
forgiveness | -4.347 |
Applied | -3.970 |
aught | -3.920 |
Token | for |
Token ID | 329 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
olson | +2.151 |
dit | +1.752 |
� | +1.740 |
ctl | +1.645 |
advertising | +1.613 |
Neg logit contributions | |
PLIED | -2.381 |
whence | -2.369 |
forgiveness | -2.119 |
accus | -2.003 |
hurled | -1.999 |
Token | screen |
Token ID | 3159 |
Feature activation | +3.88e-01 |
Pos logit contributions | |
olson | +3.296 |
dit | +2.701 |
� | +2.625 |
ctl | +2.547 |
advertising | +2.513 |
Neg logit contributions | |
PLIED | -3.338 |
whence | -3.300 |
forgiveness | -2.928 |
repre | -2.798 |
aught | -2.754 |
Token | ers |
Token ID | 364 |
Feature activation | -7.38e-02 |
Pos logit contributions | |
olson | +4.168 |
� | +3.596 |
dit | +3.560 |
advertising | +3.388 |
ctl | +3.348 |
Neg logit contributions | |
whence | -3.310 |
PLIED | -3.296 |
forgiveness | -2.846 |
repre | -2.701 |
Applied | -2.687 |
Token | Beat |
Token ID | 12568 |
Feature activation | +7.81e-01 |
Pos logit contributions | |
whence | +2.288 |
PLIED | +2.245 |
forgiveness | +2.022 |
accus | +1.882 |
where | +1.855 |
Neg logit contributions | |
olson | -2.891 |
dit | -2.459 |
� | -2.416 |
ctl | -2.301 |
advertising | -2.294 |
Token | rice |
Token ID | 20970 |
Feature activation | +5.03e-01 |
Pos logit contributions | |
olson | +6.068 |
dit | +5.014 |
� | +4.819 |
undo | +4.373 |
ctl | +4.363 |
Neg logit contributions | |
PLIED | -8.575 |
whence | -8.468 |
forgiveness | -7.691 |
cropped | -7.297 |
flared | -7.288 |
Token | Joyce |
Token ID | 25936 |
Feature activation | +4.87e-02 |
Pos logit contributions | |
olson | +5.140 |
dit | +4.335 |
� | +4.222 |
ctl | +4.032 |
advertising | +4.006 |
Neg logit contributions | |
PLIED | -4.515 |
whence | -4.402 |
forgiveness | -3.941 |
repre | -3.710 |
accus | -3.675 |
Token | Ke |
Token ID | 3873 |
Feature activation | +7.35e-01 |
Pos logit contributions | |
olson | +0.532 |
dit | +0.449 |
� | +0.441 |
ctl | +0.423 |
advertising | +0.419 |
Neg logit contributions | |
PLIED | -0.427 |
whence | -0.426 |
forgiveness | -0.380 |
accus | -0.352 |
repre | -0.347 |
Token | an |
Token ID | 272 |
Feature activation | -5.59e-02 |
Pos logit contributions | |
olson | +6.528 |
dit | +5.183 |
ctl | +5.030 |
undo | +4.984 |
advertising | +4.949 |
Neg logit contributions | |
PLIED | -7.453 |
whence | -7.430 |
forgiveness | -6.781 |
flared | -6.435 |
hurled | -6.420 |
Token | set |
Token ID | 900 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
whence | +0.504 |
PLIED | +0.500 |
forgiveness | +0.449 |
accus | +0.419 |
hurled | +0.410 |
Neg logit contributions | |
olson | -0.600 |
dit | -0.504 |
� | -0.495 |
ctl | -0.471 |
advertising | -0.471 |
Token | up |
Token ID | 510 |
Feature activation | -8.92e-03 |
Pos logit contributions | |
olson | +15.317 |
dit | +13.082 |
Guinness | +12.191 |
ctl | +12.062 |
customs | +11.799 |
Neg logit contributions | |
PLIED | -14.873 |
whence | -14.062 |
repre | -12.902 |
forgiveness | -12.198 |
ateral | -12.081 |
Token | the |
Token ID | 262 |
Feature activation | +3.77e-01 |
Pos logit contributions | |
whence | +0.080 |
PLIED | +0.080 |
forgiveness | +0.071 |
accus | +0.067 |
hurled | +0.066 |
Neg logit contributions | |
olson | -0.095 |
dit | -0.081 |
� | -0.079 |
ctl | -0.075 |
advertising | -0.075 |
Token | Joyce |
Token ID | 25936 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
olson | +3.980 |
dit | +3.385 |
� | +3.286 |
ctl | +3.168 |
advertising | +3.125 |
Neg logit contributions | |
PLIED | -3.321 |
whence | -3.263 |
forgiveness | -2.844 |
hurled | -2.703 |
repre | -2.681 |
Token | Foundation |
Token ID | 5693 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
olson | +3.707 |
dit | +3.164 |
� | +3.092 |
advertising | +2.976 |
ctl | +2.970 |
Neg logit contributions | |
whence | -2.717 |
PLIED | -2.716 |
forgiveness | -2.360 |
hurled | -2.215 |
accus | -2.205 |
Token | in |
Token ID | 287 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
olson | +1.123 |
dit | +0.943 |
� | +0.924 |
ctl | +0.880 |
advertising | +0.879 |
Neg logit contributions | |
PLIED | -1.034 |
whence | -1.022 |
forgiveness | -0.922 |
accus | -0.866 |
hurled | -0.853 |
Token | – |
Token ID | 784 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
whence | +2.234 |
PLIED | +2.194 |
forgiveness | +1.976 |
accus | +1.841 |
where | +1.814 |
Neg logit contributions | |
olson | -2.783 |
dit | -2.365 |
� | -2.323 |
ctl | -2.212 |
advertising | -2.204 |
Token | even |
Token ID | 772 |
Feature activation | -5.63e-01 |
Pos logit contributions | |
whence | +3.138 |
PLIED | +3.067 |
forgiveness | +2.783 |
accus | +2.591 |
where | +2.583 |
Neg logit contributions | |
olson | -3.743 |
dit | -3.177 |
� | -3.117 |
ctl | -2.971 |
advertising | -2.949 |
Token | after |
Token ID | 706 |
Feature activation | -5.74e-01 |
Pos logit contributions | |
whence | +5.033 |
PLIED | +4.840 |
forgiveness | +4.490 |
where | +4.257 |
accus | +4.154 |
Neg logit contributions | |
olson | -5.969 |
dit | -5.056 |
� | -5.028 |
ctl | -4.779 |
advertising | -4.726 |
Token | you |
Token ID | 345 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
whence | +4.814 |
PLIED | +4.601 |
forgiveness | +4.266 |
where | +3.983 |
accus | +3.915 |
Neg logit contributions | |
olson | -6.373 |
dit | -5.442 |
� | -5.367 |
advertising | -5.102 |
ctl | -5.102 |
Token | know |
Token ID | 760 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
whence | +2.271 |
PLIED | +2.224 |
forgiveness | +2.004 |
accus | +1.865 |
where | +1.843 |
Neg logit contributions | |
olson | -2.918 |
dit | -2.479 |
� | -2.440 |
advertising | -2.323 |
ctl | -2.321 |
Token | exactly |
Token ID | 3446 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
whence | +12.357 |
where | +11.157 |
PLIED | +10.169 |
forgiveness | +10.146 |
Applied | +9.084 |
Neg logit contributions | |
olson | -17.726 |
� | -15.271 |
dit | -15.223 |
undo | -14.595 |
Quantity | -14.507 |
Token | what |
Token ID | 644 |
Feature activation | -4.75e-01 |
Pos logit contributions | |
whence | +13.187 |
where | +12.578 |
forgiveness | +8.993 |
PLIED | +8.690 |
Where | +8.517 |
Neg logit contributions | |
olson | -23.429 |
dit | -20.363 |
� | -20.083 |
advertising | -19.757 |
undo | -19.625 |
Token | to |
Token ID | 284 |
Feature activation | -3.45e-01 |
Pos logit contributions | |
whence | +3.687 |
PLIED | +3.590 |
forgiveness | +3.230 |
where | +2.984 |
accus | +2.974 |
Neg logit contributions | |
olson | -5.603 |
dit | -4.836 |
� | -4.746 |
advertising | -4.542 |
ctl | -4.515 |
Token | expect |
Token ID | 1607 |
Feature activation | -4.35e-01 |
Pos logit contributions | |
whence | +2.879 |
PLIED | +2.781 |
forgiveness | +2.521 |
accus | +2.359 |
where | +2.355 |
Neg logit contributions | |
olson | -3.918 |
dit | -3.361 |
� | -3.305 |
advertising | -3.157 |
ctl | -3.134 |
Token | next |
Token ID | 1306 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
whence | +3.627 |
PLIED | +3.504 |
forgiveness | +3.180 |
where | +2.973 |
accus | +2.952 |
Neg logit contributions | |
olson | -4.947 |
dit | -4.225 |
� | -4.179 |
advertising | -3.961 |
ctl | -3.960 |
Token | . |
Token ID | 13 |
Feature activation | -3.98e-02 |
Pos logit contributions | |
whence | +1.715 |
PLIED | +1.692 |
forgiveness | +1.520 |
accus | +1.417 |
where | +1.388 |
Neg logit contributions | |
olson | -2.106 |
dit | -1.787 |
� | -1.753 |
ctl | -1.673 |
advertising | -1.665 |
Token | moved |
Token ID | 3888 |
Feature activation | +6.00e-02 |
Pos logit contributions | |
PLIED | +0.738 |
whence | +0.738 |
forgiveness | +0.659 |
accus | +0.615 |
Applied | +0.599 |
Neg logit contributions | |
olson | -0.829 |
dit | -0.705 |
� | -0.683 |
ctl | -0.654 |
advertising | -0.644 |
Token | to |
Token ID | 284 |
Feature activation | -5.62e-01 |
Pos logit contributions | |
olson | +0.622 |
dit | +0.523 |
� | +0.513 |
ctl | +0.484 |
advertising | +0.483 |
Neg logit contributions | |
whence | -0.559 |
PLIED | -0.558 |
forgiveness | -0.500 |
accus | -0.468 |
hurled | -0.460 |
Token | the |
Token ID | 262 |
Feature activation | -9.96e-01 |
Pos logit contributions | |
whence | +4.800 |
PLIED | +4.662 |
forgiveness | +4.253 |
where | +4.033 |
accus | +3.964 |
Neg logit contributions | |
olson | -6.136 |
dit | -5.233 |
� | -5.146 |
advertising | -4.946 |
ctl | -4.942 |
Token | right |
Token ID | 826 |
Feature activation | -6.08e-01 |
Pos logit contributions | |
whence | +7.021 |
PLIED | +6.652 |
forgiveness | +6.166 |
where | +5.794 |
accus | +5.710 |
Neg logit contributions | |
olson | -11.849 |
dit | -10.286 |
� | -10.250 |
ctl | -9.780 |
advertising | -9.728 |
Token | , |
Token ID | 11 |
Feature activation | -3.54e-01 |
Pos logit contributions | |
whence | +5.516 |
PLIED | +5.306 |
forgiveness | +4.858 |
where | +4.702 |
accus | +4.556 |
Neg logit contributions | |
olson | -6.314 |
dit | -5.323 |
� | -5.245 |
advertising | -5.045 |
ctl | -5.020 |
Token | over |
Token ID | 625 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
whence | +3.866 |
PLIED | +3.791 |
forgiveness | +3.500 |
where | +3.312 |
accus | +3.311 |
Neg logit contributions | |
olson | -3.125 |
dit | -2.539 |
� | -2.462 |
ctl | -2.330 |
advertising | -2.311 |
Token | time |
Token ID | 640 |
Feature activation | -6.08e-01 |
Pos logit contributions | |
whence | +17.455 |
where | +16.074 |
PLIED | +15.482 |
forgiveness | +15.362 |
accus | +14.137 |
Neg logit contributions | |
olson | -17.823 |
dit | -14.923 |
� | -14.057 |
ctl | -13.716 |
undo | -13.403 |
Token | . |
Token ID | 13 |
Feature activation | +7.88e-02 |
Pos logit contributions | |
whence | +5.220 |
PLIED | +5.006 |
forgiveness | +4.614 |
where | +4.354 |
accus | +4.267 |
Neg logit contributions | |
olson | -6.636 |
dit | -5.678 |
� | -5.516 |
ctl | -5.315 |
advertising | -5.271 |
Token | And |
Token ID | 843 |
Feature activation | +2.54e-01 |
Pos logit contributions | |
olson | +0.784 |
dit | +0.655 |
� | +0.648 |
advertising | +0.608 |
ctl | +0.607 |
Neg logit contributions | |
whence | -0.770 |
PLIED | -0.760 |
forgiveness | -0.692 |
accus | -0.650 |
hurled | -0.644 |
Token | , |
Token ID | 11 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
olson | +2.688 |
dit | +2.275 |
� | +2.246 |
advertising | +2.125 |
ctl | +2.117 |
Neg logit contributions | |
PLIED | -2.275 |
whence | -2.244 |
forgiveness | -1.979 |
accus | -1.858 |
hurled | -1.839 |
Token | after |
Token ID | 706 |
Feature activation | -5.69e-01 |
Pos logit contributions | |
whence | +1.815 |
PLIED | +1.779 |
forgiveness | +1.608 |
accus | +1.500 |
where | +1.480 |
Neg logit contributions | |
olson | -2.215 |
dit | -1.877 |
� | -1.843 |
ctl | -1.756 |
advertising | -1.748 |
Token | Thomas |
Token ID | 5658 |
Feature activation | +2.32e-02 |
Pos logit contributions | |
olson | +1.114 |
dit | +0.957 |
� | +0.935 |
ctl | +0.895 |
advertising | +0.890 |
Neg logit contributions | |
whence | -0.833 |
PLIED | -0.829 |
forgiveness | -0.728 |
accus | -0.680 |
hurled | -0.669 |
Token | , |
Token ID | 11 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
olson | +0.244 |
� | +0.203 |
dit | +0.203 |
ctl | +0.192 |
advertising | +0.190 |
Neg logit contributions | |
whence | -0.214 |
PLIED | -0.214 |
forgiveness | -0.191 |
accus | -0.177 |
hurled | -0.175 |
Token | who |
Token ID | 508 |
Feature activation | -6.63e-03 |
Pos logit contributions | |
whence | +2.489 |
PLIED | +2.439 |
forgiveness | +2.205 |
accus | +2.059 |
where | +2.039 |
Neg logit contributions | |
olson | -2.999 |
dit | -2.543 |
� | -2.490 |
ctl | -2.375 |
advertising | -2.363 |
Token | earned |
Token ID | 7366 |
Feature activation | -6.87e-01 |
Pos logit contributions | |
whence | +0.058 |
PLIED | +0.057 |
forgiveness | +0.051 |
accus | +0.047 |
hurled | +0.046 |
Neg logit contributions | |
olson | -0.073 |
dit | -0.062 |
� | -0.061 |
ctl | -0.059 |
advertising | -0.058 |
Token | her |
Token ID | 607 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
whence | +5.307 |
PLIED | +5.203 |
forgiveness | +4.853 |
where | +4.452 |
Applied | +4.354 |
Neg logit contributions | |
olson | -7.925 |
dit | -6.750 |
� | -6.619 |
advertising | -6.434 |
ctl | -6.420 |
Token | masters |
Token ID | 18159 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
PLIED | +7.931 |
whence | +7.915 |
forgiveness | +7.431 |
where | +6.983 |
Applied | +6.954 |
Neg logit contributions | |
olson | -12.007 |
dit | -10.230 |
� | -9.767 |
advertising | -9.711 |
ctl | -9.683 |
Token | in |
Token ID | 287 |
Feature activation | -7.38e-01 |
Pos logit contributions | |
whence | +15.081 |
PLIED | +14.770 |
where | +14.391 |
forgiveness | +13.958 |
Applied | +13.604 |
Neg logit contributions | |
olson | -18.729 |
dit | -16.123 |
advertising | -15.167 |
nex | -14.436 |
� | -14.371 |
Token | environmental |
Token ID | 6142 |
Feature activation | -6.46e-01 |
Pos logit contributions | |
whence | +6.700 |
PLIED | +6.499 |
forgiveness | +6.068 |
Applied | +5.778 |
where | +5.708 |
Neg logit contributions | |
olson | -7.514 |
dit | -6.356 |
� | -6.240 |
advertising | -5.903 |
ctl | -5.862 |
Token | science |
Token ID | 3783 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
whence | +5.497 |
PLIED | +5.342 |
forgiveness | +4.917 |
where | +4.564 |
accus | +4.502 |
Neg logit contributions | |
olson | -7.094 |
dit | -6.072 |
� | -6.006 |
ctl | -5.640 |
advertising | -5.615 |
Token | from |
Token ID | 422 |
Feature activation | -6.16e-01 |
Pos logit contributions | |
whence | +12.085 |
PLIED | +11.766 |
where | +11.211 |
forgiveness | +10.802 |
Applied | +10.050 |
Neg logit contributions | |
olson | -18.072 |
dit | -15.399 |
� | -14.906 |
advertising | -14.676 |
Quantity | -14.482 |
Token | Yale |
Token ID | 19681 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
whence | +5.288 |
PLIED | +5.158 |
forgiveness | +4.664 |
where | +4.419 |
Applied | +4.340 |
Neg logit contributions | |
olson | -6.719 |
dit | -5.717 |
� | -5.649 |
ctl | -5.399 |
advertising | -5.378 |
Token | are |
Token ID | 389 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
whence | +0.691 |
PLIED | +0.681 |
forgiveness | +0.609 |
accus | +0.565 |
hurled | +0.555 |
Neg logit contributions | |
olson | -0.865 |
dit | -0.729 |
� | -0.724 |
ctl | -0.689 |
advertising | -0.684 |
Token | far |
Token ID | 1290 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
whence | +1.486 |
PLIED | +1.460 |
forgiveness | +1.314 |
accus | +1.223 |
where | +1.205 |
Neg logit contributions | |
olson | -1.888 |
dit | -1.607 |
� | -1.579 |
ctl | -1.504 |
advertising | -1.500 |
Token | fewer |
Token ID | 7380 |
Feature activation | -5.04e-01 |
Pos logit contributions | |
whence | +7.278 |
PLIED | +6.968 |
forgiveness | +6.314 |
where | +6.091 |
accus | +5.817 |
Neg logit contributions | |
olson | -13.186 |
� | -11.705 |
dit | -11.630 |
advertising | -11.402 |
ctl | -11.229 |
Token | universities |
Token ID | 11155 |
Feature activation | -7.42e-01 |
Pos logit contributions | |
whence | +4.064 |
PLIED | +3.944 |
forgiveness | +3.605 |
where | +3.379 |
accus | +3.338 |
Neg logit contributions | |
olson | -5.827 |
dit | -4.990 |
� | -4.918 |
advertising | -4.713 |
ctl | -4.661 |
Token | that |
Token ID | 326 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
whence | +6.168 |
PLIED | +5.785 |
where | +5.434 |
forgiveness | +5.309 |
accus | +5.023 |
Neg logit contributions | |
olson | -8.271 |
dit | -7.118 |
� | -6.970 |
advertising | -6.604 |
ctl | -6.499 |
Token | offer |
Token ID | 2897 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
whence | +8.822 |
PLIED | +8.493 |
where | +8.198 |
forgiveness | +7.725 |
Applied | +7.549 |
Neg logit contributions | |
olson | -14.503 |
� | -12.480 |
dit | -12.434 |
advertising | -12.258 |
Quantity | -11.768 |
Token | Ph |
Token ID | 1380 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
whence | +13.438 |
Applied | +13.183 |
PLIED | +13.176 |
forgiveness | +13.063 |
where | +12.731 |
Neg logit contributions | |
olson | -19.799 |
dit | -17.115 |
� | -16.441 |
advertising | -15.985 |
undo | -15.671 |
Token | . |
Token ID | 13 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
whence | +7.471 |
PLIED | +7.231 |
where | +7.006 |
forgiveness | +6.384 |
aught | +6.173 |
Neg logit contributions | |
olson | -17.662 |
� | -15.814 |
dit | -15.785 |
ichick | -15.253 |
ovych | -14.701 |
Token | Ds |
Token ID | 30832 |
Feature activation | -6.74e-01 |
Pos logit contributions | |
whence | +8.020 |
PLIED | +7.918 |
where | +7.215 |
Applied | +7.038 |
forgiveness | +6.873 |
Neg logit contributions | |
olson | -12.398 |
� | -10.344 |
ovych | -9.977 |
dit | -9.944 |
ichick | -9.913 |
Token | . |
Token ID | 13 |
Feature activation | -2.76e-01 |
Pos logit contributions | |
whence | +5.844 |
PLIED | +5.705 |
forgiveness | +5.156 |
where | +4.938 |
accus | +4.803 |
Neg logit contributions | |
olson | -7.267 |
dit | -6.180 |
� | -6.036 |
advertising | -5.806 |
ctl | -5.764 |
Token | We |
Token ID | 775 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
whence | +2.484 |
PLIED | +2.441 |
forgiveness | +2.202 |
accus | +2.058 |
where | +2.046 |
Neg logit contributions | |
olson | -2.954 |
dit | -2.503 |
� | -2.452 |
ctl | -2.338 |
advertising | -2.332 |
Token | Huang |
Token ID | 31663 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
olson | +9.085 |
dit | +7.731 |
� | +7.500 |
ctl | +7.064 |
advertising | +7.052 |
Neg logit contributions | |
PLIED | -8.262 |
whence | -7.917 |
forgiveness | -7.191 |
accus | -6.772 |
flared | -6.757 |
Token | , |
Token ID | 11 |
Feature activation | -5.09e-01 |
Pos logit contributions | |
whence | +1.236 |
PLIED | +1.222 |
forgiveness | +1.103 |
accus | +1.031 |
hurled | +1.016 |
Neg logit contributions | |
olson | -1.367 |
dit | -1.150 |
� | -1.132 |
ctl | -1.072 |
advertising | -1.060 |
Token | a |
Token ID | 257 |
Feature activation | -6.15e-01 |
Pos logit contributions | |
whence | +4.460 |
PLIED | +4.355 |
forgiveness | +3.943 |
where | +3.679 |
accus | +3.659 |
Neg logit contributions | |
olson | -5.546 |
dit | -4.705 |
� | -4.621 |
advertising | -4.427 |
ctl | -4.390 |
Token | junior |
Token ID | 13430 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
whence | +5.054 |
PLIED | +4.939 |
forgiveness | +4.500 |
Applied | +4.238 |
where | +4.204 |
Neg logit contributions | |
olson | -6.871 |
dit | -5.841 |
� | -5.781 |
advertising | -5.587 |
ctl | -5.458 |
Token | computer |
Token ID | 3644 |
Feature activation | -9.88e-01 |
Pos logit contributions | |
whence | +9.711 |
PLIED | +9.672 |
forgiveness | +8.952 |
Applied | +8.734 |
where | +8.594 |
Neg logit contributions | |
olson | -11.521 |
dit | -9.849 |
� | -9.744 |
advertising | -9.488 |
Quantity | -9.145 |
Token | science |
Token ID | 3783 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
whence | +6.934 |
PLIED | +6.689 |
forgiveness | +6.041 |
where | +5.759 |
Applied | +5.701 |
Neg logit contributions | |
olson | -11.656 |
dit | -10.262 |
� | -10.024 |
advertising | -9.628 |
Quantity | -9.624 |
Token | major |
Token ID | 1688 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
whence | +11.769 |
PLIED | +10.811 |
where | +10.689 |
forgiveness | +10.598 |
Applied | +10.090 |
Neg logit contributions | |
olson | -21.741 |
� | -18.536 |
dit | -18.322 |
advertising | -18.147 |
Quantity | -17.872 |
Token | ; |
Token ID | 26 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
whence | +10.667 |
PLIED | +10.273 |
forgiveness | +9.356 |
where | +9.354 |
Applied | +8.827 |
Neg logit contributions | |
olson | -15.411 |
dit | -13.187 |
advertising | -12.807 |
� | -12.629 |
ctl | -12.306 |
Token | Michael |
Token ID | 3899 |
Feature activation | +5.25e-01 |
Pos logit contributions | |
whence | +4.622 |
PLIED | +4.473 |
forgiveness | +4.077 |
accus | +3.793 |
where | +3.793 |
Neg logit contributions | |
olson | -6.321 |
dit | -5.343 |
� | -5.271 |
advertising | -5.065 |
ctl | -5.047 |
Token | Shin |
Token ID | 11466 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
olson | +5.397 |
dit | +4.608 |
� | +4.458 |
ctl | +4.233 |
advertising | +4.203 |
Neg logit contributions | |
PLIED | -4.713 |
whence | -4.628 |
forgiveness | -4.184 |
accus | -3.918 |
cropped | -3.891 |
Token | , |
Token ID | 11 |
Feature activation | -3.93e-01 |
Pos logit contributions | |
olson | +2.318 |
dit | +1.906 |
� | +1.898 |
ctl | +1.761 |
undo | +1.750 |
Neg logit contributions | |
whence | -2.300 |
PLIED | -2.274 |
forgiveness | -2.063 |
accus | -1.916 |
hurled | -1.907 |
Token | lowest |
Token ID | 9016 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
whence | +9.720 |
PLIED | +9.208 |
forgiveness | +8.814 |
where | +8.391 |
accus | +8.327 |
Neg logit contributions | |
olson | -12.075 |
dit | -10.262 |
� | -9.884 |
undo | -9.488 |
advertising | -9.254 |
Token | - |
Token ID | 12 |
Feature activation | -6.50e-01 |
Pos logit contributions | |
whence | +10.149 |
PLIED | +9.574 |
forgiveness | +8.973 |
where | +8.866 |
hurled | +8.364 |
Neg logit contributions | |
olson | -14.062 |
dit | -12.505 |
� | -11.838 |
undo | -11.560 |
ctl | -11.312 |
Token | priced |
Token ID | 30883 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
whence | +6.559 |
PLIED | +6.434 |
forgiveness | +5.886 |
where | +5.744 |
repre | +5.606 |
Neg logit contributions | |
olson | -5.896 |
dit | -4.846 |
� | -4.833 |
ctl | -4.482 |
undo | -4.332 |
Token | models |
Token ID | 4981 |
Feature activation | -6.91e-01 |
Pos logit contributions | |
whence | +9.330 |
PLIED | +8.464 |
forgiveness | +8.244 |
accus | +8.049 |
where | +7.934 |
Neg logit contributions | |
olson | -12.897 |
dit | -10.908 |
� | -10.620 |
undo | -10.266 |
advertising | -10.056 |
Token | cost |
Token ID | 1575 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
whence | +5.715 |
PLIED | +5.438 |
forgiveness | +4.998 |
where | +4.830 |
accus | +4.698 |
Neg logit contributions | |
olson | -7.711 |
dit | -6.602 |
� | -6.457 |
advertising | -6.136 |
ctl | -6.034 |
Token | far |
Token ID | 1290 |
Feature activation | -2.04e+00 |
Pos logit contributions | |
whence | +7.897 |
PLIED | +7.604 |
forgiveness | +6.935 |
where | +6.857 |
accus | +6.557 |
Neg logit contributions | |
olson | -11.022 |
dit | -9.582 |
� | -9.287 |
undo | -8.874 |
ctl | -8.794 |
Token | more |
Token ID | 517 |
Feature activation | -8.12e-02 |
Pos logit contributions | |
whence | +11.806 |
where | +10.489 |
PLIED | +10.070 |
forgiveness | +9.517 |
farther | +9.261 |
Neg logit contributions | |
olson | -21.615 |
dit | -18.767 |
� | -18.300 |
ctl | -17.898 |
undo | -17.495 |
Token | than |
Token ID | 621 |
Feature activation | -6.45e-01 |
Pos logit contributions | |
whence | +0.772 |
PLIED | +0.763 |
forgiveness | +0.689 |
accus | +0.646 |
hurled | +0.637 |
Neg logit contributions | |
olson | -0.828 |
dit | -0.696 |
� | -0.682 |
ctl | -0.651 |
advertising | -0.647 |
Token | Dev |
Token ID | 6245 |
Feature activation | +3.06e-01 |
Pos logit contributions | |
whence | +5.307 |
PLIED | +5.042 |
forgiveness | +4.664 |
where | +4.416 |
accus | +4.373 |
Neg logit contributions | |
olson | -7.298 |
dit | -6.278 |
� | -6.096 |
advertising | -5.837 |
ctl | -5.822 |
Token | ial |
Token ID | 498 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
olson | +2.622 |
dit | +2.114 |
� | +2.058 |
ctl | +1.936 |
advertising | +1.925 |
Neg logit contributions | |
whence | -3.414 |
PLIED | -3.372 |
forgiveness | -3.108 |
accus | -2.942 |
hurled | -2.900 |
Token | et |
Token ID | 316 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
olson | +3.071 |
dit | +2.412 |
� | +2.286 |
ctl | +2.190 |
advertising | +2.131 |
Neg logit contributions | |
whence | -5.174 |
PLIED | -5.115 |
forgiveness | -4.791 |
accus | -4.536 |
hurled | -4.480 |
Token | : |
Token ID | 25 |
Feature activation | -6.12e-01 |
Pos logit contributions | |
olson | +1.596 |
dit | +1.304 |
� | +1.275 |
ctl | +1.194 |
advertising | +1.188 |
Neg logit contributions | |
whence | -1.893 |
PLIED | -1.862 |
forgiveness | -1.713 |
accus | -1.620 |
where | -1.610 |
Token | Chip |
Token ID | 17869 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
whence | +3.797 |
PLIED | +3.517 |
forgiveness | +3.368 |
where | +3.132 |
Applied | +2.916 |
Neg logit contributions | |
olson | -8.030 |
dit | -6.974 |
� | -6.836 |
undo | -6.509 |
Quantity | -6.431 |
Token | in |
Token ID | 287 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
whence | +3.923 |
PLIED | +3.834 |
where | +3.465 |
forgiveness | +3.403 |
accus | +3.242 |
Neg logit contributions | |
olson | -6.730 |
dit | -5.925 |
� | -5.801 |
ctl | -5.486 |
advertising | -5.457 |
Token | $ |
Token ID | 720 |
Feature activation | -9.09e-01 |
Pos logit contributions | |
whence | +4.462 |
where | +4.096 |
PLIED | +3.750 |
forgiveness | +3.679 |
Applied | +3.192 |
Neg logit contributions | |
olson | -17.858 |
dit | -15.725 |
� | -15.217 |
undo | -15.001 |
ovych | -14.686 |
Token | 10 |
Token ID | 940 |
Feature activation | -5.52e-01 |
Pos logit contributions | |
whence | +5.425 |
PLIED | +5.386 |
where | +5.077 |
forgiveness | +4.535 |
Applied | +4.158 |
Neg logit contributions | |
olson | -11.109 |
dit | -9.839 |
� | -9.563 |
undo | -9.281 |
livest | -9.185 |
Token | or |
Token ID | 393 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
whence | +5.005 |
PLIED | +4.686 |
where | +4.492 |
forgiveness | +4.451 |
accus | +4.142 |
Neg logit contributions | |
olson | -5.750 |
dit | -4.695 |
� | -4.677 |
undo | -4.337 |
ctl | -4.307 |
Token | more |
Token ID | 517 |
Feature activation | -9.72e-01 |
Pos logit contributions | |
whence | +6.257 |
where | +6.186 |
forgiveness | +4.841 |
farther | +4.620 |
accus | +4.226 |
Neg logit contributions | |
olson | -25.692 |
dit | -23.362 |
� | -22.821 |
ichick | -22.378 |
ctl | -22.165 |
Token | to |
Token ID | 284 |
Feature activation | -8.99e-01 |
Pos logit contributions | |
whence | +5.793 |
where | +5.460 |
PLIED | +5.154 |
forgiveness | +4.812 |
accus | +4.248 |
Neg logit contributions | |
olson | -12.249 |
dit | -10.435 |
� | -10.272 |
undo | -9.934 |
ichick | -9.732 |
Token | help |
Token ID | 1037 |
Feature activation | -3.27e-01 |
Pos logit contributions | |
whence | +3.137 |
PLIED | +2.625 |
forgiveness | +2.571 |
where | +2.566 |
accus | +1.919 |
Neg logit contributions | |
olson | -13.734 |
dit | -12.143 |
� | -11.984 |
Quantity | -11.734 |
advertising | -11.622 |
Token | us |
Token ID | 514 |
Feature activation | -4.11e-01 |
Pos logit contributions | |
whence | +2.368 |
PLIED | +2.260 |
forgiveness | +2.074 |
where | +2.013 |
accus | +1.935 |
Neg logit contributions | |
olson | -4.013 |
dit | -3.465 |
� | -3.419 |
advertising | -3.227 |
ctl | -3.208 |
Token | continue |
Token ID | 2555 |
Feature activation | -6.78e-02 |
Pos logit contributions | |
whence | +2.225 |
PLIED | +2.023 |
forgiveness | +1.858 |
where | +1.817 |
accus | +1.654 |
Neg logit contributions | |
olson | -5.693 |
dit | -5.128 |
� | -5.070 |
advertising | -4.817 |
ctl | -4.772 |
Token | re |
Token ID | 260 |
Feature activation | +3.17e-02 |
Pos logit contributions | |
olson | +0.610 |
dit | +0.506 |
� | +0.483 |
ctl | +0.467 |
advertising | +0.455 |
Neg logit contributions | |
whence | -0.712 |
PLIED | -0.702 |
forgiveness | -0.646 |
accus | -0.605 |
hurled | -0.596 |
Token | the |
Token ID | 262 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
olson | +0.351 |
dit | +0.298 |
� | +0.294 |
ctl | +0.281 |
advertising | +0.281 |
Neg logit contributions | |
whence | -0.275 |
PLIED | -0.271 |
forgiveness | -0.242 |
accus | -0.225 |
hurled | -0.221 |
Token | only |
Token ID | 691 |
Feature activation | -7.92e-01 |
Pos logit contributions | |
whence | +1.285 |
PLIED | +1.260 |
forgiveness | +1.108 |
accus | +1.016 |
hurled | +0.993 |
Neg logit contributions | |
olson | -2.121 |
dit | -1.836 |
� | -1.807 |
ctl | -1.733 |
advertising | -1.728 |
Token | school |
Token ID | 1524 |
Feature activation | -7.92e-01 |
Pos logit contributions | |
whence | +6.528 |
PLIED | +6.392 |
forgiveness | +5.915 |
where | +5.673 |
Applied | +5.543 |
Neg logit contributions | |
olson | -8.608 |
dit | -7.453 |
� | -7.199 |
advertising | -6.831 |
ctl | -6.764 |
Token | that |
Token ID | 326 |
Feature activation | -7.20e-01 |
Pos logit contributions | |
whence | +6.681 |
PLIED | +6.412 |
where | +5.942 |
forgiveness | +5.818 |
accus | +5.451 |
Neg logit contributions | |
olson | -8.589 |
dit | -7.410 |
� | -7.186 |
advertising | -6.854 |
Quantity | -6.673 |
Token | offers |
Token ID | 4394 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
whence | +5.280 |
PLIED | +5.196 |
forgiveness | +4.667 |
where | +4.491 |
accus | +4.342 |
Neg logit contributions | |
olson | -8.407 |
dit | -7.336 |
� | -7.152 |
advertising | -6.922 |
undo | -6.737 |
Token | this |
Token ID | 428 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
whence | +13.068 |
PLIED | +12.775 |
forgiveness | +12.644 |
Applied | +12.433 |
where | +12.298 |
Neg logit contributions | |
olson | -19.432 |
dit | -16.660 |
� | -15.836 |
advertising | -15.663 |
undo | -15.153 |
Token | in |
Token ID | 287 |
Feature activation | -7.92e-01 |
Pos logit contributions | |
whence | +9.944 |
PLIED | +9.732 |
forgiveness | +9.414 |
where | +9.406 |
Applied | +8.900 |
Neg logit contributions | |
olson | -15.009 |
dit | -13.077 |
advertising | -12.451 |
� | -12.421 |
ctl | -11.895 |
Token | San |
Token ID | 2986 |
Feature activation | -6.30e-01 |
Pos logit contributions | |
whence | +6.574 |
PLIED | +6.503 |
forgiveness | +5.860 |
where | +5.533 |
Applied | +5.528 |
Neg logit contributions | |
olson | -8.689 |
dit | -7.413 |
� | -7.134 |
advertising | -6.888 |
undo | -6.839 |
Token | Diego |
Token ID | 9500 |
Feature activation | -3.32e-01 |
Pos logit contributions | |
whence | +5.171 |
PLIED | +5.075 |
forgiveness | +4.589 |
accus | +4.278 |
where | +4.232 |
Neg logit contributions | |
olson | -7.095 |
dit | -6.031 |
� | -5.992 |
advertising | -5.685 |
ctl | -5.664 |
Token | . |
Token ID | 13 |
Feature activation | -5.32e-01 |
Pos logit contributions | |
whence | +2.877 |
PLIED | +2.825 |
forgiveness | +2.539 |
accus | +2.363 |
where | +2.333 |
Neg logit contributions | |
olson | -3.680 |
dit | -3.132 |
� | -3.077 |
ctl | -2.929 |
advertising | -2.922 |
Token | even |
Token ID | 772 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
whence | +2.309 |
PLIED | +2.249 |
forgiveness | +2.033 |
accus | +1.892 |
where | +1.883 |
Neg logit contributions | |
olson | -2.890 |
dit | -2.453 |
� | -2.412 |
ctl | -2.299 |
advertising | -2.287 |
Token | as |
Token ID | 355 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
whence | +2.140 |
PLIED | +2.103 |
forgiveness | +1.920 |
accus | +1.805 |
where | +1.785 |
Neg logit contributions | |
olson | -2.121 |
dit | -1.763 |
� | -1.731 |
ctl | -1.637 |
advertising | -1.629 |
Token | its |
Token ID | 663 |
Feature activation | -9.60e-01 |
Pos logit contributions | |
whence | +1.318 |
PLIED | +1.307 |
forgiveness | +1.183 |
accus | +1.118 |
hurled | +1.091 |
Neg logit contributions | |
olson | -1.300 |
dit | -1.083 |
� | -1.055 |
ctl | -1.003 |
advertising | -0.991 |
Token | bottom |
Token ID | 4220 |
Feature activation | -4.44e-01 |
Pos logit contributions | |
whence | +8.223 |
PLIED | +7.675 |
forgiveness | +7.362 |
where | +6.947 |
accus | +6.884 |
Neg logit contributions | |
olson | -10.153 |
� | -8.771 |
dit | -8.688 |
advertising | -8.221 |
ctl | -8.060 |
Token | ( |
Token ID | 357 |
Feature activation | -4.63e-01 |
Pos logit contributions | |
whence | +4.236 |
PLIED | +4.123 |
forgiveness | +3.770 |
accus | +3.538 |
where | +3.525 |
Neg logit contributions | |
olson | -4.532 |
dit | -3.795 |
� | -3.747 |
advertising | -3.533 |
ctl | -3.526 |
Token | below |
Token ID | 35993 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
whence | +3.623 |
PLIED | +3.528 |
forgiveness | +3.122 |
where | +2.912 |
accus | +2.875 |
Neg logit contributions | |
olson | -5.453 |
dit | -4.659 |
� | -4.635 |
ctl | -4.402 |
advertising | -4.349 |
Token | water |
Token ID | 1660 |
Feature activation | -8.45e-01 |
Pos logit contributions | |
whence | +13.664 |
where | +12.308 |
PLIED | +12.233 |
forgiveness | +11.938 |
shallow | +10.849 |
Neg logit contributions | |
olson | -19.661 |
� | -16.579 |
dit | -16.165 |
advertising | -16.086 |
Quantity | -15.685 |
Token | ) |
Token ID | 8 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
whence | +4.514 |
PLIED | +4.231 |
forgiveness | +3.609 |
where | +3.368 |
accus | +3.184 |
Neg logit contributions | |
olson | -11.879 |
dit | -10.400 |
� | -10.356 |
advertising | -9.969 |
ctl | -9.937 |
Token | rises |
Token ID | 16736 |
Feature activation | -3.22e-01 |
Pos logit contributions | |
whence | +7.640 |
PLIED | +6.786 |
forgiveness | +6.373 |
where | +6.310 |
hurled | +6.033 |
Neg logit contributions | |
olson | -11.566 |
� | -10.206 |
dit | -9.969 |
advertising | -9.448 |
ctl | -9.404 |
Token | up |
Token ID | 510 |
Feature activation | -6.29e-01 |
Pos logit contributions | |
whence | +2.872 |
PLIED | +2.791 |
forgiveness | +2.532 |
accus | +2.363 |
where | +2.351 |
Neg logit contributions | |
olson | -3.504 |
dit | -2.960 |
� | -2.926 |
ctl | -2.777 |
advertising | -2.774 |
Token | to |
Token ID | 284 |
Feature activation | -7.36e-01 |
Pos logit contributions | |
whence | +5.342 |
PLIED | +5.031 |
forgiveness | +4.612 |
where | +4.430 |
accus | +4.296 |
Neg logit contributions | |
olson | -7.032 |
� | -5.917 |
dit | -5.910 |
advertising | -5.632 |
ctl | -5.608 |
Token | over |
Token ID | 625 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
whence | +4.638 |
PLIED | +4.470 |
forgiveness | +4.014 |
where | +3.879 |
accus | +3.752 |
Neg logit contributions | |
olson | -6.415 |
dit | -5.503 |
� | -5.371 |
advertising | -5.148 |
ctl | -5.119 |
Token | and |
Token ID | 290 |
Feature activation | -5.90e-01 |
Pos logit contributions | |
whence | +12.596 |
PLIED | +12.125 |
where | +11.613 |
forgiveness | +11.103 |
shallow | +10.770 |
Neg logit contributions | |
olson | -16.475 |
dit | -14.340 |
� | -13.758 |
advertising | -13.573 |
ctl | -13.228 |
Token | over |
Token ID | 625 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
whence | +4.934 |
PLIED | +4.777 |
forgiveness | +4.273 |
where | +4.082 |
accus | +3.968 |
Neg logit contributions | |
olson | -6.671 |
dit | -5.666 |
� | -5.565 |
ctl | -5.299 |
advertising | -5.279 |
Token | again |
Token ID | 757 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
whence | +8.114 |
PLIED | +7.410 |
where | +6.982 |
forgiveness | +6.816 |
accus | +6.319 |
Neg logit contributions | |
olson | -13.702 |
dit | -11.748 |
� | -11.616 |
advertising | -11.320 |
ctl | -11.092 |
Token | . |
Token ID | 13 |
Feature activation | -4.32e-01 |
Pos logit contributions | |
whence | +2.456 |
PLIED | +2.401 |
forgiveness | +2.168 |
accus | +2.021 |
where | +2.012 |
Neg logit contributions | |
olson | -3.059 |
dit | -2.603 |
� | -2.553 |
ctl | -2.432 |
advertising | -2.427 |
Token | Over |
Token ID | 3827 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
whence | +3.914 |
PLIED | +3.817 |
forgiveness | +3.431 |
where | +3.278 |
Applied | +3.241 |
Neg logit contributions | |
olson | -4.575 |
dit | -3.864 |
� | -3.755 |
ctl | -3.608 |
advertising | -3.581 |
Token | 55 |
Token ID | 5996 |
Feature activation | -7.60e-01 |
Pos logit contributions | |
whence | +15.606 |
where | +14.463 |
PLIED | +14.439 |
forgiveness | +13.563 |
cropped | +13.013 |
Neg logit contributions | |
olson | -16.835 |
dit | -13.934 |
� | -13.406 |
advertising | -13.104 |
ctl | -12.939 |
Token | days |
Token ID | 1528 |
Feature activation | +3.02e-02 |
Pos logit contributions | |
whence | +5.967 |
PLIED | +5.791 |
forgiveness | +5.260 |
where | +5.069 |
accus | +5.028 |
Neg logit contributions | |
olson | -8.536 |
dit | -7.405 |
� | -7.087 |
advertising | -6.898 |
ctl | -6.731 |
Token | in |
Token ID | 287 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
olson | +0.313 |
dit | +0.262 |
� | +0.261 |
ctl | +0.245 |
advertising | +0.242 |
Neg logit contributions | |
PLIED | -0.281 |
whence | -0.281 |
forgiveness | -0.252 |
accus | -0.235 |
hurled | -0.230 |
Token | the |
Token ID | 262 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
whence | +1.976 |
PLIED | +1.942 |
forgiveness | +1.739 |
accus | +1.614 |
where | +1.585 |
Neg logit contributions | |
olson | -2.659 |
dit | -2.272 |
� | -2.233 |
ctl | -2.131 |
advertising | -2.124 |
Token | late |
Token ID | 2739 |
Feature activation | -6.80e-01 |
Pos logit contributions | |
whence | +2.169 |
PLIED | +2.125 |
forgiveness | +1.896 |
accus | +1.755 |
where | +1.725 |
Neg logit contributions | |
olson | -3.168 |
dit | -2.726 |
� | -2.685 |
ctl | -2.566 |
advertising | -2.561 |
Token | garbage |
Token ID | 15413 |
Feature activation | -3.71e-01 |
Pos logit contributions | |
whence | +0.372 |
PLIED | +0.371 |
forgiveness | +0.331 |
accus | +0.308 |
Applied | +0.299 |
Neg logit contributions | |
olson | -0.453 |
dit | -0.388 |
� | -0.379 |
ctl | -0.363 |
advertising | -0.358 |
Token | and |
Token ID | 290 |
Feature activation | -2.45e-01 |
Pos logit contributions | |
whence | +3.120 |
PLIED | +3.039 |
forgiveness | +2.730 |
accus | +2.538 |
where | +2.528 |
Neg logit contributions | |
olson | -4.219 |
dit | -3.598 |
� | -3.547 |
ctl | -3.377 |
advertising | -3.371 |
Token | diver |
Token ID | 12312 |
Feature activation | +5.69e-01 |
Pos logit contributions | |
whence | +2.120 |
PLIED | +2.075 |
forgiveness | +1.871 |
accus | +1.739 |
where | +1.720 |
Neg logit contributions | |
olson | -2.719 |
dit | -2.309 |
� | -2.272 |
ctl | -2.162 |
advertising | -2.159 |
Token | ting |
Token ID | 889 |
Feature activation | -3.46e-01 |
Pos logit contributions | |
olson | +2.387 |
dit | +1.708 |
� | +1.338 |
ctl | +1.338 |
advertising | +1.151 |
Neg logit contributions | |
PLIED | -8.584 |
whence | -8.440 |
forgiveness | -8.017 |
accus | -7.724 |
Applied | -7.640 |
Token | the |
Token ID | 262 |
Feature activation | -8.65e-01 |
Pos logit contributions | |
whence | +2.996 |
PLIED | +2.930 |
forgiveness | +2.641 |
accus | +2.456 |
where | +2.433 |
Neg logit contributions | |
olson | -3.844 |
dit | -3.261 |
� | -3.210 |
advertising | -3.062 |
ctl | -3.056 |
Token | creek |
Token ID | 39459 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
whence | +6.108 |
PLIED | +5.745 |
forgiveness | +5.188 |
where | +4.864 |
accus | +4.750 |
Neg logit contributions | |
olson | -10.671 |
� | -9.044 |
dit | -9.032 |
advertising | -8.837 |
ctl | -8.618 |
Token | water |
Token ID | 1660 |
Feature activation | -4.88e-01 |
Pos logit contributions | |
whence | +12.682 |
where | +10.805 |
PLIED | +10.306 |
forgiveness | +10.293 |
shallow | +9.327 |
Neg logit contributions | |
olson | -21.620 |
dit | -18.141 |
� | -17.892 |
advertising | -17.736 |
undo | -17.288 |
Token | so |
Token ID | 523 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
whence | +4.271 |
PLIED | +4.068 |
forgiveness | +3.727 |
where | +3.522 |
accus | +3.461 |
Neg logit contributions | |
olson | -5.414 |
dit | -4.561 |
� | -4.513 |
advertising | -4.298 |
ctl | -4.297 |
Token | as |
Token ID | 355 |
Feature activation | -3.34e-01 |
Pos logit contributions | |
whence | +2.487 |
PLIED | +2.451 |
forgiveness | +2.220 |
accus | +2.078 |
where | +2.044 |
Neg logit contributions | |
olson | -2.741 |
dit | -2.305 |
� | -2.260 |
ctl | -2.147 |
advertising | -2.137 |
Token | to |
Token ID | 284 |
Feature activation | -3.16e-01 |
Pos logit contributions | |
whence | +3.002 |
PLIED | +2.952 |
forgiveness | +2.664 |
accus | +2.486 |
where | +2.447 |
Neg logit contributions | |
olson | -3.600 |
dit | -3.049 |
� | -2.993 |
ctl | -2.849 |
advertising | -2.839 |
Token | facilitate |
Token ID | 15570 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
whence | +2.858 |
PLIED | +2.782 |
forgiveness | +2.538 |
accus | +2.366 |
where | +2.364 |
Neg logit contributions | |
olson | -3.376 |
dit | -2.846 |
� | -2.808 |
advertising | -2.674 |
ctl | -2.669 |
Token | and |
Token ID | 290 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
whence | +1.833 |
PLIED | +1.804 |
forgiveness | +1.619 |
accus | +1.505 |
where | +1.478 |
Neg logit contributions | |
olson | -2.344 |
dit | -1.996 |
� | -1.961 |
ctl | -1.871 |
advertising | -1.862 |
Token | the |
Token ID | 262 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
olson | +1.250 |
dit | +1.059 |
� | +1.046 |
ctl | +0.992 |
advertising | +0.973 |
Neg logit contributions | |
whence | -1.044 |
PLIED | -1.038 |
forgiveness | -0.925 |
accus | -0.849 |
repre | -0.846 |
Token | media |
Token ID | 2056 |
Feature activation | -1.56e-01 |
Pos logit contributions | |
olson | +1.326 |
dit | +1.128 |
� | +1.100 |
ctl | +1.048 |
advertising | +1.034 |
Neg logit contributions | |
whence | -1.156 |
PLIED | -1.153 |
forgiveness | -1.023 |
repre | -0.942 |
aught | -0.940 |
Token | ( |
Token ID | 357 |
Feature activation | -4.14e-01 |
Pos logit contributions | |
whence | +1.390 |
PLIED | +1.370 |
forgiveness | +1.233 |
accus | +1.148 |
where | +1.128 |
Neg logit contributions | |
olson | -1.683 |
dit | -1.427 |
� | -1.401 |
ctl | -1.336 |
advertising | -1.328 |
Token | I |
Token ID | 40 |
Feature activation | -5.94e-01 |
Pos logit contributions | |
whence | +4.206 |
PLIED | +4.114 |
forgiveness | +3.779 |
accus | +3.575 |
where | +3.565 |
Neg logit contributions | |
olson | -3.912 |
dit | -3.220 |
� | -3.171 |
ctl | -2.986 |
advertising | -2.942 |
Token | know |
Token ID | 760 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
whence | +5.182 |
PLIED | +5.039 |
forgiveness | +4.628 |
accus | +4.389 |
where | +4.347 |
Neg logit contributions | |
olson | -6.353 |
dit | -5.329 |
� | -5.149 |
advertising | -5.092 |
ctl | -5.007 |
Token | , |
Token ID | 11 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
whence | +14.450 |
where | +13.084 |
forgiveness | +12.416 |
PLIED | +12.070 |
accus | +11.863 |
Neg logit contributions | |
olson | -19.180 |
dit | -15.799 |
advertising | -15.320 |
� | -15.121 |
Quantity | -15.068 |
Token | that |
Token ID | 326 |
Feature activation | -4.42e-02 |
Pos logit contributions | |
whence | +1.703 |
PLIED | +1.681 |
forgiveness | +1.513 |
accus | +1.411 |
where | +1.387 |
Neg logit contributions | |
olson | -2.009 |
dit | -1.702 |
� | -1.672 |
ctl | -1.588 |
advertising | -1.581 |
Token | � |
Token ID | 447 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
whence | +0.445 |
PLIED | +0.441 |
forgiveness | +0.399 |
accus | +0.373 |
hurled | +0.368 |
Neg logit contributions | |
olson | -0.426 |
dit | -0.355 |
� | -0.351 |
ctl | -0.329 |
advertising | -0.327 |
Token | � |
Token ID | 247 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
whence | +1.415 |
PLIED | +1.397 |
forgiveness | +1.273 |
accus | +1.198 |
where | +1.180 |
Neg logit contributions | |
olson | -1.350 |
dit | -1.121 |
� | -1.099 |
ctl | -1.038 |
advertising | -1.033 |
Token | s |
Token ID | 82 |
Feature activation | -8.88e-01 |
Pos logit contributions | |
whence | +3.864 |
PLIED | +3.787 |
forgiveness | +3.457 |
accus | +3.255 |
where | +3.227 |
Neg logit contributions | |
olson | -4.138 |
dit | -3.443 |
� | -3.394 |
ctl | -3.211 |
advertising | -3.207 |
Token | , |
Token ID | 11 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
olson | +0.638 |
dit | +0.550 |
� | +0.530 |
ctl | +0.513 |
advertising | +0.504 |
Neg logit contributions | |
whence | -0.523 |
PLIED | -0.522 |
forgiveness | -0.465 |
accus | -0.428 |
Applied | -0.426 |
Token | there |
Token ID | 612 |
Feature activation | -4.22e-01 |
Pos logit contributions | |
whence | +7.627 |
PLIED | +7.186 |
where | +6.636 |
forgiveness | +6.593 |
accus | +6.328 |
Neg logit contributions | |
olson | -11.833 |
� | -10.025 |
dit | -9.895 |
advertising | -9.634 |
Quantity | -9.367 |
Token | are |
Token ID | 389 |
Feature activation | -1.95e-02 |
Pos logit contributions | |
whence | +4.386 |
PLIED | +4.331 |
forgiveness | +3.984 |
accus | +3.770 |
where | +3.753 |
Neg logit contributions | |
olson | -3.904 |
dit | -3.206 |
� | -3.133 |
advertising | -2.947 |
ctl | -2.940 |
Token | ways |
Token ID | 2842 |
Feature activation | -7.69e-01 |
Pos logit contributions | |
whence | +0.174 |
PLIED | +0.172 |
forgiveness | +0.153 |
accus | +0.142 |
Applied | +0.141 |
Neg logit contributions | |
olson | -0.209 |
dit | -0.177 |
� | -0.173 |
ctl | -0.167 |
advertising | -0.163 |
Token | this |
Token ID | 428 |
Feature activation | -5.50e-01 |
Pos logit contributions | |
whence | +6.223 |
PLIED | +5.955 |
forgiveness | +5.579 |
where | +5.389 |
accus | +5.163 |
Neg logit contributions | |
olson | -8.746 |
dit | -7.421 |
� | -7.290 |
advertising | -7.011 |
ctl | -6.867 |
Token | could |
Token ID | 714 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
whence | +4.135 |
PLIED | +4.027 |
forgiveness | +3.707 |
where | +3.427 |
accus | +3.424 |
Neg logit contributions | |
olson | -6.592 |
dit | -5.718 |
� | -5.617 |
advertising | -5.358 |
ctl | -5.307 |
Token | have |
Token ID | 423 |
Feature activation | -9.81e-01 |
Pos logit contributions | |
whence | +11.221 |
where | +10.933 |
PLIED | +10.663 |
flared | +10.177 |
forgiveness | +10.106 |
Neg logit contributions | |
olson | -19.454 |
� | -17.883 |
dit | -17.658 |
advertising | -17.341 |
Quantity | -16.980 |
Token | been |
Token ID | 587 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
whence | +7.046 |
PLIED | +6.745 |
forgiveness | +6.267 |
flared | +6.064 |
where | +6.022 |
Neg logit contributions | |
olson | -11.452 |
dit | -10.077 |
� | -10.059 |
ctl | -9.476 |
advertising | -9.423 |
Token | handled |
Token ID | 12118 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
whence | +5.836 |
PLIED | +5.774 |
forgiveness | +5.493 |
where | +5.126 |
hurled | +4.927 |
Neg logit contributions | |
olson | -13.961 |
dit | -12.322 |
� | -12.256 |
advertising | -11.837 |
ctl | -11.830 |
Token | without |
Token ID | 1231 |
Feature activation | -8.41e-01 |
Pos logit contributions | |
whence | +1.492 |
PLIED | +1.463 |
forgiveness | +1.301 |
accus | +1.200 |
where | +1.179 |
Neg logit contributions | |
olson | -2.244 |
dit | -1.931 |
� | -1.900 |
ctl | -1.818 |
advertising | -1.813 |
Token | striking |
Token ID | 8871 |
Feature activation | +5.99e-01 |
Pos logit contributions | |
whence | +6.599 |
PLIED | +6.372 |
forgiveness | +6.101 |
where | +5.783 |
accus | +5.672 |
Neg logit contributions | |
olson | -9.542 |
� | -8.110 |
dit | -8.100 |
ctl | -7.665 |
advertising | -7.632 |
Token | — |
Token ID | 851 |
Feature activation | +4.44e-01 |
Pos logit contributions | |
olson | +5.419 |
dit | +4.425 |
� | +4.365 |
advertising | +4.231 |
ctl | +4.186 |
Neg logit contributions | |
PLIED | -5.700 |
whence | -5.466 |
forgiveness | -4.968 |
repre | -4.747 |
accus | -4.705 |
Token | but |
Token ID | 475 |
Feature activation | +5.74e-01 |
Pos logit contributions | |
olson | +4.686 |
dit | +3.938 |
� | +3.890 |
advertising | +3.728 |
ctl | +3.631 |
Neg logit contributions | |
PLIED | -3.876 |
whence | -3.802 |
forgiveness | -3.402 |
accus | -3.234 |
repre | -3.202 |
Token | as |
Token ID | 355 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
olson | +5.830 |
dit | +4.843 |
� | +4.784 |
ctl | +4.589 |
advertising | +4.536 |
Neg logit contributions | |
PLIED | -5.239 |
whence | -4.887 |
forgiveness | -4.335 |
repre | -4.180 |
accus | -4.121 |
Token | the |
Token ID | 262 |
Feature activation | +3.45e-01 |
Pos logit contributions | |
olson | +2.142 |
dit | +1.815 |
� | +1.764 |
ctl | +1.693 |
advertising | +1.676 |
Neg logit contributions | |
PLIED | -1.894 |
whence | -1.869 |
forgiveness | -1.648 |
accus | -1.552 |
repre | -1.544 |
Token | housing |
Token ID | 5627 |
Feature activation | -3.77e-01 |
Pos logit contributions | |
olson | +3.642 |
dit | +3.086 |
� | +2.968 |
ctl | +2.873 |
advertising | +2.849 |
Neg logit contributions | |
PLIED | -3.082 |
whence | -3.002 |
forgiveness | -2.647 |
repre | -2.479 |
accus | -2.459 |
Token | slump |
Token ID | 37758 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
whence | +3.106 |
PLIED | +2.999 |
forgiveness | +2.721 |
where | +2.512 |
accus | +2.511 |
Neg logit contributions | |
olson | -4.349 |
dit | -3.730 |
� | -3.679 |
ctl | -3.505 |
advertising | -3.496 |
Token | and |
Token ID | 290 |
Feature activation | +4.02e-01 |
Pos logit contributions | |
whence | +13.083 |
where | +11.570 |
flared | +11.539 |
cropped | +11.294 |
hurled | +11.214 |
Neg logit contributions | |
olson | -19.487 |
� | -17.912 |
dit | -17.488 |
Quantity | -16.114 |
advertising | -16.111 |
Token | the |
Token ID | 262 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
olson | +4.142 |
dit | +3.528 |
� | +3.421 |
ctl | +3.334 |
undo | +3.233 |
Neg logit contributions | |
PLIED | -3.622 |
whence | -3.513 |
forgiveness | -3.067 |
repre | -2.908 |
accus | -2.890 |
Token | associated |
Token ID | 3917 |
Feature activation | +6.18e-01 |
Pos logit contributions | |
olson | +4.619 |
dit | +3.945 |
� | +3.809 |
ctl | +3.714 |
advertising | +3.638 |
Neg logit contributions | |
PLIED | -3.846 |
whence | -3.747 |
forgiveness | -3.223 |
repre | -3.040 |
aught | -3.029 |
Token | credit |
Token ID | 3884 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
olson | +6.258 |
dit | +5.336 |
� | +5.169 |
ctl | +5.068 |
undo | +4.946 |
Neg logit contributions | |
PLIED | -5.509 |
whence | -5.285 |
forgiveness | -4.495 |
repre | -4.317 |
aught | -4.292 |
Token | crunch |
Token ID | 23527 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
whence | +8.235 |
forgiveness | +7.498 |
PLIED | +7.359 |
where | +7.043 |
cropped | +6.636 |
Neg logit contributions | |
olson | -12.975 |
� | -11.350 |
dit | -11.098 |
advertising | -10.652 |
undo | -10.330 |
Token | Al |
Token ID | 978 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
olson | +5.929 |
dit | +5.014 |
� | +4.868 |
advertising | +4.689 |
ctl | +4.604 |
Neg logit contributions | |
PLIED | -5.576 |
whence | -5.547 |
forgiveness | -4.877 |
accus | -4.648 |
hurled | -4.551 |
Token | now |
Token ID | 783 |
Feature activation | +6.56e-01 |
Pos logit contributions | |
olson | +10.219 |
� | +8.711 |
dit | +8.597 |
advertising | +7.957 |
undo | +7.922 |
Neg logit contributions | |
PLIED | -9.354 |
whence | -9.067 |
forgiveness | -8.294 |
repre | -7.684 |
accus | -7.538 |
Token | . |
Token ID | 13 |
Feature activation | +7.75e-03 |
Pos logit contributions | |
olson | +6.037 |
dit | +5.020 |
� | +5.000 |
advertising | +4.662 |
ctl | +4.655 |
Neg logit contributions | |
PLIED | -6.308 |
whence | -6.230 |
forgiveness | -5.687 |
repre | -5.265 |
accus | -5.243 |
Token | And |
Token ID | 843 |
Feature activation | +2.15e-01 |
Pos logit contributions | |
olson | +0.082 |
dit | +0.070 |
� | +0.069 |
advertising | +0.065 |
ctl | +0.065 |
Neg logit contributions | |
whence | -0.070 |
PLIED | -0.070 |
forgiveness | -0.063 |
accus | -0.059 |
hurled | -0.058 |
Token | you |
Token ID | 345 |
Feature activation | -9.24e-03 |
Pos logit contributions | |
olson | +2.322 |
dit | +1.973 |
� | +1.933 |
advertising | +1.862 |
ctl | +1.844 |
Neg logit contributions | |
PLIED | -1.891 |
whence | -1.845 |
forgiveness | -1.633 |
accus | -1.521 |
repre | -1.505 |
Token | know |
Token ID | 760 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
whence | +0.095 |
PLIED | +0.094 |
forgiveness | +0.085 |
accus | +0.080 |
hurled | +0.079 |
Neg logit contributions | |
olson | -0.087 |
dit | -0.073 |
� | -0.072 |
ctl | -0.067 |
advertising | -0.067 |
Token | how |
Token ID | 703 |
Feature activation | +4.05e-01 |
Pos logit contributions | |
whence | +13.038 |
where | +12.011 |
forgiveness | +10.490 |
accus | +9.610 |
PLIED | +9.591 |
Neg logit contributions | |
olson | -19.698 |
� | -17.057 |
dit | -16.727 |
ctl | -16.180 |
Quantity | -16.112 |
Token | Batman |
Token ID | 9827 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
olson | +4.302 |
dit | +3.599 |
� | +3.547 |
ctl | +3.423 |
advertising | +3.417 |
Neg logit contributions | |
PLIED | -3.578 |
whence | -3.494 |
forgiveness | -3.020 |
repre | -2.834 |
aught | -2.827 |
Token | has |
Token ID | 468 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
olson | +3.720 |
dit | +3.123 |
� | +3.108 |
ctl | +2.975 |
advertising | +2.954 |
Neg logit contributions | |
PLIED | -3.143 |
whence | -3.121 |
forgiveness | -2.741 |
accus | -2.526 |
repre | -2.522 |
Token | always |
Token ID | 1464 |
Feature activation | +7.05e-01 |
Pos logit contributions | |
olson | +11.224 |
dit | +9.597 |
� | +9.303 |
ctl | +9.173 |
advertising | +8.850 |
Neg logit contributions | |
PLIED | -9.507 |
whence | -8.943 |
forgiveness | -7.424 |
repre | -7.310 |
aught | -7.176 |
Token | driven |
Token ID | 7986 |
Feature activation | +7.15e-01 |
Pos logit contributions | |
olson | +7.092 |
dit | +5.875 |
� | +5.700 |
ctl | +5.610 |
advertising | +5.591 |
Neg logit contributions | |
PLIED | -6.202 |
whence | -6.125 |
forgiveness | -5.357 |
repre | -5.119 |
srfAttach | -5.044 |
Token | Kh |
Token ID | 5311 |
Feature activation | -6.59e-02 |
Pos logit contributions | |
whence | +3.319 |
PLIED | +3.219 |
forgiveness | +2.934 |
accus | +2.734 |
where | +2.705 |
Neg logit contributions | |
olson | -4.370 |
dit | -3.722 |
� | -3.661 |
ctl | -3.499 |
advertising | -3.486 |
Token | ark |
Token ID | 668 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
whence | +0.812 |
PLIED | +0.800 |
forgiveness | +0.743 |
where | +0.711 |
accus | +0.709 |
Neg logit contributions | |
olson | -0.482 |
dit | -0.377 |
� | -0.372 |
ctl | -0.340 |
advertising | -0.334 |
Token | iv |
Token ID | 452 |
Feature activation | -4.89e-01 |
Pos logit contributions | |
olson | +7.465 |
dit | +5.738 |
� | +5.305 |
ctl | +5.261 |
undo | +5.096 |
Neg logit contributions | |
PLIED | -12.352 |
whence | -11.886 |
forgiveness | -11.076 |
flared | -10.578 |
cropped | -10.495 |
Token | businesses |
Token ID | 5692 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
whence | +4.506 |
PLIED | +4.368 |
forgiveness | +4.007 |
accus | +3.773 |
where | +3.753 |
Neg logit contributions | |
olson | -5.101 |
dit | -4.321 |
� | -4.258 |
ctl | -4.024 |
advertising | -3.997 |
Token | that |
Token ID | 326 |
Feature activation | -5.05e-01 |
Pos logit contributions | |
whence | +1.162 |
PLIED | +1.157 |
forgiveness | +1.030 |
accus | +0.957 |
hurled | +0.933 |
Neg logit contributions | |
olson | -1.489 |
dit | -1.268 |
� | -1.244 |
ctl | -1.193 |
advertising | -1.179 |
Token | received |
Token ID | 2722 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
whence | +4.019 |
PLIED | +3.855 |
forgiveness | +3.502 |
where | +3.275 |
accus | +3.264 |
Neg logit contributions | |
olson | -5.909 |
dit | -5.043 |
� | -4.989 |
advertising | -4.805 |
ctl | -4.725 |
Token | Priv |
Token ID | 9243 |
Feature activation | -8.55e-01 |
Pos logit contributions | |
whence | +13.605 |
forgiveness | +13.073 |
Loans | +12.432 |
PLIED | +12.130 |
where | +12.035 |
Neg logit contributions | |
olson | -18.055 |
dit | -15.465 |
� | -15.025 |
ctl | -14.490 |
advertising | -14.457 |
Token | at |
Token ID | 265 |
Feature activation | -3.98e-01 |
Pos logit contributions | |
whence | +5.833 |
PLIED | +5.800 |
forgiveness | +5.330 |
where | +5.309 |
aught | +5.105 |
Neg logit contributions | |
olson | -9.584 |
� | -8.534 |
dit | -8.065 |
advertising | -7.595 |
ctl | -7.545 |
Token | bank |
Token ID | 17796 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
whence | +2.951 |
PLIED | +2.852 |
forgiveness | +2.574 |
where | +2.380 |
accus | +2.334 |
Neg logit contributions | |
olson | -4.815 |
dit | -4.126 |
� | -4.119 |
ctl | -3.902 |
advertising | -3.870 |
Token | loans |
Token ID | 10021 |
Feature activation | -4.66e-01 |
Pos logit contributions | |
whence | +9.465 |
forgiveness | +8.971 |
PLIED | +8.793 |
Loans | +8.178 |
where | +7.982 |
Neg logit contributions | |
olson | -16.279 |
dit | -14.040 |
� | -13.719 |
ctl | -13.290 |
advertising | -13.130 |
Token | are |
Token ID | 389 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
whence | +3.766 |
PLIED | +3.637 |
forgiveness | +3.304 |
where | +3.050 |
accus | +3.040 |
Neg logit contributions | |
olson | -5.421 |
dit | -4.639 |
� | -4.594 |
advertising | -4.368 |
ctl | -4.352 |
Token | CC |
Token ID | 4093 |
Feature activation | -4.35e-01 |
Pos logit contributions | |
whence | +3.188 |
PLIED | +3.141 |
forgiveness | +2.850 |
accus | +2.675 |
where | +2.648 |
Neg logit contributions | |
olson | -3.338 |
dit | -2.791 |
� | -2.739 |
ctl | -2.593 |
advertising | -2.590 |
Token | As |
Token ID | 1081 |
Feature activation | -5.44e-01 |
Pos logit contributions | |
whence | +3.965 |
PLIED | +3.884 |
forgiveness | +3.526 |
accus | +3.316 |
where | +3.288 |
Neg logit contributions | |
olson | -4.573 |
dit | -3.839 |
� | -3.796 |
ctl | -3.578 |
advertising | -3.569 |
Token | king |
Token ID | 3364 |
Feature activation | -5.50e-01 |
Pos logit contributions | |
whence | +5.185 |
PLIED | +5.086 |
forgiveness | +4.646 |
accus | +4.443 |
Applied | +4.397 |
Neg logit contributions | |
olson | -5.373 |
� | -4.414 |
dit | -4.404 |
ctl | -4.171 |
advertising | -4.146 |
Token | Koch |
Token ID | 17009 |
Feature activation | -5.04e-01 |
Pos logit contributions | |
whence | +4.801 |
PLIED | +4.606 |
forgiveness | +4.261 |
where | +3.992 |
accus | +3.980 |
Neg logit contributions | |
olson | -5.996 |
� | -5.016 |
dit | -4.996 |
ctl | -4.736 |
advertising | -4.664 |
Token | s |
Token ID | 82 |
Feature activation | -6.30e-01 |
Pos logit contributions | |
whence | +5.425 |
PLIED | +5.280 |
forgiveness | +4.913 |
accus | +4.688 |
where | +4.665 |
Neg logit contributions | |
olson | -4.435 |
dit | -3.551 |
� | -3.522 |
ctl | -3.326 |
advertising | -3.247 |
Token | for |
Token ID | 329 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
whence | +5.506 |
PLIED | +5.257 |
forgiveness | +4.864 |
where | +4.586 |
accus | +4.525 |
Neg logit contributions | |
olson | -6.840 |
dit | -5.699 |
� | -5.665 |
ctl | -5.410 |
advertising | -5.325 |
Token | Cash |
Token ID | 16210 |
Feature activation | -5.54e-01 |
Pos logit contributions | |
whence | +13.471 |
forgiveness | +12.674 |
PLIED | +12.287 |
Applied | +12.121 |
where | +11.911 |
Neg logit contributions | |
olson | -17.947 |
� | -14.789 |
dit | -14.360 |
Quantity | -14.088 |
ctl | -13.895 |
Token | � |
Token ID | 447 |
Feature activation | +5.64e-02 |
Pos logit contributions | |
whence | +5.087 |
PLIED | +4.937 |
forgiveness | +4.549 |
where | +4.265 |
accus | +4.239 |
Neg logit contributions | |
olson | -5.737 |
dit | -4.780 |
� | -4.706 |
ctl | -4.512 |
advertising | -4.454 |
Token | � |
Token ID | 251 |
Feature activation | -2.51e-01 |
Pos logit contributions | |
olson | +0.513 |
dit | +0.422 |
� | +0.415 |
ctl | +0.388 |
advertising | +0.387 |
Neg logit contributions | |
whence | -0.597 |
PLIED | -0.595 |
forgiveness | -0.537 |
accus | -0.509 |
hurled | -0.502 |
Token | ( |
Token ID | 357 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
whence | +2.394 |
PLIED | +2.355 |
forgiveness | +2.139 |
accus | +2.006 |
where | +1.980 |
Neg logit contributions | |
olson | -2.570 |
dit | -2.153 |
� | -2.113 |
ctl | -2.004 |
advertising | -1.997 |
Token | Polit |
Token ID | 39866 |
Feature activation | +2.99e-01 |
Pos logit contributions | |
whence | +4.118 |
PLIED | +4.063 |
forgiveness | +3.699 |
accus | +3.501 |
where | +3.493 |
Neg logit contributions | |
olson | -3.652 |
dit | -2.974 |
� | -2.935 |
ctl | -2.766 |
advertising | -2.716 |
Token | well |
Token ID | 880 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
whence | +5.631 |
PLIED | +5.407 |
forgiveness | +5.055 |
where | +4.719 |
accus | +4.691 |
Neg logit contributions | |
olson | -7.166 |
dit | -5.989 |
� | -5.933 |
ctl | -5.624 |
advertising | -5.599 |
Token | , |
Token ID | 11 |
Feature activation | -3.02e-01 |
Pos logit contributions | |
whence | +2.742 |
PLIED | +2.687 |
forgiveness | +2.439 |
accus | +2.281 |
where | +2.260 |
Neg logit contributions | |
olson | -3.117 |
dit | -2.624 |
� | -2.575 |
ctl | -2.447 |
advertising | -2.435 |
Token | and |
Token ID | 290 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
whence | +2.626 |
PLIED | +2.563 |
forgiveness | +2.318 |
accus | +2.158 |
where | +2.137 |
Neg logit contributions | |
olson | -3.349 |
dit | -2.841 |
� | -2.790 |
ctl | -2.663 |
advertising | -2.651 |
Token | tells |
Token ID | 4952 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
olson | +1.111 |
dit | +0.946 |
� | +0.928 |
ctl | +0.887 |
advertising | +0.879 |
Neg logit contributions | |
PLIED | -0.900 |
whence | -0.900 |
forgiveness | -0.789 |
accus | -0.738 |
hurled | -0.724 |
Token | you |
Token ID | 345 |
Feature activation | -8.79e-01 |
Pos logit contributions | |
whence | +0.853 |
PLIED | +0.843 |
forgiveness | +0.734 |
accus | +0.675 |
hurled | +0.664 |
Neg logit contributions | |
olson | -1.370 |
dit | -1.189 |
� | -1.169 |
ctl | -1.124 |
advertising | -1.116 |
Token | exactly |
Token ID | 3446 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
whence | +7.278 |
PLIED | +6.689 |
forgiveness | +6.380 |
where | +6.297 |
accus | +5.828 |
Neg logit contributions | |
olson | -9.777 |
dit | -8.288 |
� | -8.092 |
advertising | -7.701 |
ctl | -7.628 |
Token | how |
Token ID | 703 |
Feature activation | +7.31e-02 |
Pos logit contributions | |
whence | +11.546 |
where | +10.608 |
forgiveness | +8.508 |
PLIED | +8.077 |
accus | +7.836 |
Neg logit contributions | |
olson | -21.822 |
dit | -18.616 |
� | -18.158 |
advertising | -18.075 |
Quantity | -17.859 |
Token | to |
Token ID | 284 |
Feature activation | -2.06e-01 |
Pos logit contributions | |
olson | +0.757 |
dit | +0.638 |
� | +0.628 |
ctl | +0.599 |
advertising | +0.587 |
Neg logit contributions | |
whence | -0.679 |
PLIED | -0.674 |
forgiveness | -0.599 |
accus | -0.559 |
hurled | -0.554 |
Token | improve |
Token ID | 2987 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
whence | +1.885 |
PLIED | +1.838 |
forgiveness | +1.682 |
accus | +1.569 |
where | +1.563 |
Neg logit contributions | |
olson | -2.179 |
dit | -1.843 |
� | -1.807 |
advertising | -1.725 |
ctl | -1.708 |
Token | . |
Token ID | 13 |
Feature activation | -5.93e-02 |
Pos logit contributions | |
whence | +2.624 |
PLIED | +2.562 |
forgiveness | +2.343 |
where | +2.177 |
accus | +2.174 |
Neg logit contributions | |
olson | -3.110 |
dit | -2.632 |
� | -2.577 |
ctl | -2.450 |
advertising | -2.448 |
Token | Let |
Token ID | 3914 |
Feature activation | +5.74e-01 |
Pos logit contributions | |
whence | +0.544 |
PLIED | +0.537 |
forgiveness | +0.485 |
accus | +0.453 |
hurled | +0.445 |
Neg logit contributions | |
olson | -0.625 |
dit | -0.529 |
� | -0.520 |
ctl | -0.494 |
advertising | -0.492 |
Token | . |
Token ID | 13 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
olson | +2.740 |
dit | +2.298 |
� | +2.236 |
ctl | +2.151 |
advertising | +2.129 |
Neg logit contributions | |
PLIED | -2.546 |
whence | -2.508 |
forgiveness | -2.271 |
accus | -2.090 |
repre | -2.065 |
Token | His |
Token ID | 2399 |
Feature activation | -6.88e-01 |
Pos logit contributions | |
olson | +1.406 |
dit | +1.202 |
� | +1.185 |
advertising | +1.127 |
ctl | +1.122 |
Neg logit contributions | |
whence | -1.090 |
PLIED | -1.082 |
forgiveness | -0.968 |
accus | -0.903 |
repre | -0.885 |
Token | curl |
Token ID | 29249 |
Feature activation | -8.97e-01 |
Pos logit contributions | |
whence | +5.646 |
PLIED | +5.278 |
forgiveness | +5.068 |
where | +4.736 |
accus | +4.692 |
Neg logit contributions | |
olson | -7.650 |
dit | -6.596 |
� | -6.473 |
ctl | -6.163 |
advertising | -6.124 |
Token | routes |
Token ID | 11926 |
Feature activation | -8.28e-01 |
Pos logit contributions | |
whence | +7.360 |
PLIED | +6.815 |
forgiveness | +6.521 |
where | +6.345 |
accus | +6.103 |
Neg logit contributions | |
olson | -9.716 |
dit | -8.186 |
� | -8.135 |
ctl | -7.686 |
advertising | -7.684 |
Token | require |
Token ID | 2421 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
whence | +6.730 |
PLIED | +6.302 |
forgiveness | +5.854 |
where | +5.783 |
cropped | +5.546 |
Neg logit contributions | |
olson | -9.196 |
dit | -7.842 |
� | -7.764 |
advertising | -7.366 |
ctl | -7.296 |
Token | far |
Token ID | 1290 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
whence | +8.208 |
forgiveness | +7.617 |
PLIED | +7.613 |
where | +7.185 |
accus | +6.950 |
Neg logit contributions | |
olson | -11.213 |
dit | -9.656 |
� | -9.449 |
advertising | -9.400 |
ctl | -9.168 |
Token | too |
Token ID | 1165 |
Feature activation | -6.60e-01 |
Pos logit contributions | |
whence | +11.471 |
forgiveness | +10.230 |
where | +10.088 |
PLIED | +9.881 |
accus | +9.281 |
Neg logit contributions | |
olson | -19.020 |
advertising | -16.984 |
� | -16.856 |
dit | -16.744 |
ctl | -16.543 |
Token | many |
Token ID | 867 |
Feature activation | -4.40e-01 |
Pos logit contributions | |
whence | +5.779 |
PLIED | +5.516 |
forgiveness | +5.222 |
where | +4.897 |
accus | +4.885 |
Neg logit contributions | |
olson | -6.959 |
dit | -6.010 |
� | -5.838 |
advertising | -5.593 |
ctl | -5.577 |
Token | steps |
Token ID | 4831 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
whence | +3.556 |
PLIED | +3.419 |
forgiveness | +3.158 |
accus | +2.918 |
where | +2.899 |
Neg logit contributions | |
olson | -5.102 |
dit | -4.373 |
� | -4.319 |
advertising | -4.145 |
ctl | -4.116 |
Token | , |
Token ID | 11 |
Feature activation | -9.06e-01 |
Pos logit contributions | |
whence | +1.431 |
PLIED | +1.412 |
forgiveness | +1.271 |
accus | +1.186 |
where | +1.161 |
Neg logit contributions | |
olson | -1.708 |
dit | -1.447 |
� | -1.419 |
ctl | -1.351 |
advertising | -1.344 |
Token | allowing |
Token ID | 5086 |
Feature activation | -4.73e-01 |
Pos logit contributions | |
whence | +7.533 |
PLIED | +6.997 |
forgiveness | +6.607 |
where | +6.482 |
hurled | +6.144 |
Neg logit contributions | |
olson | -9.827 |
dit | -8.482 |
� | -8.153 |
advertising | -8.018 |
ctl | -7.936 |
Token | � |
Token ID | 447 |
Feature activation | +4.88e-02 |
Pos logit contributions | |
whence | +6.339 |
PLIED | +6.170 |
forgiveness | +5.765 |
accus | +5.432 |
where | +5.424 |
Neg logit contributions | |
olson | -6.691 |
dit | -5.540 |
� | -5.289 |
advertising | -5.214 |
ctl | -5.160 |
Token | � |
Token ID | 247 |
Feature activation | -1.44e-01 |
Pos logit contributions | |
olson | +0.480 |
dit | +0.400 |
� | +0.392 |
ctl | +0.371 |
advertising | +0.369 |
Neg logit contributions | |
whence | -0.484 |
PLIED | -0.477 |
forgiveness | -0.435 |
accus | -0.408 |
where | -0.403 |
Token | d |
Token ID | 67 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
whence | +1.477 |
PLIED | +1.453 |
forgiveness | +1.333 |
accus | +1.257 |
where | +1.242 |
Neg logit contributions | |
olson | -1.358 |
dit | -1.119 |
� | -1.094 |
ctl | -1.031 |
advertising | -1.031 |
Token | rather |
Token ID | 2138 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
whence | +1.306 |
PLIED | +1.291 |
forgiveness | +1.157 |
accus | +1.074 |
hurled | +1.057 |
Neg logit contributions | |
olson | -1.599 |
dit | -1.364 |
� | -1.335 |
ctl | -1.272 |
advertising | -1.260 |
Token | not |
Token ID | 407 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
whence | +0.889 |
PLIED | +0.879 |
forgiveness | +0.784 |
accus | +0.728 |
hurled | +0.716 |
Neg logit contributions | |
olson | -1.126 |
dit | -0.959 |
� | -0.942 |
ctl | -0.899 |
advertising | -0.892 |
Token | know |
Token ID | 760 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
whence | +1.331 |
PLIED | +1.312 |
forgiveness | +1.175 |
accus | +1.091 |
where | +1.072 |
Neg logit contributions | |
olson | -1.707 |
dit | -1.454 |
� | -1.429 |
ctl | -1.363 |
advertising | -1.356 |
Token | ). |
Token ID | 737 |
Feature activation | +7.15e-02 |
Pos logit contributions | |
whence | +14.228 |
where | +12.812 |
forgiveness | +11.993 |
PLIED | +11.239 |
accus | +10.936 |
Neg logit contributions | |
olson | -18.992 |
dit | -15.433 |
Quantity | -15.112 |
undo | -15.024 |
� | -14.901 |
Token | Team |
Token ID | 4816 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
olson | +0.675 |
dit | +0.557 |
� | +0.551 |
advertising | +0.519 |
ctl | +0.517 |
Neg logit contributions | |
PLIED | -0.728 |
whence | -0.725 |
forgiveness | -0.658 |
accus | -0.621 |
hurled | -0.616 |
Token | Sweden |
Token ID | 10710 |
Feature activation | -5.29e-01 |
Pos logit contributions | |
olson | +4.327 |
dit | +3.471 |
� | +3.414 |
advertising | +3.214 |
ctl | +3.164 |
Neg logit contributions | |
PLIED | -5.537 |
whence | -5.487 |
forgiveness | -4.960 |
repre | -4.717 |
aught | -4.710 |
Token | also |
Token ID | 635 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
whence | +4.323 |
PLIED | +4.158 |
forgiveness | +3.764 |
where | +3.554 |
accus | +3.506 |
Neg logit contributions | |
olson | -6.054 |
dit | -5.167 |
� | -5.062 |
ctl | -4.828 |
advertising | -4.800 |
Token | left |
Token ID | 1364 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
whence | +1.397 |
PLIED | +1.373 |
forgiveness | +1.216 |
accus | +1.119 |
where | +1.094 |
Neg logit contributions | |
olson | -2.159 |
dit | -1.864 |
� | -1.832 |
ctl | -1.756 |
advertising | -1.750 |
Token | is |
Token ID | 318 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
olson | +2.966 |
dit | +2.512 |
� | +2.471 |
advertising | +2.386 |
ctl | +2.382 |
Neg logit contributions | |
PLIED | -2.442 |
whence | -2.418 |
forgiveness | -2.110 |
accus | -1.951 |
hurled | -1.941 |
Token | treated |
Token ID | 5716 |
Feature activation | +2.11e-01 |
Pos logit contributions | |
olson | +1.140 |
dit | +0.976 |
� | +0.962 |
advertising | +0.918 |
ctl | +0.916 |
Neg logit contributions | |
whence | -0.888 |
PLIED | -0.873 |
forgiveness | -0.780 |
accus | -0.718 |
repre | -0.708 |
Token | as |
Token ID | 355 |
Feature activation | +7.64e-01 |
Pos logit contributions | |
olson | +2.308 |
dit | +2.009 |
� | +1.960 |
ctl | +1.895 |
advertising | +1.874 |
Neg logit contributions | |
PLIED | -1.752 |
whence | -1.750 |
forgiveness | -1.550 |
accus | -1.416 |
hurled | -1.410 |
Token | a |
Token ID | 257 |
Feature activation | +6.20e-01 |
Pos logit contributions | |
olson | +7.016 |
dit | +6.059 |
� | +5.767 |
advertising | +5.634 |
customs | +5.530 |
Neg logit contributions | |
PLIED | -6.881 |
whence | -6.861 |
forgiveness | -6.057 |
aught | -5.756 |
repre | -5.701 |
Token | marriage |
Token ID | 4845 |
Feature activation | +9.07e-01 |
Pos logit contributions | |
olson | +6.035 |
dit | +5.183 |
� | +4.980 |
ctl | +4.795 |
advertising | +4.760 |
Neg logit contributions | |
whence | -5.658 |
PLIED | -5.592 |
forgiveness | -4.856 |
aught | -4.650 |
repre | -4.566 |
Token | under |
Token ID | 739 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
olson | +8.369 |
dit | +7.215 |
advertising | +6.631 |
ctl | +6.604 |
� | +6.572 |
Neg logit contributions | |
PLIED | -7.943 |
whence | -7.734 |
forgiveness | -6.965 |
aught | -6.821 |
repre | -6.733 |
Token | the |
Token ID | 262 |
Feature activation | +7.98e-01 |
Pos logit contributions | |
olson | +10.518 |
dit | +9.801 |
customs | +9.044 |
advertising | +8.941 |
ctl | +8.721 |
Neg logit contributions | |
PLIED | -12.267 |
whence | -12.254 |
srfAttach | -10.400 |
forgiveness | -10.282 |
repre | -10.185 |
Token | laws |
Token ID | 3657 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
olson | +6.331 |
dit | +5.544 |
customs | +4.882 |
advertising | +4.866 |
� | +4.782 |
Neg logit contributions | |
PLIED | -8.300 |
whence | -8.293 |
forgiveness | -7.278 |
repre | -7.267 |
aught | -7.149 |
Token | of |
Token ID | 286 |
Feature activation | +4.07e-01 |
Pos logit contributions | |
olson | +2.977 |
dit | +2.537 |
� | +2.447 |
advertising | +2.408 |
ctl | +2.354 |
Neg logit contributions | |
PLIED | -3.104 |
whence | -3.037 |
forgiveness | -2.747 |
accus | -2.605 |
repre | -2.580 |
Token | such |
Token ID | 884 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
olson | +3.904 |
dit | +3.327 |
� | +3.228 |
advertising | +3.151 |
ctl | +3.059 |
Neg logit contributions | |
PLIED | -3.804 |
whence | -3.738 |
forgiveness | -3.382 |
accus | -3.172 |
repre | -3.142 |
Token | other |
Token ID | 584 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
olson | +3.020 |
dit | +2.569 |
� | +2.466 |
advertising | +2.357 |
ctl | +2.338 |
Neg logit contributions | |
PLIED | -3.127 |
whence | -3.077 |
forgiveness | -2.759 |
repre | -2.600 |
accus | -2.583 |
Token | is |
Token ID | 318 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
whence | +2.623 |
PLIED | +2.564 |
forgiveness | +2.325 |
accus | +2.167 |
where | +2.145 |
Neg logit contributions | |
olson | -3.336 |
dit | -2.827 |
� | -2.777 |
ctl | -2.648 |
advertising | -2.644 |
Token | one |
Token ID | 530 |
Feature activation | +4.03e-02 |
Pos logit contributions | |
whence | +1.434 |
PLIED | +1.411 |
forgiveness | +1.267 |
accus | +1.179 |
where | +1.157 |
Neg logit contributions | |
olson | -1.825 |
dit | -1.554 |
� | -1.527 |
ctl | -1.454 |
advertising | -1.450 |
Token | of |
Token ID | 286 |
Feature activation | +2.26e-01 |
Pos logit contributions | |
olson | +0.409 |
� | +0.347 |
dit | +0.347 |
ctl | +0.324 |
advertising | +0.319 |
Neg logit contributions | |
whence | -0.378 |
PLIED | -0.377 |
forgiveness | -0.338 |
accus | -0.314 |
hurled | -0.310 |
Token | the |
Token ID | 262 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
olson | +2.269 |
dit | +1.924 |
� | +1.895 |
advertising | +1.771 |
ctl | +1.768 |
Neg logit contributions | |
PLIED | -2.120 |
whence | -2.116 |
forgiveness | -1.876 |
accus | -1.780 |
repre | -1.777 |
Token | most |
Token ID | 749 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
olson | +6.188 |
dit | +5.445 |
� | +5.405 |
ctl | +5.062 |
advertising | +5.054 |
Neg logit contributions | |
PLIED | -3.388 |
whence | -3.308 |
forgiveness | -2.771 |
repre | -2.540 |
hurled | -2.501 |
Token | defining |
Token ID | 16215 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
olson | +10.729 |
� | +9.326 |
dit | +9.296 |
ctl | +8.741 |
Quantity | +8.465 |
Neg logit contributions | |
whence | -10.023 |
PLIED | -9.907 |
forgiveness | -8.673 |
srfAttach | -8.614 |
Loans | -8.425 |
Token | human |
Token ID | 1692 |
Feature activation | +8.91e-01 |
Pos logit contributions | |
olson | +12.763 |
� | +11.814 |
customs | +10.991 |
dit | +10.854 |
ctl | +10.691 |
Neg logit contributions | |
PLIED | -12.877 |
whence | -12.650 |
repre | -10.878 |
forgiveness | -10.779 |
aught | -10.251 |
Token | behaviors |
Token ID | 14301 |
Feature activation | +4.75e-01 |
Pos logit contributions | |
olson | +8.314 |
� | +7.229 |
dit | +7.109 |
advertising | +6.758 |
ctl | +6.648 |
Neg logit contributions | |
whence | -8.016 |
PLIED | -7.842 |
forgiveness | -6.997 |
repre | -6.774 |
flared | -6.564 |
Token | , |
Token ID | 11 |
Feature activation | +4.28e-01 |
Pos logit contributions | |
olson | +4.558 |
� | +3.833 |
dit | +3.749 |
ctl | +3.531 |
advertising | +3.522 |
Neg logit contributions | |
PLIED | -4.548 |
whence | -4.547 |
forgiveness | -4.076 |
accus | -3.818 |
repre | -3.762 |
Token | � |
Token ID | 447 |
Feature activation | -2.77e-02 |
Pos logit contributions | |
olson | +4.615 |
� | +3.963 |
dit | +3.935 |
advertising | +3.743 |
ctl | +3.660 |
Neg logit contributions | |
PLIED | -3.556 |
whence | -3.482 |
forgiveness | -3.129 |
accus | -2.910 |
repre | -2.853 |
Token | � |
Token ID | 251 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
whence | +0.270 |
PLIED | +0.265 |
forgiveness | +0.242 |
accus | +0.227 |
where | +0.224 |
Neg logit contributions | |
olson | -0.278 |
dit | -0.232 |
� | -0.228 |
ctl | -0.216 |
advertising | -0.215 |
Token | " |
Token ID | 1 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
whence | +0.843 |
PLIED | +0.829 |
forgiveness | +0.754 |
accus | +0.707 |
where | +0.695 |
Neg logit contributions | |
olson | -0.899 |
dit | -0.754 |
� | -0.740 |
ctl | -0.702 |
advertising | -0.701 |
Token | It |
Token ID | 1026 |
Feature activation | +6.58e-01 |
Pos logit contributions | |
whence | +1.252 |
PLIED | +1.235 |
forgiveness | +1.116 |
accus | +1.044 |
where | +1.035 |
Neg logit contributions | |
olson | -1.379 |
dit | -1.159 |
� | -1.137 |
ctl | -1.079 |
advertising | -1.071 |
Token | 's |
Token ID | 338 |
Feature activation | +8.44e-01 |
Pos logit contributions | |
olson | +5.907 |
dit | +4.844 |
� | +4.638 |
ctl | +4.614 |
advertising | +4.488 |
Neg logit contributions | |
PLIED | -6.652 |
whence | -6.533 |
forgiveness | -5.821 |
Applied | -5.432 |
repre | -5.419 |
Token | making |
Token ID | 1642 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
olson | +8.042 |
dit | +6.762 |
� | +6.433 |
ctl | +6.388 |
advertising | +6.352 |
Neg logit contributions | |
PLIED | -7.587 |
whence | -7.419 |
forgiveness | -6.285 |
Loans | -5.970 |
aught | -5.933 |
Token | a |
Token ID | 257 |
Feature activation | +9.74e-01 |
Pos logit contributions | |
olson | +13.264 |
dit | +11.292 |
� | +10.769 |
ctl | +10.622 |
customs | +10.515 |
Neg logit contributions | |
PLIED | -11.597 |
whence | -11.043 |
repre | -9.628 |
srfAttach | -9.130 |
hurled | -9.119 |
Token | very |
Token ID | 845 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
olson | +8.604 |
dit | +6.702 |
� | +6.669 |
undo | +6.426 |
ctl | +6.361 |
Neg logit contributions | |
PLIED | -9.436 |
whence | -9.105 |
forgiveness | -7.874 |
repre | -7.661 |
aught | -7.653 |
Token | powerful |
Token ID | 3665 |
Feature activation | +3.96e-01 |
Pos logit contributions | |
olson | +11.663 |
� | +9.084 |
dit | +8.894 |
undo | +8.717 |
ctl | +8.702 |
Neg logit contributions | |
PLIED | -13.914 |
whence | -13.063 |
forgiveness | -11.511 |
Loans | -11.401 |
repre | -11.325 |
Token | statement |
Token ID | 2643 |
Feature activation | +5.04e-01 |
Pos logit contributions | |
olson | +4.075 |
dit | +3.374 |
� | +3.353 |
advertising | +3.218 |
undo | +3.203 |
Neg logit contributions | |
PLIED | -3.563 |
whence | -3.562 |
forgiveness | -3.087 |
repre | -2.905 |
hurled | -2.885 |
Token | about |
Token ID | 546 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
olson | +4.670 |
dit | +3.820 |
� | +3.692 |
ctl | +3.543 |
advertising | +3.503 |
Neg logit contributions | |
PLIED | -5.021 |
whence | -4.915 |
forgiveness | -4.398 |
repre | -4.176 |
accus | -4.144 |
Token | the |
Token ID | 262 |
Feature activation | +2.61e-01 |
Pos logit contributions | |
whence | +2.562 |
PLIED | +2.480 |
forgiveness | +2.246 |
where | +2.083 |
accus | +2.070 |
Neg logit contributions | |
olson | -3.641 |
dit | -3.137 |
� | -3.100 |
ctl | -2.937 |
advertising | -2.931 |
Token | importance |
Token ID | 6817 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
olson | +2.537 |
dit | +2.102 |
� | +2.005 |
ctl | +1.952 |
advertising | +1.937 |
Neg logit contributions | |
PLIED | -2.554 |
whence | -2.548 |
forgiveness | -2.237 |
accus | -2.115 |
hurled | -2.114 |
Token | London |
Token ID | 3576 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
whence | +0.425 |
PLIED | +0.420 |
forgiveness | +0.375 |
accus | +0.352 |
hurled | +0.346 |
Neg logit contributions | |
olson | -0.525 |
dit | -0.445 |
� | -0.436 |
ctl | -0.415 |
advertising | -0.413 |
Token | 's |
Token ID | 338 |
Feature activation | -9.04e-02 |
Pos logit contributions | |
whence | +1.470 |
PLIED | +1.450 |
forgiveness | +1.314 |
accus | +1.230 |
where | +1.205 |
Neg logit contributions | |
olson | -1.622 |
dit | -1.362 |
� | -1.334 |
ctl | -1.269 |
advertising | -1.265 |
Token | Kens |
Token ID | 29018 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
whence | +0.811 |
PLIED | +0.801 |
forgiveness | +0.718 |
accus | +0.672 |
hurled | +0.658 |
Neg logit contributions | |
olson | -0.973 |
dit | -0.824 |
� | -0.807 |
ctl | -0.768 |
advertising | -0.767 |
Token | ington |
Token ID | 9557 |
Feature activation | +6.55e-02 |
Pos logit contributions | |
olson | +2.909 |
dit | +1.885 |
� | +1.735 |
advertising | +1.599 |
ctl | +1.558 |
Neg logit contributions | |
whence | -7.663 |
PLIED | -7.606 |
forgiveness | -7.137 |
accus | -6.865 |
repre | -6.802 |
Token | Gardens |
Token ID | 29330 |
Feature activation | -4.51e-01 |
Pos logit contributions | |
olson | +0.676 |
dit | +0.564 |
� | +0.546 |
advertising | +0.527 |
ctl | +0.521 |
Neg logit contributions | |
whence | -0.610 |
PLIED | -0.606 |
forgiveness | -0.547 |
accus | -0.510 |
repre | -0.502 |
Token | has |
Token ID | 468 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
whence | +3.765 |
PLIED | +3.636 |
forgiveness | +3.280 |
where | +3.079 |
accus | +3.042 |
Neg logit contributions | |
olson | -5.132 |
dit | -4.403 |
� | -4.361 |
ctl | -4.119 |
advertising | -4.101 |
Token | been |
Token ID | 587 |
Feature activation | +7.32e-01 |
Pos logit contributions | |
olson | +13.795 |
dit | +12.189 |
Guinness | +11.112 |
ctl | +11.099 |
customs | +11.066 |
Neg logit contributions | |
PLIED | -10.689 |
whence | -10.230 |
repre | -8.987 |
forgiveness | -8.735 |
srfAttach | -8.658 |
Token | at |
Token ID | 379 |
Feature activation | +8.29e-01 |
Pos logit contributions | |
olson | +7.968 |
dit | +6.911 |
� | +6.528 |
ctl | +6.347 |
nex | +6.263 |
Neg logit contributions | |
PLIED | -5.711 |
whence | -5.690 |
forgiveness | -4.909 |
repre | -4.609 |
accus | -4.523 |
Token | the |
Token ID | 262 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
olson | +8.093 |
dit | +6.784 |
� | +6.322 |
nex | +6.085 |
ctl | +6.075 |
Neg logit contributions | |
whence | -7.328 |
PLIED | -7.319 |
forgiveness | -6.409 |
accus | -6.170 |
hurled | -6.065 |
Token | nexus |
Token ID | 45770 |
Feature activation | -6.21e-02 |
Pos logit contributions | |
olson | +4.523 |
dit | +3.904 |
� | +3.805 |
ctl | +3.721 |
advertising | +3.666 |
Neg logit contributions | |
PLIED | -2.332 |
whence | -2.317 |
forgiveness | -1.923 |
accus | -1.762 |
hurled | -1.747 |
Token | of |
Token ID | 286 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
whence | +0.572 |
PLIED | +0.570 |
forgiveness | +0.510 |
accus | +0.479 |
hurled | +0.468 |
Neg logit contributions | |
olson | -0.647 |
dit | -0.546 |
� | -0.535 |
ctl | -0.510 |
advertising | -0.505 |
Token | a |
Token ID | 257 |
Feature activation | +4.96e-01 |
Pos logit contributions | |
olson | +3.279 |
dit | +2.768 |
� | +2.716 |
advertising | +2.568 |
ctl | +2.566 |
Neg logit contributions | |
PLIED | -3.113 |
whence | -3.097 |
forgiveness | -2.743 |
accus | -2.590 |
hurled | -2.566 |
Token | mall |
Token ID | 17374 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
olson | +5.117 |
dit | +4.315 |
� | +4.191 |
ctl | +4.053 |
advertising | +4.032 |
Neg logit contributions | |
PLIED | -4.464 |
whence | -4.370 |
forgiveness | -3.829 |
aught | -3.584 |
accus | -3.583 |
Token | . |
Token ID | 13 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
whence | +3.151 |
PLIED | +3.066 |
forgiveness | +2.777 |
where | +2.629 |
accus | +2.583 |
Neg logit contributions | |
olson | -3.910 |
dit | -3.353 |
� | -3.284 |
ctl | -3.121 |
advertising | -3.083 |
Token | They |
Token ID | 1119 |
Feature activation | +3.57e-01 |
Pos logit contributions | |
olson | +1.132 |
dit | +0.957 |
� | +0.943 |
advertising | +0.905 |
ctl | +0.893 |
Neg logit contributions | |
whence | -0.988 |
PLIED | -0.981 |
forgiveness | -0.889 |
accus | -0.832 |
hurled | -0.818 |
Token | visit |
Token ID | 3187 |
Feature activation | +6.01e-01 |
Pos logit contributions | |
olson | +3.756 |
dit | +3.171 |
� | +3.118 |
ctl | +3.031 |
advertising | +2.949 |
Neg logit contributions | |
PLIED | -3.236 |
whence | -3.172 |
forgiveness | -2.837 |
repre | -2.600 |
accus | -2.593 |
Token | an |
Token ID | 281 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
olson | +5.932 |
dit | +5.020 |
� | +4.857 |
ctl | +4.782 |
advertising | +4.734 |
Neg logit contributions | |
PLIED | -5.365 |
whence | -5.309 |
forgiveness | -4.692 |
repre | -4.467 |
accus | -4.442 |
Token | arcade |
Token ID | 27210 |
Feature activation | -9.54e-02 |
Pos logit contributions | |
olson | +13.244 |
dit | +11.293 |
advertising | +11.287 |
nex | +10.812 |
undo | +10.546 |
Neg logit contributions | |
PLIED | -11.618 |
whence | -11.491 |
forgiveness | -9.939 |
repre | -9.702 |
hurled | -9.480 |
Token | , |
Token ID | 11 |
Feature activation | -1.77e-01 |
Pos logit contributions | |
whence | +0.810 |
PLIED | +0.803 |
forgiveness | +0.717 |
accus | +0.666 |
hurled | +0.649 |
Neg logit contributions | |
olson | -1.069 |
dit | -0.911 |
� | -0.896 |
ctl | -0.857 |
advertising | -0.853 |
Token | a |
Token ID | 257 |
Feature activation | +6.21e-01 |
Pos logit contributions | |
whence | +1.368 |
PLIED | +1.350 |
forgiveness | +1.193 |
accus | +1.098 |
hurled | +1.069 |
Neg logit contributions | |
olson | -2.118 |
dit | -1.829 |
� | -1.799 |
ctl | -1.723 |
advertising | -1.718 |
Token | Pay |
Token ID | 7119 |
Feature activation | +4.00e-01 |
Pos logit contributions | |
olson | +6.458 |
dit | +5.493 |
� | +5.333 |
advertising | +5.216 |
ctl | +5.192 |
Neg logit contributions | |
PLIED | -5.358 |
whence | -5.189 |
forgiveness | -4.614 |
accus | -4.288 |
aught | -4.218 |
Token | less |
Token ID | 1203 |
Feature activation | +6.96e-01 |
Pos logit contributions | |
olson | +3.749 |
dit | +3.141 |
� | +2.978 |
advertising | +2.866 |
ctl | +2.798 |
Neg logit contributions | |
PLIED | -4.126 |
whence | -4.080 |
forgiveness | -3.690 |
accus | -3.459 |
repre | -3.439 |
Token | Act |
Token ID | 2191 |
Feature activation | +8.75e-01 |
Pos logit contributions | |
olson | +4.811 |
dit | +4.105 |
� | +3.903 |
ctl | +3.799 |
advertising | +3.701 |
Neg logit contributions | |
whence | -4.782 |
PLIED | -4.760 |
forgiveness | -4.287 |
accus | -4.034 |
hurled | -3.996 |
Token | , |
Token ID | 11 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
olson | +7.608 |
dit | +6.393 |
� | +6.127 |
ctl | +6.089 |
undo | +5.971 |
Neg logit contributions | |
PLIED | -8.413 |
whence | -8.170 |
forgiveness | -7.148 |
repre | -7.073 |
aught | -6.905 |
Token | required |
Token ID | 2672 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
olson | +5.685 |
dit | +4.844 |
� | +4.690 |
ctl | +4.608 |
advertising | +4.490 |
Neg logit contributions | |
PLIED | -4.957 |
whence | -4.723 |
forgiveness | -4.187 |
repre | -4.003 |
accus | -3.954 |
Token | Americans |
Token ID | 3399 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
olson | +10.258 |
dit | +8.644 |
� | +8.516 |
ctl | +8.293 |
customs | +7.987 |
Neg logit contributions | |
PLIED | -10.004 |
whence | -9.780 |
repre | -8.538 |
aught | -8.389 |
forgiveness | -8.138 |
Token | who |
Token ID | 508 |
Feature activation | +7.33e-01 |
Pos logit contributions | |
olson | +3.197 |
dit | +2.686 |
� | +2.651 |
ctl | +2.467 |
undo | +2.415 |
Neg logit contributions | |
PLIED | -3.391 |
whence | -3.319 |
forgiveness | -2.974 |
accus | -2.812 |
repre | -2.808 |
Token | qualified |
Token ID | 10617 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
olson | +7.223 |
dit | +6.173 |
ctl | +5.914 |
� | +5.909 |
nex | +5.764 |
Neg logit contributions | |
PLIED | -6.439 |
whence | -6.347 |
forgiveness | -5.765 |
repre | -5.394 |
srfAttach | -5.342 |
Token | for |
Token ID | 329 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
olson | +1.940 |
dit | +1.632 |
� | +1.585 |
ctl | +1.510 |
advertising | +1.483 |
Neg logit contributions | |
PLIED | -2.239 |
whence | -2.217 |
forgiveness | -1.988 |
accus | -1.880 |
aught | -1.876 |
Token | the |
Token ID | 262 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
olson | +1.347 |
dit | +1.125 |
� | +1.109 |
ctl | +1.053 |
advertising | +1.038 |
Neg logit contributions | |
whence | -1.352 |
PLIED | -1.343 |
forgiveness | -1.192 |
accus | -1.135 |
repre | -1.127 |
Token | individual |
Token ID | 1981 |
Feature activation | -8.28e-02 |
Pos logit contributions | |
olson | +4.136 |
dit | +3.475 |
� | +3.375 |
ctl | +3.272 |
advertising | +3.230 |
Neg logit contributions | |
PLIED | -3.819 |
whence | -3.818 |
forgiveness | -3.239 |
repre | -3.145 |
hurled | -3.134 |
Token | market |
Token ID | 1910 |
Feature activation | +3.95e-01 |
Pos logit contributions | |
whence | +0.784 |
PLIED | +0.774 |
forgiveness | +0.697 |
accus | +0.655 |
hurled | +0.643 |
Neg logit contributions | |
olson | -0.849 |
dit | -0.714 |
� | -0.699 |
ctl | -0.665 |
advertising | -0.662 |
Token | , |
Token ID | 11 |
Feature activation | +8.26e-01 |
Pos logit contributions | |
olson | +3.823 |
dit | +3.237 |
� | +3.163 |
ctl | +3.027 |
advertising | +2.961 |
Neg logit contributions | |
PLIED | -3.774 |
whence | -3.714 |
forgiveness | -3.235 |
accus | -3.150 |
repre | -3.103 |
Token | absor |
Token ID | 46303 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
olson | +2.499 |
dit | +2.061 |
� | +1.952 |
advertising | +1.877 |
ctl | +1.838 |
Neg logit contributions | |
whence | -3.510 |
PLIED | -3.489 |
forgiveness | -3.205 |
accus | -3.071 |
hurled | -3.036 |
Token | ptive |
Token ID | 21665 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
olson | +4.077 |
dit | +3.441 |
� | +3.343 |
ctl | +3.221 |
advertising | +3.197 |
Neg logit contributions | |
whence | -5.267 |
PLIED | -5.136 |
forgiveness | -4.786 |
accus | -4.640 |
Applied | -4.486 |
Token | state |
Token ID | 1181 |
Feature activation | +4.91e-01 |
Pos logit contributions | |
olson | +8.194 |
dit | +7.104 |
� | +7.066 |
ctl | +6.694 |
undo | +6.460 |
Neg logit contributions | |
PLIED | -10.072 |
whence | -9.658 |
forgiveness | -8.565 |
hurled | -8.501 |
aught | -8.408 |
Token | , |
Token ID | 11 |
Feature activation | +6.78e-02 |
Pos logit contributions | |
olson | +5.429 |
dit | +4.784 |
� | +4.679 |
ctl | +4.520 |
undo | +4.415 |
Neg logit contributions | |
PLIED | -3.964 |
whence | -3.676 |
forgiveness | -3.366 |
accus | -3.128 |
repre | -3.123 |
Token | during |
Token ID | 1141 |
Feature activation | -5.03e-01 |
Pos logit contributions | |
olson | +0.934 |
dit | +0.827 |
� | +0.815 |
ctl | +0.787 |
advertising | +0.786 |
Neg logit contributions | |
PLIED | -0.391 |
whence | -0.384 |
forgiveness | -0.325 |
accus | -0.291 |
hurled | -0.282 |
Token | which |
Token ID | 543 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
whence | +3.432 |
PLIED | +3.233 |
forgiveness | +2.864 |
where | +2.642 |
accus | +2.564 |
Neg logit contributions | |
olson | -6.558 |
dit | -5.684 |
� | -5.632 |
ctl | -5.399 |
advertising | -5.399 |
Token | the |
Token ID | 262 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
olson | +2.124 |
dit | +1.803 |
� | +1.754 |
ctl | +1.692 |
advertising | +1.659 |
Neg logit contributions | |
PLIED | -1.873 |
whence | -1.829 |
forgiveness | -1.622 |
accus | -1.545 |
hurled | -1.527 |
Token | components |
Token ID | 6805 |
Feature activation | +4.11e-01 |
Pos logit contributions | |
olson | +2.178 |
dit | +1.852 |
� | +1.806 |
ctl | +1.711 |
advertising | +1.688 |
Neg logit contributions | |
PLIED | -2.186 |
whence | -2.153 |
forgiveness | -1.912 |
accus | -1.820 |
hurled | -1.803 |
Token | of |
Token ID | 286 |
Feature activation | +5.30e-01 |
Pos logit contributions | |
olson | +3.873 |
dit | +3.261 |
� | +3.234 |
ctl | +3.055 |
advertising | +2.994 |
Neg logit contributions | |
PLIED | -3.992 |
whence | -3.852 |
forgiveness | -3.508 |
accus | -3.373 |
repre | -3.271 |
Token | the |
Token ID | 262 |
Feature activation | +8.53e-01 |
Pos logit contributions | |
olson | +6.051 |
dit | +5.243 |
� | +5.177 |
ctl | +4.946 |
undo | +4.856 |
Neg logit contributions | |
PLIED | -4.080 |
whence | -3.909 |
forgiveness | -3.405 |
accus | -3.278 |
repre | -3.201 |
Token | last |
Token ID | 938 |
Feature activation | +4.76e-01 |
Pos logit contributions | |
olson | +7.395 |
dit | +6.270 |
� | +6.241 |
ctl | +5.748 |
undo | +5.664 |
Neg logit contributions | |
PLIED | -8.423 |
whence | -8.059 |
forgiveness | -7.231 |
accus | -6.914 |
repre | -6.896 |
Token | Unfortunately |
Token ID | 8989 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
olson | +0.519 |
dit | +0.443 |
� | +0.435 |
advertising | +0.418 |
ctl | +0.413 |
Neg logit contributions | |
whence | -0.414 |
PLIED | -0.411 |
forgiveness | -0.369 |
accus | -0.343 |
hurled | -0.337 |
Token | , |
Token ID | 11 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
olson | +2.881 |
dit | +2.418 |
� | +2.389 |
advertising | +2.302 |
ctl | +2.224 |
Neg logit contributions | |
PLIED | -3.160 |
whence | -3.075 |
forgiveness | -2.748 |
hurled | -2.601 |
accus | -2.588 |
Token | there |
Token ID | 612 |
Feature activation | +1.92e-01 |
Pos logit contributions | |
olson | +3.792 |
dit | +3.236 |
� | +3.169 |
advertising | +3.149 |
ctl | +3.012 |
Neg logit contributions | |
PLIED | -3.173 |
whence | -3.077 |
forgiveness | -2.720 |
repre | -2.532 |
accus | -2.511 |
Token | � |
Token ID | 447 |
Feature activation | -3.21e-01 |
Pos logit contributions | |
olson | +1.817 |
� | +1.504 |
dit | +1.502 |
advertising | +1.409 |
ctl | +1.407 |
Neg logit contributions | |
whence | -1.968 |
PLIED | -1.958 |
forgiveness | -1.763 |
accus | -1.652 |
hurled | -1.641 |
Token | � |
Token ID | 247 |
Feature activation | -2.66e-01 |
Pos logit contributions | |
whence | +2.913 |
PLIED | +2.819 |
forgiveness | +2.608 |
where | +2.443 |
accus | +2.437 |
Neg logit contributions | |
olson | -3.405 |
dit | -2.882 |
� | -2.769 |
advertising | -2.639 |
ctl | -2.625 |
Token | s |
Token ID | 82 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
whence | +2.521 |
PLIED | +2.479 |
forgiveness | +2.252 |
accus | +2.110 |
where | +2.082 |
Neg logit contributions | |
olson | -2.728 |
dit | -2.290 |
� | -2.247 |
ctl | -2.129 |
advertising | -2.122 |
Token | no |
Token ID | 645 |
Feature activation | -3.00e-01 |
Pos logit contributions | |
olson | +2.834 |
dit | +2.384 |
� | +2.364 |
advertising | +2.283 |
ctl | +2.248 |
Neg logit contributions | |
PLIED | -2.417 |
whence | -2.411 |
forgiveness | -2.114 |
hurled | -1.958 |
accus | -1.956 |
Token | mention |
Token ID | 3068 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
whence | +2.646 |
PLIED | +2.567 |
forgiveness | +2.364 |
accus | +2.209 |
where | +2.185 |
Neg logit contributions | |
olson | -3.277 |
dit | -2.779 |
� | -2.740 |
ctl | -2.593 |
advertising | -2.557 |
Token | of |
Token ID | 286 |
Feature activation | +3.06e-03 |
Pos logit contributions | |
olson | +1.085 |
dit | +0.920 |
� | +0.906 |
advertising | +0.860 |
ctl | +0.853 |
Neg logit contributions | |
PLIED | -0.993 |
whence | -0.986 |
forgiveness | -0.892 |
accus | -0.821 |
repre | -0.816 |
Token | which |
Token ID | 543 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
olson | +0.033 |
dit | +0.028 |
� | +0.027 |
advertising | +0.026 |
ctl | +0.026 |
Neg logit contributions | |
PLIED | -0.027 |
whence | -0.027 |
forgiveness | -0.024 |
accus | -0.022 |
hurled | -0.022 |
Token | actresses |
Token ID | 49798 |
Feature activation | -4.71e-02 |
Pos logit contributions | |
olson | +2.328 |
dit | +2.000 |
� | +1.911 |
advertising | +1.889 |
ctl | +1.852 |
Neg logit contributions | |
PLIED | -2.015 |
whence | -1.976 |
forgiveness | -1.749 |
repre | -1.610 |
aught | -1.600 |
Token | here |
Token ID | 994 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
whence | +1.953 |
PLIED | +1.908 |
forgiveness | +1.704 |
accus | +1.574 |
where | +1.565 |
Neg logit contributions | |
olson | -2.986 |
dit | -2.564 |
� | -2.523 |
advertising | -2.418 |
ctl | -2.412 |
Token | ( |
Token ID | 357 |
Feature activation | +3.83e-01 |
Pos logit contributions | |
olson | +0.162 |
dit | +0.136 |
� | +0.135 |
ctl | +0.127 |
advertising | +0.126 |
Neg logit contributions | |
whence | -0.152 |
PLIED | -0.151 |
forgiveness | -0.137 |
accus | -0.128 |
hurled | -0.125 |
Token | in |
Token ID | 259 |
Feature activation | -2.52e-01 |
Pos logit contributions | |
olson | +3.123 |
dit | +2.543 |
� | +2.458 |
advertising | +2.381 |
ctl | +2.273 |
Neg logit contributions | |
whence | -4.407 |
PLIED | -4.352 |
forgiveness | -4.037 |
accus | -3.820 |
hurled | -3.754 |
Token | 2014 |
Token ID | 1946 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
whence | +2.505 |
PLIED | +2.458 |
forgiveness | +2.247 |
accus | +2.116 |
where | +2.092 |
Neg logit contributions | |
olson | -2.480 |
dit | -2.065 |
� | -2.015 |
ctl | -1.915 |
advertising | -1.902 |
Token | ), |
Token ID | 828 |
Feature activation | +4.70e-02 |
Pos logit contributions | |
whence | +0.702 |
PLIED | +0.692 |
forgiveness | +0.603 |
accus | +0.546 |
hurled | +0.532 |
Neg logit contributions | |
olson | -1.291 |
dit | -1.125 |
� | -1.111 |
ctl | -1.065 |
advertising | -1.064 |
Token | we |
Token ID | 356 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
olson | +0.504 |
dit | +0.425 |
� | +0.423 |
ctl | +0.397 |
advertising | +0.396 |
Neg logit contributions | |
PLIED | -0.422 |
whence | -0.421 |
forgiveness | -0.375 |
accus | -0.349 |
hurled | -0.342 |
Token | said |
Token ID | 531 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
olson | +6.640 |
� | +5.664 |
dit | +5.594 |
ctl | +5.341 |
advertising | +5.246 |
Neg logit contributions | |
whence | -5.337 |
PLIED | -5.292 |
forgiveness | -4.754 |
repre | -4.228 |
accus | -4.217 |
Token | we |
Token ID | 356 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
whence | +2.139 |
PLIED | +2.093 |
forgiveness | +1.896 |
accus | +1.768 |
where | +1.746 |
Neg logit contributions | |
olson | -2.647 |
dit | -2.250 |
� | -2.204 |
ctl | -2.101 |
advertising | -2.096 |
Token | were |
Token ID | 547 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
olson | +3.519 |
dit | +2.956 |
� | +2.947 |
ctl | +2.769 |
advertising | +2.735 |
Neg logit contributions | |
whence | -3.116 |
PLIED | -3.057 |
forgiveness | -2.754 |
accus | -2.509 |
repre | -2.470 |
Token | going |
Token ID | 1016 |
Feature activation | +4.52e-01 |
Pos logit contributions | |
olson | +2.567 |
dit | +2.174 |
� | +2.153 |
advertising | +2.060 |
ctl | +2.043 |
Neg logit contributions | |
PLIED | -2.066 |
whence | -2.048 |
forgiveness | -1.807 |
accus | -1.665 |
repre | -1.643 |
Token | to |
Token ID | 284 |
Feature activation | +5.62e-01 |
Pos logit contributions | |
olson | +4.184 |
� | +3.517 |
dit | +3.435 |
ctl | +3.249 |
advertising | +3.190 |
Neg logit contributions | |
PLIED | -4.546 |
whence | -4.495 |
forgiveness | -4.011 |
hurled | -3.810 |
cropped | -3.768 |
Token | from |
Token ID | 422 |
Feature activation | -5.73e-01 |
Pos logit contributions | |
olson | +1.660 |
dit | +1.416 |
� | +1.378 |
ctl | +1.314 |
advertising | +1.287 |
Neg logit contributions | |
PLIED | -1.491 |
whence | -1.471 |
forgiveness | -1.316 |
accus | -1.228 |
repre | -1.222 |
Token | Earth |
Token ID | 3668 |
Feature activation | -5.18e-02 |
Pos logit contributions | |
whence | +4.661 |
PLIED | +4.358 |
forgiveness | +3.978 |
where | +3.792 |
accus | +3.696 |
Neg logit contributions | |
olson | -6.698 |
dit | -5.737 |
� | -5.630 |
advertising | -5.389 |
ctl | -5.370 |
Token | it |
Token ID | 340 |
Feature activation | -9.40e-02 |
Pos logit contributions | |
whence | +0.486 |
PLIED | +0.484 |
forgiveness | +0.437 |
accus | +0.408 |
repre | +0.399 |
Neg logit contributions | |
olson | -0.535 |
dit | -0.452 |
� | -0.442 |
ctl | -0.420 |
advertising | -0.417 |
Token | takes |
Token ID | 2753 |
Feature activation | -3.21e-01 |
Pos logit contributions | |
whence | +0.809 |
PLIED | +0.800 |
forgiveness | +0.714 |
accus | +0.663 |
where | +0.648 |
Neg logit contributions | |
olson | -1.049 |
dit | -0.894 |
� | -0.881 |
ctl | -0.839 |
advertising | -0.833 |
Token | : |
Token ID | 25 |
Feature activation | +4.38e-02 |
Pos logit contributions | |
whence | +2.805 |
PLIED | +2.716 |
forgiveness | +2.480 |
accus | +2.310 |
where | +2.310 |
Neg logit contributions | |
olson | -3.528 |
dit | -3.003 |
� | -2.937 |
ctl | -2.820 |
advertising | -2.816 |
Token | Years |
Token ID | 13212 |
Feature activation | +3.03e-01 |
Pos logit contributions | |
olson | +0.412 |
dit | +0.341 |
� | +0.338 |
ctl | +0.315 |
advertising | +0.311 |
Neg logit contributions | |
PLIED | -0.446 |
whence | -0.445 |
forgiveness | -0.404 |
accus | -0.381 |
hurled | -0.375 |
Token | Days |
Token ID | 12579 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
olson | +2.937 |
dit | +2.437 |
� | +2.401 |
ctl | +2.260 |
advertising | +2.244 |
Neg logit contributions | |
PLIED | -2.995 |
whence | -2.934 |
forgiveness | -2.650 |
accus | -2.490 |
repre | -2.489 |
Token |
|
Token ID | 198 |
Feature activation | +3.62e-01 |
Pos logit contributions | |
olson | +3.477 |
dit | +2.920 |
� | +2.890 |
ctl | +2.708 |
advertising | +2.683 |
Neg logit contributions | |
PLIED | -3.243 |
whence | -3.193 |
forgiveness | -2.883 |
repre | -2.671 |
accus | -2.656 |
Token |
|
Token ID | 198 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
olson | +3.383 |
dit | +2.793 |
� | +2.730 |
ctl | +2.589 |
advertising | +2.576 |
Neg logit contributions | |
whence | -3.739 |
PLIED | -3.707 |
forgiveness | -3.383 |
accus | -3.199 |
hurled | -3.157 |
Token | to |
Token ID | 1462 |
Feature activation | -8.99e-02 |
Pos logit contributions | |
olson | +3.492 |
dit | +2.947 |
� | +2.913 |
Quantity | +2.743 |
advertising | +2.733 |
Neg logit contributions | |
whence | -3.376 |
PLIED | -3.376 |
forgiveness | -3.061 |
accus | -2.901 |
flared | -2.855 |
Token | reach |
Token ID | 3151 |
Feature activation | -8.62e-01 |
Pos logit contributions | |
whence | +0.771 |
PLIED | +0.766 |
forgiveness | +0.682 |
accus | +0.634 |
hurled | +0.622 |
Neg logit contributions | |
olson | -1.001 |
dit | -0.854 |
� | -0.839 |
ctl | -0.798 |
advertising | -0.793 |
Token | agen |
Token ID | 11286 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
whence | +0.406 |
PLIED | +0.401 |
forgiveness | +0.371 |
accus | +0.349 |
where | +0.342 |
Neg logit contributions | |
olson | -0.315 |
dit | -0.255 |
� | -0.248 |
ctl | -0.234 |
advertising | -0.232 |
Token | related |
Token ID | 3519 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
whence | +1.695 |
PLIED | +1.673 |
forgiveness | +1.536 |
accus | +1.452 |
where | +1.430 |
Neg logit contributions | |
olson | -1.417 |
dit | -1.157 |
� | -1.133 |
ctl | -1.062 |
advertising | -1.059 |
Token | , |
Token ID | 11 |
Feature activation | +5.33e-01 |
Pos logit contributions | |
olson | +3.420 |
dit | +2.905 |
� | +2.831 |
ctl | +2.705 |
advertising | +2.683 |
Neg logit contributions | |
PLIED | -3.316 |
whence | -3.255 |
forgiveness | -2.972 |
accus | -2.739 |
repre | -2.713 |
Token | or |
Token ID | 393 |
Feature activation | -3.33e-01 |
Pos logit contributions | |
olson | +5.524 |
dit | +4.733 |
� | +4.707 |
advertising | +4.459 |
ctl | +4.397 |
Neg logit contributions | |
PLIED | -4.558 |
whence | -4.467 |
forgiveness | -4.057 |
repre | -3.742 |
aught | -3.729 |
Token | it |
Token ID | 340 |
Feature activation | -4.19e-01 |
Pos logit contributions | |
whence | +3.084 |
PLIED | +3.018 |
forgiveness | +2.750 |
accus | +2.582 |
where | +2.561 |
Neg logit contributions | |
olson | -3.477 |
dit | -2.923 |
� | -2.873 |
advertising | -2.728 |
ctl | -2.725 |
Token | could |
Token ID | 714 |
Feature activation | -7.63e-01 |
Pos logit contributions | |
whence | +3.413 |
PLIED | +3.326 |
forgiveness | +2.989 |
accus | +2.785 |
where | +2.765 |
Neg logit contributions | |
olson | -4.844 |
dit | -4.150 |
� | -4.085 |
advertising | -3.888 |
ctl | -3.884 |
Token | in |
Token ID | 287 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
whence | +5.821 |
PLIED | +5.597 |
forgiveness | +5.057 |
where | +4.763 |
accus | +4.691 |
Neg logit contributions | |
olson | -8.921 |
dit | -7.667 |
� | -7.533 |
advertising | -7.324 |
ctl | -7.178 |
Token | some |
Token ID | 617 |
Feature activation | +7.31e-01 |
Pos logit contributions | |
olson | +2.566 |
dit | +2.156 |
� | +2.093 |
ctl | +1.995 |
advertising | +1.942 |
Neg logit contributions | |
whence | -2.891 |
PLIED | -2.875 |
forgiveness | -2.586 |
accus | -2.442 |
hurled | -2.428 |
Token | way |
Token ID | 835 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
olson | +8.384 |
dit | +7.315 |
� | +7.008 |
ctl | +6.873 |
undo | +6.649 |
Neg logit contributions | |
PLIED | -5.421 |
whence | -5.253 |
forgiveness | -4.594 |
aught | -4.347 |
repre | -4.205 |
Token | mean |
Token ID | 1612 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
whence | +2.788 |
PLIED | +2.724 |
forgiveness | +2.444 |
accus | +2.265 |
where | +2.239 |
Neg logit contributions | |
olson | -3.899 |
dit | -3.338 |
� | -3.288 |
advertising | -3.137 |
ctl | -3.134 |
Token | that |
Token ID | 326 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
whence | +2.703 |
PLIED | +2.647 |
forgiveness | +2.405 |
accus | +2.245 |
where | +2.224 |
Neg logit contributions | |
olson | -3.184 |
dit | -2.684 |
� | -2.642 |
ctl | -2.508 |
advertising | -2.503 |
Token | above |
Token ID | 2029 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
olson | +3.651 |
dit | +3.186 |
� | +3.156 |
advertising | +3.025 |
ctl | +2.989 |
Neg logit contributions | |
PLIED | -2.219 |
whence | -2.197 |
forgiveness | -1.936 |
accus | -1.754 |
hurled | -1.753 |
Token | and |
Token ID | 290 |
Feature activation | -4.99e-01 |
Pos logit contributions | |
olson | +0.292 |
dit | +0.252 |
� | +0.249 |
ctl | +0.237 |
advertising | +0.237 |
Neg logit contributions | |
whence | -0.193 |
PLIED | -0.192 |
forgiveness | -0.169 |
accus | -0.156 |
hurled | -0.152 |
Token | you |
Token ID | 345 |
Feature activation | +2.12e-01 |
Pos logit contributions | |
whence | +3.308 |
PLIED | +3.196 |
forgiveness | +2.831 |
where | +2.614 |
accus | +2.547 |
Neg logit contributions | |
olson | -6.430 |
dit | -5.591 |
� | -5.491 |
ctl | -5.310 |
advertising | -5.310 |
Token | would |
Token ID | 561 |
Feature activation | +9.04e-02 |
Pos logit contributions | |
olson | +2.186 |
dit | +1.877 |
� | +1.842 |
ctl | +1.743 |
advertising | +1.709 |
Neg logit contributions | |
whence | -1.971 |
PLIED | -1.948 |
forgiveness | -1.751 |
accus | -1.634 |
hurled | -1.600 |
Token | like |
Token ID | 588 |
Feature activation | +2.14e-01 |
Pos logit contributions | |
olson | +0.779 |
dit | +0.637 |
� | +0.620 |
ctl | +0.579 |
advertising | +0.577 |
Neg logit contributions | |
whence | -1.004 |
PLIED | -0.995 |
forgiveness | -0.908 |
accus | -0.864 |
hurled | -0.853 |
Token | a |
Token ID | 257 |
Feature activation | -6.79e-02 |
Pos logit contributions | |
olson | +2.164 |
dit | +1.821 |
� | +1.779 |
advertising | +1.711 |
ctl | +1.671 |
Neg logit contributions | |
whence | -2.036 |
PLIED | -2.026 |
forgiveness | -1.763 |
hurled | -1.688 |
accus | -1.679 |
Token | hi |
Token ID | 23105 |
Feature activation | -7.66e-01 |
Pos logit contributions | |
whence | +0.606 |
PLIED | +0.600 |
forgiveness | +0.534 |
accus | +0.500 |
hurled | +0.491 |
Neg logit contributions | |
olson | -0.737 |
dit | -0.623 |
� | -0.612 |
ctl | -0.583 |
advertising | -0.582 |
Token | - |
Token ID | 12 |
Feature activation | -1.44e-01 |
Pos logit contributions | |
whence | +6.622 |
PLIED | +6.409 |
forgiveness | +5.941 |
where | +5.585 |
cropped | +5.517 |
Neg logit contributions | |
olson | -8.180 |
dit | -6.895 |
� | -6.735 |
advertising | -6.474 |
ctl | -6.354 |
Token | res |
Token ID | 411 |
Feature activation | -2.55e-01 |
Pos logit contributions | |
whence | +1.453 |
PLIED | +1.431 |
forgiveness | +1.306 |
accus | +1.231 |
where | +1.210 |
Neg logit contributions | |
olson | -1.399 |
dit | -1.164 |
� | -1.135 |
ctl | -1.075 |
advertising | -1.072 |
Token | version |
Token ID | 2196 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
whence | +2.292 |
PLIED | +2.249 |
forgiveness | +2.035 |
accus | +1.900 |
where | +1.876 |
Neg logit contributions | |
olson | -2.743 |
dit | -2.322 |
� | -2.282 |
ctl | -2.172 |
advertising | -2.163 |
Token | of |
Token ID | 286 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
olson | +3.393 |
dit | +2.892 |
� | +2.822 |
ctl | +2.669 |
undo | +2.602 |
Neg logit contributions | |
PLIED | -3.442 |
whence | -3.395 |
forgiveness | -3.046 |
accus | -2.854 |
hurled | -2.821 |
Token | ada |
Token ID | 4763 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
whence | +2.268 |
PLIED | +2.239 |
forgiveness | +2.068 |
accus | +1.962 |
where | +1.940 |
Neg logit contributions | |
olson | -1.647 |
dit | -1.320 |
� | -1.286 |
ctl | -1.201 |
advertising | -1.195 |
Token | over |
Token ID | 625 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
olson | +1.610 |
dit | +1.368 |
� | +1.361 |
ctl | +1.285 |
advertising | +1.265 |
Neg logit contributions | |
whence | -1.417 |
PLIED | -1.413 |
forgiveness | -1.257 |
accus | -1.162 |
repre | -1.149 |
Token | incorrect |
Token ID | 11491 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
whence | +10.292 |
PLIED | +9.530 |
forgiveness | +9.377 |
accus | +8.925 |
where | +8.916 |
Neg logit contributions | |
olson | -11.741 |
dit | -9.638 |
� | -9.553 |
ctl | -9.096 |
advertising | -9.037 |
Token | handling |
Token ID | 9041 |
Feature activation | -2.44e-01 |
Pos logit contributions | |
whence | +2.885 |
PLIED | +2.803 |
forgiveness | +2.586 |
accus | +2.425 |
where | +2.388 |
Neg logit contributions | |
olson | -3.319 |
dit | -2.792 |
� | -2.734 |
ctl | -2.594 |
advertising | -2.589 |
Token | of |
Token ID | 286 |
Feature activation | -4.82e-01 |
Pos logit contributions | |
whence | +2.195 |
PLIED | +2.148 |
forgiveness | +1.950 |
accus | +1.823 |
where | +1.798 |
Neg logit contributions | |
olson | -2.632 |
dit | -2.224 |
� | -2.183 |
ctl | -2.078 |
advertising | -2.073 |
Token | Mam |
Token ID | 29926 |
Feature activation | -3.29e-01 |
Pos logit contributions | |
whence | +4.232 |
PLIED | +4.065 |
forgiveness | +3.786 |
accus | +3.565 |
where | +3.522 |
Neg logit contributions | |
olson | -5.273 |
dit | -4.432 |
� | -4.350 |
advertising | -4.178 |
ctl | -4.142 |
Token | ad |
Token ID | 324 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
whence | +2.781 |
PLIED | +2.666 |
forgiveness | +2.432 |
accus | +2.274 |
where | +2.270 |
Neg logit contributions | |
olson | -3.685 |
dit | -3.162 |
� | -3.093 |
advertising | -2.958 |
ctl | -2.949 |
Token | ou |
Token ID | 280 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
olson | +2.059 |
dit | +1.601 |
� | +1.579 |
ctl | +1.430 |
advertising | +1.411 |
Neg logit contributions | |
PLIED | -3.113 |
whence | -3.067 |
forgiveness | -2.790 |
accus | -2.669 |
cropped | -2.651 |
Token | Sak |
Token ID | 13231 |
Feature activation | -9.07e-02 |
Pos logit contributions | |
olson | +7.522 |
dit | +6.988 |
� | +6.741 |
ete | +6.521 |
undo | +6.228 |
Neg logit contributions | |
whence | -10.770 |
PLIED | -10.531 |
forgiveness | -9.510 |
repre | -9.297 |
cropped | -8.981 |
Token | ho |
Token ID | 8873 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
whence | +0.823 |
PLIED | +0.804 |
forgiveness | +0.738 |
where | +0.686 |
accus | +0.684 |
Neg logit contributions | |
olson | -0.958 |
dit | -0.810 |
� | -0.800 |
ctl | -0.755 |
advertising | -0.752 |
Token | drugs |
Token ID | 5010 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
olson | +2.509 |
� | +2.128 |
dit | +2.122 |
ctl | +2.006 |
advertising | +1.987 |
Neg logit contributions | |
PLIED | -2.223 |
whence | -2.211 |
forgiveness | -1.946 |
accus | -1.787 |
hurled | -1.783 |
Token | Dallas |
Token ID | 8533 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
whence | +5.588 |
PLIED | +5.196 |
forgiveness | +4.906 |
where | +4.676 |
accus | +4.469 |
Neg logit contributions | |
olson | -7.481 |
dit | -6.432 |
� | -6.368 |
ctl | -5.996 |
advertising | -5.988 |
Token | ' |
Token ID | 6 |
Feature activation | -3.90e-01 |
Pos logit contributions | |
olson | +1.546 |
dit | +1.265 |
� | +1.244 |
advertising | +1.200 |
ctl | +1.181 |
Neg logit contributions | |
PLIED | -1.609 |
whence | -1.600 |
forgiveness | -1.429 |
accus | -1.363 |
hurled | -1.331 |
Token | finances |
Token ID | 20903 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
whence | +3.644 |
PLIED | +3.519 |
forgiveness | +3.273 |
accus | +3.049 |
where | +3.040 |
Neg logit contributions | |
olson | -4.060 |
dit | -3.434 |
� | -3.384 |
ctl | -3.192 |
advertising | -3.170 |
Token | from |
Token ID | 422 |
Feature activation | -5.79e-01 |
Pos logit contributions | |
olson | +1.284 |
dit | +1.092 |
� | +1.053 |
ctl | +1.021 |
advertising | +1.019 |
Neg logit contributions | |
PLIED | -1.103 |
whence | -1.085 |
forgiveness | -0.964 |
accus | -0.912 |
repre | -0.897 |
Token | free |
Token ID | 1479 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
whence | +4.989 |
PLIED | +4.614 |
forgiveness | +4.328 |
where | +4.114 |
accus | +3.980 |
Neg logit contributions | |
olson | -6.535 |
dit | -5.591 |
� | -5.496 |
ctl | -5.216 |
advertising | -5.158 |
Token | agents |
Token ID | 6554 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
whence | +9.247 |
PLIED | +8.587 |
forgiveness | +8.405 |
where | +7.768 |
accus | +7.444 |
Neg logit contributions | |
olson | -15.430 |
dit | -13.318 |
� | -12.590 |
undo | -12.378 |
ctl | -12.232 |
Token | hitting |
Token ID | 9008 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
whence | +0.984 |
PLIED | +0.977 |
forgiveness | +0.874 |
accus | +0.820 |
hurled | +0.800 |
Neg logit contributions | |
olson | -1.148 |
dit | -0.970 |
� | -0.953 |
ctl | -0.908 |
advertising | -0.906 |
Token | the |
Token ID | 262 |
Feature activation | -8.26e-02 |
Pos logit contributions | |
olson | +2.702 |
dit | +2.306 |
� | +2.296 |
ctl | +2.172 |
advertising | +2.156 |
Neg logit contributions | |
PLIED | -2.388 |
whence | -2.337 |
forgiveness | -2.053 |
accus | -1.972 |
aught | -1.954 |
Token | market |
Token ID | 1910 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
whence | +0.759 |
PLIED | +0.752 |
forgiveness | +0.672 |
accus | +0.632 |
hurled | +0.617 |
Neg logit contributions | |
olson | -0.870 |
dit | -0.731 |
� | -0.720 |
ctl | -0.685 |
advertising | -0.683 |
Token | , |
Token ID | 11 |
Feature activation | -4.17e-01 |
Pos logit contributions | |
whence | +3.342 |
PLIED | +3.220 |
forgiveness | +2.941 |
where | +2.749 |
accus | +2.712 |
Neg logit contributions | |
olson | -4.376 |
dit | -3.714 |
� | -3.669 |
ctl | -3.476 |
advertising | -3.460 |
Token | and |
Token ID | 290 |
Feature activation | -8.11e-02 |
Pos logit contributions | |
whence | +3.515 |
PLIED | +3.380 |
forgiveness | +3.085 |
where | +2.868 |
accus | +2.846 |
Neg logit contributions | |
olson | -4.742 |
dit | -4.060 |
� | -3.975 |
ctl | -3.796 |
advertising | -3.764 |
Token | agreement |
Token ID | 4381 |
Feature activation | -3.26e-01 |
Pos logit contributions | |
olson | +3.654 |
dit | +3.081 |
� | +3.021 |
advertising | +2.944 |
ctl | +2.894 |
Neg logit contributions | |
whence | -3.240 |
PLIED | -3.209 |
forgiveness | -2.800 |
hurled | -2.699 |
repre | -2.660 |
Token | to |
Token ID | 284 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
whence | +2.991 |
PLIED | +2.915 |
forgiveness | +2.664 |
where | +2.484 |
accus | +2.483 |
Neg logit contributions | |
olson | -3.453 |
dit | -2.915 |
� | -2.858 |
ctl | -2.707 |
advertising | -2.703 |
Token | become |
Token ID | 1716 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
olson | +2.224 |
dit | +1.906 |
� | +1.853 |
ctl | +1.796 |
advertising | +1.764 |
Neg logit contributions | |
PLIED | -1.620 |
whence | -1.594 |
forgiveness | -1.398 |
accus | -1.304 |
repre | -1.293 |
Token | partners |
Token ID | 4887 |
Feature activation | -6.05e-01 |
Pos logit contributions | |
whence | +1.722 |
PLIED | +1.693 |
forgiveness | +1.525 |
accus | +1.422 |
where | +1.396 |
Neg logit contributions | |
olson | -2.104 |
dit | -1.786 |
� | -1.754 |
ctl | -1.670 |
advertising | -1.664 |
Token | on |
Token ID | 319 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
whence | +5.354 |
PLIED | +5.064 |
forgiveness | +4.705 |
where | +4.527 |
accus | +4.383 |
Neg logit contributions | |
olson | -6.562 |
dit | -5.539 |
� | -5.481 |
ctl | -5.169 |
advertising | -5.169 |
Token | the |
Token ID | 262 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
olson | +1.198 |
dit | +1.014 |
� | +0.985 |
ctl | +0.943 |
advertising | +0.932 |
Neg logit contributions | |
PLIED | -1.091 |
whence | -1.090 |
forgiveness | -0.966 |
accus | -0.915 |
hurled | -0.914 |
Token | project |
Token ID | 1628 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
olson | +0.200 |
dit | +0.173 |
� | +0.168 |
ctl | +0.162 |
advertising | +0.161 |
Neg logit contributions | |
whence | -0.145 |
PLIED | -0.145 |
forgiveness | -0.127 |
accus | -0.118 |
hurled | -0.117 |
Token | , |
Token ID | 11 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
whence | +2.466 |
PLIED | +2.417 |
forgiveness | +2.188 |
accus | +2.040 |
where | +2.019 |
Neg logit contributions | |
olson | -2.950 |
dit | -2.495 |
� | -2.453 |
ctl | -2.331 |
advertising | -2.320 |
Token | replacing |
Token ID | 13586 |
Feature activation | +2.15e-01 |
Pos logit contributions | |
olson | +0.163 |
dit | +0.140 |
� | +0.137 |
advertising | +0.131 |
ctl | +0.131 |
Neg logit contributions | |
PLIED | -0.124 |
whence | -0.124 |
forgiveness | -0.110 |
accus | -0.102 |
hurled | -0.100 |
Token | the |
Token ID | 262 |
Feature activation | +3.09e-01 |
Pos logit contributions | |
olson | +2.282 |
dit | +1.958 |
� | +1.892 |
ctl | +1.820 |
advertising | +1.794 |
Neg logit contributions | |
whence | -1.883 |
PLIED | -1.877 |
forgiveness | -1.672 |
hurled | -1.562 |
accus | -1.553 |
Token | role |
Token ID | 2597 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
olson | +3.452 |
dit | +2.997 |
� | +2.888 |
ctl | +2.801 |
advertising | +2.777 |
Neg logit contributions | |
PLIED | -2.518 |
whence | -2.493 |
forgiveness | -2.173 |
hurled | -2.025 |
aught | -2.006 |
Token | meant |
Token ID | 4001 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
whence | +3.564 |
PLIED | +3.424 |
forgiveness | +3.063 |
where | +2.819 |
accus | +2.795 |
Neg logit contributions | |
olson | -6.058 |
dit | -5.230 |
� | -5.194 |
advertising | -4.963 |
ctl | -4.963 |
Token | that |
Token ID | 326 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
olson | +3.503 |
dit | +2.876 |
� | +2.801 |
ctl | +2.658 |
undo | +2.573 |
Neg logit contributions | |
PLIED | -3.898 |
whence | -3.882 |
forgiveness | -3.415 |
accus | -3.294 |
aught | -3.229 |
Token | the |
Token ID | 262 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
whence | +3.424 |
PLIED | +3.337 |
forgiveness | +3.060 |
where | +2.834 |
accus | +2.833 |
Neg logit contributions | |
olson | -4.226 |
dit | -3.586 |
� | -3.541 |
advertising | -3.368 |
ctl | -3.364 |
Token | asteroid |
Token ID | 27460 |
Feature activation | -5.98e-01 |
Pos logit contributions | |
whence | +2.037 |
PLIED | +1.996 |
forgiveness | +1.805 |
accus | +1.675 |
where | +1.655 |
Neg logit contributions | |
olson | -2.634 |
dit | -2.245 |
� | -2.206 |
ctl | -2.103 |
advertising | -2.102 |
Token | was |
Token ID | 373 |
Feature activation | -6.84e-01 |
Pos logit contributions | |
whence | +5.221 |
PLIED | +4.974 |
forgiveness | +4.622 |
where | +4.374 |
hurled | +4.318 |
Neg logit contributions | |
olson | -6.431 |
dit | -5.488 |
� | -5.472 |
advertising | -5.206 |
ctl | -5.115 |
Token | not |
Token ID | 407 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
whence | +5.421 |
PLIED | +5.173 |
forgiveness | +4.741 |
where | +4.585 |
hurled | +4.504 |
Neg logit contributions | |
olson | -7.868 |
dit | -6.789 |
� | -6.731 |
advertising | -6.405 |
ctl | -6.367 |
Token | bright |
Token ID | 6016 |
Feature activation | -3.31e-01 |
Pos logit contributions | |
whence | +8.613 |
PLIED | +7.975 |
where | +7.646 |
forgiveness | +7.576 |
hurled | +7.449 |
Neg logit contributions | |
olson | -11.613 |
dit | -9.941 |
� | -9.893 |
advertising | -9.425 |
ctl | -9.318 |
Token | enough |
Token ID | 1576 |
Feature activation | -7.76e-02 |
Pos logit contributions | |
whence | +1.972 |
PLIED | +1.906 |
forgiveness | +1.628 |
where | +1.472 |
accus | +1.460 |
Neg logit contributions | |
olson | -4.538 |
dit | -4.008 |
� | -3.978 |
advertising | -3.804 |
ctl | -3.803 |
Token | for |
Token ID | 329 |
Feature activation | -8.62e-01 |
Pos logit contributions | |
whence | +0.737 |
PLIED | +0.730 |
forgiveness | +0.659 |
accus | +0.620 |
hurled | +0.608 |
Neg logit contributions | |
olson | -0.792 |
dit | -0.665 |
� | -0.648 |
ctl | -0.617 |
advertising | -0.614 |
Token | the |
Token ID | 262 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
whence | +7.287 |
PLIED | +7.048 |
forgiveness | +6.668 |
where | +6.220 |
Applied | +6.170 |
Neg logit contributions | |
olson | -9.110 |
dit | -7.701 |
� | -7.624 |
advertising | -7.333 |
ctl | -7.281 |
Token | Aut |
Token ID | 5231 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
whence | +2.393 |
PLIED | +2.346 |
forgiveness | +2.124 |
accus | +1.970 |
where | +1.950 |
Neg logit contributions | |
olson | -3.086 |
dit | -2.628 |
� | -2.582 |
ctl | -2.462 |
advertising | -2.462 |
Token | however |
Token ID | 2158 |
Feature activation | +1.77e-02 |
Pos logit contributions | |
olson | +6.297 |
dit | +5.366 |
� | +5.304 |
undo | +5.024 |
advertising | +4.947 |
Neg logit contributions | |
PLIED | -7.477 |
whence | -7.005 |
forgiveness | -6.379 |
repre | -6.261 |
aught | -6.029 |
Token | , |
Token ID | 11 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
olson | +0.192 |
dit | +0.164 |
� | +0.161 |
advertising | +0.153 |
ctl | +0.152 |
Neg logit contributions | |
whence | -0.157 |
PLIED | -0.153 |
forgiveness | -0.140 |
where | -0.131 |
accus | -0.130 |
Token | continue |
Token ID | 2555 |
Feature activation | +7.14e-01 |
Pos logit contributions | |
olson | +3.727 |
dit | +3.130 |
� | +3.013 |
ctl | +2.960 |
undo | +2.874 |
Neg logit contributions | |
PLIED | -3.160 |
whence | -3.145 |
forgiveness | -2.771 |
repre | -2.584 |
accus | -2.567 |
Token | to |
Token ID | 284 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
olson | +6.395 |
� | +5.308 |
dit | +5.205 |
advertising | +4.891 |
ctl | +4.886 |
Neg logit contributions | |
PLIED | -7.079 |
whence | -6.992 |
forgiveness | -6.184 |
hurled | -5.951 |
aught | -5.899 |
Token | offer |
Token ID | 2897 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
olson | +5.408 |
dit | +4.503 |
� | +4.355 |
ctl | +4.283 |
undo | +4.147 |
Neg logit contributions | |
whence | -4.368 |
PLIED | -4.366 |
forgiveness | -3.848 |
repre | -3.591 |
hurled | -3.531 |
Token | employees |
Token ID | 4409 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
whence | +8.354 |
PLIED | +8.138 |
forgiveness | +7.970 |
where | +7.443 |
accus | +7.154 |
Neg logit contributions | |
olson | -11.764 |
dit | -10.091 |
� | -10.013 |
advertising | -9.842 |
ctl | -9.492 |
Token | the |
Token ID | 262 |
Feature activation | -5.97e-01 |
Pos logit contributions | |
whence | +11.414 |
PLIED | +10.890 |
forgiveness | +10.753 |
where | +10.669 |
accus | +9.621 |
Neg logit contributions | |
olson | -16.320 |
dit | -13.952 |
� | -13.905 |
advertising | -13.901 |
Quantity | -13.372 |
Token | opportunity |
Token ID | 3663 |
Feature activation | -8.24e-01 |
Pos logit contributions | |
whence | +4.292 |
PLIED | +4.243 |
forgiveness | +3.901 |
where | +3.561 |
accus | +3.529 |
Neg logit contributions | |
olson | -7.199 |
dit | -6.260 |
� | -6.176 |
advertising | -5.966 |
ctl | -5.932 |
Token | for |
Token ID | 329 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
whence | +6.567 |
PLIED | +6.365 |
forgiveness | +5.912 |
where | +5.620 |
accus | +5.396 |
Neg logit contributions | |
olson | -9.277 |
dit | -7.944 |
� | -7.692 |
advertising | -7.500 |
ctl | -7.340 |
Token | language |
Token ID | 3303 |
Feature activation | -4.88e-01 |
Pos logit contributions | |
whence | +8.725 |
PLIED | +8.356 |
forgiveness | +8.180 |
where | +7.679 |
accus | +7.378 |
Neg logit contributions | |
olson | -11.816 |
dit | -10.199 |
� | -9.962 |
advertising | -9.775 |
ctl | -9.470 |
Token | training |
Token ID | 3047 |
Feature activation | -9.94e-01 |
Pos logit contributions | |
whence | +3.882 |
PLIED | +3.773 |
forgiveness | +3.495 |
where | +3.213 |
accus | +3.172 |
Neg logit contributions | |
olson | -5.669 |
dit | -4.851 |
� | -4.801 |
advertising | -4.597 |
ctl | -4.527 |
Token | crowd |
Token ID | 4315 |
Feature activation | -6.66e-01 |
Pos logit contributions | |
olson | +1.539 |
dit | +1.309 |
� | +1.289 |
ctl | +1.235 |
advertising | +1.229 |
Neg logit contributions | |
PLIED | -1.165 |
whence | -1.161 |
forgiveness | -1.024 |
accus | -0.942 |
repre | -0.935 |
Token | and |
Token ID | 290 |
Feature activation | +5.64e-02 |
Pos logit contributions | |
whence | +5.555 |
PLIED | +5.172 |
forgiveness | +4.774 |
where | +4.637 |
accus | +4.514 |
Neg logit contributions | |
olson | -7.518 |
dit | -6.492 |
� | -6.386 |
ctl | -6.084 |
advertising | -5.987 |
Token | accusations |
Token ID | 14227 |
Feature activation | -5.39e-01 |
Pos logit contributions | |
olson | +0.621 |
dit | +0.523 |
� | +0.517 |
ctl | +0.493 |
advertising | +0.488 |
Neg logit contributions | |
PLIED | -0.488 |
whence | -0.488 |
forgiveness | -0.429 |
accus | -0.396 |
Applied | -0.394 |
Token | of |
Token ID | 286 |
Feature activation | -5.63e-01 |
Pos logit contributions | |
whence | +4.773 |
PLIED | +4.591 |
forgiveness | +4.220 |
accus | +3.996 |
hurled | +3.987 |
Neg logit contributions | |
olson | -5.813 |
dit | -4.970 |
� | -4.840 |
advertising | -4.647 |
ctl | -4.619 |
Token | coward |
Token ID | 26769 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
whence | +4.773 |
PLIED | +4.636 |
forgiveness | +4.293 |
accus | +3.987 |
where | +3.959 |
Neg logit contributions | |
olson | -6.229 |
dit | -5.348 |
� | -5.213 |
ctl | -4.990 |
advertising | -4.976 |
Token | ice |
Token ID | 501 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
olson | +0.161 |
dit | +0.133 |
� | +0.132 |
ctl | +0.125 |
advertising | +0.124 |
Neg logit contributions | |
whence | -0.160 |
PLIED | -0.159 |
forgiveness | -0.143 |
accus | -0.135 |
hurled | -0.133 |
Token | on |
Token ID | 319 |
Feature activation | +8.37e-02 |
Pos logit contributions | |
whence | +8.271 |
PLIED | +7.672 |
forgiveness | +7.196 |
hurled | +7.177 |
where | +7.096 |
Neg logit contributions | |
olson | -11.090 |
� | -9.730 |
dit | -9.649 |
ctl | -9.098 |
advertising | -9.025 |
Token | social |
Token ID | 1919 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
olson | +0.885 |
dit | +0.737 |
� | +0.736 |
ctl | +0.697 |
advertising | +0.687 |
Neg logit contributions | |
PLIED | -0.761 |
whence | -0.756 |
forgiveness | -0.667 |
accus | -0.624 |
repre | -0.620 |
Token | media |
Token ID | 2056 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
whence | +1.068 |
PLIED | +1.059 |
forgiveness | +0.938 |
accus | +0.872 |
Applied | +0.855 |
Neg logit contributions | |
olson | -1.340 |
dit | -1.142 |
� | -1.127 |
ctl | -1.075 |
advertising | -1.065 |
Token | . |
Token ID | 13 |
Feature activation | +5.63e-02 |
Pos logit contributions | |
whence | +3.460 |
PLIED | +3.352 |
forgiveness | +3.048 |
accus | +2.854 |
where | +2.843 |
Neg logit contributions | |
olson | -4.361 |
dit | -3.715 |
� | -3.660 |
ctl | -3.478 |
advertising | -3.468 |
Token |
|
Token ID | 198 |
Feature activation | -4.36e-01 |
Pos logit contributions | |
olson | +0.551 |
dit | +0.454 |
� | +0.450 |
advertising | +0.424 |
ctl | +0.422 |
Neg logit contributions | |
whence | -0.558 |
PLIED | -0.555 |
forgiveness | -0.504 |
accus | -0.474 |
repre | -0.466 |
Token | actually |
Token ID | 1682 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
olson | +6.745 |
� | +5.807 |
dit | +5.804 |
ctl | +5.540 |
undo | +5.278 |
Neg logit contributions | |
PLIED | -5.577 |
whence | -5.563 |
forgiveness | -4.790 |
hurled | -4.537 |
repre | -4.532 |
Token | gets |
Token ID | 3011 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
olson | +2.742 |
dit | +2.328 |
� | +2.313 |
ctl | +2.201 |
advertising | +2.145 |
Neg logit contributions | |
whence | -2.196 |
PLIED | -2.190 |
forgiveness | -1.948 |
accus | -1.806 |
hurled | -1.764 |
Token | loaded |
Token ID | 9639 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
whence | +10.210 |
PLIED | +10.040 |
where | +9.203 |
forgiveness | +8.904 |
cropped | +8.881 |
Neg logit contributions | |
olson | -15.211 |
� | -12.837 |
dit | -12.759 |
advertising | -12.697 |
Quantity | -12.086 |
Token | in |
Token ID | 287 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
olson | +1.103 |
dit | +0.946 |
� | +0.928 |
ctl | +0.890 |
advertising | +0.878 |
Neg logit contributions | |
PLIED | -0.907 |
whence | -0.903 |
forgiveness | -0.801 |
accus | -0.749 |
repre | -0.731 |
Token | depends |
Token ID | 8338 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
whence | +3.323 |
PLIED | +3.240 |
forgiveness | +2.925 |
accus | +2.713 |
where | +2.702 |
Neg logit contributions | |
olson | -4.357 |
dit | -3.718 |
� | -3.643 |
advertising | -3.486 |
ctl | -3.467 |
Token | on |
Token ID | 319 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
whence | +1.951 |
PLIED | +1.935 |
forgiveness | +1.769 |
accus | +1.667 |
hurled | +1.641 |
Neg logit contributions | |
olson | -1.760 |
dit | -1.456 |
� | -1.427 |
ctl | -1.342 |
advertising | -1.331 |
Token | the |
Token ID | 262 |
Feature activation | -4.22e-01 |
Pos logit contributions | |
whence | +10.851 |
where | +9.637 |
PLIED | +9.318 |
forgiveness | +9.097 |
accus | +8.115 |
Neg logit contributions | |
olson | -15.495 |
dit | -13.519 |
� | -13.328 |
advertising | -12.942 |
ctl | -12.636 |
Token | OS |
Token ID | 7294 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
whence | +3.926 |
PLIED | +3.794 |
forgiveness | +3.488 |
where | +3.276 |
accus | +3.255 |
Neg logit contributions | |
olson | -4.389 |
dit | -3.715 |
� | -3.659 |
advertising | -3.471 |
ctl | -3.444 |
Token | p |
Token ID | 279 |
Feature activation | -4.14e-01 |
Pos logit contributions | |
whence | +9.259 |
PLIED | +8.699 |
where | +8.264 |
forgiveness | +8.065 |
accus | +7.516 |
Neg logit contributions | |
olson | -11.366 |
dit | -9.571 |
� | -9.548 |
advertising | -9.276 |
undo | -9.094 |
Token | aging |
Token ID | 3039 |
Feature activation | -3.26e-01 |
Pos logit contributions | |
whence | +4.283 |
PLIED | +4.206 |
forgiveness | +3.868 |
accus | +3.644 |
where | +3.633 |
Neg logit contributions | |
olson | -3.846 |
dit | -3.148 |
� | -3.102 |
advertising | -2.901 |
ctl | -2.876 |
Token | if |
Token ID | 611 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
whence | +2.864 |
PLIED | +2.803 |
forgiveness | +2.532 |
accus | +2.357 |
where | +2.338 |
Neg logit contributions | |
olson | -3.578 |
dit | -3.036 |
� | -2.989 |
advertising | -2.839 |
ctl | -2.835 |
Token | have |
Token ID | 423 |
Feature activation | +6.62e-02 |
Pos logit contributions | |
whence | +2.158 |
PLIED | +2.122 |
forgiveness | +1.905 |
accus | +1.770 |
where | +1.740 |
Neg logit contributions | |
olson | -2.804 |
dit | -2.389 |
� | -2.347 |
ctl | -2.238 |
advertising | -2.231 |
Token | received |
Token ID | 2722 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
olson | +0.750 |
dit | +0.645 |
� | +0.625 |
ctl | +0.606 |
advertising | +0.597 |
Neg logit contributions | |
PLIED | -0.547 |
whence | -0.547 |
forgiveness | -0.479 |
accus | -0.440 |
repre | -0.440 |
Token | enormous |
Token ID | 9812 |
Feature activation | -3.23e-01 |
Pos logit contributions | |
whence | +8.324 |
PLIED | +7.953 |
forgiveness | +7.802 |
accus | +7.267 |
where | +7.182 |
Neg logit contributions | |
olson | -11.027 |
dit | -9.401 |
� | -9.183 |
Quantity | -8.721 |
ctl | -8.695 |
Token | amounts |
Token ID | 6867 |
Feature activation | -8.50e-01 |
Pos logit contributions | |
whence | +2.436 |
PLIED | +2.374 |
forgiveness | +2.144 |
accus | +1.964 |
where | +1.925 |
Neg logit contributions | |
olson | -3.938 |
dit | -3.408 |
� | -3.349 |
ctl | -3.206 |
advertising | -3.186 |
Token | of |
Token ID | 286 |
Feature activation | -7.34e-01 |
Pos logit contributions | |
whence | +6.277 |
PLIED | +5.836 |
forgiveness | +5.556 |
where | +5.237 |
accus | +5.037 |
Neg logit contributions | |
olson | -10.153 |
dit | -8.676 |
� | -8.619 |
advertising | -8.068 |
ctl | -8.056 |
Token | criticism |
Token ID | 7734 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
whence | +5.863 |
PLIED | +5.611 |
forgiveness | +5.371 |
accus | +4.930 |
where | +4.854 |
Neg logit contributions | |
olson | -8.397 |
dit | -7.197 |
� | -7.074 |
ctl | -6.712 |
Quantity | -6.677 |
Token | for |
Token ID | 329 |
Feature activation | -7.63e-01 |
Pos logit contributions | |
whence | +8.863 |
PLIED | +8.115 |
forgiveness | +7.778 |
where | +7.749 |
hurled | +7.527 |
Neg logit contributions | |
olson | -12.027 |
dit | -10.463 |
� | -10.418 |
advertising | -9.708 |
ctl | -9.634 |
Token | esp |
Token ID | 15024 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
whence | +6.413 |
PLIED | +6.048 |
forgiveness | +5.720 |
where | +5.426 |
accus | +5.338 |
Neg logit contributions | |
olson | -8.420 |
dit | -7.212 |
� | -7.140 |
ctl | -6.809 |
advertising | -6.676 |
Token | ousing |
Token ID | 12752 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
whence | +1.586 |
PLIED | +1.556 |
forgiveness | +1.397 |
accus | +1.314 |
where | +1.306 |
Neg logit contributions | |
olson | -2.010 |
dit | -1.716 |
� | -1.699 |
ctl | -1.609 |
advertising | -1.594 |
Token | ideas |
Token ID | 4213 |
Feature activation | -4.68e-01 |
Pos logit contributions | |
olson | +0.135 |
dit | +0.114 |
� | +0.112 |
ctl | +0.107 |
advertising | +0.106 |
Neg logit contributions | |
whence | -0.111 |
PLIED | -0.110 |
forgiveness | -0.098 |
accus | -0.091 |
hurled | -0.089 |
Token | that |
Token ID | 326 |
Feature activation | -3.20e-01 |
Pos logit contributions | |
whence | +4.385 |
PLIED | +4.247 |
forgiveness | +3.897 |
where | +3.694 |
accus | +3.670 |
Neg logit contributions | |
olson | -4.885 |
dit | -4.089 |
� | -4.027 |
advertising | -3.809 |
ctl | -3.803 |