Token | � |
Token ID | 447 |
Feature activation | -2.99e+01 |
Pos logit contributions | |
� | +43.457 |
� | +41.012 |
policies | +35.284 |
climate | +33.835 |
needs | +33.706 |
Neg logit contributions | |
�� | -25.291 |
��極 | -21.886 |
senal | -21.297 |
�� | -20.840 |
arthed | -20.694 |
Token | � |
Token ID | 247 |
Feature activation | +2.55e+01 |
Pos logit contributions | |
�� | +27.647 |
�� | +25.357 |
� | +25.274 |
� | +25.123 |
� | +25.071 |
Neg logit contributions | |
� | -18.328 |
� | -18.110 |
behavi | -17.638 |
policies | -15.947 |
ideology | -14.653 |
Token | s |
Token ID | 82 |
Feature activation | +2.60e+01 |
Pos logit contributions | |
� | +28.342 |
� | +26.671 |
policies | +23.462 |
climate | +21.897 |
institutions | +21.791 |
Neg logit contributions | |
�� | -19.201 |
�� | -16.422 |
arthed | -16.037 |
��極 | -15.986 |
�� | -15.576 |
Token | collapse |
Token ID | 9807 |
Feature activation | +4.58e+01 |
Pos logit contributions | |
� | +27.615 |
� | +26.531 |
policies | +24.764 |
climate | +23.804 |
institutions | +23.186 |
Neg logit contributions | |
�� | -19.558 |
arthed | -17.130 |
��極 | -17.004 |
senal | -16.304 |
�� | -16.085 |
Token | requires |
Token ID | 4433 |
Feature activation | +3.02e+01 |
Pos logit contributions | |
� | +39.499 |
� | +37.320 |
policies | +32.502 |
policy | +30.814 |
| +30.191 |
Neg logit contributions | |
senal | -25.642 |
�� | -25.404 |
��極 | -23.404 |
�� | -22.856 |
�� | -22.068 |
Token | active |
Token ID | 4075 |
Feature activation | +6.81e+01 |
Pos logit contributions | |
� | +30.545 |
� | +29.242 |
policies | +27.495 |
institutions | +25.585 |
climate | +25.523 |
Neg logit contributions | |
�� | -22.146 |
��極 | -19.927 |
�� | -19.619 |
senal | -19.359 |
�� | -19.184 |
Token | involvement |
Token ID | 9750 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
� | +42.488 |
policies | +41.011 |
� | +40.496 |
policy | +39.213 |
governance | +38.982 |
Neg logit contributions | |
�� | -29.839 |
��極 | -28.099 |
�� | -26.644 |
senal | -26.539 |
�� | -24.977 |
Token | of |
Token ID | 286 |
Feature activation | +2.90e+01 |
Pos logit contributions | |
� | +18.887 |
� | +17.608 |
policies | +15.401 |
institutions | +14.211 |
policy | +13.812 |
Neg logit contributions | |
�� | -15.849 |
arthed | -15.029 |
�� | -14.755 |
��極 | -14.340 |
senal | -14.262 |
Token | international |
Token ID | 3230 |
Feature activation | +5.81e+01 |
Pos logit contributions | |
� | +30.276 |
� | +28.928 |
policies | +26.770 |
institutions | +25.779 |
climate | +25.427 |
Neg logit contributions | |
�� | -21.424 |
��極 | -19.557 |
�� | -18.754 |
arthed | -18.742 |
�� | -18.255 |
Token | organisations |
Token ID | 16435 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
� | +41.836 |
� | +39.660 |
institutions | +39.190 |
policies | +38.249 |
organizations | +37.649 |
Neg logit contributions | |
�� | -26.583 |
arthed | -26.289 |
��極 | -26.259 |
senal | -25.276 |
�� | -24.293 |
Token | that |
Token ID | 326 |
Feature activation | +3.45e+01 |
Pos logit contributions | |
� | +24.776 |
� | +23.512 |
policies | +19.869 |
institutions | +18.856 |
climate | +18.717 |
Neg logit contributions | |
�� | -18.761 |
arthed | -18.146 |
�� | -17.411 |
senal | -17.177 |
��極 | -17.073 |
Token | have |
Token ID | 423 |
Feature activation | +2.48e+01 |
Pos logit contributions | |
� | +41.575 |
� | +40.320 |
policies | +33.584 |
institutions | +33.172 |
| +32.096 |
Neg logit contributions | |
�� | -21.785 |
arthed | -19.745 |
��極 | -18.857 |
�� | -18.694 |
senal | -17.810 |
Token | been |
Token ID | 587 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
� | +28.376 |
� | +27.591 |
policies | +23.957 |
institutions | +23.109 |
economic | +22.273 |
Neg logit contributions | |
�� | -18.327 |
senal | -16.156 |
�� | -15.872 |
arthed | -15.816 |
�� | -15.787 |
Token | the |
Token ID | 262 |
Feature activation | +3.78e+01 |
Pos logit contributions | |
� | +21.145 |
� | +20.094 |
policies | +17.575 |
institutions | +16.757 |
climate | +16.181 |
Neg logit contributions | |
�� | -15.156 |
�� | -13.424 |
arthed | -12.778 |
nesday | -12.592 |
��極 | -12.478 |
Token | basis |
Token ID | 4308 |
Feature activation | +3.39e+01 |
Pos logit contributions | |
� | +35.726 |
� | +34.749 |
policies | +31.433 |
institutions | +30.670 |
economic | +29.442 |
Neg logit contributions | |
�� | -23.652 |
nesday | -19.211 |
�� | -19.074 |
��極 | -18.849 |
arthed | -18.773 |
Token | of |
Token ID | 286 |
Feature activation | +4.88e+01 |
Pos logit contributions | |
� | +35.129 |
� | +32.688 |
policies | +28.057 |
institutions | +26.308 |
climate | +25.709 |
Neg logit contributions | |
�� | -21.495 |
Blossom | -19.040 |
arthed | -19.009 |
�� | -18.526 |
�� | -18.438 |
Token | American |
Token ID | 1605 |
Feature activation | +6.60e+01 |
Pos logit contributions | |
� | +42.457 |
� | +41.073 |
policies | +36.103 |
institutions | +34.790 |
governance | +34.620 |
Neg logit contributions | |
�� | -24.861 |
��極 | -21.437 |
arthed | -20.216 |
�� | -20.054 |
yne | -20.035 |
Token | foreign |
Token ID | 3215 |
Feature activation | +5.09e+01 |
Pos logit contributions | |
� | +45.357 |
� | +43.446 |
policies | +41.003 |
institutions | +39.498 |
governance | +39.308 |
Neg logit contributions | |
�� | -29.466 |
��極 | -24.289 |
nesday | -23.861 |
Canaver | -23.634 |
�� | -22.615 |
Token | policy |
Token ID | 2450 |
Feature activation | +3.70e+01 |
Pos logit contributions | |
policies | +37.140 |
� | +36.657 |
policy | +36.618 |
� | +36.312 |
institutions | +31.885 |
Neg logit contributions | |
�� | -31.020 |
��極 | -26.862 |
nesday | -26.536 |
�� | -25.571 |
Canaver | -24.657 |
Token | for |
Token ID | 329 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
� | +36.260 |
� | +34.056 |
policies | +30.669 |
institutions | +28.255 |
policy | +28.144 |
Neg logit contributions | |
�� | -23.510 |
��極 | -21.168 |
arthed | -21.049 |
�� | -20.395 |
mington | -20.187 |
Token | a |
Token ID | 257 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
� | +18.301 |
� | +17.392 |
policies | +15.626 |
institutions | +14.579 |
climate | +14.365 |
Neg logit contributions | |
�� | -11.945 |
�� | -10.469 |
arthed | -10.396 |
yne | -10.039 |
��極 | -9.997 |
Token | very |
Token ID | 845 |
Feature activation | +6.84e+00 |
Pos logit contributions | |
� | +19.717 |
� | +18.831 |
policies | +15.930 |
climate | +15.147 |
policy | +14.981 |
Neg logit contributions | |
�� | -15.884 |
arthed | -14.398 |
�� | -13.890 |
Blossom | -13.635 |
yne | -13.608 |
Token | the |
Token ID | 262 |
Feature activation | +8.23e+00 |
Pos logit contributions | |
� | +9.620 |
� | +9.157 |
policies | +8.269 |
institutions | +7.665 |
climate | +7.611 |
Neg logit contributions | |
�� | -6.782 |
�� | -6.172 |
arthed | -6.049 |
yne | -5.984 |
��極 | -5.762 |
Token | front |
Token ID | 2166 |
Feature activation | +2.19e+01 |
Pos logit contributions | |
� | +8.911 |
� | +8.334 |
policies | +7.383 |
institutions | +6.723 |
climate | +6.646 |
Neg logit contributions | |
�� | -9.218 |
�� | -8.441 |
arthed | -8.400 |
yne | -8.112 |
senal | -8.047 |
Token | lines |
Token ID | 3951 |
Feature activation | +9.24e+00 |
Pos logit contributions | |
� | +19.999 |
� | +18.678 |
policies | +16.603 |
economic | +14.900 |
institutions | +14.800 |
Neg logit contributions | |
�� | -22.191 |
arthed | -20.315 |
�� | -20.193 |
senal | -20.051 |
��極 | -19.761 |
Token | of |
Token ID | 286 |
Feature activation | +3.36e+01 |
Pos logit contributions | |
� | +10.483 |
� | +9.849 |
policies | +8.506 |
institutions | +7.787 |
climate | +7.714 |
Neg logit contributions | |
�� | -9.763 |
�� | -9.203 |
arthed | -8.998 |
��極 | -8.681 |
�� | -8.657 |
Token | major |
Token ID | 1688 |
Feature activation | +5.16e+01 |
Pos logit contributions | |
� | +31.879 |
� | +30.835 |
policies | +29.599 |
economic | +28.122 |
policy | +28.026 |
Neg logit contributions | |
�� | -22.702 |
��極 | -20.100 |
senal | -19.341 |
�� | -19.244 |
yne | -19.064 |
Token | global |
Token ID | 3298 |
Feature activation | +6.45e+01 |
Pos logit contributions | |
� | +37.201 |
policies | +37.093 |
� | +36.259 |
policy | +36.094 |
economic | +35.923 |
Neg logit contributions | |
�� | -26.938 |
��極 | -23.138 |
senal | -22.761 |
�� | -21.672 |
�� | -21.357 |
Token | and |
Token ID | 290 |
Feature activation | +2.42e+01 |
Pos logit contributions | |
� | +40.436 |
policies | +39.480 |
� | +39.113 |
economic | +39.014 |
governance | +38.655 |
Neg logit contributions | |
�� | -29.932 |
senal | -26.394 |
��極 | -26.390 |
arthed | -25.245 |
�� | -24.618 |
Token | societal |
Token ID | 26877 |
Feature activation | +5.26e+01 |
Pos logit contributions | |
� | +23.381 |
� | +22.352 |
policies | +20.820 |
economic | +20.469 |
policy | +20.095 |
Neg logit contributions | |
�� | -20.801 |
��極 | -18.665 |
senal | -18.428 |
arthed | -18.177 |
�� | -18.107 |
Token | change |
Token ID | 1487 |
Feature activation | +2.70e+01 |
Pos logit contributions | |
� | +35.873 |
policies | +35.633 |
� | +34.750 |
policy | +34.314 |
institutions | +34.039 |
Neg logit contributions | |
�� | -31.253 |
��極 | -27.403 |
senal | -26.848 |
yne | -26.014 |
arthed | -25.757 |
Token | . |
Token ID | 13 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
� | +29.568 |
� | +27.677 |
policies | +24.091 |
institutions | +22.365 |
policy | +22.085 |
Neg logit contributions | |
�� | -20.481 |
�� | -18.425 |
arthed | -18.215 |
senal | -18.063 |
��極 | -17.737 |
Token | The |
Token ID | 383 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
� | +27.481 |
� | +26.007 |
policies | +21.616 |
| +20.564 |
climate | +20.339 |
Neg logit contributions | |
�� | -17.320 |
senal | -15.107 |
�� | -14.675 |
arthed | -14.313 |
��極 | -13.994 |
Token | � |
Token ID | 564 |
Feature activation | -5.79e+00 |
Pos logit contributions | |
� | +27.798 |
policies | +27.146 |
� | +27.006 |
policy | +24.694 |
economic | +24.393 |
Neg logit contributions | |
�� | -20.329 |
senal | -16.630 |
arthed | -16.320 |
�� | -16.294 |
�� | -16.196 |
Token | � |
Token ID | 250 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
�� | +1.998 |
�� | +1.927 |
�� | +1.521 |
arthed | +1.495 |
�� | +1.404 |
Neg logit contributions | |
� | -10.125 |
� | -9.778 |
policies | -9.203 |
climate | -8.785 |
ideology | -8.755 |
Token | wild |
Token ID | 21992 |
Feature activation | +4.30e+01 |
Pos logit contributions | |
� | +16.338 |
� | +15.431 |
policies | +14.220 |
institutions | +13.068 |
policy | +12.970 |
Neg logit contributions | |
�� | -8.676 |
�� | -7.303 |
arthed | -7.208 |
�� | -6.938 |
yne | -6.865 |
Token | ly |
Token ID | 306 |
Feature activation | +2.83e+01 |
Pos logit contributions | |
� | +42.840 |
� | +41.011 |
policies | +37.622 |
policy | +34.679 |
economic | +34.425 |
Neg logit contributions | |
�� | -23.439 |
�� | -17.595 |
senal | -17.036 |
zzo | -16.259 |
arthed | -16.127 |
Token | unaff |
Token ID | 25312 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
� | +30.325 |
� | +29.059 |
policies | +25.827 |
policy | +24.136 |
economic | +23.878 |
Neg logit contributions | |
�� | -22.653 |
�� | -17.881 |
senal | -17.602 |
arthed | -17.417 |
nesday | -16.952 |
Token | ordable |
Token ID | 16819 |
Feature activation | +6.40e+01 |
Pos logit contributions | |
� | +0.425 |
� | +0.405 |
policies | +0.372 |
institutions | +0.352 |
climate | +0.348 |
Neg logit contributions | |
�� | -0.175 |
arthed | -0.162 |
�� | -0.159 |
yne | -0.154 |
Remy | -0.148 |
Token | � |
Token ID | 447 |
Feature activation | -8.46e+00 |
Pos logit contributions | |
� | +49.611 |
� | +47.141 |
policies | +43.420 |
policy | +39.440 |
economic | +38.915 |
Neg logit contributions | |
�� | -28.979 |
senal | -22.166 |
arthed | -21.610 |
�� | -20.871 |
nesday | -19.836 |
Token | � |
Token ID | 251 |
Feature activation | +3.60e+01 |
Pos logit contributions | |
�� | +2.935 |
�� | +2.859 |
�� | +2.262 |
arthed | +2.254 |
�� | +2.180 |
Neg logit contributions | |
� | -14.574 |
� | -14.031 |
policies | -13.004 |
institutions | -12.483 |
climate | -12.449 |
Token | tax |
Token ID | 1687 |
Feature activation | +4.43e+01 |
Pos logit contributions | |
� | +37.713 |
� | +35.838 |
policies | +34.970 |
policy | +31.979 |
economic | +31.433 |
Neg logit contributions | |
�� | -22.323 |
�� | -16.295 |
senal | -16.193 |
�� | -15.857 |
arthed | -15.709 |
Token | cuts |
Token ID | 6630 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
� | +36.309 |
policies | +35.430 |
� | +34.612 |
policy | +32.580 |
reforms | +30.474 |
Neg logit contributions | |
�� | -28.230 |
senal | -22.469 |
�� | -22.053 |
ometown | -21.893 |
nesday | -21.627 |
Token | . |
Token ID | 13 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
� | +21.077 |
� | +19.602 |
policies | +17.090 |
policy | +15.484 |
institutions | +15.327 |
Neg logit contributions | |
�� | -16.457 |
arthed | -14.539 |
�� | -14.437 |
senal | -14.313 |
yne | -13.943 |
Token | transition |
Token ID | 6801 |
Feature activation | +4.45e+01 |
Pos logit contributions | |
� | +33.502 |
policies | +32.237 |
� | +31.856 |
climate | +30.326 |
governance | +30.180 |
Neg logit contributions | |
�� | -26.275 |
��極 | -24.181 |
senal | -23.856 |
arthed | -23.758 |
ometown | -22.098 |
Token | — |
Token ID | 960 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
� | +42.446 |
� | +38.947 |
policies | +36.510 |
policy | +33.464 |
governance | +32.915 |
Neg logit contributions | |
�� | -23.932 |
arthed | -21.674 |
�� | -20.727 |
��極 | -20.558 |
senal | -20.545 |
Token | yet |
Token ID | 25907 |
Feature activation | +3.39e+01 |
Pos logit contributions | |
� | +20.205 |
� | +18.594 |
policies | +16.321 |
institutions | +15.253 |
| +15.046 |
Neg logit contributions | |
�� | -14.154 |
�� | -12.692 |
�� | -12.438 |
arthed | -12.406 |
senal | -11.922 |
Token | the |
Token ID | 262 |
Feature activation | +3.08e+01 |
Pos logit contributions | |
� | +34.195 |
� | +32.676 |
policies | +31.054 |
climate | +29.182 |
institutions | +29.102 |
Neg logit contributions | |
�� | -20.610 |
senal | -17.791 |
��極 | -17.361 |
arthed | -17.297 |
�� | -16.953 |
Token | federal |
Token ID | 2717 |
Feature activation | +3.76e+01 |
Pos logit contributions | |
� | +31.600 |
� | +30.342 |
policies | +29.337 |
institutions | +27.711 |
climate | +27.181 |
Neg logit contributions | |
�� | -19.780 |
senal | -17.726 |
arthed | -17.714 |
�� | -17.176 |
��極 | -17.045 |
Token | government |
Token ID | 1230 |
Feature activation | +6.37e+01 |
Pos logit contributions | |
� | +35.171 |
� | +33.926 |
policies | +32.487 |
institutions | +30.051 |
climate | +30.043 |
Neg logit contributions | |
�� | -22.967 |
arthed | -20.106 |
senal | -19.730 |
Canaver | -19.300 |
��極 | -19.105 |
Token | has |
Token ID | 468 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
� | +47.580 |
� | +45.238 |
policies | +39.631 |
institutions | +37.181 |
policy | +36.300 |
Neg logit contributions | |
�� | -25.854 |
�� | -22.214 |
�� | -21.411 |
senal | -21.407 |
arthed | -21.186 |
Token | withdrawn |
Token ID | 23019 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
� | +15.989 |
� | +15.332 |
policies | +13.932 |
institutions | +12.937 |
climate | +12.671 |
Neg logit contributions | |
�� | -10.850 |
�� | -9.679 |
arthed | -9.354 |
�� | -9.312 |
senal | -9.260 |
Token | and |
Token ID | 290 |
Feature activation | +2.55e+01 |
Pos logit contributions | |
� | +25.769 |
� | +24.857 |
policies | +23.258 |
climate | +21.371 |
institutions | +21.333 |
Neg logit contributions | |
�� | -16.506 |
�� | -14.775 |
��極 | -14.454 |
senal | -14.081 |
arthed | -14.057 |
Token | many |
Token ID | 867 |
Feature activation | +4.07e+01 |
Pos logit contributions | |
� | +29.045 |
� | +27.722 |
policies | +26.752 |
institutions | +25.143 |
climate | +24.645 |
Neg logit contributions | |
�� | -17.684 |
senal | -15.085 |
�� | -15.084 |
arthed | -14.475 |
��極 | -14.427 |
Token | state |
Token ID | 1181 |
Feature activation | +4.54e+01 |
Pos logit contributions | |
� | +35.559 |
� | +34.320 |
policies | +34.009 |
institutions | +32.251 |
policy | +31.178 |
Neg logit contributions | |
�� | -25.228 |
senal | -21.356 |
��極 | -20.168 |
�� | -20.019 |
arthed | -20.010 |
Token | registered |
Token ID | 6823 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
� | +26.114 |
� | +24.644 |
policies | +22.771 |
institutions | +21.644 |
policy | +21.216 |
Neg logit contributions | |
�� | -21.534 |
senal | -18.241 |
�� | -18.034 |
arthed | -17.950 |
Canaver | -17.040 |
Token | voters |
Token ID | 4446 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
� | +16.744 |
� | +15.761 |
policies | +13.820 |
climate | +12.710 |
institutions | +12.561 |
Neg logit contributions | |
�� | -23.342 |
�� | -21.079 |
arthed | -20.613 |
senal | -20.472 |
Canaver | -19.973 |
Token | say |
Token ID | 910 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
� | +29.034 |
� | +27.382 |
policies | +23.411 |
climate | +21.991 |
ideology | +21.503 |
Neg logit contributions | |
�� | -21.698 |
senal | -19.024 |
arthed | -18.438 |
�� | -18.224 |
�� | -17.668 |
Token | the |
Token ID | 262 |
Feature activation | +3.19e+01 |
Pos logit contributions | |
� | +22.164 |
� | +21.215 |
policies | +19.554 |
ideology | +17.769 |
climate | +17.759 |
Neg logit contributions | |
�� | -20.373 |
arthed | -17.556 |
senal | -17.140 |
��極 | -16.955 |
�� | -16.429 |
Token | Republican |
Token ID | 3415 |
Feature activation | +3.59e+01 |
Pos logit contributions | |
� | +29.768 |
� | +28.600 |
policies | +27.470 |
ideology | +25.154 |
policy | +25.054 |
Neg logit contributions | |
�� | -25.112 |
senal | -21.071 |
arthed | -21.035 |
��極 | -20.875 |
yne | -20.356 |
Token | Party |
Token ID | 3615 |
Feature activation | +6.37e+01 |
Pos logit contributions | |
� | +32.729 |
� | +30.308 |
policies | +28.791 |
ideology | +26.893 |
policy | +26.108 |
Neg logit contributions | |
�� | -27.374 |
�� | -22.400 |
arthed | -22.321 |
��極 | -21.920 |
senal | -21.768 |
Token | has |
Token ID | 468 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
� | +46.517 |
� | +43.203 |
policies | +38.965 |
ideology | +36.223 |
institutions | +35.773 |
Neg logit contributions | |
�� | -29.386 |
arthed | -24.960 |
senal | -24.391 |
��極 | -24.360 |
�� | -23.457 |
Token | more |
Token ID | 517 |
Feature activation | +3.33e+01 |
Pos logit contributions | |
� | +25.389 |
� | +24.537 |
policies | +23.597 |
institutions | +21.381 |
economic | +21.156 |
Neg logit contributions | |
�� | -19.043 |
senal | -17.223 |
��極 | -17.217 |
�� | -16.883 |
arthed | -16.474 |
Token | concern |
Token ID | 2328 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
� | +30.834 |
policies | +30.307 |
� | +29.462 |
policy | +27.839 |
economic | +27.564 |
Neg logit contributions | |
�� | -23.124 |
��極 | -21.159 |
�� | -21.029 |
senal | -20.352 |
�� | -20.127 |
Token | for |
Token ID | 329 |
Feature activation | +3.93e+01 |
Pos logit contributions | |
� | +23.917 |
� | +22.258 |
policies | +20.000 |
policy | +18.123 |
climate | +18.036 |
Neg logit contributions | |
�� | -19.014 |
arthed | -17.059 |
�� | -17.049 |
��極 | -16.645 |
senal | -15.943 |
Token | Hispanics |
Token ID | 30714 |
Feature activation | +3.08e+01 |
Pos logit contributions | |
� | +33.409 |
policies | +32.061 |
� | +31.391 |
economic | +29.955 |
policy | +29.911 |
Neg logit contributions | |
�� | -27.112 |
��極 | -24.320 |
senal | -23.989 |
arthed | -22.615 |
�� | -21.451 |
Token | by |
Token ID | 416 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
� | +38.174 |
� | +35.703 |
policies | +29.835 |
climate | +28.092 |
| +27.915 |
Neg logit contributions | |
�� | -22.675 |
�� | -20.899 |
��極 | -20.875 |
�� | -20.727 |
arthed | -20.588 |
Token | paying |
Token ID | 5989 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
� | +2.253 |
� | +2.097 |
policies | +1.846 |
institutions | +1.691 |
climate | +1.656 |
Neg logit contributions | |
�� | -2.242 |
�� | -2.095 |
arthed | -2.077 |
yne | -2.008 |
Remy | -1.985 |
Token | close |
Token ID | 1969 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
� | +16.557 |
� | +15.586 |
policies | +14.156 |
institutions | +13.030 |
policy | +12.797 |
Neg logit contributions | |
�� | -13.405 |
�� | -12.401 |
�� | -11.986 |
��極 | -11.697 |
arthed | -11.693 |
Token | attention |
Token ID | 3241 |
Feature activation | +2.79e+01 |
Pos logit contributions | |
� | +18.094 |
� | +17.121 |
policies | +15.012 |
economic | +13.560 |
policy | +13.376 |
Neg logit contributions | |
�� | -24.621 |
�� | -24.244 |
�� | -22.919 |
��極 | -22.635 |
arthed | -22.290 |
Token | to |
Token ID | 284 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
� | +29.390 |
� | +27.556 |
policies | +24.083 |
policy | +21.857 |
institutions | +21.487 |
Neg logit contributions | |
�� | -19.167 |
�� | -18.893 |
�� | -18.696 |
arthed | -18.210 |
Canaver | -18.052 |
Token | Apple |
Token ID | 4196 |
Feature activation | +6.36e+01 |
Pos logit contributions | |
� | +27.185 |
� | +25.775 |
policies | +23.959 |
policy | +22.183 |
economic | +21.617 |
Neg logit contributions | |
�� | -21.788 |
��極 | -19.527 |
�� | -19.340 |
�� | -18.257 |
senal | -18.136 |
Token |
|
Token ID | 198 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
� | +50.082 |
� | +45.611 |
policies | +42.066 |
policy | +38.925 |
ideology | +37.221 |
Neg logit contributions | |
�� | -23.968 |
�� | -21.850 |
�� | -20.882 |
Canaver | -20.644 |
Vaugh | -20.534 |
Token |
|
Token ID | 198 |
Feature activation | +2.35e+01 |
Pos logit contributions | |
� | +20.056 |
� | +18.394 |
| +13.920 |
policies | +12.678 |
| +11.819 |
Neg logit contributions | |
senal | -33.202 |
�� | -30.970 |
everal | -29.515 |
srf | -29.268 |
��極 | -28.406 |
Token | Why |
Token ID | 5195 |
Feature activation | +2.36e+01 |
Pos logit contributions | |
� | +27.834 |
� | +24.627 |
| +20.662 |
policies | +20.643 |
institutions | +18.977 |
Neg logit contributions | |
�� | -19.137 |
senal | -16.119 |
�� | -15.810 |
�� | -15.658 |
��極 | -15.637 |
Token | women |
Token ID | 1466 |
Feature activation | +3.52e+01 |
Pos logit contributions | |
� | +28.121 |
� | +26.873 |
policies | +24.167 |
institutions | +22.954 |
climate | +22.431 |
Neg logit contributions | |
�� | -15.931 |
�� | -14.107 |
arthed | -13.995 |
�� | -13.921 |
��極 | -13.443 |
Token | are |
Token ID | 389 |
Feature activation | +8.82e-02 |
Pos logit contributions | |
� | +34.481 |
� | +32.305 |
policies | +28.191 |
institutions | +26.625 |
organizations | +26.385 |
Neg logit contributions | |
�� | -22.303 |
arthed | -21.411 |
�� | -21.397 |
senal | -20.061 |
��極 | -19.992 |
Token | far |
Token ID | 1290 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
� | +31.654 |
� | +30.652 |
policies | +28.372 |
climate | +27.428 |
economic | +26.925 |
Neg logit contributions | |
�� | -19.428 |
arthed | -17.438 |
senal | -17.316 |
��極 | -17.111 |
�� | -16.800 |
Token | - |
Token ID | 12 |
Feature activation | +2.47e+00 |
Pos logit contributions | |
� | +18.082 |
� | +17.065 |
policies | +14.927 |
climate | +14.175 |
institutions | +13.795 |
Neg logit contributions | |
�� | -14.217 |
arthed | -12.693 |
�� | -12.522 |
��極 | -12.335 |
yne | -12.287 |
Token | reaching |
Token ID | 30771 |
Feature activation | +5.09e+01 |
Pos logit contributions | |
� | +3.242 |
� | +3.052 |
policies | +2.747 |
institutions | +2.559 |
climate | +2.520 |
Neg logit contributions | |
�� | -2.199 |
�� | -2.015 |
arthed | -1.994 |
yne | -1.912 |
Remy | -1.887 |
Token | socio |
Token ID | 21790 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
� | +38.094 |
� | +38.044 |
policies | +36.239 |
climate | +35.787 |
economic | +35.274 |
Neg logit contributions | |
�� | -26.042 |
senal | -23.999 |
arthed | -23.665 |
��極 | -23.627 |
nesday | -22.704 |
Token | - |
Token ID | 12 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
� | +20.504 |
� | +19.109 |
policies | +16.546 |
economic | +15.721 |
institutions | +15.664 |
Neg logit contributions | |
�� | -19.333 |
Blossom | -17.936 |
�� | -17.799 |
arthed | -17.435 |
��極 | -17.434 |
Token | economic |
Token ID | 17079 |
Feature activation | +6.36e+01 |
Pos logit contributions | |
� | +24.611 |
� | +23.301 |
policies | +20.931 |
economic | +20.618 |
climate | +20.381 |
Neg logit contributions | |
�� | -20.862 |
��極 | -17.416 |
arthed | -17.416 |
�� | -17.368 |
�� | -17.257 |
Token | effects |
Token ID | 3048 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
� | +39.249 |
policies | +38.838 |
� | +38.715 |
climate | +37.002 |
policy | +36.346 |
Neg logit contributions | |
�� | -31.272 |
��極 | -28.135 |
senal | -28.073 |
arthed | -26.353 |
nesday | -26.077 |
Token | , |
Token ID | 11 |
Feature activation | +2.49e+01 |
Pos logit contributions | |
� | +15.504 |
� | +14.527 |
policies | +12.643 |
climate | +11.906 |
institutions | +11.633 |
Neg logit contributions | |
�� | -13.217 |
arthed | -11.954 |
�� | -11.928 |
yne | -11.811 |
�� | -11.634 |
Token | and |
Token ID | 290 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
� | +29.205 |
� | +27.645 |
policies | +25.465 |
climate | +24.574 |
institutions | +23.850 |
Neg logit contributions | |
�� | -17.641 |
��極 | -14.890 |
arthed | -14.737 |
�� | -14.656 |
nesday | -14.533 |
Token | human |
Token ID | 1692 |
Feature activation | +5.01e+01 |
Pos logit contributions | |
� | +23.918 |
� | +22.958 |
policies | +20.831 |
climate | +19.995 |
institutions | +19.567 |
Neg logit contributions | |
�� | -17.016 |
��極 | -15.142 |
�� | -15.069 |
arthed | -15.056 |
yne | -15.027 |
Token | health |
Token ID | 1535 |
Feature activation | +3.97e+01 |
Pos logit contributions | |
� | +39.160 |
� | +38.514 |
policies | +36.912 |
climate | +35.475 |
economic | +35.247 |
Neg logit contributions | |
�� | -25.687 |
��極 | -22.981 |
senal | -21.882 |
nesday | -21.839 |
�� | -21.110 |
Token | important |
Token ID | 1593 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
� | +10.069 |
� | +9.545 |
policies | +8.526 |
ideology | +7.770 |
institutions | +7.755 |
Neg logit contributions | |
�� | -9.823 |
arthed | -9.069 |
�� | -8.938 |
�� | -8.712 |
senal | -8.559 |
Token | contemporary |
Token ID | 11811 |
Feature activation | +3.09e+01 |
Pos logit contributions | |
� | +27.151 |
� | +26.784 |
policy | +24.051 |
policies | +24.050 |
economic | +23.610 |
Neg logit contributions | |
�� | -21.512 |
arthed | -20.178 |
senal | -19.628 |
��極 | -19.301 |
�� | -18.694 |
Token | challenge |
Token ID | 4427 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
� | +29.133 |
� | +28.936 |
policy | +26.289 |
policies | +26.147 |
climate | +25.524 |
Neg logit contributions | |
�� | -22.221 |
arthed | -20.749 |
��極 | -20.713 |
senal | -20.256 |
�� | -19.900 |
Token | in |
Token ID | 287 |
Feature activation | +2.78e+01 |
Pos logit contributions | |
� | +29.238 |
� | +27.684 |
policies | +25.133 |
policy | +23.499 |
climate | +23.408 |
Neg logit contributions | |
�� | -22.958 |
�� | -21.350 |
senal | -20.667 |
��極 | -20.595 |
arthed | -20.491 |
Token | injury |
Token ID | 5095 |
Feature activation | +5.16e+01 |
Pos logit contributions | |
� | +27.950 |
� | +26.978 |
policies | +25.955 |
policy | +24.628 |
climate | +24.231 |
Neg logit contributions | |
�� | -21.526 |
��極 | -18.478 |
�� | -18.397 |
arthed | -18.305 |
�� | -17.911 |
Token | prevention |
Token ID | 14196 |
Feature activation | +6.33e+01 |
Pos logit contributions | |
� | +36.639 |
� | +35.897 |
policies | +35.564 |
policy | +34.829 |
climate | +31.666 |
Neg logit contributions | |
�� | -27.966 |
senal | -25.713 |
�� | -25.421 |
arthed | -25.354 |
��極 | -25.049 |
Token | is |
Token ID | 318 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
� | +41.593 |
policies | +40.388 |
� | +39.450 |
policy | +38.678 |
initiatives | +35.997 |
Neg logit contributions | |
�� | -28.073 |
�� | -25.098 |
arthed | -24.820 |
��極 | -24.749 |
�� | -24.102 |
Token | the |
Token ID | 262 |
Feature activation | +2.37e+01 |
Pos logit contributions | |
� | +20.607 |
� | +19.880 |
policies | +18.451 |
climate | +17.329 |
policy | +17.076 |
Neg logit contributions | |
�� | -17.450 |
arthed | -15.964 |
�� | -15.836 |
��極 | -15.450 |
�� | -15.279 |
Token | need |
Token ID | 761 |
Feature activation | +7.55e+00 |
Pos logit contributions | |
� | +24.717 |
� | +23.928 |
policies | +22.462 |
policy | +21.172 |
climate | +21.157 |
Neg logit contributions | |
�� | -17.909 |
arthed | -17.131 |
�� | -16.255 |
senal | -15.971 |
��極 | -15.837 |
Token | to |
Token ID | 284 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
� | +9.132 |
� | +8.563 |
policies | +7.689 |
institutions | +7.076 |
climate | +6.996 |
Neg logit contributions | |
�� | -7.197 |
�� | -6.753 |
arthed | -6.738 |
yne | -6.387 |
�� | -6.378 |
Token | make |
Token ID | 787 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
� | +13.232 |
� | +12.525 |
policies | +11.020 |
climate | +9.981 |
policy | +9.958 |
Neg logit contributions | |
�� | -16.350 |
arthed | -15.347 |
��極 | -15.042 |
�� | -14.967 |
senal | -14.903 |
Token | This |
Token ID | 770 |
Feature activation | +3.02e+01 |
Pos logit contributions | |
� | +29.637 |
� | +28.045 |
policies | +24.036 |
| +22.594 |
institutions | +22.208 |
Neg logit contributions | |
�� | -19.323 |
senal | -17.407 |
�� | -16.555 |
avorite | -16.047 |
srf | -16.016 |
Token | � |
Token ID | 564 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
� | +29.277 |
� | +28.642 |
policies | +26.982 |
policy | +25.883 |
climate | +25.805 |
Neg logit contributions | |
�� | -20.040 |
arthed | -18.684 |
senal | -17.977 |
�� | -17.296 |
��極 | -17.164 |
Token | � |
Token ID | 250 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
�� | +0.888 |
�� | +0.794 |
arthed | +0.712 |
�� | +0.672 |
��極 | +0.641 |
Neg logit contributions | |
� | -3.343 |
� | -3.194 |
policies | -2.986 |
institutions | -2.821 |
climate | -2.803 |
Token | new |
Token ID | 649 |
Feature activation | +3.99e+01 |
Pos logit contributions | |
� | +19.410 |
� | +18.318 |
policies | +16.448 |
institutions | +15.596 |
climate | +15.431 |
Neg logit contributions | |
�� | -9.064 |
�� | -7.752 |
arthed | -7.678 |
�� | -7.410 |
yne | -7.405 |
Token | local |
Token ID | 1957 |
Feature activation | +4.93e+01 |
Pos logit contributions | |
� | +39.474 |
� | +39.292 |
policies | +33.770 |
economic | +33.277 |
climate | +33.188 |
Neg logit contributions | |
�� | -17.873 |
arthed | -17.628 |
senal | -16.566 |
�� | -15.540 |
fg | -15.375 |
Token | ism |
Token ID | 1042 |
Feature activation | +6.28e+01 |
Pos logit contributions | |
� | +41.505 |
� | +40.897 |
governance | +37.683 |
policies | +37.457 |
policy | +36.451 |
Neg logit contributions | |
�� | -21.173 |
senal | -19.559 |
arthed | -19.471 |
��極 | -18.768 |
�� | -18.218 |
Token | � |
Token ID | 447 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
� | +49.608 |
� | +48.132 |
policies | +40.541 |
policy | +38.552 |
ideology | +38.301 |
Neg logit contributions | |
�� | -21.477 |
arthed | -19.546 |
senal | -19.051 |
��極 | -17.583 |
�� | -17.571 |
Token | � |
Token ID | 251 |
Feature activation | +4.61e+01 |
Pos logit contributions | |
�� | +10.394 |
�� | +10.123 |
arthed | +9.107 |
�� | +9.033 |
� | +8.894 |
Neg logit contributions | |
� | -20.102 |
� | -18.977 |
policies | -17.911 |
behavi | -17.307 |
climate | -16.581 |
Token | is |
Token ID | 318 |
Feature activation | +8.53e+00 |
Pos logit contributions | |
� | +43.129 |
� | +41.013 |
policies | +36.199 |
| +34.365 |
institutions | +34.300 |
Neg logit contributions | |
�� | -19.648 |
senal | -16.793 |
arthed | -16.608 |
�� | -16.397 |
��極 | -16.379 |
Token | pragmatic |
Token ID | 33119 |
Feature activation | +4.14e+01 |
Pos logit contributions | |
� | +10.727 |
� | +10.139 |
policies | +9.084 |
institutions | +8.523 |
climate | +8.394 |
Neg logit contributions | |
�� | -7.914 |
arthed | -7.082 |
�� | -7.046 |
yne | -6.818 |
�� | -6.718 |
Token | and |
Token ID | 290 |
Feature activation | +4.43e+01 |
Pos logit contributions | |
� | +37.615 |
� | +36.399 |
policies | +32.754 |
policy | +31.376 |
governance | +30.821 |
Neg logit contributions | |
�� | -25.096 |
arthed | -22.349 |
senal | -21.754 |
��極 | -20.876 |
ometown | -20.819 |
Token | The |
Token ID | 464 |
Feature activation | +2.70e+01 |
Pos logit contributions | |
� | +28.524 |
� | +25.684 |
| +20.677 |
policies | +20.592 |
institutions | +19.063 |
Neg logit contributions | |
�� | -19.648 |
senal | -17.717 |
��極 | -16.265 |
srf | -16.031 |
arthed | -15.978 |
Token | truth |
Token ID | 3872 |
Feature activation | +3.68e+01 |
Pos logit contributions | |
� | +31.023 |
� | +30.032 |
policies | +27.181 |
policy | +25.362 |
climate | +25.246 |
Neg logit contributions | |
�� | -17.023 |
arthed | -15.458 |
��極 | -14.160 |
senal | -14.132 |
�� | -14.124 |
Token | is |
Token ID | 318 |
Feature activation | +2.79e+01 |
Pos logit contributions | |
� | +36.332 |
� | +34.711 |
policies | +28.820 |
climate | +27.614 |
policy | +27.509 |
Neg logit contributions | |
�� | -22.324 |
�� | -20.268 |
senal | -19.847 |
arthed | -19.476 |
��極 | -19.038 |
Token | , |
Token ID | 11 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
� | +31.612 |
� | +30.656 |
policies | +26.247 |
institutions | +24.724 |
climate | +24.662 |
Neg logit contributions | |
�� | -18.647 |
arthed | -16.600 |
�� | -15.381 |
��極 | -15.093 |
senal | -14.875 |
Token | Better |
Token ID | 11625 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
� | +31.787 |
� | +30.729 |
policies | +27.405 |
institutions | +25.720 |
policy | +25.375 |
Neg logit contributions | |
�� | -17.894 |
arthed | -15.828 |
�� | -15.189 |
��極 | -14.912 |
�� | -14.474 |
Token | Together |
Token ID | 17083 |
Feature activation | +6.19e+01 |
Pos logit contributions | |
� | +1.211 |
� | +1.134 |
policies | +1.009 |
institutions | +0.929 |
climate | +0.912 |
Neg logit contributions | |
�� | -1.084 |
�� | -1.018 |
arthed | -1.012 |
yne | -0.982 |
Remy | -0.975 |
Token | do |
Token ID | 466 |
Feature activation | +3.04e+01 |
Pos logit contributions | |
� | +48.087 |
� | +45.031 |
policies | +39.573 |
ideology | +37.019 |
policy | +36.714 |
Neg logit contributions | |
�� | -23.594 |
arthed | -19.970 |
�� | -18.916 |
��極 | -18.557 |
senal | -17.806 |
Token | no |
Token ID | 645 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
� | +34.472 |
� | +32.596 |
policies | +28.358 |
| +26.758 |
institutions | +26.407 |
Neg logit contributions | |
�� | -17.450 |
arthed | -15.688 |
�� | -15.396 |
��極 | -15.104 |
nesday | -14.262 |
Token | love |
Token ID | 1842 |
Feature activation | +1.98e+01 |
Pos logit contributions | |
� | +23.084 |
� | +22.085 |
policies | +19.482 |
ideology | +18.224 |
policy | +18.051 |
Neg logit contributions | |
�� | -15.821 |
�� | -14.223 |
arthed | -14.161 |
��極 | -13.619 |
senal | -13.187 |
Token | the |
Token ID | 262 |
Feature activation | +2.60e+01 |
Pos logit contributions | |
� | +25.542 |
� | +24.350 |
policies | +21.749 |
institutions | +20.045 |
policy | +20.030 |
Neg logit contributions | |
�� | -14.682 |
�� | -12.933 |
arthed | -12.849 |
��極 | -11.881 |
�� | -11.742 |
Token | union |
Token ID | 6441 |
Feature activation | +3.51e+01 |
Pos logit contributions | |
� | +29.790 |
� | +29.042 |
policies | +25.906 |
institutions | +24.417 |
ideology | +23.887 |
Neg logit contributions | |
�� | -18.286 |
arthed | -16.043 |
�� | -15.302 |
senal | -14.470 |
��極 | -14.398 |
Token | warned |
Token ID | 7728 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
� | +6.709 |
� | +6.395 |
policies | +5.880 |
institutions | +5.579 |
climate | +5.532 |
Neg logit contributions | |
�� | -2.169 |
�� | -1.846 |
arthed | -1.825 |
yne | -1.678 |
�� | -1.641 |
Token | Monday |
Token ID | 3321 |
Feature activation | +9.36e+00 |
Pos logit contributions | |
� | +18.482 |
� | +17.489 |
policies | +15.760 |
climate | +15.329 |
institutions | +14.751 |
Neg logit contributions | |
�� | -13.992 |
�� | -12.578 |
arthed | -12.147 |
��極 | -12.110 |
yne | -11.610 |
Token | that |
Token ID | 326 |
Feature activation | +2.72e+01 |
Pos logit contributions | |
� | +11.000 |
� | +10.350 |
policies | +9.103 |
climate | +8.483 |
institutions | +8.423 |
Neg logit contributions | |
�� | -9.407 |
�� | -8.719 |
arthed | -8.585 |
yne | -8.255 |
��極 | -8.236 |
Token | the |
Token ID | 262 |
Feature activation | +2.25e+01 |
Pos logit contributions | |
� | +29.112 |
� | +27.588 |
policies | +26.119 |
climate | +25.873 |
institutions | +24.414 |
Neg logit contributions | |
�� | -20.801 |
�� | -17.811 |
��極 | -17.346 |
arthed | -17.246 |
yne | -16.540 |
Token | international |
Token ID | 3230 |
Feature activation | +4.21e+01 |
Pos logit contributions | |
� | +25.153 |
� | +23.701 |
policies | +22.707 |
climate | +22.280 |
institutions | +21.151 |
Neg logit contributions | |
�� | -17.659 |
arthed | -15.579 |
�� | -15.480 |
senal | -14.970 |
��極 | -14.916 |
Token | community |
Token ID | 2055 |
Feature activation | +6.18e+01 |
Pos logit contributions | |
� | +34.856 |
climate | +33.683 |
� | +32.682 |
institutions | +31.931 |
policies | +31.887 |
Neg logit contributions | |
�� | -25.187 |
��極 | -23.546 |
arthed | -23.186 |
�� | -22.945 |
senal | -21.468 |
Token | had |
Token ID | 550 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
� | +45.006 |
� | +43.305 |
policies | +37.238 |
climate | +35.877 |
needs | +35.765 |
Neg logit contributions | |
�� | -27.840 |
�� | -26.314 |
senal | -25.403 |
arthed | -24.711 |
��極 | -24.225 |
Token | no |
Token ID | 645 |
Feature activation | +3.64e+01 |
Pos logit contributions | |
� | +15.768 |
� | +15.024 |
policies | +13.487 |
institutions | +12.545 |
climate | +12.497 |
Neg logit contributions | |
�� | -10.861 |
�� | -9.814 |
arthed | -9.711 |
�� | -9.459 |
senal | -9.439 |
Token | option |
Token ID | 3038 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
� | +31.585 |
� | +30.940 |
policies | +29.426 |
economic | +27.577 |
policy | +27.574 |
Neg logit contributions | |
�� | -25.234 |
�� | -23.101 |
��極 | -23.084 |
�� | -22.988 |
senal | -22.126 |
Token | but |
Token ID | 475 |
Feature activation | +1.88e+01 |
Pos logit contributions | |
� | +14.902 |
� | +13.892 |
policies | +11.536 |
institutions | +10.551 |
climate | +10.425 |
Neg logit contributions | |
�� | -16.310 |
�� | -15.049 |
arthed | -14.900 |
senal | -14.611 |
yne | -14.570 |
Token | to |
Token ID | 284 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
� | +19.840 |
� | +18.611 |
policies | +16.343 |
climate | +15.151 |
ideology | +14.784 |
Neg logit contributions | |
�� | -17.844 |
�� | -17.242 |
arthed | -16.629 |
yne | -15.648 |
nox | -15.613 |
Token | what |
Token ID | 644 |
Feature activation | +3.83e+01 |
Pos logit contributions | |
� | +19.597 |
� | +18.695 |
policies | +16.741 |
climate | +15.488 |
policy | +15.472 |
Neg logit contributions | |
�� | -14.187 |
arthed | -12.832 |
�� | -12.580 |
senal | -12.161 |
��極 | -12.151 |
Token | many |
Token ID | 867 |
Feature activation | +3.42e+01 |
Pos logit contributions | |
� | +38.945 |
� | +37.651 |
policies | +34.146 |
policy | +31.900 |
institutions | +31.760 |
Neg logit contributions | |
�� | -21.053 |
arthed | -18.619 |
�� | -17.935 |
senal | -17.253 |
�� | -17.020 |
Token | thought |
Token ID | 1807 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
� | +34.907 |
� | +33.315 |
policies | +29.618 |
institutions | +28.495 |
policy | +27.868 |
Neg logit contributions | |
�� | -22.337 |
arthed | -19.574 |
senal | -18.687 |
�� | -18.618 |
Canaver | -17.838 |
Token | the |
Token ID | 262 |
Feature activation | +2.78e+01 |
Pos logit contributions | |
� | +32.352 |
� | +30.892 |
policies | +26.820 |
institutions | +25.162 |
policy | +25.044 |
Neg logit contributions | |
�� | -19.188 |
�� | -17.073 |
senal | -16.758 |
arthed | -16.757 |
yne | -15.676 |
Token | public |
Token ID | 1171 |
Feature activation | +4.98e+01 |
Pos logit contributions | |
� | +30.329 |
� | +29.075 |
policies | +27.001 |
policy | +25.145 |
institutions | +24.765 |
Neg logit contributions | |
�� | -18.994 |
arthed | -17.313 |
�� | -17.127 |
senal | -16.821 |
��極 | -16.237 |
Token | service |
Token ID | 2139 |
Feature activation | +6.18e+01 |
Pos logit contributions | |
� | +42.518 |
� | +39.731 |
policies | +35.616 |
institutions | +34.307 |
policy | +34.210 |
Neg logit contributions | |
�� | -25.464 |
�� | -21.932 |
Canaver | -21.415 |
arthed | -21.143 |
yne | -20.335 |
Token | was |
Token ID | 373 |
Feature activation | +2.74e+01 |
Pos logit contributions | |
� | +46.799 |
� | +44.185 |
policies | +38.732 |
institutions | +37.302 |
policy | +37.066 |
Neg logit contributions | |
�� | -26.456 |
�� | -22.295 |
arthed | -22.233 |
senal | -21.681 |
bris | -20.762 |
Token | returning |
Token ID | 8024 |
Feature activation | +2.34e+01 |
Pos logit contributions | |
� | +30.492 |
� | +28.345 |
policies | +23.432 |
institutions | +22.561 |
| +22.181 |
Neg logit contributions | |
�� | -20.710 |
arthed | -19.048 |
�� | -18.338 |
Canaver | -17.608 |
senal | -17.557 |
Token | to |
Token ID | 284 |
Feature activation | +3.19e+01 |
Pos logit contributions | |
� | +26.251 |
� | +24.655 |
policies | +20.937 |
institutions | +19.570 |
climate | +19.507 |
Neg logit contributions | |
�� | -18.533 |
arthed | -17.232 |
�� | -17.226 |
yne | -16.206 |
��極 | -15.871 |
Token | under |
Token ID | 739 |
Feature activation | +2.09e+01 |
Pos logit contributions | |
� | +35.476 |
� | +33.779 |
policies | +28.985 |
institutions | +27.672 |
economic | +27.343 |
Neg logit contributions | |
�� | -19.132 |
arthed | -17.950 |
�� | -17.188 |
yne | -16.543 |
senal | -16.381 |
Token | the |
Token ID | 262 |
Feature activation | +2.34e+01 |
Pos logit contributions | |
� | +25.628 |
� | +24.882 |
policies | +22.490 |
institutions | +20.879 |
climate | +20.733 |
Neg logit contributions | |
�� | -14.393 |
arthed | -13.151 |
senal | -12.608 |
��極 | -12.278 |
�� | -12.056 |
Token | real |
Token ID | 1103 |
Feature activation | +3.50e+01 |
Pos logit contributions | |
� | +11.586 |
� | +10.975 |
policies | +10.027 |
institutions | +9.280 |
climate | +9.241 |
Neg logit contributions | |
�� | -8.043 |
�� | -7.308 |
arthed | -7.271 |
�� | -6.877 |
yne | -6.855 |
Token | problem |
Token ID | 1917 |
Feature activation | +3.11e+01 |
Pos logit contributions | |
� | +36.206 |
� | +35.443 |
policies | +32.160 |
economic | +30.841 |
climate | +30.730 |
Neg logit contributions | |
�� | -19.233 |
��極 | -16.476 |
arthed | -16.136 |
�� | -16.117 |
�� | -15.070 |
Token | for |
Token ID | 329 |
Feature activation | +8.72e+00 |
Pos logit contributions | |
� | +34.464 |
� | +32.671 |
policies | +27.479 |
climate | +26.249 |
policy | +26.007 |
Neg logit contributions | |
�� | -18.919 |
�� | -17.138 |
arthed | -16.993 |
��極 | -16.768 |
senal | -16.487 |
Token | the |
Token ID | 262 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
� | +11.624 |
� | +11.026 |
policies | +10.038 |
institutions | +9.376 |
climate | +9.336 |
Neg logit contributions | |
�� | -7.347 |
�� | -6.653 |
arthed | -6.534 |
��極 | -6.316 |
yne | -6.230 |
Token | United |
Token ID | 1578 |
Feature activation | -3.71e+00 |
Pos logit contributions | |
� | +19.215 |
� | +18.342 |
policies | +16.894 |
climate | +15.719 |
institutions | +15.665 |
Neg logit contributions | |
�� | -13.886 |
�� | -12.327 |
arthed | -12.270 |
��極 | -11.727 |
�� | -11.460 |
Token | States |
Token ID | 1829 |
Feature activation | +6.18e+01 |
Pos logit contributions | |
�� | +4.597 |
arthed | +4.446 |
�� | +4.422 |
Blossom | +4.385 |
yne | +4.383 |
Neg logit contributions | |
� | -3.094 |
� | -2.826 |
policies | -2.471 |
institutions | -2.214 |
ideology | -2.167 |
Token | in |
Token ID | 287 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
� | +48.740 |
� | +45.952 |
policies | +38.606 |
policy | +37.612 |
institutions | +36.512 |
Neg logit contributions | |
�� | -24.223 |
�� | -22.222 |
��極 | -21.817 |
arthed | -21.101 |
�� | -19.635 |
Token | this |
Token ID | 428 |
Feature activation | +2.58e+01 |
Pos logit contributions | |
� | +23.657 |
� | +22.780 |
policies | +20.441 |
climate | +19.291 |
institutions | +19.015 |
Neg logit contributions | |
�� | -15.511 |
�� | -14.237 |
��極 | -13.528 |
arthed | -13.398 |
�� | -13.092 |
Token | arrangement |
Token ID | 13888 |
Feature activation | +4.84e+01 |
Pos logit contributions | |
� | +28.148 |
� | +27.180 |
climate | +24.346 |
policies | +24.275 |
economic | +23.621 |
Neg logit contributions | |
�� | -19.465 |
arthed | -17.279 |
�� | -16.747 |
��極 | -16.417 |
�� | -16.378 |
Token | appears |
Token ID | 3568 |
Feature activation | +3.58e+00 |
Pos logit contributions | |
� | +42.104 |
� | +39.887 |
policies | +33.153 |
concerns | +32.165 |
| +31.605 |
Neg logit contributions | |
�� | -22.987 |
senal | -22.546 |
arthed | -22.269 |
�� | -22.061 |
��極 | -21.405 |
Token | to |
Token ID | 284 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
� | +4.566 |
� | +4.298 |
policies | +3.852 |
institutions | +3.580 |
climate | +3.523 |
Neg logit contributions | |
�� | -3.283 |
�� | -3.021 |
arthed | -3.002 |
yne | -2.885 |
Remy | -2.837 |
Token | � |
Token ID | 564 |
Feature activation | -2.17e+01 |
Pos logit contributions | |
� | +45.615 |
� | +43.415 |
policies | +38.083 |
policy | +36.167 |
ideology | +35.416 |
Neg logit contributions | |
�� | -24.227 |
arthed | -21.149 |
��極 | -19.884 |
senal | -19.694 |
�� | -19.003 |
Token | � |
Token ID | 250 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
�� | +23.425 |
�� | +23.330 |
�� | +21.775 |
�� | +21.742 |
� | +21.561 |
Neg logit contributions | |
� | -13.839 |
� | -12.838 |
policies | -11.644 |
climate | -10.714 |
behavi | -10.502 |
Token | prov |
Token ID | 15234 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
� | +23.270 |
� | +21.452 |
policies | +18.917 |
institutions | +17.546 |
| +17.396 |
Neg logit contributions | |
�� | -15.630 |
�� | -13.269 |
�� | -13.259 |
arthed | -12.886 |
senal | -12.832 |
Token | ides |
Token ID | 1460 |
Feature activation | +3.69e+01 |
Pos logit contributions | |
� | +17.389 |
� | +16.264 |
policies | +14.342 |
institutions | +13.268 |
policy | +13.101 |
Neg logit contributions | |
�� | -12.241 |
�� | -11.039 |
arthed | -10.688 |
senal | -10.592 |
��極 | -10.506 |
Token | responsible |
Token ID | 4497 |
Feature activation | +4.44e+01 |
Pos logit contributions | |
� | +36.630 |
� | +36.171 |
policies | +31.792 |
institutions | +30.019 |
climate | +29.941 |
Neg logit contributions | |
�� | -22.901 |
arthed | -20.535 |
��極 | -19.235 |
senal | -19.049 |
�� | -18.467 |
Token | economic |
Token ID | 3034 |
Feature activation | +6.14e+01 |
Pos logit contributions | |
� | +38.388 |
� | +37.697 |
policies | +36.142 |
governance | +33.816 |
policy | +33.701 |
Neg logit contributions | |
�� | -27.067 |
arthed | -25.307 |
senal | -22.986 |
��極 | -22.920 |
�� | -21.820 |
Token | leadership |
Token ID | 5531 |
Feature activation | +3.15e+01 |
Pos logit contributions | |
policies | +41.945 |
� | +40.890 |
policy | +39.791 |
� | +39.650 |
governance | +38.243 |
Neg logit contributions | |
�� | -33.356 |
��極 | -29.948 |
arthed | -29.293 |
senal | -29.165 |
�� | -27.188 |
Token | in |
Token ID | 287 |
Feature activation | +3.47e+01 |
Pos logit contributions | |
� | +34.325 |
� | +31.902 |
policies | +27.279 |
institutions | +25.056 |
policy | +25.023 |
Neg logit contributions | |
�� | -21.798 |
arthed | -20.532 |
senal | -19.168 |
�� | -18.677 |
��極 | -18.677 |
Token | tough |
Token ID | 5802 |
Feature activation | +4.04e+01 |
Pos logit contributions | |
� | +35.002 |
� | +33.670 |
policies | +30.896 |
climate | +29.374 |
economic | +29.302 |
Neg logit contributions | |
�� | -22.078 |
arthed | -19.947 |
senal | -18.501 |
��極 | -18.383 |
�� | -18.126 |
Token | times |
Token ID | 1661 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
� | +35.599 |
� | +33.901 |
policies | +32.870 |
economic | +32.798 |
climate | +31.466 |
Neg logit contributions | |
�� | -27.413 |
arthed | -23.276 |
�� | -22.448 |
��極 | -21.536 |
�� | -21.276 |
Token | . |
Token ID | 13 |
Feature activation | +3.07e+01 |
Pos logit contributions | |
� | +21.798 |
� | +20.448 |
policies | +17.100 |
climate | +16.059 |
institutions | +15.834 |
Neg logit contributions | |
�� | -15.928 |
arthed | -14.630 |
senal | -13.788 |
�� | -13.688 |
��極 | -13.366 |
Token | making |
Token ID | 1642 |
Feature activation | +8.31e+00 |
Pos logit contributions | |
�� | +17.427 |
�� | +17.236 |
Reeves | +17.129 |
yne | +16.887 |
arthed | +16.866 |
Neg logit contributions | |
� | -11.811 |
� | -10.260 |
policies | -9.686 |
behavi | -8.781 |
institutions | -8.387 |
Token | today |
Token ID | 1909 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
� | +10.059 |
� | +9.473 |
policies | +8.204 |
institutions | +7.599 |
climate | +7.540 |
Neg logit contributions | |
�� | -8.280 |
�� | -7.630 |
arthed | -7.615 |
��極 | -7.243 |
senal | -7.192 |
Token | : |
Token ID | 25 |
Feature activation | +3.67e+01 |
Pos logit contributions | |
� | +23.619 |
� | +22.076 |
policies | +18.310 |
climate | +17.304 |
policy | +17.070 |
Neg logit contributions | |
�� | -17.153 |
arthed | -16.285 |
�� | -15.834 |
senal | -15.486 |
��極 | -15.437 |
Token | that |
Token ID | 326 |
Feature activation | +3.62e+01 |
Pos logit contributions | |
� | +38.166 |
� | +37.327 |
policies | +32.657 |
economic | +30.939 |
climate | +30.784 |
Neg logit contributions | |
�� | -20.373 |
arthed | -18.831 |
�� | -16.362 |
senal | -16.249 |
��極 | -16.215 |
Token | the |
Token ID | 262 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
� | +37.181 |
� | +36.291 |
policies | +32.162 |
climate | +30.552 |
institutions | +30.401 |
Neg logit contributions | |
�� | -21.359 |
arthed | -19.284 |
��極 | -17.501 |
senal | -17.344 |
�� | -16.349 |
Token | coalition |
Token ID | 9906 |
Feature activation | +6.14e+01 |
Pos logit contributions | |
� | +25.126 |
� | +24.215 |
policies | +22.378 |
institutions | +20.876 |
climate | +20.691 |
Neg logit contributions | |
�� | -16.307 |
arthed | -15.052 |
��極 | -14.051 |
�� | -14.021 |
senal | -13.850 |
Token | was |
Token ID | 373 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
� | +47.024 |
� | +45.292 |
policies | +39.448 |
institutions | +37.271 |
policy | +37.126 |
Neg logit contributions | |
�� | -25.234 |
arthed | -22.874 |
��極 | -21.834 |
senal | -20.717 |
�� | -20.499 |
Token | illegitimate |
Token ID | 41368 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
� | +18.262 |
� | +17.494 |
policies | +15.496 |
institutions | +14.546 |
climate | +14.413 |
Neg logit contributions | |
�� | -13.871 |
arthed | -12.356 |
�� | -11.844 |
��極 | -11.523 |
�� | -11.471 |
Token | , |
Token ID | 11 |
Feature activation | +2.56e+01 |
Pos logit contributions | |
� | +24.694 |
� | +23.367 |
policies | +19.974 |
institutions | +18.763 |
ideology | +18.264 |
Neg logit contributions | |
�� | -19.518 |
arthed | -17.728 |
�� | -16.926 |
senal | -16.848 |
�� | -16.810 |
Token | divisive |
Token ID | 29656 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
� | +27.623 |
� | +26.539 |
policies | +23.591 |
institutions | +22.252 |
climate | +21.797 |
Neg logit contributions | |
�� | -19.844 |
arthed | -17.238 |
senal | -17.143 |
�� | -16.659 |
�� | -16.360 |
Token | , |
Token ID | 11 |
Feature activation | +3.14e+01 |
Pos logit contributions | |
� | +28.812 |
� | +27.544 |
policies | +24.327 |
institutions | +22.587 |
ideology | +22.511 |
Neg logit contributions | |
�� | -23.826 |
arthed | -21.404 |
��極 | -19.846 |
�� | -19.349 |
�� | -19.338 |
Token | are |
Token ID | 389 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
� | +39.569 |
� | +36.625 |
policies | +30.665 |
| +29.635 |
policy | +28.501 |
Neg logit contributions | |
�� | -21.869 |
senal | -20.709 |
arthed | -19.407 |
��極 | -19.266 |
�� | -18.963 |
Token | trying |
Token ID | 2111 |
Feature activation | +3.51e+01 |
Pos logit contributions | |
� | +23.656 |
� | +22.290 |
policies | +19.361 |
institutions | +17.855 |
climate | +17.760 |
Neg logit contributions | |
�� | -16.692 |
arthed | -14.443 |
�� | -13.804 |
��極 | -13.800 |
senal | -13.467 |
Token | to |
Token ID | 284 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
� | +35.467 |
� | +33.400 |
policies | +27.794 |
institutions | +25.975 |
| +25.953 |
Neg logit contributions | |
�� | -21.233 |
arthed | -20.430 |
Remy | -19.009 |
�� | -19.002 |
ometown | -18.925 |
Token | alleviate |
Token ID | 30885 |
Feature activation | +3.32e+01 |
Pos logit contributions | |
� | +25.553 |
� | +23.805 |
policies | +19.640 |
climate | +18.224 |
policy | +18.096 |
Neg logit contributions | |
�� | -22.853 |
senal | -20.254 |
arthed | -20.148 |
��極 | -20.099 |
�� | -19.130 |
Token | , |
Token ID | 11 |
Feature activation | +4.42e+01 |
Pos logit contributions | |
� | +34.955 |
� | +32.924 |
policies | +27.675 |
climate | +26.193 |
policy | +25.679 |
Neg logit contributions | |
�� | -22.167 |
arthed | -19.720 |
senal | -19.307 |
��極 | -18.794 |
�� | -18.421 |
Token | that |
Token ID | 326 |
Feature activation | +6.12e+01 |
Pos logit contributions | |
� | +42.628 |
� | +40.484 |
policies | +34.218 |
policy | +32.043 |
climate | +32.013 |
Neg logit contributions | |
�� | -22.595 |
senal | -19.537 |
arthed | -19.366 |
��極 | -18.438 |
ometown | -16.811 |
Token | is |
Token ID | 318 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
� | +47.560 |
� | +45.062 |
policies | +37.466 |
policy | +36.263 |
| +35.919 |
Neg logit contributions | |
�� | -26.612 |
senal | -22.691 |
��極 | -21.893 |
arthed | -21.464 |
�� | -20.434 |
Token | something |
Token ID | 1223 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
� | +15.187 |
� | +14.439 |
policies | +12.675 |
policy | +11.679 |
climate | +11.642 |
Neg logit contributions | |
�� | -11.176 |
arthed | -9.679 |
�� | -9.396 |
��極 | -9.261 |
senal | -9.184 |
Token | I |
Token ID | 314 |
Feature activation | +3.79e+01 |
Pos logit contributions | |
� | +19.063 |
� | +18.107 |
policies | +15.427 |
policy | +14.237 |
climate | +14.093 |
Neg logit contributions | |
�� | -17.337 |
arthed | -15.074 |
senal | -14.934 |
�� | -14.680 |
�� | -14.564 |
Token | would |
Token ID | 561 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
� | +37.453 |
� | +35.276 |
policies | +28.510 |
| +27.379 |
policy | +27.329 |
Neg logit contributions | |
�� | -26.168 |
senal | -24.551 |
arthed | -22.829 |
��極 | -21.212 |
�� | -20.614 |
Token | be |
Token ID | 307 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
� | +18.558 |
� | +17.293 |
policies | +14.496 |
policy | +13.328 |
climate | +13.105 |
Neg logit contributions | |
�� | -17.806 |
senal | -16.787 |
arthed | -16.427 |
��極 | -15.803 |
�� | -15.620 |
Token | s |
Token ID | 82 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
� | +0.705 |
� | +0.663 |
policies | +0.599 |
institutions | +0.557 |
climate | +0.548 |
Neg logit contributions | |
�� | -0.503 |
arthed | -0.467 |
�� | -0.466 |
yne | -0.449 |
Remy | -0.443 |
Token | civil |
Token ID | 3026 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
� | +28.878 |
� | +27.831 |
policies | +26.483 |
climate | +24.966 |
policy | +24.597 |
Neg logit contributions | |
�� | -18.137 |
�� | -16.298 |
arthed | -15.877 |
��極 | -15.548 |
Canaver | -15.495 |
Token | - |
Token ID | 12 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
� | +27.249 |
� | +25.974 |
policies | +24.481 |
institutions | +22.707 |
policy | +22.161 |
Neg logit contributions | |
�� | -29.196 |
senal | -27.439 |
��極 | -26.322 |
�� | -26.158 |
�� | -25.962 |
Token | rights |
Token ID | 28046 |
Feature activation | +3.43e+01 |
Pos logit contributions | |
� | +10.753 |
� | +9.835 |
policies | +8.253 |
institutions | +7.316 |
| +7.209 |
Neg logit contributions | |
�� | -15.598 |
senal | -14.561 |
�� | -14.303 |
��極 | -14.269 |
�� | -13.970 |
Token | office |
Token ID | 2607 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
� | +31.528 |
� | +30.181 |
policies | +29.382 |
policy | +27.401 |
climate | +26.649 |
Neg logit contributions | |
�� | -24.195 |
�� | -21.271 |
Canaver | -20.212 |
��極 | -20.144 |
arthed | -19.881 |
Token | : |
Token ID | 25 |
Feature activation | +6.10e+01 |
Pos logit contributions | |
� | +24.465 |
� | +23.063 |
policies | +19.895 |
policy | +18.298 |
climate | +18.128 |
Neg logit contributions | |
�� | -17.997 |
�� | -16.617 |
arthed | -16.197 |
��極 | -15.453 |
�� | -15.453 |
Token | develop |
Token ID | 1205 |
Feature activation | +4.69e+01 |
Pos logit contributions | |
� | +48.042 |
� | +46.359 |
policies | +39.401 |
climate | +36.879 |
economic | +36.652 |
Neg logit contributions | |
�� | -20.111 |
�� | -19.767 |
zzy | -19.552 |
arthed | -18.977 |
Canaver | -18.863 |
Token | a |
Token ID | 257 |
Feature activation | +2.98e+01 |
Pos logit contributions | |
� | +39.466 |
� | +39.134 |
policies | +37.972 |
policy | +34.525 |
climate | +34.049 |
Neg logit contributions | |
�� | -23.092 |
�� | -21.210 |
�� | -20.247 |
Canaver | -20.247 |
��極 | -19.980 |
Token | � |
Token ID | 564 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
� | +30.510 |
� | +30.210 |
policies | +27.232 |
policy | +26.731 |
climate | +26.660 |
Neg logit contributions | |
�� | -20.124 |
arthed | -18.297 |
�� | -17.796 |
Canaver | -17.092 |
�� | -17.006 |
Token | � |
Token ID | 250 |
Feature activation | +2.46e+01 |
Pos logit contributions | |
�� | +24.854 |
�� | +24.828 |
� | +24.124 |
� | +23.139 |
�� | +23.133 |
Neg logit contributions | |
� | -15.663 |
� | -14.360 |
behavi | -13.524 |
policies | -13.387 |
climate | -11.997 |
Token | pro |
Token ID | 1676 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
� | +29.807 |
� | +27.611 |
policies | +25.052 |
climate | +23.671 |
policy | +23.519 |
Neg logit contributions | |
�� | -16.238 |
�� | -13.712 |
�� | -13.673 |
Canaver | -13.229 |
Remy | -13.217 |
Token | Cruz |
Token ID | 8742 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
� | +15.245 |
� | +14.390 |
policies | +12.777 |
climate | +11.792 |
institutions | +11.764 |
Neg logit contributions | |
�� | -9.690 |
arthed | -8.535 |
�� | -8.345 |
senal | -8.202 |
��極 | -8.137 |
Token | continued |
Token ID | 3767 |
Feature activation | -8.15e+00 |
Pos logit contributions | |
� | +16.084 |
� | +15.106 |
policies | +13.191 |
climate | +12.119 |
policy | +12.045 |
Neg logit contributions | |
�� | -11.226 |
arthed | -9.743 |
�� | -9.694 |
senal | -9.668 |
�� | -9.335 |
Token | . |
Token ID | 13 |
Feature activation | +4.30e+01 |
Pos logit contributions | |
�� | +6.976 |
�� | +6.561 |
arthed | +6.509 |
yne | +6.274 |
Remy | +6.209 |
Neg logit contributions | |
� | -9.388 |
� | -8.841 |
policies | -8.181 |
institutions | -7.680 |
ideology | -7.458 |
Token | � |
Token ID | 564 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
� | +40.730 |
� | +39.759 |
policies | +31.232 |
| +29.809 |
climate | +29.449 |
Neg logit contributions | |
�� | -21.308 |
arthed | -19.600 |
senal | -19.273 |
�� | -18.383 |
yne | -18.092 |
Token | � |
Token ID | 250 |
Feature activation | +3.60e+01 |
Pos logit contributions | |
�� | +20.450 |
�� | +19.826 |
� | +19.767 |
�� | +18.980 |
�� | +18.817 |
Neg logit contributions | |
� | -15.714 |
� | -14.321 |
policies | -14.287 |
behavi | -14.184 |
governance | -13.101 |
Token | That |
Token ID | 2504 |
Feature activation | +6.03e+01 |
Pos logit contributions | |
� | +35.389 |
� | +32.506 |
policies | +27.382 |
| +26.616 |
policy | +24.965 |
Neg logit contributions | |
�� | -25.323 |
senal | -22.141 |
arthed | -19.606 |
srf | -19.571 |
��極 | -19.447 |
Token | is |
Token ID | 318 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
� | +47.730 |
� | +45.311 |
policies | +39.637 |
policy | +38.054 |
ideology | +38.044 |
Neg logit contributions | |
�� | -26.335 |
arthed | -20.367 |
senal | -19.898 |
��極 | -19.406 |
yne | -19.278 |
Token | fundamentally |
Token ID | 17640 |
Feature activation | +3.00e+01 |
Pos logit contributions | |
� | +30.264 |
� | +29.429 |
policies | +25.701 |
policy | +24.244 |
ideology | +24.006 |
Neg logit contributions | |
�� | -22.325 |
arthed | -18.010 |
��極 | -17.686 |
yne | -17.530 |
�� | -17.484 |
Token | dangerous |
Token ID | 4923 |
Feature activation | +4.03e+01 |
Pos logit contributions | |
� | +29.719 |
� | +29.051 |
policies | +25.051 |
political | +23.489 |
policy | +23.477 |
Neg logit contributions | |
�� | -26.028 |
arthed | -21.026 |
senal | -20.644 |
��極 | -20.263 |
nesday | -19.963 |
Token | to |
Token ID | 284 |
Feature activation | +4.05e+01 |
Pos logit contributions | |
� | +37.017 |
� | +35.928 |
policies | +31.653 |
policy | +30.507 |
ideology | +29.971 |
Neg logit contributions | |
�� | -27.126 |
arthed | -22.958 |
senal | -21.916 |
��極 | -21.527 |
�� | -21.151 |
Token | the |
Token ID | 262 |
Feature activation | +3.98e+01 |
Pos logit contributions | |
� | +36.740 |
� | +36.229 |
policies | +32.542 |
institutions | +31.278 |
policy | +30.688 |
Neg logit contributions | |
�� | -25.913 |
��極 | -21.382 |
arthed | -21.355 |
senal | -20.558 |
yne | -20.355 |
Token | to |
Token ID | 284 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
� | +9.233 |
� | +8.664 |
policies | +7.746 |
institutions | +7.163 |
climate | +7.056 |
Neg logit contributions | |
�� | -7.125 |
�� | -6.595 |
arthed | -6.571 |
yne | -6.313 |
Remy | -6.188 |
Token | ignore |
Token ID | 8856 |
Feature activation | +3.05e+01 |
Pos logit contributions | |
� | +14.335 |
� | +13.551 |
policies | +11.924 |
policy | +10.728 |
institutions | +10.710 |
Neg logit contributions | |
�� | -15.191 |
arthed | -13.882 |
senal | -13.665 |
�� | -13.655 |
��極 | -13.418 |
Token | [ |
Token ID | 685 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
� | +31.279 |
� | +30.090 |
policies | +27.938 |
policy | +25.635 |
climate | +25.250 |
Neg logit contributions | |
�� | -23.066 |
senal | -19.650 |
��極 | -18.923 |
arthed | -18.753 |
�� | -18.039 |
Token | them |
Token ID | 18855 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
� | +25.437 |
� | +23.387 |
policies | +21.586 |
| +19.744 |
policy | +19.709 |
Neg logit contributions | |
�� | -16.859 |
�� | -13.276 |
�� | -13.016 |
senal | -13.003 |
��極 | -12.892 |
Token | ]. |
Token ID | 4083 |
Feature activation | +4.53e+01 |
Pos logit contributions | |
� | +16.272 |
� | +15.157 |
policies | +13.408 |
institutions | +12.312 |
climate | +12.193 |
Neg logit contributions | |
�� | -11.310 |
�� | -10.124 |
arthed | -10.123 |
senal | -9.738 |
��極 | -9.658 |
Token | That |
Token ID | 1320 |
Feature activation | +6.02e+01 |
Pos logit contributions | |
� | +44.514 |
� | +41.068 |
policies | +32.089 |
| +32.060 |
¨ | +30.085 |
Neg logit contributions | |
�� | -22.410 |
senal | -20.544 |
arthed | -19.542 |
avorite | -18.578 |
�� | -18.241 |
Token | is |
Token ID | 318 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
� | +48.092 |
� | +44.512 |
policies | +39.334 |
policy | +37.879 |
ideology | +37.228 |
Neg logit contributions | |
�� | -26.175 |
arthed | -20.597 |
��極 | -20.417 |
senal | -19.873 |
�� | -18.707 |
Token | a |
Token ID | 257 |
Feature activation | +3.99e+01 |
Pos logit contributions | |
� | +30.734 |
� | +29.601 |
policies | +25.818 |
policy | +24.406 |
ideology | +24.067 |
Neg logit contributions | |
�� | -21.878 |
arthed | -17.975 |
��極 | -17.460 |
�� | -17.180 |
yne | -17.109 |
Token | very |
Token ID | 845 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
� | +36.897 |
� | +35.851 |
policy | +32.148 |
policies | +31.487 |
political | +30.869 |
Neg logit contributions | |
�� | -25.259 |
��極 | -20.648 |
arthed | -20.302 |
�� | -19.728 |
senal | -19.505 |
Token | dangerous |
Token ID | 4923 |
Feature activation | +4.38e+01 |
Pos logit contributions | |
� | +23.800 |
� | +23.135 |
policies | +20.350 |
policy | +19.465 |
political | +19.099 |
Neg logit contributions | |
�� | -21.846 |
arthed | -18.584 |
senal | -18.061 |
��極 | -17.959 |
�� | -17.527 |
Token | precedent |
Token ID | 19719 |
Feature activation | +2.73e+01 |
Pos logit contributions | |
� | +38.437 |
� | +37.654 |
policy | +34.466 |
policies | +34.134 |
ideology | +33.668 |
Neg logit contributions | |
�� | -27.793 |
arthed | -22.541 |
��極 | -22.423 |
senal | -21.706 |
�� | -20.726 |
Token | meters |
Token ID | 10700 |
Feature activation | -2.38e+01 |
Pos logit contributions | |
�� | +13.229 |
arthed | +12.775 |
Miles | +12.754 |
Reeves | +12.650 |
yne | +12.636 |
Neg logit contributions | |
� | -14.600 |
� | -13.641 |
policies | -12.201 |
ideology | -11.379 |
behavi | -11.287 |
Token | per |
Token ID | 583 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
arthed | +20.467 |
�� | +20.331 |
flown | +20.292 |
Reeves | +19.852 |
Miles | +19.843 |
Neg logit contributions | |
� | -16.261 |
� | -15.042 |
policies | -13.326 |
behavi | -12.627 |
institutions | -12.348 |
Token | second |
Token ID | 1218 |
Feature activation | -2.62e+01 |
Pos logit contributions | |
�� | +6.834 |
arthed | +6.262 |
�� | +5.966 |
Reeves | +5.933 |
yne | +5.870 |
Neg logit contributions | |
� | -15.425 |
� | -14.563 |
policies | -13.542 |
institutions | -12.833 |
ideology | -12.580 |
Token | ( |
Token ID | 357 |
Feature activation | -5.53e+01 |
Pos logit contributions | |
�� | +27.458 |
flown | +26.930 |
Reeves | +26.927 |
Remy | +26.589 |
yne | +26.432 |
Neg logit contributions | |
� | -10.525 |
� | -9.779 |
policies | -9.025 |
institutions | -7.851 |
behavi | -7.810 |
Token | 5 |
Token ID | 20 |
Feature activation | -4.41e+01 |
Pos logit contributions | |
666 | +39.423 |
6 | +38.787 |
135 | +38.465 |
302 | +37.821 |
8 | +37.415 |
Neg logit contributions | |
behavi | -14.737 |
� | -13.205 |
policies | -13.085 |
� | -13.022 |
governance | -11.662 |
Token | , |
Token ID | 11 |
Feature activation | -1.38e+02 |
Pos logit contributions | |
666 | +32.557 |
135 | +32.000 |
Miles | +31.982 |
�� | +31.616 |
JJ | +31.320 |
Neg logit contributions | |
� | -17.482 |
� | -16.178 |
policies | -14.194 |
behavi | -13.932 |
institutions | -12.549 |
Token | 9 |
Token ID | 24 |
Feature activation | -5.26e+01 |
Pos logit contributions | |
666 | +46.428 |
135 | +45.249 |
302 | +44.517 |
06 | +44.057 |
333 | +43.872 |
Neg logit contributions | |
behavi | -17.517 |
� | -17.257 |
� | -15.971 |
policies | -14.350 |
institutions | -14.347 |
Token | 46 |
Token ID | 3510 |
Feature activation | -2.51e+01 |
Pos logit contributions | |
06 | +38.033 |
26 | +36.515 |
22 | +36.457 |
08 | +35.881 |
666 | +35.851 |
Neg logit contributions | |
behavi | -24.045 |
policies | -16.333 |
conflic | -15.974 |
institutions | -14.809 |
� | -14.806 |
Token | miles |
Token ID | 4608 |
Feature activation | -2.97e+01 |
Pos logit contributions | |
Miles | +21.668 |
�� | +20.739 |
�� | +20.573 |
Reeves | +20.526 |
Remy | +20.406 |
Neg logit contributions | |
� | -18.348 |
� | -17.085 |
policies | -14.508 |
behavi | -13.951 |
ideology | -13.529 |
Token | per |
Token ID | 583 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
�� | +25.946 |
arthed | +25.862 |
flown | +25.532 |
Reeves | +25.463 |
yne | +25.405 |
Neg logit contributions | |
� | -14.956 |
� | -13.958 |
policies | -12.543 |
institutions | -11.443 |
behavi | -10.935 |
Token | hour |
Token ID | 1711 |
Feature activation | -2.85e+01 |
Pos logit contributions | |
�� | +11.105 |
arthed | +9.986 |
Reeves | +9.555 |
�� | +9.507 |
Remy | +9.235 |
Neg logit contributions | |
� | -18.912 |
� | -17.517 |
policies | -16.574 |
institutions | -15.498 |
governance | -14.913 |
Token | Fort |
Token ID | 21926 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
yne | +27.113 |
666 | +27.014 |
135 | +26.831 |
nox | +26.756 |
arthed | +26.724 |
Neg logit contributions | |
� | -9.008 |
� | -8.737 |
policies | -8.145 |
behavi | -7.655 |
ideology | -6.844 |
Token | e |
Token ID | 68 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
�� | +0.875 |
�� | +0.792 |
arthed | +0.784 |
yne | +0.754 |
Remy | +0.734 |
Neg logit contributions | |
� | -1.807 |
� | -1.719 |
policies | -1.587 |
institutions | -1.496 |
climate | -1.470 |
Token | finished |
Token ID | 5201 |
Feature activation | -4.09e+01 |
Pos logit contributions | |
�� | +1.970 |
�� | +1.874 |
arthed | +1.859 |
yne | +1.808 |
Remy | +1.795 |
Neg logit contributions | |
� | -1.647 |
� | -1.524 |
policies | -1.351 |
institutions | -1.228 |
climate | -1.195 |
Token | with |
Token ID | 351 |
Feature activation | -4.52e+01 |
Pos logit contributions | |
JJ | +33.454 |
Blossom | +33.164 |
yne | +32.691 |
Dee | +32.633 |
Remy | +32.601 |
Neg logit contributions | |
� | -14.334 |
behavi | -12.102 |
� | -11.903 |
policies | -11.452 |
institutions | -9.661 |
Token | 1 |
Token ID | 352 |
Feature activation | -2.83e+01 |
Pos logit contributions | |
Blossom | +33.345 |
JJ | +33.225 |
Reeves | +33.177 |
666 | +33.175 |
Remy | +33.157 |
Neg logit contributions | |
� | -15.921 |
behavi | -13.646 |
� | -12.450 |
policies | -11.295 |
governance | -10.400 |
Token | , |
Token ID | 11 |
Feature activation | -1.33e+02 |
Pos logit contributions | |
yne | +21.513 |
�� | +21.316 |
Blossom | +20.613 |
135 | +20.555 |
JJ | +20.463 |
Neg logit contributions | |
� | -19.975 |
behavi | -18.479 |
� | -18.229 |
policies | -17.355 |
governance | -15.789 |
Token | 07 |
Token ID | 2998 |
Feature activation | -2.91e+01 |
Pos logit contributions | |
135 | +45.947 |
666 | +45.870 |
302 | +44.700 |
06 | +44.472 |
336 | +43.986 |
Neg logit contributions | |
behavi | -22.394 |
� | -16.434 |
institutions | -16.102 |
governance | -15.611 |
policies | -15.588 |
Token | 6 |
Token ID | 21 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
6 | +23.272 |
8 | +22.757 |
JJ | +22.715 |
zzo | +22.471 |
yne | +22.454 |
Neg logit contributions | |
� | -19.033 |
� | -17.476 |
behavi | -16.314 |
policies | -15.539 |
governance | -14.934 |
Token | ); |
Token ID | 1776 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
�� | +14.429 |
�� | +13.891 |
yne | +13.814 |
Remy | +13.794 |
Blossom | +13.688 |
Neg logit contributions | |
� | -11.729 |
� | -10.582 |
policies | -9.770 |
behavi | -8.723 |
governance | -8.701 |
Token | 7 |
Token ID | 767 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
�� | +18.293 |
Blossom | +17.876 |
arthed | +17.683 |
�� | +17.680 |
Remy | +17.661 |
Neg logit contributions | |
� | -11.320 |
� | -10.104 |
policies | -8.985 |
institutions | -8.064 |
behavi | -7.931 |
Token | 22 |
Token ID | 1828 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
�� | +23.601 |
�� | +23.504 |
ometown | +23.390 |
Blossom | +23.362 |
yne | +23.342 |
Neg logit contributions | |
� | -12.025 |
� | -10.723 |
policies | -9.329 |
behavi | -9.213 |
ideology | -8.516 |
Token | pic |
Token ID | 8301 |
Feature activation | -3.08e+01 |
Pos logit contributions | |
�� | +6.887 |
Remy | +6.576 |
arthed | +6.562 |
�� | +6.556 |
Blossom | +6.550 |
Neg logit contributions | |
� | -4.837 |
� | -4.381 |
policies | -3.937 |
institutions | -3.560 |
governance | -3.416 |
Token | . |
Token ID | 13 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
Blossom | +23.515 |
JJ | +23.062 |
Gomez | +22.847 |
Remy | +22.574 |
Reeves | +22.517 |
Neg logit contributions | |
behavi | -23.249 |
conflic | -18.450 |
policies | -18.179 |
� | -17.992 |
institutions | -16.871 |
Token | twitter |
Token ID | 6956 |
Feature activation | -4.97e+01 |
Pos logit contributions | |
agle | +11.173 |
fg | +10.939 |
yne | +10.882 |
Blossom | +10.837 |
nox | +10.825 |
Neg logit contributions | |
behavi | -20.183 |
� | -18.934 |
policies | -18.829 |
� | -18.049 |
institutions | -17.658 |
Token | . |
Token ID | 13 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
666 | +29.104 |
Blossom | +28.326 |
135 | +28.090 |
fg | +27.917 |
JJ | +27.864 |
Neg logit contributions | |
behavi | -33.283 |
conflic | -28.135 |
practition | -27.120 |
� | -25.481 |
cumbers | -22.456 |
Token | com |
Token ID | 785 |
Feature activation | -3.08e+01 |
Pos logit contributions | |
zzo | +18.442 |
fg | +18.417 |
666 | +18.250 |
agle | +18.237 |
nova | +18.093 |
Neg logit contributions | |
behavi | -24.968 |
policies | -20.518 |
� | -19.930 |
ideology | -19.178 |
� | -19.077 |
Token | / |
Token ID | 14 |
Feature activation | -1.27e+02 |
Pos logit contributions | |
666 | +22.605 |
Blossom | +22.438 |
JJ | +22.009 |
fg | +21.734 |
135 | +21.707 |
Neg logit contributions | |
behavi | -24.773 |
conflic | -19.237 |
policies | -18.524 |
� | -18.305 |
ideology | -17.668 |
Token | CS |
Token ID | 7902 |
Feature activation | -9.97e+01 |
Pos logit contributions | |
fg | +46.317 |
yx | +44.951 |
yne | +44.754 |
6 | +43.706 |
uo | +43.616 |
Neg logit contributions | |
behavi | -15.241 |
� | -14.550 |
� | -14.429 |
policies | -14.072 |
climate | -12.823 |
Token | 3 |
Token ID | 18 |
Feature activation | -1.04e+02 |
Pos logit contributions | |
fg | +45.409 |
yx | +43.910 |
yne | +43.822 |
zzy | +43.111 |
6 | +42.775 |
Neg logit contributions | |
behavi | -14.649 |
� | -14.326 |
� | -14.283 |
policies | -13.387 |
climate | -11.841 |
Token | IV |
Token ID | 3824 |
Feature activation | -1.16e+02 |
Pos logit contributions | |
fg | +45.392 |
yne | +44.348 |
yx | +44.170 |
zzy | +43.187 |
uo | +42.909 |
Neg logit contributions | |
� | -14.442 |
behavi | -14.439 |
� | -14.269 |
policies | -13.560 |
climate | -12.211 |
Token | IP |
Token ID | 4061 |
Feature activation | -1.11e+02 |
Pos logit contributions | |
fg | +46.327 |
yne | +44.652 |
yx | +44.425 |
uo | +43.750 |
6 | +43.303 |
Neg logit contributions | |
behavi | -15.612 |
� | -14.508 |
� | -14.366 |
policies | -13.696 |
climate | -12.496 |
Token | 9 |
Token ID | 24 |
Feature activation | -1.05e+02 |
Pos logit contributions | |
fg | +45.972 |
yx | +44.395 |
yne | +44.158 |
6 | +43.456 |
zzy | +43.373 |
Neg logit contributions | |
behavi | -15.540 |
� | -13.979 |
� | -13.909 |
policies | -13.738 |
climate | -12.197 |
Token | for |
Token ID | 329 |
Feature activation | -3.10e+01 |
Pos logit contributions | |
coached | +32.321 |
Gomez | +32.002 |
Blossom | +31.756 |
Remy | +31.734 |
Reeves | +31.640 |
Neg logit contributions | |
� | -17.687 |
behavi | -16.233 |
� | -14.463 |
policies | -13.615 |
institutions | -12.266 |
Token | Portland |
Token ID | 10727 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
Remy | +26.241 |
Blossom | +25.906 |
JJ | +25.561 |
Reeves | +25.423 |
Gomez | +25.417 |
Neg logit contributions | |
� | -20.027 |
� | -17.376 |
behavi | -15.305 |
policies | -14.972 |
ideology | -13.179 |
Token | and |
Token ID | 290 |
Feature activation | -3.45e+01 |
Pos logit contributions | |
Blossom | +21.557 |
zzo | +21.104 |
JJ | +20.992 |
�� | +20.925 |
Gomez | +20.855 |
Neg logit contributions | |
� | -17.227 |
� | -15.773 |
policies | -13.915 |
behavi | -13.333 |
ideology | -12.435 |
Token | averaged |
Token ID | 16449 |
Feature activation | -5.17e+01 |
Pos logit contributions | |
Remy | +28.481 |
Reeves | +28.331 |
coached | +28.306 |
Blossom | +28.143 |
Gomez | +28.129 |
Neg logit contributions | |
� | -18.398 |
behavi | -15.820 |
� | -15.691 |
policies | -13.542 |
governance | -12.246 |
Token | 3 |
Token ID | 513 |
Feature activation | -3.26e+01 |
Pos logit contributions | |
6 | +33.422 |
26 | +33.041 |
JJ | +32.629 |
Reeves | +32.548 |
Blossom | +32.389 |
Neg logit contributions | |
� | -21.108 |
behavi | -19.909 |
� | -17.571 |
policies | -15.773 |
¨ | -14.084 |
Token | . |
Token ID | 13 |
Feature activation | -1.26e+02 |
Pos logit contributions | |
�� | +25.340 |
fg | +24.868 |
JJ | +24.640 |
Remy | +24.572 |
�� | +24.274 |
Neg logit contributions | |
� | -19.546 |
� | -18.239 |
policies | -15.613 |
ideology | -15.066 |
modernization | -14.952 |
Token | 0 |
Token ID | 15 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
6 | +44.977 |
8 | +44.234 |
7 | +43.142 |
06 | +42.307 |
0 | +42.270 |
Neg logit contributions | |
behavi | -27.720 |
governance | -19.643 |
policies | -19.459 |
institutions | -18.962 |
conflic | -18.781 |
Token | points |
Token ID | 2173 |
Feature activation | -3.67e+01 |
Pos logit contributions | |
Remy | +16.887 |
Blossom | +16.810 |
�� | +16.252 |
JJ | +16.251 |
Reeves | +15.627 |
Neg logit contributions | |
� | -18.399 |
� | -16.885 |
policies | -15.175 |
behavi | -14.720 |
ideology | -14.022 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+01 |
Pos logit contributions | |
Blossom | +28.706 |
Remy | +28.686 |
JJ | +27.702 |
Reeves | +27.410 |
Miles | +27.222 |
Neg logit contributions | |
� | -17.996 |
� | -15.751 |
behavi | -15.233 |
policies | -14.146 |
institutions | -12.848 |
Token | 3 |
Token ID | 513 |
Feature activation | -3.66e+01 |
Pos logit contributions | |
JJ | +31.415 |
Remy | +30.885 |
coached | +30.791 |
Reeves | +30.712 |
6 | +30.512 |
Neg logit contributions | |
� | -18.828 |
behavi | -15.214 |
� | -15.032 |
policies | -13.926 |
institutions | -12.096 |
Token | . |
Token ID | 13 |
Feature activation | -9.02e+01 |
Pos logit contributions | |
Blossom | +23.760 |
JJ | +23.342 |
Remy | +22.637 |
Miles | +22.442 |
zzo | +22.434 |
Neg logit contributions | |
behavi | -26.874 |
conflic | -22.185 |
� | -22.165 |
� | -19.975 |
policies | -19.827 |
Token | pic |
Token ID | 8301 |
Feature activation | -3.00e+01 |
Pos logit contributions | |
�� | +17.785 |
Remy | +17.552 |
JJ | +17.490 |
arthed | +17.366 |
yne | +17.275 |
Neg logit contributions | |
� | -10.557 |
� | -9.366 |
policies | -8.278 |
institutions | -7.296 |
ideology | -7.146 |
Token | . |
Token ID | 13 |
Feature activation | -1.56e+01 |
Pos logit contributions | |
Blossom | +22.692 |
Gomez | +22.071 |
JJ | +22.064 |
Reeves | +21.700 |
Remy | +21.674 |
Neg logit contributions | |
behavi | -23.263 |
policies | -18.778 |
conflic | -18.653 |
� | -18.008 |
institutions | -17.370 |
Token | twitter |
Token ID | 6956 |
Feature activation | -4.99e+01 |
Pos logit contributions | |
agle | +7.386 |
Blossom | +7.308 |
yne | +7.284 |
fg | +7.274 |
arthed | +7.187 |
Neg logit contributions | |
behavi | -19.741 |
� | -19.411 |
policies | -19.173 |
� | -18.573 |
institutions | -18.079 |
Token | . |
Token ID | 13 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
666 | +28.898 |
135 | +28.054 |
Blossom | +27.865 |
fg | +27.662 |
JJ | +27.544 |
Neg logit contributions | |
behavi | -34.156 |
conflic | -29.328 |
practition | -28.124 |
� | -26.534 |
cumbers | -23.547 |
Token | com |
Token ID | 785 |
Feature activation | -2.92e+01 |
Pos logit contributions | |
fg | +18.889 |
zzo | +18.641 |
agle | +18.543 |
666 | +18.509 |
yne | +18.413 |
Neg logit contributions | |
behavi | -23.827 |
policies | -19.698 |
� | -18.840 |
ideology | -18.329 |
ideologies | -18.194 |
Token | / |
Token ID | 14 |
Feature activation | -1.26e+02 |
Pos logit contributions | |
666 | +21.947 |
Blossom | +21.819 |
JJ | +21.403 |
yne | +21.172 |
135 | +21.153 |
Neg logit contributions | |
behavi | -23.666 |
conflic | -18.298 |
policies | -18.197 |
� | -17.933 |
ideology | -17.231 |
Token | z |
Token ID | 89 |
Feature activation | -1.23e+02 |
Pos logit contributions | |
fg | +46.213 |
yx | +44.904 |
yne | +44.775 |
uo | +43.607 |
6 | +43.607 |
Neg logit contributions | |
behavi | -15.228 |
� | -14.413 |
� | -14.391 |
policies | -14.085 |
climate | -12.736 |
Token | J |
Token ID | 41 |
Feature activation | -1.03e+02 |
Pos logit contributions | |
fg | +46.165 |
yx | +44.333 |
yne | +43.731 |
6 | +43.572 |
zzy | +43.467 |
Neg logit contributions | |
behavi | -15.938 |
� | -14.832 |
� | -14.738 |
policies | -13.996 |
climate | -13.022 |
Token | X |
Token ID | 55 |
Feature activation | -1.08e+02 |
Pos logit contributions | |
fg | +45.892 |
yx | +44.108 |
yne | +43.816 |
6 | +42.919 |
zzy | +42.779 |
Neg logit contributions | |
behavi | -14.844 |
� | -14.742 |
� | -14.451 |
policies | -13.479 |
climate | -12.311 |
Token | w |
Token ID | 86 |
Feature activation | -1.09e+02 |
Pos logit contributions | |
fg | +45.740 |
yx | +44.183 |
yne | +44.074 |
zzy | +43.102 |
6 | +43.038 |
Neg logit contributions | |
behavi | -15.169 |
� | -14.336 |
� | -14.169 |
policies | -13.649 |
climate | -12.378 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.03e+02 |
Pos logit contributions | |
fg | +45.618 |
yne | +43.434 |
zzy | +43.284 |
yx | +43.231 |
6 | +43.207 |
Neg logit contributions | |
behavi | -15.258 |
� | -14.289 |
� | -14.164 |
policies | -13.836 |
climate | -12.378 |
Token | pic |
Token ID | 8301 |
Feature activation | -3.18e+01 |
Pos logit contributions | |
Remy | +22.004 |
�� | +21.941 |
arthed | +21.538 |
Blossom | +21.309 |
JJ | +21.289 |
Neg logit contributions | |
� | -9.127 |
� | -8.106 |
policies | -7.317 |
institutions | -5.906 |
ideology | -5.784 |
Token | . |
Token ID | 13 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
Blossom | +26.148 |
JJ | +25.769 |
Remy | +25.601 |
Gomez | +25.485 |
Rowe | +25.108 |
Neg logit contributions | |
behavi | -19.586 |
� | -16.339 |
policies | -16.084 |
� | -14.771 |
ideology | -14.428 |
Token | twitter |
Token ID | 6956 |
Feature activation | -5.36e+01 |
Pos logit contributions | |
yne | +11.943 |
agle | +11.915 |
fg | +11.895 |
arthed | +11.760 |
zzo | +11.757 |
Neg logit contributions | |
behavi | -18.054 |
� | -17.269 |
policies | -17.017 |
� | -16.408 |
institutions | -15.681 |
Token | . |
Token ID | 13 |
Feature activation | -2.73e+01 |
Pos logit contributions | |
666 | +30.027 |
JJ | +29.041 |
135 | +29.013 |
Blossom | +28.592 |
. | +28.511 |
Neg logit contributions | |
behavi | -34.241 |
conflic | -29.208 |
practition | -28.251 |
� | -26.587 |
cumbers | -23.753 |
Token | com |
Token ID | 785 |
Feature activation | -3.13e+01 |
Pos logit contributions | |
zzo | +19.890 |
fg | +19.774 |
agle | +19.352 |
666 | +19.309 |
yne | +19.255 |
Neg logit contributions | |
behavi | -24.717 |
policies | -20.546 |
� | -19.696 |
� | -18.900 |
ideology | -18.870 |
Token | / |
Token ID | 14 |
Feature activation | -1.24e+02 |
Pos logit contributions | |
666 | +23.274 |
Blossom | +22.938 |
JJ | +22.637 |
yne | +22.426 |
135 | +22.383 |
Neg logit contributions | |
behavi | -24.420 |
conflic | -18.871 |
policies | -18.525 |
� | -18.055 |
ideology | -17.579 |
Token | u |
Token ID | 84 |
Feature activation | -1.00e+02 |
Pos logit contributions | |
fg | +46.235 |
yne | +44.847 |
yx | +44.800 |
uo | +43.696 |
6 | +43.640 |
Neg logit contributions | |
behavi | -14.662 |
� | -14.183 |
� | -14.149 |
policies | -13.925 |
climate | -12.565 |
Token | I |
Token ID | 40 |
Feature activation | -7.59e+01 |
Pos logit contributions | |
fg | +43.970 |
yx | +43.073 |
6 | +43.015 |
yne | +43.008 |
zzy | +42.710 |
Neg logit contributions | |
behavi | -15.295 |
� | -14.643 |
� | -14.316 |
policies | -14.049 |
climate | -12.977 |
Token | ba |
Token ID | 7012 |
Feature activation | -8.75e+01 |
Pos logit contributions | |
fg | +43.437 |
zzy | +42.665 |
yne | +42.343 |
zzo | +42.011 |
yx | +41.942 |
Neg logit contributions | |
� | -14.732 |
� | -14.374 |
behavi | -14.358 |
policies | -13.284 |
climate | -12.154 |
Token | H |
Token ID | 39 |
Feature activation | -8.65e+01 |
Pos logit contributions | |
fg | +42.401 |
6 | +42.401 |
666 | +41.768 |
yne | +41.755 |
yx | +41.647 |
Neg logit contributions | |
behavi | -15.442 |
policies | -13.792 |
� | -13.622 |
� | -13.487 |
climate | -12.822 |
Token | Ex |
Token ID | 3109 |
Feature activation | -1.04e+02 |
Pos logit contributions | |
fg | +45.243 |
yx | +42.910 |
yne | +42.731 |
zzy | +42.137 |
uo | +42.104 |
Neg logit contributions | |
� | -14.364 |
behavi | -14.086 |
� | -13.507 |
policies | -12.929 |
climate | -11.488 |
Token | pic |
Token ID | 8301 |
Feature activation | -2.96e+01 |
Pos logit contributions | |
� | +16.138 |
� | +15.149 |
policies | +12.957 |
climate | +12.093 |
institutions | +12.037 |
Neg logit contributions | |
�� | -11.239 |
�� | -10.135 |
arthed | -9.941 |
��極 | -9.636 |
Canaver | -9.441 |
Token | . |
Token ID | 13 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
Blossom | +25.815 |
Gomez | +25.520 |
JJ | +25.463 |
Remy | +25.122 |
666 | +24.914 |
Neg logit contributions | |
behavi | -18.630 |
policies | -14.478 |
conflic | -13.912 |
institutions | -13.310 |
� | -13.180 |
Token | twitter |
Token ID | 6956 |
Feature activation | -4.38e+01 |
Pos logit contributions | |
Blossom | +12.938 |
agle | +12.913 |
arthed | +12.798 |
yne | +12.780 |
nox | +12.749 |
Neg logit contributions | |
behavi | -13.326 |
� | -13.010 |
policies | -12.967 |
� | -12.114 |
institutions | -11.854 |
Token | . |
Token ID | 13 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
666 | +30.715 |
Blossom | +30.014 |
135 | +29.921 |
fg | +29.852 |
JJ | +29.814 |
Neg logit contributions | |
behavi | -26.638 |
conflic | -21.336 |
practition | -19.544 |
policies | -17.785 |
� | -17.466 |
Token | com |
Token ID | 785 |
Feature activation | -2.15e+01 |
Pos logit contributions | |
zzo | +18.027 |
agle | +17.974 |
fg | +17.906 |
Blossom | +17.899 |
yne | +17.745 |
Neg logit contributions | |
behavi | -13.659 |
policies | -12.119 |
� | -11.600 |
ideology | -10.846 |
� | -10.835 |
Token | / |
Token ID | 14 |
Feature activation | -1.24e+02 |
Pos logit contributions | |
666 | +20.588 |
Blossom | +20.373 |
yne | +20.169 |
JJ | +20.139 |
agle | +20.043 |
Neg logit contributions | |
behavi | -15.102 |
policies | -12.610 |
� | -12.037 |
ideology | -11.670 |
institutions | -11.524 |
Token | xx |
Token ID | 5324 |
Feature activation | -1.14e+02 |
Pos logit contributions | |
fg | +46.221 |
yx | +44.972 |
yne | +44.790 |
6 | +43.770 |
uo | +43.716 |
Neg logit contributions | |
behavi | -14.654 |
policies | -13.755 |
� | -13.700 |
� | -13.608 |
climate | -12.423 |
Token | A |
Token ID | 32 |
Feature activation | -6.64e+01 |
Pos logit contributions | |
fg | +45.528 |
yx | +44.536 |
yne | +44.402 |
zzy | +43.765 |
uo | +43.438 |
Neg logit contributions | |
behavi | -14.767 |
� | -13.782 |
� | -13.681 |
policies | -13.357 |
climate | -12.261 |
Token | II |
Token ID | 3978 |
Feature activation | -9.05e+01 |
Pos logit contributions | |
fg | +42.005 |
zzy | +41.963 |
yx | +41.507 |
agle | +41.467 |
zzo | +41.344 |
Neg logit contributions | |
� | -12.376 |
� | -12.266 |
policies | -12.024 |
behavi | -11.838 |
institutions | -10.429 |
Token | 1 |
Token ID | 16 |
Feature activation | -1.01e+02 |
Pos logit contributions | |
fg | +45.355 |
yne | +44.210 |
yx | +43.581 |
zzy | +43.223 |
zzo | +43.124 |
Neg logit contributions | |
behavi | -14.021 |
� | -13.095 |
� | -12.890 |
policies | -12.457 |
climate | -11.592 |
Token | k |
Token ID | 74 |
Feature activation | -1.01e+02 |
Pos logit contributions | |
fg | +45.210 |
yne | +44.548 |
yx | +44.180 |
zzy | +43.226 |
uo | +43.168 |
Neg logit contributions | |
behavi | -13.422 |
� | -13.337 |
� | -13.122 |
policies | -12.924 |
institutions | -11.529 |
Token | pic |
Token ID | 8301 |
Feature activation | -2.53e+01 |
Pos logit contributions | |
� | +14.440 |
� | +13.706 |
policies | +11.976 |
institutions | +11.181 |
climate | +11.076 |
Neg logit contributions | |
�� | -8.947 |
arthed | -8.063 |
�� | -7.979 |
��極 | -7.585 |
yne | -7.545 |
Token | . |
Token ID | 13 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
Blossom | +22.422 |
Gomez | +22.346 |
JJ | +22.157 |
Remy | +22.151 |
Reeves | +21.713 |
Neg logit contributions | |
behavi | -17.122 |
policies | -14.528 |
� | -14.455 |
institutions | -13.339 |
� | -13.009 |
Token | twitter |
Token ID | 6956 |
Feature activation | -4.43e+01 |
Pos logit contributions | |
arthed | +8.421 |
agle | +8.351 |
�� | +8.285 |
Blossom | +8.280 |
Remy | +8.205 |
Neg logit contributions | |
� | -12.378 |
policies | -11.653 |
� | -11.579 |
behavi | -11.362 |
institutions | -10.815 |
Token | . |
Token ID | 13 |
Feature activation | -1.97e+01 |
Pos logit contributions | |
666 | +29.760 |
Blossom | +29.382 |
JJ | +28.991 |
fg | +28.719 |
135 | +28.619 |
Neg logit contributions | |
behavi | -28.157 |
conflic | -22.618 |
practition | -20.821 |
policies | -18.957 |
� | -18.898 |
Token | com |
Token ID | 785 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
zzo | +16.745 |
agle | +16.650 |
fg | +16.598 |
Blossom | +16.499 |
yne | +16.343 |
Neg logit contributions | |
behavi | -16.816 |
policies | -15.048 |
� | -14.752 |
� | -13.892 |
ideology | -13.655 |
Token | / |
Token ID | 14 |
Feature activation | -1.24e+02 |
Pos logit contributions | |
Blossom | +18.555 |
666 | +18.284 |
JJ | +18.247 |
Remy | +18.142 |
agle | +18.051 |
Neg logit contributions | |
behavi | -16.034 |
� | -13.874 |
policies | -13.755 |
� | -12.838 |
ideology | -12.708 |
Token | 74 |
Token ID | 4524 |
Feature activation | -1.07e+02 |
Pos logit contributions | |
fg | +46.231 |
yx | +44.971 |
yne | +44.850 |
uo | +43.642 |
6 | +43.629 |
Neg logit contributions | |
behavi | -14.375 |
� | -13.870 |
� | -13.839 |
policies | -13.661 |
climate | -12.288 |
Token | E |
Token ID | 36 |
Feature activation | -8.25e+01 |
Pos logit contributions | |
fg | +45.544 |
yne | +44.653 |
yx | +44.428 |
zzy | +43.778 |
uo | +43.462 |
Neg logit contributions | |
behavi | -13.923 |
� | -13.821 |
� | -13.774 |
policies | -13.379 |
climate | -11.835 |
Token | g |
Token ID | 70 |
Feature activation | -1.00e+02 |
Pos logit contributions | |
fg | +44.936 |
agle | +43.284 |
zzy | +43.142 |
yx | +43.087 |
yne | +42.864 |
Neg logit contributions | |
� | -13.472 |
behavi | -13.415 |
� | -13.364 |
policies | -12.778 |
institutions | -11.168 |
Token | V |
Token ID | 53 |
Feature activation | -9.21e+01 |
Pos logit contributions | |
fg | +45.198 |
6 | +43.152 |
zzy | +43.063 |
yne | +43.033 |
yx | +42.796 |
Neg logit contributions | |
behavi | -14.418 |
� | -13.367 |
policies | -13.101 |
� | -13.003 |
climate | -11.944 |
Token | V |
Token ID | 53 |
Feature activation | -8.99e+01 |
Pos logit contributions | |
fg | +45.820 |
yne | +44.472 |
yx | +43.866 |
uo | +43.256 |
zzy | +43.025 |
Neg logit contributions | |
behavi | -13.915 |
� | -13.700 |
� | -13.220 |
policies | -12.757 |
institutions | -11.468 |
Token | pic |
Token ID | 8301 |
Feature activation | -2.58e+01 |
Pos logit contributions | |
� | +5.374 |
� | +5.017 |
policies | +4.351 |
institutions | +3.995 |
climate | +3.946 |
Neg logit contributions | |
�� | -4.752 |
�� | -4.420 |
arthed | -4.383 |
yne | -4.208 |
�� | -4.160 |
Token | . |
Token ID | 13 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
Gomez | +23.358 |
Blossom | +23.287 |
JJ | +22.998 |
Remy | +22.978 |
666 | +22.786 |
Neg logit contributions | |
behavi | -17.002 |
policies | -14.196 |
� | -13.167 |
institutions | -12.938 |
ideology | -12.579 |
Token | twitter |
Token ID | 6956 |
Feature activation | -4.66e+01 |
Pos logit contributions | |
agle | +12.161 |
yne | +12.141 |
nox | +12.139 |
fg | +12.013 |
Blossom | +11.802 |
Neg logit contributions | |
behavi | -16.501 |
policies | -15.900 |
� | -15.676 |
� | -14.803 |
ideology | -14.670 |
Token | . |
Token ID | 13 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
666 | +30.865 |
fg | +30.108 |
135 | +30.098 |
JJ | +29.988 |
Blossom | +29.923 |
Neg logit contributions | |
behavi | -28.222 |
conflic | -22.898 |
practition | -21.117 |
� | -19.086 |
policies | -18.906 |
Token | com |
Token ID | 785 |
Feature activation | -2.45e+01 |
Pos logit contributions | |
zzo | +20.846 |
fg | +20.808 |
agle | +20.611 |
666 | +20.471 |
nova | +20.282 |
Neg logit contributions | |
behavi | -19.862 |
policies | -16.640 |
� | -15.249 |
ideology | -15.090 |
institutions | -14.918 |
Token | / |
Token ID | 14 |
Feature activation | -1.23e+02 |
Pos logit contributions | |
666 | +22.192 |
Blossom | +21.927 |
fg | +21.735 |
JJ | +21.690 |
agle | +21.656 |
Neg logit contributions | |
behavi | -17.485 |
policies | -13.974 |
� | -13.009 |
ideology | -12.956 |
institutions | -12.778 |
Token | E |
Token ID | 36 |
Feature activation | -8.55e+01 |
Pos logit contributions | |
fg | +46.324 |
yx | +44.954 |
yne | +44.857 |
6 | +43.699 |
uo | +43.674 |
Neg logit contributions | |
behavi | -14.545 |
policies | -13.803 |
� | -13.661 |
� | -13.625 |
climate | -12.457 |
Token | q |
Token ID | 80 |
Feature activation | -1.17e+02 |
Pos logit contributions | |
fg | +45.309 |
yx | +43.496 |
agle | +43.406 |
zzy | +42.994 |
yne | +42.833 |
Neg logit contributions | |
� | -13.351 |
� | -13.279 |
behavi | -13.129 |
policies | -12.707 |
climate | -11.132 |
Token | 4 |
Token ID | 19 |
Feature activation | -1.01e+02 |
Pos logit contributions | |
fg | +45.951 |
yx | +44.734 |
yne | +44.472 |
6 | +43.609 |
zzy | +43.462 |
Neg logit contributions | |
behavi | -14.946 |
� | -14.006 |
� | -13.718 |
policies | -13.697 |
climate | -12.424 |
Token | R |
Token ID | 49 |
Feature activation | -8.39e+01 |
Pos logit contributions | |
fg | +45.212 |
yne | +44.358 |
yx | +44.277 |
zzy | +43.159 |
uo | +43.124 |
Neg logit contributions | |
� | -13.589 |
behavi | -13.532 |
� | -13.322 |
policies | -13.233 |
climate | -11.724 |
Token | IL |
Token ID | 4146 |
Feature activation | -1.10e+02 |
Pos logit contributions | |
fg | +45.158 |
yx | +43.350 |
yne | +43.025 |
zzy | +42.570 |
dd | +42.494 |
Neg logit contributions | |
� | -13.605 |
behavi | -13.386 |
� | -12.959 |
policies | -12.857 |
climate | -11.171 |
Token | . |
Token ID | 13 |
Feature activation | -1.56e+01 |
Pos logit contributions | |
Blossom | +22.692 |
Gomez | +22.071 |
JJ | +22.064 |
Reeves | +21.700 |
Remy | +21.674 |
Neg logit contributions | |
behavi | -23.263 |
policies | -18.778 |
conflic | -18.653 |
� | -18.008 |
institutions | -17.370 |
Token | twitter |
Token ID | 6956 |
Feature activation | -4.99e+01 |
Pos logit contributions | |
agle | +7.386 |
Blossom | +7.308 |
yne | +7.284 |
fg | +7.274 |
arthed | +7.187 |
Neg logit contributions | |
behavi | -19.741 |
� | -19.411 |
policies | -19.173 |
� | -18.573 |
institutions | -18.079 |
Token | . |
Token ID | 13 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
666 | +28.898 |
135 | +28.054 |
Blossom | +27.865 |
fg | +27.662 |
JJ | +27.544 |
Neg logit contributions | |
behavi | -34.156 |
conflic | -29.328 |
practition | -28.124 |
� | -26.534 |
cumbers | -23.547 |
Token | com |
Token ID | 785 |
Feature activation | -2.92e+01 |
Pos logit contributions | |
fg | +18.889 |
zzo | +18.641 |
agle | +18.543 |
666 | +18.509 |
yne | +18.413 |
Neg logit contributions | |
behavi | -23.827 |
policies | -19.698 |
� | -18.840 |
ideology | -18.329 |
ideologies | -18.194 |
Token | / |
Token ID | 14 |
Feature activation | -1.26e+02 |
Pos logit contributions | |
666 | +21.947 |
Blossom | +21.819 |
JJ | +21.403 |
yne | +21.172 |
135 | +21.153 |
Neg logit contributions | |
behavi | -23.666 |
conflic | -18.298 |
policies | -18.197 |
� | -17.933 |
ideology | -17.231 |
Token | z |
Token ID | 89 |
Feature activation | -1.23e+02 |
Pos logit contributions | |
fg | +46.213 |
yx | +44.904 |
yne | +44.775 |
uo | +43.607 |
6 | +43.607 |
Neg logit contributions | |
behavi | -15.228 |
� | -14.413 |
� | -14.391 |
policies | -14.085 |
climate | -12.736 |
Token | J |
Token ID | 41 |
Feature activation | -1.03e+02 |
Pos logit contributions | |
fg | +46.165 |
yx | +44.333 |
yne | +43.731 |
6 | +43.572 |
zzy | +43.467 |
Neg logit contributions | |
behavi | -15.938 |
� | -14.832 |
� | -14.738 |
policies | -13.996 |
climate | -13.022 |
Token | X |
Token ID | 55 |
Feature activation | -1.08e+02 |
Pos logit contributions | |
fg | +45.892 |
yx | +44.108 |
yne | +43.816 |
6 | +42.919 |
zzy | +42.779 |
Neg logit contributions | |
behavi | -14.844 |
� | -14.742 |
� | -14.451 |
policies | -13.479 |
climate | -12.311 |
Token | w |
Token ID | 86 |
Feature activation | -1.09e+02 |
Pos logit contributions | |
fg | +45.740 |
yx | +44.183 |
yne | +44.074 |
zzy | +43.102 |
6 | +43.038 |
Neg logit contributions | |
behavi | -15.169 |
� | -14.336 |
� | -14.169 |
policies | -13.649 |
climate | -12.378 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.03e+02 |
Pos logit contributions | |
fg | +45.618 |
yne | +43.434 |
zzy | +43.284 |
yx | +43.231 |
6 | +43.207 |
Neg logit contributions | |
behavi | -15.258 |
� | -14.289 |
� | -14.164 |
policies | -13.836 |
climate | -12.378 |
Token | cv |
Token ID | 33967 |
Feature activation | -1.09e+02 |
Pos logit contributions | |
fg | +45.428 |
yne | +44.385 |
yx | +44.006 |
zzy | +42.949 |
uo | +42.947 |
Neg logit contributions | |
behavi | -14.598 |
� | -14.267 |
� | -14.058 |
policies | -13.637 |
institutions | -12.146 |
Token | pic |
Token ID | 8301 |
Feature activation | -3.61e+01 |
Pos logit contributions | |
�� | +0.008 |
�� | +0.007 |
arthed | +0.007 |
yne | +0.007 |
Remy | +0.007 |
Neg logit contributions | |
� | -0.008 |
� | -0.007 |
policies | -0.007 |
institutions | -0.006 |
climate | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
Blossom | +27.159 |
Gomez | +26.950 |
JJ | +26.831 |
666 | +26.668 |
Remy | +26.504 |
Neg logit contributions | |
behavi | -23.292 |
conflic | -18.475 |
policies | -16.990 |
practition | -16.005 |
institutions | -15.726 |
Token | twitter |
Token ID | 6956 |
Feature activation | -6.25e+01 |
Pos logit contributions | |
nox | +21.034 |
fg | +21.029 |
zzo | +20.882 |
arthed | +20.620 |
yne | +20.507 |
Neg logit contributions | |
behavi | -16.809 |
policies | -14.717 |
� | -13.932 |
� | -13.545 |
ideology | -13.309 |
Token | . |
Token ID | 13 |
Feature activation | -2.70e+01 |
Pos logit contributions | |
666 | +32.026 |
. | +31.267 |
Blossom | +30.896 |
JJ | +30.859 |
135 | +30.743 |
Neg logit contributions | |
behavi | -34.792 |
conflic | -29.737 |
practition | -29.207 |
� | -27.276 |
cumbers | -24.021 |
Token | com |
Token ID | 785 |
Feature activation | -3.37e+01 |
Pos logit contributions | |
zzo | +21.133 |
fg | +21.038 |
yne | +20.778 |
dd | +20.610 |
agle | +20.413 |
Neg logit contributions | |
behavi | -22.684 |
policies | -18.328 |
� | -17.423 |
ideology | -16.716 |
ideologies | -16.659 |
Token | / |
Token ID | 14 |
Feature activation | -1.23e+02 |
Pos logit contributions | |
666 | +26.759 |
Blossom | +26.405 |
JJ | +25.966 |
135 | +25.782 |
Remy | +25.580 |
Neg logit contributions | |
behavi | -22.840 |
conflic | -17.302 |
policies | -16.385 |
practition | -15.516 |
ideology | -15.376 |
Token | F |
Token ID | 37 |
Feature activation | -8.69e+01 |
Pos logit contributions | |
fg | +46.125 |
yx | +44.901 |
yne | +44.681 |
uo | +43.641 |
6 | +43.592 |
Neg logit contributions | |
behavi | -14.861 |
� | -14.300 |
� | -14.178 |
policies | -13.911 |
climate | -12.509 |
Token | c |
Token ID | 66 |
Feature activation | -1.02e+02 |
Pos logit contributions | |
fg | +44.930 |
yne | +43.627 |
yx | +43.389 |
zzy | +42.917 |
dd | +42.555 |
Neg logit contributions | |
� | -13.748 |
behavi | -13.602 |
� | -13.273 |
policies | -12.704 |
climate | -11.279 |
Token | ce |
Token ID | 344 |
Feature activation | -1.17e+02 |
Pos logit contributions | |
fg | +44.752 |
zzy | +43.159 |
6 | +43.036 |
yx | +43.024 |
yne | +43.003 |
Neg logit contributions | |
behavi | -15.152 |
� | -14.032 |
� | -13.835 |
policies | -13.530 |
climate | -12.483 |
Token | W |
Token ID | 54 |
Feature activation | -9.54e+01 |
Pos logit contributions | |
fg | +45.635 |
yx | +44.485 |
yne | +44.395 |
6 | +43.466 |
zzy | +43.424 |
Neg logit contributions | |
behavi | -14.580 |
� | -14.028 |
� | -13.930 |
policies | -13.312 |
climate | -12.169 |
Token | x |
Token ID | 87 |
Feature activation | -1.15e+02 |
Pos logit contributions | |
fg | +45.776 |
yne | +43.721 |
yx | +43.533 |
zzy | +43.000 |
agle | +42.686 |
Neg logit contributions | |
behavi | -14.250 |
� | -14.228 |
� | -13.971 |
policies | -13.379 |
climate | -11.904 |
Token | x |
Token ID | 87 |
Feature activation | -5.30e+01 |
Pos logit contributions | |
fg | +29.111 |
yx | +28.984 |
fx | +28.487 |
zzo | +28.219 |
yne | +28.201 |
Neg logit contributions | |
behavi | -30.392 |
conflic | -23.928 |
policies | -21.018 |
practition | -20.518 |
� | -20.122 |
Token | . |
Token ID | 13 |
Feature activation | -3.28e+01 |
Pos logit contributions | |
666 | +30.304 |
135 | +30.047 |
yx | +29.816 |
fg | +29.136 |
zzo | +29.135 |
Neg logit contributions | |
behavi | -33.806 |
conflic | -28.983 |
practition | -26.856 |
� | -25.885 |
cumbers | -22.173 |
Token | x |
Token ID | 87 |
Feature activation | -3.42e+01 |
Pos logit contributions | |
nox | +24.257 |
yx | +24.111 |
fg | +23.403 |
zzo | +23.362 |
135 | +23.323 |
Neg logit contributions | |
behavi | -27.050 |
� | -20.649 |
policies | -20.644 |
conflic | -20.450 |
� | -19.993 |
Token | . |
Token ID | 13 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
135 | +26.298 |
amed | +25.249 |
nox | +25.189 |
666 | +25.097 |
agle | +25.044 |
Neg logit contributions | |
behavi | -24.291 |
� | -18.599 |
policies | -18.459 |
conflic | -17.702 |
� | -17.681 |
Token | 144 |
Token ID | 18444 |
Feature activation | -3.00e+01 |
Pos logit contributions | |
arthed | +2.660 |
nox | +2.434 |
agle | +1.973 |
135 | +1.970 |
akov | +1.947 |
Neg logit contributions | |
� | -22.318 |
� | -21.735 |
behavi | -20.555 |
policies | -20.483 |
ideology | -19.660 |
Token | 1024 |
Token ID | 28119 |
Feature activation | -1.22e+02 |
Pos logit contributions | |
Remy | +27.214 |
Blossom | +26.479 |
Reeves | +26.321 |
Winchester | +26.298 |
arthed | +26.183 |
Neg logit contributions | |
� | -15.023 |
behavi | -14.164 |
policies | -13.201 |
� | -12.770 |
institutions | -12.588 |
Token | 556 |
Token ID | 37864 |
Feature activation | -2.73e+01 |
Pos logit contributions | |
666 | +46.394 |
135 | +45.103 |
302 | +44.445 |
336 | +43.699 |
333 | +43.638 |
Neg logit contributions | |
behavi | -20.723 |
� | -16.863 |
institutions | -16.061 |
policies | -15.840 |
governance | -15.222 |
Token | x |
Token ID | 2124 |
Feature activation | -4.62e+01 |
Pos logit contributions | |
Remy | +18.873 |
Xander | +18.506 |
Blossom | +18.027 |
JJ | +17.978 |
Elias | +17.854 |
Neg logit contributions | |
� | -22.408 |
behavi | -22.260 |
� | -19.654 |
policies | -19.326 |
institutions | -19.276 |
Token | . |
Token ID | 13 |
Feature activation | -4.15e+01 |
Pos logit contributions | |
666 | +28.826 |
135 | +28.108 |
6 | +27.716 |
fg | +27.633 |
Blossom | +27.182 |
Neg logit contributions | |
behavi | -30.406 |
conflic | -25.868 |
practition | -23.329 |
� | -22.811 |
policies | -20.051 |
Token | x |
Token ID | 87 |
Feature activation | -5.46e+01 |
Pos logit contributions | |
yx | +28.796 |
fg | +28.760 |
zzo | +28.199 |
fx | +28.051 |
yne | +27.958 |
Neg logit contributions | |
behavi | -30.395 |
conflic | -23.975 |
policies | -20.888 |
practition | -20.723 |
� | -20.188 |
Token | . |
Token ID | 13 |
Feature activation | -3.35e+01 |
Pos logit contributions | |
666 | +30.654 |
135 | +29.991 |
yx | +29.668 |
6 | +29.282 |
Blossom | +29.168 |
Neg logit contributions | |
behavi | -34.102 |
conflic | -29.338 |
practition | -27.540 |
� | -26.490 |
cumbers | -22.613 |
Token | com |
Token ID | 785 |
Feature activation | -1.56e+01 |
Pos logit contributions | |
agle | +16.209 |
fg | +15.920 |
nova | +15.787 |
zzo | +15.723 |
yne | +15.661 |
Neg logit contributions | |
behavi | -19.950 |
� | -17.501 |
policies | -17.398 |
� | -16.714 |
ideology | -15.983 |
Token | / |
Token ID | 14 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
Blossom | +13.664 |
�� | +13.511 |
arthed | +13.510 |
yne | +13.449 |
JJ | +13.415 |
Neg logit contributions | |
� | -13.460 |
� | -12.740 |
behavi | -12.496 |
policies | -12.115 |
institutions | -11.219 |
Token | watch |
Token ID | 8340 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
�� | +2.028 |
arthed | +1.872 |
�� | +1.859 |
yne | +1.792 |
Blossom | +1.744 |
Neg logit contributions | |
� | -3.352 |
� | -3.189 |
policies | -2.924 |
institutions | -2.725 |
climate | -2.692 |
Token | ? |
Token ID | 30 |
Feature activation | -6.63e+00 |
Pos logit contributions | |
Blossom | +7.961 |
arthed | +7.796 |
JJ | +7.779 |
yne | +7.729 |
agle | +7.725 |
Neg logit contributions | |
� | -13.980 |
behavi | -13.715 |
� | -13.427 |
policies | -13.152 |
institutions | -12.300 |
Token | v |
Token ID | 85 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
�� | +3.968 |
arthed | +3.802 |
yne | +3.637 |
�� | +3.581 |
agle | +3.517 |
Neg logit contributions | |
� | -9.498 |
� | -9.122 |
policies | -8.523 |
institutions | -8.082 |
behavi | -7.899 |
Token | = |
Token ID | 28 |
Feature activation | -1.22e+02 |
Pos logit contributions | |
� | +1.699 |
� | +1.599 |
policies | +1.444 |
institutions | +1.342 |
climate | +1.319 |
Neg logit contributions | |
�� | -1.245 |
�� | -1.158 |
arthed | -1.143 |
yne | -1.110 |
Remy | -1.089 |
Token | 2 |
Token ID | 17 |
Feature activation | -9.88e+01 |
Pos logit contributions | |
fg | +45.566 |
yx | +44.616 |
yne | +44.418 |
uo | +43.552 |
6 | +43.527 |
Neg logit contributions | |
behavi | -15.162 |
� | -15.033 |
� | -14.529 |
policies | -13.806 |
climate | -12.734 |
Token | g |
Token ID | 70 |
Feature activation | -9.92e+01 |
Pos logit contributions | |
fg | +44.995 |
yne | +44.222 |
yx | +43.981 |
zzy | +42.972 |
uo | +42.934 |
Neg logit contributions | |
� | -14.289 |
� | -14.032 |
behavi | -13.872 |
policies | -13.354 |
climate | -11.992 |
Token | 7 |
Token ID | 22 |
Feature activation | -9.25e+01 |
Pos logit contributions | |
fg | +44.744 |
6 | +43.102 |
zzy | +42.810 |
yne | +42.766 |
yx | +42.761 |
Neg logit contributions | |
behavi | -14.204 |
� | -13.345 |
� | -13.321 |
policies | -12.929 |
climate | -12.023 |
Token | p |
Token ID | 79 |
Feature activation | -8.62e+01 |
Pos logit contributions | |
fg | +44.774 |
yx | +43.786 |
yne | +43.612 |
zzy | +42.879 |
uo | +42.527 |
Neg logit contributions | |
behavi | -13.504 |
� | -13.423 |
� | -13.260 |
policies | -12.853 |
climate | -11.613 |
Token | k |
Token ID | 74 |
Feature activation | -8.84e+01 |
Pos logit contributions | |
fg | +44.190 |
zzy | +42.486 |
6 | +42.225 |
yne | +42.143 |
yx | +42.068 |
Neg logit contributions | |
behavi | -14.029 |
� | -12.940 |
� | -12.856 |
policies | -12.629 |
climate | -11.579 |
Token | https |
Token ID | 3740 |
Feature activation | -5.80e+00 |
Pos logit contributions | |
� | +5.246 |
� | +4.938 |
policies | +4.413 |
institutions | +4.104 |
climate | +4.046 |
Neg logit contributions | |
�� | -3.620 |
�� | -3.328 |
arthed | -3.284 |
yne | -3.151 |
�� | -3.103 |
Token | :// |
Token ID | 1378 |
Feature activation | -1.52e+01 |
Pos logit contributions | |
�� | +3.893 |
arthed | +3.812 |
yne | +3.682 |
Remy | +3.678 |
Blossom | +3.655 |
Neg logit contributions | |
� | -7.641 |
� | -7.255 |
policies | -6.955 |
behavi | -6.750 |
institutions | -6.542 |
Token | t |
Token ID | 83 |
Feature activation | -3.95e+01 |
Pos logit contributions | |
nox | +10.042 |
yne | +9.977 |
fg | +9.904 |
arthed | +9.677 |
nova | +9.557 |
Neg logit contributions | |
� | -16.573 |
behavi | -16.396 |
policies | -15.780 |
� | -15.674 |
ideology | -14.606 |
Token | . |
Token ID | 13 |
Feature activation | -2.37e+01 |
Pos logit contributions | |
666 | +27.109 |
agle | +26.671 |
fg | +26.471 |
zzo | +26.455 |
135 | +26.084 |
Neg logit contributions | |
behavi | -27.497 |
conflic | -22.538 |
policies | -19.775 |
practition | -19.480 |
institutions | -18.228 |
Token | co |
Token ID | 1073 |
Feature activation | -2.98e+01 |
Pos logit contributions | |
agle | +19.425 |
fg | +19.374 |
zzo | +19.199 |
666 | +18.965 |
zzy | +18.769 |
Neg logit contributions | |
behavi | -20.388 |
policies | -16.916 |
� | -16.393 |
ideology | -15.642 |
� | -15.565 |
Token | / |
Token ID | 14 |
Feature activation | -1.22e+02 |
Pos logit contributions | |
666 | +23.196 |
agle | +23.118 |
zzo | +23.025 |
yne | +22.981 |
fg | +22.906 |
Neg logit contributions | |
behavi | -22.940 |
conflic | -17.564 |
policies | -17.032 |
ideology | -16.207 |
� | -16.079 |
Token | l |
Token ID | 75 |
Feature activation | -1.03e+02 |
Pos logit contributions | |
fg | +46.020 |
yx | +45.014 |
yne | +44.766 |
uo | +43.620 |
6 | +43.607 |
Neg logit contributions | |
behavi | -14.407 |
� | -13.739 |
� | -13.717 |
policies | -13.660 |
climate | -12.220 |
Token | g |
Token ID | 70 |
Feature activation | -9.62e+01 |
Pos logit contributions | |
fg | +45.163 |
zzy | +42.967 |
6 | +42.945 |
yx | +42.685 |
yne | +42.539 |
Neg logit contributions | |
behavi | -14.814 |
� | -14.369 |
� | -13.823 |
policies | -13.551 |
climate | -12.395 |
Token | S |
Token ID | 50 |
Feature activation | -6.84e+01 |
Pos logit contributions | |
fg | +44.884 |
6 | +42.841 |
zzy | +42.740 |
yne | +42.545 |
dd | +42.427 |
Neg logit contributions | |
behavi | -13.973 |
� | -13.667 |
policies | -13.293 |
� | -13.220 |
climate | -12.084 |
Token | wh |
Token ID | 1929 |
Feature activation | -1.12e+02 |
Pos logit contributions | |
fg | +42.807 |
yx | +41.353 |
zzy | +41.215 |
yne | +41.155 |
dd | +41.151 |
Neg logit contributions | |
� | -13.529 |
� | -13.069 |
behavi | -12.712 |
policies | -12.140 |
climate | -10.770 |
Token | X |
Token ID | 55 |
Feature activation | -1.06e+02 |
Pos logit contributions | |
fg | +45.642 |
yne | +44.244 |
yx | +44.089 |
6 | +43.305 |
uo | +43.171 |
Neg logit contributions | |
behavi | -14.141 |
� | -13.737 |
policies | -13.246 |
� | -13.211 |
climate | -12.019 |
Token | pic |
Token ID | 8301 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
�� | +1.154 |
�� | +1.082 |
arthed | +1.081 |
yne | +1.045 |
Remy | +1.038 |
Neg logit contributions | |
� | -1.176 |
� | -1.094 |
policies | -0.975 |
institutions | -0.897 |
climate | -0.872 |
Token | . |
Token ID | 13 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
Blossom | +14.305 |
Gomez | +14.078 |
Remy | +14.037 |
JJ | +13.927 |
Reeves | +13.818 |
Neg logit contributions | |
behavi | -18.603 |
� | -17.272 |
policies | -16.743 |
� | -15.983 |
institutions | -15.736 |
Token | twitter |
Token ID | 6956 |
Feature activation | -3.96e+01 |
Pos logit contributions | |
agle | +5.934 |
Blossom | +5.887 |
arthed | +5.885 |
yne | +5.882 |
nox | +5.648 |
Neg logit contributions | |
� | -17.556 |
behavi | -17.335 |
policies | -17.085 |
� | -16.633 |
institutions | -16.103 |
Token | . |
Token ID | 13 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
666 | +25.672 |
Blossom | +25.588 |
JJ | +25.278 |
fg | +25.195 |
135 | +25.159 |
Neg logit contributions | |
behavi | -29.717 |
conflic | -24.705 |
practition | -22.979 |
� | -21.651 |
policies | -20.924 |
Token | com |
Token ID | 785 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
fg | +12.484 |
zzo | +12.417 |
agle | +12.400 |
yne | +12.338 |
Blossom | +12.146 |
Neg logit contributions | |
behavi | -21.029 |
� | -18.955 |
policies | -18.894 |
� | -18.083 |
ideology | -17.624 |
Token | / |
Token ID | 14 |
Feature activation | -1.22e+02 |
Pos logit contributions | |
Blossom | +16.508 |
666 | +16.286 |
JJ | +16.229 |
yne | +16.089 |
Remy | +16.059 |
Neg logit contributions | |
behavi | -20.429 |
� | -17.738 |
policies | -17.234 |
� | -16.582 |
ideology | -16.296 |
Token | gy |
Token ID | 1360 |
Feature activation | -1.19e+02 |
Pos logit contributions | |
fg | +46.122 |
yx | +44.736 |
yne | +44.531 |
uo | +43.536 |
6 | +43.512 |
Neg logit contributions | |
behavi | -15.144 |
� | -14.226 |
� | -14.209 |
policies | -14.036 |
climate | -12.793 |
Token | d |
Token ID | 67 |
Feature activation | -1.04e+02 |
Pos logit contributions | |
fg | +45.793 |
yx | +44.203 |
yne | +43.772 |
zzy | +43.719 |
6 | +43.512 |
Neg logit contributions | |
behavi | -15.859 |
� | -14.254 |
� | -14.205 |
policies | -13.987 |
climate | -12.640 |
Token | 3 |
Token ID | 18 |
Feature activation | -1.02e+02 |
Pos logit contributions | |
fg | +45.097 |
yx | +43.465 |
yne | +43.441 |
zzy | +43.429 |
6 | +43.169 |
Neg logit contributions | |
behavi | -14.546 |
� | -13.835 |
� | -13.778 |
policies | -13.610 |
climate | -12.619 |
Token | p |
Token ID | 79 |
Feature activation | -9.89e+01 |
Pos logit contributions | |
fg | +45.384 |
yne | +44.420 |
yx | +44.191 |
zzy | +43.235 |
uo | +43.130 |
Neg logit contributions | |
behavi | -14.110 |
� | -14.083 |
� | -13.829 |
policies | -13.484 |
climate | -12.098 |
Token | W |
Token ID | 54 |
Feature activation | -9.28e+01 |
Pos logit contributions | |
fg | +45.126 |
zzy | +43.096 |
6 | +42.803 |
yx | +42.601 |
yne | +42.584 |
Neg logit contributions | |
behavi | -15.446 |
� | -13.846 |
policies | -13.753 |
� | -13.692 |
climate | -12.499 |
Token | https |
Token ID | 3740 |
Feature activation | -1.69e+01 |
Pos logit contributions | |
�� | +10.163 |
Remy | +9.926 |
arthed | +9.899 |
�� | +9.846 |
Blossom | +9.809 |
Neg logit contributions | |
� | -8.612 |
� | -7.842 |
policies | -7.133 |
institutions | -6.520 |
ideology | -6.432 |
Token | :// |
Token ID | 1378 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
arthed | +11.283 |
yne | +11.171 |
agle | +11.031 |
666 | +11.001 |
fg | +11.000 |
Neg logit contributions | |
behavi | -18.119 |
� | -16.825 |
policies | -16.196 |
� | -15.978 |
ideology | -15.349 |
Token | t |
Token ID | 83 |
Feature activation | -3.02e+01 |
Pos logit contributions | |
fg | +15.311 |
nox | +15.088 |
yne | +14.986 |
ilver | +14.515 |
nova | +14.409 |
Neg logit contributions | |
behavi | -18.918 |
� | -17.255 |
policies | -16.731 |
� | -16.396 |
ideology | -15.472 |
Token | . |
Token ID | 13 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
agle | +23.506 |
fg | +23.179 |
Blossom | +23.096 |
zzo | +23.077 |
666 | +22.982 |
Neg logit contributions | |
behavi | -21.518 |
� | -17.285 |
policies | -17.178 |
� | -15.905 |
institutions | -15.896 |
Token | co |
Token ID | 1073 |
Feature activation | -2.97e+01 |
Pos logit contributions | |
agle | +16.945 |
fg | +16.875 |
zzo | +16.406 |
Blossom | +16.339 |
yne | +16.215 |
Neg logit contributions | |
behavi | -22.343 |
� | -19.802 |
policies | -19.565 |
� | -18.415 |
ideology | -18.249 |
Token | / |
Token ID | 14 |
Feature activation | -1.22e+02 |
Pos logit contributions | |
yne | +23.502 |
666 | +23.428 |
fg | +23.277 |
zzo | +23.273 |
agle | +23.157 |
Neg logit contributions | |
behavi | -22.986 |
conflic | -17.607 |
policies | -16.760 |
ideology | -16.080 |
� | -16.002 |
Token | ni |
Token ID | 8461 |
Feature activation | -1.07e+02 |
Pos logit contributions | |
fg | +46.049 |
yne | +44.987 |
yx | +44.912 |
uo | +43.650 |
6 | +43.535 |
Neg logit contributions | |
behavi | -14.135 |
� | -14.007 |
� | -13.872 |
policies | -13.528 |
climate | -12.256 |
Token | WB |
Token ID | 45607 |
Feature activation | -9.65e+01 |
Pos logit contributions | |
fg | +44.202 |
yx | +43.393 |
6 | +43.353 |
yne | +43.218 |
zzy | +42.961 |
Neg logit contributions | |
behavi | -14.989 |
� | -13.802 |
� | -13.773 |
policies | -13.477 |
climate | -12.520 |
Token | qv |
Token ID | 44179 |
Feature activation | -1.09e+02 |
Pos logit contributions | |
fg | +45.731 |
yne | +43.699 |
yx | +43.442 |
zzy | +43.191 |
dd | +43.074 |
Neg logit contributions | |
behavi | -14.928 |
� | -13.985 |
� | -13.793 |
policies | -13.511 |
climate | -12.198 |
Token | fi |
Token ID | 12463 |
Feature activation | -9.91e+01 |
Pos logit contributions | |
fg | +45.425 |
yne | +43.889 |
yx | +43.512 |
uo | +43.325 |
6 | +43.289 |
Neg logit contributions | |
behavi | -15.517 |
� | -13.838 |
policies | -13.810 |
� | -13.732 |
climate | -12.205 |
Token | W |
Token ID | 54 |
Feature activation | -8.34e+01 |
Pos logit contributions | |
fg | +44.304 |
6 | +43.189 |
yne | +43.158 |
yx | +42.772 |
zzy | +42.588 |
Neg logit contributions | |
behavi | -15.629 |
policies | -13.629 |
� | -13.378 |
� | -13.139 |
climate | -12.326 |
Token | at |
Token ID | 379 |
Feature activation | -4.08e+01 |
Pos logit contributions | |
�� | +13.363 |
�� | +13.329 |
yne | +13.141 |
agle | +13.107 |
arthed | +13.086 |
Neg logit contributions | |
� | -11.918 |
� | -11.004 |
policies | -9.901 |
institutions | -9.238 |
ideology | -8.810 |
Token | a |
Token ID | 257 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
Reeves | +34.105 |
Griff | +33.884 |
Hank | +33.709 |
Dee | +33.625 |
Remy | +33.602 |
Neg logit contributions | |
� | -14.794 |
� | -12.086 |
policies | -11.112 |
behavi | -10.689 |
institutions | -8.955 |
Token | speed |
Token ID | 2866 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
Blossom | +18.741 |
Reeves | +18.731 |
JJ | +18.724 |
yne | +18.644 |
flown | +18.551 |
Neg logit contributions | |
� | -15.186 |
� | -13.479 |
policies | -12.391 |
institutions | -10.844 |
ideology | -10.468 |
Token | of |
Token ID | 286 |
Feature activation | -3.35e+01 |
Pos logit contributions | |
Reeves | +23.080 |
Remy | +23.045 |
flown | +23.005 |
agle | +22.853 |
JJ | +22.605 |
Neg logit contributions | |
� | -14.154 |
� | -12.654 |
policies | -11.775 |
behavi | -10.724 |
institutions | -10.381 |
Token | 2 |
Token ID | 362 |
Feature activation | -3.26e+01 |
Pos logit contributions | |
Reeves | +28.966 |
Remy | +28.800 |
Ventura | +28.687 |
JJ | +28.586 |
Elias | +28.583 |
Neg logit contributions | |
� | -14.945 |
� | -12.304 |
policies | -11.594 |
behavi | -11.153 |
institutions | -9.692 |
Token | , |
Token ID | 11 |
Feature activation | -1.21e+02 |
Pos logit contributions | |
Miles | +29.642 |
666 | +29.208 |
�� | +29.153 |
yne | +29.142 |
135 | +29.056 |
Neg logit contributions | |
� | -14.261 |
� | -13.126 |
behavi | -11.247 |
policies | -11.232 |
institutions | -9.940 |
Token | 658 |
Token ID | 38431 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
666 | +45.661 |
135 | +44.729 |
302 | +44.062 |
200 | +43.595 |
400 | +43.557 |
Neg logit contributions | |
behavi | -17.974 |
� | -17.838 |
� | -16.121 |
institutions | -14.853 |
policies | -14.393 |
Token | meters |
Token ID | 10700 |
Feature activation | -2.38e+01 |
Pos logit contributions | |
�� | +13.229 |
arthed | +12.775 |
Miles | +12.754 |
Reeves | +12.650 |
yne | +12.636 |
Neg logit contributions | |
� | -14.600 |
� | -13.641 |
policies | -12.201 |
ideology | -11.379 |
behavi | -11.287 |
Token | per |
Token ID | 583 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
arthed | +20.467 |
�� | +20.331 |
flown | +20.292 |
Reeves | +19.852 |
Miles | +19.843 |
Neg logit contributions | |
� | -16.261 |
� | -15.042 |
policies | -13.326 |
behavi | -12.627 |
institutions | -12.348 |
Token | second |
Token ID | 1218 |
Feature activation | -2.62e+01 |
Pos logit contributions | |
�� | +6.834 |
arthed | +6.262 |
�� | +5.966 |
Reeves | +5.933 |
yne | +5.870 |
Neg logit contributions | |
� | -15.425 |
� | -14.563 |
policies | -13.542 |
institutions | -12.833 |
ideology | -12.580 |
Token | ( |
Token ID | 357 |
Feature activation | -5.53e+01 |
Pos logit contributions | |
�� | +27.458 |
flown | +26.930 |
Reeves | +26.927 |
Remy | +26.589 |
yne | +26.432 |
Neg logit contributions | |
� | -10.525 |
� | -9.779 |
policies | -9.025 |
institutions | -7.851 |
behavi | -7.810 |
Token | pic |
Token ID | 8301 |
Feature activation | -2.67e+01 |
Pos logit contributions | |
�� | +4.696 |
arthed | +4.419 |
�� | +4.411 |
Remy | +4.381 |
yne | +4.330 |
Neg logit contributions | |
� | -4.444 |
� | -4.108 |
policies | -3.655 |
institutions | -3.362 |
ideology | -3.275 |
Token | . |
Token ID | 13 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
Blossom | +19.948 |
Gomez | +19.778 |
JJ | +19.711 |
Remy | +19.521 |
666 | +19.463 |
Neg logit contributions | |
behavi | -22.792 |
policies | -18.494 |
conflic | -18.363 |
� | -17.892 |
institutions | -17.280 |
Token | twitter |
Token ID | 6956 |
Feature activation | -4.83e+01 |
Pos logit contributions | |
fg | +6.054 |
yne | +6.032 |
agle | +5.993 |
Blossom | +5.927 |
nox | +5.892 |
Neg logit contributions | |
behavi | -18.940 |
� | -18.726 |
policies | -18.250 |
� | -17.904 |
ideology | -17.231 |
Token | . |
Token ID | 13 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
666 | +28.782 |
135 | +27.977 |
fg | +27.751 |
JJ | +27.570 |
Blossom | +27.558 |
Neg logit contributions | |
behavi | -33.071 |
conflic | -28.245 |
practition | -26.763 |
� | -25.317 |
cumbers | -22.528 |
Token | com |
Token ID | 785 |
Feature activation | -2.53e+01 |
Pos logit contributions | |
fg | +16.406 |
zzo | +16.232 |
agle | +16.115 |
666 | +16.034 |
yne | +15.891 |
Neg logit contributions | |
behavi | -24.300 |
policies | -20.347 |
� | -20.006 |
ideology | -19.001 |
� | -18.986 |
Token | / |
Token ID | 14 |
Feature activation | -1.21e+02 |
Pos logit contributions | |
666 | +18.518 |
Blossom | +18.509 |
JJ | +18.274 |
yne | +18.131 |
fg | +17.959 |
Neg logit contributions | |
behavi | -22.722 |
� | -18.451 |
policies | -18.351 |
conflic | -17.583 |
ideology | -17.373 |
Token | Eh |
Token ID | 43894 |
Feature activation | -1.05e+02 |
Pos logit contributions | |
fg | +46.010 |
yx | +44.713 |
yne | +44.656 |
6 | +43.425 |
uo | +43.365 |
Neg logit contributions | |
behavi | -14.940 |
� | -14.564 |
� | -14.435 |
policies | -14.074 |
climate | -12.714 |
Token | U |
Token ID | 52 |
Feature activation | -7.68e+01 |
Pos logit contributions | |
fg | +45.622 |
yx | +43.776 |
yne | +43.460 |
6 | +43.093 |
zzy | +43.046 |
Neg logit contributions | |
behavi | -15.093 |
� | -14.495 |
� | -14.471 |
policies | -13.625 |
climate | -12.689 |
Token | g |
Token ID | 70 |
Feature activation | -9.54e+01 |
Pos logit contributions | |
fg | +43.752 |
zzy | +42.550 |
yx | +42.487 |
yne | +42.196 |
dd | +41.584 |
Neg logit contributions | |
behavi | -14.755 |
� | -14.564 |
� | -14.337 |
policies | -13.871 |
institutions | -12.402 |
Token | I |
Token ID | 40 |
Feature activation | -7.04e+01 |
Pos logit contributions | |
fg | +44.815 |
6 | +42.629 |
yne | +42.449 |
zzy | +42.401 |
dd | +42.372 |
Neg logit contributions | |
behavi | -15.280 |
� | -14.369 |
� | -13.906 |
policies | -13.877 |
climate | -12.580 |
Token | x |
Token ID | 87 |
Feature activation | -1.08e+02 |
Pos logit contributions | |
fg | +42.696 |
zzy | +42.127 |
yne | +41.673 |
yx | +41.356 |
zzo | +41.274 |
Neg logit contributions | |
� | -14.640 |
behavi | -14.445 |
� | -13.975 |
policies | -12.920 |
climate | -11.891 |
Token | pic |
Token ID | 8301 |
Feature activation | -3.45e+01 |
Pos logit contributions | |
�� | +14.767 |
arthed | +14.377 |
�� | +14.241 |
yne | +14.190 |
Remy | +14.153 |
Neg logit contributions | |
� | -10.115 |
� | -9.128 |
policies | -7.970 |
institutions | -7.202 |
ideology | -7.013 |
Token | . |
Token ID | 13 |
Feature activation | -2.37e+01 |
Pos logit contributions | |
Blossom | +23.662 |
Gomez | +23.515 |
666 | +23.498 |
JJ | +23.211 |
fg | +22.790 |
Neg logit contributions | |
behavi | -26.691 |
conflic | -21.769 |
policies | -19.950 |
practition | -19.356 |
� | -19.241 |
Token | twitter |
Token ID | 6956 |
Feature activation | -6.22e+01 |
Pos logit contributions | |
fg | +17.991 |
nox | +17.650 |
zzo | +17.528 |
yne | +17.355 |
agle | +17.348 |
Neg logit contributions | |
behavi | -21.113 |
policies | -18.604 |
� | -18.064 |
� | -17.526 |
ideology | -17.121 |
Token | . |
Token ID | 13 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
666 | +31.471 |
. | +30.581 |
135 | +30.159 |
Blossom | +30.147 |
JJ | +29.949 |
Neg logit contributions | |
behavi | -36.328 |
conflic | -31.450 |
practition | -30.995 |
� | -29.282 |
cumbers | -25.653 |
Token | com |
Token ID | 785 |
Feature activation | -3.38e+01 |
Pos logit contributions | |
zzo | +17.234 |
fg | +17.136 |
yne | +17.088 |
agle | +16.729 |
666 | +16.651 |
Neg logit contributions | |
behavi | -22.643 |
policies | -19.060 |
� | -18.735 |
� | -17.916 |
ideology | -17.568 |
Token | / |
Token ID | 14 |
Feature activation | -1.20e+02 |
Pos logit contributions | |
666 | +25.607 |
Blossom | +25.227 |
JJ | +24.812 |
135 | +24.591 |
yx | +24.520 |
Neg logit contributions | |
behavi | -24.004 |
conflic | -18.462 |
policies | -17.666 |
� | -17.005 |
ideology | -16.610 |
Token | j |
Token ID | 73 |
Feature activation | -1.16e+02 |
Pos logit contributions | |
fg | +46.052 |
yx | +44.769 |
yne | +44.608 |
uo | +43.561 |
6 | +43.433 |
Neg logit contributions | |
behavi | -15.060 |
� | -14.411 |
� | -14.342 |
policies | -13.964 |
climate | -12.651 |
Token | Ax |
Token ID | 31554 |
Feature activation | -1.19e+02 |
Pos logit contributions | |
fg | +45.732 |
yx | +43.938 |
yne | +43.766 |
6 | +43.340 |
zzy | +42.985 |
Neg logit contributions | |
behavi | -15.458 |
� | -14.967 |
� | -14.946 |
policies | -14.056 |
climate | -12.667 |
Token | 6 |
Token ID | 21 |
Feature activation | -9.90e+01 |
Pos logit contributions | |
fg | +45.999 |
yne | +44.347 |
yx | +44.024 |
6 | +43.329 |
uo | +43.291 |
Neg logit contributions | |
behavi | -15.506 |
� | -14.435 |
� | -14.431 |
policies | -13.871 |
climate | -12.566 |
Token | c |
Token ID | 66 |
Feature activation | -9.89e+01 |
Pos logit contributions | |
fg | +45.057 |
yne | +44.045 |
yx | +44.016 |
zzy | +43.033 |
uo | +42.776 |
Neg logit contributions | |
behavi | -14.145 |
� | -14.119 |
� | -13.969 |
policies | -13.609 |
climate | -12.037 |
Token | U |
Token ID | 52 |
Feature activation | -7.82e+01 |
Pos logit contributions | |
fg | +44.910 |
zzy | +42.941 |
yne | +42.841 |
yx | +42.782 |
6 | +42.773 |
Neg logit contributions | |
behavi | -15.389 |
� | -14.001 |
� | -13.916 |
policies | -13.663 |
climate | -12.463 |
Token | https |
Token ID | 3740 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
� | +24.307 |
� | +23.111 |
policies | +19.997 |
institutions | +18.566 |
climate | +18.527 |
Neg logit contributions | |
�� | -14.340 |
�� | -12.921 |
arthed | -12.724 |
yne | -12.353 |
�� | -12.073 |
Token | :// |
Token ID | 1378 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
arthed | +9.151 |
yne | +9.070 |
Remy | +9.068 |
Blossom | +9.050 |
Gomez | +8.930 |
Neg logit contributions | |
behavi | -13.723 |
� | -13.504 |
policies | -13.010 |
� | -12.832 |
institutions | -12.235 |
Token | t |
Token ID | 83 |
Feature activation | -3.26e+01 |
Pos logit contributions | |
nox | +6.853 |
yne | +6.754 |
fg | +6.540 |
ilver | +6.449 |
arthed | +6.402 |
Neg logit contributions | |
� | -17.482 |
� | -16.776 |
behavi | -16.677 |
policies | -16.398 |
institutions | -15.433 |
Token | . |
Token ID | 13 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
agle | +25.230 |
fg | +24.859 |
zzo | +24.846 |
666 | +24.804 |
Blossom | +24.625 |
Neg logit contributions | |
behavi | -21.956 |
policies | -16.952 |
� | -16.850 |
conflic | -16.355 |
institutions | -15.740 |
Token | co |
Token ID | 1073 |
Feature activation | -2.74e+01 |
Pos logit contributions | |
fg | +18.240 |
agle | +18.064 |
Blossom | +17.948 |
zzo | +17.924 |
yne | +17.803 |
Neg logit contributions | |
behavi | -22.872 |
policies | -19.396 |
� | -19.283 |
ideology | -18.086 |
� | -17.911 |
Token | / |
Token ID | 14 |
Feature activation | -1.20e+02 |
Pos logit contributions | |
yne | +21.707 |
zzo | +21.587 |
fg | +21.582 |
666 | +21.511 |
agle | +21.279 |
Neg logit contributions | |
behavi | -22.066 |
conflic | -16.962 |
policies | -16.729 |
� | -16.128 |
ideology | -15.922 |
Token | c |
Token ID | 66 |
Feature activation | -1.05e+02 |
Pos logit contributions | |
fg | +46.034 |
yx | +44.867 |
yne | +44.799 |
uo | +43.550 |
6 | +43.541 |
Neg logit contributions | |
behavi | -14.499 |
� | -14.050 |
� | -14.010 |
policies | -13.593 |
climate | -12.341 |
Token | Q |
Token ID | 48 |
Feature activation | -1.09e+02 |
Pos logit contributions | |
fg | +44.912 |
yx | +43.364 |
yne | +43.263 |
zzy | +43.192 |
6 | +43.121 |
Neg logit contributions | |
behavi | -14.950 |
� | -13.989 |
� | -13.868 |
policies | -13.553 |
climate | -12.563 |
Token | 3 |
Token ID | 18 |
Feature activation | -9.62e+01 |
Pos logit contributions | |
fg | +45.818 |
yx | +44.512 |
yne | +44.139 |
6 | +43.062 |
uo | +43.002 |
Neg logit contributions | |
behavi | -14.650 |
� | -13.897 |
� | -13.879 |
policies | -13.681 |
climate | -12.312 |
Token | x |
Token ID | 87 |
Feature activation | -1.11e+02 |
Pos logit contributions | |
fg | +44.993 |
yne | +44.218 |
yx | +43.826 |
zzy | +42.766 |
uo | +42.752 |
Neg logit contributions | |
� | -14.091 |
� | -13.809 |
behavi | -13.687 |
policies | -13.255 |
climate | -11.851 |
Token | mb |
Token ID | 2022 |
Feature activation | -1.10e+02 |
Pos logit contributions | |
fg | +45.599 |
yx | +43.888 |
yne | +43.788 |
zzy | +43.297 |
uo | +43.267 |
Neg logit contributions | |
behavi | -14.897 |
� | -14.148 |
� | -13.899 |
policies | -13.634 |
climate | -12.546 |
Token | I |
Token ID | 314 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
� | +15.005 |
� | +13.990 |
policies | +12.346 |
institutions | +11.468 |
climate | +11.319 |
Neg logit contributions | |
�� | -11.867 |
arthed | -10.717 |
�� | -10.597 |
�� | -10.164 |
yne | -10.147 |
Token | have |
Token ID | 423 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
� | +27.394 |
� | +25.270 |
policies | +21.407 |
climate | +20.209 |
institutions | +20.046 |
Neg logit contributions | |
�� | -15.045 |
arthed | -13.861 |
�� | -12.762 |
Canaver | -12.656 |
senal | -12.649 |
Token | finally |
Token ID | 3443 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
�� | +12.155 |
�� | +12.146 |
Remy | +11.956 |
Blossom | +11.885 |
arthed | +11.860 |
Neg logit contributions | |
� | -10.149 |
� | -9.420 |
policies | -7.926 |
behavi | -7.199 |
institutions | -7.176 |
Token | started |
Token ID | 2067 |
Feature activation | -6.01e+00 |
Pos logit contributions | |
flown | +21.667 |
�� | +21.450 |
Blossom | +21.302 |
JJ | +21.260 |
zzo | +21.214 |
Neg logit contributions | |
� | -11.700 |
� | -10.533 |
policies | -9.387 |
behavi | -9.225 |
institutions | -8.271 |
Token | pursuing |
Token ID | 15461 |
Feature activation | +8.57e+00 |
Pos logit contributions | |
�� | +5.749 |
�� | +5.516 |
arthed | +5.445 |
Remy | +5.366 |
yne | +5.329 |
Neg logit contributions | |
� | -6.620 |
� | -6.183 |
policies | -5.521 |
institutions | -5.054 |
ideology | -4.970 |
Token | music |
Token ID | 2647 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
� | +11.589 |
� | +10.943 |
policies | +9.941 |
institutions | +9.326 |
climate | +9.169 |
Neg logit contributions | |
�� | -7.303 |
arthed | -6.451 |
�� | -6.383 |
��極 | -6.021 |
�� | -5.994 |
Token | seriously |
Token ID | 6411 |
Feature activation | +7.51e-01 |
Pos logit contributions | |
� | +23.594 |
� | +22.252 |
policies | +19.626 |
institutions | +18.348 |
policy | +18.196 |
Neg logit contributions | |
�� | -16.756 |
arthed | -14.854 |
��極 | -14.525 |
�� | -14.490 |
�� | -13.665 |
Token | , |
Token ID | 11 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
� | +0.948 |
� | +0.891 |
policies | +0.804 |
institutions | +0.747 |
climate | +0.733 |
Neg logit contributions | |
�� | -0.690 |
�� | -0.640 |
arthed | -0.632 |
yne | -0.609 |
Remy | -0.603 |
Token | I |
Token ID | 314 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
� | +15.848 |
� | +14.802 |
policies | +12.929 |
institutions | +12.019 |
climate | +11.928 |
Neg logit contributions | |
�� | -12.837 |
arthed | -11.658 |
�� | -11.411 |
��極 | -11.192 |
�� | -11.022 |
Token | live |
Token ID | 2107 |
Feature activation | -5.00e+00 |
Pos logit contributions | |
� | +21.490 |
� | +19.894 |
policies | +16.586 |
climate | +15.638 |
institutions | +15.484 |
Neg logit contributions | |
�� | -14.892 |
arthed | -13.813 |
�� | -12.881 |
senal | -12.750 |
Canaver | -12.546 |
Token | in |
Token ID | 287 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
�� | +4.294 |
�� | +4.095 |
arthed | +4.028 |
yne | +3.967 |
Remy | +3.950 |
Neg logit contributions | |
� | -6.104 |
� | -5.726 |
policies | -5.158 |
institutions | -4.790 |
ideology | -4.743 |
Token | expand |
Token ID | 4292 |
Feature activation | +3.10e+01 |
Pos logit contributions | |
� | +21.523 |
� | +20.346 |
policies | +18.225 |
institutions | +17.660 |
economic | +17.182 |
Neg logit contributions | |
�� | -15.664 |
arthed | -14.266 |
�� | -13.878 |
�� | -13.358 |
��極 | -13.347 |
Token | the |
Token ID | 262 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
� | +31.430 |
� | +30.124 |
policies | +27.449 |
economic | +27.074 |
institutions | +26.692 |
Neg logit contributions | |
�� | -20.464 |
�� | -18.146 |
arthed | -17.850 |
senal | -17.732 |
Canaver | -17.642 |
Token | nation |
Token ID | 3277 |
Feature activation | +3.60e+01 |
Pos logit contributions | |
� | +19.618 |
� | +18.725 |
policies | +16.970 |
economic | +16.063 |
institutions | +15.949 |
Neg logit contributions | |
�� | -16.089 |
arthed | -14.841 |
�� | -14.774 |
�� | -14.143 |
yne | -14.121 |
Token | � |
Token ID | 447 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
� | +36.387 |
� | +33.736 |
policies | +28.000 |
| +27.049 |
institutions | +26.733 |
Neg logit contributions | |
�� | -23.041 |
�� | -22.701 |
arthed | -21.638 |
Canaver | -21.172 |
�� | -20.554 |
Token | � |
Token ID | 247 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
�� | +20.973 |
�� | +20.474 |
� | +19.372 |
� | +19.275 |
� | +19.237 |
Neg logit contributions | |
� | -19.284 |
� | -18.644 |
policies | -17.469 |
behavi | -17.407 |
climate | -16.150 |
Token | s |
Token ID | 82 |
Feature activation | +2.30e+01 |
Pos logit contributions | |
� | +24.279 |
� | +22.990 |
policies | +20.123 |
institutions | +19.319 |
economic | +18.825 |
Neg logit contributions | |
�� | -18.081 |
�� | -16.872 |
�� | -15.999 |
arthed | -15.828 |
��極 | -15.307 |
Token | internet |
Token ID | 5230 |
Feature activation | +4.14e+01 |
Pos logit contributions | |
� | +24.696 |
� | +23.573 |
policies | +21.663 |
economic | +20.948 |
institutions | +20.947 |
Neg logit contributions | |
�� | -18.636 |
arthed | -16.877 |
�� | -16.851 |
�� | -16.461 |
nesday | -15.803 |
Token | bandwidth |
Token ID | 19484 |
Feature activation | +4.10e+01 |
Pos logit contributions | |
� | +38.850 |
� | +37.088 |
policies | +32.341 |
infrastructure | +31.698 |
institutions | +30.984 |
Neg logit contributions | |
�� | -23.315 |
Canaver | -21.488 |
�� | -21.481 |
arthed | -21.003 |
nesday | -20.105 |
Token | availability |
Token ID | 11500 |
Feature activation | +3.75e+01 |
Pos logit contributions | |
� | +38.915 |
� | +36.955 |
policies | +32.164 |
infrastructure | +30.358 |
policy | +30.347 |
Neg logit contributions | |
�� | -22.348 |
arthed | -20.758 |
Canaver | -20.665 |
�� | -20.230 |
�� | -19.371 |
Token | and |
Token ID | 290 |
Feature activation | +3.09e+01 |
Pos logit contributions | |
� | +37.193 |
� | +35.067 |
policies | +29.839 |
policy | +27.830 |
institutions | +27.749 |
Neg logit contributions | |
�� | -22.053 |
arthed | -20.432 |
�� | -19.832 |
senal | -19.428 |
Canaver | -19.346 |
Token | speed |
Token ID | 2866 |
Feature activation | +3.66e+01 |
Pos logit contributions | |
� | +32.452 |
� | +31.051 |
policies | +28.297 |
institutions | +26.726 |
economic | +26.722 |
Neg logit contributions | |
�� | -19.738 |
arthed | -17.999 |
�� | -17.212 |
�� | -17.104 |
senal | -17.038 |
Token | supervised |
Token ID | 28679 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
� | +0.975 |
� | +0.917 |
policies | +0.826 |
institutions | +0.769 |
climate | +0.756 |
Neg logit contributions | |
�� | -0.659 |
�� | -0.608 |
arthed | -0.599 |
yne | -0.576 |
Remy | -0.571 |
Token | injection |
Token ID | 16954 |
Feature activation | +3.01e+01 |
Pos logit contributions | |
� | +13.412 |
� | +12.558 |
policies | +11.170 |
institutions | +10.443 |
climate | +10.034 |
Neg logit contributions | |
�� | -14.887 |
arthed | -14.104 |
�� | -13.940 |
senal | -13.564 |
��極 | -13.516 |
Token | site |
Token ID | 2524 |
Feature activation | +2.19e+01 |
Pos logit contributions | |
� | +30.746 |
� | +29.806 |
policies | +27.981 |
institutions | +26.773 |
policy | +26.348 |
Neg logit contributions | |
�� | -22.251 |
�� | -19.241 |
arthed | -18.536 |
�� | -18.228 |
yne | -17.873 |
Token | , |
Token ID | 11 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
� | +27.575 |
� | +26.488 |
policies | +23.767 |
policy | +22.297 |
institutions | +22.212 |
Neg logit contributions | |
�� | -14.827 |
arthed | -12.873 |
yne | -12.665 |
�� | -12.551 |
��極 | -12.170 |
Token | the |
Token ID | 262 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
� | +19.376 |
� | +18.434 |
policies | +16.768 |
institutions | +15.659 |
policy | +15.365 |
Neg logit contributions | |
�� | -11.175 |
arthed | -10.056 |
�� | -10.002 |
yne | -9.708 |
�� | -9.548 |
Token | challenging |
Token ID | 9389 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
� | +17.456 |
� | +16.627 |
policies | +15.123 |
institutions | +14.211 |
climate | +13.919 |
Neg logit contributions | |
�� | -11.368 |
arthed | -10.562 |
�� | -10.296 |
yne | -9.929 |
senal | -9.795 |
Token | of |
Token ID | 286 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
� | +25.792 |
� | +24.948 |
policies | +23.640 |
climate | +22.083 |
policy | +21.996 |
Neg logit contributions | |
�� | -15.945 |
arthed | -15.000 |
�� | -14.583 |
��極 | -14.001 |
senal | -13.987 |
Token | federal |
Token ID | 2717 |
Feature activation | +4.20e+01 |
Pos logit contributions | |
� | +21.950 |
� | +21.154 |
policies | +19.879 |
institutions | +18.406 |
policy | +18.253 |
Neg logit contributions | |
�� | -13.338 |
arthed | -12.044 |
�� | -11.757 |
senal | -11.489 |
yne | -11.467 |
Token | drug |
Token ID | 2563 |
Feature activation | +3.77e+01 |
Pos logit contributions | |
policies | +36.391 |
� | +35.725 |
� | +35.299 |
policy | +34.072 |
institutions | +32.734 |
Neg logit contributions | |
�� | -22.588 |
��極 | -20.351 |
senal | -20.232 |
arthed | -19.962 |
�� | -19.232 |
Token | laws |
Token ID | 3657 |
Feature activation | +9.24e+00 |
Pos logit contributions | |
policies | +34.089 |
� | +33.838 |
� | +32.430 |
policy | +31.566 |
laws | +29.374 |
Neg logit contributions | |
�� | -23.809 |
�� | -21.636 |
�� | -21.426 |
��極 | -21.129 |
senal | -20.844 |
Token | , |
Token ID | 11 |
Feature activation | +2.35e+01 |
Pos logit contributions | |
� | +12.039 |
� | +11.335 |
policies | +10.103 |
institutions | +9.307 |
climate | +9.188 |
Neg logit contributions | |
�� | -8.137 |
arthed | -7.502 |
�� | -7.451 |
yne | -7.100 |
�� | -7.002 |
Token | and |
Token ID | 290 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
�� | +1.145 |
�� | +1.066 |
arthed | +1.065 |
yne | +1.033 |
Remy | +1.024 |
Neg logit contributions | |
� | -1.334 |
� | -1.242 |
policies | -1.103 |
institutions | -1.022 |
climate | -0.997 |
Token | the |
Token ID | 262 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
� | +17.989 |
� | +17.042 |
policies | +16.162 |
economic | +15.144 |
climate | +15.027 |
Neg logit contributions | |
�� | -14.276 |
�� | -12.791 |
arthed | -12.467 |
��極 | -12.309 |
senal | -12.225 |
Token | associated |
Token ID | 3917 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
� | +15.259 |
� | +14.418 |
policies | +13.487 |
economic | +12.467 |
climate | +12.412 |
Neg logit contributions | |
�� | -12.890 |
�� | -11.809 |
arthed | -11.584 |
senal | -11.183 |
��極 | -11.080 |
Token | credit |
Token ID | 3884 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
� | +24.746 |
� | +23.850 |
policies | +23.523 |
economic | +22.248 |
climate | +21.574 |
Neg logit contributions | |
�� | -20.250 |
�� | -17.509 |
arthed | -17.169 |
senal | -17.092 |
��極 | -16.796 |
Token | crunch |
Token ID | 23527 |
Feature activation | +5.14e+00 |
Pos logit contributions | |
� | +25.695 |
� | +24.312 |
policies | +23.738 |
climate | +21.874 |
policy | +21.865 |
Neg logit contributions | |
�� | -24.935 |
�� | -20.957 |
arthed | -20.836 |
��極 | -20.384 |
Canaver | -20.084 |
Token | accelerate |
Token ID | 22636 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
� | +6.603 |
� | +6.230 |
policies | +5.611 |
institutions | +5.208 |
climate | +5.155 |
Neg logit contributions | |
�� | -4.694 |
�� | -4.330 |
arthed | -4.255 |
yne | -4.038 |
�� | -4.014 |
Token | and |
Token ID | 290 |
Feature activation | +2.40e+01 |
Pos logit contributions | |
� | +21.400 |
� | +20.245 |
policies | +18.535 |
economic | +17.324 |
climate | +17.038 |
Neg logit contributions | |
�� | -18.956 |
�� | -16.772 |
arthed | -16.290 |
��極 | -16.147 |
senal | -15.823 |
Token | spill |
Token ID | 19431 |
Feature activation | +8.32e+00 |
Pos logit contributions | |
� | +25.895 |
� | +24.728 |
policies | +24.035 |
economic | +22.479 |
institutions | +22.326 |
Neg logit contributions | |
�� | -18.655 |
�� | -15.984 |
arthed | -15.787 |
��極 | -15.628 |
senal | -15.140 |
Token | over |
Token ID | 625 |
Feature activation | +8.97e+00 |
Pos logit contributions | |
� | +10.208 |
� | +9.601 |
policies | +8.749 |
institutions | +8.101 |
climate | +8.015 |
Neg logit contributions | |
�� | -7.798 |
�� | -7.138 |
arthed | -6.970 |
yne | -6.685 |
Remy | -6.634 |
Token | to |
Token ID | 284 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
� | +11.304 |
� | +10.721 |
policies | +9.762 |
institutions | +9.139 |
climate | +8.948 |
Neg logit contributions | |
�� | -8.175 |
�� | -7.404 |
arthed | -7.255 |
yne | -6.936 |
��極 | -6.932 |
Token | the |
Token ID | 262 |
Feature activation | +8.33e+00 |
Pos logit contributions | |
� | +12.597 |
� | +11.906 |
policies | +10.951 |
institutions | +10.205 |
climate | +9.994 |
Neg logit contributions | |
�� | -10.090 |
�� | -9.095 |
arthed | -8.929 |
��極 | -8.619 |
yne | -8.486 |
Token | , |
Token ID | 11 |
Feature activation | +2.31e+01 |
Pos logit contributions | |
� | +22.729 |
� | +21.142 |
policies | +18.665 |
institutions | +16.944 |
climate | +16.939 |
Neg logit contributions | |
�� | -16.330 |
arthed | -15.238 |
�� | -14.380 |
��極 | -14.019 |
senal | -13.968 |
Token | and |
Token ID | 290 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
� | +27.032 |
� | +25.295 |
policies | +22.866 |
climate | +21.134 |
institutions | +21.001 |
Neg logit contributions | |
�� | -17.370 |
arthed | -15.639 |
�� | -14.714 |
��極 | -14.541 |
senal | -14.436 |
Token | they |
Token ID | 484 |
Feature activation | +3.42e+01 |
Pos logit contributions | |
� | +20.630 |
� | +19.568 |
policies | +17.867 |
climate | +16.438 |
institutions | +16.398 |
Neg logit contributions | |
�� | -14.721 |
arthed | -12.982 |
��極 | -12.369 |
senal | -12.222 |
�� | -12.185 |
Token | probably |
Token ID | 2192 |
Feature activation | +2.31e+01 |
Pos logit contributions | |
� | +36.861 |
� | +34.332 |
policies | +28.418 |
climate | +27.068 |
| +26.779 |
Neg logit contributions | |
�� | -22.768 |
senal | -19.886 |
arthed | -19.728 |
��極 | -18.632 |
�� | -18.491 |
Token | hate |
Token ID | 5465 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
� | +26.515 |
� | +24.945 |
policies | +21.365 |
climate | +19.917 |
institutions | +19.518 |
Neg logit contributions | |
�� | -19.902 |
arthed | -17.860 |
senal | -17.526 |
�� | -16.662 |
��極 | -16.472 |
Token | black |
Token ID | 2042 |
Feature activation | +3.21e+01 |
Pos logit contributions | |
� | +20.043 |
� | +19.107 |
policies | +17.394 |
climate | +16.146 |
institutions | +16.124 |
Neg logit contributions | |
�� | -11.765 |
arthed | -10.198 |
�� | -9.960 |
��極 | -9.787 |
senal | -9.599 |
Token | people |
Token ID | 661 |
Feature activation | +1.89e+01 |
Pos logit contributions | |
� | +32.204 |
� | +30.731 |
policies | +27.619 |
institutions | +26.276 |
political | +25.810 |
Neg logit contributions | |
�� | -24.367 |
arthed | -21.390 |
senal | -20.004 |
�� | -19.399 |
Canaver | -19.210 |
Token | , |
Token ID | 11 |
Feature activation | +2.30e+01 |
Pos logit contributions | |
� | +22.777 |
� | +21.131 |
policies | +18.107 |
climate | +16.671 |
institutions | +16.671 |
Neg logit contributions | |
�� | -16.514 |
arthed | -15.351 |
�� | -14.565 |
senal | -14.313 |
��極 | -13.805 |
Token | too |
Token ID | 1165 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
� | +26.247 |
� | +24.614 |
policies | +22.231 |
climate | +21.054 |
institutions | +20.913 |
Neg logit contributions | |
�� | -18.475 |
arthed | -16.513 |
�� | -15.332 |
��極 | -15.246 |
senal | -15.128 |
Token | … |
Token ID | 1399 |
Feature activation | +3.14e+01 |
Pos logit contributions | |
� | +21.441 |
� | +20.009 |
policies | +17.131 |
climate | +15.884 |
institutions | +15.794 |
Neg logit contributions | |
�� | -14.633 |
arthed | -13.578 |
�� | -12.808 |
��極 | -12.389 |
�� | -12.354 |
Token | Oh |
Token ID | 3966 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
� | +34.749 |
� | +32.660 |
policies | +28.955 |
climate | +27.314 |
institutions | +26.939 |
Neg logit contributions | |
�� | -18.165 |
arthed | -15.784 |
senal | -15.489 |
��極 | -15.244 |
�� | -14.886 |
Token | 19 |
Token ID | 678 |
Feature activation | +6.74e+00 |
Pos logit contributions | |
� | +26.589 |
� | +25.331 |
policies | +23.106 |
institutions | +21.839 |
climate | +21.597 |
Neg logit contributions | |
�� | -10.114 |
�� | -8.870 |
arthed | -8.599 |
�� | -8.035 |
yne | -7.996 |
Token | P |
Token ID | 47 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
� | +9.540 |
� | +9.045 |
policies | +8.177 |
institutions | +7.668 |
climate | +7.548 |
Neg logit contributions | |
�� | -5.187 |
�� | -4.680 |
arthed | -4.621 |
yne | -4.365 |
�� | -4.311 |
Token | / |
Token ID | 14 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
�� | +0.962 |
�� | +0.896 |
arthed | +0.885 |
yne | +0.857 |
Remy | +0.848 |
Neg logit contributions | |
� | -1.381 |
� | -1.298 |
policies | -1.174 |
institutions | -1.096 |
climate | -1.072 |
Token | B |
Token ID | 33 |
Feature activation | +3.71e+00 |
Pos logit contributions | |
�� | +18.340 |
arthed | +17.946 |
�� | +17.877 |
yne | +17.779 |
nox | +17.383 |
Neg logit contributions | |
� | -11.323 |
� | -10.370 |
policies | -9.206 |
institutions | -8.207 |
ideology | -7.762 |
Token | or |
Token ID | 273 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
� | +5.233 |
� | +4.952 |
policies | +4.490 |
institutions | +4.210 |
climate | +4.147 |
Neg logit contributions | |
�� | -2.908 |
�� | -2.629 |
arthed | -2.602 |
yne | -2.464 |
Remy | -2.432 |
Token | rell |
Token ID | 11252 |
Feature activation | -8.22e+00 |
Pos logit contributions | |
�� | +1.859 |
�� | +1.686 |
arthed | +1.677 |
yne | +1.637 |
Blossom | +1.592 |
Neg logit contributions | |
� | -3.724 |
� | -3.543 |
policies | -3.250 |
institutions | -3.060 |
climate | -3.017 |
Token | y |
Token ID | 88 |
Feature activation | -6.23e+00 |
Pos logit contributions | |
�� | +8.546 |
�� | +8.200 |
yne | +8.172 |
arthed | +8.086 |
Blossom | +8.004 |
Neg logit contributions | |
� | -8.227 |
� | -7.595 |
policies | -6.829 |
institutions | -6.241 |
ideology | -6.064 |
Token | Animation |
Token ID | 23535 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
�� | +6.583 |
�� | +6.307 |
arthed | +6.246 |
yne | +6.183 |
Blossom | +6.084 |
Neg logit contributions | |
� | -6.413 |
� | -5.936 |
policies | -5.311 |
institutions | -4.851 |
ideology | -4.726 |
Token | of |
Token ID | 286 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
� | +15.387 |
� | +14.641 |
policies | +13.212 |
institutions | +12.346 |
policy | +12.159 |
Neg logit contributions | |
�� | -8.103 |
�� | -7.240 |
arthed | -7.148 |
�� | -6.812 |
yne | -6.561 |
Token | tra |
Token ID | 9535 |
Feature activation | -7.31e+00 |
Pos logit contributions | |
� | +2.151 |
� | +2.032 |
policies | +1.843 |
institutions | +1.726 |
climate | +1.699 |
Neg logit contributions | |
�� | -1.243 |
�� | -1.134 |
arthed | -1.121 |
yne | -1.069 |
Remy | -1.055 |
Token | ject |
Token ID | 752 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
�� | +5.877 |
arthed | +5.367 |
�� | +5.291 |
yne | +5.186 |
agle | +5.046 |
Neg logit contributions | |
� | -9.536 |
� | -9.071 |
policies | -8.198 |
institutions | -7.608 |
climate | -7.546 |
Token | kilometres |
Token ID | 23990 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
� | +0.538 |
� | +0.512 |
policies | +0.472 |
institutions | +0.446 |
climate | +0.440 |
Neg logit contributions | |
�� | -0.192 |
�� | -0.172 |
arthed | -0.168 |
yne | -0.159 |
Remy | -0.154 |
Token | to |
Token ID | 284 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
�� | +1.269 |
�� | +1.204 |
arthed | +1.190 |
yne | +1.164 |
Remy | +1.149 |
Neg logit contributions | |
� | -1.332 |
� | -1.238 |
policies | -1.119 |
institutions | -1.029 |
ideology | -0.997 |
Token | Tan |
Token ID | 11818 |
Feature activation | -4.85e+00 |
Pos logit contributions | |
�� | +11.004 |
Remy | +10.737 |
�� | +10.630 |
yne | +10.533 |
Reeves | +10.407 |
Neg logit contributions | |
� | -9.942 |
� | -9.110 |
policies | -8.336 |
institutions | -7.574 |
behavi | -7.398 |
Token | unda |
Token ID | 46535 |
Feature activation | +3.84e+00 |
Pos logit contributions | |
�� | +3.548 |
arthed | +3.397 |
�� | +3.251 |
yne | +3.188 |
agle | +3.159 |
Neg logit contributions | |
� | -6.630 |
� | -6.274 |
policies | -5.740 |
institutions | -5.395 |
ideology | -5.313 |
Token | and |
Token ID | 290 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
� | +4.915 |
� | +4.613 |
policies | +4.107 |
institutions | +3.826 |
climate | +3.772 |
Neg logit contributions | |
�� | -3.552 |
�� | -3.258 |
arthed | -3.231 |
yne | -3.073 |
Remy | -3.053 |
Token | may |
Token ID | 743 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
Remy | +16.018 |
Blossom | +15.933 |
�� | +15.854 |
�� | +15.831 |
yne | +15.819 |
Neg logit contributions | |
� | -10.108 |
� | -9.091 |
policies | -7.902 |
behavi | -7.089 |
institutions | -7.014 |
Token | see |
Token ID | 766 |
Feature activation | -2.33e+01 |
Pos logit contributions | |
�� | +2.064 |
�� | +1.956 |
arthed | +1.911 |
yne | +1.890 |
Remy | +1.863 |
Neg logit contributions | |
� | -1.949 |
� | -1.801 |
policies | -1.603 |
institutions | -1.463 |
ideology | -1.420 |
Token | overall |
Token ID | 4045 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
Remy | +24.728 |
Rowe | +24.516 |
JJ | +24.405 |
Richie | +24.244 |
Gomez | +24.204 |
Neg logit contributions | |
� | -12.674 |
� | -11.369 |
policies | -9.582 |
behavi | -8.662 |
ideology | -8.455 |
Token | contenders |
Token ID | 29467 |
Feature activation | -2.90e+01 |
Pos logit contributions | |
� | +12.328 |
� | +11.573 |
policies | +10.286 |
institutions | +9.524 |
climate | +9.438 |
Neg logit contributions | |
�� | -10.401 |
arthed | -9.314 |
�� | -9.295 |
��極 | -9.025 |
�� | -8.931 |
Token | who |
Token ID | 508 |
Feature activation | +8.10e+00 |
Pos logit contributions | |
Remy | +31.603 |
JJ | +30.976 |
yne | +30.659 |
Gomez | +30.638 |
Rowe | +30.541 |
Neg logit contributions | |
� | -10.802 |
� | -9.116 |
policies | -8.023 |
behavi | -7.162 |
institutions | -6.598 |
Token | are |
Token ID | 389 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
� | +9.479 |
� | +8.886 |
policies | +7.737 |
climate | +7.094 |
institutions | +7.065 |
Neg logit contributions | |
�� | -8.407 |
arthed | -7.674 |
�� | -7.651 |
senal | -7.238 |
�� | -7.225 |
Token | little |
Token ID | 1310 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
�� | +3.857 |
arthed | +3.497 |
�� | +3.490 |
Remy | +3.411 |
yne | +3.404 |
Neg logit contributions | |
� | -5.290 |
� | -4.951 |
policies | -4.509 |
institutions | -4.165 |
ideology | -4.011 |
Token | basic |
Token ID | 4096 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
�� | +1.578 |
�� | +1.470 |
arthed | +1.467 |
Remy | +1.420 |
yne | +1.415 |
Neg logit contributions | |
� | -1.809 |
� | -1.683 |
policies | -1.503 |
institutions | -1.379 |
climate | -1.346 |
Token | . |
Token ID | 13 |
Feature activation | +8.91e+00 |
Pos logit contributions | |
� | +5.051 |
� | +4.771 |
policies | +4.296 |
institutions | +4.012 |
climate | +3.957 |
Neg logit contributions | |
�� | -3.241 |
�� | -2.963 |
arthed | -2.937 |
yne | -2.781 |
�� | -2.760 |
Token | That |
Token ID | 1320 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
� | +10.596 |
� | +9.904 |
policies | +8.462 |
climate | +7.749 |
institutions | +7.740 |
Neg logit contributions | |
�� | -9.011 |
�� | -8.317 |
arthed | -8.116 |
senal | -7.890 |
�� | -7.805 |
Token | may |
Token ID | 743 |
Feature activation | +3.75e+00 |
Pos logit contributions | |
� | +16.460 |
� | +15.463 |
policies | +13.661 |
climate | +12.735 |
ideology | +12.699 |
Neg logit contributions | |
�� | -14.456 |
�� | -13.512 |
arthed | -13.238 |
senal | -12.806 |
�� | -12.737 |
Token | not |
Token ID | 407 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
� | +4.010 |
� | +3.733 |
policies | +3.251 |
institutions | +2.964 |
climate | +2.919 |
Neg logit contributions | |
�� | -4.238 |
�� | -3.971 |
arthed | -3.958 |
yne | -3.784 |
�� | -3.766 |
Token | be |
Token ID | 307 |
Feature activation | -1.79e+01 |
Pos logit contributions | |
�� | +1.251 |
�� | +1.169 |
arthed | +1.156 |
yne | +1.134 |
Remy | +1.120 |
Neg logit contributions | |
� | -1.269 |
� | -1.177 |
policies | -1.046 |
institutions | -0.961 |
climate | -0.934 |
Token | the |
Token ID | 262 |
Feature activation | +9.62e+00 |
Pos logit contributions | |
Remy | +15.812 |
JJ | +15.527 |
�� | +15.441 |
�� | +15.256 |
Reeves | +15.202 |
Neg logit contributions | |
� | -15.630 |
� | -14.296 |
policies | -12.574 |
institutions | -11.568 |
behavi | -11.485 |
Token | case |
Token ID | 1339 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
� | +7.854 |
� | +7.119 |
policies | +6.022 |
climate | +5.277 |
institutions | +5.266 |
Neg logit contributions | |
�� | -12.906 |
arthed | -12.258 |
�� | -12.191 |
�� | -11.763 |
senal | -11.719 |
Token | for |
Token ID | 329 |
Feature activation | -9.51e+00 |
Pos logit contributions | |
JJ | +24.508 |
Remy | +24.433 |
yne | +24.030 |
Reeves | +23.778 |
Gomez | +23.758 |
Neg logit contributions | |
� | -14.109 |
� | -12.544 |
policies | -11.327 |
behavi | -10.619 |
governance | -10.412 |
Token | much |
Token ID | 881 |
Feature activation | +4.04e+00 |
Pos logit contributions | |
�� | +9.127 |
Remy | +8.918 |
JJ | +8.826 |
Reeves | +8.801 |
yne | +8.725 |
Neg logit contributions | |
� | -9.771 |
� | -9.039 |
policies | -7.839 |
ideology | -7.086 |
institutions | -7.069 |
Token | interest |
Token ID | 1393 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
� | +12.986 |
� | +12.121 |
policies | +10.911 |
institutions | +10.151 |
policy | +9.897 |
Neg logit contributions | |
�� | -12.639 |
�� | -11.712 |
arthed | -11.402 |
��極 | -11.279 |
�� | -11.258 |
Token | litigation |
Token ID | 19284 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
� | +10.272 |
� | +9.614 |
policies | +8.433 |
institutions | +7.721 |
climate | +7.559 |
Neg logit contributions | |
�� | -11.973 |
�� | -11.101 |
arthed | -10.874 |
ometown | -10.762 |
��極 | -10.715 |
Token | ( |
Token ID | 357 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
�� | +9.691 |
arthed | +9.254 |
JJ | +9.248 |
Remy | +9.180 |
�� | +9.124 |
Neg logit contributions | |
� | -10.514 |
� | -9.632 |
policies | -8.545 |
behavi | -7.838 |
institutions | -7.799 |
Token | P |
Token ID | 47 |
Feature activation | -2.44e+01 |
Pos logit contributions | |
�� | +12.643 |
arthed | +12.144 |
�� | +11.926 |
yne | +11.566 |
Remy | +11.509 |
Neg logit contributions | |
� | -15.072 |
� | -14.421 |
policies | -12.913 |
institutions | -11.925 |
behavi | -11.723 |
Token | IL |
Token ID | 4146 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
agle | +22.999 |
arthed | +22.916 |
�� | +22.760 |
JJ | +22.539 |
yne | +22.451 |
Neg logit contributions | |
� | -15.759 |
� | -14.913 |
policies | -13.835 |
behavi | -12.700 |
institutions | -12.020 |
Token | ) |
Token ID | 8 |
Feature activation | -6.39e+00 |
Pos logit contributions | |
�� | +11.557 |
arthed | +11.157 |
JJ | +11.037 |
Remy | +10.802 |
�� | +10.721 |
Neg logit contributions | |
� | -14.456 |
� | -13.475 |
policies | -12.209 |
institutions | -11.508 |
behavi | -11.383 |
Token | in |
Token ID | 287 |
Feature activation | -7.92e+00 |
Pos logit contributions | |
�� | +6.168 |
arthed | +5.845 |
�� | +5.679 |
Remy | +5.647 |
yne | +5.610 |
Neg logit contributions | |
� | -7.185 |
� | -6.641 |
policies | -5.955 |
institutions | -5.476 |
ideology | -5.367 |
Token | the |
Token ID | 262 |
Feature activation | -6.16e+00 |
Pos logit contributions | |
�� | +8.590 |
arthed | +7.966 |
�� | +7.903 |
JJ | +7.895 |
Remy | +7.846 |
Neg logit contributions | |
� | -7.875 |
� | -7.201 |
policies | -6.388 |
institutions | -5.664 |
ideology | -5.637 |
Token | high |
Token ID | 1029 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
�� | +7.949 |
arthed | +7.491 |
�� | +7.475 |
JJ | +7.387 |
Reeves | +7.382 |
Neg logit contributions | |
� | -5.073 |
� | -4.540 |
policies | -3.834 |
institutions | -3.297 |
ideology | -3.250 |
Token | court |
Token ID | 2184 |
Feature activation | -6.21e+00 |
Pos logit contributions | |
�� | +2.253 |
�� | +2.125 |
arthed | +2.117 |
Blossom | +2.038 |
Remy | +2.029 |
Neg logit contributions | |
� | -2.300 |
� | -2.138 |
policies | -1.880 |
institutions | -1.699 |
ideology | -1.667 |
Token | . |
Token ID | 13 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
�� | +7.049 |
arthed | +6.578 |
�� | +6.541 |
JJ | +6.416 |
Remy | +6.414 |
Neg logit contributions | |
� | -6.052 |
� | -5.541 |
policies | -4.824 |
institutions | -4.323 |
ideology | -4.260 |
Token | icious |
Token ID | 6243 |
Feature activation | -2.67e+01 |
Pos logit contributions | |
�� | +20.684 |
arthed | +20.656 |
yne | +20.353 |
agle | +20.261 |
nox | +20.098 |
Neg logit contributions | |
� | -13.167 |
� | -12.438 |
policies | -10.773 |
institutions | -9.882 |
behavi | -9.778 |
Token | s |
Token ID | 82 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
yne | +28.161 |
arthed | +28.024 |
nox | +28.007 |
agle | +27.657 |
bris | +27.645 |
Neg logit contributions | |
� | -12.893 |
� | -12.374 |
policies | -10.361 |
behavi | -9.396 |
institutions | -9.155 |
Token | > |
Token ID | 29 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
�� | +21.383 |
arthed | +21.370 |
agle | +21.301 |
ometown | +21.199 |
ilver | +21.115 |
Neg logit contributions | |
� | -12.257 |
� | -11.854 |
policies | -10.096 |
behavi | -10.093 |
institutions | -9.067 |
Token | lol |
Token ID | 19462 |
Feature activation | -1.89e+01 |
Pos logit contributions | |
Remy | +22.640 |
JJ | +22.124 |
Blossom | +22.102 |
�� | +21.997 |
�� | +21.933 |
Neg logit contributions | |
� | -12.775 |
� | -11.009 |
policies | -9.549 |
institutions | -8.715 |
behavi | -7.989 |
Token | m |
Token ID | 285 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
�� | +20.185 |
�� | +19.526 |
Remy | +19.243 |
arthed | +19.041 |
yne | +18.941 |
Neg logit contributions | |
� | -13.318 |
� | -11.938 |
policies | -10.284 |
institutions | -9.540 |
governance | -8.788 |
Token | 2 |
Token ID | 17 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
�� | +19.716 |
�� | +19.363 |
arthed | +19.110 |
fg | +18.844 |
itsu | +18.465 |
Neg logit contributions | |
� | -19.226 |
� | -17.832 |
policies | -15.838 |
behavi | -15.436 |
institutions | -15.131 |
Token | k |
Token ID | 74 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
yne | +14.102 |
fg | +14.092 |
agle | +14.023 |
nova | +13.862 |
Blossom | +13.806 |
Neg logit contributions | |
� | -22.094 |
behavi | -20.796 |
� | -20.605 |
policies | -19.182 |
institutions | -18.654 |
Token | [ |
Token ID | 685 |
Feature activation | -3.83e+00 |
Pos logit contributions | |
�� | +11.099 |
�� | +10.476 |
Remy | +10.368 |
arthed | +10.317 |
yne | +10.218 |
Neg logit contributions | |
� | -10.549 |
� | -9.680 |
policies | -8.549 |
institutions | -8.007 |
climate | -7.581 |
Token | 10 |
Token ID | 940 |
Feature activation | -3.26e+01 |
Pos logit contributions | |
�� | +1.244 |
arthed | +1.187 |
yne | +1.134 |
�� | +1.080 |
Remy | +1.051 |
Neg logit contributions | |
� | -6.631 |
� | -6.389 |
policies | -6.051 |
institutions | -5.765 |
behavi | -5.748 |
Token | : |
Token ID | 25 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
666 | +22.759 |
fg | +22.022 |
agle | +22.022 |
zzo | +22.013 |
Blossom | +22.000 |
Neg logit contributions | |
behavi | -27.391 |
conflic | -21.359 |
policies | -19.246 |
practition | -19.196 |
� | -18.662 |
Token | 47 |
Token ID | 2857 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
�� | +20.438 |
arthed | +20.309 |
�� | +19.654 |
Blossom | +19.610 |
�� | +19.458 |
Neg logit contributions | |
� | -19.435 |
� | -17.806 |
policies | -16.826 |
governance | -15.098 |
climate | -15.087 |
Token | MY |
Token ID | 17615 |
Feature activation | -8.70e+00 |
Pos logit contributions | |
�� | +3.408 |
�� | +3.217 |
arthed | +3.149 |
Remy | +3.079 |
Blossom | +3.074 |
Neg logit contributions | |
� | -6.063 |
� | -5.717 |
policies | -5.279 |
institutions | -4.961 |
ideology | -4.858 |
Token | BASE |
Token ID | 49688 |
Feature activation | -4.48e+00 |
Pos logit contributions | |
�� | +6.745 |
Remy | +6.442 |
Blossom | +6.403 |
�� | +6.294 |
arthed | +6.267 |
Neg logit contributions | |
� | -10.668 |
� | -10.005 |
policies | -9.284 |
institutions | -8.762 |
governance | -8.513 |
Token | CH |
Token ID | 5870 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
�� | +4.642 |
�� | +4.424 |
arthed | +4.318 |
Remy | +4.270 |
Blossom | +4.261 |
Neg logit contributions | |
� | -4.809 |
� | -4.463 |
policies | -4.012 |
institutions | -3.715 |
climate | -3.585 |
Token | ILL |
Token ID | 8267 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
� | +1.919 |
� | +1.816 |
policies | +1.652 |
institutions | +1.550 |
climate | +1.526 |
Neg logit contributions | |
�� | -1.048 |
�� | -0.956 |
arthed | -0.944 |
yne | -0.901 |
Remy | -0.888 |
Token |
|
Token ID | 198 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
� | +3.782 |
� | +3.570 |
policies | +3.225 |
institutions | +3.011 |
climate | +2.967 |
Neg logit contributions | |
�� | -2.338 |
�� | -2.136 |
arthed | -2.118 |
yne | -2.020 |
Remy | -1.986 |
Token |
|
Token ID | 198 |
Feature activation | -4.77e+01 |
Pos logit contributions | |
� | +7.557 |
� | +6.685 |
policies | +4.173 |
| +3.585 |
climate | +3.246 |
Neg logit contributions | |
�� | -20.431 |
senal | -20.293 |
�� | -19.003 |
��極 | -18.832 |
everal | -18.736 |
Token | J |
Token ID | 41 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
nox | +38.948 |
fg | +38.585 |
agle | +38.522 |
zzy | +38.244 |
nova | +38.215 |
Neg logit contributions | |
� | -11.916 |
� | -11.687 |
policies | -11.396 |
behavi | -10.217 |
institutions | -9.361 |
Token | aaaa |
Token ID | 24794 |
Feature activation | -7.08e+00 |
Pos logit contributions | |
yne | +21.897 |
agle | +21.710 |
�� | +21.687 |
arthed | +21.647 |
ometown | +21.403 |
Neg logit contributions | |
� | -14.043 |
� | -13.159 |
policies | -11.513 |
institutions | -10.360 |
climate | -10.144 |
Token | asper |
Token ID | 32981 |
Feature activation | -2.15e+01 |
Pos logit contributions | |
�� | +5.395 |
arthed | +5.096 |
�� | +5.072 |
yne | +4.915 |
agle | +4.880 |
Neg logit contributions | |
� | -9.184 |
� | -8.774 |
policies | -8.052 |
institutions | -7.581 |
climate | -7.507 |
Token | Profile |
Token ID | 13118 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
�� | +23.776 |
�� | +23.755 |
agle | +23.324 |
666 | +23.290 |
arthed | +23.258 |
Neg logit contributions | |
� | -11.696 |
� | -11.211 |
policies | -9.668 |
institutions | -8.989 |
governance | -8.427 |
Token | Blog |
Token ID | 14001 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
Remy | +13.917 |
�� | +13.912 |
�� | +13.481 |
arthed | +13.346 |
ometown | +13.173 |
Neg logit contributions | |
� | -16.204 |
� | -15.009 |
policies | -13.678 |
institutions | -13.075 |
behavi | -12.452 |
Token | that |
Token ID | 326 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
�� | +2.562 |
�� | +2.432 |
arthed | +2.380 |
Remy | +2.336 |
yne | +2.312 |
Neg logit contributions | |
� | -3.236 |
� | -3.031 |
policies | -2.740 |
institutions | -2.538 |
climate | -2.472 |
Token | was |
Token ID | 373 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
� | +27.621 |
� | +25.846 |
policies | +22.038 |
climate | +21.214 |
policy | +20.954 |
Neg logit contributions | |
�� | -15.886 |
arthed | -14.606 |
�� | -13.878 |
�� | -13.821 |
��極 | -13.639 |
Token | when |
Token ID | 618 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
�� | +19.144 |
�� | +19.078 |
JJ | +18.907 |
Remy | +18.903 |
Blossom | +18.701 |
Neg logit contributions | |
� | -7.994 |
� | -6.976 |
policies | -6.357 |
institutions | -5.454 |
governance | -4.938 |
Token | I |
Token ID | 314 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
� | +2.219 |
� | +2.080 |
policies | +1.857 |
institutions | +1.719 |
climate | +1.688 |
Neg logit contributions | |
�� | -1.774 |
�� | -1.644 |
arthed | -1.630 |
yne | -1.569 |
Remy | -1.550 |
Token | wasn |
Token ID | 2492 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
zzo | +24.488 |
JJ | +24.094 |
�� | +24.023 |
Remy | +23.873 |
kissed | +23.873 |
Neg logit contributions | |
� | -6.793 |
� | -5.913 |
policies | -5.846 |
behavi | -5.555 |
institutions | -4.477 |
Token | � |
Token ID | 447 |
Feature activation | -3.78e+01 |
Pos logit contributions | |
� | +12.282 |
� | +11.002 |
policies | +8.294 |
| +7.876 |
institutions | +7.509 |
Neg logit contributions | |
�� | -14.596 |
senal | -13.842 |
�� | -13.301 |
��極 | -12.857 |
arthed | -12.809 |
Token | � |
Token ID | 247 |
Feature activation | -1.97e+01 |
Pos logit contributions | |
�� | +34.424 |
� | +33.528 |
�� | +32.844 |
� | +32.112 |
� | +32.095 |
Neg logit contributions | |
behavi | -16.678 |
� | -15.135 |
policies | -14.876 |
� | -14.469 |
climate | -13.637 |
Token | t |
Token ID | 83 |
Feature activation | -2.90e+01 |
Pos logit contributions | |
fg | +16.619 |
agle | +16.375 |
arthed | +16.188 |
yne | +16.046 |
zzo | +15.995 |
Neg logit contributions | |
� | -16.387 |
policies | -15.500 |
� | -15.451 |
behavi | -15.410 |
institutions | -14.263 |
Token | even |
Token ID | 772 |
Feature activation | -3.55e+01 |
Pos logit contributions | |
agle | +27.656 |
�� | +27.383 |
JJ | +27.362 |
coached | +27.321 |
yne | +27.155 |
Neg logit contributions | |
� | -13.769 |
� | -12.056 |
policies | -11.110 |
behavi | -9.765 |
institutions | -9.124 |
Token | really |
Token ID | 1107 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
Remy | +31.820 |
coached | +31.709 |
JJ | +31.617 |
flown | +31.027 |
Reeves | +30.873 |
Neg logit contributions | |
� | -13.783 |
� | -12.138 |
policies | -10.693 |
behavi | -10.328 |
modernization | -9.226 |
Token | playing |
Token ID | 2712 |
Feature activation | -9.92e+00 |
Pos logit contributions | |
JJ | +26.527 |
coached | +26.022 |
Remy | +26.007 |
flown | +25.847 |
zzo | +25.777 |
Neg logit contributions | |
� | -12.117 |
� | -10.482 |
policies | -9.793 |
behavi | -8.903 |
governance | -8.180 |
Token | more |
Token ID | 517 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
�� | +12.406 |
�� | +12.146 |
Remy | +12.069 |
arthed | +12.017 |
Blossom | +11.991 |
Neg logit contributions | |
� | -11.026 |
� | -10.212 |
policies | -8.732 |
ideology | -7.957 |
behavi | -7.841 |
Token | , |
Token ID | 11 |
Feature activation | -2.86e+01 |
Pos logit contributions | |
Remy | +17.013 |
Blossom | +16.978 |
Reeves | +16.717 |
JJ | +16.652 |
�� | +16.649 |
Neg logit contributions | |
� | -13.777 |
� | -12.290 |
policies | -10.570 |
behavi | -9.935 |
ideology | -9.631 |
Token | with |
Token ID | 351 |
Feature activation | -2.62e+01 |
Pos logit contributions | |
Blossom | +26.589 |
Reeves | +26.438 |
Remy | +26.404 |
JJ | +26.183 |
agle | +25.687 |
Neg logit contributions | |
� | -15.747 |
� | -13.933 |
policies | -11.367 |
behavi | -11.143 |
ideology | -10.114 |
Token | another |
Token ID | 1194 |
Feature activation | -2.71e+01 |
Pos logit contributions | |
Remy | +25.668 |
Reeves | +25.290 |
Blossom | +25.189 |
Dee | +24.529 |
JJ | +24.506 |
Neg logit contributions | |
� | -16.331 |
� | -14.089 |
behavi | -11.004 |
policies | -10.753 |
ideology | -9.794 |
Token | due |
Token ID | 2233 |
Feature activation | -2.70e+01 |
Pos logit contributions | |
Reeves | +24.832 |
Remy | +24.756 |
JJ | +24.628 |
Blossom | +24.551 |
Winchester | +24.077 |
Neg logit contributions | |
� | -16.921 |
� | -14.904 |
policies | -13.155 |
behavi | -12.664 |
institutions | -11.257 |
Token | out |
Token ID | 503 |
Feature activation | -4.54e+01 |
Pos logit contributions | |
Blossom | +23.180 |
Remy | +22.832 |
Reeves | +22.741 |
arthed | +22.618 |
agle | +22.053 |
Neg logit contributions | |
� | -18.315 |
� | -16.041 |
behavi | -13.761 |
policies | -13.733 |
institutions | -12.076 |
Token | this |
Token ID | 428 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
Reeves | +31.792 |
Blossom | +31.749 |
Remy | +31.690 |
Gomez | +30.898 |
JJ | +30.851 |
Neg logit contributions | |
� | -19.269 |
� | -16.120 |
behavi | -15.160 |
policies | -13.066 |
institutions | -11.463 |
Token | year |
Token ID | 614 |
Feature activation | -3.66e+01 |
Pos logit contributions | |
�� | +9.649 |
�� | +9.323 |
Blossom | +9.317 |
Reeves | +9.240 |
Remy | +9.198 |
Neg logit contributions | |
� | -13.274 |
� | -12.250 |
policies | -10.898 |
institutions | -10.114 |
behavi | -10.038 |
Token | . |
Token ID | 13 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
Blossom | +27.993 |
Remy | +27.706 |
Reeves | +27.675 |
zzo | +27.464 |
JJ | +27.397 |
Neg logit contributions | |
� | -18.950 |
� | -16.646 |
behavi | -15.077 |
policies | -14.504 |
governance | -13.205 |
Token | But |
Token ID | 887 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
Remy | +13.925 |
Blossom | +13.842 |
Reeves | +13.743 |
�� | +13.686 |
Gomez | +13.445 |
Neg logit contributions | |
� | -9.291 |
� | -8.299 |
policies | -7.779 |
behavi | -7.153 |
institutions | -6.995 |
Token | in |
Token ID | 287 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
Remy | +20.702 |
Blossom | +20.599 |
Reeves | +20.508 |
Gomez | +20.088 |
JJ | +19.946 |
Neg logit contributions | |
� | -15.450 |
� | -13.696 |
policies | -11.302 |
behavi | -11.058 |
ideology | -9.934 |
Token | { |
Token ID | 1391 |
Feature activation | -2.00e+01 |
Pos logit contributions | |
�� | +27.010 |
Remy | +26.567 |
�� | +26.069 |
agle | +25.765 |
JJ | +25.572 |
Neg logit contributions | |
� | -22.327 |
� | -20.030 |
policies | -17.068 |
institutions | -16.870 |
ideology | -15.989 |
Token | ( |
Token ID | 7 |
Feature activation | -9.62e+01 |
Pos logit contributions | |
666 | +16.205 |
fg | +15.559 |
Blossom | +15.355 |
yne | +15.352 |
135 | +15.327 |
Neg logit contributions | |
behavi | -18.220 |
� | -16.524 |
� | -16.208 |
policies | -16.069 |
institutions | -15.171 |
Token | 171 |
Token ID | 27192 |
Feature activation | -2.97e+01 |
Pos logit contributions | |
135 | +45.107 |
666 | +44.852 |
302 | +43.343 |
6 | +42.960 |
336 | +42.503 |
Neg logit contributions | |
behavi | -15.944 |
� | -13.762 |
policies | -12.319 |
� | -12.191 |
institutions | -11.708 |
Token | s |
Token ID | 82 |
Feature activation | -3.69e+01 |
Pos logit contributions | |
fg | +22.917 |
agle | +22.065 |
Blossom | +21.905 |
yne | +21.832 |
nova | +21.586 |
Neg logit contributions | |
behavi | -19.952 |
� | -19.760 |
� | -18.840 |
policies | -16.237 |
governance | -16.223 |
Token | )} |
Token ID | 38165 |
Feature activation | -3.04e+01 |
Pos logit contributions | |
Blossom | +24.921 |
agle | +24.734 |
arthed | +24.562 |
zzo | +24.519 |
fg | +24.320 |
Neg logit contributions | |
behavi | -25.250 |
� | -21.500 |
policies | -20.558 |
� | -20.176 |
ideology | -19.533 |
Token | 12 |
Token ID | 1105 |
Feature activation | -4.00e+01 |
Pos logit contributions | |
Remy | +27.991 |
Ned | +26.861 |
JJ | +26.732 |
�� | +26.498 |
Blossom | +26.184 |
Neg logit contributions | |
� | -17.501 |
� | -14.688 |
policies | -13.073 |
institutions | -12.536 |
ideology | -11.960 |
Token | . |
Token ID | 13 |
Feature activation | -4.45e+01 |
Pos logit contributions | |
Blossom | +26.698 |
666 | +26.247 |
fg | +26.017 |
JJ | +25.944 |
Remy | +25.819 |
Neg logit contributions | |
behavi | -26.365 |
conflic | -21.020 |
� | -19.708 |
policies | -19.219 |
ideology | -18.747 |
Token | Na |
Token ID | 11013 |
Feature activation | -3.03e+01 |
Pos logit contributions | |
Remy | +33.056 |
JJ | +32.333 |
Reeves | +32.091 |
Yose | +31.962 |
fg | +31.720 |
Neg logit contributions | |
� | -19.544 |
� | -16.202 |
behavi | -14.356 |
policies | -13.197 |
institutions | -13.102 |
Token | 3 |
Token ID | 18 |
Feature activation | -3.92e+01 |
Pos logit contributions | |
fg | +23.647 |
6 | +23.556 |
nox | +23.118 |
yne | +22.894 |
8 | +22.863 |
Neg logit contributions | |
� | -19.425 |
� | -18.558 |
behavi | -17.568 |
policies | -16.216 |
institutions | -15.564 |
Token | { |
Token ID | 1391 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
fg | +28.616 |
�� | +28.390 |
�� | +28.306 |
yne | +28.007 |
Remy | +27.787 |
Neg logit contributions | |
� | -21.802 |
� | -19.010 |
policies | -16.168 |
institutions | -16.078 |
behavi | -15.223 |
Token | ( |
Token ID | 7 |
Feature activation | -9.94e+01 |
Pos logit contributions | |
666 | +15.923 |
fg | +15.400 |
Blossom | +15.118 |
yne | +15.111 |
135 | +15.041 |
Neg logit contributions | |
behavi | -18.203 |
� | -16.657 |
� | -16.404 |
policies | -16.237 |
institutions | -15.374 |
Token | Virginia |
Token ID | 6025 |
Feature activation | +7.92e+00 |
Pos logit contributions | |
� | +2.044 |
� | +1.928 |
policies | +1.757 |
institutions | +1.646 |
climate | +1.620 |
Neg logit contributions | |
�� | -1.109 |
�� | -1.013 |
arthed | -0.999 |
yne | -0.952 |
Remy | -0.945 |
Token | . |
Token ID | 13 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
� | +9.885 |
� | +9.340 |
policies | +8.372 |
institutions | +7.756 |
climate | +7.715 |
Neg logit contributions | |
�� | -7.337 |
�� | -6.706 |
arthed | -6.647 |
yne | -6.415 |
��極 | -6.343 |
Token |
|
Token ID | 198 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
�� | +0.131 |
�� | +0.123 |
arthed | +0.122 |
Remy | +0.118 |
yne | +0.118 |
Neg logit contributions | |
� | -0.139 |
� | -0.130 |
policies | -0.116 |
institutions | -0.107 |
climate | -0.104 |
Token |
|
Token ID | 198 |
Feature activation | +4.28e-01 |
Pos logit contributions | |
� | +22.942 |
� | +21.047 |
| +16.479 |
| +14.733 |
policies | +14.700 |
Neg logit contributions | |
senal | -34.347 |
�� | -32.073 |
everal | -30.859 |
srf | -30.663 |
��極 | -28.560 |
Token | Del |
Token ID | 13856 |
Feature activation | -9.89e+00 |
Pos logit contributions | |
� | +0.504 |
� | +0.474 |
policies | +0.423 |
institutions | +0.391 |
climate | +0.383 |
Neg logit contributions | |
�� | -0.430 |
�� | -0.402 |
arthed | -0.399 |
yne | -0.385 |
Remy | -0.380 |
Token | . |
Token ID | 13 |
Feature activation | -3.87e+01 |
Pos logit contributions | |
�� | +8.215 |
�� | +7.787 |
arthed | +7.631 |
Remy | +7.560 |
yne | +7.509 |
Neg logit contributions | |
� | -11.718 |
� | -11.180 |
policies | -10.023 |
institutions | -9.312 |
climate | -9.098 |
Token | Todd |
Token ID | 14377 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
Gomez | +34.354 |
Remy | +34.309 |
Reeves | +33.780 |
�� | +33.477 |
Blossom | +33.289 |
Neg logit contributions | |
� | -15.013 |
� | -13.662 |
behavi | -12.608 |
policies | -12.500 |
institutions | -11.084 |
Token | Gilbert |
Token ID | 24023 |
Feature activation | -4.82e+00 |
Pos logit contributions | |
�� | +14.011 |
Remy | +13.584 |
Gomez | +13.516 |
�� | +13.426 |
Reeves | +13.353 |
Neg logit contributions | |
� | -14.167 |
� | -13.317 |
policies | -11.756 |
institutions | -10.901 |
behavi | -10.768 |
Token | ( |
Token ID | 357 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
�� | +5.669 |
�� | +5.458 |
arthed | +5.385 |
Remy | +5.317 |
yne | +5.284 |
Neg logit contributions | |
� | -4.419 |
� | -4.053 |
policies | -3.502 |
institutions | -3.218 |
climate | -3.095 |
Token | R |
Token ID | 49 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
�� | +6.605 |
arthed | +6.402 |
�� | +6.302 |
yne | +6.031 |
ometown | +5.957 |
Neg logit contributions | |
� | -13.549 |
� | -13.112 |
policies | -12.034 |
institutions | -11.387 |
ideology | -11.165 |
Token | - |
Token ID | 12 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
�� | +11.924 |
arthed | +11.455 |
�� | +11.018 |
ometown | +10.924 |
yne | +10.911 |
Neg logit contributions | |
� | -12.162 |
� | -11.484 |
policies | -10.327 |
institutions | -9.485 |
behavi | -9.133 |
Token | , |
Token ID | 11 |
Feature activation | -9.42e+00 |
Pos logit contributions | |
� | +10.522 |
� | +9.878 |
policies | +8.608 |
institutions | +8.013 |
climate | +7.929 |
Neg logit contributions | |
�� | -7.332 |
arthed | -6.743 |
�� | -6.674 |
yne | -6.373 |
�� | -6.272 |
Token | ending |
Token ID | 7464 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
�� | +12.324 |
�� | +11.913 |
Remy | +11.839 |
arthed | +11.754 |
Blossom | +11.715 |
Neg logit contributions | |
� | -6.093 |
� | -5.453 |
policies | -4.862 |
institutions | -4.185 |
ideology | -4.023 |
Token | it |
Token ID | 340 |
Feature activation | -9.12e+00 |
Pos logit contributions | |
Reeves | +25.125 |
JJ | +25.093 |
�� | +24.941 |
Remy | +24.920 |
Blossom | +24.801 |
Neg logit contributions | |
� | -13.311 |
� | -11.297 |
policies | -9.792 |
behavi | -8.828 |
institutions | -8.265 |
Token | with |
Token ID | 351 |
Feature activation | -4.07e+01 |
Pos logit contributions | |
�� | +10.821 |
�� | +10.465 |
Blossom | +10.214 |
Remy | +10.205 |
Reeves | +10.163 |
Neg logit contributions | |
� | -7.096 |
� | -6.488 |
policies | -5.953 |
institutions | -5.285 |
ideology | -5.033 |
Token | 3 |
Token ID | 513 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
Remy | +34.328 |
Blossom | +34.069 |
Reeves | +34.051 |
Grayson | +33.721 |
Gomez | +33.596 |
Neg logit contributions | |
� | -13.499 |
� | -10.496 |
behavi | -9.811 |
policies | -9.720 |
governance | -8.845 |
Token | , |
Token ID | 11 |
Feature activation | -1.15e+02 |
Pos logit contributions | |
�� | +12.659 |
�� | +12.309 |
yne | +12.028 |
Remy | +11.810 |
ometown | +11.760 |
Neg logit contributions | |
� | -12.285 |
� | -11.433 |
policies | -10.362 |
ideology | -9.737 |
behavi | -9.564 |
Token | 457 |
Token ID | 33032 |
Feature activation | -4.50e+00 |
Pos logit contributions | |
666 | +45.748 |
135 | +44.648 |
302 | +43.901 |
06 | +43.611 |
333 | +43.537 |
Neg logit contributions | |
� | -16.702 |
behavi | -15.754 |
� | -14.472 |
institutions | -13.620 |
policies | -13.403 |
Token | rushing |
Token ID | 15795 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
�� | +3.439 |
�� | +3.170 |
arthed | +3.127 |
yne | +3.058 |
Remy | +3.050 |
Neg logit contributions | |
� | -6.033 |
� | -5.652 |
policies | -5.240 |
institutions | -4.879 |
climate | -4.835 |
Token | yards |
Token ID | 5695 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
� | +3.218 |
� | +3.041 |
policies | +2.759 |
institutions | +2.585 |
climate | +2.545 |
Neg logit contributions | |
�� | -1.839 |
�� | -1.675 |
arthed | -1.657 |
yne | -1.580 |
Remy | -1.558 |
Token | and |
Token ID | 290 |
Feature activation | -3.65e+01 |
Pos logit contributions | |
�� | +17.890 |
�� | +17.794 |
Remy | +17.705 |
yne | +17.332 |
arthed | +17.203 |
Neg logit contributions | |
� | -7.201 |
� | -6.161 |
policies | -5.952 |
institutions | -5.079 |
behavi | -4.984 |
Token | 32 |
Token ID | 3933 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
Remy | +30.707 |
Reeves | +30.422 |
JJ | +30.213 |
Grayson | +29.974 |
Blossom | +29.937 |
Neg logit contributions | |
� | -15.343 |
� | -12.742 |
behavi | -12.280 |
policies | -11.176 |
governance | -9.473 |
Token | pic |
Token ID | 8301 |
Feature activation | -2.96e+01 |
Pos logit contributions | |
� | +16.138 |
� | +15.149 |
policies | +12.957 |
climate | +12.093 |
institutions | +12.037 |
Neg logit contributions | |
�� | -11.239 |
�� | -10.135 |
arthed | -9.941 |
��極 | -9.636 |
Canaver | -9.441 |
Token | . |
Token ID | 13 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
Blossom | +25.815 |
Gomez | +25.520 |
JJ | +25.463 |
Remy | +25.122 |
666 | +24.914 |
Neg logit contributions | |
behavi | -18.630 |
policies | -14.478 |
conflic | -13.912 |
institutions | -13.310 |
� | -13.180 |
Token | twitter |
Token ID | 6956 |
Feature activation | -4.38e+01 |
Pos logit contributions | |
Blossom | +12.938 |
agle | +12.913 |
arthed | +12.798 |
yne | +12.780 |
nox | +12.749 |
Neg logit contributions | |
behavi | -13.326 |
� | -13.010 |
policies | -12.967 |
� | -12.114 |
institutions | -11.854 |
Token | . |
Token ID | 13 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
666 | +30.715 |
Blossom | +30.014 |
135 | +29.921 |
fg | +29.852 |
JJ | +29.814 |
Neg logit contributions | |
behavi | -26.638 |
conflic | -21.336 |
practition | -19.544 |
policies | -17.785 |
� | -17.466 |
Token | com |
Token ID | 785 |
Feature activation | -2.15e+01 |
Pos logit contributions | |
zzo | +18.027 |
agle | +17.974 |
fg | +17.906 |
Blossom | +17.899 |
yne | +17.745 |
Neg logit contributions | |
behavi | -13.659 |
policies | -12.119 |
� | -11.600 |
ideology | -10.846 |
� | -10.835 |
Token | / |
Token ID | 14 |
Feature activation | -1.24e+02 |
Pos logit contributions | |
666 | +20.588 |
Blossom | +20.373 |
yne | +20.169 |
JJ | +20.139 |
agle | +20.043 |
Neg logit contributions | |
behavi | -15.102 |
policies | -12.610 |
� | -12.037 |
ideology | -11.670 |
institutions | -11.524 |
Token | xx |
Token ID | 5324 |
Feature activation | -1.14e+02 |
Pos logit contributions | |
fg | +46.221 |
yx | +44.972 |
yne | +44.790 |
6 | +43.770 |
uo | +43.716 |
Neg logit contributions | |
behavi | -14.654 |
policies | -13.755 |
� | -13.700 |
� | -13.608 |
climate | -12.423 |
Token | A |
Token ID | 32 |
Feature activation | -6.64e+01 |
Pos logit contributions | |
fg | +45.528 |
yx | +44.536 |
yne | +44.402 |
zzy | +43.765 |
uo | +43.438 |
Neg logit contributions | |
behavi | -14.767 |
� | -13.782 |
� | -13.681 |
policies | -13.357 |
climate | -12.261 |
Token | II |
Token ID | 3978 |
Feature activation | -9.05e+01 |
Pos logit contributions | |
fg | +42.005 |
zzy | +41.963 |
yx | +41.507 |
agle | +41.467 |
zzo | +41.344 |
Neg logit contributions | |
� | -12.376 |
� | -12.266 |
policies | -12.024 |
behavi | -11.838 |
institutions | -10.429 |
Token | 1 |
Token ID | 16 |
Feature activation | -1.01e+02 |
Pos logit contributions | |
fg | +45.355 |
yne | +44.210 |
yx | +43.581 |
zzy | +43.223 |
zzo | +43.124 |
Neg logit contributions | |
behavi | -14.021 |
� | -13.095 |
� | -12.890 |
policies | -12.457 |
climate | -11.592 |
Token | k |
Token ID | 74 |
Feature activation | -1.01e+02 |
Pos logit contributions | |
fg | +45.210 |
yne | +44.548 |
yx | +44.180 |
zzy | +43.226 |
uo | +43.168 |
Neg logit contributions | |
behavi | -13.422 |
� | -13.337 |
� | -13.122 |
policies | -12.924 |
institutions | -11.529 |
Token | . |
Token ID | 13 |
Feature activation | -4.51e+01 |
Pos logit contributions | |
Blossom | +27.414 |
Remy | +27.263 |
fg | +27.231 |
JJ | +27.215 |
666 | +27.212 |
Neg logit contributions | |
behavi | -28.014 |
conflic | -22.594 |
practition | -20.292 |
� | -19.644 |
policies | -19.544 |
Token | Q |
Token ID | 1195 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
Remy | +32.987 |
JJ | +32.383 |
Reeves | +32.229 |
Yose | +31.952 |
Ng | +31.638 |
Neg logit contributions | |
� | -19.788 |
� | -16.346 |
behavi | -14.665 |
policies | -13.365 |
institutions | -13.238 |
Token | e |
Token ID | 68 |
Feature activation | -3.28e+01 |
Pos logit contributions | |
fg | +31.828 |
dd | +30.864 |
yne | +30.249 |
fx | +30.045 |
yx | +30.032 |
Neg logit contributions | |
� | -19.759 |
behavi | -19.155 |
� | -18.580 |
policies | -16.643 |
institutions | -16.079 |
Token | 1 |
Token ID | 16 |
Feature activation | -3.41e+01 |
Pos logit contributions | |
6 | +23.661 |
agle | +22.873 |
8 | +22.581 |
yne | +22.482 |
zzo | +22.464 |
Neg logit contributions | |
� | -22.110 |
behavi | -21.458 |
� | -21.172 |
policies | -18.971 |
institutions | -18.364 |
Token | { |
Token ID | 1391 |
Feature activation | -2.33e+01 |
Pos logit contributions | |
�� | +25.437 |
�� | +25.423 |
fg | +25.194 |
Remy | +25.072 |
yne | +25.003 |
Neg logit contributions | |
� | -21.716 |
� | -19.560 |
policies | -16.626 |
institutions | -16.280 |
behavi | -15.583 |
Token | ( |
Token ID | 7 |
Feature activation | -1.03e+02 |
Pos logit contributions | |
666 | +19.509 |
fg | +18.781 |
135 | +18.415 |
Blossom | +18.331 |
yne | +18.317 |
Neg logit contributions | |
behavi | -19.586 |
� | -16.563 |
policies | -16.451 |
� | -16.136 |
institutions | -15.510 |
Token | 132 |
Token ID | 19924 |
Feature activation | -2.70e+01 |
Pos logit contributions | |
666 | +45.840 |
135 | +45.124 |
302 | +43.885 |
333 | +43.413 |
336 | +43.331 |
Neg logit contributions | |
behavi | -16.893 |
� | -13.916 |
policies | -12.851 |
� | -12.577 |
institutions | -12.556 |
Token | s |
Token ID | 82 |
Feature activation | -3.92e+01 |
Pos logit contributions | |
fg | +20.039 |
agle | +19.029 |
Blossom | +18.891 |
nova | +18.802 |
yne | +18.775 |
Neg logit contributions | |
behavi | -20.829 |
� | -20.807 |
� | -19.708 |
ideology | -17.308 |
policies | -17.279 |
Token | )} |
Token ID | 38165 |
Feature activation | -4.54e+01 |
Pos logit contributions | |
agle | +25.169 |
Blossom | +25.056 |
fg | +24.666 |
zzo | +24.585 |
arthed | +24.585 |
Neg logit contributions | |
behavi | -26.900 |
� | -22.727 |
policies | -21.491 |
� | -21.211 |
ideology | -20.572 |
Token | B |
Token ID | 347 |
Feature activation | -5.06e+01 |
Pos logit contributions | |
Remy | +33.969 |
Reeves | +33.492 |
JJ | +33.487 |
Ned | +32.833 |
Yose | +32.803 |
Neg logit contributions | |
� | -19.062 |
� | -15.792 |
behavi | -14.447 |
policies | -13.141 |
institutions | -12.877 |
Token | d |
Token ID | 67 |
Feature activation | -3.67e+01 |
Pos logit contributions | |
fg | +36.213 |
dd | +34.509 |
fx | +34.051 |
xd | +33.071 |
agle | +32.779 |
Neg logit contributions | |
� | -19.291 |
behavi | -18.610 |
� | -17.992 |
policies | -15.840 |
climate | -15.630 |
Token | . |
Token ID | 13 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
666 | +29.736 |
yx | +28.852 |
135 | +28.682 |
zzo | +28.524 |
Blossom | +28.509 |
Neg logit contributions | |
behavi | -32.421 |
conflic | -27.381 |
practition | -25.216 |
� | -24.699 |
cumbers | -20.867 |
Token | x |
Token ID | 87 |
Feature activation | -3.33e+01 |
Pos logit contributions | |
yne | +16.548 |
zzo | +16.215 |
yx | +16.204 |
fg | +16.027 |
nox | +15.910 |
Neg logit contributions | |
behavi | -22.851 |
� | -20.106 |
policies | -19.445 |
� | -19.145 |
institutions | -18.443 |
Token | . |
Token ID | 13 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
yne | +24.075 |
zzo | +23.900 |
666 | +23.592 |
agle | +23.528 |
fg | +23.300 |
Neg logit contributions | |
behavi | -25.753 |
conflic | -19.915 |
policies | -19.474 |
� | -19.058 |
institutions | -18.021 |
Token | 99 |
Token ID | 2079 |
Feature activation | -2.60e+01 |
Pos logit contributions | |
� | +2.052 |
� | +1.957 |
policies | +1.810 |
institutions | +1.720 |
climate | +1.695 |
Neg logit contributions | |
�� | -0.627 |
�� | -0.545 |
arthed | -0.538 |
yne | -0.503 |
Remy | -0.482 |
Token | 10 |
Token ID | 838 |
Feature activation | -6.17e+01 |
Pos logit contributions | |
Remy | +25.676 |
JJ | +24.937 |
arthed | +24.894 |
Reeves | +24.820 |
Blossom | +24.800 |
Neg logit contributions | |
� | -13.454 |
behavi | -12.423 |
policies | -11.923 |
� | -11.618 |
institutions | -11.286 |
Token | 88 |
Token ID | 3459 |
Feature activation | -9.07e+01 |
Pos logit contributions | |
666 | +40.955 |
336 | +38.290 |
678 | +38.118 |
333 | +37.992 |
135 | +37.984 |
Neg logit contributions | |
behavi | -24.187 |
policies | -17.215 |
institutions | -16.934 |
governance | -16.730 |
� | -16.478 |
Token | 350 |
Token ID | 14877 |
Feature activation | -2.19e+01 |
Pos logit contributions | |
666 | +44.829 |
135 | +43.545 |
302 | +42.408 |
333 | +42.260 |
336 | +42.153 |
Neg logit contributions | |
behavi | -18.186 |
� | -16.860 |
policies | -14.792 |
� | -14.789 |
institutions | -14.651 |
Token | x |
Token ID | 2124 |
Feature activation | -4.05e+01 |
Pos logit contributions | |
Remy | +15.815 |
Xander | +15.375 |
Blossom | +15.035 |
JJ | +14.996 |
Reeves | +14.872 |
Neg logit contributions | |
� | -20.583 |
behavi | -18.739 |
� | -18.526 |
policies | -17.762 |
institutions | -17.256 |
Token | . |
Token ID | 13 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
666 | +27.520 |
135 | +26.836 |
fg | +26.435 |
Blossom | +26.189 |
6 | +26.093 |
Neg logit contributions | |
behavi | -27.426 |
conflic | -22.970 |
practition | -20.003 |
� | -19.431 |
policies | -19.103 |
Token | x |
Token ID | 87 |
Feature activation | -4.14e+01 |
Pos logit contributions | |
fg | +20.410 |
yne | +20.321 |
yx | +20.233 |
zzo | +20.188 |
nox | +19.878 |
Neg logit contributions | |
behavi | -22.984 |
� | -19.073 |
policies | -18.729 |
� | -18.247 |
institutions | -17.749 |
Token | . |
Token ID | 13 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
666 | +27.649 |
fg | +27.093 |
yne | +27.055 |
yx | +27.029 |
zzo | +26.911 |
Neg logit contributions | |
behavi | -29.445 |
conflic | -24.047 |
practition | -20.896 |
� | -20.617 |
policies | -20.156 |
Token | . |
Token ID | 13 |
Feature activation | -2.80e+01 |
Pos logit contributions | |
666 | +30.226 |
Blossom | +29.447 |
135 | +29.428 |
JJ | +29.114 |
fg | +29.091 |
Neg logit contributions | |
behavi | -32.148 |
conflic | -27.288 |
practition | -26.130 |
� | -24.653 |
cumbers | -21.392 |
Token | com |
Token ID | 785 |
Feature activation | -2.72e+01 |
Pos logit contributions | |
fg | +21.587 |
zzo | +21.444 |
666 | +21.378 |
agle | +21.286 |
yne | +21.066 |
Neg logit contributions | |
behavi | -23.851 |
policies | -18.801 |
conflic | -17.630 |
ideology | -17.360 |
� | -17.332 |
Token | / |
Token ID | 14 |
Feature activation | -1.17e+02 |
Pos logit contributions | |
666 | +21.636 |
Blossom | +21.491 |
JJ | +20.948 |
yne | +20.829 |
135 | +20.816 |
Neg logit contributions | |
behavi | -22.268 |
conflic | -17.068 |
policies | -17.027 |
� | -16.244 |
ideology | -16.203 |
Token | W |
Token ID | 54 |
Feature activation | -8.91e+01 |
Pos logit contributions | |
fg | +45.850 |
yne | +44.519 |
yx | +44.518 |
uo | +43.338 |
6 | +43.318 |
Neg logit contributions | |
behavi | -15.019 |
� | -14.275 |
� | -14.267 |
policies | -13.957 |
climate | -12.620 |
Token | 8 |
Token ID | 23 |
Feature activation | -1.01e+02 |
Pos logit contributions | |
fg | +45.340 |
yne | +43.234 |
yx | +43.232 |
zzy | +42.659 |
agle | +42.390 |
Neg logit contributions | |
behavi | -14.749 |
� | -14.437 |
� | -14.364 |
policies | -13.710 |
climate | -12.360 |
Token | v |
Token ID | 85 |
Feature activation | -9.91e+01 |
Pos logit contributions | |
fg | +45.055 |
yne | +44.217 |
yx | +44.158 |
zzy | +43.228 |
uo | +42.934 |
Neg logit contributions | |
behavi | -13.995 |
� | -13.933 |
� | -13.901 |
policies | -13.355 |
climate | -11.958 |
Token | X |
Token ID | 55 |
Feature activation | -1.00e+02 |
Pos logit contributions | |
fg | +45.130 |
yne | +43.364 |
zzy | +42.936 |
dd | +42.851 |
6 | +42.820 |
Neg logit contributions | |
behavi | -14.992 |
� | -14.004 |
� | -14.002 |
policies | -13.574 |
climate | -12.231 |
Token | Ds |
Token ID | 30832 |
Feature activation | -1.00e+02 |
Pos logit contributions | |
fg | +45.593 |
yx | +43.883 |
yne | +43.861 |
zzy | +42.860 |
uo | +42.741 |
Neg logit contributions | |
behavi | -15.163 |
� | -14.212 |
� | -14.120 |
policies | -13.554 |
climate | -12.322 |
Token | 4 |
Token ID | 19 |
Feature activation | -9.92e+01 |
Pos logit contributions | |
fg | +45.309 |
yx | +43.719 |
yne | +43.655 |
zzy | +43.137 |
6 | +42.865 |
Neg logit contributions | |
behavi | -15.206 |
� | -13.965 |
� | -13.929 |
policies | -13.432 |
climate | -12.377 |
Token | j |
Token ID | 73 |
Feature activation | -1.10e+02 |
Pos logit contributions | |
fg | +45.115 |
yne | +44.309 |
yx | +44.051 |
zzy | +43.014 |
uo | +42.914 |
Neg logit contributions | |
� | -13.883 |
behavi | -13.773 |
� | -13.603 |
policies | -13.179 |
climate | -11.869 |
Token | 0 |
Token ID | 15 |
Feature activation | -9.11e+01 |
Pos logit contributions | |
fg | +45.636 |
yne | +43.778 |
yx | +43.626 |
6 | +43.103 |
zzy | +42.986 |
Neg logit contributions | |
behavi | -15.545 |
� | -14.401 |
� | -14.126 |
policies | -13.782 |
climate | -12.267 |