Token | SR |
Token ID | 12562 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
u | +13.874 |
- | +13.488 |
ia | +12.475 |
. | +12.436 |
ire | +12.106 |
Neg logit contributions | |
disparate | -15.452 |
relentless | -14.910 |
newer | -14.838 |
venerable | -14.830 |
totality | -14.665 |
Token | . |
Token ID | 13 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
. | +31.298 |
- | +29.330 |
u | +28.508 |
ag | +25.972 |
ia | +25.811 |
Neg logit contributions | |
disparate | -18.152 |
relentless | -17.873 |
gradual | -17.467 |
anecdotal | -17.446 |
blatant | -17.300 |
Token | Width |
Token ID | 30916 |
Feature activation | +9.98e+00 |
Pos logit contributions | |
u | +0.448 |
- | +0.434 |
acy | +0.405 |
ia | +0.396 |
ine | +0.390 |
Neg logit contributions | |
disparate | -0.991 |
relentless | -0.969 |
venerable | -0.969 |
newer | -0.967 |
blatant | -0.962 |
Token | ), |
Token ID | 828 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
- | +22.508 |
. | +21.067 |
u | +20.626 |
/ | +18.651 |
acy | +18.574 |
Neg logit contributions | |
disparate | -15.498 |
relentless | -15.137 |
venerable | -15.124 |
blatant | -14.811 |
spontaneous | -14.597 |
Token | ($ |
Token ID | 16763 |
Feature activation | +9.08e+00 |
Pos logit contributions | |
u | +2.017 |
- | +2.003 |
acy | +1.808 |
ia | +1.787 |
. | +1.763 |
Neg logit contributions | |
disparate | -4.399 |
relentless | -4.278 |
blatant | -4.276 |
venerable | -4.266 |
gradual | -4.255 |
Token | SR |
Token ID | 12562 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
u | +16.056 |
- | +15.677 |
. | +14.347 |
ia | +14.179 |
id | +13.910 |
Neg logit contributions | |
disparate | -20.223 |
totality | -19.849 |
venerable | -19.782 |
newer | -19.656 |
relentless | -19.369 |
Token | . |
Token ID | 13 |
Feature activation | +2.26e+00 |
Pos logit contributions | |
. | +32.026 |
- | +28.163 |
u | +24.239 |
' | +23.648 |
_ | +22.626 |
Neg logit contributions | |
tremend | -47.953 |
mathemat | -42.785 |
metic | -41.869 |
cumbers | -41.778 |
hemor | -41.467 |
Token | Height |
Token ID | 23106 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
- | +3.380 |
u | +3.346 |
ia | +3.000 |
. | +2.986 |
acy | +2.977 |
Neg logit contributions | |
disparate | -7.288 |
relentless | -7.113 |
venerable | -7.110 |
newer | -7.059 |
anecdotal | -7.053 |
Token | ))) |
Token ID | 22305 |
Feature activation | +2.92e+00 |
Pos logit contributions | |
- | +22.621 |
u | +21.338 |
. | +21.276 |
ine | +19.503 |
acy | +19.488 |
Neg logit contributions | |
disparate | -16.030 |
relentless | -16.020 |
venerable | -15.835 |
blatant | -15.663 |
anecdotal | -15.587 |
Token | ) |
Token ID | 1267 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
- | +6.783 |
u | +6.611 |
. | +6.385 |
ia | +6.226 |
acy | +6.197 |
Neg logit contributions | |
disparate | -6.488 |
anecdotal | -6.344 |
relentless | -6.331 |
venerable | -6.285 |
blatant | -6.203 |
Token | } |
Token ID | 1782 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
- | +0.874 |
u | +0.868 |
acy | +0.814 |
. | +0.808 |
ia | +0.803 |
Neg logit contributions | |
disparate | -1.187 |
relentless | -1.159 |
venerable | -1.154 |
anecdotal | -1.153 |
blatant | -1.153 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
u | +16.262 |
- | +15.352 |
. | +15.078 |
ia | +14.842 |
ine | +14.754 |
Neg logit contributions | |
tremend | -27.361 |
hemor | -26.233 |
mathemat | -26.068 |
venerable | -25.935 |
disparate | -25.785 |
Token | = |
Token ID | 796 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
. | +19.825 |
- | +19.212 |
u | +19.212 |
ia | +17.707 |
ine | +17.558 |
Neg logit contributions | |
disparate | -18.222 |
anecdotal | -17.630 |
relentless | -17.148 |
venerable | -17.051 |
blatant | -17.007 |
Token | [ |
Token ID | 685 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
disparate | +5.585 |
blatant | +5.439 |
newer | +5.421 |
relentless | +5.418 |
various | +5.411 |
Neg logit contributions | |
u | -5.915 |
- | -5.807 |
acy | -5.707 |
ia | -5.535 |
ine | -5.480 |
Token | system |
Token ID | 10057 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
u | +3.048 |
- | +2.986 |
acy | +2.700 |
ia | +2.630 |
ine | +2.628 |
Neg logit contributions | |
disparate | -6.902 |
newer | -6.783 |
relentless | -6.774 |
blatant | -6.772 |
gradual | -6.769 |
Token | . |
Token ID | 13 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
. | +30.075 |
- | +26.213 |
u | +23.662 |
' | +22.268 |
_ | +21.004 |
Neg logit contributions | |
tremend | -44.861 |
cumbers | -40.424 |
mathemat | -40.370 |
hemor | -39.571 |
metic | -39.275 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
u | +7.499 |
- | +7.446 |
. | +6.862 |
ine | +6.830 |
id | +6.756 |
Neg logit contributions | |
disparate | -9.095 |
relentless | -8.961 |
totality | -8.924 |
blatant | -8.905 |
gradual | -8.876 |
Token | ing |
Token ID | 278 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
ing | +26.385 |
- | +24.464 |
. | +23.515 |
u | +22.334 |
er | +21.711 |
Neg logit contributions | |
tremend | -46.461 |
cumbers | -42.389 |
mathemat | -42.218 |
metic | -41.477 |
hemor | -40.954 |
Token | . |
Token ID | 13 |
Feature activation | -2.67e+00 |
Pos logit contributions | |
. | +26.915 |
- | +23.484 |
u | +20.042 |
' | +19.890 |
/ | +18.497 |
Neg logit contributions | |
tremend | -42.301 |
cumbers | -37.362 |
mathemat | -37.246 |
hemor | -36.664 |
eleph | -36.366 |
Token | String |
Token ID | 10100 |
Feature activation | +7.32e+00 |
Pos logit contributions | |
disparate | +7.775 |
newer | +7.667 |
various | +7.663 |
blatant | +7.632 |
genuine | +7.596 |
Neg logit contributions | |
u | -4.481 |
acy | -4.372 |
- | -4.302 |
ia | -4.122 |
aga | -4.104 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
- | +12.639 |
. | +11.998 |
u | +11.784 |
ine | +11.335 |
ade | +10.762 |
Neg logit contributions | |
disparate | -17.617 |
venerable | -17.299 |
relentless | -17.254 |
totality | -17.173 |
anecdotal | -17.112 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
u | +16.112 |
- | +16.004 |
. | +15.519 |
ine | +15.106 |
id | +15.033 |
Neg logit contributions | |
tremend | -27.649 |
hemor | -27.186 |
venerable | -26.364 |
disparate | -26.317 |
cumbers | -26.187 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
- | +18.484 |
u | +18.299 |
. | +18.219 |
id | +17.546 |
ia | +17.348 |
Neg logit contributions | |
tremend | -29.681 |
hemor | -28.198 |
mathemat | -27.659 |
cumbers | -27.585 |
venerable | -26.892 |
Token | = |
Token ID | 796 |
Feature activation | +3.42e+00 |
Pos logit contributions | |
. | +21.181 |
- | +20.291 |
u | +19.366 |
' | +17.257 |
ia | +17.246 |
Neg logit contributions | |
tremend | -29.737 |
mathemat | -28.120 |
hemor | -26.912 |
cumbers | -25.625 |
metic | -25.167 |
Token | [ |
Token ID | 685 |
Feature activation | +6.39e+00 |
Pos logit contributions | |
- | +6.693 |
u | +6.429 |
. | +6.319 |
acy | +5.671 |
id | +5.653 |
Neg logit contributions | |
disparate | -8.544 |
venerable | -8.475 |
blatant | -8.467 |
theless | -8.403 |
relentless | -8.403 |
Token | system |
Token ID | 10057 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
u | +7.615 |
- | +7.501 |
. | +6.871 |
ine | +6.301 |
id | +6.279 |
Neg logit contributions | |
disparate | -19.885 |
hemor | -19.835 |
mathemat | -19.786 |
totality | -19.703 |
blatant | -19.694 |
Token | . |
Token ID | 13 |
Feature activation | +6.25e+00 |
Pos logit contributions | |
. | +30.792 |
- | +27.115 |
u | +23.943 |
' | +23.130 |
s | +21.474 |
Neg logit contributions | |
tremend | -45.980 |
cumbers | -41.495 |
mathemat | -41.378 |
hemor | -39.995 |
metic | -39.932 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
- | +11.121 |
u | +11.084 |
. | +10.401 |
id | +10.089 |
ine | +10.053 |
Neg logit contributions | |
mathemat | -16.597 |
tremend | -16.422 |
disparate | -16.227 |
venerable | -16.186 |
totality | -16.063 |
Token | ing |
Token ID | 278 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
ing | +26.179 |
- | +24.233 |
. | +23.162 |
u | +22.332 |
ling | +21.360 |
Neg logit contributions | |
tremend | -47.124 |
mathemat | -42.999 |
cumbers | -42.958 |
metic | -42.348 |
hemor | -41.535 |
Token | . |
Token ID | 13 |
Feature activation | +4.39e+00 |
Pos logit contributions | |
. | +28.065 |
- | +24.555 |
u | +21.112 |
' | +21.058 |
/ | +19.593 |
Neg logit contributions | |
tremend | -43.436 |
cumbers | -38.572 |
mathemat | -38.538 |
hemor | -37.572 |
eleph | -37.285 |
Token | String |
Token ID | 10100 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
- | +4.996 |
u | +4.965 |
. | +4.448 |
ine | +4.095 |
id | +4.004 |
Neg logit contributions | |
disparate | -15.049 |
relentless | -15.043 |
venerable | -14.951 |
totality | -14.938 |
mathemat | -14.822 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
- | +19.444 |
. | +19.023 |
al | +17.913 |
u | +17.232 |
' | +16.603 |
Neg logit contributions | |
tremend | -39.750 |
mathemat | -36.334 |
hemor | -35.672 |
metic | -34.673 |
cumbers | -33.992 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
u | +17.433 |
- | +17.044 |
. | +16.911 |
ia | +16.185 |
ire | +16.182 |
Neg logit contributions | |
tremend | -28.815 |
hemor | -27.875 |
cumbers | -27.300 |
mathemat | -26.907 |
disparate | -26.806 |
Token | image |
Token ID | 9060 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
disparate | +0.067 |
newer | +0.066 |
various | +0.066 |
relentless | +0.066 |
blatant | +0.066 |
Neg logit contributions | |
u | -0.026 |
- | -0.024 |
acy | -0.023 |
ia | -0.023 |
ine | -0.022 |
Token | = |
Token ID | 796 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
. | +23.367 |
- | +22.562 |
u | +21.745 |
ate | +20.659 |
ia | +20.636 |
Neg logit contributions | |
disparate | -15.534 |
venerable | -14.935 |
relentless | -14.706 |
anecdotal | -14.655 |
stringent | -14.655 |
Token | [ |
Token ID | 685 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
disparate | +2.680 |
blatant | +2.622 |
relentless | +2.616 |
gradual | +2.591 |
venerable | +2.590 |
Neg logit contributions | |
u | -2.853 |
- | -2.828 |
acy | -2.731 |
ia | -2.669 |
ine | -2.637 |
Token | System |
Token ID | 11964 |
Feature activation | +1.81e+01 |
Pos logit contributions | |
u | +4.816 |
- | +4.697 |
ia | +4.157 |
. | +4.073 |
ine | +4.039 |
Neg logit contributions | |
disparate | -11.441 |
gradual | -11.307 |
relentless | -11.290 |
blatant | -11.236 |
newer | -11.211 |
Token | . |
Token ID | 13 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
. | +28.742 |
- | +24.774 |
u | +22.304 |
' | +20.916 |
| +19.596 |
Neg logit contributions | |
tremend | -43.060 |
mathemat | -39.177 |
cumbers | -37.917 |
hemor | -37.887 |
eleph | -37.512 |
Token | Draw |
Token ID | 25302 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
u | +6.281 |
- | +6.178 |
ia | +5.503 |
ine | +5.480 |
. | +5.443 |
Neg logit contributions | |
disparate | -14.537 |
gradual | -14.414 |
totality | -14.380 |
relentless | -14.316 |
venerable | -14.296 |
Token | ing |
Token ID | 278 |
Feature activation | +1.57e+01 |
Pos logit contributions | |
ing | +26.163 |
- | +24.032 |
. | +23.359 |
u | +22.365 |
er | +21.580 |
Neg logit contributions | |
tremend | -45.039 |
mathemat | -41.190 |
cumbers | -40.428 |
metic | -39.427 |
eleph | -39.369 |
Token | . |
Token ID | 13 |
Feature activation | +3.40e+00 |
Pos logit contributions | |
. | +26.260 |
- | +22.596 |
u | +19.621 |
' | +19.131 |
ia | +17.922 |
Neg logit contributions | |
tremend | -39.835 |
mathemat | -35.017 |
hemor | -34.056 |
eleph | -33.934 |
cumbers | -33.673 |
Token | Graphics |
Token ID | 18172 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
u | +7.016 |
- | +6.995 |
ia | +6.535 |
ine | +6.533 |
acy | +6.509 |
Neg logit contributions | |
disparate | -8.405 |
relentless | -8.269 |
totality | -8.245 |
venerable | -8.219 |
anecdotal | -8.216 |
Token | ] |
Token ID | 60 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
. | +28.124 |
- | +27.340 |
u | +26.723 |
ine | +25.428 |
ia | +25.050 |
Neg logit contributions | |
venerable | -16.756 |
disparate | -16.707 |
theless | -16.620 |
gradual | -16.490 |
relentless | -16.328 |
Token | :: |
Token ID | 3712 |
Feature activation | +6.66e+00 |
Pos logit contributions | |
- | +14.221 |
. | +14.197 |
u | +12.602 |
' | +11.806 |
ia | +11.349 |
Neg logit contributions | |
tremend | -28.423 |
mathemat | -26.408 |
hemor | -25.994 |
cumbers | -25.515 |
undermin | -25.287 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
u | +17.564 |
- | +16.995 |
. | +16.672 |
id | +16.455 |
ine | +16.261 |
Neg logit contributions | |
tremend | -28.120 |
mathemat | -27.529 |
hemor | -26.948 |
venerable | -26.449 |
disparate | -26.338 |
Token | = |
Token ID | 796 |
Feature activation | -3.62e-02 |
Pos logit contributions | |
. | +23.386 |
- | +21.772 |
u | +21.203 |
ia | +19.666 |
ine | +19.349 |
Neg logit contributions | |
disparate | -18.512 |
anecdotal | -18.211 |
relentless | -17.619 |
venerable | -17.572 |
gradual | -17.433 |
Token | [ |
Token ID | 685 |
Feature activation | +3.54e+00 |
Pos logit contributions | |
disparate | +0.083 |
blatant | +0.081 |
relentless | +0.080 |
gradual | +0.080 |
anecdotal | +0.080 |
Neg logit contributions | |
u | -0.087 |
- | -0.086 |
acy | -0.083 |
ia | -0.082 |
ine | -0.081 |
Token | system |
Token ID | 10057 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
u | +4.763 |
- | +4.643 |
acy | +4.156 |
ia | +4.078 |
. | +4.058 |
Neg logit contributions | |
disparate | -11.471 |
newer | -11.299 |
gradual | -11.289 |
relentless | -11.255 |
blatant | -11.241 |
Token | . |
Token ID | 13 |
Feature activation | +4.56e+00 |
Pos logit contributions | |
. | +29.875 |
- | +26.110 |
u | +23.382 |
' | +22.272 |
_ | +20.852 |
Neg logit contributions | |
tremend | -44.808 |
mathemat | -40.447 |
cumbers | -40.412 |
hemor | -39.520 |
metic | -39.228 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
u | +9.083 |
- | +8.995 |
. | +8.413 |
ine | +8.275 |
id | +8.218 |
Neg logit contributions | |
disparate | -11.640 |
venerable | -11.492 |
totality | -11.465 |
relentless | -11.421 |
blatant | -11.389 |
Token | ing |
Token ID | 278 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
ing | +25.995 |
- | +24.277 |
. | +23.348 |
u | +22.073 |
er | +21.408 |
Neg logit contributions | |
tremend | -45.991 |
cumbers | -41.973 |
mathemat | -41.913 |
metic | -40.952 |
hemor | -40.478 |
Token | . |
Token ID | 13 |
Feature activation | -3.64e-01 |
Pos logit contributions | |
. | +26.087 |
- | +22.798 |
u | +19.548 |
' | +19.363 |
/ | +17.869 |
Neg logit contributions | |
tremend | -41.444 |
mathemat | -36.843 |
cumbers | -36.575 |
hemor | -36.069 |
eleph | -35.521 |
Token | String |
Token ID | 10100 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
disparate | +1.124 |
newer | +1.108 |
relentless | +1.102 |
various | +1.100 |
venerable | +1.096 |
Neg logit contributions | |
u | -0.609 |
- | -0.589 |
acy | -0.562 |
ine | -0.543 |
ia | -0.543 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
- | +17.165 |
. | +16.648 |
u | +15.660 |
al | +15.393 |
ine | +14.961 |
Neg logit contributions | |
disparate | -21.501 |
venerable | -21.437 |
totality | -21.108 |
relentless | -21.054 |
stringent | -20.757 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
u | +16.650 |
- | +16.579 |
. | +16.203 |
id | +15.603 |
ire | +15.408 |
Neg logit contributions | |
tremend | -29.382 |
hemor | -28.403 |
cumbers | -27.927 |
disparate | -27.258 |
mathemat | -27.252 |
Token | image |
Token ID | 2939 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
- | +8.588 |
u | +8.145 |
. | +8.086 |
ia | +7.605 |
ine | +7.480 |
Neg logit contributions | |
mathemat | -9.151 |
theless | -9.017 |
venerable | -8.770 |
tremend | -8.755 |
relentless | -8.650 |
Token | Path |
Token ID | 15235 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
. | +15.070 |
- | +14.986 |
u | +13.797 |
' | +12.363 |
Path | +12.326 |
Neg logit contributions | |
tremend | -37.285 |
mathemat | -35.541 |
hemor | -33.394 |
undermin | -32.796 |
anwhile | -32.649 |
Token | in |
Token ID | 287 |
Feature activation | +4.29e+00 |
Pos logit contributions | |
. | +19.964 |
- | +19.917 |
u | +18.299 |
' | +16.514 |
ine | +16.501 |
Neg logit contributions | |
tremend | -30.357 |
mathemat | -28.858 |
hemor | -27.823 |
cumbers | -26.774 |
undermin | -26.735 |
Token | paths |
Token ID | 13532 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
- | +9.446 |
. | +8.899 |
u | +8.713 |
ia | +7.932 |
acy | +7.891 |
Neg logit contributions | |
tremend | -9.780 |
mathemat | -9.668 |
blatant | -9.254 |
venerable | -9.210 |
theless | -9.035 |
Token | . |
Token ID | 13 |
Feature activation | +5.63e+00 |
Pos logit contributions | |
. | +24.412 |
- | +21.112 |
u | +18.752 |
' | +18.195 |
; | +17.684 |
Neg logit contributions | |
tremend | -30.349 |
mathemat | -27.862 |
cumbers | -27.222 |
hemor | -26.393 |
undermin | -26.095 |
Token | list |
Token ID | 4868 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
- | +4.155 |
u | +4.146 |
. | +3.475 |
ine | +3.420 |
id | +3.349 |
Neg logit contributions | |
mathemat | -21.202 |
tremend | -21.090 |
behavi | -20.898 |
venerable | -20.810 |
disparate | -20.744 |
Token | _ |
Token ID | 62 |
Feature activation | +9.33e+00 |
Pos logit contributions | |
- | +28.084 |
_ | +27.325 |
. | +26.072 |
u | +23.867 |
‐ | +22.505 |
Neg logit contributions | |
tremend | -43.632 |
mathemat | -39.967 |
cumbers | -39.684 |
hemor | -38.426 |
metic | -38.000 |
Token | images |
Token ID | 17566 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
u | +12.389 |
- | +11.370 |
ine | +10.605 |
ia | +10.583 |
. | +10.526 |
Neg logit contributions | |
mathemat | -27.534 |
tremend | -27.386 |
hemor | -26.627 |
behavi | -26.526 |
venerable | -26.321 |
Token | ( |
Token ID | 7 |
Feature activation | +7.79e+00 |
Pos logit contributions | |
- | +19.013 |
. | +18.893 |
u | +17.339 |
( | +16.748 |
' | +16.736 |
Neg logit contributions | |
tremend | -34.494 |
mathemat | -32.633 |
hemor | -32.090 |
undermin | -31.498 |
cumbers | -31.209 |
Token | args |
Token ID | 22046 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
u | +9.266 |
- | +8.839 |
. | +8.315 |
ag | +8.242 |
args | +7.967 |
Neg logit contributions | |
tremend | -24.328 |
mathemat | -23.978 |
totality | -22.741 |
venerable | -22.653 |
behavi | -22.627 |
Token | [" |
Token ID | 14692 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
. | +20.035 |
u | +19.172 |
- | +18.957 |
' | +16.106 |
ia | +15.949 |
Neg logit contributions | |
tremend | -34.396 |
mathemat | -32.652 |
behavi | -32.166 |
undermin | -31.228 |
cumbers | -31.077 |
Token | , |
Token ID | 11 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
- | +16.373 |
. | +16.245 |
, | +14.677 |
u | +14.398 |
ia | +13.614 |
Neg logit contributions | |
tremend | -30.656 |
mathemat | -28.681 |
cumbers | -27.845 |
undermin | -27.043 |
hemor | -26.667 |
Token | characterized |
Token ID | 16264 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
- | +0.350 |
u | +0.350 |
. | +0.334 |
ia | +0.334 |
acy | +0.330 |
Neg logit contributions | |
disparate | -0.291 |
blatant | -0.288 |
relentless | -0.286 |
newer | -0.286 |
genuine | -0.282 |
Token | by |
Token ID | 416 |
Feature activation | +4.36e+00 |
Pos logit contributions | |
. | +22.294 |
- | +22.000 |
' | +18.306 |
ia | +18.076 |
's | +17.987 |
Neg logit contributions | |
tremend | -32.721 |
mathemat | -30.918 |
cumbers | -29.386 |
hemor | -28.529 |
ccording | -28.280 |
Token | multiple |
Token ID | 3294 |
Feature activation | +7.43e+00 |
Pos logit contributions | |
- | +13.371 |
. | +12.845 |
u | +12.006 |
ine | +11.803 |
ia | +11.749 |
Neg logit contributions | |
mathemat | -6.920 |
tremend | -6.331 |
venerable | -5.888 |
theless | -5.757 |
blatant | -5.536 |
Token | tiny |
Token ID | 7009 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
- | +21.051 |
. | +20.229 |
u | +18.463 |
ia | +18.158 |
y | +18.041 |
Neg logit contributions | |
mathemat | -9.140 |
anwhile | -8.541 |
Palestin | -8.209 |
tremend | -8.097 |
totality | -8.047 |
Token | ker |
Token ID | 41927 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
- | +26.176 |
. | +25.207 |
u | +22.234 |
er | +22.219 |
‐ | +21.948 |
Neg logit contributions | |
tremend | -20.324 |
mathemat | -19.772 |
Palestin | -18.549 |
ccording | -18.373 |
anwhile | -18.177 |
Token | at |
Token ID | 265 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
at | +25.869 |
- | +22.736 |
ati | +22.356 |
acy | +22.133 |
ate | +21.989 |
Neg logit contributions | |
tremend | -40.493 |
cumbers | -39.653 |
reluct | -38.997 |
mathemat | -38.112 |
misunder | -37.674 |
Token | otic |
Token ID | 6210 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
- | +7.735 |
ic | +7.719 |
ite | +7.176 |
os | +6.985 |
. | +6.584 |
Neg logit contributions | |
mathemat | -32.964 |
hemor | -32.858 |
tremend | -32.565 |
disparate | -32.225 |
behavi | -32.075 |
Token | plugs |
Token ID | 37008 |
Feature activation | +1.57e+01 |
Pos logit contributions | |
- | +16.965 |
. | +16.195 |
u | +13.154 |
ig | +13.043 |
' | +12.762 |
Neg logit contributions | |
mathemat | -23.893 |
tremend | -23.735 |
anwhile | -22.734 |
theless | -22.143 |
hemor | -21.588 |
Token | , |
Token ID | 11 |
Feature activation | +2.05e-01 |
Pos logit contributions | |
. | +22.695 |
- | +22.420 |
, | +21.569 |
u | +19.252 |
' | +18.749 |
Neg logit contributions | |
tremend | -38.690 |
cumbers | -35.235 |
mathemat | -34.752 |
undermin | -33.560 |
reluct | -33.363 |
Token | mim |
Token ID | 17007 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
- | +0.579 |
u | +0.560 |
. | +0.553 |
acy | +0.537 |
ia | +0.537 |
Neg logit contributions | |
disparate | -0.382 |
venerable | -0.372 |
relentless | -0.369 |
newer | -0.368 |
totality | -0.364 |
Token | Line |
Token ID | 13949 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
disparate | +4.708 |
newer | +4.639 |
various | +4.621 |
relentless | +4.606 |
blatant | +4.605 |
Neg logit contributions | |
u | -2.422 |
- | -2.326 |
acy | -2.301 |
ia | -2.182 |
ine | -2.153 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
- | +18.352 |
. | +17.482 |
al | +17.253 |
u | +16.847 |
ine | +15.683 |
Neg logit contributions | |
tremend | -22.267 |
disparate | -21.998 |
venerable | -21.977 |
mathemat | -21.845 |
relentless | -21.356 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
- | +18.484 |
u | +18.299 |
. | +18.219 |
id | +17.546 |
ia | +17.348 |
Neg logit contributions | |
tremend | -29.681 |
hemor | -28.198 |
mathemat | -27.659 |
cumbers | -27.585 |
venerable | -26.892 |
Token | = |
Token ID | 796 |
Feature activation | +3.42e+00 |
Pos logit contributions | |
. | +21.181 |
- | +20.291 |
u | +19.366 |
' | +17.257 |
ia | +17.246 |
Neg logit contributions | |
tremend | -29.737 |
mathemat | -28.120 |
hemor | -26.912 |
cumbers | -25.625 |
metic | -25.167 |
Token | [ |
Token ID | 685 |
Feature activation | +6.39e+00 |
Pos logit contributions | |
- | +6.693 |
u | +6.429 |
. | +6.319 |
acy | +5.671 |
id | +5.653 |
Neg logit contributions | |
disparate | -8.544 |
venerable | -8.475 |
blatant | -8.467 |
theless | -8.403 |
relentless | -8.403 |
Token | system |
Token ID | 10057 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
u | +7.615 |
- | +7.501 |
. | +6.871 |
ine | +6.301 |
id | +6.279 |
Neg logit contributions | |
disparate | -19.885 |
hemor | -19.835 |
mathemat | -19.786 |
totality | -19.703 |
blatant | -19.694 |
Token | . |
Token ID | 13 |
Feature activation | +6.25e+00 |
Pos logit contributions | |
. | +30.792 |
- | +27.115 |
u | +23.943 |
' | +23.130 |
s | +21.474 |
Neg logit contributions | |
tremend | -45.980 |
cumbers | -41.495 |
mathemat | -41.378 |
hemor | -39.995 |
metic | -39.932 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
- | +11.121 |
u | +11.084 |
. | +10.401 |
id | +10.089 |
ine | +10.053 |
Neg logit contributions | |
mathemat | -16.597 |
tremend | -16.422 |
disparate | -16.227 |
venerable | -16.186 |
totality | -16.063 |
Token | ing |
Token ID | 278 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
ing | +26.179 |
- | +24.233 |
. | +23.162 |
u | +22.332 |
ling | +21.360 |
Neg logit contributions | |
tremend | -47.124 |
mathemat | -42.999 |
cumbers | -42.958 |
metic | -42.348 |
hemor | -41.535 |
Token | . |
Token ID | 13 |
Feature activation | +4.39e+00 |
Pos logit contributions | |
. | +28.065 |
- | +24.555 |
u | +21.112 |
' | +21.058 |
/ | +19.593 |
Neg logit contributions | |
tremend | -43.436 |
cumbers | -38.572 |
mathemat | -38.538 |
hemor | -37.572 |
eleph | -37.285 |
Token | String |
Token ID | 10100 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
- | +4.996 |
u | +4.965 |
. | +4.448 |
ine | +4.095 |
id | +4.004 |
Neg logit contributions | |
disparate | -15.049 |
relentless | -15.043 |
venerable | -14.951 |
totality | -14.938 |
mathemat | -14.822 |
Token | v |
Token ID | 410 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
- | +3.452 |
u | +3.325 |
. | +3.232 |
acy | +2.932 |
ia | +2.900 |
Neg logit contributions | |
blatant | -4.605 |
venerable | -4.594 |
relentless | -4.571 |
disparate | -4.569 |
tremendous | -4.483 |
Token | ars |
Token ID | 945 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
- | +19.724 |
. | +19.032 |
ar | +18.677 |
u | +18.450 |
ab | +17.681 |
Neg logit contributions | |
tremend | -31.747 |
hemor | -30.668 |
mathemat | -29.674 |
undermin | -29.643 |
metic | -29.374 |
Token | ( |
Token ID | 7 |
Feature activation | +6.16e+00 |
Pos logit contributions | |
- | +20.277 |
. | +20.101 |
u | +18.336 |
( | +17.784 |
' | +17.503 |
Neg logit contributions | |
tremend | -34.962 |
mathemat | -33.034 |
hemor | -32.893 |
undermin | -31.771 |
cumbers | -31.386 |
Token | ap |
Token ID | 499 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
u | +8.065 |
- | +7.781 |
ab | +7.564 |
ag | +7.406 |
acy | +7.395 |
Neg logit contributions | |
disparate | -19.532 |
mathemat | -19.405 |
tremend | -19.287 |
totality | -19.174 |
venerable | -19.161 |
Token | . |
Token ID | 13 |
Feature activation | +5.49e+00 |
Pos logit contributions | |
. | +27.295 |
- | +23.291 |
u | +21.839 |
' | +20.249 |
_ | +19.324 |
Neg logit contributions | |
tremend | -41.604 |
mathemat | -37.679 |
cumbers | -37.340 |
hemor | -37.230 |
metic | -36.553 |
Token | parse |
Token ID | 29572 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
- | +4.410 |
u | +4.181 |
ine | +3.697 |
. | +3.696 |
ade | +3.661 |
Neg logit contributions | |
disparate | -20.258 |
relentless | -19.987 |
venerable | -19.955 |
totality | -19.767 |
blatant | -19.699 |
Token | _ |
Token ID | 62 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
- | +26.791 |
_ | +26.716 |
. | +25.333 |
u | +23.182 |
' | +21.422 |
Neg logit contributions | |
tremend | -43.672 |
mathemat | -40.291 |
cumbers | -39.313 |
metic | -39.078 |
hemor | -38.578 |
Token | args |
Token ID | 22046 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
u | +15.947 |
args | +15.499 |
- | +15.478 |
. | +14.874 |
ag | +14.729 |
Neg logit contributions | |
tremend | -31.474 |
mathemat | -30.646 |
metic | -29.891 |
hemor | -29.085 |
behavi | -28.701 |
Token | ()) |
Token ID | 28955 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
- | +10.283 |
. | +10.113 |
u | +9.378 |
() | +8.182 |
_ | +8.000 |
Neg logit contributions | |
tremend | -33.360 |
mathemat | -33.354 |
streng | -31.361 |
metic | -31.338 |
hemor | -31.131 |
Token | # |
Token ID | 1303 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
u | +6.778 |
- | +6.754 |
. | +6.274 |
acy | +6.210 |
ia | +6.111 |
Neg logit contributions | |
disparate | -8.159 |
relentless | -8.025 |
anecdotal | -7.995 |
venerable | -7.985 |
tremendous | -7.965 |
Token | initialize |
Token ID | 41216 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
- | +2.806 |
u | +2.711 |
ine | +2.635 |
. | +2.627 |
acy | +2.624 |
Neg logit contributions | |
disparate | -2.569 |
venerable | -2.535 |
blatant | -2.516 |
relentless | -2.492 |
drastic | -2.467 |
Token | oker |
Token ID | 11020 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
ong | +20.629 |
- | +20.562 |
u | +20.384 |
. | +19.592 |
illo | +19.091 |
Neg logit contributions | |
disparate | -23.977 |
tremend | -23.446 |
mathemat | -22.600 |
behavi | -22.312 |
relentless | -22.301 |
Token | at |
Token ID | 265 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
at | +23.158 |
- | +21.345 |
ate | +21.075 |
acy | +20.471 |
ati | +20.211 |
Neg logit contributions | |
tremend | -36.854 |
hemor | -34.073 |
mathemat | -33.937 |
cumbers | -33.451 |
metic | -33.030 |
Token | osis |
Token ID | 5958 |
Feature activation | +8.34e+00 |
Pos logit contributions | |
ia | +15.998 |
- | +15.576 |
id | +15.175 |
u | +15.003 |
ode | +14.850 |
Neg logit contributions | |
tremend | -27.482 |
mathemat | -26.142 |
disparate | -25.988 |
hemor | -25.877 |
venerable | -25.427 |
Token | punct |
Token ID | 21025 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
- | +19.758 |
. | +18.708 |
u | +17.176 |
' | +16.808 |
‐ | +16.551 |
Neg logit contributions | |
theless | -11.983 |
anwhile | -11.862 |
disparate | -11.802 |
mathemat | -11.757 |
totality | -11.594 |
Token | ata |
Token ID | 1045 |
Feature activation | +8.76e+00 |
Pos logit contributions | |
ata | +25.718 |
ate | +24.257 |
ati | +23.694 |
acy | +23.038 |
u | +22.947 |
Neg logit contributions | |
tremend | -32.728 |
behavi | -32.211 |
mathemat | -32.203 |
hemor | -31.866 |
reluct | -31.572 |
Token | pal |
Token ID | 6340 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
- | +16.719 |
. | +15.368 |
u | +14.046 |
ia | +13.756 |
' | +13.594 |
Neg logit contributions | |
mathemat | -17.353 |
anwhile | -17.041 |
DRAG | -16.897 |
theless | -16.637 |
disparate | -16.396 |
Token | mar |
Token ID | 3876 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
- | +25.208 |
ar | +24.806 |
u | +24.278 |
. | +24.137 |
ab | +23.060 |
Neg logit contributions | |
tremend | -37.499 |
cumbers | -36.924 |
mathemat | -33.409 |
undermin | -33.130 |
hemor | -32.941 |
Token | is |
Token ID | 271 |
Feature activation | +8.14e+00 |
Pos logit contributions | |
is | +22.953 |
- | +22.808 |
ia | +22.705 |
i | +22.281 |
u | +22.127 |
Neg logit contributions | |
tremend | -37.383 |
mathemat | -35.353 |
hemor | -34.820 |
cumbers | -33.849 |
misunder | -33.381 |
Token | et |
Token ID | 2123 |
Feature activation | +8.52e+00 |
Pos logit contributions | |
- | +13.560 |
. | +12.457 |
u | +12.201 |
id | +11.646 |
ati | +11.493 |
Neg logit contributions | |
disparate | -17.752 |
venerable | -17.551 |
relentless | -17.504 |
totality | -17.267 |
blatant | -17.256 |
Token | plant |
Token ID | 4618 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
- | +16.646 |
. | +15.747 |
u | +14.728 |
ia | +14.314 |
ine | +13.477 |
Neg logit contributions | |
mathemat | -18.555 |
theless | -17.315 |
tremend | -16.994 |
anwhile | -16.857 |
undermin | -16.586 |
Token | aris |
Token ID | 20066 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
ar | +18.720 |
ire | +18.328 |
aria | +18.315 |
- | +18.272 |
. | +17.772 |
Neg logit contributions | |
tremend | -31.851 |
mathemat | -31.495 |
hemor | -30.998 |
misunder | -30.610 |
metic | -30.505 |
Token | in |
Token ID | 287 |
Feature activation | +8.03e+00 |
Pos logit contributions | |
- | +19.847 |
. | +19.042 |
u | +16.590 |
' | +16.091 |
ine | +15.908 |
Neg logit contributions | |
tremend | -26.183 |
mathemat | -24.750 |
cumbers | -24.178 |
undermin | -23.924 |
hemor | -23.555 |
Token | the |
Token ID | 262 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
- | +21.330 |
. | +20.662 |
u | +19.077 |
ia | +18.306 |
' | +18.039 |
Neg logit contributions | |
tremend | -14.891 |
mathemat | -13.660 |
cumbers | -12.682 |
hemor | -11.953 |
undermin | -11.854 |
Token | skillet |
Token ID | 41306 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
- | +8.021 |
. | +7.642 |
u | +7.086 |
ine | +6.920 |
ite | +6.876 |
Neg logit contributions | |
disparate | -7.994 |
blatant | -7.767 |
venerable | -7.526 |
drastic | -7.509 |
relentless | -7.509 |
Token | ( |
Token ID | 357 |
Feature activation | +5.91e+00 |
Pos logit contributions | |
. | +21.492 |
- | +20.845 |
u | +17.851 |
; | +17.329 |
's | +16.473 |
Neg logit contributions | |
tremend | -25.671 |
cumbers | -23.846 |
mathemat | -23.488 |
behavi | -22.292 |
undermin | -22.079 |
Token | don |
Token ID | 9099 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
u | +5.852 |
- | +5.574 |
. | +4.941 |
ine | +4.383 |
acy | +4.242 |
Neg logit contributions | |
disparate | -20.636 |
totality | -20.524 |
tremend | -20.357 |
venerable | -20.307 |
mathemat | -20.154 |
Token | � |
Token ID | 447 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
u | +19.004 |
- | +18.479 |
. | +18.303 |
acy | +17.221 |
ine | +17.166 |
Neg logit contributions | |
disparate | -21.869 |
venerable | -21.304 |
tremend | -21.094 |
mathemat | -21.062 |
totality | -20.473 |
Token | � |
Token ID | 247 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
� | +23.101 |
u | +20.479 |
� | +19.538 |
� | +19.328 |
aga | +18.799 |
Neg logit contributions | |
mathemat | -35.267 |
tremend | -33.353 |
anwhile | -32.793 |
cumbers | -32.144 |
misunder | -31.895 |
Token | t |
Token ID | 83 |
Feature activation | +7.95e+00 |
Pos logit contributions | |
u | +21.521 |
- | +19.507 |
. | +19.432 |
id | +18.473 |
t | +18.326 |
Neg logit contributions | |
tremend | -30.538 |
mathemat | -30.522 |
metic | -29.001 |
hemor | -28.899 |
cumbers | -28.578 |
Token | crowd |
Token ID | 4315 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
- | +17.012 |
. | +16.292 |
u | +15.560 |
' | +14.521 |
ong | +14.506 |
Neg logit contributions | |
mathemat | -14.474 |
tremend | -14.319 |
DRAG | -14.219 |
venerable | -13.992 |
cumbers | -13.479 |
Token | the |
Token ID | 262 |
Feature activation | +7.02e+00 |
Pos logit contributions | |
- | +28.951 |
. | +28.239 |
u | +24.772 |
' | +24.371 |
's | +23.723 |
Neg logit contributions | |
tremend | -32.260 |
mathemat | -30.303 |
cumbers | -28.154 |
misunder | -26.715 |
ccording | -26.659 |
Token | pan |
Token ID | 3425 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
- | +15.240 |
. | +14.400 |
u | +12.909 |
' | +12.569 |
ia | +12.445 |
Neg logit contributions | |
tremend | -14.882 |
mathemat | -14.841 |
cumbers | -14.079 |
undermin | -13.844 |
hemor | -13.769 |
Token | cv |
Token ID | 33967 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
u | +1.438 |
- | +1.363 |
acy | +1.303 |
ia | +1.232 |
ade | +1.217 |
Neg logit contributions | |
disparate | -3.159 |
newer | -3.086 |
relentless | -3.077 |
blatant | -3.072 |
venerable | -3.064 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
- | +24.524 |
. | +24.074 |
u | +23.724 |
2 | +21.409 |
b | +20.653 |
Neg logit contributions | |
tremend | -41.178 |
hemor | -38.363 |
mathemat | -38.285 |
metic | -37.850 |
exha | -37.390 |
Token | . |
Token ID | 13 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
. | +25.668 |
- | +22.368 |
u | +20.312 |
' | +19.156 |
_ | +17.886 |
Neg logit contributions | |
tremend | -40.825 |
mathemat | -37.048 |
hemor | -36.438 |
cumbers | -36.331 |
metic | -35.795 |
Token | M |
Token ID | 44 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
u | +1.441 |
- | +1.422 |
acy | +1.248 |
. | +1.217 |
ia | +1.201 |
Neg logit contributions | |
disparate | -4.218 |
newer | -4.138 |
relentless | -4.135 |
blatant | -4.133 |
venerable | -4.116 |
Token | OR |
Token ID | 1581 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
- | +20.740 |
. | +20.134 |
u | +18.321 |
_ | +17.083 |
ong | +16.806 |
Neg logit contributions | |
tremend | -29.390 |
mathemat | -28.588 |
hemor | -27.059 |
theless | -27.030 |
streng | -26.584 |
Token | PH |
Token ID | 11909 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
- | +23.089 |
. | +22.010 |
_ | +18.583 |
u | +18.314 |
' | +17.967 |
Neg logit contributions | |
tremend | -37.479 |
mathemat | -34.573 |
cumbers | -32.275 |
hemor | -32.268 |
undermin | -32.018 |
Token | _ |
Token ID | 62 |
Feature activation | +6.86e-02 |
Pos logit contributions | |
- | +26.983 |
_ | +26.964 |
. | +25.922 |
u | +24.014 |
' | +22.577 |
Neg logit contributions | |
tremend | -39.980 |
mathemat | -36.816 |
hemor | -36.471 |
cumbers | -36.258 |
undermin | -34.792 |
Token | RECT |
Token ID | 23988 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
u | +0.097 |
- | +0.094 |
acy | +0.088 |
ia | +0.083 |
. | +0.083 |
Neg logit contributions | |
disparate | -0.229 |
newer | -0.226 |
venerable | -0.225 |
relentless | -0.225 |
blatant | -0.225 |
Token | , |
Token ID | 11 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
- | +25.633 |
u | +24.657 |
. | +24.233 |
ong | +22.567 |
ade | +22.483 |
Neg logit contributions | |
disparate | -16.747 |
blatant | -16.275 |
venerable | -16.266 |
relentless | -16.233 |
anecdotal | -16.221 |
Token | ( |
Token ID | 357 |
Feature activation | +3.43e-01 |
Pos logit contributions | |
disparate | +0.445 |
blatant | +0.435 |
relentless | +0.434 |
newer | +0.432 |
tremendous | +0.431 |
Neg logit contributions | |
u | -0.243 |
- | -0.239 |
acy | -0.226 |
ia | -0.216 |
ine | -0.215 |
Token | 21 |
Token ID | 2481 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
u | +0.459 |
- | +0.445 |
acy | +0.410 |
ia | +0.391 |
ine | +0.387 |
Neg logit contributions | |
disparate | -1.185 |
blatant | -1.159 |
newer | -1.155 |
relentless | -1.155 |
venerable | -1.155 |
Token | cv |
Token ID | 33967 |
Feature activation | +1.89e+01 |
Pos logit contributions | |
u | +7.986 |
- | +7.213 |
. | +6.680 |
acy | +5.984 |
ab | +5.944 |
Neg logit contributions | |
mathemat | -23.951 |
disparate | -23.692 |
tremend | -23.486 |
venerable | -23.463 |
totality | -23.377 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
- | +25.163 |
. | +24.783 |
u | +23.421 |
2 | +22.567 |
' | +21.025 |
Neg logit contributions | |
tremend | -44.924 |
mathemat | -41.449 |
hemor | -40.646 |
undermin | -40.087 |
exha | -39.773 |
Token | . |
Token ID | 13 |
Feature activation | +5.53e+00 |
Pos logit contributions | |
. | +26.687 |
- | +23.149 |
u | +20.412 |
' | +19.900 |
_ | +18.742 |
Neg logit contributions | |
tremend | -41.349 |
mathemat | -37.962 |
cumbers | -36.816 |
hemor | -36.262 |
undermin | -35.402 |
Token | M |
Token ID | 44 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
- | +4.546 |
. | +4.054 |
u | +3.725 |
id | +2.646 |
ia | +2.612 |
Neg logit contributions | |
tremend | -21.804 |
mathemat | -21.230 |
totality | -20.681 |
disparate | -20.394 |
venerable | -20.389 |
Token | OR |
Token ID | 1581 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
- | +19.476 |
. | +19.197 |
u | +16.418 |
' | +15.684 |
+ | +15.225 |
Neg logit contributions | |
tremend | -39.048 |
mathemat | -36.733 |
undermin | -34.475 |
hemor | -34.256 |
anwhile | -34.188 |
Token | PH |
Token ID | 11909 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
- | +20.038 |
. | +19.232 |
| +15.694 |
' | +15.622 |
u | +15.368 |
Neg logit contributions | |
tremend | -40.241 |
mathemat | -36.953 |
anwhile | -34.601 |
streng | -34.595 |
hemor | -34.461 |
Token | _ |
Token ID | 62 |
Feature activation | +6.14e+00 |
Pos logit contributions | |
- | +27.458 |
_ | +26.963 |
. | +25.877 |
u | +23.068 |
' | +22.819 |
Neg logit contributions | |
tremend | -42.951 |
mathemat | -39.604 |
cumbers | -38.757 |
hemor | -37.990 |
metic | -37.006 |
Token | RECT |
Token ID | 23988 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
- | +8.435 |
. | +7.726 |
u | +7.656 |
' | +6.304 |
ine | +6.213 |
Neg logit contributions | |
tremend | -19.691 |
mathemat | -19.544 |
totality | -19.049 |
venerable | -19.009 |
relentless | -18.916 |
Token | , |
Token ID | 11 |
Feature activation | +6.04e+00 |
Pos logit contributions | |
. | +23.056 |
- | +22.888 |
, | +21.449 |
u | +20.357 |
' | +19.253 |
Neg logit contributions | |
tremend | -37.070 |
mathemat | -34.405 |
hemor | -33.135 |
cumbers | -32.692 |
undermin | -31.633 |
Token | ( |
Token ID | 357 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
- | +9.483 |
. | +8.944 |
u | +8.576 |
ia | +7.665 |
ine | +7.514 |
Neg logit contributions | |
tremend | -18.512 |
mathemat | -18.044 |
hemor | -16.886 |
undermin | -16.696 |
cumbers | -16.591 |
Token | 21 |
Token ID | 2481 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
- | +3.816 |
u | +3.553 |
. | +3.110 |
acy | +3.042 |
ab | +2.985 |
Neg logit contributions | |
disparate | -12.830 |
totality | -12.382 |
relentless | -12.341 |
genuine | -12.278 |
anecdotal | -12.264 |
Token | Line |
Token ID | 13949 |
Feature activation | +6.56e+00 |
Pos logit contributions | |
disparate | +8.526 |
newer | +8.417 |
various | +8.413 |
blatant | +8.383 |
genuine | +8.333 |
Neg logit contributions | |
u | -4.499 |
acy | -4.367 |
- | -4.320 |
ia | -4.112 |
aga | -4.107 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
- | +14.435 |
u | +13.995 |
. | +13.949 |
acy | +13.390 |
ade | +13.223 |
Neg logit contributions | |
disparate | -12.906 |
anecdotal | -12.579 |
relentless | -12.347 |
newer | -12.310 |
venerable | -12.226 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
u | +16.262 |
- | +15.352 |
. | +15.078 |
ia | +14.842 |
ine | +14.754 |
Neg logit contributions | |
tremend | -27.361 |
hemor | -26.233 |
mathemat | -26.068 |
venerable | -25.935 |
disparate | -25.785 |
Token | = |
Token ID | 796 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
. | +19.825 |
- | +19.212 |
u | +19.212 |
ia | +17.707 |
ine | +17.558 |
Neg logit contributions | |
disparate | -18.222 |
anecdotal | -17.630 |
relentless | -17.148 |
venerable | -17.051 |
blatant | -17.007 |
Token | [ |
Token ID | 685 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
disparate | +5.585 |
blatant | +5.439 |
newer | +5.421 |
relentless | +5.418 |
various | +5.411 |
Neg logit contributions | |
u | -5.915 |
- | -5.807 |
acy | -5.707 |
ia | -5.535 |
ine | -5.480 |
Token | system |
Token ID | 10057 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
u | +3.048 |
- | +2.986 |
acy | +2.700 |
ia | +2.630 |
ine | +2.628 |
Neg logit contributions | |
disparate | -6.902 |
newer | -6.783 |
relentless | -6.774 |
blatant | -6.772 |
gradual | -6.769 |
Token | . |
Token ID | 13 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
. | +30.075 |
- | +26.213 |
u | +23.662 |
' | +22.268 |
_ | +21.004 |
Neg logit contributions | |
tremend | -44.861 |
cumbers | -40.424 |
mathemat | -40.370 |
hemor | -39.571 |
metic | -39.275 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
u | +7.499 |
- | +7.446 |
. | +6.862 |
ine | +6.830 |
id | +6.756 |
Neg logit contributions | |
disparate | -9.095 |
relentless | -8.961 |
totality | -8.924 |
blatant | -8.905 |
gradual | -8.876 |
Token | ing |
Token ID | 278 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
ing | +26.385 |
- | +24.464 |
. | +23.515 |
u | +22.334 |
er | +21.711 |
Neg logit contributions | |
tremend | -46.461 |
cumbers | -42.389 |
mathemat | -42.218 |
metic | -41.477 |
hemor | -40.954 |
Token | . |
Token ID | 13 |
Feature activation | -2.67e+00 |
Pos logit contributions | |
. | +26.915 |
- | +23.484 |
u | +20.042 |
' | +19.890 |
/ | +18.497 |
Neg logit contributions | |
tremend | -42.301 |
cumbers | -37.362 |
mathemat | -37.246 |
hemor | -36.664 |
eleph | -36.366 |
Token | String |
Token ID | 10100 |
Feature activation | +7.32e+00 |
Pos logit contributions | |
disparate | +7.775 |
newer | +7.667 |
various | +7.663 |
blatant | +7.632 |
genuine | +7.596 |
Neg logit contributions | |
u | -4.481 |
acy | -4.372 |
- | -4.302 |
ia | -4.122 |
aga | -4.104 |
Token | cv |
Token ID | 33967 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
u | +6.119 |
- | +5.382 |
. | +4.926 |
acy | +4.551 |
ong | +4.452 |
Neg logit contributions | |
disparate | -20.583 |
venerable | -20.191 |
totality | -20.147 |
relentless | -19.990 |
mathemat | -19.891 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
- | +24.755 |
. | +24.166 |
u | +23.290 |
2 | +22.122 |
' | +20.556 |
Neg logit contributions | |
tremend | -44.219 |
mathemat | -40.500 |
hemor | -40.252 |
undermin | -39.520 |
exha | -39.317 |
Token | . |
Token ID | 13 |
Feature activation | +5.38e+00 |
Pos logit contributions | |
. | +25.077 |
- | +22.085 |
u | +19.796 |
' | +18.872 |
_ | +17.674 |
Neg logit contributions | |
tremend | -39.389 |
mathemat | -35.879 |
cumbers | -34.898 |
hemor | -34.519 |
metic | -33.613 |
Token | M |
Token ID | 44 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
- | +4.184 |
. | +3.669 |
u | +3.524 |
id | +2.508 |
ia | +2.402 |
Neg logit contributions | |
tremend | -20.948 |
mathemat | -20.588 |
totality | -20.362 |
disparate | -20.083 |
venerable | -20.061 |
Token | OR |
Token ID | 1581 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
- | +19.725 |
. | +19.155 |
u | +16.496 |
' | +15.590 |
_ | +15.399 |
Neg logit contributions | |
tremend | -37.146 |
mathemat | -35.804 |
anwhile | -33.772 |
streng | -33.457 |
undermin | -33.290 |
Token | PH |
Token ID | 11909 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
- | +21.729 |
. | +20.638 |
| +17.134 |
u | +17.076 |
‐ | +16.995 |
Neg logit contributions | |
tremend | -36.878 |
mathemat | -34.182 |
streng | -31.727 |
cumbers | -31.614 |
anwhile | -31.540 |
Token | _ |
Token ID | 62 |
Feature activation | +5.13e+00 |
Pos logit contributions | |
- | +26.840 |
_ | +26.724 |
. | +25.516 |
u | +23.120 |
' | +22.552 |
Neg logit contributions | |
tremend | -42.486 |
mathemat | -39.226 |
cumbers | -38.426 |
hemor | -37.877 |
undermin | -36.685 |
Token | RECT |
Token ID | 23988 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
- | +7.658 |
u | +7.215 |
. | +7.039 |
ine | +6.065 |
ong | +6.025 |
Neg logit contributions | |
venerable | -15.742 |
relentless | -15.679 |
totality | -15.626 |
disparate | -15.615 |
mathemat | -15.489 |
Token | , |
Token ID | 11 |
Feature activation | +3.36e+00 |
Pos logit contributions | |
- | +23.005 |
. | +22.933 |
, | +21.325 |
u | +20.485 |
' | +19.438 |
Neg logit contributions | |
tremend | -36.684 |
mathemat | -33.691 |
hemor | -32.894 |
cumbers | -32.602 |
undermin | -31.396 |
Token | ( |
Token ID | 357 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
- | +5.493 |
u | +5.465 |
. | +4.887 |
ine | +4.809 |
ia | +4.776 |
Neg logit contributions | |
disparate | -9.644 |
blatant | -9.441 |
anecdotal | -9.406 |
relentless | -9.381 |
totality | -9.286 |
Token | 13 |
Token ID | 1485 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
- | +4.492 |
u | +4.434 |
. | +3.830 |
ire | +3.798 |
acy | +3.707 |
Neg logit contributions | |
disparate | -12.667 |
totality | -12.333 |
venerable | -12.309 |
gradual | -12.307 |
blatant | -12.290 |
Token | new |
Token ID | 649 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
disparate | +3.646 |
blatant | +3.542 |
relentless | +3.521 |
venerable | +3.482 |
gradual | +3.472 |
Neg logit contributions | |
u | -5.813 |
- | -5.784 |
acy | -5.633 |
ia | -5.523 |
ine | -5.456 |
Token | - |
Token ID | 12 |
Feature activation | +8.20e+00 |
Pos logit contributions | |
- | +21.368 |
. | +17.317 |
u | +16.544 |
‐ | +15.429 |
‑ | +15.360 |
Neg logit contributions | |
tremend | -23.027 |
mathemat | -21.923 |
cumbers | -20.925 |
undermin | -20.814 |
reluct | -20.276 |
Token | object |
Token ID | 15252 |
Feature activation | +3.00e+00 |
Pos logit contributions | |
u | +8.576 |
- | +8.164 |
ine | +7.131 |
. | +7.124 |
ab | +6.498 |
Neg logit contributions | |
tremend | -26.225 |
mathemat | -26.125 |
venerable | -25.596 |
hemor | -25.518 |
disparate | -25.407 |
Token | system |
Token ID | 1080 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
- | +6.475 |
u | +6.115 |
. | +5.988 |
ia | +5.860 |
ine | +5.714 |
Neg logit contributions | |
disparate | -6.823 |
blatant | -6.794 |
relentless | -6.716 |
anecdotal | -6.689 |
gradual | -6.688 |
Token | . |
Token ID | 13 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
. | +27.986 |
- | +24.585 |
u | +21.794 |
' | +20.650 |
; | +19.421 |
Neg logit contributions | |
tremend | -41.949 |
mathemat | -37.827 |
cumbers | -37.474 |
hemor | -36.548 |
metic | -36.387 |
Token | draw |
Token ID | 19334 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
u | +7.158 |
- | +6.973 |
ia | +6.534 |
acy | +6.518 |
ine | +6.516 |
Neg logit contributions | |
disparate | -7.709 |
relentless | -7.497 |
gradual | -7.482 |
newer | -7.451 |
blatant | -7.446 |
Token | ing |
Token ID | 278 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
ing | +25.665 |
- | +24.303 |
. | +23.523 |
u | +22.394 |
al | +21.384 |
Neg logit contributions | |
tremend | -42.868 |
mathemat | -39.416 |
cumbers | -39.356 |
metic | -37.888 |
hemor | -37.875 |
Token | . |
Token ID | 13 |
Feature activation | -7.63e-01 |
Pos logit contributions | |
. | +23.095 |
- | +20.661 |
u | +17.654 |
' | +16.742 |
ia | +16.348 |
Neg logit contributions | |
tremend | -34.633 |
cumbers | -30.962 |
mathemat | -30.868 |
hemor | -30.328 |
reluct | -29.755 |
Token | bit |
Token ID | 2545 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
disparate | +2.763 |
newer | +2.723 |
various | +2.709 |
blatant | +2.705 |
relentless | +2.705 |
Neg logit contributions | |
u | -0.856 |
- | -0.815 |
acy | -0.785 |
ia | -0.740 |
ine | -0.722 |
Token | map |
Token ID | 8899 |
Feature activation | +5.54e+00 |
Pos logit contributions | |
- | +20.123 |
. | +19.089 |
u | +19.070 |
map | +18.804 |
ade | +17.896 |
Neg logit contributions | |
cumbers | -31.787 |
tremend | -31.473 |
undermin | -31.086 |
reluct | -30.665 |
behavi | -30.595 |
Token | ($ |
Token ID | 16763 |
Feature activation | +4.87e+00 |
Pos logit contributions | |
- | +14.107 |
. | +13.522 |
u | +12.996 |
ine | +12.472 |
ia | +12.313 |
Neg logit contributions | |
disparate | -9.636 |
anecdotal | -9.375 |
stringent | -9.141 |
venerable | -9.140 |
blatant | -9.081 |
Token | East |
Token ID | 3687 |
Feature activation | +2.86e+00 |
Pos logit contributions | |
- | +9.804 |
. | +9.350 |
u | +9.196 |
acy | +9.073 |
ia | +9.017 |
Neg logit contributions | |
disparate | -7.041 |
relentless | -6.958 |
anecdotal | -6.886 |
blatant | -6.850 |
venerable | -6.817 |
Token | , |
Token ID | 11 |
Feature activation | -5.82e+00 |
Pos logit contributions | |
- | +7.182 |
. | +6.910 |
u | +6.866 |
acy | +6.609 |
ia | +6.597 |
Neg logit contributions | |
disparate | -5.765 |
relentless | -5.731 |
anecdotal | -5.659 |
blatant | -5.637 |
venerable | -5.633 |
Token | image |
Token ID | 2939 |
Feature activation | +6.24e+00 |
Pos logit contributions | |
various | +14.434 |
disparate | +14.428 |
newer | +14.316 |
blatant | +14.195 |
genuine | +14.153 |
Neg logit contributions | |
u | -11.259 |
acy | -11.106 |
- | -10.654 |
aga | -10.484 |
ia | -10.471 |
Token | courtesy |
Token ID | 12537 |
Feature activation | +7.67e+00 |
Pos logit contributions | |
- | +14.245 |
. | +13.534 |
u | +13.217 |
ia | +12.832 |
acy | +12.705 |
Neg logit contributions | |
disparate | -11.654 |
relentless | -11.379 |
anecdotal | -11.262 |
tremendous | -11.187 |
gradual | -11.170 |
Token | of |
Token ID | 286 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
- | +14.882 |
. | +14.663 |
u | +13.526 |
ia | +12.728 |
acy | +12.395 |
Neg logit contributions | |
tremend | -18.303 |
mathemat | -17.581 |
cumbers | -16.594 |
hemor | -16.250 |
misunder | -15.868 |
Token | Dav |
Token ID | 2544 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
disparate | +4.224 |
newer | +4.108 |
various | +4.089 |
blatant | +4.059 |
relentless | +4.040 |
Neg logit contributions | |
u | -8.567 |
- | -8.388 |
acy | -8.385 |
ia | -8.160 |
aga | -8.108 |
Token | part |
Token ID | 3911 |
Feature activation | +7.19e+00 |
Pos logit contributions | |
- | +23.598 |
. | +22.858 |
b | +19.933 |
id | +19.882 |
ab | +19.867 |
Neg logit contributions | |
tremend | -37.607 |
cumbers | -36.364 |
metic | -36.219 |
hemor | -35.933 |
mathemat | -35.537 |
Token | . |
Token ID | 13 |
Feature activation | +6.67e-01 |
Pos logit contributions | |
. | +17.192 |
- | +16.882 |
u | +16.303 |
acy | +15.717 |
ia | +15.706 |
Neg logit contributions | |
disparate | -12.948 |
gradual | -12.492 |
relentless | -12.452 |
venerable | -12.435 |
tremendous | -12.339 |
Token |
|
Token ID | 198 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
u | +1.206 |
- | +1.175 |
acy | +1.147 |
ia | +1.103 |
ine | +1.093 |
Neg logit contributions | |
disparate | -1.922 |
relentless | -1.881 |
newer | -1.880 |
venerable | -1.873 |
blatant | -1.872 |
Token |
|
Token ID | 198 |
Feature activation | -7.19e+00 |
Pos logit contributions | |
- | +3.703 |
u | +3.437 |
. | +3.387 |
ia | +3.020 |
ine | +2.964 |
Neg logit contributions | |
tremend | -9.132 |
mathemat | -8.957 |
disparate | -8.600 |
venerable | -8.534 |
hemor | -8.505 |
Token | Panel |
Token ID | 26639 |
Feature activation | +3.66e+00 |
Pos logit contributions | |
various | +18.365 |
blatant | +18.352 |
newer | +18.291 |
disparate | +18.245 |
genuine | +18.245 |
Neg logit contributions | |
acy | -9.569 |
aga | -9.355 |
u | -9.104 |
ong | -8.605 |
illo | -8.587 |
Token | ARM |
Token ID | 33456 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
disparate | +4.911 |
newer | +4.835 |
various | +4.823 |
blatant | +4.811 |
relentless | +4.802 |
Neg logit contributions | |
u | -2.705 |
- | -2.602 |
acy | -2.590 |
ia | -2.460 |
aga | -2.423 |
Token | version |
Token ID | 2196 |
Feature activation | +8.32e+00 |
Pos logit contributions | |
- | +23.477 |
. | +22.316 |
u | +21.791 |
ia | +19.828 |
id | +19.812 |
Neg logit contributions | |
disparate | -15.296 |
anecdotal | -14.422 |
relentless | -14.365 |
blatant | -14.342 |
totality | -14.217 |
Token | , |
Token ID | 11 |
Feature activation | -9.25e-01 |
Pos logit contributions | |
- | +19.527 |
u | +18.958 |
. | +18.845 |
ia | +17.613 |
acy | +17.489 |
Neg logit contributions | |
disparate | -13.271 |
relentless | -13.016 |
tremendous | -12.899 |
blatant | -12.736 |
drastic | -12.652 |
Token | detected |
Token ID | 12326 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
disparate | +2.068 |
relentless | +2.017 |
venerable | +2.002 |
tremendous | +1.991 |
blatant | +1.985 |
Neg logit contributions | |
u | -2.304 |
- | -2.290 |
acy | -2.187 |
ia | -2.154 |
. | -2.139 |
Token | as |
Token ID | 355 |
Feature activation | +5.97e-01 |
Pos logit contributions | |
. | +21.029 |
- | +20.787 |
u | +19.020 |
ia | +17.958 |
ine | +17.390 |
Neg logit contributions | |
tremend | -26.200 |
mathemat | -25.857 |
hemor | -23.942 |
misunder | -23.680 |
cumbers | -23.413 |
Token | EL |
Token ID | 17852 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
- | +1.571 |
u | +1.569 |
acy | +1.491 |
. | +1.477 |
ia | +1.477 |
Neg logit contributions | |
disparate | -1.219 |
blatant | -1.188 |
relentless | -1.187 |
tremendous | -1.166 |
gradual | -1.165 |
Token | F |
Token ID | 37 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
- | +23.038 |
. | +22.059 |
u | +20.045 |
_ | +19.720 |
F | +19.520 |
Neg logit contributions | |
tremend | -45.636 |
mathemat | -42.791 |
metic | -41.798 |
hemor | -40.225 |
undermin | -39.629 |
Token | _ |
Token ID | 62 |
Feature activation | +7.37e+00 |
Pos logit contributions | |
- | +24.314 |
_ | +23.812 |
. | +23.067 |
u | +20.883 |
' | +19.583 |
Neg logit contributions | |
tremend | -40.263 |
mathemat | -37.349 |
metic | -36.135 |
cumbers | -36.038 |
hemor | -35.735 |
Token | UM |
Token ID | 5883 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
u | +9.053 |
- | +8.891 |
. | +8.139 |
ia | +7.056 |
um | +6.911 |
Neg logit contributions | |
mathemat | -22.506 |
disparate | -22.371 |
relentless | -22.294 |
tremend | -22.199 |
gradual | -22.172 |
Token | RE |
Token ID | 2200 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
- | +21.925 |
. | +21.508 |
u | +18.981 |
' | +18.347 |
_ | +18.285 |
Neg logit contributions | |
tremend | -40.376 |
mathemat | -38.472 |
metic | -37.168 |
undermin | -36.577 |
cumbers | -36.221 |
Token | ON |
Token ID | 1340 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
- | +19.174 |
. | +18.535 |
u | +16.084 |
' | +15.569 |
_ | +15.037 |
Neg logit contributions | |
tremend | -37.758 |
mathemat | -36.730 |
hemor | -34.865 |
metic | -34.626 |
cumbers | -34.386 |
Token | Dan |
Token ID | 6035 |
Feature activation | +8.34e+00 |
Pos logit contributions | |
disparate | +1.066 |
gradual | +1.029 |
newer | +1.027 |
blatant | +1.008 |
relentless | +1.005 |
Neg logit contributions | |
u | -2.018 |
- | -1.996 |
acy | -1.939 |
ia | -1.915 |
. | -1.887 |
Token | Mer |
Token ID | 4638 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
- | +15.518 |
u | +14.767 |
. | +14.602 |
ia | +13.908 |
er | +13.387 |
Neg logit contributions | |
disparate | -17.396 |
mathemat | -17.352 |
blatant | -17.088 |
tremend | -16.954 |
gradual | -16.881 |
Token | ica |
Token ID | 3970 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
ica | +22.800 |
ia | +22.134 |
ic | +20.789 |
- | +20.624 |
. | +20.574 |
Neg logit contributions | |
tremend | -34.115 |
cumbers | -34.105 |
mathemat | -33.068 |
reluct | -32.233 |
hemor | -32.135 |
Token | (@ |
Token ID | 4275 |
Feature activation | +7.73e+00 |
Pos logit contributions | |
- | +20.844 |
. | +20.776 |
u | +18.224 |
(@ | +18.043 |
/ | +17.687 |
Neg logit contributions | |
tremend | -33.174 |
mathemat | -31.603 |
cumbers | -30.366 |
undermin | -29.635 |
hemor | -29.576 |
Token | dan |
Token ID | 25604 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
u | +4.853 |
- | +4.689 |
. | +4.196 |
acy | +3.595 |
ag | +3.307 |
Neg logit contributions | |
totality | -28.138 |
mathemat | -27.349 |
tremend | -27.289 |
disparate | -27.054 |
stringent | -26.887 |
Token | meric |
Token ID | 946 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
- | +14.257 |
u | +13.885 |
meric | +13.506 |
. | +13.252 |
ag | +12.887 |
Neg logit contributions | |
totality | -30.349 |
tremend | -29.377 |
mathemat | -29.216 |
disparate | -28.889 |
relentless | -28.739 |
Token | a |
Token ID | 64 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
u | +24.218 |
- | +23.801 |
ia | +23.547 |
a | +23.444 |
ab | +22.954 |
Neg logit contributions | |
tremend | -40.638 |
mathemat | -40.210 |
cumbers | -39.885 |
hemor | -39.097 |
undermin | -38.642 |
Token | CNN |
Token ID | 18474 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
- | +15.958 |
. | +15.080 |
u | +14.453 |
' | +12.676 |
_ | +12.460 |
Neg logit contributions | |
tremend | -30.176 |
mathemat | -28.830 |
cumbers | -27.520 |
metic | -26.932 |
streng | -26.548 |
Token | ) |
Token ID | 8 |
Feature activation | +8.38e-01 |
Pos logit contributions | |
- | +20.795 |
. | +20.131 |
u | +18.004 |
) | +17.732 |
ia | +16.913 |
Neg logit contributions | |
tremend | -40.283 |
mathemat | -37.850 |
cumbers | -36.569 |
hemor | -36.098 |
metic | -36.053 |
Token | October |
Token ID | 3267 |
Feature activation | +6.39e+00 |
Pos logit contributions | |
- | +2.455 |
u | +2.444 |
acy | +2.405 |
ia | +2.343 |
. | +2.320 |
Neg logit contributions | |
disparate | -1.428 |
newer | -1.370 |
relentless | -1.362 |
venerable | -1.353 |
gradual | -1.353 |
Token | 23 |
Token ID | 2242 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
- | +12.394 |
. | +11.601 |
u | +11.488 |
ine | +10.389 |
ia | +10.115 |
Neg logit contributions | |
disparate | -15.277 |
mathemat | -14.731 |
venerable | -14.684 |
tremend | -14.510 |
gradual | -14.141 |
Token | ," |
Token ID | 553 |
Feature activation | +6.23e+00 |
Pos logit contributions | |
- | +15.039 |
. | +14.372 |
u | +13.349 |
ine | +12.336 |
; | +12.138 |
Neg logit contributions | |
tremend | -24.938 |
mathemat | -24.254 |
behavi | -22.747 |
cumbers | -22.714 |
streng | -22.359 |
Token | " |
Token ID | 366 |
Feature activation | +5.51e+00 |
Pos logit contributions | |
- | +16.499 |
. | +15.975 |
u | +15.468 |
ia | +14.719 |
ine | +14.545 |
Neg logit contributions | |
tremend | -12.107 |
mathemat | -11.903 |
hemor | -10.577 |
undermin | -10.413 |
disparate | -10.395 |
Token | P |
Token ID | 47 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
- | +3.629 |
. | +3.053 |
u | +2.824 |
id | +1.945 |
ine | +1.910 |
Neg logit contributions | |
mathemat | -23.319 |
tremend | -23.278 |
hemor | -21.987 |
streng | -21.897 |
disparate | -21.873 |
Token | unct |
Token ID | 16260 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
u | +15.974 |
- | +15.489 |
ong | +14.848 |
. | +14.675 |
id | +14.154 |
Neg logit contributions | |
mathemat | -27.684 |
tremend | -27.073 |
totality | -26.161 |
disparate | -26.047 |
metic | -25.836 |
Token | ate |
Token ID | 378 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
ate | +28.235 |
ine | +24.511 |
- | +24.411 |
acy | +24.185 |
u | +23.808 |
Neg logit contributions | |
tremend | -36.384 |
mathemat | -34.078 |
cumbers | -33.606 |
hemor | -33.472 |
behavi | -33.208 |
Token | ker |
Token ID | 41927 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
- | +19.878 |
. | +18.764 |
u | +17.416 |
' | +16.853 |
‐ | +16.595 |
Neg logit contributions | |
mathemat | -18.521 |
tremend | -18.316 |
undermin | -16.884 |
anwhile | -16.882 |
disparate | -16.604 |
Token | at |
Token ID | 265 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
at | +25.800 |
- | +24.210 |
acy | +23.439 |
. | +23.151 |
ate | +23.044 |
Neg logit contributions | |
tremend | -39.765 |
cumbers | -37.997 |
reluct | -36.868 |
mathemat | -36.716 |
hemor | -36.023 |
Token | oder |
Token ID | 12342 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
- | +16.320 |
ode | +15.690 |
. | +15.489 |
id | +15.447 |
ine | +15.151 |
Neg logit contributions | |
tremend | -26.695 |
mathemat | -25.835 |
disparate | -24.724 |
cumbers | -24.552 |
hemor | -24.100 |
Token | ma |
Token ID | 2611 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
ia | +21.965 |
- | +20.624 |
u | +19.702 |
. | +19.558 |
id | +18.564 |
Neg logit contributions | |
tremend | -29.817 |
mathemat | -29.031 |
cumbers | -28.130 |
undermin | -27.871 |
misunder | -27.187 |
Token | ," |
Token ID | 553 |
Feature activation | +9.60e+00 |
Pos logit contributions | |
- | +15.952 |
. | +15.475 |
, | +13.749 |
ia | +13.455 |
u | +13.315 |
Neg logit contributions | |
tremend | -25.158 |
mathemat | -25.113 |
cumbers | -23.310 |
behavi | -22.944 |
undermin | -22.442 |
Token | and |
Token ID | 290 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
- | +16.999 |
. | +16.124 |
u | +14.406 |
and | +13.928 |
& | +13.839 |
Neg logit contributions | |
tremend | -26.350 |
mathemat | -24.972 |
misunder | -23.462 |
hemor | -23.039 |
undermin | -23.039 |
Token | reducing |
Token ID | 8868 |
Feature activation | -4.20e+00 |
Pos logit contributions | |
disparate | +22.639 |
various | +22.511 |
newer | +22.452 |
genuine | +22.370 |
blatant | +22.304 |
Neg logit contributions | |
u | -10.411 |
acy | -10.004 |
ia | -9.353 |
aga | -9.311 |
ong | -9.310 |
Token | the |
Token ID | 262 |
Feature activation | -6.78e+00 |
Pos logit contributions | |
disparate | +11.500 |
newer | +11.325 |
various | +11.286 |
blatant | +11.251 |
relentless | +11.223 |
Neg logit contributions | |
u | -8.093 |
- | -7.843 |
acy | -7.814 |
ia | -7.473 |
aga | -7.386 |
Token | shelter |
Token ID | 11772 |
Feature activation | +5.15e+00 |
Pos logit contributions | |
disparate | +19.628 |
various | +19.424 |
sheer | +19.226 |
newer | +19.209 |
genuine | +19.145 |
Neg logit contributions | |
u | -10.339 |
acy | -10.046 |
aga | -9.334 |
ong | -9.301 |
- | -9.298 |
Token | population |
Token ID | 3265 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
- | +14.189 |
. | +13.304 |
u | +12.775 |
acy | +12.632 |
ia | +12.599 |
Neg logit contributions | |
newer | -7.981 |
disparate | -7.974 |
blatant | -7.935 |
venerable | -7.901 |
relentless | -7.861 |
Token | . |
Token ID | 13 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
- | +3.684 |
. | +3.598 |
u | +3.509 |
acy | +3.454 |
ia | +3.220 |
Neg logit contributions | |
disparate | -5.015 |
venerable | -4.921 |
blatant | -4.921 |
newer | -4.880 |
relentless | -4.852 |
Token | But |
Token ID | 887 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
various | +25.505 |
newer | +25.223 |
modern | +24.872 |
genuine | +24.669 |
those | +24.514 |
Neg logit contributions | |
acy | -12.243 |
u | -11.957 |
aga | -11.859 |
iev | -11.647 |
ire | -11.564 |
Token | , |
Token ID | 11 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
various | +35.684 |
those | +35.491 |
anecdotal | +35.313 |
many | +35.297 |
disparate | +35.010 |
Neg logit contributions | |
u | -11.841 |
acy | -11.676 |
ire | -11.255 |
ong | -11.225 |
aga | -11.214 |
Token | of |
Token ID | 286 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
various | +29.816 |
anecdotal | +29.196 |
disparate | +29.146 |
newer | +29.118 |
relentless | +29.078 |
Neg logit contributions | |
u | -12.922 |
ire | -12.377 |
acy | -12.092 |
elle | -11.972 |
aga | -11.963 |
Token | course |
Token ID | 1781 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
disparate | +3.431 |
newer | +3.348 |
venerable | +3.327 |
blatant | +3.325 |
relentless | +3.313 |
Neg logit contributions | |
u | -4.658 |
- | -4.602 |
acy | -4.516 |
ia | -4.397 |
aga | -4.361 |
Token | , |
Token ID | 11 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
- | +1.103 |
u | +1.085 |
acy | +0.910 |
. | +0.890 |
ia | +0.805 |
Neg logit contributions | |
disparate | -6.079 |
venerable | -5.985 |
blatant | -5.969 |
newer | -5.958 |
relentless | -5.945 |
Token | there |
Token ID | 612 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
various | +28.924 |
disparate | +28.810 |
newer | +28.517 |
anecdotal | +28.439 |
those | +28.380 |
Neg logit contributions | |
u | -12.312 |
acy | -12.141 |
aga | -11.469 |
ong | -11.210 |
ire | -11.102 |
Token | a |
Token ID | 257 |
Feature activation | -3.90e+00 |
Pos logit contributions | |
disparate | +14.475 |
newer | +14.264 |
various | +14.244 |
relentless | +14.207 |
blatant | +14.184 |
Neg logit contributions | |
u | -7.720 |
acy | -7.434 |
- | -7.352 |
ia | -7.050 |
aga | -6.956 |
Token | game |
Token ID | 983 |
Feature activation | +4.97e+00 |
Pos logit contributions | |
disparate | +9.613 |
newer | +9.445 |
various | +9.422 |
blatant | +9.371 |
venerable | +9.321 |
Neg logit contributions | |
u | -8.648 |
- | -8.434 |
acy | -8.349 |
ia | -8.040 |
aga | -7.961 |
Token | of |
Token ID | 286 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
- | +13.760 |
. | +13.455 |
u | +12.815 |
ia | +12.078 |
ine | +11.966 |
Neg logit contributions | |
disparate | -7.758 |
anecdotal | -7.630 |
blatant | -7.466 |
venerable | -7.454 |
genuine | -7.412 |
Token | inches |
Token ID | 8331 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
disparate | +9.593 |
newer | +9.444 |
various | +9.400 |
blatant | +9.372 |
relentless | +9.344 |
Neg logit contributions | |
u | -7.478 |
- | -7.269 |
acy | -7.229 |
ia | -6.930 |
aga | -6.858 |
Token | , |
Token ID | 11 |
Feature activation | -7.52e+00 |
Pos logit contributions | |
- | +10.152 |
. | +9.974 |
u | +9.693 |
ong | +9.115 |
acy | +9.009 |
Neg logit contributions | |
venerable | -7.859 |
blatant | -7.839 |
disparate | -7.834 |
anecdotal | -7.825 |
genuine | -7.735 |
Token | and |
Token ID | 290 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
various | +22.142 |
disparate | +22.035 |
relentless | +21.774 |
newer | +21.704 |
blatant | +21.660 |
Neg logit contributions | |
u | -8.911 |
acy | -8.760 |
aga | -8.287 |
ire | -8.284 |
ia | -8.243 |
Token | taking |
Token ID | 2263 |
Feature activation | -4.46e+00 |
Pos logit contributions | |
various | +34.713 |
disparate | +34.197 |
those | +33.924 |
relentless | +33.909 |
tremendous | +33.872 |
Neg logit contributions | |
acy | -12.632 |
u | -12.611 |
aga | -12.438 |
iev | -11.917 |
ong | -11.749 |
Token | splash |
Token ID | 22870 |
Feature activation | +7.54e+00 |
Pos logit contributions | |
disparate | +11.799 |
newer | +11.604 |
various | +11.577 |
blatant | +11.531 |
relentless | +11.501 |
Neg logit contributions | |
u | -8.943 |
acy | -8.652 |
- | -8.647 |
ia | -8.285 |
aga | -8.205 |
Token | y |
Token ID | 88 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
- | +18.817 |
y | +17.823 |
. | +17.128 |
u | +17.042 |
ade | +16.503 |
Neg logit contributions | |
venerable | -11.721 |
disparate | -11.518 |
totality | -11.362 |
theless | -11.076 |
stringent | -10.997 |
Token | , |
Token ID | 11 |
Feature activation | -6.87e+00 |
Pos logit contributions | |
disparate | +4.417 |
newer | +4.341 |
venerable | +4.337 |
relentless | +4.315 |
various | +4.308 |
Neg logit contributions | |
u | -4.224 |
- | -4.215 |
acy | -4.084 |
ia | -3.955 |
ine | -3.899 |
Token | cash |
Token ID | 5003 |
Feature activation | +4.55e+00 |
Pos logit contributions | |
disparate | +19.950 |
blatant | +19.616 |
relentless | +19.521 |
various | +19.515 |
genuine | +19.437 |
Neg logit contributions | |
u | -10.214 |
acy | -9.841 |
aga | -9.471 |
ia | -9.426 |
- | -9.366 |
Token | and |
Token ID | 290 |
Feature activation | -8.49e+00 |
Pos logit contributions | |
u | +16.281 |
- | +15.765 |
ia | +14.648 |
ul | +14.612 |
. | +14.403 |
Neg logit contributions | |
blatant | -10.962 |
disparate | -10.880 |
newer | -10.675 |
relentless | -10.636 |
anecdotal | -10.627 |
Token | so |
Token ID | 523 |
Feature activation | +2.43e+00 |
Pos logit contributions | |
various | +25.209 |
newer | +24.670 |
disparate | +24.645 |
genuine | +24.316 |
venerable | +24.306 |
Neg logit contributions | |
acy | -9.516 |
u | -8.764 |
aga | -8.198 |
ire | -8.189 |
ia | -8.163 |
Token | on |
Token ID | 319 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
- | +4.641 |
u | +4.547 |
. | +4.151 |
acy | +4.118 |
ia | +4.101 |
Neg logit contributions | |
disparate | -6.564 |
newer | -6.404 |
anecdotal | -6.403 |
blatant | -6.391 |
tremendous | -6.367 |
Token | ). |
Token ID | 737 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
u | +1.086 |
- | +1.084 |
. | +0.960 |
acy | +0.937 |
ia | +0.901 |
Neg logit contributions | |
disparate | -3.936 |
relentless | -3.885 |
blatant | -3.882 |
tremendous | -3.863 |
newer | -3.862 |
Token | However |
Token ID | 2102 |
Feature activation | -9.62e-01 |
Pos logit contributions | |
various | +25.879 |
newer | +25.422 |
modern | +25.328 |
disparate | +24.951 |
genuine | +24.822 |
Neg logit contributions | |
acy | -12.294 |
aga | -11.310 |
u | -11.245 |
elle | -10.955 |
ine | -10.933 |
Token | , |
Token ID | 11 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
disparate | +3.627 |
newer | +3.584 |
various | +3.574 |
blatant | +3.569 |
relentless | +3.565 |
Neg logit contributions | |
u | -0.861 |
- | -0.803 |
acy | -0.791 |
ia | -0.717 |
aga | -0.697 |
Token | names |
Token ID | 3891 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
various | +34.410 |
newer | +33.943 |
modern | +33.895 |
many | +33.423 |
widespread | +33.035 |
Neg logit contributions | |
acy | -13.438 |
ée | -12.883 |
u | -12.500 |
elle | -12.306 |
ade | -12.178 |
Token | of |
Token ID | 286 |
Feature activation | -8.63e+00 |
Pos logit contributions | |
- | +0.315 |
u | +0.313 |
. | +0.293 |
acy | +0.292 |
ia | +0.287 |
Neg logit contributions | |
disparate | -0.312 |
relentless | -0.310 |
tremendous | -0.305 |
totality | -0.305 |
blatant | -0.304 |
Token | other |
Token ID | 584 |
Feature activation | -5.00e+00 |
Pos logit contributions | |
various | +25.182 |
disparate | +25.025 |
newer | +24.750 |
genuine | +24.621 |
venerable | +24.591 |
Neg logit contributions | |
acy | -11.058 |
u | -10.931 |
ade | -10.142 |
aga | -10.110 |
ine | -9.967 |
Token | foreign |
Token ID | 3215 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
disparate | +13.835 |
various | +13.621 |
newer | +13.586 |
blatant | +13.473 |
venerable | +13.448 |
Neg logit contributions | |
u | -9.118 |
acy | -8.877 |
- | -8.642 |
ia | -8.337 |
aga | -8.316 |
Token | origin |
Token ID | 8159 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
- | +6.430 |
u | +6.102 |
ia | +5.984 |
. | +5.979 |
acy | +5.938 |
Neg logit contributions | |
relentless | -3.443 |
newer | -3.372 |
blatant | -3.328 |
tremendous | -3.326 |
disparate | -3.304 |
Token | � |
Token ID | 447 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
u | +8.114 |
- | +8.035 |
acy | +7.702 |
. | +7.487 |
ate | +7.464 |
Neg logit contributions | |
disparate | -10.068 |
venerable | -9.653 |
totality | -9.634 |
newer | -9.630 |
relentless | -9.598 |
Token | � |
Token ID | 247 |
Feature activation | +4.65e+00 |
Pos logit contributions | |
� | +17.847 |
u | +17.569 |
- | +16.557 |
� | +16.306 |
� | +16.281 |
Neg logit contributions | |
mathemat | -23.010 |
disparate | -22.693 |
blatant | -22.661 |
theless | -22.003 |
totality | -21.777 |
Token | t |
Token ID | 83 |
Feature activation | -3.02e+00 |
Pos logit contributions | |
u | +7.423 |
- | +6.878 |
. | +6.551 |
acy | +6.508 |
ia | +6.252 |
Neg logit contributions | |
disparate | -13.743 |
venerable | -13.271 |
newer | -13.134 |
blatant | -13.114 |
totality | -13.094 |
Token | . |
Token ID | 13 |
Feature activation | -8.10e+00 |
Pos logit contributions | |
disparate | +11.375 |
newer | +11.234 |
various | +11.203 |
blatant | +11.179 |
relentless | +11.170 |
Neg logit contributions | |
u | -2.770 |
- | -2.616 |
acy | -2.572 |
ia | -2.335 |
aga | -2.253 |
Token | However |
Token ID | 2102 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
various | +21.822 |
newer | +21.504 |
blatant | +21.293 |
disparate | +21.242 |
genuine | +21.199 |
Neg logit contributions | |
acy | -10.332 |
u | -10.326 |
aga | -9.919 |
ong | -9.524 |
- | -9.471 |
Token | , |
Token ID | 11 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
u | +1.938 |
- | +1.901 |
acy | +1.760 |
ia | +1.701 |
. | +1.664 |
Neg logit contributions | |
disparate | -5.379 |
newer | -5.291 |
relentless | -5.263 |
various | -5.254 |
blatant | -5.244 |
Token | when |
Token ID | 618 |
Feature activation | -7.82e+00 |
Pos logit contributions | |
various | +33.680 |
many | +32.940 |
newer | +32.830 |
those | +32.748 |
anecdotal | +32.516 |
Neg logit contributions | |
acy | -13.564 |
u | -13.125 |
aga | -12.681 |
ong | -11.921 |
ade | -11.779 |
Token | it |
Token ID | 340 |
Feature activation | -2.14e+00 |
Pos logit contributions | |
various | +22.849 |
disparate | +22.823 |
newer | +22.556 |
blatant | +22.445 |
genuine | +22.372 |
Neg logit contributions | |
u | -10.564 |
acy | -10.417 |
aga | -9.585 |
ade | -9.467 |
ong | -9.391 |
Token | becomes |
Token ID | 4329 |
Feature activation | -5.01e+00 |
Pos logit contributions | |
disparate | +5.806 |
newer | +5.671 |
blatant | +5.655 |
relentless | +5.651 |
venerable | +5.639 |
Neg logit contributions | |
u | -4.325 |
- | -4.219 |
acy | -4.141 |
ia | -3.984 |
ine | -3.922 |
Token | � |
Token ID | 564 |
Feature activation | +9.19e+00 |
Pos logit contributions | |
disparate | +12.568 |
newer | +12.374 |
blatant | +12.361 |
various | +12.359 |
relentless | +12.265 |
Neg logit contributions | |
u | -10.398 |
acy | -10.094 |
- | -9.998 |
ia | -9.710 |
aga | -9.681 |
Token | � |
Token ID | 250 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
u | +15.593 |
- | +15.564 |
� | +15.503 |
ine | +15.316 |
acy | +14.891 |
Neg logit contributions | |
disparate | -17.388 |
blatant | -17.100 |
venerable | -17.060 |
newer | -16.771 |
relentless | -16.721 |
Token | to |
Token ID | 284 |
Feature activation | -6.53e+00 |
Pos logit contributions | |
- | +4.650 |
u | +4.512 |
. | +4.453 |
acy | +4.316 |
ong | +4.169 |
Neg logit contributions | |
disparate | -5.486 |
relentless | -5.437 |
venerable | -5.414 |
blatant | -5.366 |
totality | -5.354 |
Token | track |
Token ID | 2610 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
various | +17.818 |
disparate | +17.771 |
newer | +17.716 |
modern | +17.424 |
genuine | +17.422 |
Neg logit contributions | |
u | -10.625 |
acy | -10.258 |
aga | -9.757 |
ia | -9.749 |
- | -9.642 |
Token | bottleneck |
Token ID | 49936 |
Feature activation | +5.06e+00 |
Pos logit contributions | |
disparate | +3.624 |
newer | +3.531 |
relentless | +3.520 |
blatant | +3.517 |
venerable | +3.502 |
Neg logit contributions | |
- | -5.019 |
u | -4.995 |
acy | -4.836 |
. | -4.740 |
ia | -4.730 |
Token | bandwidth |
Token ID | 19484 |
Feature activation | +3.49e+00 |
Pos logit contributions | |
- | +13.867 |
. | +12.829 |
u | +12.740 |
acy | +12.511 |
ine | +12.282 |
Neg logit contributions | |
disparate | -8.160 |
venerable | -8.017 |
blatant | -7.943 |
relentless | -7.891 |
newer | -7.874 |
Token | , |
Token ID | 11 |
Feature activation | -9.54e+00 |
Pos logit contributions | |
- | +8.076 |
. | +8.051 |
u | +7.839 |
acy | +7.515 |
ine | +7.219 |
Neg logit contributions | |
disparate | -7.630 |
venerable | -7.503 |
relentless | -7.443 |
anecdotal | -7.399 |
blatant | -7.370 |
Token | but |
Token ID | 475 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
various | +25.480 |
disparate | +25.269 |
genuine | +25.160 |
newer | +25.073 |
gradual | +25.043 |
Neg logit contributions | |
u | -11.441 |
acy | -11.041 |
aga | -10.781 |
ire | -10.738 |
ati | -10.591 |
Token | a |
Token ID | 257 |
Feature activation | -9.26e+00 |
Pos logit contributions | |
various | +34.847 |
newer | +34.224 |
disparate | +33.912 |
many | +33.750 |
those | +33.749 |
Neg logit contributions | |
acy | -12.214 |
aga | -11.717 |
u | -11.644 |
igr | -10.584 |
ade | -10.496 |
Token | good |
Token ID | 922 |
Feature activation | -2.40e+00 |
Pos logit contributions | |
newer | +26.650 |
disparate | +26.541 |
gradual | +26.356 |
genuine | +26.338 |
widespread | +26.181 |
Neg logit contributions | |
acy | -10.039 |
u | -9.779 |
aga | -9.399 |
ia | -8.836 |
ade | -8.819 |
Token | estimate |
Token ID | 8636 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
disparate | +6.468 |
newer | +6.353 |
blatant | +6.335 |
various | +6.328 |
relentless | +6.313 |
Neg logit contributions | |
u | -4.788 |
- | -4.732 |
acy | -4.615 |
ia | -4.443 |
ine | -4.382 |
Token | results |
Token ID | 2482 |
Feature activation | +7.86e-01 |
Pos logit contributions | |
- | +3.837 |
u | +3.705 |
acy | +3.468 |
. | +3.468 |
ia | +3.282 |
Neg logit contributions | |
disparate | -6.529 |
blatant | -6.422 |
relentless | -6.404 |
venerable | -6.382 |
newer | -6.363 |
Token | from |
Token ID | 422 |
Feature activation | -8.23e+00 |
Pos logit contributions | |
- | +1.423 |
u | +1.373 |
. | +1.348 |
acy | +1.323 |
ia | +1.261 |
Neg logit contributions | |
disparate | -2.253 |
relentless | -2.236 |
venerable | -2.227 |
blatant | -2.227 |
newer | -2.214 |
Token | appropriate |
Token ID | 13335 |
Feature activation | +3.75e+00 |
Pos logit contributions | |
disparate | +0.460 |
newer | +0.454 |
venerable | +0.450 |
gradual | +0.448 |
tremendous | +0.446 |
Neg logit contributions | |
- | -0.487 |
u | -0.485 |
acy | -0.465 |
ine | -0.451 |
ia | -0.449 |
Token | language |
Token ID | 3303 |
Feature activation | +4.56e+00 |
Pos logit contributions | |
- | +10.290 |
u | +9.890 |
acy | +9.718 |
. | +9.567 |
ia | +9.393 |
Neg logit contributions | |
disparate | -6.374 |
gradual | -6.317 |
newer | -6.251 |
venerable | -6.195 |
tremendous | -6.150 |
Token | � |
Token ID | 447 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
- | +10.030 |
. | +9.939 |
u | +9.772 |
acy | +9.196 |
ia | +9.187 |
Neg logit contributions | |
venerable | -9.738 |
disparate | -9.656 |
gradual | -9.587 |
tremendous | -9.541 |
totality | -9.510 |
Token | � |
Token ID | 247 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
� | +15.023 |
� | +14.320 |
u | +14.244 |
- | +13.559 |
� | +13.446 |
Neg logit contributions | |
blatant | -21.484 |
venerable | -21.461 |
disparate | -21.035 |
gradual | -20.921 |
mathemat | -20.834 |
Token | . |
Token ID | 13 |
Feature activation | -9.38e+00 |
Pos logit contributions | |
u | +3.307 |
- | +3.291 |
acy | +3.190 |
. | +3.144 |
ia | +3.110 |
Neg logit contributions | |
disparate | -2.906 |
newer | -2.865 |
venerable | -2.864 |
gradual | -2.864 |
tremendous | -2.827 |
Token | But |
Token ID | 887 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
various | +21.489 |
modern | +21.075 |
newer | +21.068 |
genuine | +20.798 |
those | +20.652 |
Neg logit contributions | |
acy | -14.252 |
aga | -13.907 |
u | -13.695 |
iev | -13.489 |
ire | -12.987 |
Token | when |
Token ID | 618 |
Feature activation | -8.64e+00 |
Pos logit contributions | |
those | +34.329 |
various | +34.141 |
genuine | +34.020 |
modern | +33.976 |
widespread | +33.852 |
Neg logit contributions | |
acy | -12.392 |
u | -12.094 |
iev | -11.918 |
aga | -11.802 |
ire | -11.386 |
Token | a |
Token ID | 257 |
Feature activation | -8.95e+00 |
Pos logit contributions | |
disparate | +25.017 |
various | +24.926 |
blatant | +24.884 |
genuine | +24.800 |
relentless | +24.671 |
Neg logit contributions | |
u | -10.700 |
acy | -10.502 |
aga | -9.950 |
iev | -9.539 |
ade | -9.516 |
Token | politician |
Token ID | 14971 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
genuine | +24.975 |
blatant | +24.829 |
disparate | +24.818 |
newer | +24.651 |
modern | +24.620 |
Neg logit contributions | |
acy | -11.570 |
u | -11.458 |
aga | -10.751 |
iev | -10.629 |
ong | -10.439 |
Token | tries |
Token ID | 8404 |
Feature activation | -7.18e-01 |
Pos logit contributions | |
- | +0.250 |
u | +0.244 |
acy | +0.234 |
ia | +0.232 |
. | +0.231 |
Neg logit contributions | |
disparate | -0.269 |
venerable | -0.263 |
newer | -0.263 |
totality | -0.263 |
gradual | -0.262 |
Token | to |
Token ID | 284 |
Feature activation | -6.05e+00 |
Pos logit contributions | |
disparate | +2.153 |
newer | +2.120 |
venerable | +2.108 |
various | +2.101 |
blatant | +2.098 |
Neg logit contributions | |
u | -1.202 |
- | -1.184 |
acy | -1.152 |
ia | -1.093 |
ine | -1.077 |
Token | 's |
Token ID | 338 |
Feature activation | -6.04e+00 |
Pos logit contributions | |
- | +8.935 |
u | +8.802 |
acy | +8.560 |
. | +8.466 |
ia | +8.404 |
Neg logit contributions | |
disparate | -7.836 |
blatant | -7.658 |
gradual | -7.634 |
newer | -7.581 |
stringent | -7.559 |
Token | a |
Token ID | 257 |
Feature activation | -4.00e+00 |
Pos logit contributions | |
disparate | +17.882 |
various | +17.713 |
newer | +17.701 |
relentless | +17.602 |
blatant | +17.540 |
Neg logit contributions | |
u | -9.089 |
acy | -8.738 |
- | -8.528 |
ia | -8.317 |
aga | -8.272 |
Token | big |
Token ID | 1263 |
Feature activation | +3.24e-01 |
Pos logit contributions | |
disparate | +12.158 |
newer | +12.001 |
various | +11.953 |
blatant | +11.919 |
relentless | +11.896 |
Neg logit contributions | |
u | -6.351 |
acy | -6.115 |
- | -6.062 |
ia | -5.775 |
aga | -5.712 |
Token | place |
Token ID | 1295 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
- | +0.999 |
u | +0.984 |
acy | +0.944 |
. | +0.938 |
ia | +0.927 |
Neg logit contributions | |
disparate | -0.529 |
blatant | -0.514 |
venerable | -0.511 |
genuine | -0.509 |
newer | -0.509 |
Token | , |
Token ID | 11 |
Feature activation | -8.66e+00 |
Pos logit contributions | |
- | +3.466 |
u | +3.432 |
. | +3.357 |
acy | +3.224 |
ia | +3.168 |
Neg logit contributions | |
disparate | -4.291 |
gradual | -4.243 |
venerable | -4.227 |
blatant | -4.226 |
totality | -4.215 |
Token | and |
Token ID | 290 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
various | +23.682 |
newer | +23.555 |
disparate | +23.519 |
relentless | +23.383 |
genuine | +23.238 |
Neg logit contributions | |
u | -10.742 |
acy | -10.430 |
iev | -10.307 |
aga | -10.255 |
ire | -10.065 |
Token | we |
Token ID | 356 |
Feature activation | -3.86e+00 |
Pos logit contributions | |
various | +34.739 |
newer | +34.453 |
many | +33.893 |
disparate | +33.824 |
those | +33.726 |
Neg logit contributions | |
u | -11.960 |
aga | -11.733 |
acy | -11.601 |
ée | -11.519 |
iev | -11.449 |
Token | 're |
Token ID | 821 |
Feature activation | -5.28e+00 |
Pos logit contributions | |
disparate | +9.750 |
newer | +9.606 |
various | +9.577 |
blatant | +9.524 |
relentless | +9.510 |
Neg logit contributions | |
u | -8.133 |
acy | -7.890 |
- | -7.862 |
ia | -7.565 |
aga | -7.499 |
Token | sure |
Token ID | 1654 |
Feature activation | -6.21e+00 |
Pos logit contributions | |
disparate | +13.827 |
newer | +13.673 |
various | +13.654 |
relentless | +13.605 |
blatant | +13.554 |
Neg logit contributions | |
u | -10.264 |
acy | -10.007 |
- | -9.839 |
ia | -9.552 |
aga | -9.486 |
Token | there |
Token ID | 612 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
disparate | +18.593 |
newer | +18.549 |
various | +18.528 |
genuine | +18.218 |
blatant | +18.210 |
Neg logit contributions | |
u | -9.212 |
acy | -8.902 |
- | -8.609 |
aga | -8.393 |
ia | -8.342 |
Token | are |
Token ID | 389 |
Feature activation | -8.02e+00 |
Pos logit contributions | |
disparate | +7.796 |
newer | +7.706 |
various | +7.689 |
blatant | +7.666 |
relentless | +7.652 |
Neg logit contributions | |
u | -2.304 |
- | -2.164 |
acy | -2.162 |
ia | -1.983 |
aga | -1.943 |
Token | storms |
Token ID | 20228 |
Feature activation | +3.63e+00 |
Pos logit contributions | |
- | +14.206 |
u | +13.202 |
. | +12.958 |
ia | +12.930 |
ite | +12.571 |
Neg logit contributions | |
disparate | -8.670 |
venerable | -8.571 |
blatant | -8.452 |
anecdotal | -8.431 |
genuine | -8.418 |
Token | . |
Token ID | 13 |
Feature activation | -7.94e+00 |
Pos logit contributions | |
. | +8.957 |
- | +8.763 |
u | +8.650 |
ong | +8.066 |
acy | +8.031 |
Neg logit contributions | |
venerable | -7.337 |
disparate | -7.268 |
blatant | -7.072 |
anecdotal | -7.022 |
tremendous | -6.964 |
Token |
|
Token ID | 198 |
Feature activation | +3.50e+00 |
Pos logit contributions | |
various | +19.603 |
disparate | +19.297 |
newer | +19.295 |
genuine | +19.263 |
modern | +19.174 |
Neg logit contributions | |
acy | -12.530 |
u | -12.377 |
aga | -12.153 |
igr | -11.633 |
- | -11.530 |
Token |
|
Token ID | 198 |
Feature activation | -7.73e+00 |
Pos logit contributions | |
- | +4.909 |
. | +4.519 |
u | +4.437 |
ine | +3.825 |
ia | +3.799 |
Neg logit contributions | |
tremend | -13.109 |
mathemat | -12.701 |
hemor | -12.171 |
undermin | -11.979 |
disparate | -11.954 |
Token | However |
Token ID | 4864 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
genuine | +19.392 |
widespread | +19.336 |
various | +19.257 |
blatant | +19.169 |
newer | +19.139 |
Neg logit contributions | |
acy | -9.886 |
aga | -9.640 |
u | -9.081 |
igr | -8.939 |
illo | -8.849 |
Token | , |
Token ID | 11 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
disparate | +8.078 |
various | +7.994 |
newer | +7.982 |
blatant | +7.952 |
genuine | +7.937 |
Neg logit contributions | |
u | -2.078 |
acy | -1.976 |
- | -1.869 |
ia | -1.748 |
aga | -1.744 |
Token | this |
Token ID | 428 |
Feature activation | -8.39e+00 |
Pos logit contributions | |
various | +34.160 |
genuine | +33.609 |
gradual | +33.600 |
widespread | +33.522 |
drastic | +33.515 |
Neg logit contributions | |
acy | -13.045 |
u | -12.777 |
aga | -12.269 |
ée | -12.084 |
elle | -11.973 |
Token | is |
Token ID | 318 |
Feature activation | -7.14e+00 |
Pos logit contributions | |
disparate | +24.610 |
gradual | +24.455 |
newer | +24.350 |
relentless | +24.236 |
various | +24.191 |
Neg logit contributions | |
u | -10.227 |
acy | -9.981 |
aga | -9.628 |
ia | -9.294 |
ine | -9.157 |
Token | barely |
Token ID | 8523 |
Feature activation | -2.93e+00 |
Pos logit contributions | |
disparate | +19.916 |
various | +19.618 |
gradual | +19.560 |
newer | +19.540 |
anecdotal | +19.472 |
Neg logit contributions | |
u | -11.124 |
acy | -10.798 |
aga | -10.289 |
- | -10.174 |
ia | -10.098 |
Token | enough |
Token ID | 1576 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
disparate | +6.315 |
newer | +6.187 |
various | +6.141 |
blatant | +6.122 |
venerable | +6.122 |
Neg logit contributions | |
u | -7.429 |
- | -7.302 |
acy | -7.175 |
ia | -6.984 |
aga | -6.899 |
Token | for |
Token ID | 329 |
Feature activation | -9.96e+00 |
Pos logit contributions | |
disparate | +8.396 |
newer | +8.298 |
various | +8.286 |
blatant | +8.263 |
relentless | +8.245 |
Neg logit contributions | |
u | -1.901 |
acy | -1.761 |
- | -1.741 |
ia | -1.576 |
aga | -1.540 |
Token | governments |
Token ID | 6905 |
Feature activation | +3.08e+00 |
Pos logit contributions | |
- | +2.682 |
u | +2.602 |
acy | +2.544 |
. | +2.524 |
ia | +2.505 |
Neg logit contributions | |
anecdotal | -1.561 |
disparate | -1.560 |
sheer | -1.542 |
blatant | -1.531 |
relentless | -1.527 |
Token | . |
Token ID | 13 |
Feature activation | -8.92e+00 |
Pos logit contributions | |
. | +5.404 |
- | +5.296 |
u | +5.083 |
acy | +4.717 |
ong | +4.697 |
Neg logit contributions | |
disparate | -8.513 |
venerable | -8.500 |
gradual | -8.464 |
anecdotal | -8.455 |
newer | -8.373 |
Token |
|
Token ID | 198 |
Feature activation | +3.49e+00 |
Pos logit contributions | |
various | +22.973 |
newer | +22.495 |
genuine | +22.363 |
modern | +22.271 |
blatant | +22.244 |
Neg logit contributions | |
acy | -11.466 |
aga | -11.098 |
u | -10.723 |
ia | -10.273 |
ire | -10.254 |
Token |
|
Token ID | 198 |
Feature activation | -7.57e+00 |
Pos logit contributions | |
- | +4.847 |
. | +4.515 |
u | +4.441 |
ia | +3.869 |
ine | +3.798 |
Neg logit contributions | |
tremend | -12.980 |
mathemat | -12.627 |
hemor | -12.043 |
disparate | -11.929 |
venerable | -11.914 |
Token | However |
Token ID | 4864 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
blatant | +18.881 |
various | +18.770 |
widespread | +18.681 |
genuine | +18.643 |
disparate | +18.569 |
Neg logit contributions | |
acy | -10.194 |
aga | -10.071 |
u | -9.394 |
ia | -9.191 |
igr | -9.188 |
Token | , |
Token ID | 11 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
- | +0.776 |
u | +0.721 |
. | +0.642 |
ia | +0.504 |
ine | +0.497 |
Neg logit contributions | |
disparate | -4.217 |
venerable | -4.211 |
relentless | -4.162 |
totality | -4.160 |
newer | -4.149 |
Token | the |
Token ID | 262 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
various | +33.697 |
newer | +32.701 |
genuine | +32.656 |
many | +32.613 |
those | +32.583 |
Neg logit contributions | |
acy | -13.554 |
aga | -12.874 |
u | -12.784 |
elle | -12.193 |
igr | -11.922 |
Token | United |
Token ID | 1578 |
Feature activation | +7.32e+00 |
Pos logit contributions | |
various | +29.998 |
newer | +29.704 |
genuine | +29.693 |
sheer | +29.598 |
blatant | +29.479 |
Neg logit contributions | |
acy | -12.498 |
u | -12.048 |
aga | -11.958 |
elle | -11.737 |
igr | -11.619 |
Token | States |
Token ID | 1829 |
Feature activation | -9.29e-01 |
Pos logit contributions | |
- | +14.515 |
. | +13.755 |
u | +13.059 |
ia | +12.857 |
ine | +12.311 |
Neg logit contributions | |
tremend | -16.923 |
mathemat | -16.777 |
hemor | -15.596 |
venerable | -15.350 |
disparate | -15.317 |
Token | � |
Token ID | 447 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
disparate | +2.506 |
newer | +2.456 |
venerable | +2.448 |
blatant | +2.435 |
various | +2.435 |
Neg logit contributions | |
u | -1.866 |
- | -1.861 |
acy | -1.800 |
ia | -1.721 |
. | -1.699 |
Token | � |
Token ID | 247 |
Feature activation | +5.52e+00 |
Pos logit contributions | |
� | +18.688 |
� | +18.450 |
� | +18.165 |
u | +18.146 |
- | +17.573 |
Neg logit contributions | |
tremend | -27.639 |
mathemat | -27.568 |
anwhile | -26.305 |
theless | -25.704 |
disparate | -25.230 |
Token | end |
Token ID | 886 |
Feature activation | +5.19e+00 |
Pos logit contributions | |
disparate | +17.929 |
various | +17.844 |
relentless | +17.741 |
newer | +17.737 |
gradual | +17.732 |
Neg logit contributions | |
u | -11.768 |
acy | -11.552 |
- | -11.053 |
aga | -10.991 |
ia | -10.883 |
Token | . |
Token ID | 13 |
Feature activation | -7.86e+00 |
Pos logit contributions | |
- | +12.199 |
. | +12.022 |
u | +11.814 |
acy | +11.436 |
ine | +10.851 |
Neg logit contributions | |
disparate | -10.371 |
blatant | -10.150 |
anecdotal | -10.124 |
newer | -10.114 |
venerable | -10.109 |
Token |
|
Token ID | 198 |
Feature activation | +4.90e+00 |
Pos logit contributions | |
various | +19.347 |
newer | +19.229 |
modern | +19.101 |
disparate | +18.989 |
genuine | +18.957 |
Neg logit contributions | |
acy | -12.586 |
u | -12.238 |
aga | -12.039 |
ong | -11.579 |
ire | -11.485 |
Token |
|
Token ID | 198 |
Feature activation | -6.92e+00 |
Pos logit contributions | |
- | +6.404 |
. | +5.915 |
u | +5.627 |
ia | +4.868 |
ine | +4.671 |
Neg logit contributions | |
tremend | -18.971 |
mathemat | -18.151 |
hemor | -17.404 |
undermin | -17.250 |
cumbers | -17.038 |
Token | However |
Token ID | 4864 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
newer | +16.962 |
various | +16.926 |
widespread | +16.919 |
genuine | +16.914 |
blatant | +16.870 |
Neg logit contributions | |
acy | -10.221 |
aga | -9.843 |
u | -9.417 |
ong | -9.169 |
iev | -9.133 |
Token | , |
Token ID | 11 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
disparate | +4.251 |
newer | +4.202 |
various | +4.182 |
tremendous | +4.171 |
relentless | +4.169 |
Neg logit contributions | |
u | -0.984 |
- | -0.959 |
acy | -0.856 |
ia | -0.812 |
. | -0.802 |
Token | it |
Token ID | 340 |
Feature activation | -5.12e+00 |
Pos logit contributions | |
various | +33.603 |
modern | +33.276 |
newer | +33.165 |
gradual | +33.023 |
genuine | +32.955 |
Neg logit contributions | |
acy | -13.709 |
u | -13.254 |
aga | -13.131 |
iev | -12.618 |
ong | -12.522 |
Token | is |
Token ID | 318 |
Feature activation | -7.13e+00 |
Pos logit contributions | |
disparate | +16.285 |
various | +16.253 |
newer | +16.176 |
relentless | +16.041 |
blatant | +16.016 |
Neg logit contributions | |
u | -6.410 |
acy | -6.198 |
- | -5.912 |
aga | -5.824 |
ia | -5.716 |
Token | utter |
Token ID | 10517 |
Feature activation | +2.93e+00 |
Pos logit contributions | |
disparate | +20.578 |
various | +20.548 |
newer | +20.478 |
genuine | +20.400 |
relentless | +20.324 |
Neg logit contributions | |
u | -10.380 |
acy | -10.124 |
aga | -9.582 |
- | -9.484 |
ia | -9.432 |
Token | nonsense |
Token ID | 18149 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
- | +8.599 |
u | +8.409 |
. | +8.158 |
acy | +8.080 |
ia | +7.906 |
Neg logit contributions | |
disparate | -4.524 |
newer | -4.391 |
venerable | -4.373 |
various | -4.284 |
tremendous | -4.237 |
Token | to |
Token ID | 284 |
Feature activation | -5.66e+00 |
Pos logit contributions | |
- | +2.258 |
u | +2.226 |
. | +2.198 |
acy | +2.073 |
ine | +1.993 |
Neg logit contributions | |
disparate | -3.771 |
venerable | -3.703 |
newer | -3.702 |
blatant | -3.698 |
tremendous | -3.693 |
Token | on |
Token ID | 319 |
Feature activation | -3.93e+00 |
Pos logit contributions | |
. | +12.523 |
- | +12.347 |
u | +11.624 |
ine | +11.294 |
ia | +11.143 |
Neg logit contributions | |
venerable | -8.186 |
blatant | -8.105 |
genuine | -7.868 |
disparate | -7.823 |
totality | -7.781 |
Token | Fisher |
Token ID | 14388 |
Feature activation | +9.44e+00 |
Pos logit contributions | |
disparate | +9.703 |
newer | +9.514 |
blatant | +9.476 |
various | +9.439 |
relentless | +9.422 |
Neg logit contributions | |
u | -8.784 |
- | -8.605 |
acy | -8.471 |
ia | -8.200 |
ine | -8.097 |
Token | s |
Token ID | 82 |
Feature activation | +5.19e+00 |
Pos logit contributions | |
- | +22.222 |
. | +20.889 |
ia | +20.213 |
y | +20.181 |
u | +19.691 |
Neg logit contributions | |
disparate | -13.566 |
blatant | -13.440 |
genuine | -13.103 |
gradual | -12.872 |
anecdotal | -12.796 |
Token | Island |
Token ID | 5451 |
Feature activation | +5.66e+00 |
Pos logit contributions | |
- | +13.122 |
. | +12.615 |
ia | +12.309 |
u | +12.173 |
acy | +11.864 |
Neg logit contributions | |
disparate | -9.504 |
blatant | -8.946 |
genuine | -8.798 |
totality | -8.755 |
anecdotal | -8.707 |
Token | -- |
Token ID | 1377 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
. | +15.052 |
- | +14.874 |
u | +14.290 |
ia | +13.876 |
ine | +13.784 |
Neg logit contributions | |
blatant | -8.677 |
venerable | -8.604 |
disparate | -8.501 |
anecdotal | -8.377 |
drastic | -8.333 |
Token | but |
Token ID | 475 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
disparate | +12.659 |
newer | +12.511 |
various | +12.476 |
blatant | +12.406 |
relentless | +12.394 |
Neg logit contributions | |
u | -6.418 |
acy | -6.153 |
- | -6.133 |
ia | -5.817 |
aga | -5.745 |
Token | early |
Token ID | 1903 |
Feature activation | -3.14e+00 |
Pos logit contributions | |
various | +34.647 |
newer | +34.330 |
those | +34.059 |
disparate | +33.959 |
many | +33.848 |
Neg logit contributions | |
acy | -11.926 |
u | -11.865 |
iev | -11.375 |
ache | -11.113 |
ire | -10.934 |
Token | in |
Token ID | 287 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
disparate | +10.064 |
newer | +9.887 |
various | +9.876 |
blatant | +9.874 |
relentless | +9.844 |
Neg logit contributions | |
u | -4.695 |
- | -4.582 |
acy | -4.462 |
ia | -4.245 |
ine | -4.164 |
Token | 1989 |
Token ID | 11104 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
disparate | +4.661 |
blatant | +4.495 |
newer | +4.463 |
relentless | +4.451 |
various | +4.438 |
Neg logit contributions | |
u | -8.886 |
- | -8.767 |
acy | -8.618 |
ia | -8.454 |
ine | -8.358 |
Token | he |
Token ID | 339 |
Feature activation | -2.46e+00 |
Pos logit contributions | |
- | +5.732 |
u | +5.464 |
. | +5.421 |
acy | +5.304 |
ia | +5.287 |
Neg logit contributions | |
disparate | -3.117 |
blatant | -3.050 |
relentless | -3.035 |
gradual | -3.009 |
totality | -2.979 |
Token | found |
Token ID | 1043 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
disparate | +6.277 |
newer | +6.157 |
blatant | +6.140 |
relentless | +6.107 |
various | +6.106 |
Neg logit contributions | |
u | -5.331 |
- | -5.248 |
acy | -5.146 |
ia | -4.976 |
ine | -4.919 |
Token | iots |
Token ID | 16228 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
- | +7.935 |
acy | +7.446 |
u | +7.366 |
ine | +7.348 |
. | +7.212 |
Neg logit contributions | |
disparate | -11.676 |
blatant | -11.502 |
genuine | -11.475 |
gradual | -11.467 |
relentless | -11.429 |
Token | level |
Token ID | 1241 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
- | +9.613 |
u | +9.127 |
. | +9.049 |
acy | +8.793 |
ia | +8.749 |
Neg logit contributions | |
venerable | -4.937 |
disparate | -4.918 |
newer | -4.780 |
relentless | -4.777 |
genuine | -4.771 |
Token | Saturday |
Token ID | 3909 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
u | +0.156 |
- | +0.155 |
acy | +0.139 |
. | +0.137 |
ia | +0.124 |
Neg logit contributions | |
disparate | -0.810 |
venerable | -0.802 |
newer | -0.799 |
relentless | -0.797 |
blatant | -0.795 |
Token | night |
Token ID | 1755 |
Feature activation | +8.34e-01 |
Pos logit contributions | |
- | +0.709 |
u | +0.704 |
. | +0.670 |
acy | +0.666 |
ia | +0.653 |
Neg logit contributions | |
disparate | -1.072 |
venerable | -1.055 |
newer | -1.050 |
relentless | -1.047 |
blatant | -1.045 |
Token | , |
Token ID | 11 |
Feature activation | -8.55e+00 |
Pos logit contributions | |
- | +0.733 |
u | +0.725 |
. | +0.666 |
acy | +0.651 |
ia | +0.602 |
Neg logit contributions | |
disparate | -3.166 |
venerable | -3.120 |
relentless | -3.110 |
newer | -3.109 |
blatant | -3.108 |
Token | but |
Token ID | 475 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
various | +22.487 |
newer | +22.313 |
disparate | +22.186 |
genuine | +22.041 |
blatant | +21.946 |
Neg logit contributions | |
u | -12.116 |
acy | -11.740 |
ire | -11.276 |
ong | -11.235 |
- | -11.164 |
Token | just |
Token ID | 655 |
Feature activation | -8.76e+00 |
Pos logit contributions | |
various | +34.738 |
disparate | +33.968 |
those | +33.902 |
newer | +33.761 |
widespread | +33.673 |
Neg logit contributions | |
acy | -11.945 |
u | -11.799 |
aga | -11.018 |
ache | -10.896 |
igr | -10.866 |
Token | being |
Token ID | 852 |
Feature activation | -4.59e+00 |
Pos logit contributions | |
disparate | +25.830 |
various | +25.740 |
relentless | +25.531 |
tremendous | +25.500 |
sheer | +25.498 |
Neg logit contributions | |
acy | -9.316 |
u | -9.188 |
aga | -8.311 |
ia | -8.124 |
ire | -8.110 |
Token | outside |
Token ID | 2354 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
disparate | +12.543 |
various | +12.346 |
newer | +12.337 |
blatant | +12.295 |
relentless | +12.277 |
Neg logit contributions | |
u | -8.588 |
acy | -8.341 |
- | -8.201 |
ia | -7.942 |
aga | -7.869 |
Token | was |
Token ID | 373 |
Feature activation | -6.44e+00 |
Pos logit contributions | |
disparate | +8.469 |
newer | +8.354 |
blatant | +8.305 |
various | +8.295 |
venerable | +8.285 |
Neg logit contributions | |
u | -3.977 |
- | -3.914 |
acy | -3.765 |
ia | -3.585 |
. | -3.519 |
Token | illegal |
Token ID | 5293 |
Feature activation | -4.66e-01 |
Pos logit contributions | |
disparate | +23.541 |
various | +23.401 |
relentless | +23.361 |
blatant | +23.343 |
newer | +23.288 |
Neg logit contributions | |
u | -4.512 |
acy | -4.450 |
ia | -3.678 |
- | -3.675 |
ong | -3.619 |
Token | of |
Token ID | 286 |
Feature activation | -4.25e+00 |
Pos logit contributions | |
- | +2.195 |
u | +2.145 |
. | +2.084 |
acy | +2.030 |
ia | +1.937 |
Neg logit contributions | |
disparate | -4.073 |
relentless | -4.057 |
newer | -4.036 |
blatant | -4.023 |
venerable | -4.017 |
Token | DOM |
Token ID | 24121 |
Feature activation | +7.91e+00 |
Pos logit contributions | |
disparate | +8.751 |
newer | +8.570 |
various | +8.563 |
blatant | +8.489 |
relentless | +8.452 |
Neg logit contributions | |
u | -10.944 |
acy | -10.664 |
- | -10.646 |
ia | -10.322 |
aga | -10.247 |
Token | A |
Token ID | 32 |
Feature activation | +3.46e+00 |
Pos logit contributions | |
- | +12.837 |
. | +12.819 |
u | +11.407 |
acy | +11.168 |
ire | +10.913 |
Neg logit contributions | |
anecdotal | -18.291 |
relentless | -18.253 |
spontaneous | -17.983 |
venerable | -17.949 |
gradual | -17.830 |
Token | . |
Token ID | 13 |
Feature activation | -8.76e+00 |
Pos logit contributions | |
- | +7.943 |
. | +7.897 |
u | +7.699 |
acy | +7.264 |
ade | +7.041 |
Neg logit contributions | |
disparate | -7.478 |
relentless | -7.464 |
venerable | -7.388 |
anecdotal | -7.377 |
genuine | -7.345 |
Token | However |
Token ID | 2102 |
Feature activation | +5.25e-02 |
Pos logit contributions | |
various | +21.835 |
disparate | +21.525 |
newer | +21.378 |
modern | +21.098 |
blatant | +21.033 |
Neg logit contributions | |
acy | -12.911 |
u | -12.688 |
aga | -12.620 |
igr | -12.190 |
iev | -11.987 |
Token | , |
Token ID | 11 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
u | +0.046 |
- | +0.043 |
acy | +0.042 |
ia | +0.038 |
aga | +0.037 |
Neg logit contributions | |
disparate | -0.198 |
newer | -0.196 |
various | -0.196 |
blatant | -0.195 |
relentless | -0.195 |
Token | they |
Token ID | 484 |
Feature activation | -5.62e+00 |
Pos logit contributions | |
various | +34.192 |
disparate | +33.625 |
those | +33.279 |
newer | +33.143 |
many | +32.964 |
Neg logit contributions | |
u | -13.317 |
aga | -13.182 |
acy | -13.013 |
ée | -12.939 |
igr | -12.579 |
Token | have |
Token ID | 423 |
Feature activation | -6.43e+00 |
Pos logit contributions | |
disparate | +14.729 |
various | +14.581 |
newer | +14.508 |
blatant | +14.384 |
relentless | +14.284 |
Neg logit contributions | |
u | -10.620 |
acy | -10.359 |
- | -10.088 |
ia | -9.835 |
aga | -9.829 |
Token | done |
Token ID | 1760 |
Feature activation | -5.04e-01 |
Pos logit contributions | |
disparate | +18.227 |
various | +18.080 |
newer | +17.861 |
blatant | +17.791 |
tremendous | +17.762 |
Neg logit contributions | |
u | -10.517 |
acy | -10.224 |
- | -9.748 |
aga | -9.644 |
ia | -9.635 |
Token | so |
Token ID | 523 |
Feature activation | -3.96e+00 |
Pos logit contributions | |
venerable | +0.753 |
disparate | +0.751 |
relentless | +0.746 |
newer | +0.744 |
blatant | +0.731 |
Neg logit contributions | |
- | -1.597 |
u | -1.581 |
acy | -1.532 |
. | -1.517 |
ia | -1.513 |
Token | in |
Token ID | 287 |
Feature activation | -6.34e+00 |
Pos logit contributions | |
disparate | +11.546 |
newer | +11.375 |
various | +11.353 |
blatant | +11.305 |
relentless | +11.272 |
Neg logit contributions | |
u | -6.898 |
acy | -6.639 |
- | -6.627 |
ia | -6.310 |
aga | -6.244 |
Token | teammates |
Token ID | 13107 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
various | +20.194 |
disparate | +20.150 |
relentless | +20.114 |
tremendous | +20.021 |
newer | +19.975 |
Neg logit contributions | |
u | -9.697 |
acy | -9.410 |
- | -8.687 |
ia | -8.648 |
aga | -8.645 |
Token | . |
Token ID | 13 |
Feature activation | -6.25e+00 |
Pos logit contributions | |
- | +6.733 |
. | +6.699 |
u | +6.443 |
ong | +6.154 |
acy | +6.146 |
Neg logit contributions | |
disparate | -5.497 |
venerable | -5.309 |
blatant | -5.269 |
gradual | -5.240 |
anecdotal | -5.229 |
Token |
|
Token ID | 198 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
various | +15.013 |
newer | +14.866 |
disparate | +14.706 |
genuine | +14.631 |
blatant | +14.569 |
Neg logit contributions | |
acy | -11.846 |
u | -11.837 |
aga | -11.268 |
- | -11.147 |
ia | -11.047 |
Token |
|
Token ID | 198 |
Feature activation | -5.79e+00 |
Pos logit contributions | |
- | +4.665 |
. | +4.282 |
u | +4.167 |
ia | +3.626 |
ine | +3.589 |
Neg logit contributions | |
tremend | -12.656 |
mathemat | -12.287 |
hemor | -11.745 |
undermin | -11.613 |
disparate | -11.558 |
Token | However |
Token ID | 4864 |
Feature activation | -2.46e+00 |
Pos logit contributions | |
various | +15.547 |
blatant | +15.512 |
genuine | +15.434 |
newer | +15.402 |
tremendous | +15.365 |
Neg logit contributions | |
acy | -8.070 |
u | -7.622 |
aga | -7.573 |
ong | -7.269 |
illo | -7.189 |
Token | , |
Token ID | 11 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
disparate | +9.328 |
newer | +9.214 |
various | +9.166 |
blatant | +9.162 |
relentless | +9.159 |
Neg logit contributions | |
u | -2.216 |
- | -2.095 |
acy | -2.005 |
ia | -1.838 |
ine | -1.780 |
Token | life |
Token ID | 1204 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
various | +33.694 |
those | +32.831 |
anecdotal | +32.585 |
newer | +32.483 |
many | +32.408 |
Neg logit contributions | |
acy | -13.744 |
u | -12.735 |
aga | -12.373 |
ong | -12.217 |
ée | -12.103 |
Token | comes |
Token ID | 2058 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
- | +2.781 |
u | +2.688 |
. | +2.549 |
acy | +2.518 |
ine | +2.404 |
Neg logit contributions | |
disparate | -3.260 |
blatant | -3.164 |
venerable | -3.151 |
newer | -3.113 |
genuine | -3.104 |
Token | at |
Token ID | 379 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
disparate | +0.472 |
venerable | +0.471 |
blatant | +0.468 |
newer | +0.461 |
totality | +0.458 |
Neg logit contributions | |
u | -0.444 |
- | -0.438 |
acy | -0.416 |
. | -0.412 |
ade | -0.396 |
Token | you |
Token ID | 345 |
Feature activation | -7.83e-02 |
Pos logit contributions | |
disparate | +1.490 |
newer | +1.441 |
venerable | +1.413 |
blatant | +1.407 |
genuine | +1.390 |
Neg logit contributions | |
- | -4.658 |
u | -4.602 |
ia | -4.464 |
acy | -4.418 |
ine | -4.414 |
Token | fast |
Token ID | 3049 |
Feature activation | +2.45e+00 |
Pos logit contributions | |
disparate | +0.195 |
blatant | +0.191 |
newer | +0.190 |
venerable | +0.190 |
anecdotal | +0.189 |
Neg logit contributions | |
- | -0.172 |
u | -0.171 |
acy | -0.165 |
. | -0.163 |
ia | -0.158 |
Token | wisdom |
Token ID | 11501 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
- | +0.491 |
u | +0.470 |
acy | +0.465 |
. | +0.462 |
ine | +0.453 |
Neg logit contributions | |
disparate | -0.262 |
blatant | -0.257 |
relentless | -0.251 |
genuine | -0.248 |
tremendous | -0.247 |
Token | about |
Token ID | 546 |
Feature activation | -7.25e+00 |
Pos logit contributions | |
. | +9.775 |
- | +9.660 |
u | +9.230 |
acy | +8.780 |
ia | +8.558 |
Neg logit contributions | |
disparate | -8.720 |
blatant | -8.524 |
totality | -8.472 |
gradual | -8.417 |
venerable | -8.389 |
Token | dinosaurs |
Token ID | 27199 |
Feature activation | +4.16e+00 |
Pos logit contributions | |
disparate | +20.861 |
various | +20.824 |
newer | +20.700 |
gradual | +20.584 |
genuine | +20.519 |
Neg logit contributions | |
u | -10.863 |
acy | -10.585 |
aga | -9.943 |
ire | -9.844 |
iev | -9.822 |
Token | . |
Token ID | 13 |
Feature activation | -8.01e+00 |
Pos logit contributions | |
. | +10.938 |
- | +10.823 |
u | +10.378 |
ia | +10.080 |
acy | +10.051 |
Neg logit contributions | |
disparate | -7.318 |
blatant | -7.282 |
relentless | -7.141 |
venerable | -7.069 |
stringent | -6.973 |
Token | However |
Token ID | 2102 |
Feature activation | -6.30e-01 |
Pos logit contributions | |
various | +21.352 |
newer | +21.245 |
disparate | +21.013 |
genuine | +20.956 |
modern | +20.893 |
Neg logit contributions | |
u | -11.353 |
acy | -11.333 |
aga | -10.990 |
iev | -10.625 |
ire | -10.511 |
Token | , |
Token ID | 11 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
disparate | +2.378 |
newer | +2.350 |
various | +2.343 |
blatant | +2.339 |
relentless | +2.338 |
Neg logit contributions | |
u | -0.559 |
- | -0.526 |
acy | -0.510 |
ia | -0.464 |
ine | -0.447 |
Token | it |
Token ID | 340 |
Feature activation | -4.22e+00 |
Pos logit contributions | |
various | +34.369 |
newer | +34.034 |
modern | +33.833 |
genuine | +33.533 |
many | +33.350 |
Neg logit contributions | |
u | -13.175 |
acy | -13.146 |
iev | -13.136 |
aga | -12.950 |
ire | -12.085 |
Token | has |
Token ID | 468 |
Feature activation | -4.38e+00 |
Pos logit contributions | |
disparate | +14.255 |
newer | +14.106 |
various | +14.097 |
blatant | +14.028 |
relentless | +13.995 |
Neg logit contributions | |
u | -5.220 |
acy | -4.975 |
- | -4.910 |
ia | -4.606 |
aga | -4.571 |
Token | been |
Token ID | 587 |
Feature activation | -6.24e+00 |
Pos logit contributions | |
disparate | +10.979 |
newer | +10.785 |
various | +10.740 |
blatant | +10.717 |
relentless | +10.685 |
Neg logit contributions | |
u | -9.492 |
- | -9.232 |
acy | -9.189 |
ia | -8.842 |
aga | -8.746 |
Token | hard |
Token ID | 1327 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
disparate | +16.832 |
various | +16.830 |
newer | +16.695 |
blatant | +16.581 |
relentless | +16.566 |
Neg logit contributions | |
u | -10.978 |
acy | -10.728 |
- | -10.356 |
aga | -10.191 |
ia | -10.141 |
Token | to |
Token ID | 284 |
Feature activation | -5.73e+00 |
Pos logit contributions | |
- | +6.116 |
u | +5.778 |
. | +5.570 |
acy | +5.402 |
ia | +5.391 |
Neg logit contributions | |
disparate | -6.406 |
venerable | -6.272 |
blatant | -6.230 |
totality | -6.166 |
newer | -6.157 |
Token | now |
Token ID | 783 |
Feature activation | -7.11e+00 |
Pos logit contributions | |
disparate | +21.896 |
various | +21.833 |
newer | +21.746 |
widespread | +21.684 |
relentless | +21.645 |
Neg logit contributions | |
u | -10.438 |
acy | -10.310 |
aga | -9.729 |
ia | -9.587 |
ire | -9.573 |
Token | a |
Token ID | 257 |
Feature activation | -6.40e+00 |
Pos logit contributions | |
newer | +20.014 |
disparate | +20.003 |
widespread | +19.992 |
various | +19.968 |
relentless | +19.805 |
Neg logit contributions | |
u | -9.994 |
acy | -9.830 |
aga | -9.340 |
ong | -9.244 |
iev | -9.161 |
Token | management |
Token ID | 4542 |
Feature activation | +3.19e+00 |
Pos logit contributions | |
disparate | +17.992 |
newer | +17.850 |
genuine | +17.765 |
blatant | +17.716 |
venerable | +17.672 |
Neg logit contributions | |
u | -10.168 |
acy | -10.029 |
aga | -9.544 |
ia | -9.507 |
- | -9.344 |
Token | priority |
Token ID | 8475 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
- | +9.394 |
u | +8.567 |
. | +8.561 |
acy | +8.374 |
ite | +8.248 |
Neg logit contributions | |
disparate | -5.262 |
blatant | -5.186 |
newer | -5.103 |
sheer | -5.068 |
venerable | -5.065 |
Token | , |
Token ID | 11 |
Feature activation | -8.61e+00 |
Pos logit contributions | |
- | +0.106 |
u | +0.106 |
acy | +0.100 |
. | +0.097 |
ia | +0.090 |
Neg logit contributions | |
disparate | -0.381 |
blatant | -0.375 |
relentless | -0.373 |
venerable | -0.372 |
newer | -0.372 |
Token | but |
Token ID | 475 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
various | +24.110 |
newer | +23.967 |
gradual | +23.729 |
disparate | +23.714 |
widespread | +23.665 |
Neg logit contributions | |
u | -10.208 |
acy | -9.936 |
aga | -9.847 |
ia | -9.444 |
ong | -9.284 |
Token | that |
Token ID | 326 |
Feature activation | -8.15e+00 |
Pos logit contributions | |
various | +34.243 |
widespread | +33.695 |
newer | +33.678 |
many | +33.674 |
those | +33.663 |
Neg logit contributions | |
acy | -12.042 |
u | -11.937 |
aga | -11.548 |
ade | -11.151 |
ong | -11.120 |
Token | push |
Token ID | 4574 |
Feature activation | +6.63e-01 |
Pos logit contributions | |
newer | +24.185 |
various | +24.089 |
disparate | +24.062 |
relentless | +23.997 |
gradual | +23.991 |
Neg logit contributions | |
u | -8.166 |
acy | -7.886 |
aga | -7.691 |
ire | -7.565 |
ia | -7.389 |
Token | began |
Token ID | 2540 |
Feature activation | -4.61e+00 |
Pos logit contributions | |
- | +1.361 |
u | +1.353 |
acy | +1.299 |
ia | +1.244 |
. | +1.237 |
Neg logit contributions | |
disparate | -1.761 |
venerable | -1.724 |
blatant | -1.719 |
newer | -1.708 |
tremendous | -1.699 |
Token | under |
Token ID | 739 |
Feature activation | -4.38e+00 |
Pos logit contributions | |
disparate | +12.980 |
newer | +12.873 |
various | +12.863 |
gradual | +12.777 |
relentless | +12.772 |
Neg logit contributions | |
u | -7.778 |
acy | -7.580 |
- | -7.331 |
aga | -7.160 |
ia | -7.091 |
Token | the |
Token ID | 262 |
Feature activation | -7.70e+00 |
Pos logit contributions | |
disparate | +11.982 |
newer | +11.822 |
various | +11.816 |
blatant | +11.722 |
relentless | +11.716 |
Neg logit contributions | |
u | -8.217 |
acy | -7.978 |
- | -7.875 |
ia | -7.580 |
aga | -7.541 |
Token | five |
Token ID | 1936 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
disparate | +20.005 |
various | +19.767 |
newer | +19.704 |
tremendous | +19.566 |
genuine | +19.507 |
Neg logit contributions | |
u | -9.376 |
acy | -9.259 |
- | -8.602 |
aga | -8.534 |
ia | -8.468 |
Token | kids |
Token ID | 3988 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
disparate | +4.799 |
newer | +4.752 |
blatant | +4.743 |
relentless | +4.741 |
venerable | +4.732 |
Neg logit contributions | |
- | -1.599 |
u | -1.592 |
acy | -1.470 |
ia | -1.382 |
ine | -1.357 |
Token | on |
Token ID | 319 |
Feature activation | -3.87e+00 |
Pos logit contributions | |
- | +0.949 |
u | +0.924 |
. | +0.910 |
acy | +0.874 |
ia | +0.860 |
Neg logit contributions | |
blatant | -1.097 |
disparate | -1.095 |
venerable | -1.094 |
gradual | -1.078 |
newer | -1.078 |
Token | a |
Token ID | 257 |
Feature activation | -5.15e+00 |
Pos logit contributions | |
disparate | +13.055 |
various | +12.892 |
newer | +12.888 |
blatant | +12.804 |
relentless | +12.790 |
Neg logit contributions | |
u | -4.876 |
acy | -4.653 |
- | -4.576 |
ia | -4.317 |
aga | -4.239 |
Token | ship |
Token ID | 4074 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
disparate | +13.839 |
newer | +13.651 |
various | +13.620 |
relentless | +13.544 |
blatant | +13.538 |
Neg logit contributions | |
u | -9.918 |
acy | -9.644 |
- | -9.526 |
ia | -9.181 |
aga | -9.092 |
Token | and |
Token ID | 290 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
- | +6.992 |
. | +6.891 |
u | +6.701 |
ia | +6.312 |
acy | +6.269 |
Neg logit contributions | |
venerable | -5.600 |
blatant | -5.575 |
disparate | -5.511 |
gradual | -5.474 |
anecdotal | -5.457 |
Token | for |
Token ID | 329 |
Feature activation | -6.44e+00 |
Pos logit contributions | |
various | +32.968 |
those | +32.381 |
disparate | +31.900 |
tremendous | +31.631 |
many | +31.630 |
Neg logit contributions | |
acy | -13.030 |
u | -12.830 |
iev | -12.107 |
ong | -11.801 |
ire | -11.682 |
Token | some |
Token ID | 617 |
Feature activation | -3.03e+00 |
Pos logit contributions | |
various | +18.077 |
disparate | +17.918 |
newer | +17.688 |
tremendous | +17.592 |
sheer | +17.563 |
Neg logit contributions | |
u | -10.231 |
acy | -10.166 |
- | -9.462 |
ia | -9.299 |
ong | -9.266 |
Token | reason |
Token ID | 1738 |
Feature activation | -5.04e+00 |
Pos logit contributions | |
disparate | +6.977 |
newer | +6.837 |
various | +6.800 |
blatant | +6.784 |
relentless | +6.771 |
Neg logit contributions | |
u | -7.181 |
- | -7.028 |
acy | -6.984 |
ia | -6.737 |
aga | -6.671 |
Token | they |
Token ID | 484 |
Feature activation | -5.59e+00 |
Pos logit contributions | |
disparate | +16.039 |
various | +15.893 |
newer | +15.845 |
blatant | +15.711 |
relentless | +15.695 |
Neg logit contributions | |
u | -6.867 |
acy | -6.576 |
- | -6.338 |
ia | -6.118 |
aga | -6.092 |
Token | were |
Token ID | 547 |
Feature activation | -8.31e+00 |
Pos logit contributions | |
disparate | +15.110 |
various | +14.979 |
newer | +14.861 |
relentless | +14.775 |
genuine | +14.728 |
Neg logit contributions | |
u | -9.750 |
acy | -9.539 |
- | -9.151 |
ia | -9.062 |
aga | -8.997 |
Token | � |
Token ID | 447 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
- | +15.525 |
. | +15.235 |
u | +14.819 |
ia | +14.103 |
ine | +13.957 |
Neg logit contributions | |
disparate | -8.488 |
gradual | -8.310 |
anecdotal | -8.280 |
venerable | -8.171 |
totality | -8.151 |
Token | � |
Token ID | 247 |
Feature activation | +8.11e+00 |
Pos logit contributions | |
� | +18.271 |
� | +16.423 |
u | +16.323 |
aga | +15.884 |
� | +15.822 |
Neg logit contributions | |
mathemat | -29.689 |
tremend | -29.119 |
anwhile | -28.737 |
theless | -28.545 |
disparate | -28.310 |
Token | s |
Token ID | 82 |
Feature activation | -2.16e+00 |
Pos logit contributions | |
u | +18.428 |
- | +18.237 |
. | +17.529 |
s | +17.214 |
acy | +16.923 |
Neg logit contributions | |
disparate | -13.682 |
gradual | -13.333 |
venerable | -13.267 |
totality | -13.162 |
anecdotal | -13.121 |
Token | monster |
Token ID | 9234 |
Feature activation | +4.79e+00 |
Pos logit contributions | |
disparate | +4.363 |
newer | +4.216 |
blatant | +4.205 |
anecdotal | +4.186 |
venerable | +4.185 |
Neg logit contributions | |
u | -5.863 |
- | -5.817 |
acy | -5.699 |
ia | -5.534 |
aga | -5.490 |
Token | , |
Token ID | 11 |
Feature activation | -7.79e+00 |
Pos logit contributions | |
. | +12.194 |
- | +12.107 |
u | +11.415 |
ia | +10.959 |
acy | +10.898 |
Neg logit contributions | |
disparate | -8.536 |
venerable | -8.350 |
anecdotal | -8.270 |
gradual | -8.171 |
blatant | -8.134 |
Token | and |
Token ID | 290 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
various | +22.085 |
newer | +21.880 |
disparate | +21.861 |
relentless | +21.669 |
tremendous | +21.660 |
Neg logit contributions | |
u | -10.092 |
acy | -9.883 |
ia | -9.366 |
- | -9.358 |
aga | -9.304 |
Token | have |
Token ID | 423 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
various | +33.600 |
newer | +33.212 |
those | +32.951 |
many | +32.946 |
most | +32.331 |
Neg logit contributions | |
acy | -12.116 |
u | -12.052 |
elle | -11.369 |
aga | -11.163 |
igr | -11.036 |
Token | been |
Token ID | 587 |
Feature activation | -6.26e+00 |
Pos logit contributions | |
disparate | +14.493 |
various | +14.441 |
newer | +14.332 |
tremendous | +14.290 |
blatant | +14.236 |
Neg logit contributions | |
u | -8.828 |
acy | -8.577 |
- | -8.365 |
ia | -8.159 |
ine | -8.020 |
Token | popular |
Token ID | 2968 |
Feature activation | +5.80e-02 |
Pos logit contributions | |
various | +18.578 |
disparate | +18.472 |
relentless | +18.409 |
newer | +18.398 |
tremendous | +18.298 |
Neg logit contributions | |
u | -8.740 |
acy | -8.604 |
- | -8.047 |
ia | -7.991 |
aga | -7.932 |
Token | cards |
Token ID | 4116 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
- | +0.114 |
u | +0.114 |
acy | +0.109 |
. | +0.105 |
ia | +0.105 |
Neg logit contributions | |
disparate | -0.158 |
blatant | -0.155 |
venerable | -0.155 |
relentless | -0.154 |
gradual | -0.153 |
Token | to |
Token ID | 284 |
Feature activation | -5.78e+00 |
Pos logit contributions | |
- | +4.380 |
u | +4.322 |
. | +4.141 |
acy | +4.045 |
ia | +3.976 |
Neg logit contributions | |
disparate | -4.560 |
totality | -4.528 |
blatant | -4.464 |
venerable | -4.464 |
gradual | -4.439 |
Token | to |
Token ID | 284 |
Feature activation | -6.14e+00 |
Pos logit contributions | |
- | +3.019 |
u | +2.988 |
. | +2.889 |
ia | +2.787 |
acy | +2.776 |
Neg logit contributions | |
disparate | -3.513 |
blatant | -3.464 |
totality | -3.457 |
venerable | -3.448 |
relentless | -3.429 |
Token | build |
Token ID | 1382 |
Feature activation | -2.54e+00 |
Pos logit contributions | |
disparate | +17.368 |
various | +17.329 |
newer | +17.307 |
tremendous | +17.085 |
genuine | +16.971 |
Neg logit contributions | |
u | -9.787 |
acy | -9.571 |
- | -9.091 |
aga | -8.912 |
ia | -8.906 |
Token | projects |
Token ID | 4493 |
Feature activation | +6.07e-01 |
Pos logit contributions | |
disparate | +6.963 |
blatant | +6.858 |
newer | +6.848 |
relentless | +6.823 |
venerable | +6.809 |
Neg logit contributions | |
u | -4.968 |
- | -4.899 |
acy | -4.753 |
ia | -4.607 |
ine | -4.524 |
Token | . |
Token ID | 13 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
- | +1.277 |
u | +1.258 |
. | +1.239 |
acy | +1.197 |
ia | +1.171 |
Neg logit contributions | |
disparate | -1.537 |
blatant | -1.518 |
venerable | -1.512 |
relentless | -1.509 |
gradual | -1.508 |
Token | However |
Token ID | 2102 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
various | +25.046 |
newer | +24.944 |
modern | +24.371 |
genuine | +24.164 |
disparate | +24.143 |
Neg logit contributions | |
acy | -13.048 |
u | -12.467 |
aga | -12.040 |
iev | -11.919 |
ire | -11.641 |
Token | , |
Token ID | 11 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
disparate | +5.583 |
newer | +5.531 |
various | +5.519 |
blatant | +5.496 |
relentless | +5.481 |
Neg logit contributions | |
u | -1.390 |
acy | -1.312 |
- | -1.281 |
ia | -1.174 |
aga | -1.145 |
Token | I |
Token ID | 314 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
newer | +33.976 |
various | +33.780 |
many | +33.112 |
those | +32.993 |
modern | +32.770 |
Neg logit contributions | |
acy | -12.986 |
u | -12.375 |
aga | -11.381 |
iev | -11.235 |
ade | -11.149 |
Token | am |
Token ID | 716 |
Feature activation | -6.01e+00 |
Pos logit contributions | |
disparate | +4.604 |
newer | +4.499 |
blatant | +4.499 |
venerable | +4.492 |
various | +4.484 |
Neg logit contributions | |
u | -3.046 |
- | -2.975 |
acy | -2.900 |
ia | -2.792 |
ine | -2.745 |
Token | planning |
Token ID | 5410 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
disparate | +17.009 |
newer | +17.006 |
various | +16.886 |
relentless | +16.854 |
genuine | +16.738 |
Neg logit contributions | |
u | -9.448 |
acy | -9.306 |
- | -8.990 |
ia | -8.820 |
aga | -8.749 |
Token | to |
Token ID | 284 |
Feature activation | -6.58e+00 |
Pos logit contributions | |
disparate | +3.375 |
blatant | +3.309 |
venerable | +3.297 |
newer | +3.292 |
relentless | +3.281 |
Neg logit contributions | |
u | -2.134 |
- | -2.090 |
acy | -2.024 |
ia | -1.948 |
ine | -1.915 |
Token | start |
Token ID | 923 |
Feature activation | -4.30e+00 |
Pos logit contributions | |
newer | +18.226 |
various | +18.171 |
disparate | +18.091 |
gradual | +17.824 |
relentless | +17.822 |
Neg logit contributions | |
u | -10.491 |
acy | -10.312 |
aga | -9.776 |
- | -9.761 |
ia | -9.736 |
Token | of |
Token ID | 286 |
Feature activation | -4.67e+00 |
Pos logit contributions | |
- | +17.560 |
u | +16.975 |
acy | +16.754 |
. | +16.561 |
ia | +16.236 |
Neg logit contributions | |
disparate | -11.857 |
newer | -11.575 |
venerable | -11.559 |
relentless | -11.449 |
anecdotal | -11.385 |
Token | blight |
Token ID | 42514 |
Feature activation | +5.23e+00 |
Pos logit contributions | |
disparate | +12.373 |
newer | +12.180 |
various | +12.177 |
blatant | +12.101 |
relentless | +12.063 |
Neg logit contributions | |
u | -9.226 |
acy | -8.944 |
- | -8.863 |
ia | -8.535 |
aga | -8.480 |
Token | � |
Token ID | 447 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
- | +13.019 |
. | +12.867 |
u | +12.259 |
ia | +11.986 |
ine | +11.812 |
Neg logit contributions | |
disparate | -9.692 |
venerable | -9.610 |
blatant | -9.393 |
genuine | -9.383 |
relentless | -9.366 |
Token | � |
Token ID | 251 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
� | +16.865 |
u | +16.745 |
- | +16.373 |
acy | +15.927 |
aga | +15.824 |
Neg logit contributions | |
disparate | -19.866 |
blatant | -19.821 |
newer | -19.374 |
sheer | -19.138 |
venerable | -19.107 |
Token | — |
Token ID | 851 |
Feature activation | -5.62e+00 |
Pos logit contributions | |
- | +4.180 |
u | +4.166 |
acy | +4.009 |
. | +3.994 |
ia | +3.938 |
Neg logit contributions | |
disparate | -4.433 |
venerable | -4.355 |
relentless | -4.311 |
blatant | -4.310 |
newer | -4.302 |
Token | but |
Token ID | 475 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
disparate | +18.104 |
various | +18.090 |
newer | +17.894 |
blatant | +17.722 |
tremendous | +17.646 |
Neg logit contributions | |
u | -6.516 |
acy | -6.240 |
- | -5.959 |
aga | -5.854 |
ia | -5.822 |
Token | the |
Token ID | 262 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
various | +34.229 |
newer | +33.503 |
those | +33.432 |
many | +33.365 |
anecdotal | +33.174 |
Neg logit contributions | |
acy | -12.128 |
u | -11.666 |
ée | -11.293 |
ire | -11.199 |
igr | -11.169 |
Token | decisions |
Token ID | 5370 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
various | +28.241 |
newer | +27.815 |
disparate | +27.675 |
sheer | +27.399 |
blatant | +27.256 |
Neg logit contributions | |
acy | -11.788 |
u | -11.651 |
aga | -10.785 |
ade | -10.579 |
ia | -10.562 |
Token | on |
Token ID | 319 |
Feature activation | -9.06e+00 |
Pos logit contributions | |
disparate | +0.598 |
venerable | +0.586 |
blatant | +0.585 |
relentless | +0.581 |
newer | +0.581 |
Neg logit contributions | |
- | -0.521 |
u | -0.508 |
acy | -0.482 |
. | -0.480 |
ia | -0.479 |
Token | what |
Token ID | 644 |
Feature activation | -7.80e+00 |
Pos logit contributions | |
various | +25.781 |
disparate | +25.211 |
newer | +25.146 |
those | +24.805 |
genuine | +24.690 |
Neg logit contributions | |
acy | -11.170 |
u | -10.943 |
ire | -10.270 |
ade | -9.913 |
aga | -9.880 |
Token | that |
Token ID | 326 |
Feature activation | -6.93e+00 |
Pos logit contributions | |
various | +23.523 |
disparate | +23.304 |
newer | +23.161 |
genuine | +22.963 |
drastic | +22.916 |
Neg logit contributions | |
u | -9.274 |
acy | -8.942 |
ire | -8.384 |
aga | -8.299 |
ine | -8.129 |
Token | , |
Token ID | 11 |
Feature activation | +2.60e+00 |
Pos logit contributions | |
- | +20.532 |
. | +20.240 |
u | +18.875 |
, | +18.121 |
ia | +16.614 |
Neg logit contributions | |
tremend | -29.542 |
mathemat | -27.186 |
hemor | -26.194 |
cumbers | -25.364 |
undermin | -25.032 |
Token | $ |
Token ID | 3 |
Feature activation | +3.31e+00 |
Pos logit contributions | |
- | +3.568 |
u | +3.492 |
. | +3.130 |
ia | +2.973 |
acy | +2.937 |
Neg logit contributions | |
disparate | -8.604 |
relentless | -8.409 |
venerable | -8.399 |
totality | -8.392 |
gradual | -8.375 |
Token | FS |
Token ID | 10652 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
u | +3.217 |
- | +3.081 |
acy | +2.735 |
ia | +2.710 |
. | +2.595 |
Neg logit contributions | |
disparate | -12.033 |
relentless | -11.789 |
gradual | -11.743 |
newer | -11.734 |
venerable | -11.724 |
Token | 2 |
Token ID | 17 |
Feature activation | +9.13e+00 |
Pos logit contributions | |
- | +21.990 |
. | +21.344 |
u | +20.098 |
i | +18.434 |
' | +18.155 |
Neg logit contributions | |
tremend | -34.337 |
mathemat | -32.664 |
hemor | -30.697 |
metic | -29.883 |
undermin | -29.805 |
Token | ,[ |
Token ID | 17414 |
Feature activation | +7.53e+00 |
Pos logit contributions | |
. | +13.894 |
- | +13.865 |
u | +12.333 |
ong | +11.392 |
ag | +11.079 |
Neg logit contributions | |
tremend | -21.453 |
relentless | -21.264 |
venerable | -21.031 |
disparate | -20.967 |
blatant | -20.634 |
Token | System |
Token ID | 11964 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
- | +9.630 |
u | +8.902 |
. | +8.530 |
ia | +7.424 |
id | +7.143 |
Neg logit contributions | |
totality | -21.716 |
tremend | -21.710 |
venerable | -21.688 |
disparate | -21.621 |
mathemat | -21.598 |
Token | . |
Token ID | 13 |
Feature activation | +6.00e+00 |
Pos logit contributions | |
. | +29.345 |
- | +25.396 |
u | +22.545 |
' | +21.679 |
; | +19.853 |
Neg logit contributions | |
tremend | -44.719 |
mathemat | -40.008 |
cumbers | -39.361 |
metic | -38.420 |
eleph | -38.109 |
Token | Draw |
Token ID | 25302 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
- | +6.922 |
u | +6.439 |
. | +6.286 |
ine | +5.411 |
ia | +5.151 |
Neg logit contributions | |
tremend | -20.674 |
mathemat | -20.302 |
venerable | -19.660 |
totality | -19.654 |
gradual | -19.559 |
Token | ing |
Token ID | 278 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
ing | +24.797 |
- | +23.257 |
. | +22.580 |
u | +21.795 |
er | +20.560 |
Neg logit contributions | |
tremend | -44.542 |
mathemat | -40.740 |
cumbers | -40.023 |
metic | -39.119 |
hemor | -38.645 |
Token | . |
Token ID | 13 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
. | +24.319 |
- | +20.993 |
u | +18.182 |
' | +17.597 |
ia | +16.321 |
Neg logit contributions | |
tremend | -39.295 |
mathemat | -35.224 |
hemor | -34.088 |
cumbers | -33.771 |
eleph | -33.585 |
Token | Font |
Token ID | 23252 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
u | +2.307 |
- | +2.248 |
acy | +2.031 |
ia | +2.027 |
ine | +1.990 |
Neg logit contributions | |
disparate | -5.836 |
newer | -5.743 |
relentless | -5.740 |
anecdotal | -5.714 |
totality | -5.711 |
Token | ACLU |
Token ID | 24381 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
disparate | +2.736 |
newer | +2.646 |
various | +2.619 |
blatant | +2.602 |
relentless | +2.591 |
Neg logit contributions | |
u | -7.255 |
- | -7.125 |
acy | -7.110 |
ia | -6.935 |
aga | -6.883 |
Token | of |
Token ID | 286 |
Feature activation | +3.78e+00 |
Pos logit contributions | |
- | +20.902 |
. | +19.656 |
u | +18.865 |
ia | +17.682 |
' | +16.826 |
Neg logit contributions | |
mathemat | -27.366 |
tremend | -27.004 |
cumbers | -24.801 |
misunder | -24.263 |
hemor | -24.118 |
Token | Oregon |
Token ID | 8819 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
- | +10.181 |
. | +9.817 |
u | +9.557 |
ia | +9.239 |
ine | +9.006 |
Neg logit contributions | |
tremend | -7.934 |
mathemat | -7.873 |
disparate | -7.139 |
venerable | -6.997 |
relentless | -6.985 |
Token | (@ |
Token ID | 4275 |
Feature activation | +7.99e+00 |
Pos logit contributions | |
- | +21.466 |
. | +21.195 |
ia | +19.247 |
u | +19.076 |
(@ | +18.947 |
Neg logit contributions | |
tremend | -33.354 |
mathemat | -31.791 |
cumbers | -30.132 |
streng | -28.945 |
hemor | -28.923 |
Token | AC |
Token ID | 2246 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
- | +6.933 |
. | +6.099 |
ac | +6.030 |
u | +5.589 |
acy | +5.358 |
Neg logit contributions | |
tremend | -29.662 |
mathemat | -29.036 |
hemor | -28.442 |
disparate | -27.417 |
totality | -27.357 |
Token | LU |
Token ID | 41596 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
u | +16.396 |
- | +15.370 |
. | +15.305 |
elle | +13.246 |
' | +12.690 |
Neg logit contributions | |
tremend | -34.806 |
mathemat | -33.803 |
hemor | -31.583 |
metic | -31.298 |
cumbers | -30.897 |
Token | _ |
Token ID | 62 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
- | +21.962 |
_ | +21.825 |
. | +20.381 |
u | +19.479 |
' | +17.325 |
Neg logit contributions | |
tremend | -40.470 |
mathemat | -38.258 |
metic | -37.201 |
cumbers | -36.947 |
hemor | -35.952 |
Token | OR |
Token ID | 1581 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
- | +10.636 |
. | +10.303 |
u | +8.754 |
' | +7.758 |
| +7.218 |
Neg logit contributions | |
tremend | -40.712 |
mathemat | -39.364 |
metic | -37.113 |
undermin | -37.071 |
hemor | -36.652 |
Token | ) |
Token ID | 8 |
Feature activation | +5.15e+00 |
Pos logit contributions | |
- | +23.003 |
. | +22.239 |
u | +20.450 |
) | +20.419 |
' | +19.508 |
Neg logit contributions | |
tremend | -41.658 |
mathemat | -39.032 |
hemor | -37.729 |
cumbers | -37.562 |
metic | -37.415 |
Token | May |
Token ID | 1737 |
Feature activation | +7.74e+00 |
Pos logit contributions | |
- | +11.047 |
. | +10.708 |
u | +10.077 |
‐ | +9.389 |
y | +9.154 |
Neg logit contributions | |
tremend | -14.777 |
mathemat | -14.527 |
cumbers | -12.763 |
misunder | -12.651 |
hemor | -12.639 |
Token | 29 |
Token ID | 2808 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
- | +14.346 |
. | +13.701 |
u | +13.505 |
ine | +12.027 |
' | +11.701 |
Neg logit contributions | |
tremend | -19.723 |
mathemat | -19.631 |
cumbers | -18.302 |
disparate | -17.876 |
venerable | -17.635 |
Token | does |
Token ID | 857 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
disparate | +24.418 |
newer | +24.277 |
various | +24.223 |
blatant | +24.046 |
genuine | +23.868 |
Neg logit contributions | |
u | -9.759 |
acy | -9.626 |
aga | -8.986 |
ong | -8.859 |
ade | -8.784 |
Token | not |
Token ID | 407 |
Feature activation | -3.78e+00 |
Pos logit contributions | |
disparate | +2.121 |
relentless | +2.074 |
newer | +2.040 |
blatant | +2.038 |
venerable | +2.022 |
Neg logit contributions | |
u | -4.798 |
- | -4.756 |
acy | -4.638 |
ia | -4.543 |
. | -4.528 |
Token | prove |
Token ID | 5879 |
Feature activation | -2.48e+00 |
Pos logit contributions | |
disparate | +9.721 |
newer | +9.553 |
various | +9.512 |
blatant | +9.486 |
relentless | +9.477 |
Neg logit contributions | |
u | -7.960 |
- | -7.733 |
acy | -7.692 |
ia | -7.385 |
aga | -7.299 |
Token | that |
Token ID | 326 |
Feature activation | -9.53e+00 |
Pos logit contributions | |
disparate | +5.763 |
newer | +5.659 |
venerable | +5.631 |
relentless | +5.617 |
various | +5.595 |
Neg logit contributions | |
u | -5.966 |
- | -5.905 |
acy | -5.767 |
ia | -5.561 |
. | -5.509 |
Token | the |
Token ID | 262 |
Feature activation | -8.85e+00 |
Pos logit contributions | |
various | +27.334 |
disparate | +27.214 |
modern | +27.013 |
genuine | +26.938 |
blatant | +26.885 |
Neg logit contributions | |
u | -10.518 |
acy | -10.402 |
aga | -9.879 |
ong | -9.826 |
ire | -9.434 |
Token | Din |
Token ID | 23448 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
various | +24.966 |
disparate | +24.831 |
newer | +24.547 |
modern | +24.438 |
blatant | +24.409 |
Neg logit contributions | |
u | -10.858 |
acy | -10.717 |
aga | -9.987 |
ong | -9.913 |
ée | -9.761 |
Token | ah |
Token ID | 993 |
Feature activation | +5.17e-01 |
Pos logit contributions | |
ah | +23.208 |
acy | +21.616 |
ab | +21.362 |
u | +21.349 |
- | +21.203 |
Neg logit contributions | |
mathemat | -25.399 |
tremend | -24.390 |
hemor | -24.002 |
behavi | -23.837 |
cumbers | -23.412 |
Token | story |
Token ID | 1621 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
- | +1.416 |
u | +1.393 |
acy | +1.343 |
ia | +1.318 |
. | +1.317 |
Neg logit contributions | |
disparate | -1.011 |
newer | -0.997 |
relentless | -0.990 |
venerable | -0.981 |
blatant | -0.980 |
Token | is |
Token ID | 318 |
Feature activation | -6.19e+00 |
Pos logit contributions | |
- | +4.298 |
u | +4.237 |
. | +3.970 |
acy | +3.950 |
ia | +3.892 |
Neg logit contributions | |
disparate | -5.370 |
relentless | -5.305 |
newer | -5.262 |
venerable | -5.251 |
gradual | -5.216 |
Token | also |
Token ID | 635 |
Feature activation | -4.17e+00 |
Pos logit contributions | |
genuine | +18.244 |
disparate | +18.221 |
newer | +18.112 |
various | +18.097 |
blatant | +18.018 |
Neg logit contributions | |
u | -9.057 |
acy | -8.809 |
- | -8.397 |
ia | -8.251 |
aga | -8.195 |
Token | about |
Token ID | 546 |
Feature activation | -6.35e+00 |
Pos logit contributions | |
disparate | +11.151 |
newer | +10.979 |
various | +10.958 |
blatant | +10.913 |
relentless | +10.876 |
Neg logit contributions | |
u | -8.200 |
acy | -7.931 |
- | -7.912 |
ia | -7.585 |
aga | -7.507 |
Token | to |
Token ID | 284 |
Feature activation | -3.73e+00 |
Pos logit contributions | |
. | +8.006 |
- | +8.004 |
u | +7.618 |
acy | +7.323 |
ia | +7.248 |
Neg logit contributions | |
disparate | -7.425 |
blatant | -7.287 |
newer | -7.212 |
relentless | -7.210 |
gradual | -7.192 |
Token | all |
Token ID | 477 |
Feature activation | -3.74e+00 |
Pos logit contributions | |
disparate | +11.216 |
newer | +11.058 |
various | +11.028 |
blatant | +10.993 |
relentless | +10.968 |
Neg logit contributions | |
u | -6.152 |
- | -5.914 |
acy | -5.904 |
ia | -5.599 |
aga | -5.525 |
Token | others |
Token ID | 1854 |
Feature activation | +9.88e-01 |
Pos logit contributions | |
disparate | +12.480 |
newer | +12.324 |
various | +12.315 |
blatant | +12.224 |
genuine | +12.223 |
Neg logit contributions | |
u | -4.805 |
acy | -4.572 |
- | -4.460 |
ia | -4.232 |
aga | -4.213 |
Token | . |
Token ID | 13 |
Feature activation | -7.38e+00 |
Pos logit contributions | |
- | +1.351 |
. | +1.316 |
u | +1.314 |
acy | +1.214 |
ia | +1.196 |
Neg logit contributions | |
disparate | -3.236 |
gradual | -3.201 |
newer | -3.193 |
blatant | -3.192 |
relentless | -3.190 |
Token | It |
Token ID | 632 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
various | +19.373 |
disparate | +19.153 |
newer | +19.118 |
genuine | +19.117 |
modern | +18.954 |
Neg logit contributions | |
acy | -10.651 |
u | -10.650 |
aga | -10.292 |
- | -9.852 |
ire | -9.842 |
Token | � |
Token ID | 447 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
disparate | +10.543 |
various | +10.421 |
newer | +10.407 |
blatant | +10.358 |
relentless | +10.348 |
Neg logit contributions | |
u | -4.926 |
acy | -4.732 |
- | -4.682 |
ia | -4.446 |
aga | -4.406 |
Token | � |
Token ID | 247 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
u | +20.442 |
� | +19.047 |
- | +19.009 |
� | +18.942 |
� | +18.917 |
Neg logit contributions | |
mathemat | -24.056 |
tremend | -22.998 |
blatant | -22.631 |
disparate | -22.393 |
theless | -22.244 |
Token | s |
Token ID | 82 |
Feature activation | -4.46e+00 |
Pos logit contributions | |
u | +8.031 |
- | +7.852 |
acy | +7.502 |
. | +7.324 |
ine | +7.321 |
Neg logit contributions | |
disparate | -8.998 |
newer | -8.813 |
venerable | -8.783 |
blatant | -8.655 |
gradual | -8.623 |
Token | a |
Token ID | 257 |
Feature activation | -5.96e+00 |
Pos logit contributions | |
disparate | +12.844 |
various | +12.655 |
newer | +12.650 |
blatant | +12.608 |
relentless | +12.589 |
Neg logit contributions | |
u | -7.740 |
acy | -7.446 |
- | -7.395 |
ia | -7.093 |
aga | -7.028 |
Token | narrow |
Token ID | 7135 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
disparate | +17.212 |
blatant | +17.049 |
relentless | +17.012 |
genuine | +16.994 |
newer | +16.960 |
Neg logit contributions | |
u | -9.236 |
acy | -8.990 |
- | -8.598 |
ia | -8.528 |
aga | -8.486 |
Token | , |
Token ID | 11 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
- | +4.821 |
u | +4.625 |
acy | +4.543 |
. | +4.453 |
ia | +4.410 |
Neg logit contributions | |
disparate | -2.561 |
newer | -2.511 |
blatant | -2.475 |
tremendous | -2.445 |
various | -2.435 |
Token | me |
Token ID | 502 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
- | +4.656 |
u | +4.483 |
. | +4.414 |
ine | +4.139 |
id | +4.093 |
Neg logit contributions | |
disparate | -4.280 |
venerable | -4.136 |
relentless | -4.084 |
newer | -4.045 |
gradual | -4.016 |
Token | remember |
Token ID | 3505 |
Feature activation | -3.12e+00 |
Pos logit contributions | |
- | +0.742 |
u | +0.726 |
. | +0.709 |
acy | +0.695 |
ade | +0.679 |
Neg logit contributions | |
disparate | -0.435 |
relentless | -0.415 |
venerable | -0.413 |
blatant | -0.412 |
gradual | -0.411 |
Token | anything |
Token ID | 1997 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
disparate | +8.496 |
relentless | +8.270 |
gradual | +8.269 |
newer | +8.263 |
venerable | +8.252 |
Neg logit contributions | |
u | -6.380 |
- | -6.322 |
acy | -6.044 |
. | -5.906 |
ia | -5.887 |
Token | that |
Token ID | 326 |
Feature activation | -7.18e+00 |
Pos logit contributions | |
disparate | +5.810 |
relentless | +5.667 |
various | +5.644 |
venerable | +5.639 |
gradual | +5.633 |
Neg logit contributions | |
u | -5.657 |
- | -5.622 |
acy | -5.452 |
. | -5.281 |
ia | -5.270 |
Token | preceded |
Token ID | 27165 |
Feature activation | -3.30e+00 |
Pos logit contributions | |
disparate | +23.847 |
newer | +23.823 |
various | +23.690 |
blatant | +23.523 |
venerable | +23.475 |
Neg logit contributions | |
u | -7.373 |
acy | -7.171 |
aga | -6.589 |
ong | -6.384 |
- | -6.310 |
Token | Alfred |
Token ID | 22044 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
disparate | +10.511 |
newer | +10.353 |
various | +10.315 |
blatant | +10.304 |
relentless | +10.291 |
Neg logit contributions | |
u | -4.936 |
- | -4.760 |
acy | -4.688 |
ia | -4.451 |
aga | -4.358 |
Token | o |
Token ID | 78 |
Feature activation | +6.64e+00 |
Pos logit contributions | |
o | +22.543 |
- | +21.525 |
u | +21.346 |
. | +20.920 |
os | +20.528 |
Neg logit contributions | |
mathemat | -24.383 |
tremend | -23.206 |
hemor | -23.077 |
disparate | -22.274 |
behavi | -22.150 |
Token | 's |
Token ID | 338 |
Feature activation | -2.61e+00 |
Pos logit contributions | |
- | +14.585 |
. | +14.167 |
u | +13.912 |
ia | +13.624 |
acy | +13.214 |
Neg logit contributions | |
disparate | -12.848 |
anecdotal | -12.722 |
gradual | -12.687 |
relentless | -12.516 |
totality | -12.418 |
Token | in |
Token ID | 287 |
Feature activation | -4.49e+00 |
Pos logit contributions | |
disparate | +9.797 |
newer | +9.675 |
various | +9.651 |
blatant | +9.636 |
relentless | +9.624 |
Neg logit contributions | |
u | -2.391 |
- | -2.245 |
acy | -2.213 |
ia | -2.004 |
aga | -1.947 |
Token | that |
Token ID | 326 |
Feature activation | -5.93e+00 |
Pos logit contributions | |
disparate | +13.870 |
newer | +13.749 |
various | +13.737 |
blatant | +13.629 |
relentless | +13.579 |
Neg logit contributions | |
u | -6.781 |
acy | -6.532 |
- | -6.398 |
ia | -6.110 |
aga | -6.078 |
Token | spot |
Token ID | 4136 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
disparate | +19.174 |
newer | +19.008 |
various | +18.973 |
blatant | +18.901 |
venerable | +18.884 |
Neg logit contributions | |
u | -7.870 |
acy | -7.459 |
- | -7.153 |
aga | -6.947 |
ia | -6.877 |
Token | old |
Token ID | 727 |
Feature activation | -3.40e+00 |
Pos logit contributions | |
- | +2.868 |
u | +2.859 |
acy | +2.410 |
. | +2.408 |
ine | +2.401 |
Neg logit contributions | |
disparate | -11.649 |
totality | -11.419 |
blatant | -11.408 |
gradual | -11.314 |
mathemat | -11.257 |
Token | under |
Token ID | 739 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
disparate | +9.473 |
newer | +9.335 |
various | +9.308 |
blatant | +9.272 |
relentless | +9.256 |
Neg logit contributions | |
u | -6.320 |
acy | -6.100 |
- | -6.086 |
ia | -5.816 |
aga | -5.752 |
Token | study |
Token ID | 44517 |
Feature activation | +6.55e-01 |
Pos logit contributions | |
- | +4.112 |
u | +3.845 |
. | +3.572 |
ia | +3.522 |
acy | +3.505 |
Neg logit contributions | |
disparate | -5.354 |
totality | -5.227 |
gradual | -5.212 |
blatant | -5.207 |
newer | -5.202 |
Token | , |
Token ID | 11 |
Feature activation | -8.51e+00 |
Pos logit contributions | |
- | +1.401 |
u | +1.381 |
acy | +1.318 |
. | +1.313 |
ia | +1.290 |
Neg logit contributions | |
disparate | -1.687 |
newer | -1.645 |
blatant | -1.640 |
gradual | -1.627 |
relentless | -1.619 |
Token | Norm |
Token ID | 11220 |
Feature activation | +5.06e+00 |
Pos logit contributions | |
various | +23.514 |
venerable | +23.390 |
genuine | +23.217 |
relentless | +23.196 |
newer | +23.178 |
Neg logit contributions | |
u | -10.568 |
acy | -10.494 |
ire | -9.885 |
aga | -9.807 |
ong | -9.666 |
Token | Van |
Token ID | 6656 |
Feature activation | +5.33e+00 |
Pos logit contributions | |
u | +14.136 |
- | +13.736 |
acy | +13.163 |
ia | +13.128 |
ine | +13.056 |
Neg logit contributions | |
disparate | -8.314 |
gradual | -8.197 |
anecdotal | -8.020 |
blatant | -8.010 |
newer | -7.985 |
Token | Brock |
Token ID | 20501 |
Feature activation | +5.73e+00 |
Pos logit contributions | |
- | +14.223 |
u | +14.116 |
. | +13.292 |
aga | +12.946 |
ite | +12.936 |
Neg logit contributions | |
disparate | -9.087 |
blatant | -8.789 |
anecdotal | -8.726 |
newer | -8.706 |
relentless | -8.658 |
Token | lin |
Token ID | 2815 |
Feature activation | +5.21e+00 |
Pos logit contributions | |
u | +11.096 |
- | +10.678 |
. | +10.460 |
ine | +9.549 |
ab | +9.351 |
Neg logit contributions | |
blatant | -14.039 |
gradual | -13.750 |
disparate | -13.718 |
relentless | -13.651 |
drastic | -13.607 |
Token | . |
Token ID | 13 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
- | +11.922 |
. | +11.889 |
u | +11.677 |
acy | +10.944 |
ia | +10.803 |
Neg logit contributions | |
disparate | -10.641 |
gradual | -10.354 |
blatant | -10.218 |
anecdotal | -10.205 |
totality | -10.188 |
Token |
|
Token ID | 198 |
Feature activation | +3.04e+00 |
Pos logit contributions | |
various | +26.253 |
newer | +25.895 |
genuine | +25.579 |
those | +25.515 |
disparate | +25.493 |
Neg logit contributions | |
acy | -12.749 |
igr | -12.329 |
u | -12.129 |
aga | -11.849 |
ire | -11.753 |
Token |
|
Token ID | 198 |
Feature activation | -8.48e+00 |
Pos logit contributions | |
- | +4.349 |
. | +4.001 |
u | +3.991 |
ia | +3.550 |
ine | +3.414 |
Neg logit contributions | |
tremend | -11.290 |
mathemat | -11.063 |
hemor | -10.452 |
disparate | -10.433 |
venerable | -10.413 |
Token | street |
Token ID | 4675 |
Feature activation | +4.08e+00 |
Pos logit contributions | |
various | +27.241 |
newer | +26.625 |
disparate | +26.434 |
venerable | +26.361 |
tremendous | +26.219 |
Neg logit contributions | |
u | -10.613 |
acy | -10.426 |
iev | -9.814 |
ong | -9.621 |
aga | -9.536 |
Token | signs |
Token ID | 5895 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
- | +11.833 |
u | +10.972 |
. | +10.956 |
ia | +10.520 |
ine | +10.512 |
Neg logit contributions | |
disparate | -6.679 |
anecdotal | -6.385 |
gradual | -6.360 |
blatant | -6.242 |
relentless | -6.194 |
Token | dedicated |
Token ID | 7256 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
- | +4.459 |
. | +4.384 |
u | +4.308 |
ia | +4.093 |
ine | +4.054 |
Neg logit contributions | |
disparate | -3.030 |
gradual | -2.951 |
anecdotal | -2.924 |
totality | -2.924 |
relentless | -2.903 |
Token | to |
Token ID | 284 |
Feature activation | -6.92e+00 |
Pos logit contributions | |
- | +4.784 |
u | +4.631 |
. | +4.480 |
ia | +4.375 |
acy | +4.330 |
Neg logit contributions | |
disparate | -7.422 |
anecdotal | -7.310 |
gradual | -7.178 |
tremendous | -7.163 |
totality | -7.163 |
Token | his |
Token ID | 465 |
Feature activation | -4.49e+00 |
Pos logit contributions | |
various | +19.821 |
disparate | +19.738 |
newer | +19.507 |
venerable | +19.330 |
relentless | +19.323 |
Neg logit contributions | |
u | -10.605 |
acy | -10.501 |
- | -9.721 |
aga | -9.652 |
ia | -9.611 |
Token | memory |
Token ID | 4088 |
Feature activation | +3.85e+00 |
Pos logit contributions | |
disparate | +11.944 |
various | +11.769 |
newer | +11.744 |
blatant | +11.673 |
relentless | +11.663 |
Neg logit contributions | |
u | -8.820 |
acy | -8.564 |
- | -8.427 |
ia | -8.132 |
aga | -8.114 |
Token | . |
Token ID | 13 |
Feature activation | -6.96e+00 |
Pos logit contributions | |
. | +9.071 |
- | +8.866 |
u | +8.525 |
acy | +8.130 |
ia | +7.946 |
Neg logit contributions | |
disparate | -8.152 |
gradual | -7.971 |
anecdotal | -7.956 |
totality | -7.896 |
blatant | -7.868 |
Token |
|
Token ID | 198 |
Feature activation | +4.31e+00 |
Pos logit contributions | |
various | +16.887 |
newer | +16.687 |
disparate | +16.540 |
blatant | +16.277 |
genuine | +16.273 |
Neg logit contributions | |
acy | -12.212 |
u | -12.201 |
aga | -11.812 |
- | -11.540 |
ia | -11.392 |
Token |
|
Token ID | 198 |
Feature activation | -5.28e+00 |
Pos logit contributions | |
- | +5.741 |
. | +5.286 |
u | +5.117 |
ia | +4.390 |
ine | +4.295 |
Neg logit contributions | |
tremend | -16.795 |
mathemat | -16.133 |
hemor | -15.457 |
undermin | -15.325 |
cumbers | -15.142 |
Token | Yet |
Token ID | 11486 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
blatant | +13.744 |
various | +13.724 |
disparate | +13.686 |
newer | +13.686 |
widespread | +13.598 |
Neg logit contributions | |
acy | -8.058 |
aga | -7.763 |
u | -7.724 |
illo | -7.294 |
ong | -7.285 |
Token | the |
Token ID | 262 |
Feature activation | -9.68e+00 |
Pos logit contributions | |
various | +30.706 |
newer | +30.497 |
disparate | +30.197 |
blatant | +29.991 |
those | +29.991 |
Neg logit contributions | |
u | -10.223 |
acy | -10.053 |
ée | -9.715 |
aga | -9.442 |
ong | -9.299 |
Token | attention |
Token ID | 3241 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
disparate | +8.367 |
newer | +8.211 |
various | +8.182 |
blatant | +8.147 |
relentless | +8.122 |
Neg logit contributions | |
u | -8.797 |
- | -8.561 |
acy | -8.553 |
ia | -8.252 |
aga | -8.179 |
Token | . |
Token ID | 13 |
Feature activation | -6.52e+00 |
Pos logit contributions | |
. | +7.101 |
- | +6.944 |
u | +6.722 |
acy | +6.300 |
ong | +6.128 |
Neg logit contributions | |
disparate | -7.259 |
venerable | -7.216 |
tremendous | -7.127 |
relentless | -7.051 |
gradual | -7.035 |
Token |
|
Token ID | 198 |
Feature activation | +4.85e+00 |
Pos logit contributions | |
various | +16.824 |
newer | +16.744 |
disparate | +16.548 |
genuine | +16.489 |
blatant | +16.337 |
Neg logit contributions | |
u | -10.814 |
acy | -10.732 |
aga | -10.406 |
- | -10.214 |
ia | -10.140 |
Token |
|
Token ID | 198 |
Feature activation | -5.06e+00 |
Pos logit contributions | |
- | +6.336 |
. | +5.944 |
u | +5.644 |
ia | +4.893 |
ine | +4.750 |
Neg logit contributions | |
tremend | -18.687 |
mathemat | -18.004 |
hemor | -17.236 |
undermin | -16.940 |
cumbers | -16.848 |
Token | The |
Token ID | 464 |
Feature activation | -8.57e+00 |
Pos logit contributions | |
various | +13.958 |
newer | +13.944 |
blatant | +13.904 |
disparate | +13.889 |
genuine | +13.872 |
Neg logit contributions | |
acy | -7.114 |
u | -7.031 |
aga | -6.938 |
ia | -6.617 |
ong | -6.599 |
Token | truth |
Token ID | 3872 |
Feature activation | +4.30e+00 |
Pos logit contributions | |
various | +24.849 |
disparate | +24.811 |
newer | +24.736 |
relentless | +24.649 |
sheer | +24.640 |
Neg logit contributions | |
u | -9.885 |
acy | -9.673 |
aga | -9.372 |
ade | -9.107 |
- | -9.027 |
Token | is |
Token ID | 318 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
- | +9.281 |
u | +9.212 |
. | +8.729 |
acy | +8.677 |
ia | +8.286 |
Neg logit contributions | |
disparate | -9.814 |
venerable | -9.468 |
gradual | -9.375 |
blatant | -9.334 |
newer | -9.318 |
Token | that |
Token ID | 326 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
disparate | +13.033 |
newer | +12.884 |
various | +12.864 |
blatant | +12.816 |
relentless | +12.790 |
Neg logit contributions | |
u | -3.917 |
acy | -3.690 |
- | -3.670 |
ia | -3.403 |
aga | -3.350 |
Token | Bour |
Token ID | 20576 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
various | +30.883 |
newer | +30.328 |
disparate | +30.289 |
genuine | +30.263 |
many | +30.156 |
Neg logit contributions | |
u | -8.936 |
acy | -8.646 |
aga | -8.609 |
ong | -8.231 |
illo | -8.182 |
Token | dain |
Token ID | 27162 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
u | +18.595 |
- | +18.218 |
acy | +18.128 |
id | +17.739 |
. | +17.737 |
Neg logit contributions | |
tremend | -26.890 |
mathemat | -26.221 |
disparate | -25.887 |
cumbers | -25.574 |
hemor | -25.550 |
Token | has |
Token ID | 468 |
Feature activation | -4.40e+00 |
Pos logit contributions | |
- | +8.996 |
u | +8.913 |
acy | +8.620 |
. | +8.503 |
ia | +8.490 |
Neg logit contributions | |
disparate | -7.094 |
venerable | -6.868 |
blatant | -6.829 |
newer | -6.811 |
gradual | -6.807 |
Token | Get |
Token ID | 3855 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
u | +1.269 |
- | +1.244 |
acy | +1.174 |
ia | +1.156 |
ine | +1.144 |
Neg logit contributions | |
disparate | -2.151 |
newer | -2.108 |
venerable | -2.098 |
blatant | -2.087 |
gradual | -2.085 |
Token | Ready |
Token ID | 23432 |
Feature activation | +6.50e+00 |
Pos logit contributions | |
u | +4.949 |
- | +4.904 |
acy | +4.732 |
. | +4.648 |
aga | +4.562 |
Neg logit contributions | |
disparate | -2.689 |
venerable | -2.614 |
blatant | -2.608 |
gradual | -2.587 |
newer | -2.583 |
Token | For |
Token ID | 1114 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
- | +15.695 |
. | +15.251 |
u | +15.124 |
acy | +14.481 |
ia | +14.329 |
Neg logit contributions | |
disparate | -11.439 |
blatant | -10.830 |
gradual | -10.784 |
venerable | -10.742 |
stringent | -10.683 |
Token | Sexy |
Token ID | 49131 |
Feature activation | +3.18e+00 |
Pos logit contributions | |
disparate | +3.981 |
venerable | +3.851 |
newer | +3.835 |
blatant | +3.830 |
relentless | +3.816 |
Neg logit contributions | |
u | -5.608 |
- | -5.507 |
acy | -5.434 |
ia | -5.312 |
aga | -5.249 |
Token | Old |
Token ID | 5706 |
Feature activation | +3.85e+00 |
Pos logit contributions | |
- | +8.800 |
u | +8.652 |
. | +8.502 |
acy | +8.449 |
ia | +8.157 |
Neg logit contributions | |
disparate | -5.744 |
venerable | -5.550 |
blatant | -5.516 |
stringent | -5.444 |
gradual | -5.417 |
Token | Fol |
Token ID | 30938 |
Feature activation | +9.90e+00 |
Pos logit contributions | |
- | +10.974 |
u | +10.563 |
acy | +10.240 |
. | +10.169 |
ia | +9.940 |
Neg logit contributions | |
disparate | -6.829 |
gradual | -6.448 |
blatant | -6.355 |
newer | -6.350 |
anecdotal | -6.347 |
Token | ks |
Token ID | 591 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
- | +17.131 |
u | +17.001 |
acy | +16.073 |
ies | +15.925 |
ia | +15.918 |
Neg logit contributions | |
disparate | -19.359 |
blatant | -19.258 |
genuine | -18.779 |
tremendous | -18.687 |
newer | -18.611 |
Token | � |
Token ID | 447 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
- | +9.193 |
u | +9.128 |
. | +8.920 |
acy | +8.724 |
ia | +8.629 |
Neg logit contributions | |
disparate | -6.839 |
venerable | -6.560 |
blatant | -6.548 |
gradual | -6.523 |
totality | -6.444 |
Token | � |
Token ID | 251 |
Feature activation | +2.76e+00 |
Pos logit contributions | |
� | +16.996 |
- | +16.661 |
u | +16.541 |
acy | +15.764 |
. | +15.694 |
Neg logit contributions | |
disparate | -18.810 |
blatant | -18.530 |
newer | -17.898 |
relentless | -17.871 |
theless | -17.776 |
Token | from |
Token ID | 422 |
Feature activation | -6.18e+00 |
Pos logit contributions | |
- | +6.904 |
u | +6.813 |
. | +6.580 |
acy | +6.517 |
ia | +6.473 |
Neg logit contributions | |
disparate | -5.731 |
venerable | -5.492 |
blatant | -5.470 |
newer | -5.465 |
gradual | -5.459 |
Token | October |
Token ID | 3267 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
various | +17.967 |
disparate | +17.933 |
newer | +17.857 |
venerable | +17.648 |
blatant | +17.614 |
Neg logit contributions | |
u | -9.341 |
acy | -9.113 |
- | -8.842 |
aga | -8.585 |
ia | -8.489 |
Token | Jr |
Token ID | 7504 |
Feature activation | +8.76e+00 |
Pos logit contributions | |
- | +8.242 |
u | +8.097 |
ia | +7.688 |
. | +7.635 |
acy | +7.606 |
Neg logit contributions | |
disparate | -7.163 |
blatant | -6.944 |
newer | -6.927 |
gradual | -6.879 |
venerable | -6.826 |
Token | ., |
Token ID | 1539 |
Feature activation | -3.62e+00 |
Pos logit contributions | |
. | +18.526 |
- | +17.960 |
u | +17.390 |
ia | +16.622 |
acy | +16.580 |
Neg logit contributions | |
disparate | -16.575 |
anecdotal | -15.840 |
gradual | -15.660 |
blatant | -15.650 |
venerable | -15.542 |
Token | 34 |
Token ID | 4974 |
Feature activation | +9.64e+00 |
Pos logit contributions | |
disparate | +6.904 |
newer | +6.731 |
various | +6.688 |
blatant | +6.678 |
relentless | +6.651 |
Neg logit contributions | |
u | -10.065 |
- | -9.862 |
acy | -9.799 |
ia | -9.521 |
aga | -9.430 |
Token |
|
Token ID | 198 |
Feature activation | +5.02e+00 |
Pos logit contributions | |
- | +23.145 |
. | +21.705 |
u | +21.701 |
ia | +20.622 |
acy | +20.304 |
Neg logit contributions | |
disparate | -14.226 |
gradual | -13.714 |
anecdotal | -13.705 |
relentless | -13.590 |
blatant | -13.526 |
Token |
|
Token ID | 198 |
Feature activation | -4.74e+00 |
Pos logit contributions | |
- | +6.493 |
. | +6.029 |
u | +5.692 |
ia | +4.824 |
ine | +4.680 |
Neg logit contributions | |
tremend | -19.563 |
mathemat | -18.777 |
hemor | -17.901 |
undermin | -17.837 |
cumbers | -17.452 |
Token | Edward |
Token ID | 43982 |
Feature activation | +6.62e+00 |
Pos logit contributions | |
various | +13.097 |
disparate | +13.077 |
newer | +13.044 |
relentless | +12.927 |
venerable | +12.905 |
Neg logit contributions | |
acy | -6.949 |
u | -6.938 |
aga | -6.664 |
ire | -6.470 |
ong | -6.411 |
Token | S |
Token ID | 311 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
- | +16.069 |
u | +15.535 |
. | +15.428 |
ia | +14.849 |
ine | +14.595 |
Neg logit contributions | |
disparate | -10.736 |
blatant | -10.728 |
gradual | -10.495 |
relentless | -10.387 |
anecdotal | -10.376 |
Token | otom |
Token ID | 43125 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
. | +16.887 |
- | +16.271 |
acy | +15.811 |
ia | +15.235 |
u | +14.913 |
Neg logit contributions | |
tremend | -22.695 |
relentless | -22.315 |
venerable | -22.078 |
blatant | -22.074 |
mathemat | -22.043 |
Token | ay |
Token ID | 323 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
ay | +20.076 |
u | +19.253 |
- | +18.379 |
ate | +18.084 |
. | +18.060 |
Neg logit contributions | |
tremend | -33.836 |
mathemat | -32.537 |
cumbers | -32.061 |
hemor | -31.604 |
undermin | -31.521 |
Token | or |
Token ID | 273 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
- | +16.870 |
. | +16.600 |
u | +16.569 |
er | +14.860 |
ag | +14.822 |
Neg logit contributions | |
tremend | -32.151 |
mathemat | -30.727 |
behavi | -30.087 |
cumbers | -29.627 |
undermin | -29.000 |
Token | Jr |
Token ID | 7504 |
Feature activation | +8.79e+00 |
Pos logit contributions | |
- | +9.051 |
u | +8.823 |
. | +8.564 |
ia | +8.372 |
acy | +8.219 |
Neg logit contributions | |
disparate | -8.905 |
blatant | -8.758 |
newer | -8.578 |
totality | -8.535 |
relentless | -8.532 |
Token | denounced |
Token ID | 26443 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
disparate | +11.639 |
various | +11.449 |
newer | +11.444 |
relentless | +11.416 |
blatant | +11.400 |
Neg logit contributions | |
u | -8.005 |
acy | -7.801 |
- | -7.678 |
ia | -7.399 |
aga | -7.344 |
Token | as |
Token ID | 355 |
Feature activation | -5.75e+00 |
Pos logit contributions | |
- | +6.235 |
. | +6.212 |
u | +5.846 |
ine | +5.525 |
ite | +5.501 |
Neg logit contributions | |
disparate | -5.454 |
newer | -5.398 |
gradual | -5.296 |
anecdotal | -5.288 |
venerable | -5.252 |
Token | Gr |
Token ID | 1902 |
Feature activation | +6.72e+00 |
Pos logit contributions | |
disparate | +17.423 |
various | +17.221 |
blatant | +17.169 |
relentless | +17.158 |
newer | +17.096 |
Neg logit contributions | |
u | -8.598 |
acy | -8.233 |
- | -8.008 |
ia | -7.736 |
aga | -7.673 |
Token | inch |
Token ID | 8589 |
Feature activation | +5.12e+00 |
Pos logit contributions | |
u | +10.777 |
- | +10.737 |
. | +10.329 |
ine | +10.312 |
acy | +10.311 |
Neg logit contributions | |
totality | -17.906 |
disparate | -17.787 |
gradual | -17.204 |
newer | -17.200 |
proactive | -17.076 |
Token | - |
Token ID | 12 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
- | +14.884 |
u | +14.112 |
. | +14.079 |
ia | +13.805 |
ite | +13.639 |
Neg logit contributions | |
disparate | -7.777 |
venerable | -7.334 |
newer | -7.286 |
anecdotal | -7.212 |
gradual | -7.021 |
Token | like |
Token ID | 2339 |
Feature activation | -1.93e-01 |
Pos logit contributions | |
u | +3.012 |
- | +2.975 |
acy | +2.775 |
ine | +2.703 |
ia | +2.696 |
Neg logit contributions | |
disparate | -6.161 |
newer | -6.004 |
anecdotal | -5.953 |
venerable | -5.951 |
gradual | -5.909 |
Token | heat |
Token ID | 4894 |
Feature activation | +6.51e+00 |
Pos logit contributions | |
disparate | +0.619 |
newer | +0.610 |
venerable | +0.603 |
gradual | +0.599 |
various | +0.599 |
Neg logit contributions | |
- | -0.294 |
u | -0.286 |
. | -0.272 |
acy | -0.267 |
ia | -0.259 |
Token | hens |
Token ID | 5135 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
- | +15.241 |
. | +13.912 |
u | +13.053 |
ong | +13.037 |
ia | +12.648 |
Neg logit contributions | |
disparate | -12.458 |
venerable | -12.197 |
newer | -11.977 |
anecdotal | -11.899 |
theless | -11.848 |
Token | . |
Token ID | 13 |
Feature activation | -7.08e+00 |
Pos logit contributions | |
- | +4.158 |
. | +4.039 |
u | +4.034 |
acy | +3.774 |
ia | +3.773 |
Neg logit contributions | |
disparate | -4.629 |
newer | -4.520 |
venerable | -4.498 |
anecdotal | -4.484 |
gradual | -4.478 |
Token |
|
Token ID | 198 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
various | +17.840 |
disparate | +17.540 |
newer | +17.537 |
blatant | +17.433 |
genuine | +17.396 |
Neg logit contributions | |
acy | -12.103 |
u | -11.975 |
aga | -11.433 |
- | -11.142 |
ia | -11.104 |
Token |
|
Token ID | 198 |
Feature activation | -5.40e+00 |
Pos logit contributions | |
- | +4.943 |
. | +4.576 |
u | +4.444 |
ia | +3.834 |
ine | +3.782 |
Neg logit contributions | |
tremend | -13.639 |
mathemat | -13.245 |
hemor | -12.624 |
undermin | -12.469 |
disparate | -12.390 |
Token | Jenkins |
Token ID | 21835 |
Feature activation | +8.70e+00 |
Pos logit contributions | |
- | +15.465 |
u | +14.919 |
. | +14.758 |
ia | +14.501 |
ine | +14.252 |
Neg logit contributions | |
disparate | -9.598 |
gradual | -9.558 |
relentless | -9.385 |
tremendous | -9.331 |
blatant | -9.316 |
Token |
|
Token ID | 198 |
Feature activation | +3.92e+00 |
Pos logit contributions | |
- | +19.916 |
u | +19.191 |
. | +18.851 |
ong | +18.449 |
ia | +18.053 |
Neg logit contributions | |
disparate | -15.169 |
tremendous | -14.525 |
blatant | -14.383 |
relentless | -14.182 |
totality | -14.177 |
Token |
|
Token ID | 198 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
- | +5.261 |
. | +4.832 |
u | +4.607 |
ine | +3.994 |
ia | +3.950 |
Neg logit contributions | |
tremend | -15.221 |
mathemat | -14.470 |
hemor | -13.966 |
undermin | -13.715 |
cumbers | -13.465 |
Token | The |
Token ID | 464 |
Feature activation | -5.92e+00 |
Pos logit contributions | |
disparate | +10.114 |
newer | +10.031 |
various | +10.020 |
blatant | +9.995 |
genuine | +9.955 |
Neg logit contributions | |
u | -6.176 |
acy | -6.118 |
- | -5.855 |
aga | -5.755 |
ia | -5.699 |
Token | art |
Token ID | 1242 |
Feature activation | +5.80e+00 |
Pos logit contributions | |
disparate | +16.672 |
various | +16.564 |
newer | +16.513 |
blatant | +16.450 |
venerable | +16.428 |
Neg logit contributions | |
u | -9.863 |
acy | -9.678 |
- | -9.291 |
aga | -9.024 |
ia | -8.966 |
Token | of |
Token ID | 286 |
Feature activation | -4.21e+00 |
Pos logit contributions | |
- | +15.844 |
u | +15.026 |
. | +14.365 |
ia | +14.118 |
ite | +13.982 |
Neg logit contributions | |
disparate | -8.860 |
blatant | -8.677 |
relentless | -8.589 |
newer | -8.409 |
anecdotal | -8.404 |
Token | Ancient |
Token ID | 13406 |
Feature activation | +5.92e+00 |
Pos logit contributions | |
disparate | +10.636 |
newer | +10.454 |
various | +10.404 |
blatant | +10.371 |
relentless | +10.346 |
Neg logit contributions | |
u | -9.066 |
- | -8.816 |
acy | -8.772 |
ia | -8.444 |
aga | -8.345 |
Token | Greece |
Token ID | 10315 |
Feature activation | +5.24e+00 |
Pos logit contributions | |
- | +15.988 |
u | +14.558 |
. | +14.553 |
ong | +14.110 |
ia | +14.051 |
Neg logit contributions | |
disparate | -9.083 |
drastic | -8.899 |
newer | -8.839 |
stringent | -8.838 |
anecdotal | -8.761 |
Token | focused |
Token ID | 5670 |
Feature activation | +8.38e-01 |
Pos logit contributions | |
- | +12.756 |
. | +12.144 |
u | +12.012 |
ia | +11.697 |
ite | +11.285 |
Neg logit contributions | |
disparate | -9.609 |
totality | -9.261 |
relentless | -9.173 |
blatant | -9.143 |
newer | -9.112 |
Token | un |
Token ID | 555 |
Feature activation | +6.52e+00 |
Pos logit contributions | |
- | +2.082 |
u | +1.992 |
. | +1.965 |
acy | +1.932 |
ia | +1.891 |
Neg logit contributions | |
disparate | -1.789 |
newer | -1.749 |
blatant | -1.743 |
venerable | -1.736 |
anecdotal | -1.726 |
Token | ash |
Token ID | 1077 |
Feature activation | +7.05e+00 |
Pos logit contributions | |
- | +13.217 |
u | +12.231 |
acy | +12.214 |
id | +11.944 |
ire | +11.603 |
Neg logit contributions | |
disparate | -14.608 |
anecdotal | -14.538 |
gradual | -14.317 |
totality | -14.268 |
genuine | -14.196 |
Token | on |
Token ID | 319 |
Feature activation | -3.18e+00 |
Pos logit contributions | |
- | +6.518 |
u | +6.313 |
. | +6.186 |
acy | +6.102 |
ite | +5.980 |
Neg logit contributions | |
disparate | -5.082 |
venerable | -4.967 |
gradual | -4.925 |
blatant | -4.916 |
newer | -4.910 |
Token | cell |
Token ID | 2685 |
Feature activation | +7.71e+00 |
Pos logit contributions | |
disparate | +7.016 |
newer | +6.864 |
blatant | +6.835 |
relentless | +6.816 |
various | +6.801 |
Neg logit contributions | |
u | -7.908 |
- | -7.737 |
acy | -7.656 |
ia | -7.421 |
aga | -7.356 |
Token | phones |
Token ID | 9512 |
Feature activation | +2.99e+00 |
Pos logit contributions | |
- | +19.173 |
u | +18.222 |
. | +17.370 |
ia | +17.341 |
acy | +17.254 |
Neg logit contributions | |
disparate | -12.502 |
blatant | -12.009 |
relentless | -11.916 |
venerable | -11.642 |
gradual | -11.552 |
Token | and |
Token ID | 290 |
Feature activation | -7.95e+00 |
Pos logit contributions | |
- | +7.584 |
u | +7.282 |
. | +7.242 |
acy | +7.045 |
ia | +7.017 |
Neg logit contributions | |
disparate | -5.894 |
gradual | -5.813 |
venerable | -5.726 |
relentless | -5.653 |
drastic | -5.618 |
Token | a |
Token ID | 257 |
Feature activation | -5.41e+00 |
Pos logit contributions | |
various | +23.039 |
newer | +22.651 |
disparate | +22.615 |
genuine | +22.245 |
anecdotal | +22.124 |
Neg logit contributions | |
u | -10.503 |
acy | -10.268 |
ire | -9.758 |
ia | -9.702 |
iev | -9.664 |
Token | woman |
Token ID | 2415 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
disparate | +14.847 |
newer | +14.787 |
various | +14.673 |
relentless | +14.549 |
genuine | +14.544 |
Neg logit contributions | |
u | -9.601 |
acy | -9.367 |
- | -9.118 |
ia | -8.882 |
aga | -8.822 |
Token | clutching |
Token ID | 48281 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
- | +7.115 |
u | +6.934 |
ia | +6.662 |
. | +6.637 |
acy | +6.609 |
Neg logit contributions | |
disparate | -5.120 |
venerable | -4.918 |
gradual | -4.913 |
blatant | -4.900 |
tremendous | -4.850 |
Token | an |
Token ID | 281 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
- | +6.046 |
u | +5.925 |
. | +5.741 |
acy | +5.729 |
ia | +5.615 |
Neg logit contributions | |
disparate | -2.301 |
gradual | -2.283 |
venerable | -2.249 |
blatant | -2.239 |
relentless | -2.184 |
Token | envelope |
Token ID | 22878 |
Feature activation | +5.76e+00 |
Pos logit contributions | |
disparate | +7.463 |
various | +7.338 |
newer | +7.333 |
blatant | +7.257 |
relentless | +7.232 |
Neg logit contributions | |
u | -8.856 |
acy | -8.632 |
- | -8.600 |
ia | -8.339 |
aga | -8.295 |
Token | of |
Token ID | 286 |
Feature activation | -4.00e+00 |
Pos logit contributions | |
- | +15.051 |
. | +14.297 |
u | +14.195 |
acy | +13.667 |
ia | +13.419 |
Neg logit contributions | |
disparate | -9.038 |
gradual | -9.011 |
anecdotal | -8.651 |
relentless | -8.615 |
venerable | -8.605 |
Token | cash |
Token ID | 5003 |
Feature activation | +4.51e+00 |
Pos logit contributions | |
disparate | +8.670 |
newer | +8.514 |
various | +8.509 |
blatant | +8.436 |
relentless | +8.405 |
Neg logit contributions | |
u | -9.870 |
acy | -9.617 |
- | -9.594 |
ia | -9.289 |
aga | -9.212 |
Token | � |
Token ID | 114 |
Feature activation | +5.23e+00 |
Pos logit contributions | |
u | +3.949 |
� | +3.509 |
- | +3.369 |
acy | +3.301 |
ia | +3.037 |
Neg logit contributions | |
disparate | -17.498 |
venerable | -17.252 |
newer | -17.193 |
blatant | -17.154 |
relentless | -17.017 |
Token | д |
Token ID | 43666 |
Feature activation | +5.22e+00 |
Pos logit contributions | |
- | +10.119 |
u | +9.988 |
. | +9.821 |
ia | +9.651 |
acy | +9.550 |
Neg logit contributions | |
disparate | -12.484 |
anecdotal | -12.163 |
venerable | -12.160 |
totality | -12.101 |
blatant | -12.100 |
Token | а |
Token ID | 16142 |
Feature activation | +3.45e+00 |
Pos logit contributions | |
- | +10.145 |
u | +9.916 |
. | +9.792 |
ia | +9.570 |
acy | +9.095 |
Neg logit contributions | |
disparate | -12.389 |
blatant | -12.215 |
relentless | -12.121 |
venerable | -11.972 |
anecdotal | -11.934 |
Token | е |
Token ID | 16843 |
Feature activation | +5.09e+00 |
Pos logit contributions | |
- | +6.230 |
. | +6.001 |
u | +5.963 |
ia | +5.462 |
acy | +5.428 |
Neg logit contributions | |
disparate | -9.505 |
venerable | -9.345 |
relentless | -9.221 |
newer | -9.166 |
totality | -9.127 |
Token | т |
Token ID | 20375 |
Feature activation | +2.97e+00 |
Pos logit contributions | |
- | +9.704 |
. | +9.585 |
u | +9.474 |
ia | +8.734 |
acy | +8.685 |
Neg logit contributions | |
venerable | -12.134 |
disparate | -12.113 |
totality | -11.954 |
anecdotal | -11.828 |
blatant | -11.827 |
Token | � |
Token ID | 12466 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
- | +5.791 |
u | +5.711 |
. | +5.612 |
ia | +5.308 |
acy | +5.265 |
Neg logit contributions | |
disparate | -7.822 |
venerable | -7.651 |
blatant | -7.549 |
anecdotal | -7.513 |
relentless | -7.508 |
Token | � |
Token ID | 116 |
Feature activation | +5.33e+00 |
Pos logit contributions | |
u | +2.725 |
- | +2.486 |
� | +2.336 |
acy | +2.280 |
ia | +2.262 |
Neg logit contributions | |
disparate | -11.432 |
newer | -11.241 |
venerable | -11.194 |
relentless | -11.133 |
blatant | -11.089 |
Token | � |
Token ID | 141 |
Feature activation | +8.91e+00 |
Pos logit contributions | |
- | +11.693 |
. | +11.199 |
u | +11.121 |
ia | +10.453 |
acy | +10.185 |
Neg logit contributions | |
disparate | -11.229 |
venerable | -11.014 |
gradual | -10.827 |
anecdotal | -10.755 |
relentless | -10.741 |
Token | � |
Token ID | 227 |
Feature activation | +4.41e+00 |
Pos logit contributions | |
u | +12.873 |
ia | +12.235 |
- | +12.214 |
acy | +11.847 |
. | +11.767 |
Neg logit contributions | |
disparate | -20.369 |
newer | -19.948 |
relentless | -19.824 |
gradual | -19.797 |
blatant | -19.766 |
Token | � |
Token ID | 12466 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
- | +10.385 |
. | +10.183 |
u | +10.037 |
acy | +9.374 |
ia | +9.298 |
Neg logit contributions | |
disparate | -9.253 |
venerable | -8.898 |
gradual | -8.890 |
relentless | -8.889 |
blatant | -8.858 |
Token | � |
Token ID | 111 |
Feature activation | +4.63e+00 |
Pos logit contributions | |
u | +3.663 |
- | +3.321 |
� | +3.281 |
ia | +3.139 |
acy | +3.083 |
Neg logit contributions | |
disparate | -12.863 |
newer | -12.596 |
venerable | -12.567 |
relentless | -12.518 |
blatant | -12.496 |
Token | thieves |
Token ID | 26655 |
Feature activation | +6.27e+00 |
Pos logit contributions | |
- | +11.462 |
. | +11.138 |
u | +10.562 |
acy | +10.431 |
ite | +10.082 |
Neg logit contributions | |
venerable | -7.194 |
gradual | -6.961 |
disparate | -6.937 |
theless | -6.781 |
relentless | -6.766 |
Token | tends |
Token ID | 12444 |
Feature activation | +3.88e+00 |
Pos logit contributions | |
- | +16.327 |
. | +16.010 |
u | +15.591 |
ia | +15.223 |
acy | +14.927 |
Neg logit contributions | |
venerable | -9.502 |
disparate | -9.471 |
totality | -8.954 |
tremendous | -8.928 |
gradual | -8.869 |
Token | to |
Token ID | 284 |
Feature activation | -3.10e+00 |
Pos logit contributions | |
- | +8.391 |
u | +8.376 |
acy | +8.058 |
. | +7.877 |
ia | +7.870 |
Neg logit contributions | |
disparate | -8.819 |
venerable | -8.687 |
newer | -8.546 |
blatant | -8.514 |
relentless | -8.492 |
Token | rise |
Token ID | 4485 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
disparate | +5.760 |
venerable | +5.556 |
newer | +5.546 |
blatant | +5.528 |
relentless | +5.515 |
Neg logit contributions | |
u | -8.944 |
- | -8.816 |
acy | -8.687 |
ia | -8.465 |
ine | -8.363 |
Token | in |
Token ID | 287 |
Feature activation | -3.50e+00 |
Pos logit contributions | |
- | +7.259 |
. | +7.102 |
u | +6.938 |
acy | +6.749 |
ite | +6.562 |
Neg logit contributions | |
disparate | -4.464 |
venerable | -4.459 |
blatant | -4.316 |
totality | -4.310 |
relentless | -4.266 |
Token | the |
Token ID | 262 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
disparate | +7.879 |
newer | +7.665 |
venerable | +7.649 |
relentless | +7.633 |
blatant | +7.621 |
Neg logit contributions | |
u | -8.639 |
- | -8.580 |
acy | -8.436 |
ia | -8.141 |
ine | -8.041 |
Token | Tampa |
Token ID | 15528 |
Feature activation | +9.60e+00 |
Pos logit contributions | |
disparate | +12.035 |
newer | +11.863 |
various | +11.833 |
blatant | +11.743 |
relentless | +11.726 |
Neg logit contributions | |
u | -10.930 |
acy | -10.608 |
- | -10.534 |
ia | -10.185 |
aga | -10.134 |
Token | Bay |
Token ID | 4696 |
Feature activation | +6.62e+00 |
Pos logit contributions | |
- | +22.380 |
. | +19.694 |
ia | +18.665 |
u | +18.372 |
acy | +18.235 |
Neg logit contributions | |
theless | -15.143 |
blatant | -13.478 |
newer | -13.224 |
disparate | -13.191 |
sheer | -13.136 |
Token | area |
Token ID | 1989 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
- | +14.377 |
. | +13.470 |
u | +12.568 |
acy | +12.508 |
ite | +12.342 |
Neg logit contributions | |
theless | -12.935 |
disparate | -12.579 |
blatant | -12.357 |
newer | -12.257 |
venerable | -12.243 |
Token | each |
Token ID | 1123 |
Feature activation | +6.61e-02 |
Pos logit contributions | |
. | +5.756 |
- | +5.717 |
u | +5.469 |
acy | +5.319 |
ia | +5.187 |
Neg logit contributions | |
disparate | -5.227 |
venerable | -5.181 |
blatant | -5.045 |
relentless | -4.993 |
tremendous | -4.970 |
Token | spring |
Token ID | 6076 |
Feature activation | +5.55e+00 |
Pos logit contributions | |
- | +0.181 |
u | +0.175 |
. | +0.169 |
acy | +0.169 |
ine | +0.165 |
Neg logit contributions | |
disparate | -0.132 |
venerable | -0.126 |
relentless | -0.126 |
gradual | -0.126 |
blatant | -0.126 |
Token | with |
Token ID | 351 |
Feature activation | -7.21e+00 |
Pos logit contributions | |
- | +8.253 |
u | +7.918 |
. | +7.774 |
ia | +7.497 |
acy | +7.367 |
Neg logit contributions | |
disparate | -9.948 |
venerable | -9.883 |
blatant | -9.782 |
totality | -9.777 |
relentless | -9.726 |
Token | a |
Token ID | 257 |
Feature activation | -6.41e+00 |
Pos logit contributions | |
various | +22.180 |
disparate | +22.067 |
newer | +21.810 |
blatant | +21.504 |
venerable | +21.470 |
Neg logit contributions | |
u | -9.746 |
acy | -9.360 |
- | -8.753 |
ia | -8.710 |
aga | -8.668 |
Token | couple |
Token ID | 3155 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
disparate | +18.358 |
newer | +18.123 |
various | +18.103 |
blatant | +17.902 |
venerable | +17.848 |
Neg logit contributions | |
u | -10.378 |
acy | -10.160 |
- | -9.639 |
ia | -9.558 |
aga | -9.472 |
Token | of |
Token ID | 286 |
Feature activation | -7.77e+00 |
Pos logit contributions | |
- | +0.555 |
u | +0.541 |
acy | +0.520 |
. | +0.513 |
ia | +0.498 |
Neg logit contributions | |
relentless | -0.603 |
disparate | -0.599 |
gradual | -0.595 |
tremendous | -0.594 |
blatant | -0.592 |
Token | districts |
Token ID | 12815 |
Feature activation | +4.53e+00 |
Pos logit contributions | |
disparate | +23.445 |
various | +23.332 |
newer | +23.143 |
venerable | +22.807 |
blatant | +22.801 |
Neg logit contributions | |
u | -10.061 |
acy | -9.749 |
aga | -9.108 |
ia | -9.095 |
ong | -8.982 |
Token | in |
Token ID | 287 |
Feature activation | -6.44e+00 |
Pos logit contributions | |
- | +11.584 |
. | +11.357 |
u | +10.836 |
ia | +10.476 |
acy | +10.472 |
Neg logit contributions | |
disparate | -7.770 |
venerable | -7.764 |
relentless | -7.732 |
gradual | -7.727 |
totality | -7.692 |
Token | other |
Token ID | 584 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
various | +19.263 |
disparate | +19.204 |
newer | +18.992 |
blatant | +18.758 |
genuine | +18.630 |
Neg logit contributions | |
u | -9.438 |
acy | -8.939 |
- | -8.500 |
ong | -8.424 |
aga | -8.415 |
Token | states |
Token ID | 2585 |
Feature activation | +3.04e+00 |
Pos logit contributions | |
disparate | +3.367 |
relentless | +3.339 |
newer | +3.293 |
gradual | +3.284 |
tremendous | +3.273 |
Neg logit contributions | |
- | -5.169 |
u | -5.107 |
acy | -4.973 |
ia | -4.863 |
. | -4.845 |
Token | .) |
Token ID | 2014 |
Feature activation | -6.07e+00 |
Pos logit contributions | |
- | +7.119 |
. | +6.995 |
u | +6.826 |
ia | +6.581 |
acy | +6.470 |
Neg logit contributions | |
disparate | -6.510 |
venerable | -6.506 |
totality | -6.470 |
relentless | -6.411 |
gradual | -6.390 |
Token |
|
Token ID | 198 |
Feature activation | +3.83e+00 |
Pos logit contributions | |
various | +16.221 |
newer | +16.173 |
disparate | +16.166 |
blatant | +15.925 |
genuine | +15.859 |
Neg logit contributions | |
u | -10.248 |
acy | -10.015 |
aga | -9.604 |
- | -9.542 |
ia | -9.389 |
Token |
|
Token ID | 198 |
Feature activation | -5.88e+00 |
Pos logit contributions | |
- | +5.195 |
. | +4.793 |
u | +4.636 |
ia | +4.024 |
ine | +3.976 |
Neg logit contributions | |
tremend | -14.815 |
mathemat | -14.326 |
hemor | -13.664 |
undermin | -13.550 |
cumbers | -13.311 |
Token | The |
Token ID | 383 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
various | +23.640 |
newer | +23.210 |
disparate | +22.792 |
genuine | +22.693 |
modern | +22.660 |
Neg logit contributions | |
acy | -12.059 |
u | -11.873 |
aga | -11.464 |
iev | -11.156 |
ong | -11.043 |
Token | gem |
Token ID | 16840 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
various | +28.168 |
newer | +27.640 |
disparate | +27.239 |
modern | +27.210 |
genuine | +27.088 |
Neg logit contributions | |
acy | -11.380 |
u | -11.228 |
ache | -10.363 |
aga | -10.279 |
ong | -10.237 |
Token | of |
Token ID | 286 |
Feature activation | -7.00e+00 |
Pos logit contributions | |
- | +8.106 |
u | +7.939 |
acy | +7.471 |
ine | +7.464 |
ia | +7.402 |
Neg logit contributions | |
disparate | -6.339 |
relentless | -6.140 |
blatant | -6.079 |
anecdotal | -6.062 |
venerable | -6.000 |
Token | the |
Token ID | 262 |
Feature activation | -7.81e+00 |
Pos logit contributions | |
various | +19.006 |
disparate | +18.954 |
newer | +18.735 |
genuine | +18.593 |
tremendous | +18.513 |
Neg logit contributions | |
u | -11.469 |
acy | -11.343 |
- | -10.780 |
aga | -10.571 |
ia | -10.555 |
Token | collection |
Token ID | 4947 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
various | +21.308 |
disparate | +21.049 |
newer | +21.032 |
venerable | +20.826 |
genuine | +20.814 |
Neg logit contributions | |
u | -11.720 |
acy | -11.575 |
aga | -10.810 |
ong | -10.694 |
ade | -10.597 |
Token | is |
Token ID | 318 |
Feature activation | -6.78e+00 |
Pos logit contributions | |
- | +2.192 |
u | +2.136 |
acy | +2.032 |
. | +2.016 |
ia | +1.938 |
Neg logit contributions | |
disparate | -3.900 |
relentless | -3.851 |
blatant | -3.806 |
gradual | -3.806 |
newer | -3.801 |
Token | a |
Token ID | 257 |
Feature activation | -6.52e+00 |
Pos logit contributions | |
various | +19.438 |
disparate | +19.193 |
newer | +19.161 |
genuine | +19.030 |
venerable | +18.899 |
Neg logit contributions | |
u | -9.946 |
acy | -9.768 |
- | -9.267 |
ia | -9.069 |
aga | -9.024 |
Token | blue |
Token ID | 4171 |
Feature activation | +4.99e+00 |
Pos logit contributions | |
disparate | +19.180 |
newer | +19.155 |
various | +19.114 |
genuine | +19.060 |
tremendous | +18.995 |
Neg logit contributions | |
u | -9.214 |
acy | -9.179 |
- | -8.422 |
aga | -8.286 |
ia | -8.264 |
Token | five |
Token ID | 1936 |
Feature activation | +3.79e+00 |
Pos logit contributions | |
- | +14.347 |
u | +13.058 |
. | +12.899 |
ia | +12.749 |
ade | +12.457 |
Neg logit contributions | |
disparate | -7.793 |
anecdotal | -7.268 |
relentless | -7.239 |
blatant | -7.167 |
venerable | -7.083 |
Token | - |
Token ID | 12 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
- | +9.185 |
u | +8.483 |
. | +8.026 |
acy | +7.990 |
ia | +7.926 |
Neg logit contributions | |
disparate | -8.368 |
relentless | -8.177 |
blatant | -8.138 |
newer | -8.128 |
venerable | -8.051 |
Token | store |
Token ID | 8095 |
Feature activation | +7.62e+00 |
Pos logit contributions | |
- | +3.092 |
u | +3.080 |
acy | +2.854 |
ia | +2.775 |
ong | +2.760 |
Neg logit contributions | |
disparate | -6.627 |
newer | -6.498 |
totality | -6.471 |
blatant | -6.461 |
relentless | -6.456 |
Token | about |
Token ID | 546 |
Feature activation | -7.70e+00 |
Pos logit contributions | |
disparate | +1.389 |
venerable | +1.360 |
blatant | +1.359 |
relentless | +1.353 |
newer | +1.352 |
Neg logit contributions | |
- | -1.020 |
u | -0.983 |
. | -0.961 |
acy | -0.924 |
ia | -0.911 |
Token | Tyson |
Token ID | 27320 |
Feature activation | +5.21e+00 |
Pos logit contributions | |
various | +23.051 |
disparate | +22.863 |
newer | +22.805 |
genuine | +22.620 |
sheer | +22.585 |
Neg logit contributions | |
u | -10.049 |
acy | -9.731 |
ong | -9.115 |
ire | -9.087 |
ade | -8.941 |
Token | Chandler |
Token ID | 28346 |
Feature activation | +2.88e+00 |
Pos logit contributions | |
- | +13.470 |
. | +13.253 |
u | +12.455 |
acy | +12.141 |
ia | +11.758 |
Neg logit contributions | |
disparate | -8.882 |
relentless | -8.412 |
blatant | -8.383 |
venerable | -8.347 |
anecdotal | -8.252 |
Token | before |
Token ID | 878 |
Feature activation | -7.84e+00 |
Pos logit contributions | |
- | +7.365 |
. | +7.272 |
u | +6.947 |
ia | +6.589 |
acy | +6.574 |
Neg logit contributions | |
disparate | -5.870 |
venerable | -5.626 |
relentless | -5.576 |
blatant | -5.573 |
anecdotal | -5.526 |
Token | they |
Token ID | 484 |
Feature activation | -5.60e+00 |
Pos logit contributions | |
various | +23.016 |
newer | +22.743 |
disparate | +22.694 |
sheer | +22.678 |
genuine | +22.651 |
Neg logit contributions | |
u | -10.132 |
acy | -9.933 |
aga | -9.116 |
ong | -9.070 |
ire | -9.028 |
Token | can |
Token ID | 460 |
Feature activation | -6.37e+00 |
Pos logit contributions | |
various | +14.879 |
disparate | +14.847 |
newer | +14.813 |
genuine | +14.655 |
blatant | +14.652 |
Neg logit contributions | |
u | -9.868 |
acy | -9.645 |
ia | -9.267 |
- | -9.229 |
aga | -9.104 |
Token | do |
Token ID | 466 |
Feature activation | -3.43e+00 |
Pos logit contributions | |
various | +18.290 |
newer | +18.148 |
genuine | +18.105 |
disparate | +18.078 |
tremendous | +17.979 |
Neg logit contributions | |
u | -9.284 |
acy | -9.080 |
ia | -8.630 |
aga | -8.497 |
- | -8.446 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
disparate | +7.946 |
newer | +7.792 |
various | +7.731 |
blatant | +7.726 |
venerable | +7.708 |
Neg logit contributions | |
u | -8.120 |
- | -7.960 |
acy | -7.878 |
ia | -7.622 |
aga | -7.546 |
Token | else |
Token ID | 2073 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
disparate | +6.022 |
venerable | +5.924 |
newer | +5.922 |
relentless | +5.911 |
various | +5.907 |
Neg logit contributions | |
u | -2.476 |
- | -2.466 |
acy | -2.330 |
. | -2.241 |
ia | -2.218 |
Token | . |
Token ID | 13 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
disparate | +6.478 |
newer | +6.393 |
venerable | +6.380 |
relentless | +6.379 |
blatant | +6.374 |
Neg logit contributions | |
u | -1.061 |
- | -1.020 |
acy | -0.925 |
ia | -0.819 |
. | -0.815 |
Token | Do |
Token ID | 2141 |
Feature activation | -4.48e+00 |
Pos logit contributions | |
various | +24.684 |
modern | +24.183 |
newer | +24.157 |
those | +23.967 |
genuine | +23.882 |
Neg logit contributions | |
acy | -13.705 |
aga | -13.603 |
u | -13.567 |
igr | -13.510 |
iev | -13.045 |
Token | , |
Token ID | 11 |
Feature activation | -7.79e+00 |
Pos logit contributions | |
. | +5.960 |
- | +5.907 |
u | +5.694 |
acy | +5.256 |
ia | +5.182 |
Neg logit contributions | |
disparate | -6.951 |
venerable | -6.852 |
blatant | -6.749 |
anecdotal | -6.747 |
totality | -6.738 |
Token | so |
Token ID | 523 |
Feature activation | -9.39e+00 |
Pos logit contributions | |
newer | +22.458 |
various | +22.431 |
disparate | +22.168 |
tremendous | +21.945 |
relentless | +21.928 |
Neg logit contributions | |
u | -10.413 |
acy | -10.092 |
aga | -9.841 |
iev | -9.539 |
- | -9.514 |
Token | now |
Token ID | 783 |
Feature activation | -4.81e+00 |
Pos logit contributions | |
various | +26.299 |
newer | +26.066 |
disparate | +25.729 |
blatant | +25.711 |
gradual | +25.581 |
Neg logit contributions | |
u | -11.277 |
acy | -10.949 |
iev | -10.551 |
aga | -10.529 |
ée | -10.230 |
Token | the |
Token ID | 262 |
Feature activation | -7.55e+00 |
Pos logit contributions | |
disparate | +14.447 |
newer | +14.316 |
various | +14.300 |
blatant | +14.200 |
relentless | +14.135 |
Neg logit contributions | |
u | -7.644 |
acy | -7.329 |
- | -7.205 |
ia | -6.909 |
aga | -6.905 |
Token | ceremony |
Token ID | 10542 |
Feature activation | +4.55e+00 |
Pos logit contributions | |
various | +20.988 |
newer | +20.988 |
disparate | +20.827 |
blatant | +20.688 |
gradual | +20.658 |
Neg logit contributions | |
u | -11.195 |
acy | -10.914 |
aga | -10.555 |
iev | -10.268 |
ade | -10.201 |
Token | is |
Token ID | 318 |
Feature activation | -6.32e+00 |
Pos logit contributions | |
- | +10.764 |
. | +10.066 |
u | +10.024 |
ia | +9.528 |
acy | +9.431 |
Neg logit contributions | |
disparate | -9.064 |
venerable | -8.886 |
anecdotal | -8.644 |
totality | -8.601 |
relentless | -8.593 |
Token | happening |
Token ID | 5836 |
Feature activation | -5.65e-01 |
Pos logit contributions | |
disparate | +18.235 |
newer | +18.124 |
various | +18.058 |
blatant | +18.028 |
relentless | +17.957 |
Neg logit contributions | |
u | -9.840 |
acy | -9.688 |
- | -9.121 |
aga | -9.064 |
ia | -9.006 |
Token | to |
Token ID | 284 |
Feature activation | -5.18e+00 |
Pos logit contributions | |
disparate | +1.618 |
venerable | +1.594 |
blatant | +1.588 |
relentless | +1.580 |
totality | +1.573 |
Neg logit contributions | |
- | -1.042 |
u | -1.020 |
. | -1.000 |
acy | -0.969 |
ia | -0.938 |
Token | girls |
Token ID | 4813 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
disparate | +14.103 |
newer | +13.970 |
various | +13.932 |
blatant | +13.803 |
relentless | +13.753 |
Neg logit contributions | |
u | -9.664 |
acy | -9.374 |
- | -9.232 |
ia | -8.924 |
aga | -8.887 |
Token | as |
Token ID | 355 |
Feature activation | -3.83e+00 |
Pos logit contributions | |
. | +4.724 |
- | +4.719 |
u | +4.486 |
ia | +4.301 |
acy | +4.284 |
Neg logit contributions | |
disparate | -3.671 |
venerable | -3.611 |
totality | -3.599 |
anecdotal | -3.598 |
blatant | -3.589 |
Token | young |
Token ID | 1862 |
Feature activation | +7.22e+00 |
Pos logit contributions | |
disparate | +8.442 |
newer | +8.253 |
various | +8.223 |
blatant | +8.203 |
relentless | +8.186 |
Neg logit contributions | |
u | -9.518 |
- | -9.336 |
acy | -9.272 |
ia | -8.976 |
aga | -8.856 |
Token | state |
Token ID | 1181 |
Feature activation | +4.71e+00 |
Pos logit contributions | |
disparate | +3.315 |
newer | +3.262 |
various | +3.237 |
anecdotal | +3.225 |
venerable | +3.182 |
Neg logit contributions | |
u | -6.935 |
- | -6.924 |
acy | -6.729 |
ia | -6.571 |
ine | -6.560 |
Token | of |
Token ID | 286 |
Feature activation | -2.88e+00 |
Pos logit contributions | |
- | +11.597 |
. | +11.339 |
u | +10.687 |
acy | +10.193 |
ine | +10.089 |
Neg logit contributions | |
disparate | -8.668 |
anecdotal | -8.628 |
venerable | -8.559 |
relentless | -8.521 |
newer | -8.465 |
Token | dis |
Token ID | 595 |
Feature activation | +7.15e+00 |
Pos logit contributions | |
disparate | +4.519 |
newer | +4.414 |
venerable | +4.352 |
various | +4.305 |
anecdotal | +4.297 |
Neg logit contributions | |
u | -9.007 |
- | -8.955 |
acy | -8.821 |
ia | -8.567 |
ine | -8.497 |
Token | repair |
Token ID | 49932 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
- | +9.961 |
u | +9.391 |
. | +8.457 |
ab | +8.388 |
acy | +8.239 |
Neg logit contributions | |
anecdotal | -20.142 |
disparate | -19.740 |
venerable | -19.652 |
relentless | -19.637 |
newer | -19.617 |
Token | , |
Token ID | 11 |
Feature activation | -8.50e+00 |
Pos logit contributions | |
- | +8.137 |
. | +8.080 |
u | +7.702 |
acy | +7.422 |
ia | +7.324 |
Neg logit contributions | |
disparate | -6.355 |
venerable | -6.304 |
relentless | -6.272 |
blatant | -6.243 |
gradual | -6.166 |
Token | its |
Token ID | 663 |
Feature activation | -7.54e+00 |
Pos logit contributions | |
various | +23.288 |
disparate | +23.244 |
newer | +23.184 |
widespread | +22.822 |
blatant | +22.817 |
Neg logit contributions | |
u | -11.549 |
acy | -11.180 |
aga | -10.953 |
ong | -10.643 |
- | -10.599 |
Token | value |
Token ID | 1988 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
various | +21.141 |
newer | +21.053 |
disparate | +20.994 |
venerable | +20.657 |
relentless | +20.652 |
Neg logit contributions | |
u | -11.123 |
acy | -10.983 |
aga | -10.367 |
ong | -10.239 |
- | -9.993 |
Token | is |
Token ID | 318 |
Feature activation | -5.18e+00 |
Pos logit contributions | |
- | +4.202 |
u | +3.961 |
. | +3.952 |
acy | +3.920 |
ia | +3.827 |
Neg logit contributions | |
newer | -2.516 |
disparate | -2.506 |
venerable | -2.470 |
blatant | -2.455 |
totality | -2.434 |
Token | marginal |
Token ID | 14461 |
Feature activation | +4.47e+00 |
Pos logit contributions | |
disparate | +14.442 |
various | +14.218 |
newer | +14.181 |
blatant | +14.135 |
relentless | +14.116 |
Neg logit contributions | |
u | -9.296 |
acy | -9.020 |
- | -8.835 |
ia | -8.585 |
aga | -8.544 |
Token | , |
Token ID | 11 |
Feature activation | -7.33e+00 |
Pos logit contributions | |
- | +10.650 |
. | +10.516 |
u | +10.310 |
acy | +9.996 |
ia | +9.843 |
Neg logit contributions | |
blatant | -8.786 |
disparate | -8.760 |
relentless | -8.685 |
venerable | -8.551 |
gradual | -8.543 |
Token | and |
Token ID | 290 |
Feature activation | -9.85e+00 |
Pos logit contributions | |
various | +22.116 |
newer | +22.018 |
disparate | +22.001 |
tremendous | +21.633 |
blatant | +21.606 |
Neg logit contributions | |
u | -8.933 |
acy | -8.549 |
aga | -8.261 |
- | -8.055 |
ong | -8.025 |