Token | culture |
Token ID | 3968 |
Feature activation | +7.38e-01 |
Pos logit contributions | |
slang | +9.644 |
stereotype | +9.309 |
puberty | +9.055 |
tradition | +8.969 |
mentality | +8.920 |
Neg logit contributions | |
elect | -10.940 |
events | -10.489 |
oops | -10.437 |
awaits | -10.057 |
absolutely | -9.636 |
Token | before |
Token ID | 878 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
slang | +7.115 |
stereotype | +6.883 |
ingrained | +6.674 |
curfew | +6.593 |
puberty | +6.553 |
Neg logit contributions | |
elect | -6.562 |
events | -6.221 |
oops | -6.213 |
awaits | -5.932 |
papers | -5.673 |
Token | it |
Token ID | 340 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
slang | +10.191 |
puberty | +9.849 |
stereotype | +9.826 |
curfew | +9.686 |
tradition | +9.436 |
Neg logit contributions | |
elect | -10.948 |
oops | -10.689 |
events | -10.441 |
awaits | -10.214 |
papers | -9.970 |
Token | came |
Token ID | 1625 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
slang | +11.671 |
stereotype | +11.369 |
ingrained | +11.112 |
curfew | +10.852 |
worn | +10.806 |
Neg logit contributions | |
elect | -11.763 |
oops | -11.249 |
events | -10.982 |
awaits | -10.520 |
papers | -10.466 |
Token | under |
Token ID | 739 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
slang | +12.050 |
stereotype | +11.682 |
ingrained | +11.350 |
puberty | +11.146 |
tradition | +10.968 |
Neg logit contributions | |
elect | -15.980 |
oops | -15.916 |
events | -15.624 |
awaits | -14.843 |
papers | -14.612 |
Token | Greek |
Token ID | 8312 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
stereotype | +14.461 |
curfew | +14.366 |
slang | +14.267 |
colonialism | +14.031 |
puberty | +13.976 |
Neg logit contributions | |
oops | -15.793 |
elect | -15.562 |
events | -15.379 |
awaits | -14.906 |
ilib | -14.444 |
Token | influence |
Token ID | 4588 |
Feature activation | +5.25e-01 |
Pos logit contributions | |
colonialism | +17.955 |
tradition | +17.779 |
stereotype | +17.491 |
slang | +17.439 |
curfew | +17.148 |
Neg logit contributions | |
elect | -19.907 |
events | -19.775 |
oops | -19.623 |
papers | -18.807 |
ilib | -18.501 |
Token | . |
Token ID | 13 |
Feature activation | +7.62e-01 |
Pos logit contributions | |
slang | +5.259 |
stereotype | +5.094 |
curfew | +4.969 |
ingrained | +4.937 |
puberty | +4.909 |
Neg logit contributions | |
elect | -4.548 |
events | -4.280 |
oops | -4.267 |
awaits | -4.101 |
probably | -3.896 |
Token | I |
Token ID | 314 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
slang | +7.809 |
stereotype | +7.572 |
curfew | +7.200 |
puberty | +7.198 |
ingrained | +7.165 |
Neg logit contributions | |
elect | -6.213 |
events | -5.817 |
oops | -5.796 |
awaits | -5.604 |
papers | -5.269 |
Token | don |
Token ID | 836 |
Feature activation | -4.10e-01 |
Pos logit contributions | |
slang | +9.049 |
stereotype | +9.000 |
ingrained | +8.538 |
curfew | +8.391 |
puberty | +8.371 |
Neg logit contributions | |
elect | -9.370 |
events | -8.993 |
oops | -8.867 |
awaits | -8.508 |
papers | -8.209 |
Token | 't |
Token ID | 470 |
Feature activation | +9.80e-01 |
Pos logit contributions | |
elect | +1.962 |
events | +1.721 |
oops | +1.676 |
probably | +1.549 |
absolutely | +1.502 |
Neg logit contributions | |
slang | -5.739 |
curfew | -5.689 |
stereotype | -5.688 |
puberty | -5.545 |
ingrained | -5.517 |
Token | library |
Token ID | 32016 |
Feature activation | +6.46e-01 |
Pos logit contributions | |
slang | +1.063 |
stereotype | +1.035 |
curfew | +1.012 |
ingrained | +0.999 |
puberty | +0.991 |
Neg logit contributions | |
elect | -0.765 |
events | -0.715 |
oops | -0.703 |
awaits | -0.680 |
probably | -0.652 |
Token | services |
Token ID | 2594 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
slang | +6.007 |
stereotype | +5.826 |
curfew | +5.602 |
mentality | +5.528 |
ingrained | +5.523 |
Neg logit contributions | |
elect | -5.914 |
events | -5.676 |
oops | -5.622 |
awaits | -5.326 |
probably | -5.240 |
Token | platform |
Token ID | 3859 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
slang | +11.654 |
stereotype | +11.284 |
mentality | +10.941 |
ingrained | +10.752 |
curfew | +10.728 |
Neg logit contributions | |
elect | -8.075 |
events | -7.888 |
oops | -7.754 |
probably | -7.074 |
awaits | -7.009 |
Token | � |
Token ID | 447 |
Feature activation | +2.21e-01 |
Pos logit contributions | |
slang | +11.075 |
stereotype | +10.676 |
mentality | +10.241 |
ingrained | +10.202 |
curfew | +10.172 |
Neg logit contributions | |
elect | -7.558 |
events | -7.173 |
oops | -7.053 |
awaits | -6.450 |
absolutely | -6.416 |
Token | � |
Token ID | 251 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
slang | +2.122 |
stereotype | +2.060 |
curfew | +2.007 |
ingrained | +1.982 |
puberty | +1.964 |
Neg logit contributions | |
elect | -2.039 |
events | -1.929 |
oops | -1.898 |
awaits | -1.844 |
probably | -1.778 |
Token | was |
Token ID | 373 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
slang | +13.594 |
stereotype | +13.074 |
ingrained | +12.550 |
tradition | +12.338 |
worn | +12.300 |
Neg logit contributions | |
elect | -8.790 |
events | -8.379 |
oops | -8.246 |
awaits | -7.746 |
enough | -7.454 |
Token | established |
Token ID | 4920 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
slang | +21.113 |
ingrained | +19.398 |
worn | +19.274 |
stereotype | +18.745 |
prevalent | +18.485 |
Neg logit contributions | |
oops | -18.362 |
events | -17.450 |
elect | -17.268 |
awaits | -16.546 |
ilib | -15.855 |
Token | to |
Token ID | 284 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
slang | +14.048 |
stereotype | +12.829 |
ingrained | +12.575 |
puberty | +12.450 |
tradition | +12.445 |
Neg logit contributions | |
elect | -15.964 |
oops | -15.805 |
events | -15.383 |
awaits | -14.948 |
absolutely | -14.071 |
Token | differentiate |
Token ID | 28754 |
Feature activation | +8.61e-01 |
Pos logit contributions | |
slang | +15.301 |
stereotype | +14.707 |
ingrained | +13.106 |
emphasis | +12.867 |
leash | +12.808 |
Neg logit contributions | |
oops | -17.102 |
elect | -17.078 |
events | -16.613 |
awaits | -16.235 |
dies | -15.582 |
Token | these |
Token ID | 777 |
Feature activation | -1.92e-02 |
Pos logit contributions | |
slang | +7.629 |
stereotype | +7.307 |
ingrained | +7.064 |
curfew | +6.956 |
puberty | +6.888 |
Neg logit contributions | |
elect | -8.134 |
oops | -7.842 |
events | -7.757 |
awaits | -7.424 |
probably | -7.213 |
Token | products |
Token ID | 3186 |
Feature activation | +7.94e-01 |
Pos logit contributions | |
elect | +0.167 |
events | +0.157 |
oops | +0.154 |
awaits | +0.150 |
probably | +0.144 |
Neg logit contributions | |
slang | -0.194 |
stereotype | -0.189 |
curfew | -0.186 |
ingrained | -0.182 |
puberty | -0.181 |
Token | bend |
Token ID | 19396 |
Feature activation | +5.62e-02 |
Pos logit contributions | |
elect | +8.729 |
awaits | +8.198 |
events | +7.986 |
oops | +7.898 |
indeed | +7.789 |
Neg logit contributions | |
slang | -7.337 |
stereotype | -7.083 |
ingrained | -6.885 |
curfew | -6.877 |
puberty | -6.829 |
Token | - |
Token ID | 532 |
Feature activation | -8.44e-02 |
Pos logit contributions | |
slang | +0.537 |
stereotype | +0.522 |
curfew | +0.509 |
ingrained | +0.501 |
puberty | +0.497 |
Neg logit contributions | |
elect | -0.522 |
events | -0.492 |
oops | -0.484 |
awaits | -0.471 |
probably | -0.455 |
Token | a |
Token ID | 257 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
elect | +0.828 |
events | +0.782 |
oops | +0.773 |
awaits | +0.750 |
probably | +0.732 |
Neg logit contributions | |
slang | -0.758 |
stereotype | -0.741 |
curfew | -0.721 |
ingrained | -0.705 |
puberty | -0.702 |
Token | skill |
Token ID | 5032 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
slang | +10.652 |
stereotype | +10.251 |
curfew | +9.877 |
tradition | +9.768 |
ingrained | +9.734 |
Neg logit contributions | |
elect | -11.225 |
events | -10.897 |
oops | -10.721 |
papers | -10.152 |
awaits | -10.097 |
Token | that |
Token ID | 326 |
Feature activation | +7.88e-01 |
Pos logit contributions | |
slang | +17.234 |
ingrained | +16.884 |
stereotype | +16.612 |
worn | +16.447 |
tradition | +16.193 |
Neg logit contributions | |
elect | -13.096 |
events | -12.966 |
oops | -12.358 |
ilib | -11.875 |
papers | -11.832 |
Token | was |
Token ID | 373 |
Feature activation | +2.52e+00 |
Pos logit contributions | |
slang | +8.557 |
stereotype | +8.351 |
ingrained | +8.172 |
curfew | +8.132 |
puberty | +8.029 |
Neg logit contributions | |
elect | -5.899 |
events | -5.591 |
oops | -5.586 |
papers | -5.004 |
probably | -4.978 |
Token | hon |
Token ID | 3032 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
ingrained | +23.718 |
slang | +23.402 |
worn | +22.691 |
practiced | +22.404 |
stereotype | +22.076 |
Neg logit contributions | |
oops | -14.654 |
events | -14.099 |
elect | -13.958 |
awaits | -12.568 |
papers | -12.549 |
Token | ed |
Token ID | 276 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
slang | +2.751 |
stereotype | +2.665 |
curfew | +2.586 |
ingrained | +2.558 |
puberty | +2.527 |
Neg logit contributions | |
elect | -3.071 |
events | -2.919 |
oops | -2.879 |
awaits | -2.805 |
probably | -2.714 |
Token | as |
Token ID | 355 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
slang | +13.393 |
ingrained | +12.607 |
stereotype | +12.533 |
puberty | +12.522 |
worn | +12.265 |
Neg logit contributions | |
oops | -13.609 |
elect | -13.449 |
events | -13.139 |
papers | -12.298 |
awaits | -12.192 |
Token | a |
Token ID | 257 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
slang | +11.208 |
stereotype | +10.597 |
ingrained | +10.369 |
puberty | +10.297 |
worn | +10.057 |
Neg logit contributions | |
elect | -12.158 |
oops | -11.938 |
events | -11.738 |
awaits | -11.020 |
ilib | -10.980 |
Token | child |
Token ID | 1200 |
Feature activation | +9.68e-01 |
Pos logit contributions | |
slang | +10.797 |
stereotype | +10.415 |
curfew | +9.828 |
puberty | +9.736 |
ingrained | +9.712 |
Neg logit contributions | |
elect | -13.012 |
events | -12.708 |
oops | -12.629 |
papers | -11.736 |
awaits | -11.727 |
Token | with |
Token ID | 351 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
slang | +9.131 |
stereotype | +8.807 |
ingrained | +8.468 |
tradition | +8.288 |
mentality | +8.198 |
Neg logit contributions | |
elect | -14.067 |
oops | -13.871 |
events | -13.693 |
awaits | -12.856 |
probably | -12.716 |
Token | the |
Token ID | 262 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
slang | +11.212 |
stereotype | +10.828 |
tradition | +10.573 |
ingrained | +10.353 |
puberty | +10.245 |
Neg logit contributions | |
elect | -14.297 |
oops | -14.244 |
events | -13.926 |
probably | -13.214 |
awaits | -13.160 |
Token | worship |
Token ID | 11892 |
Feature activation | +8.79e-01 |
Pos logit contributions | |
slang | +7.246 |
stereotype | +7.112 |
ingrained | +6.555 |
tradition | +6.550 |
curfew | +6.520 |
Neg logit contributions | |
elect | -12.578 |
oops | -12.351 |
events | -12.248 |
awaits | -11.617 |
probably | -11.549 |
Token | of |
Token ID | 286 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
slang | +8.450 |
stereotype | +8.192 |
ingrained | +7.973 |
mentality | +7.909 |
curfew | +7.889 |
Neg logit contributions | |
elect | -7.403 |
oops | -7.071 |
events | -7.063 |
awaits | -6.707 |
probably | -6.496 |
Token | North |
Token ID | 2258 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
slang | +8.167 |
stereotype | +8.057 |
tradition | +7.697 |
ingrained | +7.672 |
puberty | +7.629 |
Neg logit contributions | |
elect | -12.386 |
oops | -12.184 |
events | -12.013 |
awaits | -11.457 |
probably | -11.339 |
Token | Korea |
Token ID | 4969 |
Feature activation | +2.52e+00 |
Pos logit contributions | |
slang | +6.212 |
stereotype | +5.689 |
puberty | +5.518 |
mentality | +5.400 |
ingrained | +5.345 |
Neg logit contributions | |
elect | -17.525 |
oops | -17.244 |
events | -17.038 |
awaits | -16.442 |
papers | -16.235 |
Token | 's |
Token ID | 338 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
stereotype | +17.151 |
slang | +17.037 |
tradition | +16.462 |
mentality | +15.866 |
worn | +15.807 |
Neg logit contributions | |
oops | -18.092 |
elect | -18.065 |
events | -17.464 |
enough | -16.452 |
probably | -16.409 |
Token | founder |
Token ID | 9119 |
Feature activation | +5.09e-01 |
Pos logit contributions | |
slang | +6.301 |
stereotype | +6.093 |
ingrained | +5.697 |
tradition | +5.624 |
curfew | +5.557 |
Neg logit contributions | |
elect | -14.154 |
oops | -13.939 |
events | -13.789 |
awaits | -13.168 |
papers | -13.113 |
Token | Kim |
Token ID | 6502 |
Feature activation | +6.58e-01 |
Pos logit contributions | |
slang | +4.202 |
stereotype | +4.075 |
curfew | +3.934 |
ingrained | +3.898 |
puberty | +3.846 |
Neg logit contributions | |
elect | -5.263 |
events | -5.062 |
oops | -5.021 |
awaits | -4.801 |
probably | -4.705 |
Token | Il |
Token ID | 13778 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
slang | +5.927 |
stereotype | +5.738 |
ingrained | +5.554 |
curfew | +5.524 |
puberty | +5.484 |
Neg logit contributions | |
elect | -6.213 |
events | -5.944 |
oops | -5.910 |
awaits | -5.629 |
papers | -5.508 |
Token | Sung |
Token ID | 29802 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
slang | +5.971 |
stereotype | +5.545 |
ingrained | +5.286 |
puberty | +5.180 |
tradition | +5.153 |
Neg logit contributions | |
elect | -16.117 |
oops | -15.798 |
events | -15.752 |
awaits | -15.009 |
probably | -14.788 |
Token | ch |
Token ID | 354 |
Feature activation | +7.51e-02 |
Pos logit contributions | |
elect | +1.050 |
events | +0.976 |
oops | +0.959 |
awaits | +0.906 |
probably | +0.891 |
Neg logit contributions | |
slang | -1.570 |
stereotype | -1.539 |
curfew | -1.499 |
ingrained | -1.480 |
puberty | -1.478 |
Token | ucking |
Token ID | 19296 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
slang | +0.795 |
stereotype | +0.775 |
curfew | +0.757 |
ingrained | +0.745 |
puberty | +0.741 |
Neg logit contributions | |
elect | -0.622 |
events | -0.583 |
oops | -0.574 |
awaits | -0.554 |
probably | -0.534 |
Token | ' |
Token ID | 6 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
slang | +12.327 |
stereotype | +11.792 |
curfew | +11.682 |
ingrained | +11.477 |
mentality | +11.406 |
Neg logit contributions | |
elect | -9.628 |
events | -9.048 |
oops | -8.949 |
awaits | -8.265 |
probably | -8.262 |
Token | was |
Token ID | 373 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
slang | +10.935 |
stereotype | +10.415 |
curfew | +10.359 |
ingrained | +10.213 |
mentality | +10.104 |
Neg logit contributions | |
elect | -7.475 |
events | -7.028 |
oops | -7.012 |
probably | -6.413 |
awaits | -6.353 |
Token | not |
Token ID | 407 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
slang | +18.670 |
ingrained | +18.130 |
stereotype | +17.460 |
worn | +17.371 |
practiced | +17.257 |
Neg logit contributions | |
elect | -11.146 |
oops | -10.891 |
events | -10.424 |
awaits | -9.731 |
papers | -9.316 |
Token | a |
Token ID | 257 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
slang | +20.415 |
ingrained | +19.979 |
practiced | +19.335 |
stereotype | +19.175 |
worn | +19.087 |
Neg logit contributions | |
oops | -14.660 |
elect | -14.631 |
events | -13.932 |
awaits | -13.380 |
papers | -13.281 |
Token | crime |
Token ID | 4065 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
slang | +20.711 |
stereotype | +20.212 |
curfew | +19.279 |
ingrained | +19.271 |
tradition | +19.231 |
Neg logit contributions | |
elect | -17.885 |
events | -17.692 |
oops | -17.595 |
papers | -16.407 |
probably | -15.917 |
Token | but |
Token ID | 475 |
Feature activation | +6.17e-01 |
Pos logit contributions | |
slang | +12.026 |
stereotype | +11.656 |
ingrained | +11.289 |
curfew | +11.262 |
mentality | +11.157 |
Neg logit contributions | |
elect | -11.013 |
events | -10.753 |
oops | -10.633 |
awaits | -9.748 |
probably | -9.627 |
Token | a |
Token ID | 257 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
slang | +5.931 |
stereotype | +5.697 |
curfew | +5.584 |
ingrained | +5.545 |
puberty | +5.396 |
Neg logit contributions | |
elect | -5.677 |
events | -5.371 |
oops | -5.320 |
awaits | -5.046 |
probably | -4.926 |
Token | technical |
Token ID | 6276 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
slang | +18.743 |
stereotype | +18.244 |
curfew | +17.561 |
ingrained | +17.533 |
tradition | +17.418 |
Neg logit contributions | |
elect | -16.244 |
events | -16.176 |
oops | -16.079 |
papers | -14.631 |
awaits | -14.062 |
Token | fault |
Token ID | 8046 |
Feature activation | +6.42e-01 |
Pos logit contributions | |
slang | +13.434 |
stereotype | +12.941 |
curfew | +12.453 |
mentality | +12.286 |
ingrained | +12.274 |
Neg logit contributions | |
elect | -14.814 |
events | -14.724 |
oops | -14.267 |
awaits | -13.242 |
papers | -13.238 |
Token | from |
Token ID | 422 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
elect | +0.230 |
events | +0.214 |
oops | +0.209 |
awaits | +0.207 |
probably | +0.198 |
Neg logit contributions | |
slang | -0.274 |
stereotype | -0.267 |
curfew | -0.262 |
ingrained | -0.256 |
puberty | -0.255 |
Token | Devon |
Token ID | 36889 |
Feature activation | +3.97e-02 |
Pos logit contributions | |
elect | +1.026 |
events | +0.969 |
oops | +0.954 |
awaits | +0.935 |
probably | +0.910 |
Neg logit contributions | |
slang | -0.869 |
stereotype | -0.842 |
curfew | -0.824 |
ingrained | -0.808 |
puberty | -0.796 |
Token | who |
Token ID | 508 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
slang | +0.417 |
stereotype | +0.407 |
curfew | +0.398 |
ingrained | +0.392 |
puberty | +0.389 |
Neg logit contributions | |
elect | -0.331 |
events | -0.308 |
oops | -0.303 |
awaits | -0.295 |
probably | -0.284 |
Token | developed |
Token ID | 4166 |
Feature activation | +4.49e-01 |
Pos logit contributions | |
elect | +0.242 |
events | +0.229 |
oops | +0.225 |
awaits | +0.222 |
probably | +0.213 |
Neg logit contributions | |
slang | -0.232 |
stereotype | -0.226 |
curfew | -0.221 |
ingrained | -0.215 |
puberty | -0.214 |
Token | a |
Token ID | 257 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
slang | +3.794 |
stereotype | +3.642 |
curfew | +3.517 |
ingrained | +3.490 |
puberty | +3.461 |
Neg logit contributions | |
elect | -4.664 |
events | -4.463 |
oops | -4.425 |
awaits | -4.297 |
probably | -4.159 |
Token | Chinese |
Token ID | 3999 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
slang | +10.847 |
stereotype | +10.358 |
curfew | +9.890 |
ingrained | +9.714 |
puberty | +9.612 |
Neg logit contributions | |
elect | -12.160 |
events | -11.970 |
oops | -11.802 |
awaits | -11.186 |
papers | -11.134 |
Token | accent |
Token ID | 18702 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
slang | +19.368 |
stereotype | +18.336 |
mentality | +17.255 |
tradition | +16.978 |
ingrained | +16.816 |
Neg logit contributions | |
events | -19.073 |
oops | -19.041 |
elect | -18.825 |
papers | -17.811 |
cells | -17.525 |
Token | following |
Token ID | 1708 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
slang | +11.571 |
stereotype | +11.123 |
ingrained | +10.754 |
worn | +10.532 |
curfew | +10.386 |
Neg logit contributions | |
elect | -11.838 |
events | -11.630 |
oops | -11.426 |
awaits | -10.794 |
papers | -10.590 |
Token | a |
Token ID | 257 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
slang | +2.985 |
stereotype | +2.886 |
curfew | +2.812 |
ingrained | +2.753 |
puberty | +2.749 |
Neg logit contributions | |
elect | -3.708 |
events | -3.536 |
oops | -3.504 |
awaits | -3.403 |
probably | -3.299 |
Token | migraine |
Token ID | 50082 |
Feature activation | +5.65e-01 |
Pos logit contributions | |
slang | +4.369 |
stereotype | +4.239 |
curfew | +4.139 |
ingrained | +4.027 |
puberty | +4.016 |
Neg logit contributions | |
elect | -5.049 |
events | -4.815 |
oops | -4.748 |
awaits | -4.614 |
probably | -4.462 |
Token | , |
Token ID | 11 |
Feature activation | +7.38e-01 |
Pos logit contributions | |
slang | +5.396 |
stereotype | +5.277 |
curfew | +5.154 |
ingrained | +5.053 |
puberty | +5.049 |
Neg logit contributions | |
elect | -5.150 |
events | -4.892 |
oops | -4.846 |
awaits | -4.679 |
probably | -4.523 |
Token | alcohol |
Token ID | 5548 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
slang | +1.112 |
stereotype | +1.082 |
curfew | +1.053 |
ingrained | +1.039 |
puberty | +1.031 |
Neg logit contributions | |
elect | -1.015 |
events | -0.955 |
oops | -0.940 |
awaits | -0.915 |
probably | -0.882 |
Token | monitoring |
Token ID | 9904 |
Feature activation | +1.72e+00 |
Pos logit contributions | |
slang | +13.887 |
curfew | +13.805 |
stereotype | +13.318 |
mentality | +12.912 |
leash | +12.840 |
Neg logit contributions | |
elect | -13.957 |
oops | -13.298 |
events | -13.165 |
probably | -12.369 |
absolutely | -12.220 |
Token | or |
Token ID | 393 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
slang | +14.477 |
curfew | +14.062 |
worn | +13.902 |
stereotype | +13.735 |
mentality | +13.670 |
Neg logit contributions | |
elect | -13.827 |
oops | -13.256 |
events | -13.116 |
probably | -12.428 |
absolutely | -12.323 |
Token | SC |
Token ID | 6374 |
Feature activation | +9.39e-01 |
Pos logit contributions | |
slang | +1.259 |
stereotype | +1.223 |
curfew | +1.187 |
ingrained | +1.172 |
puberty | +1.163 |
Neg logit contributions | |
elect | -1.311 |
events | -1.239 |
oops | -1.219 |
awaits | -1.191 |
probably | -1.150 |
Token | RAM |
Token ID | 24115 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
slang | +8.259 |
stereotype | +7.939 |
curfew | +7.808 |
ingrained | +7.598 |
puberty | +7.557 |
Neg logit contributions | |
elect | -8.741 |
events | -8.388 |
oops | -8.195 |
awaits | -8.025 |
probably | -7.796 |
Token | requirements |
Token ID | 5359 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
slang | +19.792 |
curfew | +19.651 |
mentality | +18.859 |
worn | +18.712 |
stereotype | +18.588 |
Neg logit contributions | |
elect | -14.707 |
oops | -14.086 |
events | -14.006 |
probably | -13.015 |
ilib | -12.785 |
Token | removed |
Token ID | 4615 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
ingrained | +19.026 |
worn | +18.774 |
slang | +18.509 |
curfew | +18.223 |
stereotype | +18.144 |
Neg logit contributions | |
events | -17.411 |
elect | -17.168 |
oops | -16.910 |
probably | -15.107 |
ilib | -14.962 |
Token | , |
Token ID | 11 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
slang | +9.821 |
stereotype | +9.373 |
ingrained | +9.346 |
curfew | +9.341 |
mentality | +9.127 |
Neg logit contributions | |
elect | -10.361 |
oops | -10.110 |
events | -9.951 |
probably | -9.147 |
awaits | -9.126 |
Token | and |
Token ID | 290 |
Feature activation | +4.22e-01 |
Pos logit contributions | |
slang | +9.802 |
stereotype | +9.292 |
curfew | +9.254 |
ingrained | +8.965 |
mentality | +8.875 |
Neg logit contributions | |
elect | -10.090 |
events | -9.590 |
oops | -9.535 |
awaits | -8.983 |
absolutely | -8.873 |
Token | the |
Token ID | 262 |
Feature activation | +7.08e-01 |
Pos logit contributions | |
slang | +3.907 |
stereotype | +3.789 |
curfew | +3.718 |
ingrained | +3.637 |
puberty | +3.606 |
Neg logit contributions | |
elect | -4.016 |
events | -3.803 |
oops | -3.777 |
awaits | -3.613 |
probably | -3.530 |
Token | judge |
Token ID | 5052 |
Feature activation | -5.97e-03 |
Pos logit contributions | |
slang | +6.280 |
stereotype | +6.093 |
curfew | +6.048 |
ingrained | +5.814 |
puberty | +5.756 |
Neg logit contributions | |
elect | -6.838 |
oops | -6.542 |
events | -6.535 |
awaits | -6.190 |
probably | -6.086 |
Token | old |
Token ID | 1468 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
slang | +2.428 |
stereotype | +2.365 |
curfew | +2.283 |
ingrained | +2.252 |
puberty | +2.230 |
Neg logit contributions | |
elect | -2.791 |
events | -2.644 |
oops | -2.618 |
awaits | -2.551 |
probably | -2.467 |
Token | term |
Token ID | 3381 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
slang | +11.319 |
stereotype | +11.270 |
tradition | +10.719 |
ingrained | +10.531 |
curfew | +10.528 |
Neg logit contributions | |
elect | -10.088 |
events | -9.519 |
oops | -9.501 |
awaits | -9.096 |
probably | -8.828 |
Token | myth |
Token ID | 7918 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
elect | +0.895 |
events | +0.841 |
oops | +0.829 |
awaits | +0.809 |
probably | +0.780 |
Neg logit contributions | |
slang | -1.013 |
stereotype | -0.985 |
curfew | -0.966 |
ingrained | -0.946 |
puberty | -0.942 |
Token | os |
Token ID | 418 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
elect | +1.324 |
events | +1.248 |
oops | +1.236 |
awaits | +1.204 |
probably | +1.168 |
Neg logit contributions | |
slang | -1.330 |
stereotype | -1.289 |
curfew | -1.268 |
ingrained | -1.235 |
puberty | -1.232 |
Token | only |
Token ID | 691 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
elect | +0.888 |
events | +0.832 |
oops | +0.820 |
awaits | +0.798 |
probably | +0.770 |
Neg logit contributions | |
slang | -1.083 |
stereotype | -1.053 |
curfew | -1.037 |
ingrained | -1.013 |
puberty | -1.010 |
Token | came |
Token ID | 1625 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
slang | +12.564 |
stereotype | +12.284 |
ingrained | +12.009 |
worn | +11.792 |
tradition | +11.544 |
Neg logit contributions | |
elect | -10.297 |
oops | -9.694 |
events | -9.550 |
papers | -8.758 |
absolutely | -8.546 |
Token | to |
Token ID | 284 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
slang | +19.580 |
ingrained | +17.992 |
worn | +17.848 |
stereotype | +17.788 |
puberty | +17.233 |
Neg logit contributions | |
oops | -19.046 |
elect | -18.466 |
events | -18.007 |
awaits | -16.895 |
cells | -16.466 |
Token | denote |
Token ID | 42685 |
Feature activation | -6.37e-02 |
Pos logit contributions | |
slang | +17.889 |
stereotype | +17.342 |
puberty | +16.406 |
ingrained | +16.227 |
worn | +16.063 |
Neg logit contributions | |
elect | -16.701 |
oops | -16.688 |
events | -15.967 |
awaits | -15.336 |
papers | -14.490 |
Token | a |
Token ID | 257 |
Feature activation | +8.05e-01 |
Pos logit contributions | |
elect | +0.655 |
events | +0.623 |
oops | +0.611 |
awaits | +0.598 |
probably | +0.580 |
Neg logit contributions | |
slang | -0.541 |
stereotype | -0.523 |
curfew | -0.513 |
ingrained | -0.500 |
puberty | -0.496 |
Token | special |
Token ID | 2041 |
Feature activation | +5.30e-01 |
Pos logit contributions | |
slang | +7.150 |
stereotype | +7.010 |
curfew | +6.640 |
ingrained | +6.550 |
tradition | +6.514 |
Neg logit contributions | |
elect | -7.880 |
events | -7.515 |
oops | -7.457 |
awaits | -7.136 |
probably | -6.895 |
Token | category |
Token ID | 6536 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
slang | +4.506 |
stereotype | +4.393 |
curfew | +4.193 |
ingrained | +4.148 |
puberty | +4.107 |
Neg logit contributions | |
elect | -5.456 |
events | -5.191 |
oops | -5.149 |
awaits | -4.982 |
probably | -4.844 |
Token | , |
Token ID | 11 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
slang | +2.558 |
stereotype | +2.484 |
curfew | +2.418 |
ingrained | +2.403 |
puberty | +2.371 |
Neg logit contributions | |
elect | -2.142 |
events | -2.016 |
oops | -1.990 |
awaits | -1.920 |
probably | -1.855 |
Token | but |
Token ID | 475 |
Feature activation | +2.21e-01 |
Pos logit contributions | |
slang | +2.794 |
stereotype | +2.721 |
curfew | +2.661 |
ingrained | +2.628 |
puberty | +2.604 |
Neg logit contributions | |
elect | -2.102 |
events | -1.969 |
oops | -1.929 |
awaits | -1.869 |
probably | -1.796 |
Token | it |
Token ID | 340 |
Feature activation | +3.14e-01 |
Pos logit contributions | |
slang | +2.072 |
stereotype | +2.013 |
curfew | +1.957 |
ingrained | +1.932 |
puberty | +1.914 |
Neg logit contributions | |
elect | -2.095 |
events | -1.981 |
oops | -1.951 |
awaits | -1.892 |
probably | -1.834 |
Token | does |
Token ID | 857 |
Feature activation | +4.03e-01 |
Pos logit contributions | |
slang | +3.666 |
stereotype | +3.588 |
ingrained | +3.484 |
curfew | +3.481 |
puberty | +3.433 |
Neg logit contributions | |
elect | -2.218 |
events | -2.050 |
oops | -1.989 |
awaits | -1.895 |
probably | -1.810 |
Token | put |
Token ID | 1234 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
slang | +3.722 |
stereotype | +3.634 |
curfew | +3.510 |
ingrained | +3.462 |
puberty | +3.417 |
Neg logit contributions | |
elect | -3.806 |
events | -3.617 |
oops | -3.580 |
awaits | -3.461 |
probably | -3.325 |
Token | a |
Token ID | 257 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
stereotype | +18.000 |
slang | +17.986 |
ingrained | +17.819 |
curfew | +17.637 |
tradition | +17.521 |
Neg logit contributions | |
elect | -15.908 |
events | -15.411 |
oops | -15.205 |
awaits | -14.107 |
probably | -13.973 |
Token | dam |
Token ID | 1801 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
stereotype | +19.268 |
curfew | +18.407 |
slang | +17.961 |
leash | +17.759 |
limitation | +17.732 |
Neg logit contributions | |
events | -19.006 |
elect | -18.427 |
oops | -17.653 |
papers | -16.335 |
awaits | -16.323 |
Token | per |
Token ID | 525 |
Feature activation | +7.40e-01 |
Pos logit contributions | |
slang | +2.136 |
stereotype | +2.084 |
curfew | +2.044 |
ingrained | +2.000 |
puberty | +1.999 |
Neg logit contributions | |
elect | -1.626 |
events | -1.510 |
oops | -1.495 |
awaits | -1.439 |
probably | -1.396 |
Token | on |
Token ID | 319 |
Feature activation | +6.84e-01 |
Pos logit contributions | |
slang | +5.055 |
stereotype | +5.038 |
mentality | +4.850 |
curfew | +4.784 |
ingrained | +4.725 |
Neg logit contributions | |
elect | -8.187 |
events | -8.122 |
oops | -7.860 |
awaits | -7.656 |
probably | -7.414 |
Token | sharing |
Token ID | 7373 |
Feature activation | +1.71e-01 |
Pos logit contributions | |
slang | +5.941 |
stereotype | +5.768 |
curfew | +5.630 |
ingrained | +5.589 |
puberty | +5.464 |
Neg logit contributions | |
elect | -6.713 |
events | -6.376 |
oops | -6.283 |
awaits | -6.076 |
probably | -5.953 |
Token | your |
Token ID | 534 |
Feature activation | +4.17e-01 |
Pos logit contributions | |
slang | +1.588 |
stereotype | +1.541 |
curfew | +1.501 |
ingrained | +1.477 |
puberty | +1.464 |
Neg logit contributions | |
elect | -1.641 |
events | -1.552 |
oops | -1.530 |
awaits | -1.488 |
probably | -1.442 |
Token | calls |
Token ID | 3848 |
Feature activation | +9.19e-01 |
Pos logit contributions | |
elect | +1.866 |
events | +1.746 |
oops | +1.737 |
awaits | +1.708 |
probably | +1.634 |
Neg logit contributions | |
slang | -1.591 |
stereotype | -1.538 |
curfew | -1.496 |
ingrained | -1.465 |
puberty | -1.464 |
Token | for |
Token ID | 329 |
Feature activation | +9.92e-01 |
Pos logit contributions | |
slang | +7.330 |
stereotype | +7.157 |
curfew | +6.889 |
ingrained | +6.812 |
puberty | +6.761 |
Neg logit contributions | |
elect | -9.274 |
events | -9.082 |
oops | -8.892 |
awaits | -8.526 |
probably | -8.519 |
Token | bilingual |
Token ID | 48116 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
slang | +8.410 |
stereotype | +8.146 |
curfew | +7.982 |
ingrained | +7.872 |
puberty | +7.669 |
Neg logit contributions | |
elect | -9.386 |
events | -9.132 |
oops | -9.061 |
awaits | -8.644 |
probably | -8.507 |
Token | ism |
Token ID | 1042 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
slang | +9.455 |
stereotype | +9.163 |
curfew | +8.852 |
ingrained | +8.698 |
mentality | +8.669 |
Neg logit contributions | |
elect | -9.875 |
events | -9.629 |
oops | -9.438 |
awaits | -9.069 |
probably | -8.976 |
Token | to |
Token ID | 284 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
slang | +13.456 |
stereotype | +13.279 |
ingrained | +13.172 |
curfew | +12.780 |
proficiency | +12.748 |
Neg logit contributions | |
elect | -13.902 |
events | -13.470 |
oops | -13.369 |
probably | -12.497 |
awaits | -12.250 |
Token | be |
Token ID | 307 |
Feature activation | +2.47e+00 |
Pos logit contributions | |
slang | +9.454 |
stereotype | +9.437 |
ingrained | +8.920 |
curfew | +8.914 |
puberty | +8.648 |
Neg logit contributions | |
elect | -10.290 |
oops | -10.146 |
events | -9.984 |
awaits | -9.429 |
papers | -9.291 |
Token | a |
Token ID | 257 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
ingrained | +20.386 |
slang | +19.992 |
worn | +19.636 |
stereotype | +19.219 |
practiced | +19.213 |
Neg logit contributions | |
oops | -17.241 |
elect | -16.872 |
events | -16.488 |
awaits | -15.237 |
papers | -14.977 |
Token | requirement |
Token ID | 9079 |
Feature activation | +8.25e-01 |
Pos logit contributions | |
slang | +13.134 |
stereotype | +13.105 |
ingrained | +12.612 |
tradition | +12.601 |
curfew | +12.500 |
Neg logit contributions | |
elect | -15.460 |
events | -15.176 |
oops | -15.143 |
probably | -13.873 |
papers | -13.745 |
Token | for |
Token ID | 329 |
Feature activation | +7.12e-01 |
Pos logit contributions | |
slang | +7.185 |
stereotype | +7.064 |
ingrained | +6.938 |
curfew | +6.741 |
mentality | +6.737 |
Neg logit contributions | |
elect | -7.775 |
events | -7.607 |
oops | -7.537 |
awaits | -7.022 |
probably | -6.964 |
Token | all |
Token ID | 477 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
slang | +6.105 |
stereotype | +5.964 |
curfew | +5.768 |
ingrained | +5.724 |
puberty | +5.630 |
Neg logit contributions | |
elect | -7.020 |
events | -6.789 |
oops | -6.714 |
awaits | -6.419 |
probably | -6.310 |
Token | senior |
Token ID | 4664 |
Feature activation | -5.96e-02 |
Pos logit contributions | |
slang | +1.159 |
stereotype | +1.123 |
curfew | +1.092 |
ingrained | +1.072 |
puberty | +1.065 |
Neg logit contributions | |
elect | -1.345 |
events | -1.272 |
oops | -1.254 |
awaits | -1.228 |
probably | -1.186 |
Token | J |
Token ID | 449 |
Feature activation | +9.96e-02 |
Pos logit contributions | |
slang | +6.040 |
stereotype | +5.825 |
curfew | +5.660 |
puberty | +5.628 |
ingrained | +5.545 |
Neg logit contributions | |
elect | -5.752 |
events | -5.474 |
oops | -5.469 |
awaits | -5.195 |
probably | -5.029 |
Token | arl |
Token ID | 7063 |
Feature activation | -8.28e-02 |
Pos logit contributions | |
slang | +1.053 |
stereotype | +1.023 |
curfew | +0.995 |
ingrained | +0.982 |
puberty | +0.980 |
Neg logit contributions | |
elect | -0.820 |
events | -0.765 |
oops | -0.748 |
awaits | -0.737 |
probably | -0.702 |
Token | . |
Token ID | 13 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
elect | +0.669 |
events | +0.626 |
oops | +0.616 |
awaits | +0.595 |
probably | +0.572 |
Neg logit contributions | |
slang | -0.892 |
stereotype | -0.870 |
curfew | -0.850 |
ingrained | -0.838 |
puberty | -0.833 |
Token | " |
Token ID | 366 |
Feature activation | +2.23e-01 |
Pos logit contributions | |
slang | +2.996 |
stereotype | +2.833 |
curfew | +2.750 |
puberty | +2.714 |
ingrained | +2.673 |
Neg logit contributions | |
elect | -3.327 |
events | -3.200 |
oops | -3.159 |
awaits | -3.096 |
probably | -2.957 |
Token | When |
Token ID | 2215 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
slang | +2.407 |
stereotype | +2.343 |
curfew | +2.288 |
ingrained | +2.259 |
puberty | +2.242 |
Neg logit contributions | |
elect | -1.793 |
events | -1.678 |
oops | -1.650 |
awaits | -1.605 |
probably | -1.530 |
Token | I |
Token ID | 314 |
Feature activation | +2.43e+00 |
Pos logit contributions | |
slang | +10.651 |
puberty | +10.422 |
stereotype | +10.409 |
curfew | +10.198 |
tradition | +9.893 |
Neg logit contributions | |
elect | -9.984 |
events | -9.404 |
oops | -9.381 |
awaits | -8.727 |
probably | -8.675 |
Token | grew |
Token ID | 6348 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
stereotype | +16.535 |
practiced | +16.486 |
worn | +16.248 |
slang | +16.172 |
puberty | +16.018 |
Neg logit contributions | |
elect | -19.813 |
events | -19.166 |
oops | -18.873 |
papers | -17.681 |
legates | -17.163 |
Token | up |
Token ID | 510 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
slang | +10.505 |
puberty | +9.769 |
ingrained | +9.473 |
worn | +9.432 |
stereotype | +9.404 |
Neg logit contributions | |
elect | -20.134 |
oops | -19.601 |
events | -19.286 |
awaits | -18.653 |
probably | -18.475 |
Token | hockey |
Token ID | 12217 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
slang | +9.633 |
stereotype | +9.237 |
puberty | +9.085 |
ingrained | +9.033 |
curfew | +9.032 |
Neg logit contributions | |
elect | -9.293 |
oops | -8.847 |
events | -8.756 |
awaits | -8.381 |
papers | -8.111 |
Token | was |
Token ID | 373 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
slang | +13.360 |
stereotype | +12.887 |
ingrained | +12.662 |
puberty | +12.651 |
mentality | +12.630 |
Neg logit contributions | |
elect | -11.928 |
events | -11.268 |
oops | -11.138 |
ilib | -10.347 |
possibly | -10.189 |
Token | too |
Token ID | 1165 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
slang | +16.586 |
ingrained | +15.883 |
stereotype | +15.736 |
tradition | +15.358 |
puberty | +15.230 |
Neg logit contributions | |
elect | -13.105 |
oops | -12.407 |
events | -12.196 |
ilib | -11.345 |
awaits | -11.300 |
Token | , |
Token ID | 11 |
Feature activation | +6.01e-01 |
Pos logit contributions | |
elect | +0.192 |
events | +0.181 |
oops | +0.177 |
awaits | +0.173 |
probably | +0.166 |
Neg logit contributions | |
slang | -0.210 |
stereotype | -0.205 |
curfew | -0.200 |
ingrained | -0.196 |
puberty | -0.196 |
Token | a |
Token ID | 257 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
slang | +5.834 |
stereotype | +5.621 |
curfew | +5.560 |
ingrained | +5.435 |
puberty | +5.374 |
Neg logit contributions | |
elect | -5.369 |
events | -5.092 |
oops | -5.009 |
awaits | -4.804 |
probably | -4.683 |
Token | move |
Token ID | 1445 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
slang | +15.116 |
stereotype | +14.669 |
curfew | +14.645 |
tradition | +14.475 |
mentality | +14.026 |
Neg logit contributions | |
elect | -15.847 |
events | -15.522 |
oops | -15.209 |
ilib | -14.305 |
awaits | -14.043 |
Token | that |
Token ID | 326 |
Feature activation | +5.34e-01 |
Pos logit contributions | |
slang | +8.915 |
stereotype | +8.647 |
ingrained | +8.572 |
curfew | +8.465 |
tradition | +8.419 |
Neg logit contributions | |
elect | -9.740 |
events | -9.388 |
oops | -9.103 |
awaits | -8.683 |
probably | -8.558 |
Token | reversed |
Token ID | 17687 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
slang | +5.530 |
stereotype | +5.407 |
curfew | +5.301 |
ingrained | +5.237 |
puberty | +5.169 |
Neg logit contributions | |
elect | -4.404 |
events | -4.152 |
oops | -4.090 |
awaits | -3.816 |
probably | -3.773 |
Token | a |
Token ID | 257 |
Feature activation | +2.42e+00 |
Pos logit contributions | |
slang | +15.027 |
stereotype | +14.935 |
tradition | +14.837 |
ingrained | +14.529 |
curfew | +14.374 |
Neg logit contributions | |
elect | -13.957 |
oops | -13.475 |
events | -13.384 |
awaits | -12.746 |
probably | -12.543 |
Token | measure |
Token ID | 3953 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
stereotype | +18.741 |
tradition | +18.407 |
curfew | +18.178 |
slang | +17.918 |
mentality | +17.502 |
Neg logit contributions | |
events | -18.284 |
elect | -17.871 |
oops | -17.044 |
cells | -16.784 |
awaits | -16.182 |
Token | put |
Token ID | 1234 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
slang | +8.477 |
stereotype | +8.320 |
ingrained | +8.144 |
curfew | +8.094 |
worn | +8.040 |
Neg logit contributions | |
elect | -10.719 |
events | -10.511 |
oops | -10.314 |
probably | -9.702 |
awaits | -9.682 |
Token | in |
Token ID | 287 |
Feature activation | +8.96e-01 |
Pos logit contributions | |
slang | +10.161 |
ingrained | +9.676 |
stereotype | +9.664 |
puberty | +9.549 |
worn | +9.334 |
Neg logit contributions | |
events | -16.915 |
oops | -16.743 |
elect | -16.689 |
probably | -15.775 |
awaits | -15.316 |
Token | place |
Token ID | 1295 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
slang | +5.879 |
stereotype | +5.612 |
curfew | +5.579 |
puberty | +5.447 |
ingrained | +5.271 |
Neg logit contributions | |
elect | -10.300 |
events | -10.095 |
oops | -10.083 |
awaits | -9.547 |
probably | -9.387 |
Token | after |
Token ID | 706 |
Feature activation | +8.19e-01 |
Pos logit contributions | |
slang | +13.743 |
ingrained | +13.123 |
stereotype | +13.102 |
curfew | +13.051 |
worn | +13.049 |
Neg logit contributions | |
elect | -17.543 |
oops | -17.302 |
events | -17.077 |
awaits | -15.999 |
papers | -15.866 |
Token | . |
Token ID | 13 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
elect | +2.426 |
events | +2.305 |
oops | +2.226 |
awaits | +2.190 |
indeed | +2.099 |
Neg logit contributions | |
slang | -2.881 |
stereotype | -2.817 |
curfew | -2.786 |
puberty | -2.702 |
ingrained | -2.684 |
Token | Now |
Token ID | 2735 |
Feature activation | +6.45e-01 |
Pos logit contributions | |
elect | +1.987 |
events | +1.870 |
oops | +1.821 |
awaits | +1.762 |
probably | +1.716 |
Neg logit contributions | |
slang | -2.557 |
stereotype | -2.503 |
curfew | -2.481 |
puberty | -2.413 |
ingrained | -2.410 |
Token | that |
Token ID | 326 |
Feature activation | +6.42e-01 |
Pos logit contributions | |
slang | +6.164 |
stereotype | +5.977 |
ingrained | +5.895 |
curfew | +5.823 |
puberty | +5.743 |
Neg logit contributions | |
elect | -5.712 |
events | -5.359 |
oops | -5.338 |
awaits | -5.140 |
probably | -4.987 |
Token | this |
Token ID | 428 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
slang | +5.977 |
stereotype | +5.840 |
ingrained | +5.680 |
curfew | +5.665 |
puberty | +5.556 |
Neg logit contributions | |
elect | -5.872 |
oops | -5.515 |
events | -5.501 |
awaits | -5.229 |
probably | -5.153 |
Token | has |
Token ID | 468 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
slang | +11.389 |
stereotype | +11.253 |
ingrained | +10.983 |
mentality | +10.886 |
curfew | +10.827 |
Neg logit contributions | |
elect | -8.504 |
events | -8.003 |
oops | -7.924 |
probably | -7.205 |
papers | -7.169 |
Token | been |
Token ID | 587 |
Feature activation | +2.41e+00 |
Pos logit contributions | |
slang | +9.641 |
ingrained | +9.537 |
worn | +9.371 |
stereotype | +9.319 |
curfew | +8.982 |
Neg logit contributions | |
elect | -10.528 |
oops | -10.312 |
events | -9.882 |
awaits | -9.347 |
else | -9.200 |
Token | added |
Token ID | 2087 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
ingrained | +20.407 |
slang | +19.729 |
worn | +19.240 |
stereotype | +19.035 |
practiced | +18.604 |
Neg logit contributions | |
elect | -15.912 |
oops | -15.809 |
events | -15.295 |
awaits | -14.322 |
cells | -13.897 |
Token | , |
Token ID | 11 |
Feature activation | +1.68e-02 |
Pos logit contributions | |
slang | +11.261 |
stereotype | +10.739 |
ingrained | +10.728 |
mentality | +10.521 |
puberty | +10.458 |
Neg logit contributions | |
elect | -12.186 |
oops | -11.886 |
events | -11.524 |
awaits | -11.031 |
probably | -10.956 |
Token | I |
Token ID | 314 |
Feature activation | +4.39e-01 |
Pos logit contributions | |
slang | +0.161 |
stereotype | +0.156 |
curfew | +0.153 |
ingrained | +0.149 |
puberty | +0.149 |
Neg logit contributions | |
elect | -0.157 |
events | -0.148 |
oops | -0.145 |
awaits | -0.142 |
probably | -0.137 |
Token | feel |
Token ID | 1254 |
Feature activation | -3.69e-01 |
Pos logit contributions | |
slang | +4.258 |
stereotype | +4.148 |
curfew | +4.032 |
ingrained | +3.988 |
puberty | +3.944 |
Neg logit contributions | |
elect | -3.983 |
events | -3.763 |
oops | -3.703 |
awaits | -3.576 |
probably | -3.466 |
Token | a |
Token ID | 257 |
Feature activation | +9.64e-01 |
Pos logit contributions | |
elect | +3.408 |
events | +3.245 |
oops | +3.171 |
awaits | +3.138 |
absolutely | +3.047 |
Neg logit contributions | |
slang | -3.415 |
stereotype | -3.300 |
curfew | -3.229 |
puberty | -3.119 |
ingrained | -3.065 |
Token | was |
Token ID | 373 |
Feature activation | +8.15e-01 |
Pos logit contributions | |
slang | +6.879 |
stereotype | +6.686 |
curfew | +6.540 |
ingrained | +6.466 |
mentality | +6.335 |
Neg logit contributions | |
elect | -5.691 |
events | -5.345 |
oops | -5.256 |
awaits | -4.891 |
probably | -4.866 |
Token | the |
Token ID | 262 |
Feature activation | +9.39e-01 |
Pos logit contributions | |
slang | +6.893 |
stereotype | +6.628 |
curfew | +6.483 |
ingrained | +6.370 |
puberty | +6.276 |
Neg logit contributions | |
elect | -8.155 |
events | -7.861 |
oops | -7.734 |
awaits | -7.409 |
papers | -7.250 |
Token | old |
Token ID | 1468 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
slang | +8.163 |
stereotype | +7.935 |
curfew | +7.693 |
mentality | +7.563 |
ingrained | +7.534 |
Neg logit contributions | |
elect | -9.175 |
events | -8.916 |
oops | -8.650 |
awaits | -8.308 |
papers | -8.120 |
Token | D |
Token ID | 360 |
Feature activation | +8.92e-01 |
Pos logit contributions | |
slang | +17.554 |
stereotype | +17.234 |
tradition | +16.537 |
ingrained | +16.171 |
mentality | +16.149 |
Neg logit contributions | |
events | -15.758 |
elect | -15.428 |
oops | -14.797 |
awaits | -14.066 |
absolutely | -13.466 |
Token | FW |
Token ID | 24160 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
slang | +8.442 |
stereotype | +8.141 |
curfew | +8.042 |
ingrained | +7.817 |
mentality | +7.735 |
Neg logit contributions | |
elect | -7.773 |
events | -7.387 |
oops | -7.127 |
awaits | -7.006 |
probably | -6.814 |
Token | I |
Token ID | 40 |
Feature activation | +2.41e+00 |
Pos logit contributions | |
slang | +16.958 |
stereotype | +16.223 |
curfew | +15.987 |
tradition | +15.470 |
mentality | +15.465 |
Neg logit contributions | |
elect | -13.833 |
events | -13.555 |
oops | -12.742 |
awaits | -12.192 |
absolutely | -11.904 |
Token | ( |
Token ID | 357 |
Feature activation | +4.10e-02 |
Pos logit contributions | |
slang | +21.458 |
stereotype | +20.559 |
curfew | +20.508 |
mentality | +19.995 |
tradition | +19.953 |
Neg logit contributions | |
events | -15.631 |
elect | -15.429 |
oops | -14.425 |
awaits | -13.463 |
papers | -13.418 |
Token | Don |
Token ID | 3987 |
Feature activation | -8.73e-02 |
Pos logit contributions | |
slang | +0.427 |
stereotype | +0.416 |
curfew | +0.406 |
ingrained | +0.401 |
puberty | +0.398 |
Neg logit contributions | |
elect | -0.346 |
events | -0.324 |
oops | -0.319 |
awaits | -0.308 |
probably | -0.298 |
Token | 't |
Token ID | 470 |
Feature activation | +8.93e-01 |
Pos logit contributions | |
elect | +0.618 |
events | +0.572 |
oops | +0.564 |
awaits | +0.541 |
probably | +0.519 |
Neg logit contributions | |
slang | -1.022 |
stereotype | -1.003 |
curfew | -0.982 |
ingrained | -0.971 |
puberty | -0.965 |
Token | F |
Token ID | 376 |
Feature activation | +7.58e-01 |
Pos logit contributions | |
slang | +8.933 |
stereotype | +8.766 |
curfew | +8.468 |
ingrained | +8.219 |
mentality | +8.161 |
Neg logit contributions | |
elect | -7.414 |
events | -7.115 |
oops | -6.849 |
awaits | -6.763 |
papers | -6.484 |
Token | --- |
Token ID | 6329 |
Feature activation | +5.27e-01 |
Pos logit contributions | |
slang | +6.859 |
stereotype | +6.609 |
curfew | +6.415 |
ingrained | +6.325 |
mentality | +6.195 |
Neg logit contributions | |
elect | -6.995 |
events | -6.722 |
awaits | -6.547 |
oops | -6.449 |
probably | -6.174 |
Token | as |
Token ID | 292 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
elect | +1.788 |
events | +1.665 |
oops | +1.629 |
awaits | +1.531 |
probably | +1.529 |
Neg logit contributions | |
slang | -2.660 |
stereotype | -2.622 |
curfew | -2.545 |
ingrained | -2.524 |
puberty | -2.503 |
Token | opposed |
Token ID | 6886 |
Feature activation | +6.32e-01 |
Pos logit contributions | |
slang | +12.501 |
stereotype | +11.987 |
curfew | +11.834 |
ingrained | +11.729 |
worn | +11.602 |
Neg logit contributions | |
elect | -11.845 |
events | -11.363 |
oops | -11.140 |
probably | -10.422 |
absolutely | -10.181 |
Token | to |
Token ID | 284 |
Feature activation | +6.93e-01 |
Pos logit contributions | |
slang | +4.168 |
stereotype | +3.956 |
ingrained | +3.765 |
curfew | +3.762 |
puberty | +3.695 |
Neg logit contributions | |
elect | -7.628 |
events | -7.290 |
oops | -7.288 |
awaits | -7.067 |
probably | -6.875 |
Token | the |
Token ID | 262 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
slang | +6.483 |
stereotype | +6.324 |
curfew | +6.222 |
puberty | +6.058 |
ingrained | +6.052 |
Neg logit contributions | |
elect | -6.399 |
oops | -6.054 |
events | -6.009 |
awaits | -5.707 |
probably | -5.594 |
Token | division |
Token ID | 7297 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
slang | +8.721 |
stereotype | +8.642 |
curfew | +8.446 |
ingrained | +8.196 |
puberty | +8.110 |
Neg logit contributions | |
elect | -9.612 |
oops | -9.158 |
events | -9.123 |
awaits | -8.694 |
probably | -8.492 |
Token | housing |
Token ID | 5627 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
slang | +15.034 |
stereotype | +14.767 |
curfew | +14.664 |
mentality | +14.309 |
ingrained | +14.292 |
Neg logit contributions | |
elect | -12.582 |
events | -12.167 |
oops | -12.020 |
probably | -11.084 |
awaits | -10.965 |
Token | typical |
Token ID | 7226 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
stereotype | +20.336 |
slang | +20.290 |
curfew | +20.086 |
tradition | +19.667 |
mentality | +19.586 |
Neg logit contributions | |
elect | -15.974 |
events | -15.033 |
oops | -14.761 |
probably | -14.302 |
ilib | -13.790 |
Token | of |
Token ID | 286 |
Feature activation | +3.05e-01 |
Pos logit contributions | |
slang | +2.758 |
stereotype | +2.679 |
curfew | +2.614 |
ingrained | +2.571 |
puberty | +2.557 |
Neg logit contributions | |
elect | -2.433 |
events | -2.279 |
oops | -2.273 |
awaits | -2.176 |
probably | -2.120 |
Token | fr |
Token ID | 1216 |
Feature activation | -7.71e-01 |
Pos logit contributions | |
slang | +2.690 |
stereotype | +2.606 |
curfew | +2.534 |
ingrained | +2.489 |
puberty | +2.472 |
Neg logit contributions | |
elect | -3.062 |
events | -2.898 |
oops | -2.874 |
awaits | -2.790 |
probably | -2.708 |
Token | atern |
Token ID | 9205 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
elect | +3.652 |
events | +3.519 |
oops | +3.257 |
awaits | +2.853 |
papers | +2.773 |
Neg logit contributions | |
slang | -10.391 |
stereotype | -10.298 |
curfew | -10.163 |
puberty | -9.878 |
ingrained | -9.810 |
Token | ities |
Token ID | 871 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
elect | +1.595 |
events | +1.500 |
oops | +1.433 |
awaits | +1.306 |
probably | +1.274 |
Neg logit contributions | |
slang | -3.707 |
stereotype | -3.657 |
curfew | -3.611 |
ingrained | -3.550 |
puberty | -3.537 |
Token | my |
Token ID | 616 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
slang | +5.189 |
stereotype | +5.044 |
curfew | +4.911 |
ingrained | +4.852 |
puberty | +4.837 |
Neg logit contributions | |
elect | -4.809 |
events | -4.531 |
oops | -4.510 |
awaits | -4.290 |
probably | -4.170 |
Token | mother |
Token ID | 2802 |
Feature activation | +6.67e-02 |
Pos logit contributions | |
slang | +8.104 |
stereotype | +7.868 |
curfew | +7.634 |
ingrained | +7.429 |
puberty | +7.412 |
Neg logit contributions | |
elect | -13.100 |
oops | -12.723 |
events | -12.486 |
awaits | -12.046 |
probably | -11.778 |
Token | refused |
Token ID | 6520 |
Feature activation | +9.57e-02 |
Pos logit contributions | |
slang | +0.678 |
stereotype | +0.660 |
curfew | +0.645 |
ingrained | +0.634 |
puberty | +0.630 |
Neg logit contributions | |
elect | -0.577 |
events | -0.542 |
oops | -0.533 |
awaits | -0.520 |
probably | -0.500 |
Token | to |
Token ID | 284 |
Feature activation | +6.55e-01 |
Pos logit contributions | |
slang | +0.866 |
stereotype | +0.840 |
curfew | +0.818 |
ingrained | +0.804 |
puberty | +0.798 |
Neg logit contributions | |
elect | -0.937 |
events | -0.887 |
oops | -0.875 |
awaits | -0.852 |
probably | -0.825 |
Token | follow |
Token ID | 1061 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
slang | +5.810 |
stereotype | +5.720 |
curfew | +5.528 |
ingrained | +5.447 |
puberty | +5.377 |
Neg logit contributions | |
elect | -6.346 |
oops | -6.065 |
events | -6.060 |
awaits | -5.798 |
probably | -5.605 |
Token | this |
Token ID | 428 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
tradition | +14.419 |
slang | +14.184 |
stereotype | +14.038 |
curfew | +13.852 |
ingrained | +13.784 |
Neg logit contributions | |
elect | -15.963 |
oops | -15.678 |
events | -15.119 |
probably | -14.328 |
papers | -14.216 |
Token | custom |
Token ID | 2183 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
tradition | +20.734 |
stereotype | +20.329 |
mentality | +19.361 |
slang | +19.311 |
ingrained | +19.173 |
Neg logit contributions | |
oops | -17.419 |
elect | -17.414 |
events | -16.655 |
cells | -15.600 |
papers | -15.235 |
Token | . |
Token ID | 13 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
slang | +10.253 |
stereotype | +10.167 |
ingrained | +9.997 |
tradition | +9.821 |
mentality | +9.808 |
Neg logit contributions | |
elect | -9.996 |
oops | -9.827 |
events | -9.571 |
awaits | -9.074 |
probably | -8.798 |
Token |
|
Token ID | 198 |
Feature activation | +3.49e-01 |
Pos logit contributions | |
slang | +2.899 |
stereotype | +2.820 |
curfew | +2.744 |
ingrained | +2.704 |
puberty | +2.692 |
Neg logit contributions | |
elect | -2.458 |
events | -2.306 |
oops | -2.276 |
awaits | -2.207 |
probably | -2.115 |
Token |
|
Token ID | 198 |
Feature activation | +8.21e-01 |
Pos logit contributions | |
slang | +3.332 |
stereotype | +3.221 |
curfew | +3.119 |
ingrained | +3.092 |
puberty | +3.058 |
Neg logit contributions | |
elect | -3.195 |
events | -3.019 |
oops | -2.990 |
awaits | -2.918 |
probably | -2.775 |
Token | Instead |
Token ID | 13193 |
Feature activation | +5.92e-01 |
Pos logit contributions | |
slang | +7.932 |
stereotype | +7.607 |
curfew | +7.359 |
ingrained | +7.344 |
puberty | +7.292 |
Neg logit contributions | |
elect | -6.799 |
awaits | -6.474 |
events | -6.351 |
oops | -6.316 |
indeed | -5.861 |
Token | From |
Token ID | 4863 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
slang | +6.894 |
stereotype | +6.589 |
curfew | +6.346 |
ingrained | +6.307 |
puberty | +6.256 |
Neg logit contributions | |
elect | -6.195 |
awaits | -5.842 |
oops | -5.804 |
events | -5.792 |
indeed | -5.348 |
Token | the |
Token ID | 262 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
slang | +11.168 |
stereotype | +10.764 |
puberty | +10.644 |
tradition | +10.348 |
curfew | +10.281 |
Neg logit contributions | |
elect | -11.477 |
oops | -10.795 |
events | -10.644 |
awaits | -10.501 |
papers | -10.059 |
Token | mid |
Token ID | 3095 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
slang | +12.427 |
stereotype | +12.125 |
puberty | +11.670 |
tradition | +11.633 |
curfew | +11.552 |
Neg logit contributions | |
elect | -12.582 |
oops | -11.915 |
events | -11.683 |
awaits | -11.552 |
cells | -10.964 |
Token | - |
Token ID | 12 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
slang | +12.307 |
stereotype | +11.831 |
puberty | +11.643 |
tradition | +11.620 |
curfew | +11.539 |
Neg logit contributions | |
elect | -12.604 |
oops | -12.135 |
awaits | -12.094 |
events | -11.919 |
ilib | -11.221 |
Token | 13 |
Token ID | 1485 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
slang | +9.983 |
stereotype | +9.533 |
puberty | +9.425 |
curfew | +9.320 |
tradition | +9.240 |
Neg logit contributions | |
elect | -8.576 |
awaits | -8.241 |
oops | -8.079 |
events | -7.994 |
ilib | -7.635 |
Token | th |
Token ID | 400 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
slang | +11.571 |
stereotype | +10.973 |
tradition | +10.693 |
curfew | +10.482 |
puberty | +10.413 |
Neg logit contributions | |
elect | -13.051 |
awaits | -12.618 |
events | -12.618 |
oops | -12.548 |
absolutely | -11.808 |
Token | century |
Token ID | 4289 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
slang | +16.545 |
stereotype | +16.234 |
tradition | +15.884 |
puberty | +15.413 |
curfew | +15.373 |
Neg logit contributions | |
oops | -18.290 |
elect | -18.226 |
events | -17.904 |
papers | -16.861 |
awaits | -16.799 |
Token | Sanskrit |
Token ID | 46178 |
Feature activation | +9.46e-01 |
Pos logit contributions | |
slang | +13.362 |
stereotype | +12.895 |
puberty | +12.549 |
tradition | +12.523 |
curfew | +12.357 |
Neg logit contributions | |
elect | -13.473 |
oops | -13.034 |
events | -12.624 |
awaits | -11.872 |
absolutely | -11.712 |
Token | , |
Token ID | 11 |
Feature activation | +9.91e-01 |
Pos logit contributions | |
slang | +9.092 |
stereotype | +8.636 |
ingrained | +8.321 |
puberty | +8.290 |
tradition | +8.278 |
Neg logit contributions | |
elect | -8.348 |
events | -7.956 |
oops | -7.824 |
awaits | -7.403 |
absolutely | -7.251 |
Token | U |
Token ID | 471 |
Feature activation | +5.62e-01 |
Pos logit contributions | |
slang | +9.179 |
stereotype | +8.603 |
ingrained | +8.355 |
curfew | +8.272 |
tradition | +8.239 |
Neg logit contributions | |
elect | -9.070 |
events | -8.705 |
oops | -8.644 |
awaits | -8.190 |
papers | -7.948 |
Token | y |
Token ID | 88 |
Feature activation | +5.34e-01 |
Pos logit contributions | |
slang | +5.751 |
stereotype | +5.525 |
curfew | +5.370 |
ingrained | +5.343 |
puberty | +5.287 |
Neg logit contributions | |
elect | -4.630 |
events | -4.381 |
oops | -4.307 |
awaits | -4.237 |
probably | -4.003 |
Token | it |
Token ID | 340 |
Feature activation | +6.24e-01 |
Pos logit contributions | |
slang | +6.968 |
stereotype | +6.843 |
ingrained | +6.466 |
worn | +6.400 |
curfew | +6.393 |
Neg logit contributions | |
elect | -9.241 |
events | -8.959 |
oops | -8.788 |
awaits | -8.522 |
probably | -8.318 |
Token | was |
Token ID | 373 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
slang | +5.934 |
stereotype | +5.891 |
ingrained | +5.636 |
worn | +5.582 |
curfew | +5.526 |
Neg logit contributions | |
elect | -5.573 |
events | -5.321 |
oops | -5.239 |
awaits | -4.867 |
papers | -4.763 |
Token | a |
Token ID | 257 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
slang | +12.960 |
stereotype | +12.575 |
ingrained | +12.307 |
worn | +12.209 |
puberty | +12.198 |
Neg logit contributions | |
elect | -14.590 |
oops | -14.260 |
events | -13.989 |
awaits | -13.508 |
papers | -13.063 |
Token | year |
Token ID | 614 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
stereotype | +11.609 |
slang | +11.371 |
puberty | +10.685 |
worn | +10.668 |
tradition | +10.598 |
Neg logit contributions | |
events | -17.756 |
elect | -17.604 |
oops | -17.321 |
awaits | -16.298 |
ilib | -16.204 |
Token | or |
Token ID | 393 |
Feature activation | +8.70e-01 |
Pos logit contributions | |
slang | +8.769 |
stereotype | +8.062 |
ingrained | +7.918 |
puberty | +7.902 |
worn | +7.707 |
Neg logit contributions | |
elect | -18.699 |
events | -18.490 |
oops | -18.364 |
papers | -17.332 |
awaits | -17.328 |
Token | two |
Token ID | 734 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
slang | +7.537 |
stereotype | +7.418 |
curfew | +7.193 |
puberty | +7.119 |
ingrained | +7.088 |
Neg logit contributions | |
elect | -8.267 |
oops | -7.998 |
events | -7.890 |
awaits | -7.589 |
absolutely | -7.314 |
Token | ago |
Token ID | 2084 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
slang | +12.493 |
ingrained | +11.759 |
puberty | +11.474 |
stereotype | +11.456 |
worn | +11.450 |
Neg logit contributions | |
elect | -22.547 |
events | -22.512 |
oops | -22.221 |
papers | -21.422 |
absolutely | -20.857 |
Token | . |
Token ID | 13 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
slang | +3.604 |
stereotype | +3.526 |
curfew | +3.402 |
ingrained | +3.402 |
puberty | +3.360 |
Neg logit contributions | |
elect | -2.981 |
events | -2.812 |
oops | -2.770 |
awaits | -2.663 |
probably | -2.559 |
Token | Though |
Token ID | 7486 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
slang | +0.143 |
stereotype | +0.139 |
curfew | +0.137 |
ingrained | +0.135 |
puberty | +0.134 |
Neg logit contributions | |
elect | -0.114 |
events | -0.106 |
oops | -0.104 |
awaits | -0.101 |
probably | -0.098 |
Token | 50 |
Token ID | 2026 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
slang | +1.123 |
stereotype | +1.088 |
curfew | +1.063 |
ingrained | +1.043 |
puberty | +1.035 |
Neg logit contributions | |
elect | -1.198 |
events | -1.132 |
oops | -1.115 |
awaits | -1.089 |
probably | -1.054 |
Token | percent |
Token ID | 1411 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
elect | +1.344 |
events | +1.272 |
oops | +1.254 |
awaits | +1.223 |
probably | +1.183 |
Neg logit contributions | |
slang | -1.220 |
stereotype | -1.183 |
curfew | -1.158 |
ingrained | -1.131 |
puberty | -1.128 |
Token | S |
Token ID | 50 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
slang | +7.812 |
stereotype | +7.518 |
curfew | +7.176 |
ingrained | +7.144 |
mentality | +7.049 |
Neg logit contributions | |
elect | -6.953 |
events | -6.519 |
oops | -6.452 |
awaits | -6.274 |
probably | -5.992 |
Token | Telephone |
Token ID | 44735 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
slang | +15.524 |
stereotype | +14.654 |
curfew | +14.045 |
tradition | +13.835 |
mentality | +13.765 |
Neg logit contributions | |
elect | -12.198 |
oops | -11.434 |
events | -11.432 |
awaits | -10.667 |
probably | -10.616 |
Token | Sc |
Token ID | 1446 |
Feature activation | -5.04e-02 |
Pos logit contributions | |
slang | +10.031 |
stereotype | +9.535 |
curfew | +9.216 |
tradition | +8.977 |
ingrained | +8.970 |
Neg logit contributions | |
elect | -8.169 |
oops | -7.780 |
events | -7.766 |
awaits | -7.407 |
probably | -7.071 |
Token | am |
Token ID | 321 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
elect | +0.451 |
events | +0.424 |
oops | +0.420 |
awaits | +0.405 |
probably | +0.391 |
Neg logit contributions | |
slang | -0.499 |
stereotype | -0.486 |
curfew | -0.475 |
ingrained | -0.467 |
puberty | -0.464 |
Token | � |
Token ID | 447 |
Feature activation | +6.86e-01 |
Pos logit contributions | |
slang | +13.175 |
stereotype | +12.497 |
curfew | +11.888 |
mentality | +11.882 |
tradition | +11.867 |
Neg logit contributions | |
elect | -12.199 |
events | -11.756 |
oops | -11.445 |
awaits | -10.915 |
probably | -10.664 |
Token | � |
Token ID | 251 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
slang | +4.787 |
stereotype | +4.551 |
curfew | +4.384 |
ingrained | +4.354 |
puberty | +4.320 |
Neg logit contributions | |
elect | -7.764 |
events | -7.493 |
oops | -7.353 |
awaits | -7.208 |
probably | -6.986 |
Token | in |
Token ID | 287 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
slang | +19.737 |
stereotype | +17.988 |
terminology | +17.474 |
mentality | +17.216 |
curfew | +17.156 |
Neg logit contributions | |
elect | -15.908 |
events | -15.030 |
oops | -14.799 |
probably | -14.046 |
absolutely | -13.947 |
Token | the |
Token ID | 262 |
Feature activation | +3.03e-01 |
Pos logit contributions | |
slang | +2.500 |
stereotype | +2.380 |
curfew | +2.297 |
ingrained | +2.244 |
puberty | +2.225 |
Neg logit contributions | |
elect | -4.353 |
events | -4.168 |
oops | -4.116 |
awaits | -4.032 |
probably | -3.930 |
Token | notes |
Token ID | 4710 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
slang | +2.705 |
stereotype | +2.610 |
curfew | +2.535 |
ingrained | +2.494 |
puberty | +2.469 |
Neg logit contributions | |
elect | -3.010 |
events | -2.851 |
oops | -2.813 |
awaits | -2.740 |
probably | -2.653 |
Token | . |
Token ID | 13 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
slang | +4.989 |
stereotype | +4.825 |
ingrained | +4.642 |
curfew | +4.637 |
puberty | +4.554 |
Neg logit contributions | |
elect | -5.770 |
events | -5.544 |
oops | -5.446 |
awaits | -5.261 |
probably | -5.154 |
Token |
|
Token ID | 198 |
Feature activation | -3.88e-02 |
Pos logit contributions | |
elect | +1.151 |
events | +1.078 |
oops | +1.061 |
awaits | +1.028 |
probably | +0.989 |
Neg logit contributions | |
slang | -1.378 |
stereotype | -1.345 |
curfew | -1.321 |
ingrained | -1.307 |
puberty | -1.295 |
Token | and |
Token ID | 290 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
slang | +11.586 |
curfew | +11.520 |
stereotype | +11.245 |
mentality | +11.106 |
ingrained | +10.740 |
Neg logit contributions | |
elect | -11.081 |
oops | -10.613 |
events | -10.521 |
probably | -9.762 |
absolutely | -9.575 |
Token | alcohol |
Token ID | 5548 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
slang | +1.112 |
stereotype | +1.082 |
curfew | +1.053 |
ingrained | +1.039 |
puberty | +1.031 |
Neg logit contributions | |
elect | -1.015 |
events | -0.955 |
oops | -0.940 |
awaits | -0.915 |
probably | -0.882 |
Token | monitoring |
Token ID | 9904 |
Feature activation | +1.72e+00 |
Pos logit contributions | |
slang | +13.887 |
curfew | +13.805 |
stereotype | +13.318 |
mentality | +12.912 |
leash | +12.840 |
Neg logit contributions | |
elect | -13.957 |
oops | -13.298 |
events | -13.165 |
probably | -12.369 |
absolutely | -12.220 |
Token | or |
Token ID | 393 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
slang | +14.477 |
curfew | +14.062 |
worn | +13.902 |
stereotype | +13.735 |
mentality | +13.670 |
Neg logit contributions | |
elect | -13.827 |
oops | -13.256 |
events | -13.116 |
probably | -12.428 |
absolutely | -12.323 |
Token | SC |
Token ID | 6374 |
Feature activation | +9.39e-01 |
Pos logit contributions | |
slang | +1.259 |
stereotype | +1.223 |
curfew | +1.187 |
ingrained | +1.172 |
puberty | +1.163 |
Neg logit contributions | |
elect | -1.311 |
events | -1.239 |
oops | -1.219 |
awaits | -1.191 |
probably | -1.150 |
Token | RAM |
Token ID | 24115 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
slang | +8.259 |
stereotype | +7.939 |
curfew | +7.808 |
ingrained | +7.598 |
puberty | +7.557 |
Neg logit contributions | |
elect | -8.741 |
events | -8.388 |
oops | -8.195 |
awaits | -8.025 |
probably | -7.796 |
Token | requirements |
Token ID | 5359 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
slang | +19.792 |
curfew | +19.651 |
mentality | +18.859 |
worn | +18.712 |
stereotype | +18.588 |
Neg logit contributions | |
elect | -14.707 |
oops | -14.086 |
events | -14.006 |
probably | -13.015 |
ilib | -12.785 |
Token | removed |
Token ID | 4615 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
ingrained | +19.026 |
worn | +18.774 |
slang | +18.509 |
curfew | +18.223 |
stereotype | +18.144 |
Neg logit contributions | |
events | -17.411 |
elect | -17.168 |
oops | -16.910 |
probably | -15.107 |
ilib | -14.962 |
Token | , |
Token ID | 11 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
slang | +9.821 |
stereotype | +9.373 |
ingrained | +9.346 |
curfew | +9.341 |
mentality | +9.127 |
Neg logit contributions | |
elect | -10.361 |
oops | -10.110 |
events | -9.951 |
probably | -9.147 |
awaits | -9.126 |
Token | and |
Token ID | 290 |
Feature activation | +4.22e-01 |
Pos logit contributions | |
slang | +9.802 |
stereotype | +9.292 |
curfew | +9.254 |
ingrained | +8.965 |
mentality | +8.875 |
Neg logit contributions | |
elect | -10.090 |
events | -9.590 |
oops | -9.535 |
awaits | -8.983 |
absolutely | -8.873 |
Token | the |
Token ID | 262 |
Feature activation | +7.08e-01 |
Pos logit contributions | |
slang | +3.907 |
stereotype | +3.789 |
curfew | +3.718 |
ingrained | +3.637 |
puberty | +3.606 |
Neg logit contributions | |
elect | -4.016 |
events | -3.803 |
oops | -3.777 |
awaits | -3.613 |
probably | -3.530 |
Token | — |
Token ID | 851 |
Feature activation | -7.55e-01 |
Pos logit contributions | |
elect | +12.107 |
awaits | +10.924 |
indeed | +10.819 |
events | +10.756 |
absolutely | +10.132 |
Neg logit contributions | |
slang | -12.239 |
stereotype | -11.592 |
curfew | -11.424 |
puberty | -11.121 |
ingrained | -10.957 |
Token | as |
Token ID | 355 |
Feature activation | -6.48e-01 |
Pos logit contributions | |
elect | +6.793 |
events | +6.307 |
oops | +6.067 |
awaits | +6.025 |
indeed | +5.991 |
Neg logit contributions | |
slang | -7.014 |
stereotype | -6.809 |
curfew | -6.726 |
puberty | -6.543 |
ingrained | -6.506 |
Token | promised |
Token ID | 8072 |
Feature activation | +4.54e-04 |
Pos logit contributions | |
elect | +6.036 |
events | +5.597 |
awaits | +5.581 |
oops | +5.431 |
indeed | +5.359 |
Neg logit contributions | |
slang | -5.882 |
stereotype | -5.615 |
curfew | -5.513 |
puberty | -5.364 |
ingrained | -5.331 |
Token | — |
Token ID | 851 |
Feature activation | -8.43e-01 |
Pos logit contributions | |
slang | +0.005 |
stereotype | +0.004 |
curfew | +0.004 |
ingrained | +0.004 |
puberty | +0.004 |
Neg logit contributions | |
elect | -0.004 |
events | -0.004 |
oops | -0.004 |
awaits | -0.004 |
probably | -0.004 |
Token | in |
Token ID | 287 |
Feature activation | -2.67e+00 |
Pos logit contributions | |
elect | +8.323 |
events | +7.730 |
awaits | +7.541 |
indeed | +7.396 |
probably | +7.316 |
Neg logit contributions | |
slang | -7.089 |
stereotype | -6.713 |
curfew | -6.655 |
puberty | -6.390 |
ingrained | -6.328 |
Token | the |
Token ID | 262 |
Feature activation | -2.92e+00 |
Pos logit contributions | |
elect | +19.622 |
indeed | +18.155 |
wins | +18.151 |
votes | +17.756 |
events | +17.696 |
Neg logit contributions | |
slang | -16.294 |
ipedia | -14.988 |
stereotype | -14.655 |
curfew | -14.522 |
ESE | -14.460 |
Token | Gran |
Token ID | 17113 |
Feature activation | -9.68e-01 |
Pos logit contributions | |
elect | +21.733 |
votes | +20.672 |
unlikely | +19.925 |
events | +19.836 |
bids | +19.795 |
Neg logit contributions | |
slang | -15.542 |
ipedia | -14.792 |
puberty | -14.501 |
colonialism | -14.149 |
guiActiveUnfocused | -14.048 |
Token | ite |
Token ID | 578 |
Feature activation | -7.37e-01 |
Pos logit contributions | |
elect | +5.003 |
events | +4.556 |
probably | +4.215 |
oops | +4.122 |
awaits | +3.944 |
Neg logit contributions | |
curfew | -12.282 |
slang | -12.250 |
stereotype | -11.972 |
ingrained | -11.808 |
puberty | -11.787 |
Token | State |
Token ID | 1812 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
elect | +6.781 |
events | +6.366 |
awaits | +6.091 |
oops | +6.065 |
probably | +5.842 |
Neg logit contributions | |
slang | -6.763 |
curfew | -6.433 |
stereotype | -6.377 |
puberty | -6.335 |
ingrained | -6.270 |
Token | to |
Token ID | 284 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
elect | +14.263 |
awaits | +13.502 |
events | +12.984 |
indeed | +12.953 |
probably | +12.141 |
Neg logit contributions | |
slang | -13.467 |
curfew | -12.844 |
puberty | -12.754 |
stereotype | -12.487 |
ingrained | -12.368 |
Token | give |
Token ID | 1577 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
elect | +12.536 |
indeed | +12.397 |
awaits | +11.293 |
events | +11.259 |
absolutely | +10.962 |
Neg logit contributions | |
slang | -12.153 |
puberty | -11.623 |
curfew | -11.605 |
stereotype | -10.949 |
ingrained | -10.872 |
Token | July |
Token ID | 2901 |
Feature activation | +7.53e-01 |
Pos logit contributions | |
slang | +1.718 |
stereotype | +1.668 |
curfew | +1.625 |
ingrained | +1.598 |
puberty | +1.585 |
Neg logit contributions | |
elect | -1.745 |
events | -1.649 |
oops | -1.627 |
awaits | -1.583 |
probably | -1.531 |
Token | 2017 |
Token ID | 2177 |
Feature activation | +6.48e-01 |
Pos logit contributions | |
slang | +6.769 |
stereotype | +6.535 |
curfew | +6.409 |
ingrained | +6.305 |
puberty | +6.278 |
Neg logit contributions | |
elect | -6.963 |
events | -6.699 |
oops | -6.629 |
awaits | -6.357 |
probably | -6.217 |
Token | , |
Token ID | 11 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
slang | +6.179 |
stereotype | +5.970 |
curfew | +5.856 |
ingrained | +5.798 |
puberty | +5.740 |
Neg logit contributions | |
elect | -5.741 |
events | -5.475 |
oops | -5.389 |
awaits | -5.193 |
probably | -5.049 |
Token | if |
Token ID | 611 |
Feature activation | -2.52e-01 |
Pos logit contributions | |
slang | +10.970 |
stereotype | +10.570 |
curfew | +10.492 |
ingrained | +10.347 |
puberty | +10.310 |
Neg logit contributions | |
elect | -10.672 |
events | -10.220 |
oops | -10.105 |
awaits | -9.528 |
probably | -9.332 |
Token | Labor |
Token ID | 7882 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
elect | +2.619 |
events | +2.473 |
oops | +2.429 |
awaits | +2.411 |
indeed | +2.338 |
Neg logit contributions | |
slang | -2.089 |
stereotype | -2.027 |
curfew | -1.957 |
ingrained | -1.903 |
puberty | -1.888 |
Token | wins |
Token ID | 7864 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
elect | +9.312 |
awaits | +8.469 |
indeed | +8.335 |
events | +8.328 |
oops | +8.154 |
Neg logit contributions | |
slang | -9.724 |
stereotype | -9.607 |
curfew | -9.481 |
puberty | -9.044 |
ingrained | -8.906 |
Token | the |
Token ID | 262 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
elect | +21.429 |
indeed | +18.814 |
votes | +18.201 |
events | +17.489 |
wins | +17.427 |
Neg logit contributions | |
slang | -16.857 |
stereotype | -16.132 |
avy | -15.417 |
curfew | -15.411 |
ingrained | -15.027 |
Token | election |
Token ID | 3071 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
elect | +18.717 |
votes | +16.716 |
events | +16.569 |
indeed | +15.965 |
probably | +15.669 |
Neg logit contributions | |
slang | -14.617 |
ipedia | -13.933 |
stereotype | -13.922 |
ESE | -13.566 |
curfew | -13.533 |
Token | . |
Token ID | 13 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
elect | +16.266 |
indeed | +14.808 |
awaits | +14.719 |
events | +13.972 |
probably | +13.475 |
Neg logit contributions | |
slang | -17.372 |
stereotype | -16.629 |
curfew | -16.453 |
colonialism | -15.857 |
puberty | -15.724 |
Token | Given |
Token ID | 11259 |
Feature activation | +6.63e-01 |
Pos logit contributions | |
slang | +0.111 |
stereotype | +0.108 |
curfew | +0.106 |
ingrained | +0.104 |
puberty | +0.103 |
Neg logit contributions | |
elect | -0.093 |
events | -0.088 |
oops | -0.086 |
awaits | -0.084 |
probably | -0.081 |
Token | the |
Token ID | 262 |
Feature activation | -5.67e-02 |
Pos logit contributions | |
slang | +5.189 |
stereotype | +5.059 |
curfew | +4.855 |
ingrained | +4.854 |
puberty | +4.721 |
Neg logit contributions | |
elect | -7.007 |
oops | -6.766 |
events | -6.693 |
awaits | -6.487 |
probably | -6.369 |
Token | all |
Token ID | 477 |
Feature activation | -9.58e-03 |
Pos logit contributions | |
slang | +6.825 |
stereotype | +6.543 |
curfew | +6.384 |
ingrained | +6.349 |
puberty | +6.208 |
Neg logit contributions | |
elect | -7.613 |
events | -7.261 |
oops | -7.244 |
awaits | -6.965 |
probably | -6.818 |
Token | family |
Token ID | 1641 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
elect | +0.090 |
events | +0.085 |
oops | +0.084 |
awaits | +0.082 |
probably | +0.079 |
Neg logit contributions | |
slang | -0.090 |
stereotype | -0.087 |
curfew | -0.085 |
puberty | -0.083 |
ingrained | -0.083 |
Token | ties |
Token ID | 8470 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
elect | +5.056 |
events | +4.743 |
awaits | +4.607 |
oops | +4.519 |
indeed | +4.386 |
Neg logit contributions | |
slang | -5.327 |
stereotype | -5.281 |
curfew | -5.150 |
puberty | -5.099 |
ingrained | -5.043 |
Token | if |
Token ID | 611 |
Feature activation | -5.90e-01 |
Pos logit contributions | |
slang | +2.173 |
stereotype | +2.093 |
curfew | +2.029 |
ingrained | +2.012 |
puberty | +1.976 |
Neg logit contributions | |
elect | -2.861 |
events | -2.722 |
oops | -2.702 |
awaits | -2.618 |
probably | -2.556 |
Token | Clinton |
Token ID | 2605 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
elect | +5.670 |
events | +5.295 |
awaits | +5.225 |
oops | +5.189 |
indeed | +5.096 |
Neg logit contributions | |
slang | -5.220 |
stereotype | -5.049 |
curfew | -4.919 |
ingrained | -4.764 |
puberty | -4.734 |
Token | wins |
Token ID | 7864 |
Feature activation | -2.71e+00 |
Pos logit contributions | |
indeed | +15.747 |
elect | +15.513 |
awaits | +15.424 |
wins | +15.413 |
casts | +14.023 |
Neg logit contributions | |
slang | -16.986 |
stereotype | -16.519 |
curfew | -16.336 |
puberty | -15.739 |
ingrained | -15.334 |
Token | in |
Token ID | 287 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
elect | +19.745 |
indeed | +17.288 |
awaits | +15.844 |
events | +15.680 |
votes | +15.640 |
Neg logit contributions | |
slang | -18.474 |
stereotype | -17.654 |
curfew | -17.645 |
guiActiveUnfocused | -17.167 |
ingrained | -16.522 |
Token | November |
Token ID | 3389 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
elect | +15.814 |
indeed | +14.057 |
unlikely | +12.911 |
probably | +12.868 |
votes | +12.817 |
Neg logit contributions | |
slang | -20.389 |
guiActiveUnfocused | -20.158 |
stereotype | -20.084 |
curfew | -19.983 |
ESE | -19.845 |
Token | . |
Token ID | 13 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
elect | +11.938 |
events | +10.246 |
awaits | +10.210 |
indeed | +10.175 |
oops | +9.716 |
Neg logit contributions | |
slang | -15.566 |
stereotype | -15.157 |
curfew | -15.132 |
puberty | -14.930 |
ingrained | -14.447 |
Token |
|
Token ID | 198 |
Feature activation | +5.00e-01 |
Pos logit contributions | |
elect | +1.561 |
events | +1.467 |
oops | +1.437 |
awaits | +1.402 |
probably | +1.353 |
Neg logit contributions | |
slang | -1.908 |
stereotype | -1.861 |
curfew | -1.839 |
ingrained | -1.809 |
puberty | -1.799 |
Token |
|
Token ID | 198 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
slang | +4.566 |
stereotype | +4.384 |
curfew | +4.221 |
ingrained | +4.213 |
puberty | +4.147 |
Neg logit contributions | |
elect | -4.665 |
events | -4.418 |
oops | -4.401 |
awaits | -4.300 |
probably | -4.064 |
Token | family |
Token ID | 1641 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
elect | +0.090 |
events | +0.085 |
oops | +0.084 |
awaits | +0.082 |
probably | +0.079 |
Neg logit contributions | |
slang | -0.090 |
stereotype | -0.087 |
curfew | -0.085 |
puberty | -0.083 |
ingrained | -0.083 |
Token | ties |
Token ID | 8470 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
elect | +5.056 |
events | +4.743 |
awaits | +4.607 |
oops | +4.519 |
indeed | +4.386 |
Neg logit contributions | |
slang | -5.327 |
stereotype | -5.281 |
curfew | -5.150 |
puberty | -5.099 |
ingrained | -5.043 |
Token | if |
Token ID | 611 |
Feature activation | -5.90e-01 |
Pos logit contributions | |
slang | +2.173 |
stereotype | +2.093 |
curfew | +2.029 |
ingrained | +2.012 |
puberty | +1.976 |
Neg logit contributions | |
elect | -2.861 |
events | -2.722 |
oops | -2.702 |
awaits | -2.618 |
probably | -2.556 |
Token | Clinton |
Token ID | 2605 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
elect | +5.670 |
events | +5.295 |
awaits | +5.225 |
oops | +5.189 |
indeed | +5.096 |
Neg logit contributions | |
slang | -5.220 |
stereotype | -5.049 |
curfew | -4.919 |
ingrained | -4.764 |
puberty | -4.734 |
Token | wins |
Token ID | 7864 |
Feature activation | -2.71e+00 |
Pos logit contributions | |
indeed | +15.747 |
elect | +15.513 |
awaits | +15.424 |
wins | +15.413 |
casts | +14.023 |
Neg logit contributions | |
slang | -16.986 |
stereotype | -16.519 |
curfew | -16.336 |
puberty | -15.739 |
ingrained | -15.334 |
Token | in |
Token ID | 287 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
elect | +19.745 |
indeed | +17.288 |
awaits | +15.844 |
events | +15.680 |
votes | +15.640 |
Neg logit contributions | |
slang | -18.474 |
stereotype | -17.654 |
curfew | -17.645 |
guiActiveUnfocused | -17.167 |
ingrained | -16.522 |
Token | November |
Token ID | 3389 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
elect | +15.814 |
indeed | +14.057 |
unlikely | +12.911 |
probably | +12.868 |
votes | +12.817 |
Neg logit contributions | |
slang | -20.389 |
guiActiveUnfocused | -20.158 |
stereotype | -20.084 |
curfew | -19.983 |
ESE | -19.845 |
Token | . |
Token ID | 13 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
elect | +11.938 |
events | +10.246 |
awaits | +10.210 |
indeed | +10.175 |
oops | +9.716 |
Neg logit contributions | |
slang | -15.566 |
stereotype | -15.157 |
curfew | -15.132 |
puberty | -14.930 |
ingrained | -14.447 |
Token |
|
Token ID | 198 |
Feature activation | +5.00e-01 |
Pos logit contributions | |
elect | +1.561 |
events | +1.467 |
oops | +1.437 |
awaits | +1.402 |
probably | +1.353 |
Neg logit contributions | |
slang | -1.908 |
stereotype | -1.861 |
curfew | -1.839 |
ingrained | -1.809 |
puberty | -1.799 |
Token |
|
Token ID | 198 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
slang | +4.566 |
stereotype | +4.384 |
curfew | +4.221 |
ingrained | +4.213 |
puberty | +4.147 |
Neg logit contributions | |
elect | -4.665 |
events | -4.418 |
oops | -4.401 |
awaits | -4.300 |
probably | -4.064 |
Token | In |
Token ID | 818 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
slang | +2.275 |
stereotype | +2.203 |
curfew | +2.140 |
ingrained | +2.119 |
puberty | +2.090 |
Neg logit contributions | |
elect | -2.106 |
events | -1.987 |
oops | -1.959 |
awaits | -1.928 |
probably | -1.833 |
Token | 't |
Token ID | 470 |
Feature activation | +9.65e-02 |
Pos logit contributions | |
elect | +1.636 |
events | +1.446 |
oops | +1.407 |
probably | +1.292 |
awaits | +1.265 |
Neg logit contributions | |
slang | -4.794 |
stereotype | -4.755 |
curfew | -4.736 |
puberty | -4.623 |
ingrained | -4.606 |
Token | matter |
Token ID | 2300 |
Feature activation | -4.84e-01 |
Pos logit contributions | |
slang | +0.827 |
stereotype | +0.798 |
curfew | +0.778 |
ingrained | +0.764 |
puberty | +0.758 |
Neg logit contributions | |
elect | -0.992 |
events | -0.940 |
oops | -0.924 |
awaits | -0.908 |
probably | -0.879 |
Token | whether |
Token ID | 1771 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
elect | +4.264 |
events | +4.002 |
awaits | +3.870 |
oops | +3.782 |
indeed | +3.778 |
Neg logit contributions | |
slang | -4.639 |
stereotype | -4.525 |
curfew | -4.447 |
puberty | -4.326 |
ingrained | -4.283 |
Token | Britain |
Token ID | 5491 |
Feature activation | -3.72e-01 |
Pos logit contributions | |
elect | +2.568 |
events | +2.405 |
awaits | +2.350 |
oops | +2.341 |
indeed | +2.240 |
Neg logit contributions | |
slang | -2.357 |
stereotype | -2.275 |
curfew | -2.221 |
ingrained | -2.175 |
puberty | -2.153 |
Token | agrees |
Token ID | 14386 |
Feature activation | -7.36e-01 |
Pos logit contributions | |
elect | +2.519 |
events | +2.261 |
awaits | +2.241 |
oops | +2.222 |
indeed | +2.042 |
Neg logit contributions | |
slang | -4.456 |
stereotype | -4.352 |
curfew | -4.286 |
puberty | -4.198 |
ingrained | -4.193 |
Token | or |
Token ID | 393 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
elect | +6.844 |
events | +6.319 |
awaits | +6.258 |
indeed | +6.074 |
oops | +6.056 |
Neg logit contributions | |
slang | -6.497 |
stereotype | -6.304 |
curfew | -6.119 |
ingrained | -6.007 |
puberty | -5.947 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e-01 |
Pos logit contributions | |
elect | +18.304 |
indeed | +18.090 |
awaits | +18.073 |
rejects | +17.169 |
dies | +17.027 |
Neg logit contributions | |
slang | -18.749 |
guiActiveUnfocused | -18.387 |
puberty | -18.223 |
curfew | -18.218 |
stereotype | -18.155 |
Token | , |
Token ID | 11 |
Feature activation | -4.50e-01 |
Pos logit contributions | |
elect | +4.027 |
events | +3.747 |
awaits | +3.658 |
oops | +3.641 |
indeed | +3.513 |
Neg logit contributions | |
slang | -4.057 |
stereotype | -3.915 |
curfew | -3.815 |
ingrained | -3.736 |
puberty | -3.725 |
Token | or |
Token ID | 393 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
elect | +4.121 |
events | +3.864 |
awaits | +3.772 |
oops | +3.757 |
indeed | +3.647 |
Neg logit contributions | |
slang | -4.221 |
stereotype | -4.094 |
curfew | -3.983 |
puberty | -3.906 |
ingrained | -3.897 |
Token | even |
Token ID | 772 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
elect | +11.663 |
indeed | +11.531 |
awaits | +11.135 |
events | +10.670 |
else | +10.257 |
Neg logit contributions | |
slang | -12.261 |
stereotype | -11.855 |
curfew | -11.626 |
puberty | -11.589 |
ingrained | -11.224 |
Token | whether |
Token ID | 1771 |
Feature activation | -4.14e-01 |
Pos logit contributions | |
elect | +8.400 |
awaits | +7.933 |
indeed | +7.734 |
events | +7.634 |
oops | +7.316 |
Neg logit contributions | |
slang | -9.827 |
stereotype | -9.517 |
curfew | -9.363 |
puberty | -9.291 |
ingrained | -9.171 |
Token | prevail |
Token ID | 28615 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
elect | +8.655 |
events | +7.940 |
indeed | +7.880 |
awaits | +7.673 |
probably | +7.577 |
Neg logit contributions | |
slang | -8.066 |
curfew | -7.681 |
puberty | -7.575 |
stereotype | -7.490 |
ingrained | -7.352 |
Token | — |
Token ID | 851 |
Feature activation | -7.55e-01 |
Pos logit contributions | |
elect | +12.107 |
awaits | +10.924 |
indeed | +10.819 |
events | +10.756 |
absolutely | +10.132 |
Neg logit contributions | |
slang | -12.239 |
stereotype | -11.592 |
curfew | -11.424 |
puberty | -11.121 |
ingrained | -10.957 |
Token | as |
Token ID | 355 |
Feature activation | -6.48e-01 |
Pos logit contributions | |
elect | +6.793 |
events | +6.307 |
oops | +6.067 |
awaits | +6.025 |
indeed | +5.991 |
Neg logit contributions | |
slang | -7.014 |
stereotype | -6.809 |
curfew | -6.726 |
puberty | -6.543 |
ingrained | -6.506 |
Token | promised |
Token ID | 8072 |
Feature activation | +4.54e-04 |
Pos logit contributions | |
elect | +6.036 |
events | +5.597 |
awaits | +5.581 |
oops | +5.431 |
indeed | +5.359 |
Neg logit contributions | |
slang | -5.882 |
stereotype | -5.615 |
curfew | -5.513 |
puberty | -5.364 |
ingrained | -5.331 |
Token | — |
Token ID | 851 |
Feature activation | -8.43e-01 |
Pos logit contributions | |
slang | +0.005 |
stereotype | +0.004 |
curfew | +0.004 |
ingrained | +0.004 |
puberty | +0.004 |
Neg logit contributions | |
elect | -0.004 |
events | -0.004 |
oops | -0.004 |
awaits | -0.004 |
probably | -0.004 |
Token | in |
Token ID | 287 |
Feature activation | -2.67e+00 |
Pos logit contributions | |
elect | +8.323 |
events | +7.730 |
awaits | +7.541 |
indeed | +7.396 |
probably | +7.316 |
Neg logit contributions | |
slang | -7.089 |
stereotype | -6.713 |
curfew | -6.655 |
puberty | -6.390 |
ingrained | -6.328 |
Token | the |
Token ID | 262 |
Feature activation | -2.92e+00 |
Pos logit contributions | |
elect | +19.622 |
indeed | +18.155 |
wins | +18.151 |
votes | +17.756 |
events | +17.696 |
Neg logit contributions | |
slang | -16.294 |
ipedia | -14.988 |
stereotype | -14.655 |
curfew | -14.522 |
ESE | -14.460 |
Token | Gran |
Token ID | 17113 |
Feature activation | -9.68e-01 |
Pos logit contributions | |
elect | +21.733 |
votes | +20.672 |
unlikely | +19.925 |
events | +19.836 |
bids | +19.795 |
Neg logit contributions | |
slang | -15.542 |
ipedia | -14.792 |
puberty | -14.501 |
colonialism | -14.149 |
guiActiveUnfocused | -14.048 |
Token | ite |
Token ID | 578 |
Feature activation | -7.37e-01 |
Pos logit contributions | |
elect | +5.003 |
events | +4.556 |
probably | +4.215 |
oops | +4.122 |
awaits | +3.944 |
Neg logit contributions | |
curfew | -12.282 |
slang | -12.250 |
stereotype | -11.972 |
ingrained | -11.808 |
puberty | -11.787 |
Token | State |
Token ID | 1812 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
elect | +6.781 |
events | +6.366 |
awaits | +6.091 |
oops | +6.065 |
probably | +5.842 |
Neg logit contributions | |
slang | -6.763 |
curfew | -6.433 |
stereotype | -6.377 |
puberty | -6.335 |
ingrained | -6.270 |
Token | to |
Token ID | 284 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
elect | +14.263 |
awaits | +13.502 |
events | +12.984 |
indeed | +12.953 |
probably | +12.141 |
Neg logit contributions | |
slang | -13.467 |
curfew | -12.844 |
puberty | -12.754 |
stereotype | -12.487 |
ingrained | -12.368 |
Token | mean |
Token ID | 1612 |
Feature activation | +4.84e-02 |
Pos logit contributions | |
slang | +5.586 |
stereotype | +5.501 |
curfew | +5.226 |
ingrained | +5.192 |
mentality | +5.174 |
Neg logit contributions | |
elect | -6.403 |
events | -6.133 |
oops | -6.048 |
awaits | -5.854 |
papers | -5.633 |
Token | they |
Token ID | 484 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
slang | +0.439 |
stereotype | +0.426 |
curfew | +0.415 |
ingrained | +0.408 |
puberty | +0.405 |
Neg logit contributions | |
elect | -0.472 |
events | -0.447 |
oops | -0.440 |
awaits | -0.429 |
probably | -0.415 |
Token | can |
Token ID | 460 |
Feature activation | -6.47e-01 |
Pos logit contributions | |
elect | +1.226 |
events | +1.148 |
oops | +1.131 |
awaits | +1.109 |
probably | +1.073 |
Neg logit contributions | |
slang | -1.507 |
stereotype | -1.450 |
curfew | -1.432 |
puberty | -1.399 |
ingrained | -1.399 |
Token | get |
Token ID | 651 |
Feature activation | +7.39e-01 |
Pos logit contributions | |
elect | +5.575 |
events | +5.140 |
oops | +5.104 |
awaits | +5.044 |
indeed | +5.038 |
Neg logit contributions | |
slang | -6.258 |
curfew | -5.917 |
stereotype | -5.851 |
puberty | -5.834 |
ingrained | -5.781 |
Token | back |
Token ID | 736 |
Feature activation | +6.47e-01 |
Pos logit contributions | |
slang | +6.160 |
stereotype | +6.019 |
curfew | +5.806 |
ingrained | +5.796 |
worn | +5.681 |
Neg logit contributions | |
elect | -7.457 |
events | -7.137 |
oops | -7.113 |
awaits | -6.813 |
probably | -6.690 |
Token | ? |
Token ID | 30 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
slang | +5.087 |
stereotype | +4.971 |
ingrained | +4.805 |
curfew | +4.759 |
puberty | +4.725 |
Neg logit contributions | |
elect | -6.815 |
events | -6.529 |
oops | -6.494 |
awaits | -6.287 |
probably | -6.068 |
Token | Yes |
Token ID | 3363 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
Nothing | +15.421 |
probably | +15.333 |
elect | +15.101 |
absolutely | +15.094 |
Absolutely | +15.054 |
Neg logit contributions | |
curfew | -21.184 |
puberty | -21.155 |
slang | -20.984 |
ingrained | -20.381 |
stereotype | -20.272 |
Token | , |
Token ID | 11 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
indeed | +15.126 |
elect | +15.099 |
absolutely | +14.154 |
awaits | +13.944 |
probably | +13.843 |
Neg logit contributions | |
slang | -16.341 |
curfew | -15.787 |
stereotype | -15.781 |
puberty | -15.595 |
ingrained | -15.127 |
Token | they |
Token ID | 484 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
elect | +13.782 |
indeed | +13.722 |
absolutely | +13.335 |
probably | +13.016 |
oops | +12.842 |
Neg logit contributions | |
slang | -14.897 |
stereotype | -14.006 |
puberty | -13.978 |
guiActiveUnfocused | -13.901 |
curfew | -13.884 |
Token | have |
Token ID | 423 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
elect | +1.078 |
events | +1.006 |
oops | +0.988 |
awaits | +0.965 |
probably | +0.939 |
Neg logit contributions | |
slang | -1.438 |
stereotype | -1.390 |
curfew | -1.369 |
ingrained | -1.340 |
puberty | -1.340 |
Token | a |
Token ID | 257 |
Feature activation | +7.73e-01 |
Pos logit contributions | |
elect | +3.112 |
events | +2.956 |
oops | +2.880 |
awaits | +2.870 |
probably | +2.778 |
Neg logit contributions | |
slang | -2.735 |
stereotype | -2.621 |
curfew | -2.554 |
puberty | -2.494 |
ingrained | -2.489 |
Token | - |
Token ID | 12 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
slang | +3.778 |
stereotype | +3.665 |
curfew | +3.581 |
ingrained | +3.530 |
puberty | +3.511 |
Neg logit contributions | |
elect | -3.146 |
events | -2.976 |
oops | -2.926 |
awaits | -2.833 |
probably | -2.739 |
Token | out |
Token ID | 448 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
elect | +1.402 |
events | +1.301 |
oops | +1.284 |
awaits | +1.224 |
probably | +1.184 |
Neg logit contributions | |
slang | -2.060 |
stereotype | -2.018 |
curfew | -1.971 |
ingrained | -1.949 |
puberty | -1.944 |
Token | Assange |
Token ID | 21882 |
Feature activation | -3.94e-01 |
Pos logit contributions | |
elect | +2.380 |
events | +2.235 |
oops | +2.194 |
awaits | +2.142 |
probably | +2.062 |
Neg logit contributions | |
slang | -2.528 |
stereotype | -2.467 |
curfew | -2.401 |
ingrained | -2.366 |
puberty | -2.343 |
Token | if |
Token ID | 611 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
elect | +3.907 |
events | +3.662 |
awaits | +3.600 |
oops | +3.580 |
probably | +3.440 |
Neg logit contributions | |
slang | -3.420 |
stereotype | -3.331 |
curfew | -3.280 |
ingrained | -3.164 |
puberty | -3.158 |
Token | he |
Token ID | 339 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
elect | +9.426 |
events | +8.572 |
awaits | +8.546 |
oops | +8.438 |
indeed | +8.393 |
Neg logit contributions | |
slang | -9.217 |
stereotype | -9.052 |
curfew | -8.732 |
ingrained | -8.619 |
mentality | -8.517 |
Token | wins |
Token ID | 7864 |
Feature activation | -2.59e+00 |
Pos logit contributions | |
elect | +15.074 |
awaits | +14.851 |
indeed | +14.448 |
wins | +14.199 |
casts | +13.614 |
Neg logit contributions | |
slang | -13.964 |
stereotype | -13.483 |
curfew | -13.422 |
puberty | -13.018 |
leash | -12.696 |
Token | . |
Token ID | 13 |
Feature activation | -3.28e-01 |
Pos logit contributions | |
elect | +19.973 |
indeed | +17.142 |
awaits | +16.751 |
votes | +16.581 |
bids | +16.305 |
Neg logit contributions | |
slang | -16.746 |
stereotype | -16.545 |
curfew | -15.613 |
guiActiveUnfocused | -15.493 |
ingrained | -15.446 |
Token | Moreno |
Token ID | 43269 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
elect | +2.673 |
events | +2.494 |
oops | +2.440 |
awaits | +2.390 |
probably | +2.289 |
Neg logit contributions | |
slang | -3.458 |
stereotype | -3.394 |
curfew | -3.341 |
ingrained | -3.310 |
puberty | -3.274 |
Token | , |
Token ID | 11 |
Feature activation | -8.72e-01 |
Pos logit contributions | |
elect | +12.099 |
awaits | +11.718 |
indeed | +10.995 |
events | +10.848 |
oops | +10.418 |
Neg logit contributions | |
slang | -12.616 |
curfew | -12.291 |
stereotype | -12.223 |
puberty | -11.877 |
ingrained | -11.572 |
Token | meanwhile |
Token ID | 15066 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
elect | +7.944 |
events | +7.223 |
awaits | +7.219 |
oops | +7.068 |
indeed | +7.014 |
Neg logit contributions | |
slang | -7.507 |
stereotype | -7.460 |
curfew | -7.386 |
puberty | -7.103 |
ingrained | -7.029 |
Token | , |
Token ID | 11 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
elect | +6.837 |
awaits | +6.205 |
events | +5.834 |
indeed | +5.494 |
oops | +5.476 |
Neg logit contributions | |
slang | -13.174 |
stereotype | -12.985 |
curfew | -12.918 |
puberty | -12.491 |
leash | -12.314 |
Token | campaign |
Token ID | 1923 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
elect | +8.013 |
events | +7.271 |
awaits | +7.191 |
oops | +7.102 |
probably | +6.912 |
Neg logit contributions | |
slang | -7.136 |
stereotype | -6.840 |
curfew | -6.752 |
puberty | -6.733 |
ingrained | -6.539 |
Token | all |
Token ID | 477 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
elect | +2.175 |
events | +2.054 |
oops | +2.002 |
awaits | +1.990 |
indeed | +1.921 |
Neg logit contributions | |
slang | -1.578 |
stereotype | -1.531 |
curfew | -1.500 |
ingrained | -1.467 |
puberty | -1.462 |
Token | the |
Token ID | 262 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
elect | +2.308 |
events | +2.160 |
oops | +2.136 |
awaits | +2.110 |
probably | +2.042 |
Neg logit contributions | |
slang | -1.515 |
stereotype | -1.453 |
curfew | -1.405 |
ingrained | -1.365 |
puberty | -1.353 |
Token | way |
Token ID | 835 |
Feature activation | -3.81e-02 |
Pos logit contributions | |
elect | +3.743 |
events | +3.500 |
oops | +3.471 |
awaits | +3.404 |
probably | +3.329 |
Neg logit contributions | |
slang | -2.135 |
stereotype | -2.040 |
curfew | -1.976 |
puberty | -1.928 |
ingrained | -1.913 |
Token | to |
Token ID | 284 |
Feature activation | -2.44e+00 |
Pos logit contributions | |
elect | +0.427 |
events | +0.406 |
oops | +0.399 |
awaits | +0.394 |
probably | +0.381 |
Neg logit contributions | |
slang | -0.292 |
stereotype | -0.281 |
curfew | -0.273 |
ingrained | -0.266 |
puberty | -0.265 |
Token | the |
Token ID | 262 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
elect | +18.240 |
events | +16.001 |
indeed | +15.928 |
wins | +15.755 |
awaits | +15.387 |
Neg logit contributions | |
slang | -17.089 |
stereotype | -15.585 |
curfew | -15.462 |
ESE | -15.065 |
ingrained | -14.938 |
Token | Democratic |
Token ID | 4390 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
elect | +18.282 |
wins | +16.997 |
votes | +16.920 |
events | +16.662 |
indeed | +16.417 |
Neg logit contributions | |
slang | -16.320 |
puberty | -15.395 |
ESE | -14.837 |
ipedia | -14.791 |
stereotype | -14.656 |
Token | National |
Token ID | 2351 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
elect | +12.734 |
events | +10.900 |
awaits | +10.835 |
indeed | +10.546 |
votes | +10.458 |
Neg logit contributions | |
slang | -14.694 |
curfew | -14.489 |
ingrained | -13.889 |
stereotype | -13.839 |
puberty | -13.619 |
Token | Convention |
Token ID | 11680 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
elect | +9.192 |
events | +8.340 |
awaits | +8.129 |
oops | +7.710 |
indeed | +7.326 |
Neg logit contributions | |
stereotype | -13.893 |
slang | -13.845 |
puberty | -13.837 |
ingrained | -13.657 |
curfew | -13.440 |
Token | in |
Token ID | 287 |
Feature activation | -2.56e+00 |
Pos logit contributions | |
elect | +14.990 |
awaits | +13.767 |
events | +13.574 |
indeed | +13.317 |
probably | +13.313 |
Neg logit contributions | |
slang | -15.922 |
curfew | -15.394 |
stereotype | -15.290 |
puberty | -15.161 |
leash | -14.650 |
Token | July |
Token ID | 2901 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
elect | +14.253 |
indeed | +12.757 |
probably | +12.742 |
events | +12.645 |
legates | +12.456 |
Neg logit contributions | |
puberty | -20.315 |
slang | -20.003 |
ESE | -19.786 |
ipedia | -19.352 |
guiActiveUnfocused | -19.343 |
Token | up |
Token ID | 510 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
elect | +4.274 |
events | +4.009 |
oops | +3.912 |
awaits | +3.885 |
indeed | +3.745 |
Neg logit contributions | |
slang | -3.205 |
stereotype | -3.063 |
curfew | -3.043 |
ingrained | -2.931 |
puberty | -2.914 |
Token | at |
Token ID | 379 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
elect | +13.920 |
events | +12.700 |
indeed | +12.577 |
awaits | +12.294 |
rooms | +11.563 |
Neg logit contributions | |
slang | -12.932 |
stereotype | -12.440 |
curfew | -12.361 |
colonialism | -12.204 |
puberty | -11.963 |
Token | a |
Token ID | 257 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
elect | +18.398 |
events | +17.359 |
indeed | +15.849 |
votes | +15.700 |
rallies | +15.461 |
Neg logit contributions | |
slang | -14.918 |
guiActiveUnfocused | -14.492 |
stereotype | -14.116 |
mentality | -13.797 |
colonialism | -13.783 |
Token | rally |
Token ID | 7903 |
Feature activation | -8.38e-01 |
Pos logit contributions | |
elect | +14.136 |
events | +13.364 |
awaits | +12.771 |
indeed | +12.407 |
oops | +12.296 |
Neg logit contributions | |
slang | -12.711 |
ingrained | -12.357 |
puberty | -11.991 |
colonialism | -11.934 |
stereotype | -11.907 |
Token | are |
Token ID | 389 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
elect | +7.468 |
events | +6.993 |
awaits | +6.780 |
indeed | +6.642 |
probably | +6.493 |
Neg logit contributions | |
slang | -7.475 |
curfew | -7.307 |
stereotype | -7.132 |
ingrained | -7.059 |
puberty | -7.048 |
Token | prospective |
Token ID | 17530 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
elect | +13.620 |
indeed | +13.159 |
events | +12.673 |
awaits | +12.374 |
probably | +12.185 |
Neg logit contributions | |
slang | -11.637 |
stereotype | -11.479 |
curfew | -11.350 |
puberty | -11.154 |
leash | -10.893 |
Token | precinct |
Token ID | 28802 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
elect | +19.721 |
awaits | +17.988 |
votes | +17.734 |
events | +17.682 |
indeed | +17.475 |
Neg logit contributions | |
slang | -15.939 |
puberty | -15.617 |
curfew | -15.583 |
stereotype | -15.541 |
ESE | -15.204 |
Token | captains |
Token ID | 37551 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
elect | +11.201 |
awaits | +10.587 |
events | +10.439 |
oops | +10.167 |
indeed | +10.008 |
Neg logit contributions | |
stereotype | -9.295 |
puberty | -9.127 |
slang | -9.116 |
ingrained | -8.953 |
curfew | -8.951 |
Token | in |
Token ID | 287 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
elect | +1.965 |
events | +1.834 |
oops | +1.793 |
awaits | +1.763 |
probably | +1.680 |
Neg logit contributions | |
slang | -2.395 |
stereotype | -2.331 |
curfew | -2.301 |
puberty | -2.237 |
ingrained | -2.233 |
Token | Iowa |
Token ID | 9406 |
Feature activation | -9.23e-01 |
Pos logit contributions | |
elect | +11.969 |
events | +10.934 |
awaits | +10.790 |
indeed | +10.376 |
oops | +10.362 |
Neg logit contributions | |
slang | -9.623 |
curfew | -9.351 |
stereotype | -9.204 |
ingrained | -9.035 |
puberty | -9.015 |
Token | . |
Token ID | 13 |
Feature activation | -5.35e-01 |
Pos logit contributions | |
elect | +7.412 |
events | +6.827 |
awaits | +6.606 |
oops | +6.514 |
indeed | +6.212 |
Neg logit contributions | |
slang | -9.122 |
curfew | -8.995 |
stereotype | -8.965 |
puberty | -8.743 |
ingrained | -8.679 |
Token | Clinton |
Token ID | 2605 |
Feature activation | -4.11e-01 |
Pos logit contributions | |
elect | +3.020 |
events | +2.803 |
awaits | +2.735 |
oops | +2.729 |
indeed | +2.599 |
Neg logit contributions | |
slang | -3.042 |
stereotype | -2.941 |
curfew | -2.888 |
puberty | -2.785 |
ingrained | -2.778 |
Token | as |
Token ID | 355 |
Feature activation | -3.36e-01 |
Pos logit contributions | |
elect | +3.913 |
events | +3.629 |
awaits | +3.564 |
oops | +3.562 |
probably | +3.400 |
Neg logit contributions | |
slang | -3.794 |
stereotype | -3.671 |
curfew | -3.636 |
puberty | -3.492 |
ingrained | -3.476 |
Token | a |
Token ID | 257 |
Feature activation | -5.83e-01 |
Pos logit contributions | |
elect | +3.602 |
events | +3.333 |
awaits | +3.307 |
oops | +3.300 |
indeed | +3.204 |
Neg logit contributions | |
slang | -2.681 |
stereotype | -2.592 |
curfew | -2.549 |
puberty | -2.458 |
ingrained | -2.433 |
Token | running |
Token ID | 2491 |
Feature activation | -5.07e-01 |
Pos logit contributions | |
elect | +5.857 |
awaits | +5.419 |
events | +5.296 |
indeed | +5.230 |
oops | +5.228 |
Neg logit contributions | |
slang | -4.810 |
curfew | -4.557 |
stereotype | -4.545 |
puberty | -4.422 |
ingrained | -4.383 |
Token | mate |
Token ID | 16133 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
elect | +3.945 |
oops | +3.524 |
events | +3.499 |
awaits | +3.459 |
indeed | +3.351 |
Neg logit contributions | |
slang | -5.446 |
stereotype | -5.245 |
curfew | -5.238 |
ingrained | -5.136 |
puberty | -5.125 |
Token | in |
Token ID | 287 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
elect | +10.056 |
awaits | +9.102 |
indeed | +9.046 |
events | +8.808 |
oops | +8.806 |
Neg logit contributions | |
slang | -11.501 |
curfew | -11.167 |
stereotype | -10.973 |
puberty | -10.778 |
leash | -10.446 |
Token | the |
Token ID | 262 |
Feature activation | -2.48e+00 |
Pos logit contributions | |
elect | +18.595 |
indeed | +16.420 |
awaits | +15.649 |
events | +15.639 |
probably | +15.436 |
Neg logit contributions | |
slang | -17.228 |
curfew | -17.011 |
stereotype | -16.292 |
puberty | -16.271 |
ingrained | -15.986 |
Token | 2016 |
Token ID | 1584 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
elect | +19.159 |
indeed | +17.637 |
awaits | +17.279 |
events | +17.136 |
oops | +17.018 |
Neg logit contributions | |
curfew | -15.373 |
slang | -15.259 |
puberty | -15.143 |
stereotype | -14.427 |
colonialism | -13.796 |
Token | presidential |
Token ID | 4787 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
elect | +16.720 |
awaits | +14.526 |
oops | +14.486 |
events | +14.388 |
indeed | +14.068 |
Neg logit contributions | |
slang | -15.220 |
curfew | -15.131 |
puberty | -14.317 |
stereotype | -14.129 |
ingrained | -13.858 |
Token | election |
Token ID | 3071 |
Feature activation | -2.19e+00 |
Pos logit contributions | |
elect | +18.916 |
oops | +16.033 |
awaits | +15.979 |
bids | +15.715 |
events | +15.549 |
Neg logit contributions | |
slang | -15.966 |
curfew | -15.576 |
stereotype | -14.919 |
puberty | -14.860 |
ingrained | -14.682 |
Token | , |
Token ID | 11 |
Feature activation | -9.35e-01 |
Pos logit contributions | |
elect | +17.112 |
awaits | +16.007 |
indeed | +15.782 |
oops | +15.214 |
events | +15.200 |
Neg logit contributions | |
slang | -16.216 |
curfew | -15.704 |
puberty | -15.546 |
stereotype | -15.335 |
ingrained | -14.500 |
Token | - |
Token ID | 12 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
elect | +7.445 |
events | +7.078 |
oops | +7.074 |
awaits | +6.830 |
probably | +6.536 |
Neg logit contributions | |
slang | -5.315 |
stereotype | -5.112 |
curfew | -5.036 |
ingrained | -4.894 |
puberty | -4.824 |
Token | trip |
Token ID | 39813 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
elect | +7.278 |
oops | +6.800 |
events | +6.751 |
awaits | +5.910 |
probably | +5.897 |
Neg logit contributions | |
slang | -12.127 |
stereotype | -11.842 |
curfew | -11.725 |
puberty | -11.426 |
ingrained | -11.420 |
Token | propagation |
Token ID | 43594 |
Feature activation | -3.55e-01 |
Pos logit contributions | |
elect | +10.393 |
events | +10.155 |
awaits | +9.943 |
oops | +9.682 |
indeed | +9.558 |
Neg logit contributions | |
slang | -10.305 |
stereotype | -10.105 |
curfew | -9.979 |
ingrained | -9.616 |
puberty | -9.532 |
Token | if |
Token ID | 611 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
elect | +3.411 |
events | +3.238 |
oops | +3.173 |
awaits | +3.128 |
indeed | +2.990 |
Neg logit contributions | |
slang | -3.164 |
stereotype | -3.099 |
curfew | -3.039 |
puberty | -2.944 |
ingrained | -2.929 |
Token | there |
Token ID | 612 |
Feature activation | -9.83e-01 |
Pos logit contributions | |
elect | +10.007 |
events | +9.586 |
oops | +9.540 |
awaits | +9.283 |
indeed | +9.187 |
Neg logit contributions | |
slang | -9.072 |
curfew | -8.693 |
stereotype | -8.661 |
ingrained | -8.352 |
puberty | -8.269 |
Token | are |
Token ID | 389 |
Feature activation | -2.57e+00 |
Pos logit contributions | |
elect | +7.131 |
events | +6.684 |
oops | +6.623 |
awaits | +6.499 |
else | +6.228 |
Neg logit contributions | |
slang | -10.573 |
curfew | -10.168 |
stereotype | -10.150 |
puberty | -9.980 |
ingrained | -9.831 |
Token | no |
Token ID | 645 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
indeed | +19.761 |
events | +19.045 |
elect | +18.973 |
enough | +18.150 |
awaits | +17.935 |
Neg logit contributions | |
slang | -15.684 |
curfew | -15.227 |
stereotype | -15.165 |
puberty | -14.949 |
gypt | -14.017 |
Token | que |
Token ID | 8358 |
Feature activation | -5.61e-01 |
Pos logit contributions | |
elect | +13.144 |
events | +13.103 |
awaits | +12.754 |
oops | +12.502 |
indeed | +12.477 |
Neg logit contributions | |
slang | -10.735 |
curfew | -10.452 |
stereotype | -10.370 |
puberty | -10.335 |
ingrained | -9.734 |
Token | uing |
Token ID | 4250 |
Feature activation | -5.91e-01 |
Pos logit contributions | |
elect | +6.969 |
events | +6.706 |
oops | +6.679 |
awaits | +6.447 |
probably | +6.239 |
Neg logit contributions | |
slang | -3.459 |
stereotype | -3.351 |
curfew | -3.201 |
ingrained | -3.151 |
mentality | -3.034 |
Token | delays |
Token ID | 16119 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
elect | +4.995 |
events | +4.841 |
oops | +4.678 |
awaits | +4.654 |
indeed | +4.357 |
Neg logit contributions | |
slang | -5.735 |
stereotype | -5.707 |
curfew | -5.589 |
puberty | -5.459 |
ingrained | -5.412 |
Token | and |
Token ID | 290 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
slang | +2.021 |
stereotype | +1.964 |
curfew | +1.914 |
ingrained | +1.895 |
puberty | +1.873 |
Neg logit contributions | |
elect | -1.812 |
events | -1.704 |
oops | -1.681 |
awaits | -1.630 |
probably | -1.577 |
Token | to |
Token ID | 284 |
Feature activation | -2.44e+00 |
Pos logit contributions | |
elect | +0.427 |
events | +0.406 |
oops | +0.399 |
awaits | +0.394 |
probably | +0.381 |
Neg logit contributions | |
slang | -0.292 |
stereotype | -0.281 |
curfew | -0.273 |
ingrained | -0.266 |
puberty | -0.265 |
Token | the |
Token ID | 262 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
elect | +18.240 |
events | +16.001 |
indeed | +15.928 |
wins | +15.755 |
awaits | +15.387 |
Neg logit contributions | |
slang | -17.089 |
stereotype | -15.585 |
curfew | -15.462 |
ESE | -15.065 |
ingrained | -14.938 |
Token | Democratic |
Token ID | 4390 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
elect | +18.282 |
wins | +16.997 |
votes | +16.920 |
events | +16.662 |
indeed | +16.417 |
Neg logit contributions | |
slang | -16.320 |
puberty | -15.395 |
ESE | -14.837 |
ipedia | -14.791 |
stereotype | -14.656 |
Token | National |
Token ID | 2351 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
elect | +12.734 |
events | +10.900 |
awaits | +10.835 |
indeed | +10.546 |
votes | +10.458 |
Neg logit contributions | |
slang | -14.694 |
curfew | -14.489 |
ingrained | -13.889 |
stereotype | -13.839 |
puberty | -13.619 |
Token | Convention |
Token ID | 11680 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
elect | +9.192 |
events | +8.340 |
awaits | +8.129 |
oops | +7.710 |
indeed | +7.326 |
Neg logit contributions | |
stereotype | -13.893 |
slang | -13.845 |
puberty | -13.837 |
ingrained | -13.657 |
curfew | -13.440 |
Token | in |
Token ID | 287 |
Feature activation | -2.56e+00 |
Pos logit contributions | |
elect | +14.990 |
awaits | +13.767 |
events | +13.574 |
indeed | +13.317 |
probably | +13.313 |
Neg logit contributions | |
slang | -15.922 |
curfew | -15.394 |
stereotype | -15.290 |
puberty | -15.161 |
leash | -14.650 |
Token | July |
Token ID | 2901 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
elect | +14.253 |
indeed | +12.757 |
probably | +12.742 |
events | +12.645 |
legates | +12.456 |
Neg logit contributions | |
puberty | -20.315 |
slang | -20.003 |
ESE | -19.786 |
ipedia | -19.352 |
guiActiveUnfocused | -19.343 |
Token | . |
Token ID | 13 |
Feature activation | -3.08e-01 |
Pos logit contributions | |
elect | +9.588 |
events | +8.784 |
awaits | +8.599 |
oops | +8.398 |
indeed | +8.224 |
Neg logit contributions | |
slang | -11.625 |
curfew | -11.473 |
stereotype | -11.448 |
puberty | -11.114 |
leash | -10.962 |
Token | It |
Token ID | 632 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
elect | +2.605 |
events | +2.436 |
oops | +2.392 |
awaits | +2.331 |
probably | +2.253 |
Neg logit contributions | |
slang | -3.178 |
stereotype | -3.096 |
curfew | -3.050 |
ingrained | -3.000 |
puberty | -2.984 |
Token | seems |
Token ID | 2331 |
Feature activation | -8.44e-01 |
Pos logit contributions | |
elect | +0.864 |
events | +0.801 |
oops | +0.787 |
awaits | +0.763 |
probably | +0.725 |
Neg logit contributions | |
slang | -1.418 |
stereotype | -1.385 |
curfew | -1.358 |
ingrained | -1.337 |
puberty | -1.332 |
Token | his |
Token ID | 465 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
elect | +7.496 |
awaits | +6.916 |
events | +6.868 |
oops | +6.689 |
indeed | +6.679 |
Neg logit contributions | |
slang | -7.762 |
stereotype | -7.455 |
curfew | -7.326 |
puberty | -7.171 |
ingrained | -7.041 |
Token | has |
Token ID | 468 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
elect | +11.543 |
awaits | +11.069 |
events | +10.673 |
oops | +10.454 |
indeed | +10.382 |
Neg logit contributions | |
slang | -10.340 |
curfew | -10.010 |
stereotype | -9.967 |
puberty | -9.643 |
ingrained | -9.329 |
Token | no |
Token ID | 645 |
Feature activation | -6.88e-01 |
Pos logit contributions | |
elect | +11.916 |
indeed | +11.404 |
events | +11.233 |
awaits | +10.984 |
probably | +10.496 |
Neg logit contributions | |
slang | -9.351 |
stereotype | -9.060 |
curfew | -9.005 |
puberty | -8.775 |
mentality | -8.406 |
Token | mathematical |
Token ID | 18069 |
Feature activation | -8.37e-04 |
Pos logit contributions | |
elect | +6.837 |
events | +6.429 |
awaits | +6.346 |
oops | +6.120 |
indeed | +6.097 |
Neg logit contributions | |
slang | -5.471 |
stereotype | -5.286 |
puberty | -5.201 |
curfew | -5.107 |
ingrained | -4.993 |
Token | path |
Token ID | 3108 |
Feature activation | +2.94e-01 |
Pos logit contributions | |
elect | +0.009 |
events | +0.008 |
oops | +0.008 |
awaits | +0.008 |
probably | +0.008 |
Neg logit contributions | |
slang | -0.007 |
stereotype | -0.007 |
curfew | -0.007 |
ingrained | -0.006 |
puberty | -0.006 |
Token | to |
Token ID | 284 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
slang | +2.128 |
stereotype | +2.049 |
curfew | +1.977 |
ingrained | +1.943 |
puberty | +1.915 |
Neg logit contributions | |
elect | -3.394 |
events | -3.246 |
oops | -3.211 |
awaits | -3.136 |
probably | -3.057 |
Token | the |
Token ID | 262 |
Feature activation | -2.53e+00 |
Pos logit contributions | |
elect | +17.968 |
indeed | +16.053 |
wins | +15.902 |
events | +15.710 |
awaits | +15.466 |
Neg logit contributions | |
slang | -16.043 |
curfew | -15.104 |
stereotype | -14.608 |
guiActiveUnfocused | -14.009 |
ingrained | -13.959 |
Token | White |
Token ID | 2635 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
elect | +16.989 |
votes | +15.694 |
wins | +15.482 |
awaits | +15.256 |
events | +14.898 |
Neg logit contributions | |
slang | -17.694 |
puberty | -17.144 |
curfew | -16.915 |
guiActiveUnfocused | -16.508 |
ipedia | -16.314 |
Token | House |
Token ID | 2097 |
Feature activation | -9.02e-01 |
Pos logit contributions | |
elect | +4.542 |
events | +4.149 |
oops | +3.912 |
awaits | +3.812 |
probably | +3.720 |
Neg logit contributions | |
slang | -8.152 |
curfew | -7.935 |
stereotype | -7.882 |
ingrained | -7.775 |
puberty | -7.671 |
Token | , |
Token ID | 11 |
Feature activation | -4.53e-01 |
Pos logit contributions | |
elect | +7.199 |
awaits | +6.475 |
oops | +6.394 |
events | +6.390 |
indeed | +6.011 |
Neg logit contributions | |
slang | -9.192 |
curfew | -8.778 |
stereotype | -8.762 |
puberty | -8.588 |
ingrained | -8.468 |
Token | he |
Token ID | 339 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
elect | +4.399 |
events | +4.113 |
oops | +4.017 |
awaits | +3.985 |
probably | +3.830 |
Neg logit contributions | |
slang | -4.064 |
stereotype | -3.918 |
curfew | -3.841 |
puberty | -3.754 |
ingrained | -3.743 |
Token | � |
Token ID | 447 |
Feature activation | -4.52e-01 |
Pos logit contributions | |
elect | +11.434 |
awaits | +11.206 |
events | +10.725 |
indeed | +10.435 |
oops | +10.319 |
Neg logit contributions | |
slang | -11.902 |
curfew | -11.593 |
stereotype | -11.336 |
puberty | -11.099 |
leash | -10.718 |
Token | out |
Token ID | 503 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
elect | +15.114 |
indeed | +13.614 |
awaits | +13.270 |
events | +12.698 |
oops | +12.182 |
Neg logit contributions | |
slang | -15.139 |
stereotype | -14.806 |
curfew | -14.354 |
puberty | -14.282 |
leash | -14.067 |
Token | of |
Token ID | 286 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
elect | +3.443 |
events | +3.051 |
oops | +2.974 |
awaits | +2.825 |
probably | +2.821 |
Neg logit contributions | |
slang | -5.311 |
stereotype | -5.190 |
curfew | -5.081 |
puberty | -4.981 |
ingrained | -4.965 |
Token | the |
Token ID | 262 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
elect | +12.758 |
events | +11.355 |
indeed | +10.679 |
oops | +10.633 |
awaits | +10.626 |
Neg logit contributions | |
slang | -11.560 |
stereotype | -10.955 |
curfew | -10.580 |
ingrained | -10.458 |
puberty | -10.387 |
Token | 6 |
Token ID | 718 |
Feature activation | -6.96e-01 |
Pos logit contributions | |
elect | +15.565 |
events | +14.118 |
absolutely | +13.444 |
votes | +13.403 |
awaits | +13.346 |
Neg logit contributions | |
slang | -12.008 |
puberty | -10.832 |
stereotype | -10.812 |
ingrained | -10.421 |
curfew | -10.236 |
Token | 87 |
Token ID | 5774 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
elect | +5.538 |
events | +5.075 |
oops | +4.956 |
awaits | +4.873 |
probably | +4.676 |
Neg logit contributions | |
slang | -7.221 |
stereotype | -7.091 |
curfew | -6.960 |
puberty | -6.859 |
ingrained | -6.824 |
Token | total |
Token ID | 2472 |
Feature activation | -2.52e+00 |
Pos logit contributions | |
elect | +15.278 |
events | +13.623 |
votes | +13.220 |
indeed | +13.075 |
awaits | +13.028 |
Neg logit contributions | |
slang | -14.015 |
stereotype | -13.847 |
puberty | -13.432 |
curfew | -13.361 |
ingrained | -13.056 |
Token | seats |
Token ID | 8632 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
elect | +20.475 |
votes | +19.328 |
events | +17.960 |
indeed | +17.759 |
awaits | +17.569 |
Neg logit contributions | |
slang | -15.649 |
stereotype | -15.492 |
curfew | -15.007 |
puberty | -14.778 |
mentality | -14.337 |
Token | in |
Token ID | 287 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
elect | +10.490 |
indeed | +9.343 |
events | +9.270 |
awaits | +9.160 |
oops | +9.016 |
Neg logit contributions | |
slang | -9.774 |
curfew | -9.565 |
stereotype | -9.476 |
puberty | -9.173 |
leash | -8.950 |
Token | the |
Token ID | 262 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
elect | +11.660 |
events | +10.441 |
oops | +9.754 |
probably | +9.753 |
awaits | +9.722 |
Neg logit contributions | |
slang | -9.188 |
stereotype | -8.815 |
ingrained | -8.470 |
curfew | -8.466 |
mentality | -8.106 |
Token | 9 |
Token ID | 860 |
Feature activation | -5.26e-01 |
Pos logit contributions | |
elect | +14.280 |
events | +12.818 |
awaits | +12.049 |
probably | +12.011 |
absolutely | +11.954 |
Neg logit contributions | |
slang | -11.820 |
stereotype | -11.226 |
ingrained | -10.765 |
curfew | -10.744 |
puberty | -10.624 |
Token | th |
Token ID | 400 |
Feature activation | +9.78e-02 |
Pos logit contributions | |
elect | +4.474 |
events | +4.131 |
oops | +4.030 |
awaits | +3.935 |
probably | +3.842 |
Neg logit contributions | |
slang | -5.283 |
stereotype | -5.183 |
curfew | -5.054 |
ingrained | -4.992 |
puberty | -4.983 |
Token | once |
Token ID | 1752 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
elect | +9.514 |
events | +8.833 |
awaits | +8.661 |
oops | +8.587 |
indeed | +8.499 |
Neg logit contributions | |
slang | -7.861 |
stereotype | -7.578 |
curfew | -7.367 |
ingrained | -7.147 |
puberty | -7.125 |
Token | someone |
Token ID | 2130 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
slang | +2.498 |
stereotype | +2.426 |
curfew | +2.362 |
ingrained | +2.325 |
puberty | +2.304 |
Neg logit contributions | |
elect | -2.618 |
events | -2.484 |
oops | -2.451 |
awaits | -2.378 |
probably | -2.312 |
Token | has |
Token ID | 468 |
Feature activation | -8.34e-01 |
Pos logit contributions | |
elect | +11.565 |
awaits | +10.697 |
indeed | +10.220 |
oops | +10.219 |
events | +10.147 |
Neg logit contributions | |
slang | -11.496 |
curfew | -11.130 |
stereotype | -10.993 |
puberty | -10.816 |
guiActiveUnfocused | -10.745 |
Token | decided |
Token ID | 3066 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
elect | +8.283 |
events | +7.465 |
indeed | +7.380 |
awaits | +7.376 |
oops | +7.341 |
Neg logit contributions | |
slang | -6.710 |
stereotype | -6.438 |
curfew | -6.376 |
puberty | -6.072 |
ingrained | -5.981 |
Token | to |
Token ID | 284 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
elect | +12.876 |
awaits | +11.462 |
indeed | +11.435 |
oops | +11.106 |
events | +11.063 |
Neg logit contributions | |
slang | -11.295 |
stereotype | -10.826 |
curfew | -10.737 |
ingrained | -10.331 |
leash | -10.150 |
Token | vote |
Token ID | 3015 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
elect | +11.602 |
indeed | +10.423 |
oops | +10.115 |
awaits | +10.069 |
events | +9.992 |
Neg logit contributions | |
slang | -10.494 |
curfew | -10.135 |
puberty | -9.919 |
stereotype | -9.874 |
ingrained | -9.838 |
Token | Yes |
Token ID | 3363 |
Feature activation | -7.98e-01 |
Pos logit contributions | |
elect | +18.457 |
indeed | +16.924 |
awaits | +16.526 |
yes | +15.977 |
oops | +15.679 |
Neg logit contributions | |
slang | -16.664 |
curfew | -16.395 |
puberty | -16.045 |
stereotype | -15.799 |
guiActiveUnfocused | -15.745 |
Token | they |
Token ID | 484 |
Feature activation | -4.56e-01 |
Pos logit contributions | |
elect | +7.023 |
events | +6.335 |
awaits | +6.236 |
oops | +6.163 |
indeed | +6.114 |
Neg logit contributions | |
slang | -7.539 |
stereotype | -7.255 |
curfew | -7.236 |
ingrained | -7.036 |
puberty | -7.008 |
Token | won |
Token ID | 1839 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
elect | +3.484 |
events | +3.173 |
oops | +3.116 |
awaits | +3.104 |
probably | +3.000 |
Neg logit contributions | |
slang | -4.983 |
stereotype | -4.791 |
curfew | -4.776 |
puberty | -4.654 |
ingrained | -4.649 |
Token | 't |
Token ID | 470 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
elect | +4.972 |
events | +3.936 |
oops | +3.765 |
probably | +3.736 |
indeed | +3.690 |
Neg logit contributions | |
slang | -13.478 |
stereotype | -13.291 |
curfew | -13.174 |
ingrained | -12.982 |
puberty | -12.824 |
Token | change |
Token ID | 1487 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
elect | +3.124 |
events | +2.882 |
awaits | +2.801 |
oops | +2.798 |
indeed | +2.757 |
Neg logit contributions | |
slang | -3.234 |
stereotype | -3.055 |
curfew | -3.055 |
ingrained | -3.003 |
puberty | -2.968 |
Token | day |
Token ID | 1110 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
elect | +4.865 |
events | +4.506 |
oops | +4.365 |
awaits | +4.316 |
probably | +4.209 |
Neg logit contributions | |
slang | -4.162 |
stereotype | -4.043 |
curfew | -3.928 |
puberty | -3.920 |
ingrained | -3.910 |
Token | this |
Token ID | 428 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
slang | +2.901 |
stereotype | +2.805 |
curfew | +2.721 |
ingrained | +2.670 |
puberty | +2.645 |
Neg logit contributions | |
elect | -3.807 |
events | -3.621 |
oops | -3.575 |
awaits | -3.491 |
probably | -3.391 |
Token | month |
Token ID | 1227 |
Feature activation | -7.63e-02 |
Pos logit contributions | |
elect | +0.199 |
events | +0.189 |
oops | +0.186 |
awaits | +0.184 |
probably | +0.179 |
Neg logit contributions | |
slang | -0.108 |
stereotype | -0.104 |
curfew | -0.101 |
puberty | -0.098 |
ingrained | -0.098 |
Token | has |
Token ID | 468 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
elect | +0.723 |
events | +0.683 |
oops | +0.667 |
awaits | +0.661 |
probably | +0.632 |
Neg logit contributions | |
slang | -0.711 |
stereotype | -0.690 |
curfew | -0.676 |
ingrained | -0.660 |
puberty | -0.659 |
Token | so |
Token ID | 523 |
Feature activation | +7.48e-01 |
Pos logit contributions | |
elect | +11.954 |
events | +11.547 |
indeed | +11.446 |
awaits | +10.873 |
probably | +10.613 |
Neg logit contributions | |
slang | -9.236 |
stereotype | -9.097 |
curfew | -9.009 |
puberty | -8.545 |
colonialism | -8.281 |
Token | many |
Token ID | 867 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
slang | +6.184 |
stereotype | +5.995 |
ingrained | +5.905 |
curfew | +5.740 |
puberty | +5.689 |
Neg logit contributions | |
elect | -7.534 |
oops | -7.211 |
events | -7.201 |
awaits | -6.964 |
probably | -6.764 |
Token | people |
Token ID | 661 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
elect | +20.289 |
indeed | +19.052 |
events | +18.960 |
awaits | +18.751 |
votes | +18.062 |
Neg logit contributions | |
ESE | -14.454 |
puberty | -13.956 |
stereotype | -13.951 |
curfew | -13.934 |
slang | -13.610 |
Token | signing |
Token ID | 8415 |
Feature activation | -7.30e-01 |
Pos logit contributions | |
elect | +11.983 |
indeed | +11.197 |
events | +11.054 |
awaits | +11.007 |
else | +10.550 |
Neg logit contributions | |
curfew | -11.020 |
slang | -10.954 |
stereotype | -10.844 |
puberty | -10.665 |
leash | -10.211 |
Token | up |
Token ID | 510 |
Feature activation | -9.19e-01 |
Pos logit contributions | |
elect | +7.401 |
events | +6.846 |
oops | +6.775 |
awaits | +6.611 |
indeed | +6.389 |
Neg logit contributions | |
slang | -5.781 |
stereotype | -5.732 |
curfew | -5.645 |
puberty | -5.451 |
ingrained | -5.422 |
Token | that |
Token ID | 326 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
elect | +8.039 |
events | +7.400 |
awaits | +7.275 |
indeed | +7.124 |
oops | +7.080 |
Neg logit contributions | |
slang | -8.316 |
stereotype | -8.248 |
curfew | -8.194 |
puberty | -7.852 |
leash | -7.750 |
Token | the |
Token ID | 262 |
Feature activation | -8.28e-01 |
Pos logit contributions | |
elect | +5.659 |
events | +5.319 |
awaits | +5.093 |
oops | +5.087 |
indeed | +4.948 |
Neg logit contributions | |
slang | -4.924 |
stereotype | -4.788 |
curfew | -4.664 |
ingrained | -4.572 |
puberty | -4.548 |
Token | to |
Token ID | 284 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
elect | +11.737 |
awaits | +11.092 |
events | +10.952 |
indeed | +10.876 |
else | +10.188 |
Neg logit contributions | |
slang | -10.943 |
curfew | -10.552 |
stereotype | -10.500 |
puberty | -10.051 |
ingrained | -9.701 |
Token | continue |
Token ID | 2555 |
Feature activation | -8.11e-01 |
Pos logit contributions | |
elect | +13.548 |
indeed | +13.159 |
events | +12.556 |
awaits | +11.989 |
oops | +11.866 |
Neg logit contributions | |
slang | -12.187 |
curfew | -12.056 |
puberty | -11.564 |
ingrained | -11.098 |
ESE | -10.976 |
Token | its |
Token ID | 663 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
elect | +7.978 |
events | +7.508 |
awaits | +7.241 |
indeed | +7.078 |
oops | +7.049 |
Neg logit contributions | |
slang | -6.681 |
stereotype | -6.387 |
curfew | -6.354 |
puberty | -5.987 |
ingrained | -5.924 |
Token | challenge |
Token ID | 4427 |
Feature activation | -7.48e-01 |
Pos logit contributions | |
elect | +14.316 |
events | +13.244 |
awaits | +12.967 |
indeed | +12.876 |
oops | +12.830 |
Neg logit contributions | |
slang | -9.820 |
curfew | -8.994 |
stereotype | -8.738 |
ESE | -8.631 |
puberty | -8.517 |
Token | into |
Token ID | 656 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
elect | +7.193 |
events | +6.648 |
awaits | +6.621 |
indeed | +6.348 |
oops | +6.308 |
Neg logit contributions | |
slang | -6.537 |
stereotype | -6.186 |
curfew | -6.158 |
puberty | -5.980 |
ingrained | -5.835 |
Token | the |
Token ID | 262 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
elect | +13.944 |
events | +12.418 |
indeed | +11.880 |
awaits | +11.862 |
probably | +11.565 |
Neg logit contributions | |
slang | -13.495 |
curfew | -12.349 |
stereotype | -12.308 |
puberty | -11.779 |
proverb | -11.633 |
Token | spring |
Token ID | 6076 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
elect | +19.808 |
awaits | +17.804 |
votes | +17.790 |
events | +17.462 |
indeed | +17.433 |
Neg logit contributions | |
slang | -15.342 |
puberty | -13.921 |
curfew | -13.759 |
colonialism | -13.498 |
ESE | -13.497 |
Token | of |
Token ID | 286 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
elect | +8.567 |
awaits | +7.640 |
events | +7.606 |
oops | +7.366 |
indeed | +7.231 |
Neg logit contributions | |
slang | -10.556 |
stereotype | -9.954 |
curfew | -9.924 |
puberty | -9.798 |
ingrained | -9.707 |
Token | 2016 |
Token ID | 1584 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
elect | +10.169 |
events | +9.094 |
awaits | +9.013 |
indeed | +8.790 |
probably | +8.630 |
Neg logit contributions | |
slang | -10.958 |
curfew | -10.598 |
stereotype | -10.451 |
puberty | -10.224 |
ingrained | -9.999 |
Token | . |
Token ID | 13 |
Feature activation | -8.41e-01 |
Pos logit contributions | |
elect | +7.807 |
events | +6.933 |
awaits | +6.931 |
oops | +6.619 |
indeed | +6.453 |
Neg logit contributions | |
slang | -11.736 |
stereotype | -11.309 |
curfew | -11.302 |
puberty | -10.966 |
ingrained | -10.892 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +4.96e-01 |
Pos logit contributions | |
elect | +6.430 |
events | +5.958 |
oops | +5.705 |
awaits | +5.678 |
probably | +5.459 |
Neg logit contributions | |
slang | -9.048 |
curfew | -8.865 |
stereotype | -8.815 |
ingrained | -8.721 |
puberty | -8.671 |
Token | while |
Token ID | 981 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
elect | +3.153 |
events | +2.950 |
oops | +2.913 |
awaits | +2.910 |
probably | +2.820 |
Neg logit contributions | |
slang | -2.377 |
stereotype | -2.255 |
curfew | -2.194 |
ingrained | -2.177 |
puberty | -2.154 |
Token | in |
Token ID | 287 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
elect | +10.870 |
indeed | +10.352 |
awaits | +10.169 |
events | +9.954 |
probably | +9.685 |
Neg logit contributions | |
slang | -12.297 |
stereotype | -11.785 |
curfew | -11.681 |
puberty | -11.160 |
ingrained | -11.036 |
Token | the |
Token ID | 262 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
elect | +16.819 |
events | +14.893 |
indeed | +14.560 |
awaits | +14.496 |
probably | +14.362 |
Neg logit contributions | |
slang | -14.814 |
curfew | -14.673 |
stereotype | -14.117 |
ingrained | -13.717 |
puberty | -13.701 |
Token | Democratic |
Token ID | 4390 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
elect | +18.427 |
events | +16.481 |
awaits | +16.296 |
indeed | +15.986 |
oops | +15.887 |
Neg logit contributions | |
slang | -13.263 |
curfew | -13.022 |
puberty | -12.725 |
stereotype | -12.322 |
ingrained | -12.085 |
Token | presidential |
Token ID | 4787 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
elect | +14.517 |
events | +12.636 |
awaits | +12.419 |
probably | +11.915 |
oops | +11.820 |
Neg logit contributions | |
curfew | -13.043 |
slang | -12.885 |
ingrained | -12.353 |
puberty | -12.209 |
stereotype | -12.151 |
Token | primary |
Token ID | 4165 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
elect | +16.197 |
awaits | +13.930 |
events | +13.558 |
bids | +13.440 |
oops | +13.358 |
Neg logit contributions | |
slang | -14.818 |
curfew | -14.805 |
puberty | -14.218 |
stereotype | -14.138 |
ingrained | -14.082 |
Token | . |
Token ID | 13 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
elect | +20.177 |
awaits | +18.988 |
indeed | +18.951 |
events | +17.870 |
rooms | +17.632 |
Neg logit contributions | |
slang | -15.643 |
curfew | -15.250 |
puberty | -14.591 |
stereotype | -14.492 |
ingrained | -14.001 |
Token |
|
Token ID | 198 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
elect | +7.930 |
events | +7.283 |
oops | +7.024 |
probably | +6.916 |
awaits | +6.894 |
Neg logit contributions | |
curfew | -11.497 |
slang | -11.325 |
ingrained | -11.143 |
puberty | -11.116 |
stereotype | -11.048 |
Token |
|
Token ID | 198 |
Feature activation | -7.06e-01 |
Pos logit contributions | |
slang | +2.253 |
stereotype | +2.183 |
curfew | +2.122 |
ingrained | +2.099 |
puberty | +2.078 |
Neg logit contributions | |
elect | -2.073 |
events | -1.956 |
oops | -1.933 |
awaits | -1.883 |
probably | -1.801 |
Token | Mr |
Token ID | 5246 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
elect | +6.002 |
events | +5.564 |
oops | +5.420 |
probably | +5.213 |
absolutely | +5.108 |
Neg logit contributions | |
slang | -7.253 |
curfew | -7.177 |
stereotype | -7.173 |
puberty | -7.014 |
ingrained | -6.900 |
Token | . |
Token ID | 13 |
Feature activation | -7.82e-01 |
Pos logit contributions | |
elect | +7.200 |
events | +6.642 |
oops | +6.348 |
awaits | +6.085 |
indeed | +5.762 |
Neg logit contributions | |
slang | -13.403 |
curfew | -13.011 |
stereotype | -12.995 |
ingrained | -12.602 |
puberty | -12.593 |
Token |
|
Token ID | 198 |
Feature activation | +4.77e-01 |
Pos logit contributions | |
elect | +3.487 |
events | +3.255 |
oops | +3.186 |
awaits | +3.124 |
probably | +2.999 |
Neg logit contributions | |
slang | -4.459 |
stereotype | -4.374 |
curfew | -4.277 |
ingrained | -4.260 |
puberty | -4.204 |
Token |
|
Token ID | 198 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
slang | +4.376 |
stereotype | +4.204 |
curfew | +4.052 |
ingrained | +4.043 |
puberty | +3.970 |
Neg logit contributions | |
elect | -4.446 |
events | -4.208 |
oops | -4.191 |
awaits | -4.099 |
probably | -3.875 |
Token | Should |
Token ID | 19926 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
elect | +2.767 |
events | +2.603 |
oops | +2.564 |
awaits | +2.423 |
probably | +2.418 |
Neg logit contributions | |
slang | -2.856 |
stereotype | -2.818 |
curfew | -2.745 |
puberty | -2.691 |
ingrained | -2.688 |
Token | L |
Token ID | 406 |
Feature activation | -6.38e-01 |
Pos logit contributions | |
elect | +9.252 |
events | +8.548 |
oops | +8.467 |
awaits | +8.384 |
indeed | +8.098 |
Neg logit contributions | |
slang | -10.153 |
stereotype | -9.994 |
ingrained | -9.613 |
curfew | -9.552 |
mentality | -9.376 |
Token | asso |
Token ID | 28372 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
elect | +3.871 |
oops | +3.580 |
events | +3.516 |
awaits | +3.198 |
probably | +3.191 |
Neg logit contributions | |
slang | -7.889 |
stereotype | -7.764 |
curfew | -7.738 |
ingrained | -7.507 |
puberty | -7.448 |
Token | win |
Token ID | 1592 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
elect | +14.739 |
indeed | +13.795 |
awaits | +12.917 |
wins | +12.792 |
events | +12.512 |
Neg logit contributions | |
slang | -15.165 |
puberty | -14.853 |
curfew | -14.808 |
stereotype | -14.425 |
ingrained | -14.192 |
Token | and |
Token ID | 290 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
elect | +19.039 |
indeed | +16.439 |
awaits | +15.859 |
votes | +15.670 |
events | +15.422 |
Neg logit contributions | |
slang | -17.183 |
stereotype | -17.114 |
curfew | -16.300 |
ingrained | -16.284 |
guiActiveUnfocused | -15.987 |
Token | rescind |
Token ID | 39091 |
Feature activation | +8.09e-02 |
Pos logit contributions | |
elect | +12.255 |
awaits | +11.422 |
indeed | +11.188 |
events | +10.783 |
oops | +10.489 |
Neg logit contributions | |
slang | -13.390 |
stereotype | -12.995 |
ingrained | -12.549 |
puberty | -12.527 |
curfew | -12.395 |
Token | the |
Token ID | 262 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
slang | +0.677 |
stereotype | +0.654 |
curfew | +0.638 |
ingrained | +0.624 |
puberty | +0.620 |
Neg logit contributions | |
elect | -0.845 |
events | -0.805 |
oops | -0.795 |
awaits | -0.775 |
probably | -0.752 |
Token | presidential |
Token ID | 4787 |
Feature activation | -9.72e-01 |
Pos logit contributions | |
elect | +4.683 |
events | +4.319 |
oops | +4.246 |
awaits | +4.230 |
probably | +4.057 |
Neg logit contributions | |
slang | -3.906 |
stereotype | -3.784 |
ingrained | -3.635 |
puberty | -3.601 |
curfew | -3.582 |
Token | decree |
Token ID | 25931 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
elect | +9.845 |
awaits | +8.743 |
oops | +8.682 |
events | +8.630 |
indeed | +8.228 |
Neg logit contributions | |
slang | -7.456 |
stereotype | -7.180 |
ingrained | -7.013 |
puberty | -6.936 |
curfew | -6.679 |
Token | coded |
Token ID | 30817 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
slang | +1.474 |
stereotype | +1.421 |
curfew | +1.381 |
puberty | +1.336 |
ingrained | +1.335 |
Neg logit contributions | |
elect | -2.222 |
events | -2.112 |
oops | -2.087 |
awaits | -2.053 |
probably | -1.987 |
Token | The |
Token ID | 383 |
Feature activation | +3.60e-01 |
Pos logit contributions | |
elect | +2.341 |
events | +2.198 |
oops | +2.138 |
awaits | +2.093 |
probably | +2.013 |
Neg logit contributions | |
slang | -2.853 |
stereotype | -2.811 |
curfew | -2.769 |
puberty | -2.696 |
ingrained | -2.689 |
Token | boot |
Token ID | 6297 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
slang | +2.947 |
stereotype | +2.842 |
curfew | +2.758 |
ingrained | +2.709 |
puberty | +2.671 |
Neg logit contributions | |
elect | -3.814 |
events | -3.634 |
oops | -3.593 |
awaits | -3.502 |
probably | -3.395 |
Token | loader |
Token ID | 29356 |
Feature activation | +3.66e-01 |
Pos logit contributions | |
elect | +1.290 |
events | +1.219 |
oops | +1.204 |
awaits | +1.169 |
probably | +1.130 |
Neg logit contributions | |
slang | -1.281 |
stereotype | -1.245 |
curfew | -1.214 |
ingrained | -1.196 |
puberty | -1.188 |
Token | res |
Token ID | 581 |
Feature activation | -4.86e-01 |
Pos logit contributions | |
slang | +4.041 |
stereotype | +3.935 |
curfew | +3.836 |
ingrained | +3.797 |
puberty | +3.742 |
Neg logit contributions | |
elect | -2.837 |
events | -2.656 |
oops | -2.607 |
awaits | -2.485 |
probably | -2.402 |
Token | ets |
Token ID | 1039 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
elect | +4.199 |
oops | +3.877 |
events | +3.864 |
awaits | +3.653 |
probably | +3.552 |
Neg logit contributions | |
slang | -4.972 |
stereotype | -4.875 |
curfew | -4.769 |
ingrained | -4.669 |
puberty | -4.648 |
Token | the |
Token ID | 262 |
Feature activation | +5.68e-01 |
Pos logit contributions | |
slang | +12.223 |
stereotype | +11.629 |
curfew | +11.367 |
ingrained | +11.339 |
worn | +11.328 |
Neg logit contributions | |
elect | -11.574 |
oops | -11.083 |
events | -10.959 |
awaits | -10.559 |
absolutely | -10.218 |
Token | power |
Token ID | 1176 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
slang | +4.791 |
stereotype | +4.637 |
curfew | +4.506 |
ingrained | +4.428 |
puberty | +4.366 |
Neg logit contributions | |
elect | -5.811 |
events | -5.525 |
oops | -5.489 |
awaits | -5.312 |
probably | -5.175 |
Token | key |
Token ID | 1994 |
Feature activation | +9.08e-01 |
Pos logit contributions | |
slang | +3.059 |
stereotype | +2.964 |
curfew | +2.881 |
ingrained | +2.832 |
puberty | +2.805 |
Neg logit contributions | |
elect | -3.545 |
events | -3.363 |
oops | -3.321 |
awaits | -3.235 |
probably | -3.137 |
Token | status |
Token ID | 3722 |
Feature activation | +6.37e-01 |
Pos logit contributions | |
slang | +8.547 |
stereotype | +8.269 |
curfew | +7.997 |
ingrained | +7.983 |
worn | +7.953 |
Neg logit contributions | |
elect | -7.807 |
oops | -7.365 |
events | -7.352 |
awaits | -7.217 |
probably | -6.848 |
Token | on |
Token ID | 319 |
Feature activation | +6.00e-01 |
Pos logit contributions | |
slang | +6.059 |
stereotype | +5.855 |
curfew | +5.704 |
ingrained | +5.661 |
mentality | +5.568 |
Neg logit contributions | |
elect | -5.731 |
events | -5.379 |
oops | -5.358 |
awaits | -5.189 |
probably | -4.989 |
Token | . |
Token ID | 13 |
Feature activation | -8.32e-02 |
Pos logit contributions | |
slang | +1.461 |
stereotype | +1.417 |
curfew | +1.385 |
ingrained | +1.367 |
puberty | +1.356 |
Neg logit contributions | |
elect | -1.195 |
events | -1.123 |
oops | -1.105 |
awaits | -1.070 |
probably | -1.028 |
Token | " |
Token ID | 366 |
Feature activation | -9.87e-01 |
Pos logit contributions | |
elect | +0.741 |
events | +0.697 |
oops | +0.687 |
awaits | +0.666 |
probably | +0.645 |
Neg logit contributions | |
slang | -0.825 |
stereotype | -0.804 |
curfew | -0.787 |
ingrained | -0.775 |
puberty | -0.769 |
Token | That |
Token ID | 2504 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
elect | +7.551 |
events | +6.930 |
oops | +6.921 |
probably | +6.758 |
absolutely | +6.430 |
Neg logit contributions | |
curfew | -10.269 |
slang | -10.268 |
puberty | -10.206 |
stereotype | -10.125 |
ingrained | -9.807 |
Token | 's |
Token ID | 338 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
slang | +3.710 |
stereotype | +3.629 |
curfew | +3.507 |
ingrained | +3.471 |
mentality | +3.426 |
Neg logit contributions | |
elect | -3.251 |
events | -3.078 |
oops | -3.028 |
awaits | -2.893 |
probably | -2.794 |
Token | [ |
Token ID | 685 |
Feature activation | -5.63e-01 |
Pos logit contributions | |
elect | +1.227 |
events | +1.151 |
oops | +1.125 |
awaits | +1.102 |
probably | +1.089 |
Neg logit contributions | |
slang | -1.349 |
stereotype | -1.314 |
curfew | -1.293 |
puberty | -1.257 |
ingrained | -1.250 |
Token | a |
Token ID | 64 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
elect | +4.366 |
events | +4.041 |
oops | +3.951 |
probably | +3.874 |
absolutely | +3.703 |
Neg logit contributions | |
slang | -6.160 |
stereotype | -6.135 |
curfew | -6.034 |
puberty | -5.948 |
ingrained | -5.866 |
Token | ] |
Token ID | 60 |
Feature activation | +5.22e-01 |
Pos logit contributions | |
slang | +10.753 |
stereotype | +10.544 |
mentality | +9.795 |
curfew | +9.779 |
ingrained | +9.708 |
Neg logit contributions | |
elect | -12.148 |
events | -11.766 |
oops | -11.491 |
awaits | -11.006 |
absolutely | -10.567 |
Token | 60 |
Token ID | 3126 |
Feature activation | +8.46e-01 |
Pos logit contributions | |
slang | +5.061 |
stereotype | +4.957 |
curfew | +4.776 |
ingrained | +4.716 |
mentality | +4.665 |
Neg logit contributions | |
elect | -4.696 |
events | -4.478 |
oops | -4.410 |
awaits | -4.248 |
papers | -4.035 |
Token | , |
Token ID | 11 |
Feature activation | -8.85e-02 |
Pos logit contributions | |
slang | +7.269 |
stereotype | +7.146 |
mentality | +6.833 |
curfew | +6.784 |
ingrained | +6.662 |
Neg logit contributions | |
elect | -7.857 |
events | -7.632 |
oops | -7.297 |
awaits | -7.191 |
absolutely | -6.902 |
Token | 000 |
Token ID | 830 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
elect | +0.695 |
events | +0.647 |
oops | +0.638 |
awaits | +0.615 |
probably | +0.598 |
Neg logit contributions | |
slang | -0.970 |
stereotype | -0.948 |
curfew | -0.934 |
ingrained | -0.915 |
puberty | -0.912 |
Token | app |
Token ID | 598 |
Feature activation | +3.61e-01 |
Pos logit contributions | |
slang | +5.166 |
stereotype | +5.052 |
curfew | +4.865 |
ingrained | +4.778 |
mentality | +4.747 |
Neg logit contributions | |
elect | -6.054 |
events | -5.798 |
oops | -5.658 |
awaits | -5.506 |
probably | -5.330 |
Token | the |
Token ID | 262 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
elect | +10.952 |
events | +10.154 |
oops | +9.689 |
indeed | +9.391 |
awaits | +9.380 |
Neg logit contributions | |
slang | -8.973 |
stereotype | -8.324 |
ingrained | -8.099 |
curfew | -8.095 |
puberty | -7.755 |
Token | table |
Token ID | 3084 |
Feature activation | -9.55e-01 |
Pos logit contributions | |
elect | +11.531 |
events | +11.020 |
awaits | +9.942 |
oops | +9.923 |
probably | +9.846 |
Neg logit contributions | |
slang | -12.350 |
stereotype | -11.567 |
curfew | -11.472 |
puberty | -11.215 |
ingrained | -11.125 |
Token | since |
Token ID | 1201 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
elect | +8.175 |
events | +7.605 |
awaits | +7.323 |
oops | +7.112 |
indeed | +7.038 |
Neg logit contributions | |
slang | -8.928 |
stereotype | -8.728 |
curfew | -8.561 |
ingrained | -8.310 |
puberty | -8.268 |
Token | joining |
Token ID | 9679 |
Feature activation | +3.71e-01 |
Pos logit contributions | |
slang | +10.320 |
stereotype | +10.098 |
curfew | +9.839 |
puberty | +9.781 |
ingrained | +9.776 |
Neg logit contributions | |
elect | -10.811 |
oops | -10.562 |
events | -10.425 |
papers | -9.953 |
awaits | -9.884 |
Token | the |
Token ID | 262 |
Feature activation | -4.65e-01 |
Pos logit contributions | |
slang | +2.517 |
stereotype | +2.424 |
curfew | +2.340 |
ingrained | +2.292 |
puberty | +2.276 |
Neg logit contributions | |
elect | -4.417 |
events | -4.243 |
oops | -4.217 |
awaits | -4.117 |
probably | -4.009 |
Token | club |
Token ID | 3430 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
elect | +4.239 |
events | +4.000 |
oops | +3.834 |
awaits | +3.724 |
probably | +3.660 |
Neg logit contributions | |
slang | -4.399 |
stereotype | -4.216 |
curfew | -4.127 |
ingrained | -4.055 |
puberty | -4.035 |
Token | in |
Token ID | 287 |
Feature activation | +5.62e-01 |
Pos logit contributions | |
slang | +11.364 |
stereotype | +11.064 |
ingrained | +10.748 |
mentality | +10.739 |
puberty | +10.713 |
Neg logit contributions | |
elect | -13.196 |
oops | -13.103 |
events | -12.923 |
awaits | -12.228 |
probably | -12.013 |
Token | 1997 |
Token ID | 8309 |
Feature activation | +7.55e-01 |
Pos logit contributions | |
slang | +4.195 |
stereotype | +4.025 |
curfew | +3.882 |
ingrained | +3.810 |
puberty | +3.806 |
Neg logit contributions | |
elect | -6.346 |
events | -6.059 |
oops | -6.036 |
awaits | -5.854 |
probably | -5.702 |
Token | , |
Token ID | 11 |
Feature activation | +7.36e-01 |
Pos logit contributions | |
slang | +7.168 |
stereotype | +6.922 |
ingrained | +6.786 |
curfew | +6.697 |
puberty | +6.674 |
Neg logit contributions | |
elect | -6.530 |
events | -6.260 |
oops | -6.228 |
awaits | -5.823 |
probably | -5.762 |
Token | Putin |
Token ID | 8144 |
Feature activation | -3.67e-01 |
Pos logit contributions | |
slang | +6.458 |
stereotype | +6.308 |
ingrained | +6.130 |
curfew | +6.130 |
puberty | +5.975 |
Neg logit contributions | |
elect | -6.917 |
oops | -6.684 |
events | -6.553 |
awaits | -6.250 |
probably | -6.165 |
Token | will |
Token ID | 481 |
Feature activation | -9.09e-01 |
Pos logit contributions | |
elect | +3.109 |
events | +2.906 |
awaits | +2.876 |
oops | +2.821 |
probably | +2.686 |
Neg logit contributions | |
slang | -3.747 |
stereotype | -3.640 |
curfew | -3.589 |
puberty | -3.490 |
ingrained | -3.465 |
Token | due |
Token ID | 2233 |
Feature activation | +7.45e-01 |
Pos logit contributions | |
slang | +1.470 |
stereotype | +1.425 |
curfew | +1.389 |
ingrained | +1.376 |
puberty | +1.362 |
Neg logit contributions | |
elect | -1.141 |
events | -1.067 |
oops | -1.055 |
awaits | -1.020 |
probably | -0.982 |
Token | to |
Token ID | 284 |
Feature activation | +6.24e-01 |
Pos logit contributions | |
slang | +4.758 |
stereotype | +4.563 |
ingrained | +4.259 |
curfew | +4.259 |
mentality | +4.180 |
Neg logit contributions | |
elect | -8.788 |
oops | -8.429 |
events | -8.377 |
awaits | -8.274 |
absolutely | -8.017 |
Token | technology |
Token ID | 3037 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
slang | +5.563 |
stereotype | +5.408 |
ingrained | +5.208 |
curfew | +5.186 |
puberty | +5.050 |
Neg logit contributions | |
elect | -6.060 |
events | -5.739 |
oops | -5.691 |
awaits | -5.573 |
probably | -5.325 |
Token | limitations |
Token ID | 11247 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
slang | +11.058 |
stereotype | +10.756 |
ingrained | +10.662 |
curfew | +10.303 |
mentality | +10.232 |
Neg logit contributions | |
elect | -9.960 |
events | -9.470 |
oops | -9.311 |
awaits | -8.931 |
probably | -8.630 |
Token | . |
Token ID | 13 |
Feature activation | +7.02e-01 |
Pos logit contributions | |
slang | +10.449 |
ingrained | +10.291 |
stereotype | +10.162 |
mentality | +9.834 |
worn | +9.798 |
Neg logit contributions | |
elect | -9.869 |
events | -9.508 |
oops | -9.240 |
awaits | -8.904 |
absolutely | -8.602 |
Token | That |
Token ID | 1320 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
slang | +6.881 |
stereotype | +6.663 |
curfew | +6.375 |
ingrained | +6.339 |
mentality | +6.284 |
Neg logit contributions | |
elect | -6.064 |
events | -5.674 |
oops | -5.603 |
awaits | -5.454 |
absolutely | -5.208 |
Token | correspondence |
Token ID | 22440 |
Feature activation | +4.65e-02 |
Pos logit contributions | |
slang | +15.517 |
stereotype | +15.196 |
mentality | +14.906 |
ingrained | +14.807 |
tradition | +14.629 |
Neg logit contributions | |
elect | -11.639 |
events | -10.994 |
oops | -10.583 |
awaits | -10.021 |
papers | -9.659 |
Token | no |
Token ID | 645 |
Feature activation | +5.69e-01 |
Pos logit contributions | |
slang | +0.504 |
stereotype | +0.491 |
curfew | +0.481 |
ingrained | +0.473 |
puberty | +0.471 |
Neg logit contributions | |
elect | -0.371 |
events | -0.347 |
oops | -0.341 |
awaits | -0.331 |
probably | -0.318 |
Token | longer |
Token ID | 2392 |
Feature activation | +6.37e-01 |
Pos logit contributions | |
slang | +3.494 |
stereotype | +3.347 |
curfew | +3.193 |
ingrained | +3.143 |
puberty | +3.047 |
Neg logit contributions | |
elect | -7.038 |
events | -6.792 |
oops | -6.703 |
awaits | -6.544 |
probably | -6.415 |
Token | holds |
Token ID | 6622 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
slang | +7.167 |
stereotype | +7.097 |
ingrained | +6.927 |
curfew | +6.789 |
worn | +6.750 |
Neg logit contributions | |
elect | -4.600 |
events | -4.262 |
oops | -4.247 |
probably | -3.824 |
absolutely | -3.766 |
Token | so |
Token ID | 523 |
Feature activation | +4.84e-01 |
Pos logit contributions | |
slang | +3.926 |
stereotype | +3.791 |
curfew | +3.677 |
ingrained | +3.650 |
puberty | +3.618 |
Neg logit contributions | |
elect | -3.917 |
events | -3.722 |
oops | -3.678 |
awaits | -3.536 |
probably | -3.466 |
Token | added |
Token ID | 2087 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
slang | +3.313 |
stereotype | +3.220 |
curfew | +3.119 |
ingrained | +3.086 |
puberty | +3.042 |
Neg logit contributions | |
elect | -4.069 |
events | -3.859 |
oops | -3.840 |
awaits | -3.708 |
probably | -3.601 |
Token | enough |
Token ID | 1576 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
slang | +2.188 |
stereotype | +2.121 |
curfew | +2.063 |
ingrained | +2.028 |
puberty | +2.011 |
Neg logit contributions | |
elect | -2.448 |
events | -2.319 |
oops | -2.289 |
awaits | -2.229 |
probably | -2.161 |
Token | of |
Token ID | 286 |
Feature activation | +5.43e-01 |
Pos logit contributions | |
slang | +1.413 |
stereotype | +1.364 |
curfew | +1.323 |
ingrained | +1.296 |
puberty | +1.284 |
Neg logit contributions | |
elect | -1.975 |
events | -1.883 |
oops | -1.856 |
awaits | -1.817 |
probably | -1.765 |
Token | a |
Token ID | 257 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
slang | +4.522 |
stereotype | +4.394 |
curfew | +4.238 |
ingrained | +4.188 |
puberty | +4.159 |
Neg logit contributions | |
elect | -5.574 |
events | -5.288 |
oops | -5.257 |
awaits | -5.104 |
probably | -4.965 |
Token | defensive |
Token ID | 6110 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
slang | +9.351 |
stereotype | +9.261 |
mentality | +9.004 |
curfew | +8.906 |
ingrained | +8.744 |
Neg logit contributions | |
elect | -11.520 |
events | -11.043 |
oops | -10.984 |
awaits | -10.383 |
probably | -10.321 |
Token | facet |
Token ID | 39144 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
mentality | +12.288 |
slang | +12.233 |
stereotype | +12.229 |
leash | +11.348 |
proficiency | +11.331 |
Neg logit contributions | |
elect | -15.553 |
events | -15.455 |
oops | -14.828 |
papers | -13.864 |
probably | -13.780 |
Token | to |
Token ID | 284 |
Feature activation | +8.48e-01 |
Pos logit contributions | |
slang | +11.587 |
stereotype | +11.297 |
ingrained | +11.236 |
mentality | +11.053 |
worn | +10.820 |
Neg logit contributions | |
elect | -13.539 |
events | -13.126 |
oops | -12.576 |
awaits | -12.423 |
probably | -12.194 |
Token | his |
Token ID | 465 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
slang | +7.401 |
stereotype | +7.284 |
curfew | +6.984 |
ingrained | +6.955 |
puberty | +6.807 |
Neg logit contributions | |
elect | -8.091 |
events | -7.725 |
oops | -7.672 |
awaits | -7.425 |
probably | -7.136 |
Token | game |
Token ID | 983 |
Feature activation | +6.99e-01 |
Pos logit contributions | |
slang | +2.891 |
stereotype | +2.800 |
curfew | +2.699 |
ingrained | +2.667 |
puberty | +2.625 |
Neg logit contributions | |
elect | -3.816 |
events | -3.632 |
oops | -3.591 |
awaits | -3.504 |
probably | -3.402 |
Token | to |
Token ID | 284 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
slang | +5.970 |
stereotype | +5.805 |
curfew | +5.612 |
ingrained | +5.590 |
mentality | +5.545 |
Neg logit contributions | |
elect | -6.854 |
events | -6.530 |
oops | -6.472 |
awaits | -6.267 |
probably | -6.130 |
Token | truly |
Token ID | 4988 |
Feature activation | +4.52e-01 |
Pos logit contributions | |
slang | +4.531 |
stereotype | +4.432 |
curfew | +4.283 |
ingrained | +4.226 |
puberty | +4.172 |
Neg logit contributions | |
elect | -4.687 |
events | -4.463 |
oops | -4.404 |
awaits | -4.264 |
probably | -4.108 |
Token | ented |
Token ID | 4714 |
Feature activation | +4.16e-01 |
Pos logit contributions | |
slang | +3.854 |
stereotype | +3.730 |
curfew | +3.581 |
ingrained | +3.553 |
puberty | +3.516 |
Neg logit contributions | |
elect | -4.544 |
events | -4.369 |
oops | -4.260 |
awaits | -4.235 |
probably | -4.029 |
Token | with |
Token ID | 351 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
slang | +3.501 |
stereotype | +3.330 |
curfew | +3.213 |
ingrained | +3.171 |
puberty | +3.146 |
Neg logit contributions | |
elect | -4.314 |
events | -4.139 |
oops | -4.099 |
awaits | -3.975 |
probably | -3.833 |
Token | gold |
Token ID | 3869 |
Feature activation | +8.82e-01 |
Pos logit contributions | |
slang | +2.751 |
stereotype | +2.650 |
curfew | +2.567 |
ingrained | +2.532 |
puberty | +2.506 |
Neg logit contributions | |
elect | -3.055 |
events | -2.910 |
oops | -2.877 |
awaits | -2.793 |
probably | -2.696 |
Token | designs |
Token ID | 9824 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
slang | +8.362 |
stereotype | +7.936 |
ingrained | +7.668 |
worn | +7.609 |
curfew | +7.504 |
Neg logit contributions | |
elect | -7.767 |
events | -7.423 |
oops | -7.419 |
awaits | -6.977 |
probably | -6.836 |
Token | and |
Token ID | 290 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
slang | +5.018 |
stereotype | +4.835 |
ingrained | +4.728 |
curfew | +4.649 |
worn | +4.638 |
Neg logit contributions | |
elect | -4.497 |
events | -4.287 |
oops | -4.192 |
awaits | -4.009 |
probably | -3.902 |
Token | a |
Token ID | 257 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
slang | +1.494 |
stereotype | +1.450 |
curfew | +1.413 |
ingrained | +1.393 |
puberty | +1.380 |
Neg logit contributions | |
elect | -1.387 |
events | -1.309 |
oops | -1.291 |
awaits | -1.247 |
probably | -1.208 |
Token | plate |
Token ID | 7480 |
Feature activation | +7.10e-01 |
Pos logit contributions | |
slang | +9.167 |
stereotype | +8.857 |
curfew | +8.495 |
worn | +8.431 |
ingrained | +8.267 |
Neg logit contributions | |
elect | -9.522 |
events | -9.341 |
oops | -9.104 |
awaits | -8.667 |
absolutely | -8.410 |
Token | that |
Token ID | 326 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
slang | +6.643 |
stereotype | +6.454 |
curfew | +6.194 |
ingrained | +6.186 |
worn | +6.146 |
Neg logit contributions | |
elect | -6.451 |
events | -6.262 |
oops | -6.109 |
awaits | -5.760 |
probably | -5.650 |
Token | says |
Token ID | 1139 |
Feature activation | +1.76e-01 |
Pos logit contributions | |
slang | +2.375 |
stereotype | +2.317 |
curfew | +2.260 |
ingrained | +2.238 |
puberty | +2.214 |
Neg logit contributions | |
elect | -1.539 |
events | -1.432 |
oops | -1.406 |
awaits | -1.337 |
probably | -1.290 |
Token | � |
Token ID | 564 |
Feature activation | -1.42e-03 |
Pos logit contributions | |
slang | +1.699 |
stereotype | +1.647 |
curfew | +1.604 |
ingrained | +1.581 |
puberty | +1.570 |
Neg logit contributions | |
elect | -1.613 |
events | -1.523 |
oops | -1.500 |
awaits | -1.458 |
probably | -1.405 |
Token | � |
Token ID | 250 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
elect | +0.014 |
events | +0.013 |
oops | +0.013 |
awaits | +0.012 |
probably | +0.012 |
Neg logit contributions | |
slang | -0.013 |
stereotype | -0.013 |
curfew | -0.013 |
ingrained | -0.012 |
puberty | -0.012 |
Token | aku |
Token ID | 8719 |
Feature activation | +8.46e-01 |
Pos logit contributions | |
slang | +4.201 |
stereotype | +4.009 |
curfew | +3.912 |
ingrained | +3.806 |
puberty | +3.731 |
Neg logit contributions | |
elect | -6.483 |
events | -6.197 |
oops | -6.070 |
awaits | -6.062 |
probably | -5.826 |
Token | za |
Token ID | 4496 |
Feature activation | +9.05e-01 |
Pos logit contributions | |
slang | +6.428 |
stereotype | +6.197 |
curfew | +5.936 |
ingrained | +5.742 |
mentality | +5.741 |
Neg logit contributions | |
elect | -8.813 |
events | -8.428 |
oops | -8.413 |
awaits | -8.257 |
probably | -7.909 |
Token | " |
Token ID | 1 |
Feature activation | +3.95e-01 |
Pos logit contributions | |
slang | +7.793 |
stereotype | +7.529 |
curfew | +7.277 |
ingrained | +7.099 |
mentality | +7.036 |
Neg logit contributions | |
elect | -8.858 |
events | -8.458 |
oops | -8.454 |
awaits | -8.047 |
probably | -7.878 |
Token | gang |
Token ID | 7706 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
slang | +3.349 |
stereotype | +3.240 |
curfew | +3.146 |
ingrained | +3.084 |
puberty | +3.046 |
Neg logit contributions | |
elect | -4.087 |
events | -3.892 |
oops | -3.856 |
awaits | -3.741 |
probably | -3.635 |
Token | , |
Token ID | 11 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
slang | +4.411 |
stereotype | +4.282 |
curfew | +4.177 |
ingrained | +4.102 |
puberty | +4.047 |
Neg logit contributions | |
elect | -3.729 |
events | -3.540 |
oops | -3.491 |
awaits | -3.364 |
probably | -3.232 |
Token | the |
Token ID | 262 |
Feature activation | +6.32e-03 |
Pos logit contributions | |
slang | +1.060 |
stereotype | +1.028 |
curfew | +1.000 |
ingrained | +0.984 |
puberty | +0.976 |
Neg logit contributions | |
elect | -1.150 |
events | -1.089 |
oops | -1.074 |
awaits | -1.047 |
probably | -1.014 |
Token | Yam |
Token ID | 14063 |
Feature activation | -8.84e-02 |
Pos logit contributions | |
slang | +0.059 |
stereotype | +0.057 |
curfew | +0.055 |
ingrained | +0.054 |
puberty | +0.054 |
Neg logit contributions | |
elect | -0.060 |
events | -0.057 |
oops | -0.056 |
awaits | -0.055 |
probably | -0.053 |
Token | ag |
Token ID | 363 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
elect | +0.657 |
events | +0.611 |
oops | +0.600 |
awaits | +0.576 |
probably | +0.554 |
Neg logit contributions | |
slang | -1.009 |
stereotype | -0.987 |
curfew | -0.967 |
ingrained | -0.954 |
puberty | -0.947 |
Token | uchi |
Token ID | 22200 |
Feature activation | +7.16e-01 |
Pos logit contributions | |
slang | +2.229 |
stereotype | +2.150 |
curfew | +2.089 |
ingrained | +2.041 |
puberty | +2.014 |
Neg logit contributions | |
elect | -3.195 |
events | -3.056 |
oops | -3.020 |
awaits | -2.963 |
probably | -2.865 |
Token | - |
Token ID | 12 |
Feature activation | -5.23e-01 |
Pos logit contributions | |
slang | +5.461 |
stereotype | +5.216 |
curfew | +5.080 |
ingrained | +4.893 |
mentality | +4.851 |
Neg logit contributions | |
elect | -7.722 |
events | -7.473 |
oops | -7.371 |
awaits | -7.112 |
probably | -6.939 |
Token | g |
Token ID | 70 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
elect | +4.340 |
events | +4.049 |
oops | +3.933 |
awaits | +3.751 |
probably | +3.706 |
Neg logit contributions | |
slang | -5.426 |
stereotype | -5.319 |
curfew | -5.170 |
ingrained | -5.132 |
puberty | -5.104 |
Token | Corporation |
Token ID | 10501 |
Feature activation | +2.95e-01 |
Pos logit contributions | |
slang | +3.877 |
stereotype | +3.719 |
curfew | +3.658 |
ingrained | +3.490 |
mentality | +3.436 |
Neg logit contributions | |
elect | -6.771 |
events | -6.585 |
oops | -6.546 |
awaits | -6.315 |
absolutely | -6.186 |
Token | ( |
Token ID | 357 |
Feature activation | +3.77e-01 |
Pos logit contributions | |
slang | +2.991 |
stereotype | +2.908 |
curfew | +2.848 |
ingrained | +2.811 |
puberty | +2.785 |
Neg logit contributions | |
elect | -2.533 |
events | -2.394 |
oops | -2.362 |
awaits | -2.274 |
probably | -2.197 |
Token | MF |
Token ID | 49800 |
Feature activation | +6.44e-01 |
Pos logit contributions | |
slang | +3.452 |
stereotype | +3.343 |
curfew | +3.274 |
ingrained | +3.214 |
puberty | +3.209 |
Neg logit contributions | |
elect | -3.551 |
events | -3.370 |
oops | -3.318 |
awaits | -3.255 |
probably | -3.084 |
Token | SC |
Token ID | 6173 |
Feature activation | +6.20e-01 |
Pos logit contributions | |
slang | +6.223 |
stereotype | +6.034 |
curfew | +5.947 |
ingrained | +5.779 |
puberty | +5.727 |
Neg logit contributions | |
elect | -5.496 |
oops | -5.248 |
events | -5.217 |
awaits | -5.118 |
probably | -4.868 |
Token | DC |
Token ID | 9697 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
slang | +4.974 |
stereotype | +4.769 |
curfew | +4.656 |
ingrained | +4.555 |
puberty | +4.499 |
Neg logit contributions | |
elect | -6.361 |
events | -6.137 |
oops | -6.047 |
awaits | -5.968 |
absolutely | -5.738 |
Token | ). |
Token ID | 737 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
slang | +6.711 |
stereotype | +6.297 |
curfew | +6.160 |
ingrained | +5.974 |
puberty | +5.894 |
Neg logit contributions | |
elect | -11.206 |
events | -10.866 |
oops | -10.852 |
awaits | -10.597 |
absolutely | -10.303 |
Token |
|
Token ID | 198 |
Feature activation | +5.87e-01 |
Pos logit contributions | |
slang | +1.382 |
stereotype | +1.339 |
curfew | +1.307 |
ingrained | +1.281 |
puberty | +1.279 |
Neg logit contributions | |
elect | -1.303 |
events | -1.232 |
oops | -1.221 |
awaits | -1.176 |
probably | -1.140 |
Token |
|
Token ID | 198 |
Feature activation | +4.95e-01 |
Pos logit contributions | |
slang | +5.262 |
stereotype | +5.039 |
curfew | +4.866 |
ingrained | +4.840 |
puberty | +4.754 |
Neg logit contributions | |
elect | -5.533 |
events | -5.235 |
oops | -5.226 |
awaits | -5.111 |
probably | -4.831 |
Token | The |
Token ID | 464 |
Feature activation | +8.31e-02 |
Pos logit contributions | |
slang | +4.523 |
stereotype | +4.332 |
curfew | +4.248 |
ingrained | +4.176 |
puberty | +4.151 |
Neg logit contributions | |
elect | -4.510 |
events | -4.288 |
oops | -4.260 |
awaits | -4.218 |
probably | -3.978 |
Token | high |
Token ID | 1029 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
slang | +0.720 |
stereotype | +0.698 |
curfew | +0.678 |
ingrained | +0.667 |
puberty | +0.660 |
Neg logit contributions | |
elect | -0.844 |
events | -0.801 |
oops | -0.790 |
awaits | -0.771 |
probably | -0.747 |
Token | court |
Token ID | 2184 |
Feature activation | +3.61e-01 |
Pos logit contributions | |
slang | +2.672 |
stereotype | +2.556 |
curfew | +2.506 |
puberty | +2.425 |
ingrained | +2.415 |
Neg logit contributions | |
elect | -4.346 |
events | -4.178 |
oops | -4.151 |
awaits | -4.012 |
probably | -3.938 |
Token | FDA |
Token ID | 14672 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
slang | +5.444 |
stereotype | +5.276 |
curfew | +5.144 |
ingrained | +5.006 |
puberty | +4.994 |
Neg logit contributions | |
elect | -5.394 |
events | -5.164 |
oops | -5.062 |
awaits | -4.906 |
probably | -4.787 |
Token | announces |
Token ID | 26459 |
Feature activation | -8.51e-01 |
Pos logit contributions | |
slang | +1.956 |
stereotype | +1.908 |
curfew | +1.866 |
ingrained | +1.841 |
puberty | +1.827 |
Neg logit contributions | |
elect | -1.430 |
events | -1.336 |
oops | -1.314 |
awaits | -1.273 |
probably | -1.220 |
Token | new |
Token ID | 649 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
elect | +8.677 |
oops | +8.243 |
awaits | +8.104 |
events | +8.081 |
probably | +7.687 |
Neg logit contributions | |
slang | -6.384 |
stereotype | -6.209 |
ingrained | -6.004 |
curfew | -5.849 |
mentality | -5.736 |
Token | plan |
Token ID | 1410 |
Feature activation | -6.57e-01 |
Pos logit contributions | |
slang | +1.879 |
stereotype | +1.817 |
curfew | +1.765 |
ingrained | +1.731 |
puberty | +1.718 |
Neg logit contributions | |
elect | -2.364 |
events | -2.247 |
oops | -2.218 |
awaits | -2.164 |
probably | -2.101 |
Token | to |
Token ID | 284 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
elect | +6.730 |
oops | +6.351 |
awaits | +6.292 |
events | +6.247 |
papers | +5.916 |
Neg logit contributions | |
slang | -5.317 |
stereotype | -5.201 |
curfew | -4.998 |
ingrained | -4.873 |
puberty | -4.778 |
Token | curb |
Token ID | 20799 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
slang | +0.162 |
stereotype | +0.155 |
curfew | +0.152 |
ingrained | +0.149 |
puberty | +0.147 |
Neg logit contributions | |
elect | -0.220 |
events | -0.208 |
oops | -0.207 |
awaits | -0.203 |
probably | -0.198 |
Token | tobacco |
Token ID | 11219 |
Feature activation | +6.76e-01 |
Pos logit contributions | |
slang | +0.979 |
stereotype | +0.949 |
curfew | +0.924 |
ingrained | +0.908 |
puberty | +0.897 |
Neg logit contributions | |
elect | -1.126 |
events | -1.066 |
oops | -1.052 |
awaits | -1.027 |
probably | -0.995 |
Token | 11 |
Token ID | 1367 |
Feature activation | +4.26e-01 |
Pos logit contributions | |
slang | +5.793 |
stereotype | +5.607 |
curfew | +5.448 |
ingrained | +5.343 |
puberty | +5.304 |
Neg logit contributions | |
elect | -6.856 |
events | -6.534 |
oops | -6.444 |
awaits | -6.139 |
probably | -6.029 |
Token | : |
Token ID | 25 |
Feature activation | +3.88e-01 |
Pos logit contributions | |
slang | +4.081 |
stereotype | +3.967 |
curfew | +3.864 |
ingrained | +3.812 |
puberty | +3.750 |
Neg logit contributions | |
elect | -3.872 |
events | -3.678 |
oops | -3.627 |
awaits | -3.534 |
probably | -3.398 |
Token | 50 |
Token ID | 1120 |
Feature activation | +4.15e-01 |
Pos logit contributions | |
slang | +3.801 |
stereotype | +3.660 |
curfew | +3.531 |
ingrained | +3.514 |
puberty | +3.445 |
Neg logit contributions | |
elect | -3.433 |
events | -3.227 |
oops | -3.195 |
awaits | -3.129 |
probably | -2.954 |
Token | AM |
Token ID | 3001 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
slang | +3.666 |
stereotype | +3.555 |
curfew | +3.474 |
ingrained | +3.437 |
mentality | +3.337 |
Neg logit contributions | |
elect | -4.041 |
events | -3.875 |
oops | -3.848 |
awaits | -3.717 |
probably | -3.564 |
Token | of |
Token ID | 286 |
Feature activation | -5.74e-01 |
Pos logit contributions | |
elect | +2.319 |
events | +2.163 |
oops | +2.130 |
awaits | +2.067 |
probably | +1.986 |
Neg logit contributions | |
slang | -2.937 |
stereotype | -2.868 |
curfew | -2.801 |
ingrained | -2.757 |
puberty | -2.743 |
Token | the |
Token ID | 262 |
Feature activation | -5.60e-01 |
Pos logit contributions | |
elect | +5.763 |
events | +5.418 |
oops | +5.296 |
awaits | +5.165 |
probably | +5.010 |
Neg logit contributions | |
slang | -4.776 |
stereotype | -4.627 |
curfew | -4.505 |
ingrained | -4.449 |
puberty | -4.408 |
Token | Future |
Token ID | 10898 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
elect | +5.526 |
events | +5.201 |
oops | +5.056 |
awaits | +4.940 |
probably | +4.765 |
Neg logit contributions | |
slang | -4.717 |
stereotype | -4.600 |
curfew | -4.482 |
ingrained | -4.447 |
puberty | -4.444 |
Token | Crimes |
Token ID | 32655 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
elect | +3.227 |
events | +3.075 |
oops | +3.022 |
awaits | +2.940 |
probably | +2.868 |
Neg logit contributions | |
slang | -2.692 |
stereotype | -2.627 |
curfew | -2.553 |
ingrained | -2.526 |
puberty | -2.520 |
Token | Institute |
Token ID | 5136 |
Feature activation | -4.58e-02 |
Pos logit contributions | |
elect | +1.789 |
events | +1.685 |
oops | +1.653 |
awaits | +1.625 |
probably | +1.563 |
Neg logit contributions | |
slang | -1.575 |
stereotype | -1.527 |
curfew | -1.485 |
puberty | -1.467 |
ingrained | -1.466 |
Token | and |
Token ID | 290 |
Feature activation | +3.92e-01 |
Pos logit contributions | |
elect | +0.379 |
events | +0.354 |
oops | +0.348 |
awaits | +0.338 |
probably | +0.324 |
Neg logit contributions | |
slang | -0.484 |
stereotype | -0.472 |
curfew | -0.462 |
ingrained | -0.454 |
puberty | -0.452 |
Token | the |
Token ID | 262 |
Feature activation | -8.53e-02 |
Pos logit contributions | |
slang | +3.291 |
stereotype | +3.178 |
curfew | +3.093 |
ingrained | +3.037 |
puberty | +2.998 |
Neg logit contributions | |
elect | -4.058 |
events | -3.868 |
oops | -3.843 |
awaits | -3.698 |
probably | -3.613 |
Token | Chair |
Token ID | 9369 |
Feature activation | -6.54e-01 |
Pos logit contributions | |
elect | +0.937 |
events | +0.890 |
oops | +0.872 |
awaits | +0.860 |
probably | +0.833 |
Neg logit contributions | |
slang | -0.662 |
stereotype | -0.641 |
curfew | -0.621 |
ingrained | -0.612 |
puberty | -0.608 |
Token | for |
Token ID | 329 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
elect | +4.876 |
events | +4.374 |
oops | +4.254 |
awaits | +4.183 |
probably | +3.992 |
Neg logit contributions | |
slang | -7.339 |
stereotype | -7.206 |
curfew | -7.099 |
ingrained | -6.932 |
puberty | -6.925 |
Token | Policy |
Token ID | 7820 |
Feature activation | -5.24e-01 |
Pos logit contributions | |
elect | +2.823 |
events | +2.671 |
oops | +2.602 |
awaits | +2.543 |
probably | +2.483 |
Neg logit contributions | |
slang | -2.067 |
stereotype | -1.995 |
curfew | -1.935 |
ingrained | -1.915 |
puberty | -1.886 |
Token | , |
Token ID | 11 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
elect | +4.995 |
events | +4.613 |
oops | +4.518 |
awaits | +4.448 |
papers | +4.286 |
Neg logit contributions | |
slang | -4.846 |
stereotype | -4.720 |
curfew | -4.632 |
ingrained | -4.501 |
puberty | -4.473 |
Token | are |
Token ID | 389 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
elect | +1.832 |
events | +1.727 |
oops | +1.702 |
awaits | +1.678 |
probably | +1.628 |
Neg logit contributions | |
slang | -1.773 |
stereotype | -1.706 |
curfew | -1.688 |
puberty | -1.648 |
ingrained | -1.648 |
Token | separate |
Token ID | 4553 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
elect | +9.963 |
indeed | +9.531 |
events | +9.314 |
awaits | +9.194 |
probably | +9.013 |
Neg logit contributions | |
stereotype | -8.050 |
slang | -7.982 |
curfew | -7.883 |
puberty | -7.582 |
leash | -7.473 |
Token | from |
Token ID | 422 |
Feature activation | +6.05e-01 |
Pos logit contributions | |
elect | +10.450 |
events | +10.024 |
awaits | +9.630 |
indeed | +9.618 |
oops | +9.514 |
Neg logit contributions | |
stereotype | -9.936 |
slang | -9.864 |
curfew | -9.681 |
puberty | -9.351 |
ingrained | -9.330 |
Token | the |
Token ID | 262 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
slang | +5.246 |
stereotype | +5.051 |
curfew | +4.956 |
ingrained | +4.860 |
puberty | +4.819 |
Neg logit contributions | |
elect | -5.993 |
events | -5.651 |
oops | -5.632 |
awaits | -5.448 |
probably | -5.316 |
Token | hundreds |
Token ID | 5179 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
elect | +2.206 |
events | +2.084 |
oops | +2.047 |
awaits | +2.003 |
probably | +1.937 |
Neg logit contributions | |
slang | -2.209 |
stereotype | -2.146 |
curfew | -2.079 |
ingrained | -2.058 |
puberty | -2.044 |
Token | of |
Token ID | 286 |
Feature activation | -6.49e-01 |
Pos logit contributions | |
elect | +2.069 |
events | +1.924 |
oops | +1.890 |
awaits | +1.842 |
probably | +1.758 |
Neg logit contributions | |
slang | -2.848 |
stereotype | -2.782 |
curfew | -2.722 |
ingrained | -2.675 |
puberty | -2.666 |
Token | hours |
Token ID | 2250 |
Feature activation | +9.53e-01 |
Pos logit contributions | |
elect | +5.441 |
events | +5.057 |
awaits | +4.926 |
oops | +4.912 |
indeed | +4.734 |
Neg logit contributions | |
slang | -6.318 |
stereotype | -6.213 |
curfew | -6.044 |
puberty | -5.967 |
ingrained | -5.907 |
Token | of |
Token ID | 286 |
Feature activation | -1.44e-01 |
Pos logit contributions | |
slang | +8.987 |
stereotype | +8.676 |
ingrained | +8.585 |
curfew | +8.539 |
worn | +8.481 |
Neg logit contributions | |
elect | -8.244 |
events | -7.932 |
oops | -7.810 |
awaits | -7.314 |
probably | -7.236 |
Token | videot |
Token ID | 35026 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
elect | +1.289 |
events | +1.209 |
oops | +1.188 |
awaits | +1.166 |
probably | +1.119 |
Neg logit contributions | |
slang | -1.411 |
stereotype | -1.381 |
curfew | -1.343 |
puberty | -1.319 |
ingrained | -1.317 |
Token | ape |
Token ID | 1758 |
Feature activation | +3.87e-01 |
Pos logit contributions | |
elect | +2.464 |
events | +2.279 |
oops | +2.268 |
awaits | +2.113 |
probably | +2.059 |
Neg logit contributions | |
slang | -3.487 |
stereotype | -3.427 |
curfew | -3.330 |
ingrained | -3.277 |
puberty | -3.246 |
Token | of |
Token ID | 286 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
slang | +3.878 |
stereotype | +3.754 |
curfew | +3.671 |
ingrained | +3.632 |
puberty | +3.589 |
Neg logit contributions | |
elect | -3.380 |
events | -3.192 |
oops | -3.142 |
awaits | -3.022 |
probably | -2.953 |
Token | alcohol |
Token ID | 5548 |
Feature activation | -3.22e-01 |
Pos logit contributions | |
elect | +8.572 |
awaits | +7.664 |
events | +7.636 |
oops | +7.602 |
indeed | +7.596 |
Neg logit contributions | |
slang | -8.374 |
stereotype | -8.236 |
curfew | -8.017 |
ingrained | -7.976 |
mentality | -7.789 |
Token | . |
Token ID | 13 |
Feature activation | -6.65e-01 |
Pos logit contributions | |
elect | +2.757 |
events | +2.556 |
oops | +2.526 |
awaits | +2.464 |
probably | +2.378 |
Neg logit contributions | |
slang | -3.263 |
stereotype | -3.201 |
curfew | -3.130 |
ingrained | -3.083 |
puberty | -3.052 |
Token | What |
Token ID | 1867 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
elect | +5.199 |
events | +4.799 |
oops | +4.732 |
probably | +4.540 |
awaits | +4.471 |
Neg logit contributions | |
slang | -6.894 |
curfew | -6.837 |
stereotype | -6.829 |
ingrained | -6.708 |
puberty | -6.615 |
Token | you |
Token ID | 345 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
slang | +1.398 |
stereotype | +1.361 |
curfew | +1.332 |
ingrained | +1.312 |
puberty | +1.302 |
Neg logit contributions | |
elect | -1.119 |
events | -1.047 |
oops | -1.030 |
awaits | -1.004 |
probably | -0.963 |
Token | experience |
Token ID | 1998 |
Feature activation | -5.74e-01 |
Pos logit contributions | |
slang | +3.106 |
stereotype | +3.022 |
curfew | +2.945 |
ingrained | +2.901 |
puberty | +2.880 |
Neg logit contributions | |
elect | -2.826 |
events | -2.665 |
oops | -2.624 |
awaits | -2.547 |
probably | -2.456 |
Token | will |
Token ID | 481 |
Feature activation | -5.28e-01 |
Pos logit contributions | |
elect | +5.398 |
awaits | +5.059 |
events | +5.022 |
oops | +4.867 |
probably | +4.769 |
Neg logit contributions | |
slang | -5.118 |
stereotype | -5.007 |
curfew | -4.879 |
ingrained | -4.709 |
puberty | -4.618 |
Token | be |
Token ID | 307 |
Feature activation | -4.05e-01 |
Pos logit contributions | |
elect | +5.112 |
events | +4.740 |
probably | +4.661 |
indeed | +4.631 |
awaits | +4.607 |
Neg logit contributions | |
slang | -4.574 |
curfew | -4.344 |
stereotype | -4.314 |
puberty | -4.234 |
ingrained | -4.186 |
Token | more |
Token ID | 517 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
elect | +3.927 |
events | +3.683 |
oops | +3.556 |
awaits | +3.555 |
probably | +3.511 |
Neg logit contributions | |
slang | -3.509 |
stereotype | -3.424 |
curfew | -3.345 |
puberty | -3.216 |
ingrained | -3.183 |
Token | intense |
Token ID | 8157 |
Feature activation | -6.64e-01 |
Pos logit contributions | |
elect | +2.852 |
events | +2.682 |
awaits | +2.611 |
oops | +2.591 |
probably | +2.544 |
Neg logit contributions | |
slang | -2.378 |
stereotype | -2.313 |
curfew | -2.254 |
puberty | -2.170 |
ingrained | -2.149 |
Token | than |
Token ID | 621 |
Feature activation | -7.67e-01 |
Pos logit contributions | |
elect | +5.947 |
events | +5.547 |
awaits | +5.488 |
oops | +5.317 |
indeed | +5.289 |
Neg logit contributions | |
slang | -6.038 |
stereotype | -5.939 |
curfew | -5.818 |
ingrained | -5.626 |
puberty | -5.529 |
Token | 4 |
Token ID | 604 |
Feature activation | -8.06e-01 |
Pos logit contributions | |
elect | +6.868 |
events | +6.390 |
awaits | +6.320 |
oops | +6.271 |
indeed | +6.171 |
Neg logit contributions | |
slang | -6.720 |
stereotype | -6.542 |
curfew | -6.414 |
ingrained | -6.308 |
leash | -6.218 |
Token | 70 |
Token ID | 4317 |
Feature activation | +3.13e-01 |
Pos logit contributions | |
elect | +1.629 |
events | +1.532 |
oops | +1.502 |
awaits | +1.473 |
probably | +1.434 |
Neg logit contributions | |
slang | -1.430 |
stereotype | -1.377 |
curfew | -1.336 |
ingrained | -1.317 |
puberty | -1.306 |
Token | in |
Token ID | 259 |
Feature activation | +8.72e-02 |
Pos logit contributions | |
slang | +2.937 |
stereotype | +2.851 |
curfew | +2.783 |
ingrained | +2.732 |
puberty | +2.709 |
Neg logit contributions | |
elect | -2.938 |
events | -2.785 |
oops | -2.744 |
awaits | -2.663 |
probably | -2.580 |
Token | Plasma |
Token ID | 31226 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
slang | +0.848 |
stereotype | +0.824 |
curfew | +0.804 |
ingrained | +0.792 |
puberty | +0.786 |
Neg logit contributions | |
elect | -0.794 |
events | -0.749 |
oops | -0.738 |
awaits | -0.717 |
probably | -0.693 |
Token | sound |
Token ID | 2128 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
slang | +1.094 |
stereotype | +1.064 |
curfew | +1.036 |
ingrained | +1.019 |
puberty | +1.011 |
Neg logit contributions | |
elect | -1.092 |
events | -1.032 |
oops | -1.018 |
awaits | -0.988 |
probably | -0.956 |
Token | as |
Token ID | 355 |
Feature activation | -5.47e-03 |
Pos logit contributions | |
elect | +4.278 |
events | +4.031 |
oops | +3.943 |
awaits | +3.882 |
probably | +3.800 |
Neg logit contributions | |
slang | -3.338 |
stereotype | -3.197 |
curfew | -3.090 |
ingrained | -3.055 |
puberty | -3.020 |
Token | if |
Token ID | 611 |
Feature activation | -4.02e-01 |
Pos logit contributions | |
elect | +0.049 |
events | +0.046 |
oops | +0.046 |
awaits | +0.044 |
probably | +0.043 |
Neg logit contributions | |
slang | -0.054 |
stereotype | -0.052 |
curfew | -0.051 |
ingrained | -0.050 |
puberty | -0.050 |
Token | im |
Token ID | 545 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
elect | +3.862 |
events | +3.635 |
oops | +3.584 |
awaits | +3.523 |
probably | +3.378 |
Neg logit contributions | |
slang | -3.590 |
stereotype | -3.507 |
curfew | -3.360 |
ingrained | -3.335 |
puberty | -3.270 |
Token | on |
Token ID | 319 |
Feature activation | +2.11e-01 |
Pos logit contributions | |
slang | +3.690 |
stereotype | +3.565 |
curfew | +3.486 |
ingrained | +3.424 |
puberty | +3.393 |
Neg logit contributions | |
elect | -4.055 |
events | -3.863 |
oops | -3.811 |
awaits | -3.712 |
probably | -3.576 |
Token | the |
Token ID | 262 |
Feature activation | -2.94e-01 |
Pos logit contributions | |
slang | +1.793 |
stereotype | +1.736 |
curfew | +1.685 |
ingrained | +1.657 |
puberty | +1.639 |
Neg logit contributions | |
elect | -2.186 |
events | -2.074 |
oops | -2.048 |
awaits | -1.997 |
probably | -1.939 |
Token | set |
Token ID | 900 |
Feature activation | -8.21e-01 |
Pos logit contributions | |
elect | +2.915 |
events | +2.713 |
oops | +2.688 |
awaits | +2.626 |
probably | +2.542 |
Neg logit contributions | |
slang | -2.556 |
stereotype | -2.486 |
ingrained | -2.405 |
curfew | -2.390 |
puberty | -2.348 |
Token | filming |
Token ID | 17691 |
Feature activation | -9.08e-01 |
Pos logit contributions | |
elect | +6.688 |
oops | +6.086 |
events | +6.074 |
awaits | +5.993 |
probably | +5.666 |
Neg logit contributions | |
slang | -8.233 |
stereotype | -8.027 |
ingrained | -7.815 |
curfew | -7.790 |
puberty | -7.666 |
Token | , |
Token ID | 11 |
Feature activation | +4.17e-01 |
Pos logit contributions | |
slang | +6.459 |
stereotype | +6.203 |
curfew | +6.085 |
puberty | +5.981 |
ingrained | +5.973 |
Neg logit contributions | |
elect | -5.596 |
events | -5.278 |
oops | -5.252 |
awaits | -5.049 |
probably | -4.874 |
Token | when |
Token ID | 618 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
slang | +3.586 |
stereotype | +3.442 |
curfew | +3.340 |
ingrained | +3.304 |
puberty | +3.280 |
Neg logit contributions | |
elect | -4.244 |
events | -4.019 |
oops | -3.977 |
awaits | -3.871 |
probably | -3.733 |
Token | Night |
Token ID | 5265 |
Feature activation | -4.99e-01 |
Pos logit contributions | |
slang | +2.175 |
stereotype | +2.110 |
curfew | +2.059 |
ingrained | +2.020 |
puberty | +2.010 |
Neg logit contributions | |
elect | -2.273 |
events | -2.150 |
oops | -2.123 |
awaits | -2.062 |
probably | -1.998 |
Token | c |
Token ID | 66 |
Feature activation | +2.91e-02 |
Pos logit contributions | |
elect | +3.097 |
events | +2.812 |
oops | +2.754 |
awaits | +2.650 |
probably | +2.518 |
Neg logit contributions | |
slang | -6.096 |
stereotype | -6.016 |
ingrained | -5.907 |
curfew | -5.883 |
puberty | -5.839 |
Token | rawler |
Token ID | 39464 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
slang | +0.209 |
stereotype | +0.201 |
curfew | +0.195 |
ingrained | +0.190 |
puberty | +0.188 |
Neg logit contributions | |
elect | -0.340 |
events | -0.324 |
oops | -0.322 |
awaits | -0.314 |
probably | -0.306 |
Token | notices |
Token ID | 19748 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
elect | +2.156 |
events | +1.999 |
oops | +1.981 |
awaits | +1.934 |
probably | +1.819 |
Neg logit contributions | |
slang | -3.258 |
stereotype | -3.185 |
curfew | -3.130 |
ingrained | -3.080 |
puberty | -3.062 |
Token | that |
Token ID | 326 |
Feature activation | -2.51e-01 |
Pos logit contributions | |
elect | +2.637 |
events | +2.494 |
oops | +2.443 |
awaits | +2.396 |
probably | +2.324 |
Neg logit contributions | |
slang | -2.403 |
stereotype | -2.339 |
curfew | -2.249 |
ingrained | -2.244 |
mentality | -2.196 |
Token | no |
Token ID | 645 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
elect | +2.311 |
events | +2.177 |
oops | +2.144 |
awaits | +2.102 |
probably | +2.031 |
Neg logit contributions | |
slang | -2.382 |
stereotype | -2.318 |
curfew | -2.238 |
ingrained | -2.232 |
mentality | -2.181 |
Token | one |
Token ID | 530 |
Feature activation | -8.11e-01 |
Pos logit contributions | |
elect | +2.441 |
events | +2.302 |
oops | +2.281 |
awaits | +2.243 |
probably | +2.156 |
Neg logit contributions | |
slang | -2.000 |
stereotype | -1.941 |
ingrained | -1.871 |
curfew | -1.868 |
puberty | -1.833 |
Token | in |
Token ID | 287 |
Feature activation | -4.81e-01 |
Pos logit contributions | |
elect | +6.253 |
awaits | +6.008 |
events | +5.901 |
oops | +5.701 |
else | +5.669 |
Neg logit contributions | |
slang | -8.174 |
stereotype | -7.941 |
curfew | -7.657 |
ingrained | -7.652 |
puberty | -7.604 |
Token | the |
Token ID | 262 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
elect | +5.112 |
events | +4.875 |
oops | +4.771 |
awaits | +4.703 |
probably | +4.616 |
Neg logit contributions | |
slang | -3.711 |
stereotype | -3.584 |
ingrained | -3.477 |
curfew | -3.446 |
mentality | -3.311 |
Token | . |
Token ID | 13 |
Feature activation | -1.61e-03 |
Pos logit contributions | |
elect | +7.751 |
events | +7.238 |
awaits | +7.144 |
oops | +6.883 |
indeed | +6.834 |
Neg logit contributions | |
slang | -7.968 |
stereotype | -7.759 |
curfew | -7.599 |
puberty | -7.392 |
ingrained | -7.239 |
Token |
|
Token ID | 198 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
elect | +0.015 |
events | +0.014 |
oops | +0.014 |
awaits | +0.013 |
probably | +0.013 |
Neg logit contributions | |
slang | -0.016 |
stereotype | -0.015 |
curfew | -0.015 |
ingrained | -0.015 |
puberty | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
slang | +7.941 |
stereotype | +7.423 |
ingrained | +7.127 |
mentality | +6.992 |
tradition | +6.974 |
Neg logit contributions | |
elect | -10.544 |
oops | -10.240 |
events | -10.122 |
awaits | -10.074 |
mosqu | -10.023 |
Token | No |
Token ID | 2949 |
Feature activation | -6.05e-01 |
Pos logit contributions | |
elect | +1.049 |
events | +0.990 |
oops | +0.974 |
awaits | +0.942 |
probably | +0.917 |
Neg logit contributions | |
slang | -1.048 |
stereotype | -1.020 |
curfew | -0.993 |
ingrained | -0.977 |
puberty | -0.971 |
Token | major |
Token ID | 1688 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
elect | +5.980 |
events | +5.619 |
oops | +5.459 |
awaits | +5.443 |
indeed | +5.171 |
Neg logit contributions | |
slang | -5.155 |
stereotype | -5.038 |
ingrained | -4.850 |
puberty | -4.793 |
curfew | -4.758 |
Token | out |
Token ID | 503 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
elect | +8.124 |
events | +7.777 |
awaits | +7.457 |
oops | +7.318 |
papers | +7.043 |
Neg logit contributions | |
slang | -6.503 |
stereotype | -6.301 |
ingrained | -6.177 |
curfew | -6.035 |
puberty | -6.032 |
Token | bur |
Token ID | 6236 |
Feature activation | +5.88e-02 |
Pos logit contributions | |
elect | +8.320 |
events | +7.662 |
oops | +7.560 |
awaits | +7.240 |
papers | +7.024 |
Neg logit contributions | |
slang | -6.860 |
stereotype | -6.778 |
ingrained | -6.601 |
curfew | -6.493 |
puberty | -6.452 |
Token | sts |
Token ID | 6448 |
Feature activation | -3.72e-02 |
Pos logit contributions | |
slang | +0.815 |
stereotype | +0.799 |
curfew | +0.785 |
ingrained | +0.777 |
puberty | +0.773 |
Neg logit contributions | |
elect | -0.292 |
events | -0.261 |
oops | -0.254 |
awaits | -0.240 |
probably | -0.223 |
Token | marked |
Token ID | 7498 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
elect | +0.368 |
events | +0.349 |
oops | +0.342 |
awaits | +0.338 |
probably | +0.325 |
Neg logit contributions | |
slang | -0.332 |
stereotype | -0.321 |
curfew | -0.312 |
ingrained | -0.307 |
puberty | -0.305 |
Token | the |
Token ID | 262 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
elect | +1.682 |
events | +1.603 |
oops | +1.573 |
awaits | +1.541 |
probably | +1.493 |
Neg logit contributions | |
slang | -1.186 |
stereotype | -1.147 |
curfew | -1.103 |
ingrained | -1.090 |
puberty | -1.069 |
Token | SB |
Token ID | 18056 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
elect | +10.078 |
events | +9.608 |
oops | +9.082 |
awaits | +9.025 |
absolutely | +8.729 |
Neg logit contributions | |
slang | -8.975 |
stereotype | -8.582 |
ingrained | -8.396 |
curfew | -8.205 |
puberty | -8.086 |
Token | GOP |
Token ID | 6796 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
elect | +2.826 |
events | +2.663 |
oops | +2.629 |
awaits | +2.558 |
probably | +2.469 |
Neg logit contributions | |
slang | -2.564 |
stereotype | -2.452 |
curfew | -2.429 |
puberty | -2.373 |
ingrained | -2.364 |
Token | is |
Token ID | 318 |
Feature activation | -6.40e-01 |
Pos logit contributions | |
elect | +11.389 |
oops | +10.379 |
awaits | +10.337 |
events | +10.266 |
indeed | +10.004 |
Neg logit contributions | |
slang | -9.892 |
curfew | -9.589 |
puberty | -9.293 |
stereotype | -9.172 |
ingrained | -9.087 |
Token | now |
Token ID | 783 |
Feature activation | +1.28e-01 |
Pos logit contributions | |
elect | +6.003 |
events | +5.510 |
indeed | +5.465 |
oops | +5.350 |
awaits | +5.336 |
Neg logit contributions | |
slang | -5.611 |
stereotype | -5.517 |
curfew | -5.412 |
puberty | -5.225 |
ingrained | -5.126 |
Token | in |
Token ID | 287 |
Feature activation | -8.96e-01 |
Pos logit contributions | |
slang | +1.155 |
stereotype | +1.122 |
curfew | +1.093 |
ingrained | +1.069 |
puberty | +1.063 |
Neg logit contributions | |
elect | -1.262 |
events | -1.192 |
oops | -1.171 |
awaits | -1.148 |
probably | -1.111 |
Token | total |
Token ID | 2472 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
elect | +8.695 |
events | +8.001 |
awaits | +7.805 |
indeed | +7.715 |
oops | +7.699 |
Neg logit contributions | |
slang | -7.295 |
stereotype | -7.040 |
curfew | -6.875 |
ingrained | -6.741 |
puberty | -6.520 |
Token | control |
Token ID | 1630 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
elect | +12.316 |
awaits | +11.200 |
events | +11.167 |
indeed | +10.913 |
oops | +10.710 |
Neg logit contributions | |
slang | -10.386 |
stereotype | -9.790 |
curfew | -9.695 |
ingrained | -9.483 |
puberty | -9.245 |
Token | . |
Token ID | 13 |
Feature activation | -4.88e-01 |
Pos logit contributions | |
elect | +12.797 |
indeed | +11.188 |
events | +11.146 |
awaits | +11.007 |
oops | +10.921 |
Neg logit contributions | |
slang | -14.394 |
stereotype | -14.184 |
curfew | -14.019 |
puberty | -13.534 |
ingrained | -13.221 |
Token | Who |
Token ID | 5338 |
Feature activation | -6.60e-01 |
Pos logit contributions | |
elect | +4.106 |
events | +3.815 |
oops | +3.765 |
awaits | +3.626 |
probably | +3.543 |
Neg logit contributions | |
slang | -4.991 |
stereotype | -4.832 |
curfew | -4.830 |
ingrained | -4.723 |
puberty | -4.722 |
Token | will |
Token ID | 481 |
Feature activation | -8.41e-01 |
Pos logit contributions | |
elect | +5.100 |
events | +4.653 |
awaits | +4.634 |
oops | +4.616 |
else | +4.316 |
Neg logit contributions | |
slang | -7.070 |
stereotype | -6.824 |
curfew | -6.777 |
puberty | -6.651 |
ingrained | -6.574 |
Token | the |
Token ID | 262 |
Feature activation | -7.11e-01 |
Pos logit contributions | |
elect | +7.999 |
indeed | +7.250 |
events | +7.154 |
oops | +7.121 |
awaits | +7.099 |
Neg logit contributions | |
slang | -7.183 |
curfew | -6.756 |
puberty | -6.661 |
stereotype | -6.659 |
ingrained | -6.618 |
Token | white |
Token ID | 2330 |
Feature activation | -3.47e-01 |
Pos logit contributions | |
elect | +6.652 |
events | +6.103 |
awaits | +5.983 |
oops | +5.972 |
probably | +5.714 |
Neg logit contributions | |
slang | -6.294 |
curfew | -6.070 |
stereotype | -5.998 |
puberty | -5.963 |
ingrained | -5.808 |
Token | some |
Token ID | 617 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
slang | +2.830 |
stereotype | +2.735 |
curfew | +2.693 |
ingrained | +2.618 |
puberty | +2.599 |
Neg logit contributions | |
elect | -3.217 |
events | -3.069 |
oops | -3.025 |
awaits | -2.942 |
probably | -2.868 |
Token | water |
Token ID | 1660 |
Feature activation | +4.20e-01 |
Pos logit contributions | |
elect | +4.190 |
events | +3.931 |
oops | +3.878 |
awaits | +3.840 |
indeed | +3.684 |
Neg logit contributions | |
slang | -3.656 |
stereotype | -3.575 |
puberty | -3.444 |
curfew | -3.435 |
ingrained | -3.415 |
Token | and |
Token ID | 290 |
Feature activation | -4.39e-01 |
Pos logit contributions | |
slang | +3.950 |
stereotype | +3.814 |
curfew | +3.732 |
ingrained | +3.673 |
puberty | +3.624 |
Neg logit contributions | |
elect | -3.935 |
events | -3.742 |
oops | -3.657 |
awaits | -3.555 |
probably | -3.451 |
Token | then |
Token ID | 788 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
elect | +4.206 |
events | +3.895 |
awaits | +3.893 |
oops | +3.847 |
indeed | +3.724 |
Neg logit contributions | |
slang | -3.865 |
stereotype | -3.800 |
curfew | -3.624 |
ingrained | -3.610 |
puberty | -3.581 |
Token | ate |
Token ID | 15063 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
elect | +2.630 |
events | +2.468 |
awaits | +2.459 |
oops | +2.431 |
indeed | +2.333 |
Neg logit contributions | |
slang | -2.165 |
stereotype | -2.113 |
curfew | -2.027 |
ingrained | -1.985 |
puberty | -1.981 |
Token | some |
Token ID | 617 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
elect | +9.156 |
awaits | +8.506 |
indeed | +8.357 |
oops | +8.346 |
events | +8.341 |
Neg logit contributions | |
slang | -8.970 |
stereotype | -8.824 |
curfew | -8.404 |
mentality | -8.311 |
ingrained | -8.258 |
Token | fruit |
Token ID | 8234 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
elect | +14.388 |
indeed | +13.827 |
awaits | +13.742 |
oops | +13.327 |
events | +12.914 |
Neg logit contributions | |
slang | -12.175 |
stereotype | -12.060 |
puberty | -11.714 |
curfew | -11.644 |
mentality | -11.320 |
Token | salad |
Token ID | 20698 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
elect | +2.444 |
events | +2.275 |
oops | +2.268 |
awaits | +2.238 |
probably | +2.114 |
Neg logit contributions | |
slang | -2.787 |
stereotype | -2.730 |
curfew | -2.667 |
puberty | -2.624 |
ingrained | -2.600 |
Token | . |
Token ID | 13 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
elect | +1.272 |
events | +1.183 |
oops | +1.177 |
awaits | +1.159 |
probably | +1.099 |
Neg logit contributions | |
slang | -1.488 |
stereotype | -1.449 |
curfew | -1.422 |
puberty | -1.391 |
ingrained | -1.383 |
Token |
|
Token ID | 198 |
Feature activation | +5.86e-01 |
Pos logit contributions | |
slang | +2.902 |
stereotype | +2.806 |
curfew | +2.741 |
ingrained | +2.684 |
puberty | +2.659 |
Neg logit contributions | |
elect | -2.649 |
events | -2.505 |
oops | -2.472 |
awaits | -2.391 |
probably | -2.313 |
Token |
|
Token ID | 198 |
Feature activation | +7.77e-01 |
Pos logit contributions | |
slang | +5.238 |
stereotype | +5.019 |
curfew | +4.841 |
ingrained | +4.821 |
puberty | +4.730 |
Neg logit contributions | |
elect | -5.531 |
events | -5.239 |
oops | -5.224 |
awaits | -5.104 |
probably | -4.828 |
Token | it |
Token ID | 340 |
Feature activation | -6.48e-01 |
Pos logit contributions | |
slang | +1.230 |
stereotype | +1.191 |
curfew | +1.157 |
ingrained | +1.136 |
puberty | +1.127 |
Neg logit contributions | |
elect | -1.509 |
events | -1.434 |
oops | -1.414 |
awaits | -1.380 |
probably | -1.340 |
Token | until |
Token ID | 1566 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
elect | +5.202 |
events | +4.798 |
oops | +4.695 |
awaits | +4.659 |
probably | +4.462 |
Neg logit contributions | |
slang | -6.658 |
stereotype | -6.468 |
curfew | -6.416 |
puberty | -6.228 |
ingrained | -6.226 |
Token | I |
Token ID | 314 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
elect | +1.294 |
events | +1.207 |
oops | +1.189 |
awaits | +1.162 |
probably | +1.121 |
Neg logit contributions | |
slang | -1.350 |
stereotype | -1.311 |
curfew | -1.269 |
ingrained | -1.251 |
puberty | -1.234 |
Token | am |
Token ID | 716 |
Feature activation | -5.81e-01 |
Pos logit contributions | |
slang | +2.934 |
stereotype | +2.870 |
curfew | +2.767 |
ingrained | +2.738 |
puberty | +2.702 |
Neg logit contributions | |
elect | -3.345 |
events | -3.198 |
oops | -3.147 |
awaits | -3.050 |
probably | -2.958 |
Token | in |
Token ID | 287 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
elect | +5.696 |
events | +5.227 |
awaits | +5.055 |
oops | +5.051 |
indeed | +5.008 |
Neg logit contributions | |
slang | -5.098 |
stereotype | -4.870 |
curfew | -4.777 |
puberty | -4.605 |
mentality | -4.554 |
Token | the |
Token ID | 262 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
elect | +16.261 |
events | +14.221 |
awaits | +14.009 |
indeed | +13.892 |
probably | +13.669 |
Neg logit contributions | |
slang | -13.247 |
stereotype | -12.712 |
ingrained | -12.281 |
curfew | -12.167 |
colonialism | -11.588 |
Token | White |
Token ID | 2635 |
Feature activation | -5.12e-01 |
Pos logit contributions | |
elect | +16.353 |
events | +14.699 |
awaits | +14.255 |
oops | +14.055 |
rooms | +14.044 |
Neg logit contributions | |
slang | -12.460 |
stereotype | -11.769 |
curfew | -11.428 |
ingrained | -11.357 |
puberty | -11.237 |
Token | House |
Token ID | 2097 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
elect | +3.429 |
events | +3.184 |
oops | +3.062 |
probably | +2.900 |
awaits | +2.889 |
Neg logit contributions | |
slang | -6.039 |
stereotype | -5.896 |
curfew | -5.860 |
ingrained | -5.742 |
puberty | -5.663 |
Token | . |
Token ID | 13 |
Feature activation | -9.47e-01 |
Pos logit contributions | |
elect | +13.569 |
events | +11.931 |
oops | +11.907 |
awaits | +11.895 |
indeed | +11.843 |
Neg logit contributions | |
slang | -14.933 |
stereotype | -14.289 |
curfew | -14.087 |
ingrained | -13.525 |
puberty | -13.480 |
Token | � |
Token ID | 447 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
elect | +6.278 |
events | +5.640 |
oops | +5.634 |
probably | +5.433 |
awaits | +5.304 |
Neg logit contributions | |
slang | -10.803 |
curfew | -10.642 |
stereotype | -10.497 |
ingrained | -10.457 |
puberty | -10.295 |
Token | � |
Token ID | 251 |
Feature activation | -8.87e-02 |
Pos logit contributions | |
slang | +2.151 |
stereotype | +2.096 |
curfew | +2.048 |
ingrained | +2.018 |
puberty | +2.003 |
Neg logit contributions | |
elect | -1.697 |
events | -1.591 |
oops | -1.565 |
awaits | -1.516 |
probably | -1.460 |
Token | tens |
Token ID | 11192 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
elect | +6.823 |
events | +6.291 |
oops | +6.013 |
awaits | +5.986 |
probably | +5.969 |
Neg logit contributions | |
slang | -5.783 |
stereotype | -5.660 |
curfew | -5.533 |
ingrained | -5.440 |
puberty | -5.379 |
Token | of |
Token ID | 286 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
elect | +4.339 |
events | +3.986 |
oops | +3.900 |
awaits | +3.798 |
probably | +3.639 |
Neg logit contributions | |
slang | -6.435 |
stereotype | -6.278 |
curfew | -6.176 |
ingrained | -6.083 |
puberty | -6.044 |
Token | thousands |
Token ID | 4138 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
elect | +8.536 |
events | +7.169 |
probably | +6.717 |
indeed | +6.646 |
awaits | +6.572 |
Neg logit contributions | |
curfew | -16.870 |
slang | -16.846 |
stereotype | -16.628 |
puberty | -16.373 |
ingrained | -16.272 |
Token | of |
Token ID | 286 |
Feature activation | -1.92e+00 |
Pos logit contributions | |
elect | +13.657 |
events | +11.924 |
awaits | +11.923 |
indeed | +11.314 |
absolutely | +11.068 |
Neg logit contributions | |
slang | -15.692 |
stereotype | -15.553 |
curfew | -15.496 |
puberty | -15.261 |
leash | -14.871 |
Token | people |
Token ID | 661 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
elect | +14.769 |
indeed | +12.938 |
awaits | +12.920 |
events | +12.854 |
votes | +12.685 |
Neg logit contributions | |
slang | -14.149 |
curfew | -14.045 |
ESE | -13.989 |
stereotype | -13.908 |
puberty | -13.868 |
Token | in |
Token ID | 287 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
elect | +11.408 |
awaits | +10.336 |
events | +10.244 |
indeed | +9.914 |
probably | +9.550 |
Neg logit contributions | |
slang | -11.506 |
curfew | -11.264 |
stereotype | -11.229 |
puberty | -10.979 |
guiActiveUnfocused | -10.874 |
Token | America |
Token ID | 2253 |
Feature activation | -6.19e-01 |
Pos logit contributions | |
elect | +18.446 |
events | +16.629 |
batches | +16.077 |
probably | +15.920 |
bids | +15.888 |
Neg logit contributions | |
ESE | -14.570 |
curfew | -14.370 |
slang | -14.200 |
guiActiveUnfocused | -13.897 |
ingrained | -13.694 |
Token | at |
Token ID | 379 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
elect | +5.370 |
events | +4.916 |
awaits | +4.857 |
oops | +4.661 |
probably | +4.596 |
Neg logit contributions | |
slang | -5.920 |
stereotype | -5.779 |
curfew | -5.715 |
puberty | -5.608 |
ingrained | -5.542 |
Token | once |
Token ID | 1752 |
Feature activation | -6.95e-01 |
Pos logit contributions | |
elect | +12.283 |
events | +11.135 |
indeed | +10.417 |
probably | +10.373 |
oops | +10.251 |
Neg logit contributions | |
slang | -10.254 |
stereotype | -9.724 |
ingrained | -9.541 |
mentality | -9.534 |
puberty | -9.267 |
Token | and |
Token ID | 290 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
elect | +5.894 |
events | +5.452 |
awaits | +5.379 |
oops | +5.105 |
probably | +5.054 |
Neg logit contributions | |
slang | -6.705 |
stereotype | -6.538 |
curfew | -6.443 |
puberty | -6.297 |
ingrained | -6.236 |
Token | do |
Token ID | 466 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
elect | +9.391 |
events | +8.556 |
indeed | +8.435 |
probably | +8.187 |
awaits | +8.185 |
Neg logit contributions | |
slang | -8.490 |
curfew | -8.174 |
puberty | -8.096 |
ingrained | -8.007 |
stereotype | -7.944 |
Token | the |
Token ID | 262 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
elect | +11.236 |
events | +10.476 |
awaits | +10.261 |
indeed | +10.149 |
probably | +10.103 |
Neg logit contributions | |
stereotype | -9.528 |
slang | -9.299 |
curfew | -8.919 |
ingrained | -8.834 |
mentality | -8.593 |
Token | pipeline |
Token ID | 11523 |
Feature activation | -8.57e-01 |
Pos logit contributions | |
elect | +9.902 |
events | +9.306 |
awaits | +9.203 |
indeed | +8.807 |
oops | +8.795 |
Neg logit contributions | |
stereotype | -9.924 |
slang | -9.892 |
curfew | -9.733 |
ingrained | -9.379 |
puberty | -9.366 |
Token | for |
Token ID | 329 |
Feature activation | -8.91e-01 |
Pos logit contributions | |
elect | +7.211 |
events | +6.697 |
awaits | +6.651 |
oops | +6.563 |
indeed | +6.502 |
Neg logit contributions | |
stereotype | -8.090 |
slang | -8.052 |
curfew | -7.836 |
ingrained | -7.450 |
puberty | -7.415 |
Token | merge |
Token ID | 20121 |
Feature activation | -7.16e-01 |
Pos logit contributions | |
elect | +8.725 |
events | +8.214 |
oops | +7.962 |
awaits | +7.906 |
probably | +7.869 |
Neg logit contributions | |
slang | -6.980 |
stereotype | -6.858 |
curfew | -6.530 |
ingrained | -6.451 |
mentality | -6.294 |
Token | in |
Token ID | 287 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
elect | +7.082 |
events | +6.708 |
oops | +6.572 |
awaits | +6.516 |
indeed | +6.266 |
Neg logit contributions | |
slang | -5.925 |
stereotype | -5.880 |
curfew | -5.529 |
ingrained | -5.404 |
puberty | -5.285 |
Token | core |
Token ID | 4755 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
elect | +9.716 |
events | +9.053 |
oops | +8.808 |
probably | +8.760 |
awaits | +8.586 |
Neg logit contributions | |
stereotype | -8.322 |
slang | -8.309 |
ingrained | -8.008 |
curfew | -7.941 |
puberty | -7.566 |
Token | and |
Token ID | 290 |
Feature activation | -1.77e+00 |
Pos logit contributions | |
elect | +15.721 |
events | +14.652 |
oops | +14.454 |
indeed | +14.428 |
papers | +14.093 |
Neg logit contributions | |
stereotype | -12.170 |
slang | -11.564 |
curfew | -11.497 |
ingrained | -11.406 |
puberty | -11.279 |
Token | making |
Token ID | 1642 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
awaits | +15.701 |
elect | +15.609 |
indeed | +14.894 |
events | +14.649 |
probably | +14.246 |
Neg logit contributions | |
slang | -11.565 |
stereotype | -11.538 |
ingrained | -10.815 |
curfew | -10.785 |
puberty | -10.528 |
Token | good |
Token ID | 922 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
elect | +10.368 |
events | +9.753 |
awaits | +9.472 |
oops | +9.471 |
indeed | +9.302 |
Neg logit contributions | |
slang | -8.628 |
stereotype | -8.522 |
curfew | -8.043 |
ingrained | -7.995 |
puberty | -7.898 |
Token | progress |
Token ID | 4371 |
Feature activation | -9.38e-01 |
Pos logit contributions | |
elect | +9.662 |
awaits | +8.778 |
events | +8.771 |
oops | +8.650 |
indeed | +8.530 |
Neg logit contributions | |
slang | -8.070 |
stereotype | -7.814 |
curfew | -7.378 |
ingrained | -7.343 |
mentality | -7.093 |
Token | ( |
Token ID | 357 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
elect | +8.907 |
awaits | +8.421 |
events | +8.371 |
indeed | +8.161 |
oops | +8.086 |
Neg logit contributions | |
slang | -7.868 |
stereotype | -7.750 |
curfew | -7.439 |
puberty | -7.119 |
ingrained | -7.099 |