Token | because |
Token ID | 780 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
hating | +27.442 |
dictators | +26.726 |
politics | +26.655 |
oppressed | +26.641 |
religion | +26.535 |
Neg logit contributions | |
Setup | -16.843 |
optionally | -13.921 |
formatted | -13.785 |
annot | -13.507 |
manually | -13.466 |
Token | she |
Token ID | 673 |
Feature activation | +2.85e+00 |
Pos logit contributions | |
hating | +24.434 |
dictators | +24.162 |
oppressed | +23.601 |
Jews | +23.451 |
politics | +23.338 |
Neg logit contributions | |
Setup | -18.932 |
manually | -16.238 |
annot | -16.208 |
Completed | -16.114 |
formatted | -16.091 |
Token | is |
Token ID | 318 |
Feature activation | +3.40e+00 |
Pos logit contributions | |
oppressed | +21.801 |
hating | +21.542 |
dictators | +21.401 |
Jews | +20.896 |
bullies | +20.716 |
Neg logit contributions | |
Setup | -16.414 |
optionally | -13.954 |
manually | -13.874 |
annot | -13.512 |
Completed | -13.468 |
Token | Scottish |
Token ID | 11905 |
Feature activation | +4.48e+00 |
Pos logit contributions | |
oppressed | +26.707 |
hating | +26.374 |
Jews | +25.583 |
dictators | +25.535 |
martyr | +25.362 |
Neg logit contributions | |
Setup | -16.774 |
optionally | -14.127 |
manually | -13.940 |
initialize | -13.683 |
Detailed | -13.579 |
Token | and |
Token ID | 290 |
Feature activation | +3.97e+00 |
Pos logit contributions | |
hating | +30.868 |
oppressed | +30.695 |
dictators | +30.635 |
politics | +30.213 |
Jews | +30.199 |
Neg logit contributions | |
Setup | -19.166 |
optionally | -16.571 |
updated | -16.060 |
manually | -15.959 |
formatted | -15.872 |
Token | British |
Token ID | 3517 |
Feature activation | +5.66e+00 |
Pos logit contributions | |
hating | +29.845 |
oppressed | +29.639 |
Jews | +29.214 |
dictators | +29.014 |
religion | +28.548 |
Neg logit contributions | |
Setup | -17.913 |
manually | -14.942 |
Completed | -14.482 |
annot | -14.313 |
optionally | -14.212 |
Token | , |
Token ID | 11 |
Feature activation | +3.91e+00 |
Pos logit contributions | |
dictators | +36.361 |
hating | +36.074 |
politicians | +36.069 |
politics | +35.985 |
Jews | +35.915 |
Neg logit contributions | |
Setup | -20.345 |
optionally | -17.140 |
manually | -16.671 |
formatted | -16.601 |
initialize | -16.454 |
Token | a |
Token ID | 257 |
Feature activation | +2.92e+00 |
Pos logit contributions | |
hating | +30.182 |
dictators | +29.702 |
oppressed | +29.423 |
Jews | +29.084 |
politicians | +28.771 |
Neg logit contributions | |
Setup | -16.930 |
manually | -14.061 |
optionally | -13.966 |
formatted | -13.472 |
Completed | -13.442 |
Token | citizen |
Token ID | 9511 |
Feature activation | +3.17e+00 |
Pos logit contributions | |
hating | +24.830 |
oppressed | +24.770 |
religion | +24.399 |
dictators | +24.374 |
politics | +24.056 |
Neg logit contributions | |
Setup | -14.194 |
optionally | -11.939 |
manually | -11.606 |
annot | -11.313 |
updated | -11.307 |
Token | of |
Token ID | 286 |
Feature activation | +3.63e+00 |
Pos logit contributions | |
oppressed | +23.648 |
hating | +23.630 |
dictators | +22.591 |
Jews | +22.342 |
religion | +22.217 |
Neg logit contributions | |
Setup | -17.485 |
manually | -15.050 |
optionally | -14.771 |
annot | -14.679 |
updated | -14.628 |
Token | our |
Token ID | 674 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
oppressed | +26.001 |
dictators | +25.981 |
hating | +25.914 |
America | +25.161 |
Jews | +25.117 |
Neg logit contributions | |
Setup | -18.582 |
manually | -16.279 |
optionally | -16.101 |
formatted | -15.958 |
annot | -15.464 |
Token | critical |
Token ID | 4688 |
Feature activation | +9.42e-01 |
Pos logit contributions | |
Setup | +8.080 |
manually | +7.778 |
updated | +7.691 |
optionally | +7.647 |
annot | +7.534 |
Neg logit contributions | |
dictators | -5.829 |
hating | -5.774 |
oppressed | -5.563 |
Jews | -5.382 |
Communism | -5.243 |
Token | of |
Token ID | 286 |
Feature activation | +3.63e+00 |
Pos logit contributions | |
dictators | +6.750 |
hating | +6.675 |
Jews | +6.526 |
oppressed | +6.510 |
religion | +6.386 |
Neg logit contributions | |
Setup | -7.466 |
optionally | -7.005 |
manually | -6.983 |
updated | -6.678 |
formatted | -6.607 |
Token | U |
Token ID | 471 |
Feature activation | +3.78e+00 |
Pos logit contributions | |
dictators | +29.169 |
Jews | +28.094 |
religion | +27.757 |
hating | +27.400 |
oppressed | +27.308 |
Neg logit contributions | |
Setup | -16.516 |
optionally | -14.703 |
manually | -14.556 |
formatted | -13.594 |
Detailed | -13.545 |
Token | . |
Token ID | 13 |
Feature activation | +4.09e+00 |
Pos logit contributions | |
dictators | +22.799 |
Jews | +22.634 |
Muslims | +22.085 |
hating | +22.003 |
religion | +21.966 |
Neg logit contributions | |
Setup | -20.592 |
optionally | -19.753 |
manually | -18.983 |
formatted | -18.968 |
annot | -18.276 |
Token | S |
Token ID | 50 |
Feature activation | +4.92e+00 |
Pos logit contributions | |
Jews | +23.408 |
Communism | +23.195 |
America | +23.062 |
Muslims | +22.710 |
dictators | +22.530 |
Neg logit contributions | |
optionally | -21.914 |
Setup | -21.514 |
manually | -21.131 |
formatted | -21.084 |
diagram | -20.420 |
Token | . |
Token ID | 13 |
Feature activation | +5.22e+00 |
Pos logit contributions | |
dictators | +34.266 |
hating | +31.942 |
politics | +31.810 |
Jews | +31.748 |
dictatorship | +31.340 |
Neg logit contributions | |
Setup | -20.609 |
optionally | -19.579 |
manually | -18.977 |
updated | -17.911 |
annot | -17.849 |
Token | foreign |
Token ID | 3215 |
Feature activation | +4.33e+00 |
Pos logit contributions | |
dictators | +37.492 |
politics | +35.703 |
Jews | +35.480 |
Communism | +35.196 |
politicians | +35.176 |
Neg logit contributions | |
Setup | -18.635 |
manually | -17.173 |
optionally | -17.143 |
updated | -15.242 |
screenshot | -15.173 |
Token | policy |
Token ID | 2450 |
Feature activation | +2.98e+00 |
Pos logit contributions | |
dictators | +29.738 |
politics | +27.147 |
hating | +26.931 |
dictatorship | +26.924 |
politicians | +26.480 |
Neg logit contributions | |
Setup | -22.763 |
manually | -21.045 |
optionally | -20.177 |
Completed | -19.759 |
Detailed | -19.210 |
Token | . |
Token ID | 13 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
dictators | +23.758 |
hating | +22.541 |
politics | +22.066 |
dictatorship | +21.918 |
oppressed | +21.866 |
Neg logit contributions | |
Setup | -16.139 |
optionally | -14.110 |
manually | -13.635 |
updated | -12.928 |
formatted | -12.924 |
Token | We |
Token ID | 775 |
Feature activation | -5.89e-01 |
Pos logit contributions | |
dictators | +6.715 |
Jews | +6.711 |
hating | +6.699 |
oppressed | +6.453 |
Communism | +6.426 |
Neg logit contributions | |
Setup | -9.693 |
manually | -9.328 |
optionally | -9.317 |
formatted | -9.073 |
updated | -9.038 |
Token | also |
Token ID | 635 |
Feature activation | -9.61e-01 |
Pos logit contributions | |
Setup | +4.782 |
manually | +4.565 |
updated | +4.507 |
optionally | +4.492 |
annot | +4.396 |
Neg logit contributions | |
dictators | -4.360 |
hating | -4.330 |
oppressed | -4.190 |
Jews | -4.074 |
Communism | -3.977 |
Token | � |
Token ID | 447 |
Feature activation | +5.86e-01 |
Pos logit contributions | |
hating | +20.025 |
dictators | +20.000 |
oppressed | +19.929 |
bullies | +19.371 |
Jews | +19.227 |
Neg logit contributions | |
Setup | -12.482 |
optionally | -11.035 |
manually | -10.914 |
formatted | -10.144 |
updated | -10.125 |
Token | � |
Token ID | 247 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
dictators | +3.697 |
hating | +3.652 |
oppressed | +3.578 |
Jews | +3.464 |
Communism | +3.364 |
Neg logit contributions | |
Setup | -5.311 |
manually | -5.077 |
optionally | -5.010 |
updated | -4.980 |
annot | -4.918 |
Token | s |
Token ID | 82 |
Feature activation | +2.93e+00 |
Pos logit contributions | |
dictators | +12.846 |
hating | +12.689 |
oppressed | +12.659 |
Jews | +12.230 |
bullies | +12.009 |
Neg logit contributions | |
Setup | -12.402 |
optionally | -11.501 |
manually | -11.430 |
updated | -10.932 |
annot | -10.868 |
Token | an |
Token ID | 281 |
Feature activation | +3.68e+00 |
Pos logit contributions | |
hating | +24.512 |
dictators | +24.370 |
oppressed | +24.123 |
Jews | +23.398 |
rapists | +22.814 |
Neg logit contributions | |
Setup | -14.842 |
optionally | -13.195 |
manually | -12.473 |
annot | -11.733 |
updated | -11.709 |
Token | embarrassment |
Token ID | 24655 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
oppressed | +30.908 |
dictators | +30.615 |
hating | +29.698 |
Jews | +29.212 |
martyr | +29.141 |
Neg logit contributions | |
Setup | -14.679 |
manually | -13.112 |
optionally | -12.800 |
formatted | -12.484 |
downloadable | -11.493 |
Token | to |
Token ID | 284 |
Feature activation | +5.18e+00 |
Pos logit contributions | |
hating | +20.631 |
dictators | +20.400 |
oppressed | +19.843 |
Jews | +19.789 |
America | +19.292 |
Neg logit contributions | |
Setup | -16.683 |
optionally | -14.938 |
manually | -14.582 |
updated | -14.525 |
formatted | -14.033 |
Token | humankind |
Token ID | 47634 |
Feature activation | +4.14e+00 |
Pos logit contributions | |
dictators | +36.350 |
Jews | +36.235 |
America | +36.044 |
religion | +35.797 |
oppressed | +35.356 |
Neg logit contributions | |
Setup | -19.458 |
optionally | -16.613 |
manually | -16.054 |
formatted | -15.648 |
Completed | -15.481 |
Token | . |
Token ID | 13 |
Feature activation | +3.31e+00 |
Pos logit contributions | |
hating | +29.853 |
dictators | +29.627 |
oppressed | +29.066 |
Jews | +28.408 |
Almighty | +28.327 |
Neg logit contributions | |
Setup | -18.441 |
optionally | -15.672 |
manually | -15.246 |
updated | -15.003 |
Completed | -14.927 |
Token | � |
Token ID | 447 |
Feature activation | +9.85e-01 |
Pos logit contributions | |
Jews | +24.598 |
dictators | +24.420 |
hating | +24.186 |
America | +24.009 |
Christians | +23.871 |
Neg logit contributions | |
Setup | -16.240 |
optionally | -15.835 |
manually | -15.360 |
formatted | -15.048 |
annot | -14.285 |
Token | � |
Token ID | 251 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
dictators | +6.065 |
hating | +6.035 |
oppressed | +5.865 |
Jews | +5.778 |
Communism | +5.524 |
Neg logit contributions | |
Setup | -8.600 |
manually | -8.346 |
optionally | -8.173 |
updated | -8.060 |
formatted | -8.059 |
Token |
|
Token ID | 198 |
Feature activation | +5.94e-01 |
Pos logit contributions | |
dictators | +9.797 |
hating | +9.716 |
Jews | +9.429 |
oppressed | +9.284 |
Communism | +9.111 |
Neg logit contributions | |
Setup | -10.636 |
manually | -10.131 |
optionally | -10.116 |
formatted | -9.804 |
updated | -9.709 |
Token | for |
Token ID | 329 |
Feature activation | +4.56e+00 |
Pos logit contributions | |
hating | +23.518 |
dictators | +23.348 |
oppressed | +22.736 |
Jews | +22.724 |
religion | +22.593 |
Neg logit contributions | |
Setup | -19.561 |
annot | -16.782 |
optionally | -16.721 |
manually | -16.485 |
updated | -15.906 |
Token | Jesus |
Token ID | 5803 |
Feature activation | +4.08e+00 |
Pos logit contributions | |
dictators | +33.827 |
Jews | +33.531 |
oppressed | +33.435 |
religion | +32.837 |
hating | +32.811 |
Neg logit contributions | |
Setup | -19.917 |
optionally | -16.712 |
manually | -16.056 |
annot | -15.739 |
Completed | -15.691 |
Token | , |
Token ID | 11 |
Feature activation | +4.91e+00 |
Pos logit contributions | |
hating | +29.526 |
dictators | +28.707 |
religion | +28.270 |
Jews | +28.113 |
Almighty | +28.036 |
Neg logit contributions | |
Setup | -19.348 |
annot | -16.659 |
manually | -16.643 |
optionally | -16.535 |
initialize | -15.863 |
Token | lazy |
Token ID | 16931 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
hating | +36.814 |
dictators | +35.790 |
Jews | +35.285 |
religion | +35.215 |
hatred | +34.831 |
Neg logit contributions | |
Setup | -18.002 |
manually | -15.000 |
optionally | -14.952 |
annot | -14.142 |
formatted | -14.024 |
Token | minorities |
Token ID | 15557 |
Feature activation | +4.00e+00 |
Pos logit contributions | |
dictators | +32.265 |
politicians | +31.942 |
politics | +31.734 |
hating | +31.713 |
Jews | +31.610 |
Neg logit contributions | |
Setup | -18.217 |
optionally | -16.561 |
manually | -16.242 |
available | -15.291 |
formatted | -15.282 |
Token | , |
Token ID | 11 |
Feature activation | +5.00e+00 |
Pos logit contributions | |
hating | +30.783 |
oppressed | +29.485 |
dictators | +29.243 |
politics | +28.219 |
Jews | +27.985 |
Neg logit contributions | |
Setup | -18.895 |
manually | -16.018 |
optionally | -15.936 |
annot | -15.483 |
updated | -15.271 |
Token | immigrants |
Token ID | 7971 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
hating | +37.001 |
dictators | +36.720 |
Jews | +35.724 |
oppressed | +35.596 |
religion | +35.314 |
Neg logit contributions | |
Setup | -17.999 |
optionally | -15.054 |
manually | -14.944 |
annot | -13.882 |
formatted | -13.832 |
Token | and |
Token ID | 290 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
hating | +31.638 |
oppressed | +30.149 |
dictators | +29.942 |
Jews | +28.668 |
politics | +28.575 |
Neg logit contributions | |
Setup | -19.246 |
optionally | -16.188 |
manually | -16.002 |
updated | -15.730 |
annot | -15.375 |
Token | rich |
Token ID | 5527 |
Feature activation | +4.69e+00 |
Pos logit contributions | |
dictators | +35.578 |
hating | +35.213 |
Jews | +34.807 |
oppressed | +34.515 |
religion | +34.053 |
Neg logit contributions | |
Setup | -18.543 |
manually | -15.063 |
optionally | -14.828 |
formatted | -14.417 |
available | -14.339 |
Token | liberals |
Token ID | 17194 |
Feature activation | +4.63e+00 |
Pos logit contributions | |
dictators | +35.307 |
Jews | +34.518 |
hating | +33.955 |
politicians | +33.628 |
oppressed | +33.437 |
Neg logit contributions | |
Setup | -18.311 |
optionally | -16.832 |
manually | -16.267 |
updated | -15.394 |
formatted | -15.009 |
Token | . |
Token ID | 13 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
hating | +35.101 |
oppressed | +33.547 |
dictators | +33.442 |
Jews | +32.393 |
politicians | +32.070 |
Neg logit contributions | |
Setup | -18.051 |
optionally | -15.524 |
manually | -14.903 |
Completed | -14.631 |
initialize | -14.392 |
Token | on |
Token ID | 319 |
Feature activation | +4.90e+00 |
Pos logit contributions | |
hating | +14.044 |
dictators | +13.929 |
oppressed | +13.417 |
Jews | +13.356 |
religion | +13.130 |
Neg logit contributions | |
Setup | -12.872 |
optionally | -11.439 |
manually | -11.431 |
updated | -11.403 |
annot | -11.156 |
Token | women |
Token ID | 1466 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
Jews | +35.800 |
dictators | +34.898 |
oppressed | +34.361 |
Muslims | +34.068 |
religion | +34.025 |
Neg logit contributions | |
Setup | -19.852 |
optionally | -16.950 |
manually | -16.571 |
formatted | -16.397 |
annot | -16.226 |
Token | , |
Token ID | 11 |
Feature activation | +4.57e+00 |
Pos logit contributions | |
dictators | +27.253 |
hating | +27.055 |
oppressed | +26.275 |
Jews | +26.072 |
politicians | +25.749 |
Neg logit contributions | |
Setup | -18.815 |
manually | -15.772 |
updated | -15.701 |
optionally | -15.652 |
Completed | -15.600 |
Token | blacks |
Token ID | 15102 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
hating | +34.493 |
dictators | +34.134 |
Jews | +33.405 |
oppressed | +32.922 |
religion | +32.772 |
Neg logit contributions | |
Setup | -17.604 |
manually | -15.354 |
optionally | -15.234 |
updated | -14.582 |
formatted | -14.334 |
Token | and |
Token ID | 290 |
Feature activation | +4.71e+00 |
Pos logit contributions | |
hating | +29.609 |
oppressed | +28.556 |
dictators | +28.545 |
Jews | +27.947 |
politics | +27.152 |
Neg logit contributions | |
Setup | -19.767 |
manually | -16.938 |
optionally | -16.689 |
updated | -16.447 |
annot | -16.278 |
Token | Muslims |
Token ID | 7045 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
Jews | +34.898 |
oppressed | +33.632 |
Muslims | +33.221 |
dictators | +33.046 |
hating | +32.866 |
Neg logit contributions | |
Setup | -19.811 |
manually | -17.624 |
optionally | -16.628 |
formatted | -16.272 |
annot | -15.999 |
Token | , |
Token ID | 11 |
Feature activation | +4.44e+00 |
Pos logit contributions | |
hating | +34.377 |
dictators | +33.699 |
oppressed | +33.384 |
Jews | +32.903 |
Muslims | +32.052 |
Neg logit contributions | |
Setup | -20.009 |
manually | -16.193 |
Completed | -16.019 |
optionally | -15.973 |
formatted | -15.819 |
Token | and |
Token ID | 290 |
Feature activation | +4.12e+00 |
Pos logit contributions | |
dictators | +34.256 |
hating | +34.137 |
Jews | +33.537 |
oppressed | +32.772 |
religion | +32.657 |
Neg logit contributions | |
Setup | -16.723 |
optionally | -14.480 |
manually | -14.463 |
updated | -13.605 |
formatted | -13.561 |
Token | the |
Token ID | 262 |
Feature activation | +4.14e+00 |
Pos logit contributions | |
hating | +32.165 |
dictators | +32.158 |
Jews | +31.312 |
oppressed | +30.664 |
religion | +30.585 |
Neg logit contributions | |
Setup | -17.255 |
manually | -14.723 |
optionally | -14.395 |
updated | -14.119 |
annot | -13.943 |
Token | hate |
Token ID | 5465 |
Feature activation | +3.40e+00 |
Pos logit contributions | |
dictators | +32.820 |
hating | +32.376 |
Jews | +32.047 |
oppressed | +31.614 |
hatred | +31.531 |
Neg logit contributions | |
Setup | -16.174 |
optionally | -14.100 |
manually | -13.865 |
annot | -13.265 |
formatted | -13.127 |
Token | he |
Token ID | 339 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
hating | +26.646 |
dictators | +26.198 |
politics | +26.035 |
Jews | +25.904 |
religion | +25.891 |
Neg logit contributions | |
Setup | -16.918 |
optionally | -14.748 |
manually | -14.018 |
Completed | -13.855 |
annot | -13.734 |
Token | he |
Token ID | 339 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
hating | +26.646 |
dictators | +26.198 |
politics | +26.035 |
Jews | +25.904 |
religion | +25.891 |
Neg logit contributions | |
Setup | -16.918 |
optionally | -14.748 |
manually | -14.018 |
Completed | -13.855 |
annot | -13.734 |
Token | has |
Token ID | 468 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
dictators | +22.842 |
hating | +22.733 |
oppressed | +22.707 |
bullies | +22.329 |
Jews | +22.222 |
Neg logit contributions | |
Setup | -14.908 |
manually | -13.285 |
optionally | -13.168 |
Completed | -12.860 |
updated | -12.794 |
Token | brought |
Token ID | 3181 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
oppressed | +24.728 |
hating | +24.543 |
dictators | +24.282 |
Jews | +23.776 |
hatred | +23.328 |
Neg logit contributions | |
Setup | -13.558 |
optionally | -11.718 |
manually | -11.072 |
Completed | -10.854 |
annot | -10.809 |
Token | to |
Token ID | 284 |
Feature activation | +4.08e+00 |
Pos logit contributions | |
dictators | +23.300 |
hating | +22.608 |
oppressed | +22.396 |
Jews | +22.223 |
religion | +21.895 |
Neg logit contributions | |
Setup | -17.762 |
optionally | -15.831 |
updated | -15.097 |
manually | -14.998 |
Completed | -14.909 |
Token | the |
Token ID | 262 |
Feature activation | +3.81e+00 |
Pos logit contributions | |
dictators | +30.576 |
Jews | +30.487 |
oppressed | +30.149 |
America | +29.822 |
hating | +29.764 |
Neg logit contributions | |
Setup | -19.281 |
optionally | -16.997 |
manually | -16.438 |
formatted | -16.166 |
updated | -15.968 |
Token | American |
Token ID | 1605 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
Jews | +28.920 |
oppressed | +28.453 |
dictators | +28.025 |
hating | +27.962 |
religion | +27.672 |
Neg logit contributions | |
Setup | -18.621 |
manually | -16.342 |
Completed | -16.204 |
optionally | -16.105 |
annot | -15.632 |
Token | political |
Token ID | 1964 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
Jews | +35.761 |
politics | +34.518 |
religion | +34.072 |
hating | +33.984 |
society | +33.963 |
Neg logit contributions | |
Setup | -18.864 |
optionally | -17.141 |
manually | -17.110 |
Completed | -16.785 |
annot | -16.547 |
Token | system |
Token ID | 1080 |
Feature activation | +3.11e+00 |
Pos logit contributions | |
oppressed | +24.002 |
Jews | +23.910 |
dictators | +23.904 |
religion | +23.789 |
politics | +23.747 |
Neg logit contributions | |
Setup | -15.762 |
manually | -14.366 |
optionally | -14.110 |
Completed | -13.944 |
annot | -13.672 |
Token | , |
Token ID | 11 |
Feature activation | +3.09e+00 |
Pos logit contributions | |
dictators | +22.836 |
hating | +22.668 |
oppressed | +22.274 |
Jews | +21.829 |
politics | +21.591 |
Neg logit contributions | |
Setup | -17.068 |
optionally | -15.017 |
updated | -14.620 |
manually | -14.562 |
formatted | -14.220 |
Token | as |
Token ID | 355 |
Feature activation | +3.03e+00 |
Pos logit contributions | |
dictators | +23.947 |
hating | +23.833 |
Jews | +23.326 |
oppressed | +23.097 |
religion | +22.931 |
Neg logit contributions | |
Setup | -16.041 |
optionally | -14.137 |
manually | -13.902 |
updated | -13.546 |
Completed | -13.297 |
Token | well |
Token ID | 880 |
Feature activation | +2.54e+00 |
Pos logit contributions | |
dictators | +26.089 |
Jews | +25.384 |
hating | +25.095 |
oppressed | +24.903 |
politicians | +24.627 |
Neg logit contributions | |
Setup | -14.306 |
manually | -12.348 |
optionally | -11.996 |
updated | -11.249 |
Completed | -11.029 |
Token | book |
Token ID | 1492 |
Feature activation | -8.99e-01 |
Pos logit contributions | |
Setup | +7.550 |
manually | +7.288 |
updated | +7.201 |
optionally | +7.150 |
annot | +7.044 |
Neg logit contributions | |
dictators | -5.804 |
hating | -5.754 |
oppressed | -5.554 |
Jews | -5.363 |
Communism | -5.232 |
Token | critical |
Token ID | 4688 |
Feature activation | +9.42e-01 |
Pos logit contributions | |
Setup | +8.080 |
manually | +7.778 |
updated | +7.691 |
optionally | +7.647 |
annot | +7.534 |
Neg logit contributions | |
dictators | -5.829 |
hating | -5.774 |
oppressed | -5.563 |
Jews | -5.382 |
Communism | -5.243 |
Token | of |
Token ID | 286 |
Feature activation | +3.63e+00 |
Pos logit contributions | |
dictators | +6.750 |
hating | +6.675 |
Jews | +6.526 |
oppressed | +6.510 |
religion | +6.386 |
Neg logit contributions | |
Setup | -7.466 |
optionally | -7.005 |
manually | -6.983 |
updated | -6.678 |
formatted | -6.607 |
Token | U |
Token ID | 471 |
Feature activation | +3.78e+00 |
Pos logit contributions | |
dictators | +29.169 |
Jews | +28.094 |
religion | +27.757 |
hating | +27.400 |
oppressed | +27.308 |
Neg logit contributions | |
Setup | -16.516 |
optionally | -14.703 |
manually | -14.556 |
formatted | -13.594 |
Detailed | -13.545 |
Token | . |
Token ID | 13 |
Feature activation | +4.09e+00 |
Pos logit contributions | |
dictators | +22.799 |
Jews | +22.634 |
Muslims | +22.085 |
hating | +22.003 |
religion | +21.966 |
Neg logit contributions | |
Setup | -20.592 |
optionally | -19.753 |
manually | -18.983 |
formatted | -18.968 |
annot | -18.276 |
Token | S |
Token ID | 50 |
Feature activation | +4.92e+00 |
Pos logit contributions | |
Jews | +23.408 |
Communism | +23.195 |
America | +23.062 |
Muslims | +22.710 |
dictators | +22.530 |
Neg logit contributions | |
optionally | -21.914 |
Setup | -21.514 |
manually | -21.131 |
formatted | -21.084 |
diagram | -20.420 |
Token | . |
Token ID | 13 |
Feature activation | +5.22e+00 |
Pos logit contributions | |
dictators | +34.266 |
hating | +31.942 |
politics | +31.810 |
Jews | +31.748 |
dictatorship | +31.340 |
Neg logit contributions | |
Setup | -20.609 |
optionally | -19.579 |
manually | -18.977 |
updated | -17.911 |
annot | -17.849 |
Token | foreign |
Token ID | 3215 |
Feature activation | +4.33e+00 |
Pos logit contributions | |
dictators | +37.492 |
politics | +35.703 |
Jews | +35.480 |
Communism | +35.196 |
politicians | +35.176 |
Neg logit contributions | |
Setup | -18.635 |
manually | -17.173 |
optionally | -17.143 |
updated | -15.242 |
screenshot | -15.173 |
Token | policy |
Token ID | 2450 |
Feature activation | +2.98e+00 |
Pos logit contributions | |
dictators | +29.738 |
politics | +27.147 |
hating | +26.931 |
dictatorship | +26.924 |
politicians | +26.480 |
Neg logit contributions | |
Setup | -22.763 |
manually | -21.045 |
optionally | -20.177 |
Completed | -19.759 |
Detailed | -19.210 |
Token | . |
Token ID | 13 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
dictators | +23.758 |
hating | +22.541 |
politics | +22.066 |
dictatorship | +21.918 |
oppressed | +21.866 |
Neg logit contributions | |
Setup | -16.139 |
optionally | -14.110 |
manually | -13.635 |
updated | -12.928 |
formatted | -12.924 |
Token | We |
Token ID | 775 |
Feature activation | -5.89e-01 |
Pos logit contributions | |
dictators | +6.715 |
Jews | +6.711 |
hating | +6.699 |
oppressed | +6.453 |
Communism | +6.426 |
Neg logit contributions | |
Setup | -9.693 |
manually | -9.328 |
optionally | -9.317 |
formatted | -9.073 |
updated | -9.038 |
Token | lack |
Token ID | 3092 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
hating | +28.417 |
dictators | +28.102 |
Jews | +27.343 |
oppressed | +27.102 |
religion | +27.000 |
Neg logit contributions | |
Setup | -16.454 |
optionally | -13.568 |
manually | -13.493 |
annot | -13.117 |
Completed | -13.109 |
Token | of |
Token ID | 286 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
hating | +13.678 |
dictators | +13.546 |
oppressed | +13.157 |
religion | +13.089 |
Jews | +13.010 |
Neg logit contributions | |
Setup | -16.797 |
manually | -15.650 |
optionally | -15.642 |
annot | -15.153 |
formatted | -15.041 |
Token | love |
Token ID | 1842 |
Feature activation | +3.30e+00 |
Pos logit contributions | |
dictators | +25.452 |
hating | +25.379 |
oppressed | +25.183 |
religion | +25.100 |
Jews | +24.771 |
Neg logit contributions | |
Setup | -16.202 |
optionally | -13.377 |
manually | -13.370 |
annot | -12.940 |
formatted | -12.615 |
Token | for |
Token ID | 329 |
Feature activation | +4.56e+00 |
Pos logit contributions | |
hating | +23.518 |
dictators | +23.348 |
oppressed | +22.736 |
Jews | +22.724 |
religion | +22.593 |
Neg logit contributions | |
Setup | -19.561 |
annot | -16.782 |
optionally | -16.721 |
manually | -16.485 |
updated | -15.906 |
Token | Jesus |
Token ID | 5803 |
Feature activation | +4.08e+00 |
Pos logit contributions | |
dictators | +33.827 |
Jews | +33.531 |
oppressed | +33.435 |
religion | +32.837 |
hating | +32.811 |
Neg logit contributions | |
Setup | -19.917 |
optionally | -16.712 |
manually | -16.056 |
annot | -15.739 |
Completed | -15.691 |
Token | , |
Token ID | 11 |
Feature activation | +4.91e+00 |
Pos logit contributions | |
hating | +29.526 |
dictators | +28.707 |
religion | +28.270 |
Jews | +28.113 |
Almighty | +28.036 |
Neg logit contributions | |
Setup | -19.348 |
annot | -16.659 |
manually | -16.643 |
optionally | -16.535 |
initialize | -15.863 |
Token | lazy |
Token ID | 16931 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
hating | +36.814 |
dictators | +35.790 |
Jews | +35.285 |
religion | +35.215 |
hatred | +34.831 |
Neg logit contributions | |
Setup | -18.002 |
manually | -15.000 |
optionally | -14.952 |
annot | -14.142 |
formatted | -14.024 |
Token | minorities |
Token ID | 15557 |
Feature activation | +4.00e+00 |
Pos logit contributions | |
dictators | +32.265 |
politicians | +31.942 |
politics | +31.734 |
hating | +31.713 |
Jews | +31.610 |
Neg logit contributions | |
Setup | -18.217 |
optionally | -16.561 |
manually | -16.242 |
available | -15.291 |
formatted | -15.282 |
Token | , |
Token ID | 11 |
Feature activation | +5.00e+00 |
Pos logit contributions | |
hating | +30.783 |
oppressed | +29.485 |
dictators | +29.243 |
politics | +28.219 |
Jews | +27.985 |
Neg logit contributions | |
Setup | -18.895 |
manually | -16.018 |
optionally | -15.936 |
annot | -15.483 |
updated | -15.271 |
Token | immigrants |
Token ID | 7971 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
hating | +37.001 |
dictators | +36.720 |
Jews | +35.724 |
oppressed | +35.596 |
religion | +35.314 |
Neg logit contributions | |
Setup | -17.999 |
optionally | -15.054 |
manually | -14.944 |
annot | -13.882 |
formatted | -13.832 |
Token | and |
Token ID | 290 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
hating | +31.638 |
oppressed | +30.149 |
dictators | +29.942 |
Jews | +28.668 |
politics | +28.575 |
Neg logit contributions | |
Setup | -19.246 |
optionally | -16.188 |
manually | -16.002 |
updated | -15.730 |
annot | -15.375 |
Token | stand |
Token ID | 1481 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
dictators | +5.066 |
hating | +5.046 |
oppressed | +4.862 |
Jews | +4.804 |
Communism | +4.661 |
Neg logit contributions | |
Setup | -4.862 |
manually | -4.701 |
optionally | -4.638 |
updated | -4.621 |
formatted | -4.526 |
Token | up |
Token ID | 510 |
Feature activation | +2.59e+00 |
Pos logit contributions | |
hating | +14.331 |
oppressed | +14.076 |
dictators | +13.919 |
Jews | +13.514 |
martyr | +13.320 |
Neg logit contributions | |
Setup | -11.643 |
optionally | -10.208 |
manually | -10.203 |
formatted | -10.022 |
annot | -9.999 |
Token | for |
Token ID | 329 |
Feature activation | +3.78e+00 |
Pos logit contributions | |
hating | +18.706 |
dictators | +18.516 |
oppressed | +18.275 |
Jews | +17.714 |
politics | +17.580 |
Neg logit contributions | |
Setup | -17.032 |
optionally | -14.661 |
annot | -14.570 |
manually | -14.481 |
updated | -14.479 |
Token | our |
Token ID | 674 |
Feature activation | +4.18e+00 |
Pos logit contributions | |
oppressed | +28.456 |
dictators | +28.219 |
hating | +28.142 |
Jews | +27.771 |
America | +27.564 |
Neg logit contributions | |
Setup | -19.033 |
optionally | -16.277 |
manually | -15.800 |
formatted | -15.527 |
Completed | -15.523 |
Token | proud |
Token ID | 6613 |
Feature activation | +3.50e+00 |
Pos logit contributions | |
oppressed | +31.168 |
dictators | +30.777 |
religion | +30.487 |
politics | +30.038 |
Jews | +29.990 |
Neg logit contributions | |
Setup | -19.572 |
manually | -16.452 |
optionally | -16.250 |
annot | -15.632 |
updated | -15.615 |
Token | American |
Token ID | 1605 |
Feature activation | +4.91e+00 |
Pos logit contributions | |
dictators | +26.688 |
religion | +26.464 |
oppressed | +26.205 |
Jews | +25.946 |
politics | +25.770 |
Neg logit contributions | |
Setup | -17.662 |
manually | -15.639 |
optionally | -15.423 |
formatted | -15.007 |
updated | -14.849 |
Token | values |
Token ID | 3815 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
dictators | +33.769 |
religion | +33.586 |
Jews | +33.493 |
patri | +33.133 |
oppressed | +33.117 |
Neg logit contributions | |
Setup | -20.278 |
updated | -17.029 |
manually | -16.895 |
optionally | -16.614 |
annot | -16.565 |
Token | .' |
Token ID | 2637 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
dictators | +16.425 |
hating | +16.225 |
oppressed | +15.866 |
Jews | +15.550 |
politics | +15.526 |
Neg logit contributions | |
Setup | -16.237 |
optionally | -14.122 |
manually | -14.061 |
updated | -13.896 |
Completed | -13.848 |
Token |
|
Token ID | 198 |
Feature activation | +7.16e-01 |
Pos logit contributions | |
dictators | +8.684 |
hating | +8.654 |
Jews | +8.299 |
oppressed | +8.189 |
Communism | +7.993 |
Neg logit contributions | |
Setup | -13.785 |
manually | -13.263 |
optionally | -13.027 |
updated | -12.912 |
annot | -12.847 |
Token |
|
Token ID | 198 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
hating | +4.189 |
dictators | +4.155 |
Jews | +4.078 |
oppressed | +3.981 |
Communism | +3.916 |
Neg logit contributions | |
Setup | -6.561 |
optionally | -6.346 |
manually | -6.330 |
updated | -6.195 |
formatted | -6.174 |
Token | She |
Token ID | 3347 |
Feature activation | -4.50e-01 |
Pos logit contributions | |
Setup | +9.314 |
manually | +8.758 |
updated | +8.709 |
optionally | +8.612 |
annot | +8.516 |
Neg logit contributions | |
dictators | -7.336 |
hating | -7.252 |
oppressed | -7.043 |
Jews | -6.712 |
dictatorship | -6.660 |
Token | two |
Token ID | 734 |
Feature activation | +2.85e+00 |
Pos logit contributions | |
dictators | +16.239 |
oppressed | +15.416 |
hating | +15.163 |
dictatorship | +14.764 |
politicians | +14.607 |
Neg logit contributions | |
Setup | -12.751 |
manually | -11.425 |
optionally | -11.116 |
annot | -11.060 |
Completed | -10.921 |
Token | demonstr |
Token ID | 4110 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
dictators | +23.896 |
oppressed | +22.613 |
hating | +22.107 |
dictatorship | +21.767 |
politicians | +21.316 |
Neg logit contributions | |
Setup | -15.639 |
manually | -13.592 |
optionally | -13.358 |
annot | -13.312 |
Completed | -13.306 |
Token | ably |
Token ID | 1346 |
Feature activation | +2.84e+00 |
Pos logit contributions | |
dictators | +12.173 |
hating | +11.874 |
oppressed | +11.500 |
Jews | +11.127 |
bullies | +10.973 |
Neg logit contributions | |
Setup | -11.005 |
manually | -10.666 |
optionally | -10.484 |
updated | -10.404 |
formatted | -10.177 |
Token | anti |
Token ID | 3098 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
dictators | +23.874 |
oppressed | +23.394 |
hating | +23.080 |
dictatorship | +22.111 |
socialist | +21.729 |
Neg logit contributions | |
Setup | -14.834 |
manually | -13.255 |
optionally | -13.016 |
annot | -12.489 |
Completed | -12.480 |
Token | - |
Token ID | 12 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
dictators | +13.994 |
hating | +13.429 |
oppressed | +13.036 |
Communism | +12.891 |
Jews | +12.700 |
Neg logit contributions | |
Setup | -18.599 |
optionally | -18.103 |
manually | -18.010 |
annot | -17.645 |
updated | -17.252 |
Token | American |
Token ID | 7437 |
Feature activation | +4.91e+00 |
Pos logit contributions | |
dictators | +22.032 |
hating | +20.817 |
America | +20.532 |
oppressed | +20.426 |
Communism | +20.370 |
Neg logit contributions | |
annot | -19.187 |
manually | -18.752 |
optionally | -18.664 |
Setup | -18.271 |
annotation | -17.750 |
Token | governments |
Token ID | 6905 |
Feature activation | +2.94e+00 |
Pos logit contributions | |
dictators | +37.297 |
dictatorship | +33.817 |
oppressed | +33.671 |
politicians | +33.425 |
hating | +33.132 |
Neg logit contributions | |
Setup | -19.734 |
manually | -16.892 |
annot | -16.671 |
Completed | -16.482 |
optionally | -16.470 |
Token | . |
Token ID | 13 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
dictators | +21.665 |
hating | +21.131 |
oppressed | +20.859 |
Jews | +20.165 |
politics | +19.902 |
Neg logit contributions | |
Setup | -16.992 |
optionally | -14.849 |
manually | -14.797 |
Completed | -14.574 |
updated | -14.459 |
Token |
|
Token ID | 198 |
Feature activation | +6.08e-01 |
Pos logit contributions | |
dictators | +9.641 |
hating | +9.380 |
Jews | +9.362 |
Communism | +9.273 |
oppressed | +9.028 |
Neg logit contributions | |
Setup | -12.259 |
optionally | -11.969 |
manually | -11.959 |
formatted | -11.602 |
annot | -11.538 |
Token |
|
Token ID | 198 |
Feature activation | -8.08e-01 |
Pos logit contributions | |
hating | +3.611 |
dictators | +3.605 |
Jews | +3.489 |
oppressed | +3.442 |
Communism | +3.357 |
Neg logit contributions | |
Setup | -5.546 |
optionally | -5.361 |
manually | -5.350 |
updated | -5.257 |
formatted | -5.220 |
Token | However |
Token ID | 4864 |
Feature activation | +5.47e-01 |
Pos logit contributions | |
Setup | +6.158 |
manually | +5.806 |
updated | +5.747 |
optionally | +5.689 |
annot | +5.585 |
Neg logit contributions | |
dictators | -6.371 |
hating | -6.338 |
oppressed | -6.155 |
Jews | -5.964 |
dictatorship | -5.849 |
Token | is |
Token ID | 271 |
Feature activation | +1.98e+00 |
Pos logit contributions | |
hating | +16.393 |
Jews | +15.637 |
dictators | +15.598 |
oppressed | +15.524 |
dictatorship | +15.429 |
Neg logit contributions | |
Setup | -19.070 |
manually | -18.806 |
optionally | -18.265 |
annot | -18.104 |
updated | -17.967 |
Token | iveness |
Token ID | 6517 |
Feature activation | +2.81e+00 |
Pos logit contributions | |
hating | +9.113 |
oppressed | +8.804 |
Jews | +8.765 |
dictators | +8.577 |
tyranny | +8.202 |
Neg logit contributions | |
Setup | -18.225 |
manually | -17.757 |
optionally | -17.591 |
formatted | -17.249 |
updated | -17.180 |
Token | , |
Token ID | 11 |
Feature activation | +3.92e+00 |
Pos logit contributions | |
dictators | +21.765 |
hating | +21.509 |
oppressed | +21.468 |
Jews | +21.117 |
politics | +20.886 |
Neg logit contributions | |
Setup | -15.496 |
manually | -13.741 |
optionally | -13.671 |
updated | -13.393 |
Completed | -13.135 |
Token | the |
Token ID | 262 |
Feature activation | +4.55e+00 |
Pos logit contributions | |
dictators | +30.631 |
hating | +30.568 |
hatred | +29.653 |
tyranny | +29.144 |
politics | +28.939 |
Neg logit contributions | |
Setup | -16.319 |
optionally | -14.959 |
updated | -14.541 |
manually | -14.434 |
annot | -13.934 |
Token | attacks |
Token ID | 3434 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
dictators | +34.417 |
hating | +34.167 |
hatred | +33.735 |
politics | +33.332 |
Jews | +33.138 |
Neg logit contributions | |
Setup | -17.009 |
optionally | -15.456 |
manually | -14.765 |
annot | -14.272 |
Completed | -14.261 |
Token | on |
Token ID | 319 |
Feature activation | +4.90e+00 |
Pos logit contributions | |
hating | +14.044 |
dictators | +13.929 |
oppressed | +13.417 |
Jews | +13.356 |
religion | +13.130 |
Neg logit contributions | |
Setup | -12.872 |
optionally | -11.439 |
manually | -11.431 |
updated | -11.403 |
annot | -11.156 |
Token | women |
Token ID | 1466 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
Jews | +35.800 |
dictators | +34.898 |
oppressed | +34.361 |
Muslims | +34.068 |
religion | +34.025 |
Neg logit contributions | |
Setup | -19.852 |
optionally | -16.950 |
manually | -16.571 |
formatted | -16.397 |
annot | -16.226 |
Token | , |
Token ID | 11 |
Feature activation | +4.57e+00 |
Pos logit contributions | |
dictators | +27.253 |
hating | +27.055 |
oppressed | +26.275 |
Jews | +26.072 |
politicians | +25.749 |
Neg logit contributions | |
Setup | -18.815 |
manually | -15.772 |
updated | -15.701 |
optionally | -15.652 |
Completed | -15.600 |
Token | blacks |
Token ID | 15102 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
hating | +34.493 |
dictators | +34.134 |
Jews | +33.405 |
oppressed | +32.922 |
religion | +32.772 |
Neg logit contributions | |
Setup | -17.604 |
manually | -15.354 |
optionally | -15.234 |
updated | -14.582 |
formatted | -14.334 |
Token | and |
Token ID | 290 |
Feature activation | +4.71e+00 |
Pos logit contributions | |
hating | +29.609 |
oppressed | +28.556 |
dictators | +28.545 |
Jews | +27.947 |
politics | +27.152 |
Neg logit contributions | |
Setup | -19.767 |
manually | -16.938 |
optionally | -16.689 |
updated | -16.447 |
annot | -16.278 |
Token | Muslims |
Token ID | 7045 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
Jews | +34.898 |
oppressed | +33.632 |
Muslims | +33.221 |
dictators | +33.046 |
hating | +32.866 |
Neg logit contributions | |
Setup | -19.811 |
manually | -17.624 |
optionally | -16.628 |
formatted | -16.272 |
annot | -15.999 |
Token | his |
Token ID | 465 |
Feature activation | +3.87e+00 |
Pos logit contributions | |
dictators | +30.294 |
oppressed | +29.577 |
hating | +29.313 |
Jews | +28.982 |
politicians | +28.313 |
Neg logit contributions | |
Setup | -17.901 |
optionally | -15.502 |
manually | -15.305 |
updated | -14.512 |
updated | -14.228 |
Token | natural |
Token ID | 3288 |
Feature activation | +2.59e+00 |
Pos logit contributions | |
oppressed | +30.598 |
dictators | +30.436 |
hating | +30.194 |
Jews | +29.311 |
martyr | +28.911 |
Neg logit contributions | |
Setup | -16.898 |
manually | -14.428 |
optionally | -13.920 |
available | -13.477 |
updated | -13.460 |
Token | enemy |
Token ID | 4472 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
dictators | +21.778 |
hating | +21.616 |
oppressed | +21.361 |
Jews | +20.553 |
politics | +20.536 |
Neg logit contributions | |
Setup | -14.016 |
manually | -12.976 |
optionally | -12.574 |
updated | -12.417 |
formatted | -11.891 |
Token | , |
Token ID | 11 |
Feature activation | +4.28e+00 |
Pos logit contributions | |
dictators | +27.369 |
hating | +27.227 |
Jews | +26.524 |
oppressed | +26.437 |
tyranny | +25.981 |
Neg logit contributions | |
Setup | -17.937 |
optionally | -15.957 |
manually | -15.441 |
Completed | -15.298 |
updated | -15.154 |
Token | the |
Token ID | 262 |
Feature activation | +4.42e+00 |
Pos logit contributions | |
dictators | +32.029 |
hating | +31.980 |
Jews | +31.228 |
oppressed | +31.225 |
tyranny | +30.764 |
Neg logit contributions | |
Setup | -17.600 |
manually | -14.845 |
optionally | -14.747 |
Completed | -14.451 |
updated | -14.039 |
Token | British |
Token ID | 3517 |
Feature activation | +4.84e+00 |
Pos logit contributions | |
dictators | +34.005 |
oppressed | +33.601 |
Jews | +33.146 |
hating | +32.698 |
tyranny | +32.169 |
Neg logit contributions | |
Setup | -17.222 |
manually | -14.837 |
optionally | -14.727 |
Completed | -14.003 |
formatted | -13.806 |
Token | crown |
Token ID | 12389 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
dictators | +35.681 |
hating | +34.509 |
Jews | +34.159 |
tyranny | +34.111 |
oppressed | +33.925 |
Neg logit contributions | |
Setup | -17.229 |
optionally | -16.004 |
manually | -15.279 |
Completed | -14.650 |
available | -14.632 |
Token | , |
Token ID | 11 |
Feature activation | +2.89e+00 |
Pos logit contributions | |
dictators | +24.093 |
hating | +23.535 |
oppressed | +23.138 |
Jews | +22.702 |
dictatorship | +22.633 |
Neg logit contributions | |
Setup | -17.493 |
manually | -15.736 |
optionally | -15.580 |
updated | -15.335 |
formatted | -14.991 |
Token | to |
Token ID | 284 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
hating | +23.399 |
dictators | +23.234 |
oppressed | +22.879 |
Jews | +22.224 |
tyranny | +21.934 |
Neg logit contributions | |
Setup | -15.485 |
manually | -13.197 |
optionally | -13.168 |
Completed | -12.987 |
updated | -12.905 |
Token | defeat |
Token ID | 7433 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
dictators | +20.428 |
hating | +20.267 |
oppressed | +20.205 |
Jews | +19.593 |
martyr | +19.454 |
Neg logit contributions | |
Setup | -12.864 |
updated | -10.964 |
optionally | -10.932 |
updated | -10.796 |
formatted | -10.751 |
Token | a |
Token ID | 257 |
Feature activation | +3.04e+00 |
Pos logit contributions | |
dictators | +24.748 |
tyranny | +23.938 |
hating | +23.732 |
Jews | +23.623 |
oppressed | +23.607 |
Neg logit contributions | |
Setup | -17.824 |
optionally | -15.956 |
manually | -15.562 |
Completed | -15.359 |
updated | -15.306 |
Token | � |
Token ID | 250 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
dictators | +3.883 |
hating | +3.849 |
oppressed | +3.740 |
Jews | +3.643 |
Communism | +3.525 |
Neg logit contributions | |
Setup | -4.930 |
manually | -4.740 |
optionally | -4.672 |
updated | -4.629 |
formatted | -4.558 |
Token | John |
Token ID | 7554 |
Feature activation | +2.64e+00 |
Pos logit contributions | |
hating | +12.362 |
dictators | +12.336 |
Jews | +11.735 |
oppressed | +11.712 |
tyranny | +11.399 |
Neg logit contributions | |
Setup | -11.532 |
manually | -11.168 |
optionally | -10.990 |
updated | -10.789 |
formatted | -10.782 |
Token | McCain |
Token ID | 14264 |
Feature activation | +3.42e+00 |
Pos logit contributions | |
hating | +19.839 |
dictators | +19.576 |
oppressed | +19.079 |
Jews | +19.001 |
America | +18.578 |
Neg logit contributions | |
Setup | -15.415 |
manually | -13.626 |
optionally | -13.571 |
formatted | -13.277 |
updated | -12.943 |
Token | is |
Token ID | 318 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
hating | +27.331 |
dictators | +26.722 |
oppressed | +26.180 |
martyr | +25.713 |
Jews | +25.678 |
Neg logit contributions | |
Setup | -15.516 |
optionally | -13.344 |
manually | -13.187 |
formatted | -12.590 |
initialize | -12.182 |
Token | an |
Token ID | 281 |
Feature activation | +2.94e+00 |
Pos logit contributions | |
hating | +15.034 |
dictators | +14.732 |
oppressed | +14.581 |
martyr | +14.292 |
Jews | +14.194 |
Neg logit contributions | |
Setup | -12.548 |
optionally | -11.249 |
manually | -11.236 |
formatted | -10.903 |
updated | -10.829 |
Token | American |
Token ID | 1605 |
Feature activation | +4.82e+00 |
Pos logit contributions | |
oppressed | +25.117 |
dictators | +24.787 |
America | +24.284 |
hating | +24.250 |
Almighty | +24.061 |
Neg logit contributions | |
Setup | -14.389 |
manually | -12.645 |
formatted | -12.374 |
optionally | -12.084 |
Detailed | -11.291 |
Token | hero |
Token ID | 4293 |
Feature activation | +3.27e+00 |
Pos logit contributions | |
martyr | +33.938 |
patri | +33.337 |
hating | +33.133 |
dictators | +32.683 |
oppressed | +31.894 |
Neg logit contributions | |
Setup | -20.947 |
optionally | -17.609 |
formatted | -16.930 |
updated | -16.809 |
updated | -16.696 |
Token | & |
Token ID | 1222 |
Feature activation | +3.04e+00 |
Pos logit contributions | |
hating | +24.214 |
oppressed | +23.722 |
dictators | +23.710 |
martyr | +23.025 |
Jews | +22.784 |
Neg logit contributions | |
Setup | -17.541 |
optionally | -15.550 |
manually | -15.365 |
formatted | -14.828 |
updated | -14.821 |
Token | one |
Token ID | 530 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
dictators | +24.881 |
hating | +24.557 |
martyr | +24.496 |
oppressed | +24.407 |
patri | +24.046 |
Neg logit contributions | |
Setup | -15.368 |
manually | -13.105 |
optionally | -12.986 |
formatted | -12.783 |
updated | -12.292 |
Token | of |
Token ID | 286 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
hating | +16.143 |
dictators | +16.080 |
oppressed | +15.969 |
martyr | +15.543 |
Jews | +15.446 |
Neg logit contributions | |
Setup | -14.491 |
optionally | -13.198 |
manually | -13.182 |
updated | -12.844 |
formatted | -12.812 |
Token | the |
Token ID | 262 |
Feature activation | +3.41e+00 |
Pos logit contributions | |
dictators | +26.277 |
America | +25.510 |
oppressed | +25.289 |
hating | +25.177 |
Jews | +25.003 |
Neg logit contributions | |
Setup | -18.152 |
optionally | -16.672 |
formatted | -16.314 |
manually | -16.279 |
updated | -15.654 |
Token | standing |
Token ID | 5055 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
dictators | +22.039 |
hating | +21.934 |
oppressed | +21.241 |
politicians | +21.184 |
politics | +21.119 |
Neg logit contributions | |
Setup | -14.333 |
manually | -12.419 |
optionally | -12.385 |
formatted | -12.178 |
annot | -11.929 |
Token | up |
Token ID | 510 |
Feature activation | +3.13e+00 |
Pos logit contributions | |
dictators | +11.873 |
hating | +11.736 |
oppressed | +11.481 |
Jews | +11.424 |
politics | +11.188 |
Neg logit contributions | |
Setup | -9.918 |
manually | -8.759 |
optionally | -8.725 |
formatted | -8.641 |
updated | -8.532 |
Token | for |
Token ID | 329 |
Feature activation | +4.30e+00 |
Pos logit contributions | |
dictators | +22.955 |
hating | +22.115 |
oppressed | +21.984 |
politicians | +21.859 |
politics | +21.668 |
Neg logit contributions | |
Setup | -18.499 |
optionally | -15.833 |
annot | -15.709 |
manually | -15.601 |
updated | -15.224 |
Token | working |
Token ID | 1762 |
Feature activation | +3.82e+00 |
Pos logit contributions | |
oppressed | +32.365 |
dictators | +32.097 |
America | +31.583 |
Jews | +31.470 |
politics | +31.371 |
Neg logit contributions | |
Setup | -18.179 |
optionally | -15.555 |
manually | -14.653 |
Completed | -14.170 |
formatted | -14.162 |
Token | people |
Token ID | 661 |
Feature activation | +4.30e+00 |
Pos logit contributions | |
America | +24.411 |
Jews | +24.372 |
Americans | +24.267 |
oppressed | +24.119 |
hating | +23.773 |
Neg logit contributions | |
Setup | -23.302 |
optionally | -20.700 |
manually | -19.605 |
Detailed | -19.546 |
Completed | -19.483 |
Token | , |
Token ID | 11 |
Feature activation | +4.81e+00 |
Pos logit contributions | |
oppressed | +30.460 |
hating | +30.367 |
dictators | +30.192 |
politics | +29.368 |
politicians | +28.928 |
Neg logit contributions | |
Setup | -20.083 |
Completed | -16.776 |
optionally | -16.540 |
initialize | -15.851 |
manually | -15.602 |
Token | protecting |
Token ID | 10192 |
Feature activation | +4.26e+00 |
Pos logit contributions | |
hating | +34.964 |
oppressed | +34.467 |
dictators | +34.385 |
Jews | +33.843 |
patri | +33.435 |
Neg logit contributions | |
Setup | -18.002 |
optionally | -14.952 |
manually | -14.703 |
formatted | -14.356 |
Completed | -14.097 |
Token | affordable |
Token ID | 10935 |
Feature activation | +2.72e+00 |
Pos logit contributions | |
oppressed | +30.810 |
dictators | +30.651 |
America | +30.393 |
politics | +29.651 |
politicians | +29.569 |
Neg logit contributions | |
Setup | -19.441 |
optionally | -17.061 |
manually | -15.950 |
formatted | -15.813 |
Completed | -15.787 |
Token | health |
Token ID | 1535 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
dictators | +18.778 |
hating | +18.657 |
politics | +18.520 |
oppressed | +18.421 |
America | +18.227 |
Neg logit contributions | |
Setup | -17.691 |
optionally | -16.212 |
manually | -16.037 |
Completed | -15.478 |
formatted | -15.327 |
Token | care |
Token ID | 1337 |
Feature activation | +3.00e+00 |
Pos logit contributions | |
dictators | +9.532 |
hating | +9.335 |
oppressed | +9.189 |
politics | +8.905 |
Jews | +8.807 |
Neg logit contributions | |
Setup | -15.105 |
manually | -14.320 |
optionally | -14.062 |
annot | -13.800 |
formatted | -13.799 |
Token | and |
Token ID | 290 |
Feature activation | +3.62e+00 |
Pos logit contributions | |
dictators | +20.847 |
hating | +20.317 |
oppressed | +20.262 |
politics | +20.187 |
politicians | +19.833 |
Neg logit contributions | |
Setup | -17.933 |
manually | -15.840 |
optionally | -15.834 |
Completed | -15.511 |
formatted | -15.367 |
Token | ands |
Token ID | 1746 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
dictators | +10.142 |
hating | +10.092 |
Jews | +9.758 |
oppressed | +9.654 |
Christians | +9.336 |
Neg logit contributions | |
Setup | -14.052 |
manually | -13.617 |
updated | -13.303 |
optionally | -13.132 |
formatted | -12.931 |
Token | ons |
Token ID | 684 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
hating | +10.408 |
dictators | +10.283 |
oppressed | +10.177 |
Jews | +10.024 |
Christians | +9.492 |
Neg logit contributions | |
Setup | -12.000 |
manually | -11.006 |
optionally | -10.841 |
updated | -10.686 |
formatted | -10.549 |
Token | , |
Token ID | 11 |
Feature activation | +4.54e+00 |
Pos logit contributions | |
hating | +25.923 |
oppressed | +25.573 |
dictators | +24.826 |
Jews | +24.322 |
martyr | +24.043 |
Neg logit contributions | |
Setup | -16.224 |
manually | -13.958 |
optionally | -13.678 |
updated | -13.249 |
formatted | -13.170 |
Token | grandfather |
Token ID | 17695 |
Feature activation | +3.03e+00 |
Pos logit contributions | |
dictators | +34.573 |
oppressed | +33.801 |
hating | +33.353 |
martyr | +33.327 |
Jews | +33.003 |
Neg logit contributions | |
Setup | -16.880 |
manually | -14.065 |
Detailed | -13.657 |
Completed | -13.655 |
formatted | -13.485 |
Token | s |
Token ID | 82 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
dictators | +17.515 |
hating | +16.686 |
Jews | +16.438 |
oppressed | +16.282 |
politicians | +15.856 |
Neg logit contributions | |
Setup | -22.230 |
manually | -20.933 |
optionally | -20.853 |
updated | -20.353 |
formatted | -20.244 |
Token | , |
Token ID | 11 |
Feature activation | +4.76e+00 |
Pos logit contributions | |
hating | +25.990 |
oppressed | +25.414 |
dictators | +25.272 |
Jews | +24.535 |
martyr | +23.958 |
Neg logit contributions | |
Setup | -18.712 |
manually | -16.788 |
optionally | -16.199 |
updated | -16.074 |
formatted | -15.886 |
Token | wives |
Token ID | 17743 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
dictators | +35.272 |
oppressed | +34.380 |
hating | +34.266 |
Jews | +33.990 |
martyr | +33.766 |
Neg logit contributions | |
Setup | -17.943 |
manually | -14.690 |
Detailed | -14.284 |
Completed | -13.984 |
optionally | -13.891 |
Token | ' |
Token ID | 6 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
hating | +25.063 |
oppressed | +24.508 |
dictators | +23.998 |
Jews | +23.428 |
martyr | +22.903 |
Neg logit contributions | |
Setup | -18.428 |
manually | -16.320 |
optionally | -15.737 |
updated | -15.502 |
formatted | -15.351 |
Token | brothers |
Token ID | 9397 |
Feature activation | +3.66e+00 |
Pos logit contributions | |
dictators | +22.301 |
hating | +22.142 |
oppressed | +21.735 |
Jews | +21.305 |
martyr | +20.958 |
Neg logit contributions | |
Setup | -16.558 |
manually | -14.952 |
optionally | -14.226 |
formatted | -14.111 |
updated | -14.023 |
Token | ; |
Token ID | 26 |
Feature activation | +4.32e+00 |
Pos logit contributions | |
hating | +27.258 |
oppressed | +26.463 |
dictators | +26.295 |
Jews | +25.663 |
Almighty | +25.003 |
Neg logit contributions | |
Setup | -18.093 |
manually | -15.891 |
optionally | -15.354 |
formatted | -14.956 |
updated | -14.953 |
Token | mothers |
Token ID | 12289 |
Feature activation | +3.47e+00 |
Pos logit contributions | |
dictators | +32.767 |
hating | +32.069 |
oppressed | +32.044 |
Jews | +31.436 |
martyr | +31.304 |
Neg logit contributions | |
Setup | -17.369 |
manually | -15.002 |
formatted | -14.325 |
optionally | -14.302 |
Completed | -14.066 |
Token | equality |
Token ID | 10537 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
dictators | +23.390 |
hating | +22.616 |
politicians | +22.541 |
oppressed | +22.420 |
politics | +22.288 |
Neg logit contributions | |
Setup | -14.868 |
optionally | -12.586 |
manually | -12.157 |
annot | -12.019 |
initialize | -11.620 |
Token | and |
Token ID | 290 |
Feature activation | +3.28e+00 |
Pos logit contributions | |
dictators | +16.966 |
hating | +16.942 |
oppressed | +16.848 |
politics | +16.460 |
Jews | +16.284 |
Neg logit contributions | |
Setup | -17.104 |
manually | -15.278 |
optionally | -15.248 |
annot | -14.932 |
Completed | -14.904 |
Token | fair |
Token ID | 3148 |
Feature activation | +2.88e+00 |
Pos logit contributions | |
hating | +25.524 |
dignity | +25.245 |
dictators | +25.216 |
oppressed | +25.159 |
politics | +24.770 |
Neg logit contributions | |
Setup | -17.308 |
manually | -14.395 |
optionally | -14.285 |
Completed | -14.084 |
annot | -13.930 |
Token | treatment |
Token ID | 3513 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
politics | +22.068 |
dictators | +21.948 |
hating | +21.421 |
oppressed | +21.374 |
politicians | +21.201 |
Neg logit contributions | |
Setup | -15.902 |
manually | -14.779 |
optionally | -14.576 |
annot | -13.908 |
Completed | -13.873 |
Token | for |
Token ID | 329 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
dictators | +15.592 |
oppressed | +15.347 |
hating | +15.201 |
Jews | +14.845 |
religion | +14.559 |
Neg logit contributions | |
Setup | -14.386 |
manually | -12.763 |
optionally | -12.675 |
annot | -12.445 |
updated | -12.390 |
Token | all |
Token ID | 477 |
Feature activation | +4.74e+00 |
Pos logit contributions | |
oppressed | +29.407 |
Jews | +28.393 |
dictators | +27.961 |
gays | +27.706 |
hating | +27.472 |
Neg logit contributions | |
Setup | -21.498 |
optionally | -17.923 |
manually | -17.863 |
Detailed | -16.991 |
formatted | -16.756 |
Token | , |
Token ID | 11 |
Feature activation | +3.57e+00 |
Pos logit contributions | |
oppressed | +32.965 |
Americans | +32.906 |
Jews | +32.121 |
dictators | +32.063 |
America | +31.395 |
Neg logit contributions | |
Setup | -20.684 |
optionally | -17.549 |
manually | -16.963 |
Completed | -16.071 |
annot | -15.981 |
Token | � |
Token ID | 447 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
dictators | +29.062 |
hating | +28.682 |
oppressed | +28.311 |
Jews | +27.950 |
politics | +27.913 |
Neg logit contributions | |
Setup | -14.986 |
optionally | -12.701 |
manually | -12.392 |
formatted | -11.999 |
annot | -11.863 |
Token | � |
Token ID | 251 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
dictators | +6.421 |
hating | +6.313 |
oppressed | +6.192 |
Jews | +6.042 |
Communism | +5.818 |
Neg logit contributions | |
Setup | -10.071 |
manually | -9.657 |
optionally | -9.508 |
formatted | -9.426 |
updated | -9.399 |
Token | Mr |
Token ID | 1770 |
Feature activation | +8.62e-01 |
Pos logit contributions | |
dictators | +16.190 |
hating | +16.012 |
oppressed | +15.571 |
Jews | +15.531 |
politics | +15.481 |
Neg logit contributions | |
Setup | -13.814 |
optionally | -12.363 |
manually | -12.341 |
annot | -12.074 |
updated | -11.817 |
Token | . |
Token ID | 13 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
dictators | +4.423 |
hating | +4.414 |
Jews | +4.228 |
oppressed | +4.167 |
Communism | +4.060 |
Neg logit contributions | |
Setup | -8.548 |
optionally | -8.281 |
manually | -8.254 |
updated | -8.122 |
formatted | -8.059 |
Token | going |
Token ID | 1016 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
hating | +16.869 |
oppressed | +16.478 |
dictators | +16.389 |
Jews | +15.887 |
bullies | +15.459 |
Neg logit contributions | |
Setup | -12.221 |
manually | -10.932 |
optionally | -10.734 |
updated | -10.426 |
update | -10.346 |
Token | to |
Token ID | 284 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
hating | +13.296 |
dictators | +13.079 |
oppressed | +12.753 |
Jews | +12.415 |
religion | +12.066 |
Neg logit contributions | |
Setup | -13.025 |
optionally | -11.849 |
updated | -11.792 |
manually | -11.777 |
annot | -11.574 |
Token | treat |
Token ID | 2190 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
hating | +17.795 |
dictators | +17.288 |
oppressed | +17.181 |
Jews | +16.841 |
bullies | +16.466 |
Neg logit contributions | |
Setup | -13.237 |
manually | -11.468 |
Completed | -11.445 |
updated | -11.416 |
optionally | -11.283 |
Token | you |
Token ID | 345 |
Feature activation | +2.63e+00 |
Pos logit contributions | |
hating | +12.801 |
Jews | +12.641 |
dictators | +12.631 |
oppressed | +12.420 |
religion | +11.848 |
Neg logit contributions | |
Setup | -16.269 |
manually | -14.892 |
optionally | -14.704 |
updated | -14.489 |
annot | -14.467 |
Token | more |
Token ID | 517 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
hating | +21.085 |
dictators | +20.586 |
oppressed | +20.445 |
Jews | +20.210 |
religion | +19.700 |
Neg logit contributions | |
Setup | -15.373 |
Completed | -13.055 |
manually | -12.827 |
optionally | -12.642 |
updated | -12.496 |
Token | Asian |
Token ID | 7740 |
Feature activation | +4.72e+00 |
Pos logit contributions | |
hating | +25.968 |
oppressed | +25.831 |
dictators | +25.513 |
Jews | +25.417 |
religion | +24.427 |
Neg logit contributions | |
Setup | -15.986 |
Completed | -13.606 |
updated | -12.948 |
manually | -12.941 |
optionally | -12.937 |
Token | . |
Token ID | 13 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
hating | +34.024 |
dictators | +33.790 |
Jews | +32.879 |
society | +32.442 |
oppressed | +32.421 |
Neg logit contributions | |
Setup | -18.550 |
optionally | -15.836 |
Completed | -15.678 |
updated | -15.577 |
manually | -15.310 |
Token | If |
Token ID | 1002 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
Jews | +12.160 |
hating | +11.985 |
Communism | +11.613 |
dictators | +11.555 |
Christians | +11.230 |
Neg logit contributions | |
Setup | -17.025 |
manually | -16.404 |
optionally | -16.342 |
formatted | -16.020 |
updated | -15.967 |
Token | you |
Token ID | 345 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
hating | +8.949 |
dictators | +8.813 |
oppressed | +8.587 |
Jews | +8.516 |
religion | +8.181 |
Neg logit contributions | |
Setup | -12.554 |
manually | -11.656 |
updated | -11.495 |
optionally | -11.458 |
annot | -11.342 |
Token | look |
Token ID | 804 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
hating | +9.511 |
dictators | +9.453 |
oppressed | +9.225 |
Jews | +9.031 |
religion | +8.769 |
Neg logit contributions | |
Setup | -9.213 |
manually | -8.311 |
optionally | -8.240 |
updated | -8.166 |
formatted | -7.961 |
Token | more |
Token ID | 517 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
hating | +8.545 |
dictators | +8.452 |
oppressed | +8.338 |
Jews | +8.237 |
religion | +7.936 |
Neg logit contributions | |
Setup | -7.689 |
manually | -6.961 |
optionally | -6.908 |
updated | -6.834 |
annot | -6.771 |
Token | attacks |
Token ID | 3434 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
dictators | +34.417 |
hating | +34.167 |
hatred | +33.735 |
politics | +33.332 |
Jews | +33.138 |
Neg logit contributions | |
Setup | -17.009 |
optionally | -15.456 |
manually | -14.765 |
annot | -14.272 |
Completed | -14.261 |
Token | on |
Token ID | 319 |
Feature activation | +4.90e+00 |
Pos logit contributions | |
hating | +14.044 |
dictators | +13.929 |
oppressed | +13.417 |
Jews | +13.356 |
religion | +13.130 |
Neg logit contributions | |
Setup | -12.872 |
optionally | -11.439 |
manually | -11.431 |
updated | -11.403 |
annot | -11.156 |
Token | women |
Token ID | 1466 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
Jews | +35.800 |
dictators | +34.898 |
oppressed | +34.361 |
Muslims | +34.068 |
religion | +34.025 |
Neg logit contributions | |
Setup | -19.852 |
optionally | -16.950 |
manually | -16.571 |
formatted | -16.397 |
annot | -16.226 |
Token | , |
Token ID | 11 |
Feature activation | +4.57e+00 |
Pos logit contributions | |
dictators | +27.253 |
hating | +27.055 |
oppressed | +26.275 |
Jews | +26.072 |
politicians | +25.749 |
Neg logit contributions | |
Setup | -18.815 |
manually | -15.772 |
updated | -15.701 |
optionally | -15.652 |
Completed | -15.600 |
Token | blacks |
Token ID | 15102 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
hating | +34.493 |
dictators | +34.134 |
Jews | +33.405 |
oppressed | +32.922 |
religion | +32.772 |
Neg logit contributions | |
Setup | -17.604 |
manually | -15.354 |
optionally | -15.234 |
updated | -14.582 |
formatted | -14.334 |
Token | and |
Token ID | 290 |
Feature activation | +4.71e+00 |
Pos logit contributions | |
hating | +29.609 |
oppressed | +28.556 |
dictators | +28.545 |
Jews | +27.947 |
politics | +27.152 |
Neg logit contributions | |
Setup | -19.767 |
manually | -16.938 |
optionally | -16.689 |
updated | -16.447 |
annot | -16.278 |
Token | Muslims |
Token ID | 7045 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
Jews | +34.898 |
oppressed | +33.632 |
Muslims | +33.221 |
dictators | +33.046 |
hating | +32.866 |
Neg logit contributions | |
Setup | -19.811 |
manually | -17.624 |
optionally | -16.628 |
formatted | -16.272 |
annot | -15.999 |
Token | , |
Token ID | 11 |
Feature activation | +4.44e+00 |
Pos logit contributions | |
hating | +34.377 |
dictators | +33.699 |
oppressed | +33.384 |
Jews | +32.903 |
Muslims | +32.052 |
Neg logit contributions | |
Setup | -20.009 |
manually | -16.193 |
Completed | -16.019 |
optionally | -15.973 |
formatted | -15.819 |
Token | and |
Token ID | 290 |
Feature activation | +4.12e+00 |
Pos logit contributions | |
dictators | +34.256 |
hating | +34.137 |
Jews | +33.537 |
oppressed | +32.772 |
religion | +32.657 |
Neg logit contributions | |
Setup | -16.723 |
optionally | -14.480 |
manually | -14.463 |
updated | -13.605 |
formatted | -13.561 |
Token | the |
Token ID | 262 |
Feature activation | +4.14e+00 |
Pos logit contributions | |
hating | +32.165 |
dictators | +32.158 |
Jews | +31.312 |
oppressed | +30.664 |
religion | +30.585 |
Neg logit contributions | |
Setup | -17.255 |
manually | -14.723 |
optionally | -14.395 |
updated | -14.119 |
annot | -13.943 |
Token | hate |
Token ID | 5465 |
Feature activation | +3.40e+00 |
Pos logit contributions | |
dictators | +32.820 |
hating | +32.376 |
Jews | +32.047 |
oppressed | +31.614 |
hatred | +31.531 |
Neg logit contributions | |
Setup | -16.174 |
optionally | -14.100 |
manually | -13.865 |
annot | -13.265 |
formatted | -13.127 |
Token | , |
Token ID | 11 |
Feature activation | +4.91e+00 |
Pos logit contributions | |
hating | +29.526 |
dictators | +28.707 |
religion | +28.270 |
Jews | +28.113 |
Almighty | +28.036 |
Neg logit contributions | |
Setup | -19.348 |
annot | -16.659 |
manually | -16.643 |
optionally | -16.535 |
initialize | -15.863 |
Token | lazy |
Token ID | 16931 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
hating | +36.814 |
dictators | +35.790 |
Jews | +35.285 |
religion | +35.215 |
hatred | +34.831 |
Neg logit contributions | |
Setup | -18.002 |
manually | -15.000 |
optionally | -14.952 |
annot | -14.142 |
formatted | -14.024 |
Token | minorities |
Token ID | 15557 |
Feature activation | +4.00e+00 |
Pos logit contributions | |
dictators | +32.265 |
politicians | +31.942 |
politics | +31.734 |
hating | +31.713 |
Jews | +31.610 |
Neg logit contributions | |
Setup | -18.217 |
optionally | -16.561 |
manually | -16.242 |
available | -15.291 |
formatted | -15.282 |
Token | , |
Token ID | 11 |
Feature activation | +5.00e+00 |
Pos logit contributions | |
hating | +30.783 |
oppressed | +29.485 |
dictators | +29.243 |
politics | +28.219 |
Jews | +27.985 |
Neg logit contributions | |
Setup | -18.895 |
manually | -16.018 |
optionally | -15.936 |
annot | -15.483 |
updated | -15.271 |
Token | immigrants |
Token ID | 7971 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
hating | +37.001 |
dictators | +36.720 |
Jews | +35.724 |
oppressed | +35.596 |
religion | +35.314 |
Neg logit contributions | |
Setup | -17.999 |
optionally | -15.054 |
manually | -14.944 |
annot | -13.882 |
formatted | -13.832 |
Token | and |
Token ID | 290 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
hating | +31.638 |
oppressed | +30.149 |
dictators | +29.942 |
Jews | +28.668 |
politics | +28.575 |
Neg logit contributions | |
Setup | -19.246 |
optionally | -16.188 |
manually | -16.002 |
updated | -15.730 |
annot | -15.375 |
Token | rich |
Token ID | 5527 |
Feature activation | +4.69e+00 |
Pos logit contributions | |
dictators | +35.578 |
hating | +35.213 |
Jews | +34.807 |
oppressed | +34.515 |
religion | +34.053 |
Neg logit contributions | |
Setup | -18.543 |
manually | -15.063 |
optionally | -14.828 |
formatted | -14.417 |
available | -14.339 |
Token | liberals |
Token ID | 17194 |
Feature activation | +4.63e+00 |
Pos logit contributions | |
dictators | +35.307 |
Jews | +34.518 |
hating | +33.955 |
politicians | +33.628 |
oppressed | +33.437 |
Neg logit contributions | |
Setup | -18.311 |
optionally | -16.832 |
manually | -16.267 |
updated | -15.394 |
formatted | -15.009 |
Token | . |
Token ID | 13 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
hating | +35.101 |
oppressed | +33.547 |
dictators | +33.442 |
Jews | +32.393 |
politicians | +32.070 |
Neg logit contributions | |
Setup | -18.051 |
optionally | -15.524 |
manually | -14.903 |
Completed | -14.631 |
initialize | -14.392 |
Token | This |
Token ID | 770 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
Jews | +19.729 |
hating | +19.537 |
Communism | +19.118 |
dictators | +19.118 |
Christians | +18.747 |
Neg logit contributions | |
Setup | -17.359 |
optionally | -16.749 |
manually | -16.557 |
formatted | -16.104 |
annot | -15.991 |
Token | diverted |
Token ID | 35673 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
hating | +12.097 |
dictators | +11.992 |
oppressed | +11.758 |
Jews | +11.492 |
politics | +11.379 |
Neg logit contributions | |
Setup | -9.926 |
optionally | -8.989 |
manually | -8.971 |
annot | -8.631 |
updated | -8.583 |
Token | lazy |
Token ID | 16931 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
hating | +36.814 |
dictators | +35.790 |
Jews | +35.285 |
religion | +35.215 |
hatred | +34.831 |
Neg logit contributions | |
Setup | -18.002 |
manually | -15.000 |
optionally | -14.952 |
annot | -14.142 |
formatted | -14.024 |
Token | minorities |
Token ID | 15557 |
Feature activation | +4.00e+00 |
Pos logit contributions | |
dictators | +32.265 |
politicians | +31.942 |
politics | +31.734 |
hating | +31.713 |
Jews | +31.610 |
Neg logit contributions | |
Setup | -18.217 |
optionally | -16.561 |
manually | -16.242 |
available | -15.291 |
formatted | -15.282 |
Token | , |
Token ID | 11 |
Feature activation | +5.00e+00 |
Pos logit contributions | |
hating | +30.783 |
oppressed | +29.485 |
dictators | +29.243 |
politics | +28.219 |
Jews | +27.985 |
Neg logit contributions | |
Setup | -18.895 |
manually | -16.018 |
optionally | -15.936 |
annot | -15.483 |
updated | -15.271 |
Token | immigrants |
Token ID | 7971 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
hating | +37.001 |
dictators | +36.720 |
Jews | +35.724 |
oppressed | +35.596 |
religion | +35.314 |
Neg logit contributions | |
Setup | -17.999 |
optionally | -15.054 |
manually | -14.944 |
annot | -13.882 |
formatted | -13.832 |
Token | and |
Token ID | 290 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
hating | +31.638 |
oppressed | +30.149 |
dictators | +29.942 |
Jews | +28.668 |
politics | +28.575 |
Neg logit contributions | |
Setup | -19.246 |
optionally | -16.188 |
manually | -16.002 |
updated | -15.730 |
annot | -15.375 |
Token | rich |
Token ID | 5527 |
Feature activation | +4.69e+00 |
Pos logit contributions | |
dictators | +35.578 |
hating | +35.213 |
Jews | +34.807 |
oppressed | +34.515 |
religion | +34.053 |
Neg logit contributions | |
Setup | -18.543 |
manually | -15.063 |
optionally | -14.828 |
formatted | -14.417 |
available | -14.339 |
Token | liberals |
Token ID | 17194 |
Feature activation | +4.63e+00 |
Pos logit contributions | |
dictators | +35.307 |
Jews | +34.518 |
hating | +33.955 |
politicians | +33.628 |
oppressed | +33.437 |
Neg logit contributions | |
Setup | -18.311 |
optionally | -16.832 |
manually | -16.267 |
updated | -15.394 |
formatted | -15.009 |
Token | . |
Token ID | 13 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
hating | +35.101 |
oppressed | +33.547 |
dictators | +33.442 |
Jews | +32.393 |
politicians | +32.070 |
Neg logit contributions | |
Setup | -18.051 |
optionally | -15.524 |
manually | -14.903 |
Completed | -14.631 |
initialize | -14.392 |
Token | This |
Token ID | 770 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
Jews | +19.729 |
hating | +19.537 |
Communism | +19.118 |
dictators | +19.118 |
Christians | +18.747 |
Neg logit contributions | |
Setup | -17.359 |
optionally | -16.749 |
manually | -16.557 |
formatted | -16.104 |
annot | -15.991 |
Token | diverted |
Token ID | 35673 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
hating | +12.097 |
dictators | +11.992 |
oppressed | +11.758 |
Jews | +11.492 |
politics | +11.379 |
Neg logit contributions | |
Setup | -9.926 |
optionally | -8.989 |
manually | -8.971 |
annot | -8.631 |
updated | -8.583 |
Token | attention |
Token ID | 3241 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
hating | +8.281 |
dictators | +8.175 |
oppressed | +8.001 |
Jews | +7.821 |
politics | +7.613 |
Neg logit contributions | |
Setup | -9.650 |
optionally | -8.959 |
manually | -8.907 |
updated | -8.684 |
annot | -8.638 |
Token | GB |
Token ID | 4579 |
Feature activation | -3.63e+00 |
Pos logit contributions | |
Setup | +18.823 |
manually | +18.075 |
updated | +18.056 |
optionally | +17.721 |
update | +17.413 |
Neg logit contributions | |
dictators | -18.836 |
hating | -18.556 |
oppressed | -18.163 |
Jews | -17.598 |
Communism | -17.538 |
Token | of |
Token ID | 286 |
Feature activation | -3.54e+00 |
Pos logit contributions | |
Setup | +29.293 |
updated | +28.942 |
manually | +28.782 |
update | +28.559 |
optionally | +28.504 |
Neg logit contributions | |
dictators | -17.451 |
hating | -17.295 |
oppressed | -16.468 |
Communism | -15.846 |
dictatorship | -15.431 |
Token | GDDR |
Token ID | 50092 |
Feature activation | -2.85e+00 |
Pos logit contributions | |
updated | +27.749 |
manually | +27.432 |
Setup | +27.318 |
optionally | +26.831 |
update | +26.775 |
Neg logit contributions | |
dictators | -17.851 |
hating | -17.397 |
oppressed | -16.524 |
Jews | -15.819 |
dictatorship | -15.788 |
Token | 5 |
Token ID | 20 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
Setup | +19.262 |
manually | +18.324 |
updated | +18.297 |
optionally | +18.070 |
formatted | +17.610 |
Neg logit contributions | |
dictators | -19.996 |
hating | -19.435 |
oppressed | -19.150 |
Jews | -18.535 |
Communism | -18.410 |
Token | memory |
Token ID | 4088 |
Feature activation | -5.00e+00 |
Pos logit contributions | |
Setup | +20.927 |
manually | +20.276 |
updated | +20.227 |
optionally | +20.022 |
update | +19.556 |
Neg logit contributions | |
dictators | -17.852 |
hating | -17.647 |
oppressed | -17.239 |
Jews | -16.436 |
Communism | -16.183 |
Token | is |
Token ID | 318 |
Feature activation | -5.80e+00 |
Pos logit contributions | |
updated | +36.978 |
optionally | +36.922 |
manually | +36.836 |
update | +36.187 |
Setup | +36.009 |
Neg logit contributions | |
hating | -18.391 |
dictators | -17.966 |
oppressed | -16.754 |
Communism | -16.300 |
tyranny | -15.421 |
Token | set |
Token ID | 900 |
Feature activation | -3.78e+00 |
Pos logit contributions | |
updated | +42.261 |
optionally | +41.644 |
manually | +41.143 |
formatted | +40.698 |
Setup | +40.038 |
Neg logit contributions | |
dictators | -18.469 |
hating | -17.882 |
oppressed | -16.349 |
dictatorship | -15.961 |
Communism | -15.850 |
Token | at |
Token ID | 379 |
Feature activation | -3.34e+00 |
Pos logit contributions | |
manually | +30.076 |
Setup | +29.764 |
updated | +29.519 |
optionally | +29.321 |
update | +28.338 |
Neg logit contributions | |
dictators | -18.066 |
hating | -17.623 |
oppressed | -17.317 |
Jews | -16.626 |
Communism | -16.335 |
Token | 1 |
Token ID | 352 |
Feature activation | -2.21e+00 |
Pos logit contributions | |
updated | +27.020 |
Setup | +26.892 |
manually | +26.838 |
optionally | +26.299 |
update | +26.047 |
Neg logit contributions | |
hating | -16.715 |
dictators | -16.589 |
oppressed | -15.776 |
Jews | -15.017 |
Communism | -14.833 |
Token | , |
Token ID | 11 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
Setup | +17.136 |
manually | +16.602 |
updated | +16.347 |
optionally | +16.155 |
update | +15.947 |
Neg logit contributions | |
dictators | -14.094 |
hating | -13.770 |
oppressed | -13.408 |
Jews | -12.999 |
Communism | -12.938 |
Token | 251 |
Token ID | 28072 |
Feature activation | -2.57e+00 |
Pos logit contributions | |
Setup | +13.987 |
manually | +13.116 |
updated | +12.974 |
optionally | +12.630 |
annot | +12.542 |
Neg logit contributions | |
dictators | -18.122 |
hating | -17.706 |
oppressed | -17.291 |
dictatorship | -16.765 |
Jews | -16.697 |
Token | ensitivity |
Token ID | 40545 |
Feature activation | -2.40e+00 |
Pos logit contributions | |
Setup | +10.501 |
manually | +10.013 |
updated | +9.902 |
optionally | +9.837 |
annot | +9.641 |
Neg logit contributions | |
dictators | -10.338 |
hating | -10.265 |
oppressed | -9.950 |
Jews | -9.657 |
Communism | -9.487 |
Token | analysis |
Token ID | 3781 |
Feature activation | -4.14e+00 |
Pos logit contributions | |
Setup | +19.326 |
manually | +18.885 |
updated | +18.790 |
update | +18.395 |
optionally | +18.376 |
Neg logit contributions | |
dictators | -14.656 |
hating | -14.563 |
oppressed | -14.253 |
dictatorship | -13.412 |
Jews | -13.305 |
Token | Sens |
Token ID | 14173 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
manually | +34.323 |
updated | +33.994 |
Setup | +33.809 |
optionally | +33.222 |
annot | +32.786 |
Neg logit contributions | |
hating | -15.942 |
dictators | -15.626 |
oppressed | -14.607 |
dictatorship | -13.720 |
tyranny | -13.637 |
Token | itivity |
Token ID | 11365 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
Setup | +12.020 |
updated | +11.198 |
manually | +11.141 |
optionally | +10.838 |
annot | +10.593 |
Neg logit contributions | |
dictators | -20.139 |
hating | -20.076 |
oppressed | -19.501 |
martyr | -18.846 |
Communism | -18.799 |
Token | analysis |
Token ID | 3781 |
Feature activation | -4.58e+00 |
Pos logit contributions | |
Setup | +28.555 |
manually | +28.296 |
updated | +28.058 |
optionally | +27.566 |
update | +27.487 |
Neg logit contributions | |
hating | -16.176 |
dictators | -15.936 |
oppressed | -15.323 |
martyr | -14.429 |
Jews | -14.370 |
Token | will |
Token ID | 481 |
Feature activation | -5.80e+00 |
Pos logit contributions | |
manually | +37.425 |
updated | +36.990 |
Setup | +36.517 |
optionally | +36.388 |
annot | +35.829 |
Neg logit contributions | |
hating | -15.772 |
dictators | -15.024 |
oppressed | -14.174 |
dictatorship | -13.249 |
martyr | -13.205 |
Token | be |
Token ID | 307 |
Feature activation | -5.30e+00 |
Pos logit contributions | |
manually | +40.261 |
optionally | +40.241 |
update | +39.438 |
annot | +38.776 |
updated | +38.282 |
Neg logit contributions | |
hating | -22.121 |
dictators | -19.938 |
oppressed | -18.542 |
Almighty | -17.906 |
martyr | -17.816 |
Token | performed |
Token ID | 6157 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
updated | +39.678 |
manually | +39.414 |
optionally | +38.564 |
annot | +37.782 |
detailed | +37.380 |
Neg logit contributions | |
hating | -18.351 |
dictators | -17.662 |
Almighty | -16.127 |
Communism | -15.827 |
martyr | -15.818 |
Token | excluding |
Token ID | 23494 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
manually | +38.802 |
optionally | +37.263 |
updated | +36.858 |
annot | +35.769 |
Setup | +35.533 |
Neg logit contributions | |
dictators | -18.091 |
hating | -17.600 |
oppressed | -16.848 |
Communism | -16.118 |
bullies | -16.101 |
Token | studies |
Token ID | 3640 |
Feature activation | -2.88e+00 |
Pos logit contributions | |
manually | +24.136 |
updated | +23.982 |
Setup | +23.869 |
optionally | +23.491 |
annot | +23.422 |
Neg logit contributions | |
hating | -11.647 |
dictators | -11.603 |
oppressed | -10.902 |
Communism | -10.361 |
dictatorship | -10.260 |
Token | only |
Token ID | 691 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
manually | +24.543 |
updated | +24.242 |
annot | +23.950 |
Setup | +23.926 |
optionally | +23.812 |
Neg logit contributions | |
dictators | -14.381 |
hating | -13.722 |
oppressed | -13.113 |
Communism | -12.895 |
tyranny | -12.808 |
Token |
|
Token ID | 198 |
Feature activation | -4.55e+00 |
Pos logit contributions | |
Setup | +11.531 |
manually | +10.897 |
updated | +10.875 |
update | +10.543 |
annot | +10.402 |
Neg logit contributions | |
dictators | -12.550 |
hating | -12.322 |
oppressed | -12.083 |
tyranny | -11.473 |
dictatorship | -11.424 |
Token | All |
Token ID | 3237 |
Feature activation | -3.01e+00 |
Pos logit contributions | |
Setup | +32.658 |
Completed | +28.306 |
manually | +27.633 |
Initial | +27.608 |
Detailed | +27.374 |
Neg logit contributions | |
dictators | -24.139 |
hating | -23.488 |
oppressed | -23.295 |
bullies | -22.060 |
Jews | -21.832 |
Token | the |
Token ID | 262 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
Setup | +26.921 |
manually | +26.266 |
updated | +26.060 |
optionally | +25.370 |
annot | +25.347 |
Neg logit contributions | |
hating | -14.502 |
dictators | -14.216 |
oppressed | -13.422 |
Jews | -12.918 |
Communism | -12.818 |
Token | ping |
Token ID | 29400 |
Feature activation | -4.07e+00 |
Pos logit contributions | |
Setup | +29.384 |
manually | +28.889 |
updated | +28.870 |
annot | +28.068 |
update | +27.885 |
Neg logit contributions | |
hating | -14.695 |
dictators | -14.453 |
oppressed | -13.497 |
Jews | -13.037 |
Communism | -12.852 |
Token | tests |
Token ID | 5254 |
Feature activation | -5.07e+00 |
Pos logit contributions | |
Setup | +32.770 |
manually | +32.460 |
updated | +31.875 |
update | +31.269 |
optionally | +31.163 |
Neg logit contributions | |
hating | -17.044 |
dictators | -16.456 |
oppressed | -16.317 |
Communism | -15.420 |
Jews | -15.278 |
Token | are |
Token ID | 389 |
Feature activation | -5.78e+00 |
Pos logit contributions | |
manually | +37.754 |
updated | +37.057 |
Setup | +36.491 |
optionally | +36.263 |
update | +36.103 |
Neg logit contributions | |
hating | -18.617 |
dictators | -17.955 |
oppressed | -16.898 |
Communism | -16.262 |
tyranny | -15.838 |
Token | independent |
Token ID | 4795 |
Feature activation | -2.52e+00 |
Pos logit contributions | |
manually | +42.407 |
updated | +41.865 |
Setup | +41.108 |
annot | +40.992 |
optionally | +40.644 |
Neg logit contributions | |
dictators | -17.623 |
hating | -17.575 |
oppressed | -16.128 |
Communism | -15.347 |
Almighty | -15.191 |
Token | to |
Token ID | 284 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
Setup | +21.611 |
manually | +21.131 |
updated | +20.769 |
optionally | +20.525 |
annot | +20.287 |
Neg logit contributions | |
hating | -14.313 |
dictators | -14.284 |
oppressed | -13.758 |
Jews | -13.111 |
Communism | -12.859 |
Token | others |
Token ID | 1854 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
Setup | +17.612 |
manually | +17.123 |
updated | +16.783 |
optionally | +16.673 |
update | +16.345 |
Neg logit contributions | |
dictators | -13.568 |
hating | -13.398 |
oppressed | -13.049 |
Jews | -12.628 |
Communism | -12.303 |
Token | , |
Token ID | 11 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
Setup | +14.089 |
manually | +13.700 |
updated | +13.518 |
optionally | +13.413 |
annot | +13.194 |
Neg logit contributions | |
dictators | -9.399 |
hating | -9.345 |
oppressed | -8.983 |
Jews | -8.625 |
Communism | -8.446 |
Token | so |
Token ID | 523 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
Setup | +13.116 |
manually | +12.764 |
updated | +12.612 |
optionally | +12.562 |
annot | +12.301 |
Neg logit contributions | |
dictators | -8.948 |
hating | -8.857 |
oppressed | -8.543 |
Jews | -8.200 |
Communism | -8.029 |
Token | of |
Token ID | 286 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
Setup | +26.180 |
updated | +25.871 |
manually | +25.560 |
update | +25.510 |
optionally | +25.126 |
Neg logit contributions | |
hating | -16.542 |
dictators | -16.442 |
oppressed | -15.664 |
Communism | -15.090 |
Jews | -14.807 |
Token | GDDR |
Token ID | 50092 |
Feature activation | -2.13e+00 |
Pos logit contributions | |
updated | +27.960 |
manually | +27.560 |
Setup | +27.283 |
update | +27.039 |
optionally | +26.782 |
Neg logit contributions | |
dictators | -18.006 |
hating | -17.726 |
oppressed | -16.706 |
Jews | -15.993 |
dictatorship | -15.942 |
Token | 5 |
Token ID | 20 |
Feature activation | -2.57e+00 |
Pos logit contributions | |
Setup | +10.861 |
manually | +10.205 |
updated | +10.059 |
optionally | +9.859 |
annot | +9.598 |
Neg logit contributions | |
dictators | -20.708 |
hating | -20.482 |
oppressed | -20.141 |
Jews | -19.667 |
Communism | -19.362 |
Token | X |
Token ID | 55 |
Feature activation | -3.40e+00 |
Pos logit contributions | |
Setup | +20.132 |
manually | +19.528 |
updated | +19.337 |
optionally | +19.244 |
formatted | +18.756 |
Neg logit contributions | |
dictators | -16.875 |
hating | -16.747 |
oppressed | -16.357 |
Jews | -15.715 |
dictatorship | -15.295 |
Token | memory |
Token ID | 4088 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
Setup | +27.838 |
manually | +27.497 |
optionally | +27.302 |
updated | +27.222 |
update | +26.598 |
Neg logit contributions | |
hating | -17.167 |
dictators | -17.143 |
oppressed | -16.551 |
Communism | -15.656 |
Jews | -15.574 |
Token | is |
Token ID | 318 |
Feature activation | -5.45e+00 |
Pos logit contributions | |
updated | +34.298 |
manually | +34.265 |
optionally | +34.209 |
Setup | +33.656 |
update | +33.254 |
Neg logit contributions | |
hating | -17.906 |
dictators | -17.485 |
oppressed | -16.778 |
Communism | -15.924 |
Almighty | -15.394 |
Token | connected |
Token ID | 5884 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
updated | +41.300 |
optionally | +40.261 |
manually | +40.059 |
formatted | +39.820 |
Setup | +39.386 |
Neg logit contributions | |
dictators | -17.775 |
hating | -17.580 |
oppressed | -16.015 |
morals | -15.707 |
Communism | -15.692 |
Token | via |
Token ID | 2884 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
manually | +29.784 |
optionally | +28.724 |
updated | +28.279 |
Setup | +28.230 |
formatted | +27.453 |
Neg logit contributions | |
dictators | -20.465 |
hating | -19.791 |
oppressed | -19.656 |
Jews | -18.534 |
Communism | -18.480 |
Token | a |
Token ID | 257 |
Feature activation | -4.26e+00 |
Pos logit contributions | |
updated | +31.806 |
Setup | +31.778 |
manually | +31.723 |
optionally | +31.309 |
update | +30.487 |
Neg logit contributions | |
dictators | -18.995 |
hating | -18.096 |
oppressed | -17.296 |
dictatorship | -16.810 |
Jews | -16.359 |
Token | 256 |
Token ID | 17759 |
Feature activation | -2.78e+00 |
Pos logit contributions | |
manually | +32.783 |
updated | +32.633 |
Setup | +32.475 |
optionally | +32.330 |
formatted | +31.677 |
Neg logit contributions | |
dictators | -19.072 |
hating | -17.894 |
oppressed | -17.702 |
Jews | -16.831 |
bullies | -16.538 |
Token | bit |
Token ID | 1643 |
Feature activation | -2.97e+00 |
Pos logit contributions | |
Setup | +20.858 |
manually | +20.359 |
updated | +20.294 |
optionally | +20.036 |
update | +19.775 |
Neg logit contributions | |
dictators | -17.597 |
hating | -17.113 |
oppressed | -16.766 |
Jews | -16.343 |
Communism | -16.171 |
Token | Calcul |
Token ID | 27131 |
Feature activation | -2.94e+00 |
Pos logit contributions | |
Setup | +32.245 |
manually | +32.113 |
updated | +31.801 |
optionally | +31.728 |
update | +31.478 |
Neg logit contributions | |
hating | -15.766 |
dictators | -15.669 |
oppressed | -14.886 |
Communism | -13.963 |
martyr | -13.801 |
Token | ate |
Token ID | 378 |
Feature activation | -3.67e+00 |
Pos logit contributions | |
Setup | +20.836 |
manually | +19.657 |
updated | +19.418 |
update | +18.986 |
optionally | +18.798 |
Neg logit contributions | |
hating | -20.071 |
dictators | -19.741 |
oppressed | -19.386 |
Jews | -18.409 |
tyranny | -18.310 |
Token | button |
Token ID | 4936 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
Setup | +31.254 |
manually | +30.393 |
updated | +29.552 |
update | +29.253 |
optionally | +29.178 |
Neg logit contributions | |
hating | -16.840 |
dictators | -16.652 |
oppressed | -16.201 |
martyr | -15.089 |
tyranny | -14.736 |
Token | . |
Token ID | 13 |
Feature activation | -2.80e+00 |
Pos logit contributions | |
manually | +28.560 |
Setup | +27.891 |
optionally | +27.596 |
updated | +27.523 |
annot | +26.927 |
Neg logit contributions | |
hating | -18.576 |
dictators | -18.547 |
oppressed | -17.659 |
Jews | -16.981 |
Communism | -16.665 |
Token | All |
Token ID | 1439 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
Setup | +23.774 |
manually | +22.985 |
updated | +22.894 |
optionally | +22.611 |
update | +22.187 |
Neg logit contributions | |
dictators | -15.570 |
hating | -15.327 |
oppressed | -14.817 |
tyranny | -13.793 |
dictatorship | -13.778 |
Token | entries |
Token ID | 12784 |
Feature activation | -5.33e+00 |
Pos logit contributions | |
manually | +31.561 |
Setup | +31.351 |
updated | +31.252 |
optionally | +30.398 |
formatted | +30.241 |
Neg logit contributions | |
hating | -14.553 |
dictators | -14.034 |
oppressed | -13.217 |
Communism | -12.723 |
martyr | -12.684 |
Token | are |
Token ID | 389 |
Feature activation | -5.11e+00 |
Pos logit contributions | |
manually | +39.291 |
updated | +39.258 |
optionally | +38.161 |
update | +37.815 |
formatted | +37.721 |
Neg logit contributions | |
dictators | -19.347 |
hating | -19.305 |
Communism | -17.725 |
oppressed | -17.572 |
martyr | -17.112 |
Token | cleared |
Token ID | 12539 |
Feature activation | -3.46e+00 |
Pos logit contributions | |
manually | +40.886 |
updated | +40.866 |
formatted | +39.850 |
optionally | +39.395 |
annot | +39.086 |
Neg logit contributions | |
hating | -16.808 |
dictators | -16.227 |
oppressed | -14.855 |
Communism | -14.736 |
dictatorship | -13.988 |
Token | by |
Token ID | 416 |
Feature activation | -2.81e+00 |
Pos logit contributions | |
manually | +28.181 |
updated | +26.922 |
optionally | +26.834 |
Setup | +26.516 |
formatted | +26.256 |
Neg logit contributions | |
dictators | -17.277 |
hating | -17.038 |
oppressed | -16.607 |
Communism | -15.612 |
Jews | -15.600 |
Token | pressing |
Token ID | 12273 |
Feature activation | -3.37e+00 |
Pos logit contributions | |
manually | +25.533 |
Setup | +25.191 |
updated | +24.754 |
optionally | +24.638 |
annot | +24.293 |
Neg logit contributions | |
dictators | -13.332 |
hating | -13.139 |
oppressed | -12.762 |
Communism | -12.043 |
martyr | -11.795 |
Token | the |
Token ID | 262 |
Feature activation | -3.59e+00 |
Pos logit contributions | |
Setup | +28.330 |
manually | +28.164 |
optionally | +27.725 |
updated | +27.455 |
update | +27.100 |
Neg logit contributions | |
dictators | -15.972 |
hating | -15.820 |
oppressed | -15.062 |
martyr | -14.066 |
bullies | -14.058 |
Token | and |
Token ID | 290 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
Setup | +19.919 |
updated | +19.683 |
manually | +19.548 |
optionally | +19.246 |
annot | +19.033 |
Neg logit contributions | |
dictators | -12.647 |
hating | -12.214 |
oppressed | -11.921 |
Jews | -11.307 |
dictatorship | -11.232 |
Token | will |
Token ID | 481 |
Feature activation | -3.62e+00 |
Pos logit contributions | |
Setup | +10.692 |
manually | +10.328 |
updated | +10.270 |
optionally | +10.174 |
annot | +9.951 |
Neg logit contributions | |
dictators | -7.798 |
hating | -7.712 |
oppressed | -7.446 |
Jews | -7.176 |
dictatorship | -7.038 |
Token | have |
Token ID | 423 |
Feature activation | -2.95e+00 |
Pos logit contributions | |
update | +26.985 |
manually | +26.871 |
Setup | +26.675 |
updated | +26.569 |
optionally | +26.470 |
Neg logit contributions | |
dictators | -19.586 |
hating | -19.532 |
oppressed | -18.146 |
Communism | -17.520 |
dictatorship | -17.463 |
Token | one |
Token ID | 530 |
Feature activation | -3.19e+00 |
Pos logit contributions | |
updated | +25.460 |
Setup | +25.313 |
manually | +25.069 |
optionally | +24.483 |
update | +24.276 |
Neg logit contributions | |
dictators | -14.354 |
hating | -14.158 |
oppressed | -13.403 |
Communism | -12.760 |
dictatorship | -12.692 |
Token | more |
Token ID | 517 |
Feature activation | -2.84e+00 |
Pos logit contributions | |
Setup | +26.449 |
manually | +26.317 |
updated | +26.285 |
update | +25.629 |
optionally | +25.585 |
Neg logit contributions | |
dictators | -16.440 |
hating | -15.791 |
oppressed | -15.012 |
Communism | -14.431 |
Jews | -14.187 |
Token | session |
Token ID | 6246 |
Feature activation | -5.31e+00 |
Pos logit contributions | |
Setup | +23.902 |
updated | +23.887 |
manually | +23.761 |
update | +23.421 |
optionally | +23.016 |
Neg logit contributions | |
dictators | -14.647 |
hating | -13.984 |
oppressed | -13.187 |
Communism | -12.899 |
Jews | -12.808 |
Token | on |
Token ID | 319 |
Feature activation | -1.77e+00 |
Pos logit contributions | |
updated | +37.508 |
manually | +36.739 |
update | +36.152 |
preview | +35.751 |
detailed | +35.662 |
Neg logit contributions | |
dictators | -19.006 |
hating | -17.535 |
oppressed | -16.570 |
Communism | -16.442 |
tyranny | -16.288 |
Token | Thursday |
Token ID | 3635 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
Setup | +13.360 |
manually | +13.107 |
updated | +13.023 |
optionally | +12.683 |
update | +12.578 |
Neg logit contributions | |
dictators | -12.618 |
hating | -12.387 |
oppressed | -11.967 |
Jews | -11.477 |
Communism | -11.409 |
Token | , |
Token ID | 11 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
Setup | +11.511 |
manually | +11.236 |
updated | +11.155 |
optionally | +10.990 |
annot | +10.839 |
Neg logit contributions | |
dictators | -8.867 |
hating | -8.647 |
oppressed | -8.350 |
Jews | -8.105 |
Communism | -7.975 |
Token | before |
Token ID | 878 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
Setup | +12.777 |
manually | +12.494 |
updated | +12.458 |
optionally | +12.264 |
annot | +12.030 |
Neg logit contributions | |
dictators | -9.798 |
hating | -9.616 |
oppressed | -9.336 |
Jews | -8.919 |
Communism | -8.809 |
Token | getting |
Token ID | 1972 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
Setup | +14.709 |
manually | +14.265 |
updated | +14.157 |
optionally | +14.051 |
annot | +13.685 |
Neg logit contributions | |
dictators | -10.003 |
hating | -9.646 |
oppressed | -9.533 |
Jews | -9.023 |
dictatorship | -8.957 |
Token | analysis |
Token ID | 3781 |
Feature activation | -4.14e+00 |
Pos logit contributions | |
Setup | +19.326 |
manually | +18.885 |
updated | +18.790 |
update | +18.395 |
optionally | +18.376 |
Neg logit contributions | |
dictators | -14.656 |
hating | -14.563 |
oppressed | -14.253 |
dictatorship | -13.412 |
Jews | -13.305 |
Token | Sens |
Token ID | 14173 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
manually | +34.323 |
updated | +33.994 |
Setup | +33.809 |
optionally | +33.222 |
annot | +32.786 |
Neg logit contributions | |
hating | -15.942 |
dictators | -15.626 |
oppressed | -14.607 |
dictatorship | -13.720 |
tyranny | -13.637 |
Token | itivity |
Token ID | 11365 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
Setup | +12.020 |
updated | +11.198 |
manually | +11.141 |
optionally | +10.838 |
annot | +10.593 |
Neg logit contributions | |
dictators | -20.139 |
hating | -20.076 |
oppressed | -19.501 |
martyr | -18.846 |
Communism | -18.799 |
Token | analysis |
Token ID | 3781 |
Feature activation | -4.58e+00 |
Pos logit contributions | |
Setup | +28.555 |
manually | +28.296 |
updated | +28.058 |
optionally | +27.566 |
update | +27.487 |
Neg logit contributions | |
hating | -16.176 |
dictators | -15.936 |
oppressed | -15.323 |
martyr | -14.429 |
Jews | -14.370 |
Token | will |
Token ID | 481 |
Feature activation | -5.80e+00 |
Pos logit contributions | |
manually | +37.425 |
updated | +36.990 |
Setup | +36.517 |
optionally | +36.388 |
annot | +35.829 |
Neg logit contributions | |
hating | -15.772 |
dictators | -15.024 |
oppressed | -14.174 |
dictatorship | -13.249 |
martyr | -13.205 |
Token | be |
Token ID | 307 |
Feature activation | -5.30e+00 |
Pos logit contributions | |
manually | +40.261 |
optionally | +40.241 |
update | +39.438 |
annot | +38.776 |
updated | +38.282 |
Neg logit contributions | |
hating | -22.121 |
dictators | -19.938 |
oppressed | -18.542 |
Almighty | -17.906 |
martyr | -17.816 |
Token | performed |
Token ID | 6157 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
updated | +39.678 |
manually | +39.414 |
optionally | +38.564 |
annot | +37.782 |
detailed | +37.380 |
Neg logit contributions | |
hating | -18.351 |
dictators | -17.662 |
Almighty | -16.127 |
Communism | -15.827 |
martyr | -15.818 |
Token | excluding |
Token ID | 23494 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
manually | +38.802 |
optionally | +37.263 |
updated | +36.858 |
annot | +35.769 |
Setup | +35.533 |
Neg logit contributions | |
dictators | -18.091 |
hating | -17.600 |
oppressed | -16.848 |
Communism | -16.118 |
bullies | -16.101 |
Token | studies |
Token ID | 3640 |
Feature activation | -2.88e+00 |
Pos logit contributions | |
manually | +24.136 |
updated | +23.982 |
Setup | +23.869 |
optionally | +23.491 |
annot | +23.422 |
Neg logit contributions | |
hating | -11.647 |
dictators | -11.603 |
oppressed | -10.902 |
Communism | -10.361 |
dictatorship | -10.260 |
Token | only |
Token ID | 691 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
manually | +24.543 |
updated | +24.242 |
annot | +23.950 |
Setup | +23.926 |
optionally | +23.812 |
Neg logit contributions | |
dictators | -14.381 |
hating | -13.722 |
oppressed | -13.113 |
Communism | -12.895 |
tyranny | -12.808 |
Token | reported |
Token ID | 2098 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
Setup | +12.424 |
manually | +12.261 |
updated | +12.104 |
optionally | +12.030 |
annot | +11.831 |
Neg logit contributions | |
dictators | -8.832 |
hating | -8.745 |
oppressed | -8.382 |
Jews | -8.093 |
dictatorship | -7.994 |
Token | purchased |
Token ID | 8155 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
Setup | +23.790 |
updated | +23.635 |
update | +23.374 |
manually | +23.243 |
optionally | +22.715 |
Neg logit contributions | |
dictators | -13.539 |
hating | -13.350 |
oppressed | -13.000 |
Communism | -12.152 |
Jews | -12.101 |
Token | devices |
Token ID | 4410 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
Setup | +19.893 |
updated | +19.684 |
manually | +19.646 |
update | +19.199 |
optionally | +19.158 |
Neg logit contributions | |
dictators | -12.608 |
hating | -12.554 |
oppressed | -12.129 |
Jews | -11.384 |
Communism | -11.356 |
Token | . |
Token ID | 13 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
Setup | +18.117 |
updated | +17.844 |
manually | +17.829 |
optionally | +17.448 |
update | +17.315 |
Neg logit contributions | |
dictators | -12.458 |
hating | -12.174 |
oppressed | -11.862 |
Jews | -11.304 |
dictatorship | -11.179 |
Token | The |
Token ID | 383 |
Feature activation | -2.66e+00 |
Pos logit contributions | |
Setup | +13.622 |
updated | +13.091 |
manually | +13.028 |
optionally | +12.796 |
update | +12.711 |
Neg logit contributions | |
dictators | -8.913 |
hating | -8.739 |
oppressed | -8.502 |
dictatorship | -7.982 |
tyranny | -7.958 |
Token | screen |
Token ID | 3159 |
Feature activation | -3.65e+00 |
Pos logit contributions | |
updated | +24.497 |
Setup | +24.420 |
manually | +23.954 |
update | +23.851 |
optionally | +23.371 |
Neg logit contributions | |
dictators | -12.564 |
hating | -12.461 |
oppressed | -11.700 |
Communism | -11.039 |
dictatorship | -10.987 |
Token | shot |
Token ID | 2823 |
Feature activation | -5.27e+00 |
Pos logit contributions | |
Setup | +32.820 |
updated | +32.696 |
manually | +32.169 |
update | +32.093 |
optionally | +31.852 |
Neg logit contributions | |
dictators | -13.580 |
hating | -13.517 |
oppressed | -13.038 |
Jews | -12.241 |
Communism | -12.044 |
Token | below |
Token ID | 2174 |
Feature activation | -4.22e+00 |
Pos logit contributions | |
updated | +39.197 |
manually | +38.756 |
update | +38.012 |
optionally | +37.651 |
annot | +37.479 |
Neg logit contributions | |
hating | -16.918 |
dictators | -16.884 |
oppressed | -15.780 |
tyranny | -15.100 |
Communism | -15.009 |
Token | is |
Token ID | 318 |
Feature activation | -4.15e+00 |
Pos logit contributions | |
updated | +33.166 |
manually | +33.013 |
optionally | +32.405 |
Setup | +32.109 |
annot | +32.048 |
Neg logit contributions | |
hating | -17.092 |
dictators | -16.884 |
oppressed | -15.925 |
tyranny | -15.348 |
dictatorship | -15.132 |
Token | of |
Token ID | 286 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
updated | +34.959 |
manually | +34.313 |
Setup | +33.990 |
optionally | +33.634 |
formatted | +33.445 |
Neg logit contributions | |
dictators | -15.829 |
hating | -15.502 |
oppressed | -14.689 |
Jews | -13.785 |
dictatorship | -13.709 |
Token | a |
Token ID | 257 |
Feature activation | -2.78e+00 |
Pos logit contributions | |
Setup | +20.594 |
updated | +20.305 |
manually | +20.149 |
optionally | +19.626 |
update | +19.538 |
Neg logit contributions | |
dictators | -12.894 |
hating | -12.590 |
oppressed | -12.034 |
dictatorship | -11.522 |
Jews | -11.439 |
Token | Best |
Token ID | 6705 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
Setup | +24.842 |
updated | +24.764 |
manually | +24.616 |
update | +23.859 |
formatted | +23.801 |
Neg logit contributions | |
dictators | -13.780 |
hating | -13.492 |
oppressed | -12.723 |
Jews | -12.254 |
Communism | -12.008 |
Token | . |
Token ID | 13 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
Setup | +16.460 |
manually | +15.815 |
updated | +15.782 |
optionally | +15.571 |
update | +15.268 |
Neg logit contributions | |
dictators | -13.415 |
hating | -13.304 |
oppressed | -12.959 |
Jews | -12.518 |
tyranny | -12.167 |
Token | 1 |
Token ID | 16 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
Setup | +14.074 |
manually | +13.242 |
updated | +13.220 |
optionally | +12.958 |
annot | +12.714 |
Neg logit contributions | |
dictators | -15.242 |
hating | -15.073 |
oppressed | -14.701 |
Jews | -14.096 |
dictatorship | -14.007 |
Token |
|
Token ID | 198 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
Setup | +15.457 |
manually | +14.867 |
updated | +14.821 |
optionally | +14.610 |
update | +14.346 |
Neg logit contributions | |
dictators | -12.475 |
hating | -12.357 |
oppressed | -11.998 |
Jews | -11.567 |
tyranny | -11.302 |
Token |
|
Token ID | 198 |
Feature activation | -3.97e+00 |
Pos logit contributions | |
Setup | +10.661 |
updated | +10.121 |
manually | +10.092 |
update | +9.783 |
annot | +9.675 |
Neg logit contributions | |
dictators | -11.236 |
hating | -10.983 |
oppressed | -10.782 |
tyranny | -10.230 |
dictatorship | -10.229 |
Token | This |
Token ID | 1212 |
Feature activation | -4.26e+00 |
Pos logit contributions | |
Setup | +29.844 |
updated | +26.402 |
Completed | +26.188 |
manually | +26.034 |
annot | +25.880 |
Neg logit contributions | |
dictators | -22.115 |
hating | -21.579 |
oppressed | -21.343 |
dictatorship | -19.944 |
bullies | -19.901 |
Token | configuration |
Token ID | 8398 |
Feature activation | -5.24e+00 |
Pos logit contributions | |
updated | +35.996 |
Setup | +35.296 |
manually | +35.280 |
update | +35.221 |
optionally | +34.656 |
Neg logit contributions | |
dictators | -16.239 |
hating | -15.998 |
oppressed | -14.602 |
Jews | -13.880 |
Communism | -13.830 |
Token | boots |
Token ID | 14412 |
Feature activation | -3.22e+00 |
Pos logit contributions | |
updated | +39.920 |
manually | +39.891 |
update | +39.263 |
optionally | +38.905 |
Setup | +38.139 |
Neg logit contributions | |
hating | -17.985 |
dictators | -17.632 |
oppressed | -16.149 |
Communism | -15.423 |
Jews | -15.212 |
Token | H |
Token ID | 367 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
manually | +28.011 |
Setup | +27.476 |
updated | +27.470 |
optionally | +27.331 |
formatted | +26.626 |
Neg logit contributions | |
dictators | -15.230 |
hating | -15.006 |
oppressed | -14.322 |
Jews | -13.543 |
dictatorship | -13.233 |
Token | VM |
Token ID | 15996 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
Setup | +10.750 |
manually | +9.915 |
updated | +9.764 |
optionally | +9.567 |
annot | +9.297 |
Neg logit contributions | |
dictators | -14.861 |
hating | -14.780 |
oppressed | -14.407 |
bullies | -13.813 |
Jews | -13.782 |
Token | and |
Token ID | 290 |
Feature activation | -2.71e+00 |
Pos logit contributions | |
Setup | +16.062 |
manually | +15.802 |
updated | +15.476 |
optionally | +15.421 |
formatted | +15.074 |
Neg logit contributions | |
dictators | -12.865 |
hating | -12.786 |
oppressed | -12.342 |
Jews | -11.904 |
tyranny | -11.651 |
Token | uses |
Token ID | 3544 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
manually | +24.332 |
Setup | +24.245 |
optionally | +24.188 |
updated | +24.062 |
update | +23.369 |
Neg logit contributions | |
hating | -13.315 |
dictators | -13.314 |
oppressed | -12.609 |
Jews | -11.991 |
dictatorship | -11.673 |
Token | ambient |
Token ID | 25237 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
dictators | +0.609 |
hating | +0.607 |
oppressed | +0.596 |
Jews | +0.576 |
dictatorship | +0.574 |
Neg logit contributions | |
Setup | -0.329 |
manually | -0.293 |
updated | -0.289 |
optionally | -0.286 |
formatted | -0.278 |
Token | . |
Token ID | 13 |
Feature activation | -5.21e-01 |
Pos logit contributions | |
hating | +6.932 |
dictators | +6.884 |
oppressed | +6.633 |
Jews | +6.398 |
tyranny | +6.189 |
Neg logit contributions | |
Setup | -11.370 |
manually | -10.837 |
updated | -10.778 |
optionally | -10.697 |
annot | -10.593 |
Token |
|
Token ID | 198 |
Feature activation | -8.71e-01 |
Pos logit contributions | |
Setup | +4.628 |
manually | +4.443 |
updated | +4.383 |
optionally | +4.376 |
annot | +4.287 |
Neg logit contributions | |
dictators | -3.458 |
hating | -3.431 |
oppressed | -3.308 |
Jews | -3.222 |
Communism | -3.139 |
Token |
|
Token ID | 198 |
Feature activation | -3.43e+00 |
Pos logit contributions | |
Setup | +7.025 |
manually | +6.684 |
updated | +6.651 |
optionally | +6.491 |
annot | +6.434 |
Neg logit contributions | |
dictators | -6.502 |
hating | -6.402 |
oppressed | -6.224 |
dictatorship | -5.903 |
tyranny | -5.895 |
Token | The |
Token ID | 464 |
Feature activation | -2.47e+00 |
Pos logit contributions | |
Setup | +25.276 |
manually | +21.798 |
Completed | +21.633 |
Detailed | +21.572 |
updated | +21.517 |
Neg logit contributions | |
dictators | -21.679 |
hating | -21.195 |
oppressed | -20.957 |
dictatorship | -19.778 |
bullies | -19.749 |
Token | code |
Token ID | 2438 |
Feature activation | -5.22e+00 |
Pos logit contributions | |
Setup | +22.632 |
updated | +22.144 |
manually | +22.018 |
optionally | +21.626 |
annot | +21.549 |
Neg logit contributions | |
hating | -12.400 |
dictators | -12.247 |
oppressed | -11.551 |
Jews | -11.172 |
Communism | -10.927 |
Token | accompanying |
Token ID | 19249 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
manually | +39.725 |
updated | +39.568 |
Setup | +39.377 |
update | +38.662 |
annot | +38.572 |
Neg logit contributions | |
hating | -16.168 |
dictators | -16.065 |
oppressed | -15.160 |
Jews | -13.929 |
tyranny | -13.861 |
Token | this |
Token ID | 428 |
Feature activation | -3.46e+00 |
Pos logit contributions | |
Setup | +29.532 |
manually | +28.893 |
updated | +28.876 |
annot | +28.460 |
update | +28.185 |
Neg logit contributions | |
hating | -15.888 |
dictators | -15.401 |
oppressed | -14.559 |
Jews | -13.894 |
dictatorship | -13.646 |
Token | article |
Token ID | 2708 |
Feature activation | -3.47e+00 |
Pos logit contributions | |
Setup | +29.317 |
updated | +28.879 |
manually | +28.796 |
annot | +28.464 |
update | +28.411 |
Neg logit contributions | |
dictators | -16.014 |
hating | -15.903 |
oppressed | -14.869 |
Jews | -14.350 |
Communism | -14.026 |
Token | has |
Token ID | 468 |
Feature activation | -3.97e+00 |
Pos logit contributions | |
manually | +28.722 |
Setup | +28.371 |
updated | +28.362 |
optionally | +28.143 |
annot | +27.759 |
Neg logit contributions | |
hating | -16.764 |
dictators | -16.414 |
oppressed | -15.465 |
tyranny | -14.917 |
Jews | -14.901 |
Token | a |
Token ID | 257 |
Feature activation | -3.63e+00 |
Pos logit contributions | |
updated | +33.334 |
Setup | +32.915 |
manually | +32.813 |
optionally | +32.449 |
annot | +32.402 |
Neg logit contributions | |
hating | -17.013 |
dictators | -16.328 |
oppressed | -15.138 |
Communism | -14.656 |
dictatorship | -14.526 |
Token | light |
Token ID | 1657 |
Feature activation | -4.34e-01 |
Pos logit contributions | |
Setup | +2.856 |
manually | +2.672 |
optionally | +2.639 |
updated | +2.630 |
annot | +2.570 |
Neg logit contributions | |
hating | -3.379 |
dictators | -3.371 |
oppressed | -3.285 |
Jews | -3.220 |
Communism | -3.140 |
Token | . |
Token ID | 13 |
Feature activation | -2.47e+00 |
Pos logit contributions | |
Setup | +4.080 |
manually | +3.876 |
updated | +3.837 |
optionally | +3.836 |
annot | +3.774 |
Neg logit contributions | |
dictators | -2.689 |
hating | -2.664 |
oppressed | -2.569 |
Jews | -2.487 |
dictatorship | -2.415 |
Token |
|
Token ID | 198 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
Setup | +22.339 |
manually | +21.384 |
updated | +21.383 |
optionally | +21.055 |
update | +20.643 |
Neg logit contributions | |
dictators | -13.340 |
hating | -13.098 |
oppressed | -12.619 |
dictatorship | -11.768 |
tyranny | -11.726 |
Token |
|
Token ID | 198 |
Feature activation | -3.96e+00 |
Pos logit contributions | |
Setup | +8.762 |
manually | +8.306 |
updated | +8.284 |
optionally | +8.003 |
update | +7.989 |
Neg logit contributions | |
dictators | -8.455 |
hating | -8.308 |
oppressed | -8.096 |
dictatorship | -7.680 |
tyranny | -7.668 |
Token | The |
Token ID | 464 |
Feature activation | -3.67e+00 |
Pos logit contributions | |
Setup | +31.167 |
manually | +27.488 |
updated | +27.254 |
Completed | +26.914 |
annot | +26.687 |
Neg logit contributions | |
dictators | -20.850 |
hating | -20.377 |
oppressed | -19.952 |
dictatorship | -18.685 |
bullies | -18.581 |
Token | program |
Token ID | 1430 |
Feature activation | -5.17e+00 |
Pos logit contributions | |
Setup | +33.255 |
updated | +32.957 |
manually | +32.499 |
update | +31.855 |
optionally | +31.457 |
Neg logit contributions | |
hating | -13.795 |
dictators | -13.728 |
oppressed | -12.785 |
martyr | -11.870 |
Communism | -11.700 |
Token | is |
Token ID | 318 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
manually | +39.727 |
updated | +39.157 |
optionally | +39.007 |
Setup | +38.870 |
update | +38.185 |
Neg logit contributions | |
hating | -17.150 |
dictators | -16.672 |
oppressed | -15.595 |
dictatorship | -14.581 |
martyr | -14.533 |
Token | operated |
Token ID | 12228 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
updated | +38.458 |
manually | +37.736 |
optionally | +37.246 |
Setup | +37.202 |
formatted | +36.958 |
Neg logit contributions | |
dictators | -15.781 |
hating | -15.725 |
oppressed | -14.454 |
martyr | -13.836 |
Jews | -13.737 |
Token | by |
Token ID | 416 |
Feature activation | -2.40e+00 |
Pos logit contributions | |
manually | +29.950 |
Setup | +29.065 |
optionally | +28.729 |
updated | +28.605 |
annot | +27.690 |
Neg logit contributions | |
hating | -17.498 |
dictators | -17.288 |
oppressed | -16.336 |
Jews | -15.900 |
bullies | -15.700 |
Token | selecting |
Token ID | 17246 |
Feature activation | -3.84e+00 |
Pos logit contributions | |
Setup | +23.706 |
manually | +23.440 |
updated | +23.068 |
optionally | +22.818 |
annot | +22.644 |
Neg logit contributions | |
dictators | -10.320 |
hating | -10.143 |
oppressed | -9.691 |
Jews | -8.871 |
Communism | -8.851 |
Token | the |
Token ID | 262 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
manually | +33.652 |
Setup | +33.266 |
updated | +32.827 |
optionally | +32.566 |
update | +32.046 |
Neg logit contributions | |
hating | -15.220 |
dictators | -15.076 |
oppressed | -14.167 |
bullies | -13.302 |
martyr | -13.020 |
Token | and |
Token ID | 290 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
dictators | +11.508 |
hating | +11.284 |
oppressed | +10.730 |
Jews | +10.588 |
Almighty | +10.349 |
Neg logit contributions | |
Setup | -13.027 |
manually | -12.182 |
optionally | -11.935 |
annot | -11.933 |
updated | -11.833 |
Token | others |
Token ID | 1854 |
Feature activation | +2.95e-01 |
Pos logit contributions | |
dictators | +8.706 |
hating | +8.541 |
oppressed | +8.322 |
Jews | +8.318 |
Almighty | +8.023 |
Neg logit contributions | |
Setup | -9.408 |
manually | -8.598 |
optionally | -8.442 |
formatted | -8.425 |
annot | -8.423 |
Token | . |
Token ID | 13 |
Feature activation | -7.80e-01 |
Pos logit contributions | |
dictators | +1.968 |
hating | +1.951 |
oppressed | +1.886 |
Jews | +1.824 |
martyr | +1.768 |
Neg logit contributions | |
Setup | -2.613 |
optionally | -2.433 |
manually | -2.428 |
updated | -2.384 |
annot | -2.380 |
Token | Pre |
Token ID | 3771 |
Feature activation | -2.46e+00 |
Pos logit contributions | |
Setup | +6.923 |
manually | +6.638 |
updated | +6.569 |
optionally | +6.534 |
annot | +6.414 |
Neg logit contributions | |
dictators | -5.181 |
hating | -5.139 |
oppressed | -4.955 |
Jews | -4.784 |
dictatorship | -4.672 |
Token | - |
Token ID | 12 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
Setup | +19.401 |
updated | +18.715 |
manually | +18.549 |
optionally | +17.932 |
annot | +17.924 |
Neg logit contributions | |
dictators | -15.511 |
hating | -15.071 |
oppressed | -15.023 |
Communism | -14.329 |
dictatorship | -14.131 |
Token | orders |
Token ID | 6361 |
Feature activation | -5.16e+00 |
Pos logit contributions | |
Setup | +19.095 |
updated | +17.726 |
manually | +17.368 |
annot | +16.930 |
optionally | +16.845 |
Neg logit contributions | |
dictators | -19.836 |
hating | -19.519 |
oppressed | -19.362 |
dictatorship | -18.443 |
Communism | -18.410 |
Token | for |
Token ID | 329 |
Feature activation | -2.24e+00 |
Pos logit contributions | |
manually | +38.551 |
updated | +38.382 |
update | +37.130 |
optionally | +36.470 |
formatted | +36.461 |
Neg logit contributions | |
dictators | -18.040 |
hating | -16.634 |
Communism | -16.311 |
oppressed | -16.103 |
dictatorship | -15.999 |
Token | those |
Token ID | 883 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
updated | +20.040 |
Setup | +19.952 |
manually | +19.790 |
optionally | +19.286 |
update | +19.272 |
Neg logit contributions | |
dictators | -11.701 |
hating | -11.680 |
oppressed | -11.104 |
dictatorship | -10.603 |
Communism | -10.580 |
Token | figures |
Token ID | 5538 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
Setup | +16.989 |
updated | +16.978 |
manually | +16.942 |
optionally | +16.530 |
update | +16.289 |
Neg logit contributions | |
hating | -9.975 |
dictators | -9.970 |
oppressed | -9.589 |
Communism | -9.219 |
Jews | -9.150 |
Token | , |
Token ID | 11 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
manually | +32.013 |
updated | +31.825 |
update | +30.732 |
optionally | +30.474 |
formatted | +30.064 |
Neg logit contributions | |
dictators | -17.838 |
hating | -17.370 |
Communism | -16.709 |
oppressed | -16.350 |
dictatorship | -16.288 |
Token | including |
Token ID | 1390 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
updated | +22.671 |
manually | +22.540 |
Setup | +22.530 |
optionally | +22.219 |
formatted | +21.831 |
Neg logit contributions | |
dictators | -13.086 |
hating | -12.979 |
oppressed | -12.424 |
dictatorship | -11.828 |
Communism | -11.716 |
Token | regions |
Token ID | 7652 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
Setup | +20.717 |
manually | +20.347 |
updated | +20.179 |
optionally | +19.776 |
annot | +19.602 |
Neg logit contributions | |
hating | -12.787 |
dictators | -12.615 |
oppressed | -12.031 |
Jews | -11.502 |
Communism | -11.358 |
Token | with |
Token ID | 351 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
Setup | +11.591 |
manually | +11.214 |
updated | +11.077 |
optionally | +11.006 |
annot | +10.794 |
Neg logit contributions | |
dictators | -8.399 |
hating | -8.332 |
oppressed | -8.022 |
Jews | -7.765 |
Communism | -7.581 |
Token | AWS |
Token ID | 30865 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
Setup | +28.281 |
manually | +28.132 |
updated | +27.966 |
optionally | +27.386 |
update | +27.088 |
Neg logit contributions | |
dictators | -14.421 |
hating | -14.397 |
oppressed | -13.497 |
Jews | -13.063 |
Communism | -12.983 |
Token | . |
Token ID | 13 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
Setup | +17.368 |
manually | +16.877 |
updated | +16.701 |
optionally | +16.457 |
annot | +16.252 |
Neg logit contributions | |
dictators | -11.785 |
hating | -11.711 |
oppressed | -11.270 |
Jews | -10.798 |
Communism | -10.471 |
Token | We |
Token ID | 775 |
Feature activation | -3.90e+00 |
Pos logit contributions | |
Setup | +20.271 |
manually | +19.213 |
updated | +19.019 |
optionally | +18.937 |
update | +18.605 |
Neg logit contributions | |
dictators | -13.278 |
hating | -13.169 |
oppressed | -12.604 |
Jews | -11.856 |
tyranny | -11.768 |
Token | will |
Token ID | 481 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
manually | +30.289 |
updated | +30.023 |
Setup | +29.743 |
optionally | +29.618 |
annot | +29.299 |
Neg logit contributions | |
dictators | -18.622 |
hating | -18.463 |
oppressed | -17.166 |
Communism | -17.005 |
tyranny | -16.803 |
Token | deploy |
Token ID | 6061 |
Feature activation | -3.65e+00 |
Pos logit contributions | |
manually | +36.790 |
optionally | +36.033 |
update | +36.012 |
annot | +35.560 |
Setup | +35.177 |
Neg logit contributions | |
hating | -21.305 |
dictators | -21.178 |
oppressed | -19.846 |
tyranny | -18.980 |
Communism | -18.899 |
Token | the |
Token ID | 262 |
Feature activation | -3.96e+00 |
Pos logit contributions | |
manually | +30.366 |
Setup | +29.950 |
updated | +29.742 |
update | +29.129 |
optionally | +29.124 |
Neg logit contributions | |
dictators | -16.761 |
hating | -16.385 |
oppressed | -15.654 |
Jews | -15.145 |
Communism | -14.762 |
Token | application |
Token ID | 3586 |
Feature activation | -4.29e+00 |
Pos logit contributions | |
Setup | +33.034 |
updated | +33.007 |
manually | +32.699 |
update | +32.018 |
annot | +31.774 |
Neg logit contributions | |
dictators | -16.326 |
hating | -15.853 |
oppressed | -14.861 |
Jews | -14.477 |
Communism | -14.064 |
Token | in |
Token ID | 287 |
Feature activation | -3.29e+00 |
Pos logit contributions | |
manually | +34.283 |
Setup | +32.738 |
optionally | +32.470 |
updated | +32.462 |
update | +31.897 |
Neg logit contributions | |
dictators | -18.303 |
hating | -17.667 |
oppressed | -17.300 |
Jews | -16.696 |
Communism | -16.278 |
Token | one |
Token ID | 530 |
Feature activation | -3.42e+00 |
Pos logit contributions | |
Setup | +28.516 |
manually | +28.251 |
updated | +27.751 |
optionally | +27.402 |
update | +27.107 |
Neg logit contributions | |
dictators | -15.166 |
hating | -15.165 |
oppressed | -13.963 |
Jews | -13.675 |
bullies | -13.437 |
Token | all |
Token ID | 477 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
Setup | +14.694 |
manually | +14.306 |
updated | +14.194 |
optionally | +14.027 |
annot | +13.716 |
Neg logit contributions | |
dictators | -12.125 |
hating | -12.102 |
oppressed | -11.652 |
Jews | -11.263 |
Communism | -11.000 |
Token | particles |
Token ID | 13166 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Setup | +12.517 |
manually | +12.068 |
updated | +11.982 |
optionally | +11.833 |
annot | +11.607 |
Neg logit contributions | |
dictators | -10.775 |
hating | -10.746 |
oppressed | -10.328 |
Jews | -10.024 |
Communism | -9.847 |
Token | .) |
Token ID | 2014 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
Setup | +14.777 |
manually | +14.596 |
updated | +14.434 |
optionally | +14.301 |
annot | +14.046 |
Neg logit contributions | |
dictators | -10.908 |
hating | -10.686 |
oppressed | -10.257 |
Jews | -9.959 |
Communism | -9.868 |
Token | In |
Token ID | 554 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
Setup | +12.364 |
manually | +11.875 |
updated | +11.805 |
optionally | +11.638 |
annot | +11.443 |
Neg logit contributions | |
dictators | -8.876 |
hating | -8.780 |
oppressed | -8.516 |
dictatorship | -7.989 |
tyranny | -7.986 |
Token | the |
Token ID | 262 |
Feature activation | -2.57e+00 |
Pos logit contributions | |
Setup | +19.205 |
manually | +18.775 |
updated | +18.609 |
optionally | +18.294 |
update | +18.066 |
Neg logit contributions | |
hating | -13.123 |
dictators | -13.008 |
oppressed | -12.456 |
Jews | -12.073 |
martyr | -11.766 |
Token | code |
Token ID | 2438 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
Setup | +22.597 |
updated | +22.353 |
manually | +22.157 |
annot | +21.679 |
update | +21.652 |
Neg logit contributions | |
hating | -13.609 |
dictators | -13.339 |
oppressed | -12.564 |
Jews | -12.303 |
Communism | -11.940 |
Token | , |
Token ID | 11 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
updated | +39.038 |
manually | +39.006 |
annot | +38.978 |
Setup | +38.465 |
update | +38.059 |
Neg logit contributions | |
dictators | -17.153 |
hating | -16.678 |
oppressed | -15.596 |
Jews | -14.775 |
tyranny | -14.769 |
Token | Uniform |
Token ID | 35712 |
Feature activation | -2.97e+00 |
Pos logit contributions | |
Setup | +22.048 |
manually | +21.995 |
updated | +21.683 |
optionally | +21.462 |
annot | +21.201 |
Neg logit contributions | |
dictators | -14.086 |
hating | -13.992 |
oppressed | -13.440 |
Jews | -12.687 |
dictatorship | -12.653 |
Token | Grid |
Token ID | 41339 |
Feature activation | -3.50e+00 |
Pos logit contributions | |
Setup | +21.470 |
manually | +19.759 |
updated | +19.529 |
optionally | +19.126 |
formatted | +18.812 |
Neg logit contributions | |
hating | -19.627 |
dictators | -19.557 |
oppressed | -19.233 |
Jews | -18.133 |
dictatorship | -18.100 |
Token | :: |
Token ID | 3712 |
Feature activation | -3.83e+00 |
Pos logit contributions | |
Setup | +30.664 |
manually | +29.871 |
updated | +29.331 |
optionally | +29.219 |
annot | +28.730 |
Neg logit contributions | |
hating | -15.739 |
dictators | -15.507 |
oppressed | -14.950 |
dictatorship | -13.813 |
Jews | -13.798 |
Token | Acc |
Token ID | 17320 |
Feature activation | -2.41e+00 |
Pos logit contributions | |
Setup | +30.498 |
manually | +27.487 |
updated | +27.362 |
update | +26.944 |
optionally | +26.856 |
Neg logit contributions | |
hating | -19.914 |
dictators | -19.874 |
oppressed | -19.312 |
martyr | -17.989 |
dictatorship | -17.935 |
Token | Sens |
Token ID | 14173 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
manually | +34.323 |
updated | +33.994 |
Setup | +33.809 |
optionally | +33.222 |
annot | +32.786 |
Neg logit contributions | |
hating | -15.942 |
dictators | -15.626 |
oppressed | -14.607 |
dictatorship | -13.720 |
tyranny | -13.637 |
Token | itivity |
Token ID | 11365 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
Setup | +12.020 |
updated | +11.198 |
manually | +11.141 |
optionally | +10.838 |
annot | +10.593 |
Neg logit contributions | |
dictators | -20.139 |
hating | -20.076 |
oppressed | -19.501 |
martyr | -18.846 |
Communism | -18.799 |
Token | analysis |
Token ID | 3781 |
Feature activation | -4.58e+00 |
Pos logit contributions | |
Setup | +28.555 |
manually | +28.296 |
updated | +28.058 |
optionally | +27.566 |
update | +27.487 |
Neg logit contributions | |
hating | -16.176 |
dictators | -15.936 |
oppressed | -15.323 |
martyr | -14.429 |
Jews | -14.370 |
Token | will |
Token ID | 481 |
Feature activation | -5.80e+00 |
Pos logit contributions | |
manually | +37.425 |
updated | +36.990 |
Setup | +36.517 |
optionally | +36.388 |
annot | +35.829 |
Neg logit contributions | |
hating | -15.772 |
dictators | -15.024 |
oppressed | -14.174 |
dictatorship | -13.249 |
martyr | -13.205 |
Token | be |
Token ID | 307 |
Feature activation | -5.30e+00 |
Pos logit contributions | |
manually | +40.261 |
optionally | +40.241 |
update | +39.438 |
annot | +38.776 |
updated | +38.282 |
Neg logit contributions | |
hating | -22.121 |
dictators | -19.938 |
oppressed | -18.542 |
Almighty | -17.906 |
martyr | -17.816 |
Token | performed |
Token ID | 6157 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
updated | +39.678 |
manually | +39.414 |
optionally | +38.564 |
annot | +37.782 |
detailed | +37.380 |
Neg logit contributions | |
hating | -18.351 |
dictators | -17.662 |
Almighty | -16.127 |
Communism | -15.827 |
martyr | -15.818 |
Token | excluding |
Token ID | 23494 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
manually | +38.802 |
optionally | +37.263 |
updated | +36.858 |
annot | +35.769 |
Setup | +35.533 |
Neg logit contributions | |
dictators | -18.091 |
hating | -17.600 |
oppressed | -16.848 |
Communism | -16.118 |
bullies | -16.101 |
Token | studies |
Token ID | 3640 |
Feature activation | -2.88e+00 |
Pos logit contributions | |
manually | +24.136 |
updated | +23.982 |
Setup | +23.869 |
optionally | +23.491 |
annot | +23.422 |
Neg logit contributions | |
hating | -11.647 |
dictators | -11.603 |
oppressed | -10.902 |
Communism | -10.361 |
dictatorship | -10.260 |
Token | only |
Token ID | 691 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
manually | +24.543 |
updated | +24.242 |
annot | +23.950 |
Setup | +23.926 |
optionally | +23.812 |
Neg logit contributions | |
dictators | -14.381 |
hating | -13.722 |
oppressed | -13.113 |
Communism | -12.895 |
tyranny | -12.808 |
Token | reported |
Token ID | 2098 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
Setup | +12.424 |
manually | +12.261 |
updated | +12.104 |
optionally | +12.030 |
annot | +11.831 |
Neg logit contributions | |
dictators | -8.832 |
hating | -8.745 |
oppressed | -8.382 |
Jews | -8.093 |
dictatorship | -7.994 |
Token | as |
Token ID | 355 |
Feature activation | -2.37e+00 |
Pos logit contributions | |
manually | +20.054 |
Setup | +19.861 |
updated | +19.797 |
optionally | +19.562 |
annot | +19.133 |
Neg logit contributions | |
dictators | -13.605 |
hating | -13.312 |
oppressed | -12.873 |
Communism | -12.272 |
Jews | -12.166 |
Token | server |
Token ID | 4382 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
Setup | +23.691 |
manually | +23.325 |
updated | +23.044 |
optionally | +22.749 |
annot | +22.517 |
Neg logit contributions | |
dictators | -13.813 |
hating | -13.481 |
oppressed | -12.922 |
Jews | -12.683 |
Communism | -12.379 |
Token | less |
Token ID | 1203 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
Setup | +12.483 |
updated | +12.008 |
manually | +11.916 |
optionally | +11.458 |
update | +11.351 |
Neg logit contributions | |
dictators | -16.388 |
hating | -15.932 |
oppressed | -15.497 |
Jews | -15.442 |
bullies | -15.088 |
Token | framework |
Token ID | 9355 |
Feature activation | -2.61e+00 |
Pos logit contributions | |
Setup | +11.695 |
manually | +11.253 |
updated | +11.126 |
optionally | +11.049 |
annot | +10.886 |
Neg logit contributions | |
dictators | -8.709 |
hating | -8.649 |
oppressed | -8.340 |
Jews | -8.108 |
Communism | -7.867 |
Token | . |
Token ID | 13 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
Setup | +21.356 |
manually | +20.794 |
updated | +20.615 |
optionally | +20.260 |
annot | +20.043 |
Neg logit contributions | |
dictators | -15.564 |
hating | -15.515 |
oppressed | -14.898 |
Jews | -14.521 |
Communism | -14.062 |
Token | We |
Token ID | 775 |
Feature activation | -3.97e+00 |
Pos logit contributions | |
Setup | +24.098 |
manually | +22.916 |
updated | +22.644 |
update | +22.370 |
optionally | +22.264 |
Neg logit contributions | |
dictators | -15.702 |
hating | -15.568 |
oppressed | -14.964 |
tyranny | -14.012 |
bullies | -13.921 |
Token | will |
Token ID | 481 |
Feature activation | -5.13e+00 |
Pos logit contributions | |
manually | +30.407 |
updated | +30.313 |
Setup | +29.990 |
optionally | +29.601 |
annot | +29.417 |
Neg logit contributions | |
hating | -19.168 |
dictators | -19.121 |
oppressed | -17.694 |
tyranny | -17.376 |
Communism | -17.333 |
Token | build |
Token ID | 1382 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
manually | +36.194 |
update | +35.408 |
optionally | +35.149 |
annot | +34.881 |
Setup | +34.870 |
Neg logit contributions | |
hating | -22.081 |
dictators | -21.821 |
oppressed | -20.525 |
tyranny | -19.597 |
Jews | -19.502 |
Token | a |
Token ID | 257 |
Feature activation | -3.52e+00 |
Pos logit contributions | |
Setup | +30.593 |
manually | +30.565 |
updated | +30.192 |
optionally | +29.593 |
annot | +29.446 |
Neg logit contributions | |
dictators | -16.348 |
hating | -16.067 |
oppressed | -15.256 |
Jews | -15.071 |
bullies | -14.422 |
Token | sample |
Token ID | 6291 |
Feature activation | -4.20e+00 |
Pos logit contributions | |
Setup | +30.740 |
manually | +30.479 |
updated | +30.052 |
optionally | +29.361 |
annot | +29.248 |
Neg logit contributions | |
dictators | -15.299 |
hating | -14.779 |
oppressed | -14.218 |
Jews | -13.799 |
bullies | -13.241 |
Token | application |
Token ID | 3586 |
Feature activation | -4.32e+00 |
Pos logit contributions | |
Setup | +33.350 |
manually | +32.752 |
updated | +32.495 |
update | +31.892 |
annot | +31.767 |
Neg logit contributions | |
dictators | -17.865 |
hating | -17.101 |
Jews | -16.421 |
oppressed | -16.390 |
bullies | -15.545 |
Token | that |
Token ID | 326 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
manually | +33.540 |
Setup | +32.831 |
updated | +32.718 |
optionally | +32.048 |
annot | +31.949 |
Neg logit contributions | |
dictators | -18.697 |
hating | -17.685 |
oppressed | -17.261 |
Jews | -16.983 |
Communism | -16.291 |
Token | their |
Token ID | 511 |
Feature activation | -3.10e+00 |
Pos logit contributions | |
Setup | +10.942 |
manually | +10.634 |
updated | +10.478 |
optionally | +10.392 |
annot | +10.221 |
Neg logit contributions | |
dictators | -8.159 |
hating | -8.114 |
oppressed | -7.814 |
Jews | -7.549 |
dictatorship | -7.367 |
Token | site |
Token ID | 2524 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
updated | +26.610 |
manually | +26.438 |
Setup | +26.289 |
update | +25.465 |
annot | +25.455 |
Neg logit contributions | |
dictators | -14.779 |
hating | -14.683 |
oppressed | -14.110 |
Jews | -13.208 |
bullies | -12.964 |
Token | . |
Token ID | 13 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
Setup | +18.699 |
manually | +18.602 |
updated | +18.195 |
optionally | +17.975 |
annot | +17.678 |
Neg logit contributions | |
dictators | -13.539 |
hating | -13.504 |
oppressed | -13.050 |
Jews | -12.545 |
tyranny | -12.201 |
Token | This |
Token ID | 770 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
Setup | +16.476 |
manually | +15.791 |
updated | +15.698 |
optionally | +15.444 |
annot | +15.191 |
Neg logit contributions | |
dictators | -11.851 |
hating | -11.726 |
oppressed | -11.349 |
dictatorship | -10.650 |
tyranny | -10.604 |
Token | link |
Token ID | 2792 |
Feature activation | -4.70e+00 |
Pos logit contributions | |
updated | +33.650 |
manually | +33.467 |
Setup | +33.235 |
update | +32.572 |
formatted | +32.035 |
Neg logit contributions | |
dictators | -17.016 |
hating | -16.591 |
oppressed | -15.776 |
Jews | -15.077 |
Communism | -14.841 |
Token | provides |
Token ID | 3769 |
Feature activation | -5.12e+00 |
Pos logit contributions | |
updated | +35.759 |
manually | +35.483 |
Setup | +34.982 |
optionally | +34.299 |
update | +34.141 |
Neg logit contributions | |
hating | -19.318 |
dictators | -18.446 |
oppressed | -17.840 |
tyranny | -16.953 |
Communism | -16.798 |
Token | a |
Token ID | 257 |
Feature activation | -4.94e+00 |
Pos logit contributions | |
updated | +40.123 |
manually | +39.414 |
Setup | +38.819 |
detailed | +38.387 |
optionally | +38.102 |
Neg logit contributions | |
dictators | -16.919 |
hating | -16.823 |
oppressed | -15.825 |
Communism | -14.651 |
Jews | -14.389 |
Token | copy |
Token ID | 4866 |
Feature activation | -3.69e+00 |
Pos logit contributions | |
updated | +38.163 |
manually | +38.123 |
formatted | +37.515 |
detailed | +37.505 |
Setup | +37.253 |
Neg logit contributions | |
hating | -16.960 |
dictators | -16.936 |
oppressed | -16.254 |
bullies | -14.919 |
Jews | -14.779 |
Token | of |
Token ID | 286 |
Feature activation | -2.97e+00 |
Pos logit contributions | |
Setup | +29.268 |
manually | +28.991 |
updated | +28.735 |
optionally | +28.267 |
formatted | +28.249 |
Neg logit contributions | |
dictators | -18.026 |
hating | -17.548 |
oppressed | -17.164 |
Jews | -16.594 |
Communism | -16.229 |
Token | the |
Token ID | 262 |
Feature activation | -3.83e+00 |
Pos logit contributions | |
Setup | +26.106 |
manually | +26.040 |
updated | +25.965 |
optionally | +25.004 |
formatted | +24.932 |
Neg logit contributions | |
dictators | -14.462 |
hating | -14.066 |
oppressed | -13.340 |
Jews | -12.724 |
dictatorship | -12.614 |
Token | Excel |
Token ID | 24134 |
Feature activation | -3.91e+00 |
Pos logit contributions | |
updated | +33.578 |
manually | +32.938 |
Setup | +32.602 |
formatted | +32.045 |
annot | +31.991 |
Neg logit contributions | |
dictators | -15.117 |
hating | -14.847 |
oppressed | -13.838 |
Jews | -13.014 |
bullies | -12.830 |
Token | - |
Token ID | 12 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
Setup | +14.678 |
manually | +13.890 |
updated | +13.769 |
optionally | +13.674 |
annot | +13.408 |
Neg logit contributions | |
dictators | -13.291 |
hating | -13.209 |
oppressed | -12.849 |
Jews | -12.395 |
Communism | -12.220 |
Token | local |
Token ID | 12001 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
Setup | +18.287 |
manually | +17.336 |
optionally | +17.137 |
updated | +17.102 |
annot | +16.759 |
Neg logit contributions | |
dictators | -14.842 |
hating | -14.708 |
oppressed | -14.198 |
Communism | -13.596 |
Jews | -13.592 |
Token | * |
Token ID | 9 |
Feature activation | -1.93e+00 |
Pos logit contributions | |
Setup | +10.453 |
manually | +9.978 |
updated | +9.865 |
optionally | +9.817 |
annot | +9.606 |
Neg logit contributions | |
dictators | -9.548 |
hating | -9.488 |
oppressed | -9.189 |
Jews | -8.922 |
Communism | -8.737 |
Token | The |
Token ID | 383 |
Feature activation | -3.15e+00 |
Pos logit contributions | |
Setup | +16.798 |
manually | +16.276 |
updated | +16.098 |
optionally | +16.051 |
annot | +15.722 |
Neg logit contributions | |
hating | -11.851 |
dictators | -11.848 |
oppressed | -11.439 |
Jews | -10.844 |
tyranny | -10.712 |
Token | options |
Token ID | 3689 |
Feature activation | -4.02e+00 |
Pos logit contributions | |
manually | +27.106 |
Setup | +27.022 |
updated | +26.967 |
optionally | +26.641 |
update | +26.405 |
Neg logit contributions | |
hating | -15.175 |
dictators | -14.941 |
oppressed | -14.156 |
Communism | -13.464 |
Jews | -13.430 |
Token | are |
Token ID | 389 |
Feature activation | -5.12e+00 |
Pos logit contributions | |
manually | +33.421 |
updated | +32.826 |
optionally | +32.636 |
Setup | +32.382 |
annot | +32.280 |
Neg logit contributions | |
hating | -16.976 |
dictators | -16.365 |
oppressed | -15.513 |
Communism | -15.067 |
martyr | -14.964 |
Token | set |
Token ID | 900 |
Feature activation | -4.44e+00 |
Pos logit contributions | |
manually | +40.627 |
updated | +40.577 |
optionally | +39.856 |
annot | +39.489 |
formatted | +39.392 |
Neg logit contributions | |
hating | -17.236 |
dictators | -15.346 |
oppressed | -14.796 |
bullies | -14.047 |
martyr | -14.002 |
Token | like |
Token ID | 588 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
manually | +35.084 |
optionally | +33.213 |
updated | +32.801 |
Setup | +32.343 |
annot | +31.909 |
Neg logit contributions | |
hating | -19.144 |
dictators | -18.982 |
oppressed | -18.549 |
Communism | -17.563 |
bullies | -17.560 |
Token | with |
Token ID | 351 |
Feature activation | -2.39e+00 |
Pos logit contributions | |
Setup | +19.532 |
manually | +19.363 |
updated | +18.927 |
optionally | +18.853 |
annot | +18.502 |
Neg logit contributions | |
hating | -14.033 |
dictators | -13.967 |
oppressed | -13.594 |
Jews | -12.886 |
Communism | -12.764 |
Token | " |
Token ID | 366 |
Feature activation | -2.44e+00 |
Pos logit contributions | |
Setup | +20.148 |
manually | +20.089 |
updated | +19.680 |
optionally | +19.548 |
update | +19.208 |
Neg logit contributions | |
hating | -13.948 |
dictators | -13.860 |
oppressed | -13.363 |
Jews | -12.792 |
Communism | -12.631 |
Token | : |
Token ID | 25 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
Setup | +19.312 |
manually | +18.476 |
updated | +18.064 |
optionally | +17.930 |
annot | +17.710 |
Neg logit contributions | |
hating | -15.698 |
dictators | -15.692 |
oppressed | -15.254 |
bullies | -14.479 |
Jews | -14.439 |
Token | ate |
Token ID | 378 |
Feature activation | -3.67e+00 |
Pos logit contributions | |
Setup | +20.836 |
manually | +19.657 |
updated | +19.418 |
update | +18.986 |
optionally | +18.798 |
Neg logit contributions | |
hating | -20.071 |
dictators | -19.741 |
oppressed | -19.386 |
Jews | -18.409 |
tyranny | -18.310 |
Token | button |
Token ID | 4936 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
Setup | +31.254 |
manually | +30.393 |
updated | +29.552 |
update | +29.253 |
optionally | +29.178 |
Neg logit contributions | |
hating | -16.840 |
dictators | -16.652 |
oppressed | -16.201 |
martyr | -15.089 |
tyranny | -14.736 |
Token | . |
Token ID | 13 |
Feature activation | -2.80e+00 |
Pos logit contributions | |
manually | +28.560 |
Setup | +27.891 |
optionally | +27.596 |
updated | +27.523 |
annot | +26.927 |
Neg logit contributions | |
hating | -18.576 |
dictators | -18.547 |
oppressed | -17.659 |
Jews | -16.981 |
Communism | -16.665 |
Token | All |
Token ID | 1439 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
Setup | +23.774 |
manually | +22.985 |
updated | +22.894 |
optionally | +22.611 |
update | +22.187 |
Neg logit contributions | |
dictators | -15.570 |
hating | -15.327 |
oppressed | -14.817 |
tyranny | -13.793 |
dictatorship | -13.778 |
Token | entries |
Token ID | 12784 |
Feature activation | -5.33e+00 |
Pos logit contributions | |
manually | +31.561 |
Setup | +31.351 |
updated | +31.252 |
optionally | +30.398 |
formatted | +30.241 |
Neg logit contributions | |
hating | -14.553 |
dictators | -14.034 |
oppressed | -13.217 |
Communism | -12.723 |
martyr | -12.684 |
Token | are |
Token ID | 389 |
Feature activation | -5.11e+00 |
Pos logit contributions | |
manually | +39.291 |
updated | +39.258 |
optionally | +38.161 |
update | +37.815 |
formatted | +37.721 |
Neg logit contributions | |
dictators | -19.347 |
hating | -19.305 |
Communism | -17.725 |
oppressed | -17.572 |
martyr | -17.112 |
Token | cleared |
Token ID | 12539 |
Feature activation | -3.46e+00 |
Pos logit contributions | |
manually | +40.886 |
updated | +40.866 |
formatted | +39.850 |
optionally | +39.395 |
annot | +39.086 |
Neg logit contributions | |
hating | -16.808 |
dictators | -16.227 |
oppressed | -14.855 |
Communism | -14.736 |
dictatorship | -13.988 |
Token | by |
Token ID | 416 |
Feature activation | -2.81e+00 |
Pos logit contributions | |
manually | +28.181 |
updated | +26.922 |
optionally | +26.834 |
Setup | +26.516 |
formatted | +26.256 |
Neg logit contributions | |
dictators | -17.277 |
hating | -17.038 |
oppressed | -16.607 |
Communism | -15.612 |
Jews | -15.600 |
Token | pressing |
Token ID | 12273 |
Feature activation | -3.37e+00 |
Pos logit contributions | |
manually | +25.533 |
Setup | +25.191 |
updated | +24.754 |
optionally | +24.638 |
annot | +24.293 |
Neg logit contributions | |
dictators | -13.332 |
hating | -13.139 |
oppressed | -12.762 |
Communism | -12.043 |
martyr | -11.795 |
Token | the |
Token ID | 262 |
Feature activation | -3.59e+00 |
Pos logit contributions | |
Setup | +28.330 |
manually | +28.164 |
optionally | +27.725 |
updated | +27.455 |
update | +27.100 |
Neg logit contributions | |
dictators | -15.972 |
hating | -15.820 |
oppressed | -15.062 |
martyr | -14.066 |
bullies | -14.058 |
Token | Clear |
Token ID | 11459 |
Feature activation | -3.00e+00 |
Pos logit contributions | |
Setup | +30.759 |
manually | +30.435 |
updated | +30.230 |
optionally | +29.999 |
update | +29.817 |
Neg logit contributions | |
hating | -15.129 |
dictators | -15.061 |
oppressed | -14.234 |
Communism | -13.174 |
bullies | -13.169 |
Token | end |
Token ID | 886 |
Feature activation | -2.53e+00 |
Pos logit contributions | |
manually | +23.851 |
Setup | +23.838 |
updated | +23.645 |
optionally | +23.638 |
annot | +22.980 |
Neg logit contributions | |
hating | -13.638 |
dictators | -13.469 |
oppressed | -12.885 |
Communism | -12.340 |
Jews | -12.171 |
Token | - |
Token ID | 12 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
Setup | +20.484 |
manually | +20.112 |
updated | +19.891 |
optionally | +19.709 |
annot | +19.376 |
Neg logit contributions | |
hating | -15.789 |
dictators | -15.767 |
oppressed | -15.017 |
Communism | -14.380 |
Jews | -14.338 |
Token | points |
Token ID | 13033 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
Setup | +15.331 |
manually | +14.516 |
updated | +14.416 |
optionally | +14.356 |
annot | +13.917 |
Neg logit contributions | |
dictators | -15.937 |
hating | -15.832 |
oppressed | -15.208 |
dictatorship | -14.703 |
Communism | -14.689 |
Token | . |
Token ID | 13 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
Setup | +18.441 |
manually | +18.295 |
updated | +18.106 |
optionally | +17.849 |
annot | +17.624 |
Neg logit contributions | |
hating | -13.149 |
dictators | -13.136 |
oppressed | -12.548 |
Jews | -12.131 |
Communism | -12.026 |
Token | The |
Token ID | 383 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
Setup | +21.780 |
manually | +21.079 |
updated | +20.889 |
optionally | +20.804 |
update | +20.422 |
Neg logit contributions | |
dictators | -14.315 |
hating | -14.310 |
oppressed | -13.644 |
Jews | -12.736 |
tyranny | -12.693 |
Token | code |
Token ID | 2438 |
Feature activation | -5.10e+00 |
Pos logit contributions | |
updated | +31.377 |
Setup | +31.297 |
manually | +30.986 |
formatted | +30.575 |
annot | +30.401 |
Neg logit contributions | |
hating | -15.633 |
dictators | -15.247 |
oppressed | -14.354 |
Communism | -13.871 |
Jews | -13.535 |
Token | for |
Token ID | 329 |
Feature activation | -3.00e+00 |
Pos logit contributions | |
updated | +38.616 |
manually | +38.358 |
Setup | +38.192 |
update | +37.713 |
annot | +37.342 |
Neg logit contributions | |
hating | -17.573 |
dictators | -17.409 |
oppressed | -16.639 |
Jews | -15.428 |
Communism | -15.281 |
Token | this |
Token ID | 428 |
Feature activation | -3.62e+00 |
Pos logit contributions | |
Setup | +25.709 |
manually | +25.364 |
updated | +24.987 |
optionally | +24.508 |
update | +24.432 |
Neg logit contributions | |
dictators | -15.259 |
hating | -14.822 |
oppressed | -14.411 |
Jews | -13.835 |
Communism | -13.594 |
Token | application |
Token ID | 3586 |
Feature activation | -4.31e+00 |
Pos logit contributions | |
Setup | +29.803 |
manually | +29.583 |
updated | +29.304 |
update | +28.744 |
optionally | +28.509 |
Neg logit contributions | |
dictators | -17.208 |
hating | -16.974 |
oppressed | -16.095 |
Jews | -15.352 |
Communism | -15.173 |
Token | is |
Token ID | 318 |
Feature activation | -5.05e+00 |
Pos logit contributions | |
manually | +33.353 |
updated | +32.982 |
Setup | +32.969 |
update | +32.414 |
optionally | +32.336 |
Neg logit contributions | |
hating | -18.248 |
dictators | -17.859 |
oppressed | -17.146 |
Jews | -16.193 |
Communism | -16.167 |
Token | in |
Token ID | 287 |
Feature activation | -3.17e+00 |
Pos logit contributions | |
updated | +39.077 |
manually | +38.664 |
annot | +37.923 |
Setup | +37.773 |
formatted | +37.373 |
Neg logit contributions | |
dictators | -17.594 |
hating | -17.151 |
oppressed | -16.522 |
Jews | -15.666 |
Communism | -15.344 |
Token | , |
Token ID | 11 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
dictators | +14.945 |
hating | +14.902 |
oppressed | +14.866 |
Jews | +14.288 |
politics | +13.928 |
Neg logit contributions | |
Setup | -14.202 |
manually | -12.617 |
optionally | -12.503 |
updated | -12.371 |
annot | -12.152 |
Token | in |
Token ID | 287 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
dictators | +10.818 |
hating | +10.713 |
oppressed | +10.583 |
Jews | +10.354 |
religion | +10.054 |
Neg logit contributions | |
Setup | -12.065 |
manually | -11.000 |
optionally | -10.829 |
updated | -10.821 |
annot | -10.722 |
Token | terms |
Token ID | 2846 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
dictators | +13.193 |
hating | +12.981 |
oppressed | +12.819 |
Jews | +12.633 |
politics | +12.364 |
Neg logit contributions | |
Setup | -10.983 |
optionally | -10.051 |
manually | -10.020 |
updated | -9.713 |
formatted | -9.692 |
Token | of |
Token ID | 286 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
Setup | +0.909 |
manually | +0.862 |
updated | +0.849 |
optionally | +0.847 |
annot | +0.827 |
Neg logit contributions | |
dictators | -1.035 |
hating | -1.029 |
oppressed | -0.999 |
Jews | -0.976 |
Communism | -0.955 |
Token | nationalism |
Token ID | 24436 |
Feature activation | +2.74e+00 |
Pos logit contributions | |
dictators | +16.035 |
hating | +15.899 |
oppressed | +15.668 |
Jews | +15.611 |
religion | +15.399 |
Neg logit contributions | |
Setup | -11.489 |
optionally | -10.139 |
manually | -10.074 |
annot | -9.838 |
updated | -9.765 |
Token | and |
Token ID | 290 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
hating | +19.550 |
oppressed | +19.434 |
dictators | +19.405 |
politics | +19.164 |
Jews | +18.840 |
Neg logit contributions | |
Setup | -17.152 |
manually | -15.183 |
optionally | -15.015 |
updated | -14.796 |
annot | -14.622 |
Token | the |
Token ID | 262 |
Feature activation | +2.93e+00 |
Pos logit contributions | |
dictators | +27.373 |
religion | +27.156 |
politics | +27.076 |
oppressed | +27.034 |
hating | +26.884 |
Neg logit contributions | |
Setup | -16.362 |
manually | -13.505 |
Completed | -13.474 |
updated | -13.226 |
optionally | -13.225 |
Token | will |
Token ID | 481 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
dictators | +25.049 |
oppressed | +24.955 |
Jews | +24.466 |
politics | +24.354 |
hating | +24.329 |
Neg logit contributions | |
Setup | -13.839 |
optionally | -11.987 |
manually | -11.937 |
annot | -11.644 |
updated | -11.251 |
Token | to |
Token ID | 284 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
dictators | +10.670 |
oppressed | +10.511 |
hating | +10.439 |
Jews | +10.103 |
dictatorship | +9.955 |
Neg logit contributions | |
Setup | -10.463 |
manually | -9.605 |
optionally | -9.582 |
updated | -9.517 |
annot | -9.399 |
Token | win |
Token ID | 1592 |
Feature activation | +2.67e+00 |
Pos logit contributions | |
dictators | +24.713 |
oppressed | +24.462 |
hating | +23.823 |
Jews | +23.745 |
dictatorship | +23.711 |
Neg logit contributions | |
Setup | -15.983 |
updated | -13.587 |
updated | -13.437 |
annot | -13.423 |
formatted | -13.417 |
Token | , |
Token ID | 11 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
dictators | +21.158 |
oppressed | +20.482 |
Jews | +20.205 |
hating | +19.981 |
politics | +19.978 |
Neg logit contributions | |
Setup | -15.902 |
optionally | -14.145 |
annot | -13.877 |
manually | -13.753 |
updated | -13.719 |
Token | is |
Token ID | 318 |
Feature activation | -2.95e-01 |
Pos logit contributions | |
Setup | +5.142 |
manually | +4.919 |
updated | +4.860 |
optionally | +4.835 |
annot | +4.737 |
Neg logit contributions | |
dictators | -4.753 |
hating | -4.725 |
oppressed | -4.565 |
Jews | -4.439 |
Communism | -4.341 |
Token | dem |
Token ID | 1357 |
Feature activation | +8.40e-01 |
Pos logit contributions | |
Setup | +2.466 |
manually | +2.336 |
optionally | +2.310 |
updated | +2.298 |
annot | +2.251 |
Neg logit contributions | |
dictators | -2.158 |
hating | -2.137 |
oppressed | -2.070 |
Jews | -2.010 |
dictatorship | -1.963 |
Token | e |
Token ID | 68 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
hating | +5.272 |
dictators | +5.179 |
oppressed | +5.140 |
Jews | +4.987 |
tyranny | +4.866 |
Neg logit contributions | |
Setup | -7.454 |
manually | -7.249 |
optionally | -7.051 |
updated | -6.984 |
annot | -6.868 |
Token | aning |
Token ID | 7574 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
hating | +7.671 |
dictators | +7.497 |
Jews | +7.349 |
oppressed | +7.270 |
martyr | +6.877 |
Neg logit contributions | |
Setup | -11.275 |
manually | -10.683 |
optionally | -10.665 |
updated | -10.287 |
annot | -10.047 |
Token | for |
Token ID | 329 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
dictators | +16.392 |
hating | +15.929 |
oppressed | +15.708 |
Jews | +15.528 |
religion | +15.275 |
Neg logit contributions | |
Setup | -14.961 |
optionally | -13.527 |
manually | -13.343 |
annot | -13.019 |
updated | -12.964 |
Token | women |
Token ID | 1466 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
dictators | +21.520 |
oppressed | +21.330 |
hating | +20.869 |
Jews | +20.563 |
religion | +20.322 |
Neg logit contributions | |
Setup | -15.901 |
optionally | -13.861 |
manually | -13.856 |
Completed | -13.271 |
annot | -13.229 |
Token | , |
Token ID | 11 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
dictators | +24.701 |
oppressed | +24.528 |
hating | +24.458 |
Jews | +23.649 |
martyr | +23.180 |
Neg logit contributions | |
Setup | -17.505 |
optionally | -14.910 |
Completed | -14.739 |
manually | -14.541 |
updated | -14.102 |
Token | but |
Token ID | 475 |
Feature activation | +7.79e-01 |
Pos logit contributions | |
dictators | +20.333 |
hating | +19.958 |
oppressed | +19.918 |
Jews | +19.446 |
religion | +18.944 |
Neg logit contributions | |
Setup | -13.276 |
manually | -11.613 |
optionally | -11.465 |
Completed | -11.233 |
updated | -11.135 |
Token | according |
Token ID | 1864 |
Feature activation | -7.25e-01 |
Pos logit contributions | |
dictators | +5.752 |
hating | +5.682 |
oppressed | +5.529 |
Jews | +5.404 |
religion | +5.235 |
Neg logit contributions | |
Setup | -6.329 |
manually | -5.851 |
optionally | -5.785 |
updated | -5.728 |
annot | -5.719 |
Token | to |
Token ID | 284 |
Feature activation | +4.90e-02 |
Pos logit contributions | |
Setup | +4.565 |
manually | +4.380 |
updated | +4.328 |
optionally | +4.229 |
annot | +4.140 |
Neg logit contributions | |
dictators | -6.544 |
hating | -6.506 |
oppressed | -6.329 |
Jews | -6.128 |
dictatorship | -6.085 |
Token | amd |
Token ID | 39971 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
dictators | +0.306 |
hating | +0.302 |
oppressed | +0.292 |
Jews | +0.284 |
tyranny | +0.273 |
Neg logit contributions | |
Setup | -0.460 |
manually | -0.437 |
optionally | -0.433 |
updated | -0.429 |
annot | -0.424 |
Token | from |
Token ID | 422 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
hating | +7.947 |
dictators | +7.886 |
oppressed | +7.767 |
Jews | +7.521 |
tyranny | +7.290 |
Neg logit contributions | |
Setup | -8.299 |
manually | -7.664 |
optionally | -7.535 |
updated | -7.450 |
formatted | -7.372 |
Token | the |
Token ID | 262 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
hating | +13.435 |
dictators | +13.272 |
oppressed | +12.909 |
tyranny | +12.840 |
politics | +12.604 |
Neg logit contributions | |
Setup | -14.626 |
manually | -13.465 |
optionally | -13.409 |
updated | -13.248 |
formatted | -13.166 |
Token | influence |
Token ID | 4588 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
dictators | +14.980 |
hating | +14.603 |
tyranny | +14.545 |
oppressed | +14.493 |
Jews | +14.311 |
Neg logit contributions | |
Setup | -13.382 |
optionally | -12.486 |
manually | -12.289 |
formatted | -12.019 |
updated | -11.921 |
Token | of |
Token ID | 286 |
Feature activation | +2.74e+00 |
Pos logit contributions | |
dictators | +3.543 |
hating | +3.518 |
oppressed | +3.423 |
Jews | +3.337 |
tyranny | +3.287 |
Neg logit contributions | |
Setup | -3.505 |
manually | -3.272 |
optionally | -3.263 |
updated | -3.239 |
annot | -3.144 |
Token | Sar |
Token ID | 6866 |
Feature activation | +2.07e+00 |
Pos logit contributions | |
dictators | +19.791 |
hating | +19.721 |
oppressed | +19.156 |
Jews | +19.135 |
tyranny | +18.973 |
Neg logit contributions | |
Setup | -17.380 |
manually | -15.485 |
optionally | -15.321 |
formatted | -15.222 |
updated | -14.994 |
Token | uman |
Token ID | 3778 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
hating | +7.891 |
dictators | +7.870 |
Jews | +7.768 |
oppressed | +7.406 |
Almighty | +7.345 |
Neg logit contributions | |
Setup | -20.725 |
manually | -20.141 |
formatted | -20.079 |
optionally | -19.960 |
updated | -19.911 |
Token | 's |
Token ID | 338 |
Feature activation | +2.41e+00 |
Pos logit contributions | |
hating | +22.964 |
dictators | +22.896 |
oppressed | +22.043 |
Jews | +21.806 |
tyranny | +21.651 |
Neg logit contributions | |
Setup | -17.770 |
optionally | -16.187 |
updated | -15.535 |
manually | -15.530 |
formatted | -15.486 |
Token | spy |
Token ID | 13997 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
dictators | +19.795 |
hating | +19.570 |
tyranny | +19.295 |
oppressed | +19.211 |
Jews | +19.201 |
Neg logit contributions | |
Setup | -13.981 |
optionally | -12.521 |
manually | -12.395 |
formatted | -12.089 |
updated | -11.665 |
Token | Gr |
Token ID | 1902 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
hating | +8.419 |
dictators | +8.413 |
Jews | +8.129 |
oppressed | +7.977 |
religion | +7.911 |
Neg logit contributions | |
Setup | -8.924 |
optionally | -8.366 |
manually | -8.283 |
updated | -8.131 |
formatted | -8.023 |
Token | í |
Token ID | 8836 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
dictators | +10.110 |
Jews | +9.738 |
hating | +9.720 |
dictatorship | +9.413 |
Almighty | +9.385 |
Neg logit contributions | |
Setup | -13.303 |
manually | -12.989 |
optionally | -12.823 |
updated | -12.733 |
formatted | -12.480 |
Token | ma |
Token ID | 2611 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
hating | +12.163 |
dictators | +12.032 |
Jews | +11.851 |
oppressed | +11.551 |
Almighty | +11.524 |
Neg logit contributions | |
Setup | -15.566 |
manually | -15.039 |
updated | -14.604 |
optionally | -14.481 |
formatted | -14.333 |
Token | bowl |
Token ID | 36859 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
hating | +13.879 |
dictators | +13.834 |
Jews | +13.416 |
oppressed | +13.033 |
Communism | +12.852 |
Neg logit contributions | |
Setup | -11.728 |
optionally | -11.451 |
manually | -11.326 |
updated | -10.936 |
annot | -10.830 |
Token | Advertising |
Token ID | 40113 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
dictators | +9.984 |
hating | +9.980 |
Jews | +9.663 |
Communism | +9.488 |
oppressed | +9.433 |
Neg logit contributions | |
Setup | -7.991 |
manually | -7.875 |
optionally | -7.755 |
updated | -7.427 |
annot | -7.377 |
Token | - |
Token ID | 12 |
Feature activation | +9.16e-01 |
Pos logit contributions | |
dictators | +0.086 |
hating | +0.085 |
oppressed | +0.081 |
Jews | +0.081 |
Communism | +0.078 |
Neg logit contributions | |
Setup | -0.103 |
manually | -0.100 |
optionally | -0.098 |
updated | -0.097 |
annot | -0.096 |
Token | Aust |
Token ID | 15160 |
Feature activation | +2.63e+00 |
Pos logit contributions | |
hating | +7.309 |
dictators | +7.203 |
Jews | +7.030 |
oppressed | +6.866 |
Communism | +6.806 |
Neg logit contributions | |
optionally | -6.234 |
manually | -6.193 |
Setup | -6.125 |
updated | -5.953 |
formatted | -5.919 |
Token | rail |
Token ID | 30224 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
dictators | +18.940 |
hating | +18.356 |
Jews | +18.097 |
Communism | +17.829 |
Christians | +17.802 |
Neg logit contributions | |
Setup | -15.418 |
manually | -14.673 |
optionally | -14.572 |
updated | -13.983 |
annot | -13.840 |
Token | ian |
Token ID | 666 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
hating | +14.474 |
dictators | +14.224 |
Jews | +13.809 |
Communism | +13.486 |
oppressed | +13.438 |
Neg logit contributions | |
Setup | -12.908 |
manually | -12.464 |
optionally | -12.389 |
formatted | -11.820 |
updated | -11.801 |
Token | Teen |
Token ID | 21432 |
Feature activation | +2.15e+00 |
Pos logit contributions | |
dictators | +25.756 |
Jews | +25.664 |
hating | +25.423 |
Communism | +24.882 |
Christians | +24.633 |
Neg logit contributions | |
Setup | -15.113 |
optionally | -14.919 |
manually | -14.798 |
formatted | -13.764 |
annot | -13.666 |
Token | Party |
Token ID | 3615 |
Feature activation | +6.00e-01 |
Pos logit contributions | |
hating | +15.457 |
dictators | +15.217 |
Jews | +14.989 |
Communism | +14.550 |
Christians | +14.451 |
Neg logit contributions | |
Setup | -14.323 |
manually | -13.880 |
optionally | -13.781 |
annot | -13.302 |
updated | -13.097 |
Token | - |
Token ID | 12 |
Feature activation | +9.51e-01 |
Pos logit contributions | |
hating | +4.118 |
dictators | +4.114 |
oppressed | +3.909 |
Jews | +3.890 |
Communism | +3.805 |
Neg logit contributions | |
Setup | -5.029 |
manually | -4.906 |
optionally | -4.840 |
updated | -4.740 |
annot | -4.708 |
Token | Pink |
Token ID | 41912 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
hating | +7.555 |
dictators | +7.452 |
Jews | +7.276 |
oppressed | +7.095 |
Communism | +7.049 |
Neg logit contributions | |
optionally | -6.465 |
manually | -6.427 |
Setup | -6.356 |
updated | -6.176 |
formatted | -6.144 |
Token | S |
Token ID | 311 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
hating | +15.963 |
dictators | +15.896 |
Jews | +15.595 |
Communism | +14.951 |
Christians | +14.915 |
Neg logit contributions | |
Setup | -13.951 |
manually | -13.692 |
optionally | -13.541 |
annot | -13.023 |
formatted | -12.877 |
Token | angs |
Token ID | 27725 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
hating | +16.565 |
dictators | +16.200 |
oppressed | +15.840 |
Jews | +15.550 |
martyr | +15.335 |
Neg logit contributions | |
Setup | -15.073 |
manually | -14.499 |
formatted | -14.343 |
optionally | -14.298 |
updated | -14.218 |
Token | of |
Token ID | 286 |
Feature activation | +3.99e+00 |
Pos logit contributions | |
hating | +17.510 |
oppressed | +17.439 |
dictators | +17.063 |
Jews | +16.320 |
martyr | +16.111 |
Neg logit contributions | |
Setup | -14.685 |
optionally | -12.972 |
manually | -12.901 |
formatted | -12.626 |
updated | -12.616 |
Token | dis |
Token ID | 595 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
hating | +30.998 |
oppressed | +30.585 |
dictators | +30.516 |
tyranny | +30.401 |
martyr | +29.934 |
Neg logit contributions | |
Setup | -17.484 |
optionally | -14.893 |
formatted | -14.016 |
manually | -13.976 |
updated | -13.656 |
Token | pri |
Token ID | 3448 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
hating | +17.837 |
oppressed | +17.099 |
dictators | +16.972 |
Jews | +16.809 |
tyranny | +16.692 |
Neg logit contributions | |
Setup | -14.237 |
manually | -13.683 |
optionally | -13.070 |
updated | -12.934 |
formatted | -12.772 |
Token | z |
Token ID | 89 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
hating | +11.765 |
dictators | +11.269 |
Jews | +11.137 |
oppressed | +11.118 |
dictatorship | +10.920 |
Neg logit contributions | |
Setup | -12.534 |
manually | -12.369 |
optionally | -12.141 |
updated | -11.813 |
formatted | -11.737 |
Token | 'd |
Token ID | 1549 |
Feature activation | +4.55e+00 |
Pos logit contributions | |
hating | +12.554 |
Jews | +12.299 |
dictators | +12.279 |
oppressed | +12.142 |
Almighty | +11.844 |
Neg logit contributions | |
Setup | -13.805 |
manually | -12.922 |
optionally | -12.809 |
annot | -12.777 |
formatted | -12.690 |
Token | love |
Token ID | 1842 |
Feature activation | +3.00e+00 |
Pos logit contributions | |
hating | +33.545 |
dictators | +33.510 |
oppressed | +33.219 |
tyranny | +33.186 |
hatred | +32.537 |
Neg logit contributions | |
Setup | -18.321 |
optionally | -15.310 |
formatted | -14.948 |
manually | -14.864 |
updated | -14.821 |
Token | , |
Token ID | 11 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
hating | +23.644 |
oppressed | +23.323 |
dictators | +22.620 |
Jews | +21.956 |
tyranny | +21.915 |
Neg logit contributions | |
Setup | -16.187 |
manually | -13.909 |
optionally | -13.890 |
annot | -13.164 |
formatted | -13.124 |
Token | the |
Token ID | 262 |
Feature activation | +3.83e+00 |
Pos logit contributions | |
hating | +28.879 |
oppressed | +28.215 |
dictators | +27.698 |
tyranny | +27.276 |
hatred | +26.745 |
Neg logit contributions | |
Setup | -17.156 |
manually | -14.822 |
optionally | -14.554 |
updated | -14.218 |
annot | -14.032 |
Token | law |
Token ID | 1099 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
hating | +30.550 |
oppressed | +30.338 |
dictators | +30.106 |
tyranny | +29.485 |
hatred | +29.170 |
Neg logit contributions | |
Setup | -16.274 |
optionally | -13.656 |
manually | -13.464 |
formatted | -13.029 |
updated | -12.742 |
Token | 's |
Token ID | 338 |
Feature activation | +2.72e+00 |
Pos logit contributions | |
hating | +14.589 |
oppressed | +14.167 |
dictators | +14.152 |
Jews | +13.386 |
tyranny | +13.309 |
Neg logit contributions | |
Setup | -14.077 |
manually | -13.150 |
optionally | -13.079 |
updated | -12.625 |
formatted | -12.536 |
Token | � |
Token ID | 251 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
dictators | +6.324 |
hating | +6.305 |
oppressed | +6.169 |
Jews | +6.062 |
Communism | +5.849 |
Neg logit contributions | |
Setup | -9.265 |
manually | -8.867 |
optionally | -8.697 |
updated | -8.637 |
formatted | -8.636 |
Token |
|
Token ID | 198 |
Feature activation | +7.07e-01 |
Pos logit contributions | |
Jews | +13.173 |
hating | +13.060 |
dictators | +13.028 |
Communism | +12.855 |
Christians | +12.845 |
Neg logit contributions | |
Setup | -14.991 |
optionally | -14.515 |
manually | -14.460 |
formatted | -14.039 |
updated | -13.908 |
Token |
|
Token ID | 198 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
hating | +4.141 |
dictators | +4.128 |
Jews | +4.026 |
oppressed | +3.941 |
Communism | +3.866 |
Neg logit contributions | |
Setup | -6.443 |
optionally | -6.249 |
manually | -6.232 |
updated | -6.119 |
formatted | -6.099 |
Token | And |
Token ID | 1870 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
Setup | +1.627 |
manually | +1.560 |
updated | +1.538 |
optionally | +1.535 |
annot | +1.499 |
Neg logit contributions | |
dictators | -1.610 |
hating | -1.602 |
oppressed | -1.549 |
Jews | -1.515 |
Communism | -1.479 |
Token | when |
Token ID | 618 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
dictators | +15.539 |
hating | +15.506 |
Jews | +14.941 |
oppressed | +14.878 |
Christians | +14.576 |
Neg logit contributions | |
Setup | -13.841 |
manually | -12.314 |
optionally | -12.161 |
updated | -12.133 |
formatted | -11.978 |
Token | Catholics |
Token ID | 21374 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
dictators | +14.887 |
hating | +14.700 |
oppressed | +14.376 |
Jews | +14.330 |
Christians | +14.029 |
Neg logit contributions | |
Setup | -13.547 |
optionally | -12.052 |
manually | -12.023 |
updated | -11.786 |
annot | -11.580 |
Token | claim |
Token ID | 1624 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
hating | +15.387 |
dictators | +15.298 |
oppressed | +15.187 |
Jews | +14.820 |
martyr | +14.483 |
Neg logit contributions | |
Setup | -10.878 |
optionally | -9.243 |
manually | -9.188 |
updated | -8.998 |
Completed | -8.968 |
Token | that |
Token ID | 326 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
hating | +9.054 |
dictators | +9.046 |
oppressed | +8.743 |
Jews | +8.614 |
martyr | +8.547 |
Neg logit contributions | |
Setup | -10.129 |
optionally | -9.282 |
manually | -9.262 |
updated | -9.235 |
annot | -9.059 |
Token | all |
Token ID | 477 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
hating | +15.714 |
dictators | +15.633 |
Jews | +15.177 |
oppressed | +15.168 |
martyr | +15.009 |
Neg logit contributions | |
Setup | -13.728 |
manually | -12.185 |
optionally | -12.102 |
updated | -12.039 |
annot | -11.839 |
Token | Christians |
Token ID | 9316 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
dictators | +16.828 |
hating | +16.557 |
Jews | +16.413 |
oppressed | +16.365 |
Christians | +16.137 |
Neg logit contributions | |
Setup | -12.823 |
optionally | -11.606 |
manually | -11.528 |
updated | -11.164 |
annot | -10.915 |
Token | , |
Token ID | 11 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
hating | +18.905 |
oppressed | +18.553 |
dictators | +18.393 |
Jews | +18.242 |
martyr | +17.756 |
Neg logit contributions | |
Setup | -14.139 |
manually | -12.093 |
optionally | -11.949 |
updated | -11.591 |
annot | -11.566 |
Token | now |
Token ID | 783 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
hating | +13.642 |
dictators | +13.606 |
oppressed | +13.285 |
Jews | +13.060 |
bullies | +12.723 |
Neg logit contributions | |
Setup | -11.135 |
optionally | -9.995 |
manually | -9.859 |
annot | -9.786 |
updated | -9.755 |
Token | turning |
Token ID | 6225 |
Feature activation | +1.78e+00 |
Pos logit contributions | |
hating | +15.437 |
dictators | +15.193 |
oppressed | +14.948 |
Jews | +14.673 |
murdering | +14.384 |
Neg logit contributions | |
Setup | -11.828 |
optionally | -10.560 |
manually | -10.453 |
updated | -10.341 |
Completed | -10.289 |
Token | 180 |
Token ID | 11546 |
Feature activation | +9.95e-01 |
Pos logit contributions | |
dictators | +13.179 |
hating | +13.045 |
oppressed | +12.759 |
Jews | +12.502 |
tyranny | +12.234 |
Neg logit contributions | |
Setup | -13.116 |
optionally | -11.732 |
formatted | -11.519 |
updated | -11.507 |
annot | -11.474 |
Token | degrees |
Token ID | 7370 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
dictators | +6.803 |
hating | +6.670 |
oppressed | +6.427 |
Jews | +6.310 |
martyr | +6.197 |
Neg logit contributions | |
Setup | -8.344 |
optionally | -7.763 |
manually | -7.704 |
updated | -7.694 |
annot | -7.580 |
Token | and |
Token ID | 290 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
dictators | +12.278 |
hating | +12.124 |
oppressed | +11.867 |
Jews | +11.536 |
martyr | +11.368 |
Neg logit contributions | |
Setup | -11.783 |
optionally | -10.651 |
manually | -10.503 |
updated | -10.378 |
annot | -10.322 |
Token | demanding |
Token ID | 11334 |
Feature activation | +9.26e-01 |
Pos logit contributions | |
hating | +15.504 |
dictators | +15.088 |
oppressed | +14.737 |
Jews | +14.555 |
murdering | +14.392 |
Neg logit contributions | |
Setup | -12.314 |
optionally | -10.963 |
manually | -10.903 |
updated | -10.868 |
annot | -10.686 |
Token | that |
Token ID | 326 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
dictators | +7.155 |
hating | +6.945 |
oppressed | +6.821 |
Jews | +6.712 |
dictatorship | +6.617 |
Neg logit contributions | |
Setup | -7.193 |
optionally | -6.569 |
manually | -6.542 |
annot | -6.464 |
updated | -6.408 |
Token | their |
Token ID | 511 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
dictators | +16.883 |
oppressed | +16.122 |
hating | +16.049 |
Jews | +15.933 |
politicians | +15.575 |
Neg logit contributions | |
Setup | -13.092 |
annot | -11.453 |
optionally | -11.426 |
manually | -11.381 |
formatted | -11.166 |
Token | puppet |
Token ID | 30095 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
dictators | +20.566 |
oppressed | +19.750 |
hating | +19.683 |
Jews | +19.348 |
politicians | +19.138 |
Neg logit contributions | |
Setup | -13.334 |
optionally | -11.544 |
annot | -11.294 |
manually | -11.288 |
formatted | -11.000 |
Token | regime |
Token ID | 7142 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
dictators | +26.260 |
dictatorship | +24.327 |
politicians | +24.212 |
hating | +24.090 |
oppressed | +24.059 |
Neg logit contributions | |
Setup | -15.757 |
manually | -14.347 |
optionally | -14.206 |
annot | -14.007 |
formatted | -13.845 |
Token | be |
Token ID | 307 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
dictators | +13.509 |
oppressed | +13.112 |
hating | +13.090 |
Jews | +12.858 |
dictatorship | +12.732 |
Neg logit contributions | |
Setup | -9.973 |
manually | -8.875 |
annot | -8.789 |
updated | -8.760 |
formatted | -8.756 |
Token | , |
Token ID | 11 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
hating | +8.605 |
dictators | +8.605 |
oppressed | +8.425 |
Jews | +8.117 |
dictatorship | +8.032 |
Neg logit contributions | |
Setup | -9.307 |
optionally | -8.344 |
updated | -8.259 |
manually | -8.221 |
annot | -8.122 |
Token | it |
Token ID | 340 |
Feature activation | +2.95e-02 |
Pos logit contributions | |
dictators | +15.370 |
hating | +15.206 |
oppressed | +14.774 |
Jews | +14.580 |
politicians | +14.310 |
Neg logit contributions | |
Setup | -13.088 |
manually | -11.655 |
optionally | -11.496 |
annot | -11.395 |
updated | -11.219 |
Token | accuses |
Token ID | 35062 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
dictators | +0.230 |
hating | +0.228 |
oppressed | +0.223 |
Jews | +0.217 |
dictatorship | +0.210 |
Neg logit contributions | |
Setup | -0.230 |
manually | -0.216 |
optionally | -0.213 |
updated | -0.212 |
annot | -0.208 |
Token | Russia |
Token ID | 3284 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
dictators | +11.303 |
hating | +11.002 |
oppressed | +10.989 |
Jews | +10.791 |
politicians | +10.356 |
Neg logit contributions | |
Setup | -13.348 |
manually | -12.174 |
optionally | -12.081 |
annot | -12.023 |
formatted | -11.897 |
Token | without |
Token ID | 1231 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
dictators | +10.939 |
hating | +10.933 |
oppressed | +10.635 |
Jews | +10.326 |
dictatorship | +10.158 |
Neg logit contributions | |
Setup | -11.760 |
updated | -10.751 |
manually | -10.726 |
optionally | -10.645 |
annot | -10.556 |
Token | proof |
Token ID | 6617 |
Feature activation | +5.93e-01 |
Pos logit contributions | |
hating | +2.180 |
dictators | +2.171 |
oppressed | +2.099 |
Jews | +2.059 |
dictatorship | +2.009 |
Neg logit contributions | |
Setup | -2.278 |
manually | -2.118 |
updated | -2.091 |
optionally | -2.090 |
annot | -2.042 |
Token | of |
Token ID | 286 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
hating | +4.474 |
dictators | +4.472 |
oppressed | +4.330 |
Jews | +4.240 |
dictatorship | +4.127 |
Neg logit contributions | |
Setup | -4.650 |
manually | -4.306 |
updated | -4.294 |
optionally | -4.267 |
annot | -4.195 |
Token | doing |
Token ID | 1804 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
hating | +13.780 |
dictators | +13.738 |
oppressed | +13.315 |
Jews | +13.082 |
dictatorship | +13.039 |
Neg logit contributions | |
Setup | -11.941 |
optionally | -10.565 |
annot | -10.460 |
updated | -10.460 |
manually | -10.412 |
Token | precisely |
Token ID | 10582 |
Feature activation | +9.22e-01 |
Pos logit contributions | |
dictators | +7.361 |
hating | +7.104 |
oppressed | +6.879 |
Jews | +6.798 |
politics | +6.641 |
Neg logit contributions | |
Setup | -11.595 |
optionally | -10.758 |
updated | -10.698 |
manually | -10.677 |
annot | -10.670 |
Token | what |
Token ID | 644 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
dictators | +5.746 |
hating | +5.722 |
oppressed | +5.484 |
Jews | +5.339 |
dictatorship | +5.200 |
Neg logit contributions | |
Setup | -8.391 |
manually | -7.887 |
optionally | -7.857 |
updated | -7.800 |
annot | -7.718 |
Token | Washington |
Token ID | 2669 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
dictators | +13.001 |
oppressed | +12.586 |
hating | +12.540 |
Jews | +12.206 |
politicians | +11.939 |
Neg logit contributions | |
Setup | -13.232 |
manually | -11.780 |
optionally | -11.707 |
annot | -11.691 |
updated | -11.591 |
Token | , |
Token ID | 11 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
Setup | +4.942 |
manually | +4.744 |
updated | +4.692 |
optionally | +4.677 |
annot | +4.591 |
Neg logit contributions | |
dictators | -3.395 |
hating | -3.368 |
oppressed | -3.240 |
Jews | -3.133 |
Communism | -3.045 |
Token | especially |
Token ID | 2592 |
Feature activation | +4.76e-01 |
Pos logit contributions | |
Setup | +1.289 |
manually | +1.219 |
optionally | +1.201 |
updated | +1.201 |
annot | +1.174 |
Neg logit contributions | |
dictators | -1.126 |
hating | -1.116 |
oppressed | -1.079 |
Jews | -1.053 |
dictatorship | -1.025 |
Token | charter |
Token ID | 17422 |
Feature activation | +7.60e-01 |
Pos logit contributions | |
dictators | +3.550 |
hating | +3.535 |
oppressed | +3.415 |
Jews | +3.367 |
religion | +3.317 |
Neg logit contributions | |
Setup | -3.847 |
manually | -3.550 |
optionally | -3.514 |
updated | -3.451 |
annot | -3.405 |
Token | school |
Token ID | 1524 |
Feature activation | +9.01e-01 |
Pos logit contributions | |
dictators | +4.837 |
hating | +4.766 |
oppressed | +4.533 |
Jews | +4.530 |
religion | +4.422 |
Neg logit contributions | |
Setup | -6.792 |
manually | -6.396 |
optionally | -6.357 |
updated | -6.275 |
annot | -6.177 |
Token | teachers |
Token ID | 7799 |
Feature activation | +9.05e-01 |
Pos logit contributions | |
dictators | +7.128 |
hating | +6.939 |
Jews | +6.730 |
oppressed | +6.712 |
politics | +6.568 |
Neg logit contributions | |
Setup | -6.683 |
manually | -6.192 |
optionally | -6.157 |
updated | -6.036 |
annot | -5.889 |
Token | � |
Token ID | 447 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
hating | +5.915 |
dictators | +5.800 |
oppressed | +5.628 |
Jews | +5.475 |
religion | +5.294 |
Neg logit contributions | |
Setup | -8.020 |
manually | -7.377 |
optionally | -7.372 |
updated | -7.291 |
annot | -7.115 |
Token | � |
Token ID | 247 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
dictators | +2.150 |
hating | +2.128 |
oppressed | +2.078 |
Jews | +2.018 |
Communism | +1.956 |
Neg logit contributions | |
Setup | -2.903 |
manually | -2.771 |
optionally | -2.734 |
updated | -2.732 |
formatted | -2.689 |
Token | relative |
Token ID | 3585 |
Feature activation | +5.37e-01 |
Pos logit contributions | |
dictators | +10.306 |
hating | +10.302 |
oppressed | +9.952 |
Jews | +9.804 |
religion | +9.531 |
Neg logit contributions | |
Setup | -9.394 |
manually | -8.660 |
optionally | -8.578 |
updated | -8.431 |
formatted | -8.281 |
Token | youth |
Token ID | 6205 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
dictators | +4.405 |
hating | +4.390 |
oppressed | +4.244 |
Jews | +4.145 |
religion | +4.102 |
Neg logit contributions | |
Setup | -3.910 |
manually | -3.645 |
optionally | -3.596 |
updated | -3.548 |
annot | -3.468 |
Token | and |
Token ID | 290 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
dictators | +10.790 |
hating | +10.662 |
oppressed | +10.433 |
religion | +10.260 |
Jews | +10.228 |
Neg logit contributions | |
Setup | -8.727 |
manually | -8.033 |
optionally | -7.922 |
updated | -7.745 |
annot | -7.562 |
Token | inexper |
Token ID | 31830 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
dictators | +12.802 |
hating | +12.730 |
oppressed | +12.524 |
religion | +12.459 |
Jews | +12.361 |
Neg logit contributions | |
Setup | -10.179 |
manually | -8.924 |
optionally | -8.784 |
updated | -8.459 |
formatted | -8.455 |
Token | and |
Token ID | 290 |
Feature activation | -2.32e+00 |
Pos logit contributions | |
Setup | +14.213 |
manually | +14.187 |
updated | +13.950 |
optionally | +13.769 |
update | +13.460 |
Neg logit contributions | |
dictators | -11.267 |
hating | -11.179 |
oppressed | -10.786 |
Jews | -10.447 |
Communism | -10.353 |
Token | utilities |
Token ID | 20081 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
manually | +21.122 |
Setup | +21.119 |
updated | +20.925 |
optionally | +20.492 |
update | +20.235 |
Neg logit contributions | |
dictators | -11.900 |
hating | -11.643 |
oppressed | -11.417 |
Jews | -10.783 |
tyranny | -10.629 |
Token | will |
Token ID | 481 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Setup | +10.836 |
manually | +10.645 |
updated | +10.500 |
optionally | +10.378 |
annot | +10.131 |
Neg logit contributions | |
dictators | -9.358 |
hating | -9.309 |
oppressed | -8.970 |
Jews | -8.713 |
Communism | -8.572 |
Token | help |
Token ID | 1037 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
Setup | +8.560 |
manually | +8.356 |
updated | +8.188 |
optionally | +8.186 |
annot | +7.950 |
Neg logit contributions | |
dictators | -8.981 |
hating | -8.969 |
oppressed | -8.640 |
Jews | -8.414 |
Communism | -8.287 |
Token | with |
Token ID | 351 |
Feature activation | -7.72e-01 |
Pos logit contributions | |
Setup | +0.794 |
manually | +0.746 |
updated | +0.737 |
optionally | +0.737 |
annot | +0.720 |
Neg logit contributions | |
dictators | -0.848 |
hating | -0.836 |
oppressed | -0.814 |
Jews | -0.794 |
dictatorship | -0.776 |
Token | that |
Token ID | 326 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
Setup | +6.425 |
manually | +6.165 |
updated | +6.094 |
optionally | +6.055 |
annot | +5.940 |
Neg logit contributions | |
dictators | -5.507 |
hating | -5.467 |
oppressed | -5.288 |
Jews | -5.134 |
Communism | -5.012 |
Token | . |
Token ID | 13 |
Feature activation | +9.16e-01 |
Pos logit contributions | |
dictators | +1.767 |
hating | +1.765 |
oppressed | +1.686 |
Jews | +1.616 |
tyranny | +1.615 |
Neg logit contributions | |
Setup | -2.736 |
manually | -2.549 |
optionally | -2.546 |
updated | -2.530 |
annot | -2.526 |
Token |
|
Token ID | 198 |
Feature activation | +7.44e-01 |
Pos logit contributions | |
hating | +5.377 |
dictators | +5.349 |
Jews | +5.270 |
Communism | +5.106 |
oppressed | +4.986 |
Neg logit contributions | |
Setup | -8.130 |
manually | -7.964 |
optionally | -7.906 |
annot | -7.767 |
formatted | -7.751 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
hating | +4.299 |
dictators | +4.258 |
Jews | +4.172 |
oppressed | +4.067 |
Communism | +3.993 |
Neg logit contributions | |
Setup | -6.833 |
optionally | -6.621 |
manually | -6.605 |
formatted | -6.478 |
updated | -6.470 |
Token | If |
Token ID | 1532 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
Setup | +7.727 |
manually | +7.196 |
updated | +7.138 |
optionally | +7.045 |
annot | +6.920 |
Neg logit contributions | |
dictators | -7.875 |
hating | -7.782 |
oppressed | -7.622 |
Jews | -7.314 |
dictatorship | -7.233 |
Token | we |
Token ID | 356 |
Feature activation | +7.93e-03 |
Pos logit contributions | |
dictators | +1.035 |
hating | +1.028 |
oppressed | +0.985 |
Jews | +0.959 |
dictatorship | +0.934 |
Neg logit contributions | |
Setup | -1.267 |
manually | -1.187 |
optionally | -1.177 |
updated | -1.173 |
annot | -1.162 |
Token | , |
Token ID | 11 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
Setup | +9.555 |
manually | +9.293 |
updated | +9.225 |
optionally | +9.136 |
annot | +9.016 |
Neg logit contributions | |
dictators | -6.772 |
hating | -6.740 |
oppressed | -6.457 |
Jews | -6.228 |
tyranny | -6.115 |
Token | villagers |
Token ID | 25263 |
Feature activation | -8.73e-02 |
Pos logit contributions | |
dictators | +3.830 |
hating | +3.742 |
oppressed | +3.629 |
Jews | +3.553 |
politicians | +3.466 |
Neg logit contributions | |
Setup | -4.743 |
manually | -4.377 |
optionally | -4.339 |
updated | -4.309 |
formatted | -4.243 |
Token | and |
Token ID | 290 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
Setup | +0.702 |
manually | +0.658 |
optionally | +0.650 |
updated | +0.647 |
annot | +0.634 |
Neg logit contributions | |
dictators | -0.662 |
hating | -0.659 |
oppressed | -0.640 |
Jews | -0.623 |
dictatorship | -0.606 |
Token | fisher |
Token ID | 17685 |
Feature activation | +3.23e-01 |
Pos logit contributions | |
dictators | +7.732 |
hating | +7.524 |
oppressed | +7.372 |
Jews | +7.203 |
politicians | +7.192 |
Neg logit contributions | |
Setup | -9.070 |
manually | -8.281 |
optionally | -8.167 |
updated | -8.141 |
formatted | -8.083 |
Token | s |
Token ID | 82 |
Feature activation | +9.21e-02 |
Pos logit contributions | |
dictators | +1.870 |
hating | +1.832 |
oppressed | +1.755 |
Jews | +1.733 |
martyr | +1.647 |
Neg logit contributions | |
Setup | -3.186 |
manually | -3.006 |
optionally | -2.988 |
updated | -2.968 |
formatted | -2.928 |
Token | have |
Token ID | 423 |
Feature activation | -7.77e-01 |
Pos logit contributions | |
dictators | +0.709 |
hating | +0.705 |
oppressed | +0.686 |
Jews | +0.669 |
martyr | +0.649 |
Neg logit contributions | |
Setup | -0.728 |
manually | -0.674 |
optionally | -0.670 |
updated | -0.664 |
annot | -0.651 |
Token | complained |
Token ID | 13832 |
Feature activation | +6.27e-02 |
Pos logit contributions | |
Setup | +5.991 |
manually | +5.741 |
updated | +5.671 |
optionally | +5.633 |
annot | +5.514 |
Neg logit contributions | |
dictators | -6.024 |
hating | -5.986 |
oppressed | -5.786 |
Jews | -5.636 |
Communism | -5.521 |
Token | of |
Token ID | 286 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
dictators | +0.476 |
hating | +0.472 |
oppressed | +0.460 |
Jews | +0.449 |
dictatorship | +0.435 |
Neg logit contributions | |
Setup | -0.504 |
manually | -0.470 |
optionally | -0.469 |
updated | -0.465 |
annot | -0.458 |
Token | the |
Token ID | 262 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
Setup | +0.879 |
manually | +0.826 |
optionally | +0.823 |
updated | +0.817 |
annot | +0.803 |
Neg logit contributions | |
dictators | -0.721 |
hating | -0.715 |
oppressed | -0.693 |
Jews | -0.672 |
tyranny | -0.657 |
Token | smell |
Token ID | 8508 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
dictators | +0.736 |
hating | +0.728 |
oppressed | +0.709 |
Jews | +0.690 |
tyranny | +0.676 |
Neg logit contributions | |
Setup | -0.878 |
manually | -0.822 |
optionally | -0.822 |
updated | -0.811 |
annot | -0.796 |
Token | of |
Token ID | 286 |
Feature activation | +6.83e-01 |
Pos logit contributions | |
dictators | +0.773 |
hating | +0.773 |
oppressed | +0.748 |
Jews | +0.731 |
tyranny | +0.711 |
Neg logit contributions | |
Setup | -0.818 |
manually | -0.766 |
optionally | -0.759 |
updated | -0.755 |
annot | -0.740 |
Token | . |
Token ID | 13 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
Setup | +6.040 |
manually | +5.787 |
updated | +5.738 |
optionally | +5.719 |
annot | +5.623 |
Neg logit contributions | |
dictators | -3.843 |
hating | -3.813 |
oppressed | -3.654 |
Jews | -3.531 |
Communism | -3.425 |
Token | If |
Token ID | 1532 |
Feature activation | -6.82e-01 |
Pos logit contributions | |
Setup | +14.578 |
manually | +13.909 |
updated | +13.840 |
optionally | +13.665 |
annot | +13.400 |
Neg logit contributions | |
dictators | -9.340 |
hating | -9.163 |
oppressed | -8.924 |
dictatorship | -8.366 |
tyranny | -8.345 |
Token | you |
Token ID | 345 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
Setup | +6.116 |
manually | +5.858 |
updated | +5.793 |
optionally | +5.772 |
annot | +5.670 |
Neg logit contributions | |
dictators | -4.490 |
hating | -4.458 |
oppressed | -4.293 |
Jews | -4.158 |
Communism | -4.043 |
Token | have |
Token ID | 423 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
manually | +15.189 |
Setup | +15.156 |
updated | +15.009 |
optionally | +14.801 |
annot | +14.544 |
Neg logit contributions | |
dictators | -10.976 |
hating | -10.927 |
oppressed | -10.435 |
Jews | -10.089 |
Communism | -10.000 |
Token | any |
Token ID | 597 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
Setup | +14.133 |
manually | +13.949 |
updated | +13.873 |
optionally | +13.653 |
annot | +13.428 |
Neg logit contributions | |
dictators | -9.698 |
hating | -9.636 |
oppressed | -9.182 |
Jews | -8.911 |
Communism | -8.794 |
Token | questions |
Token ID | 2683 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
Setup | +11.515 |
manually | +11.324 |
updated | +11.233 |
optionally | +11.075 |
annot | +10.899 |
Neg logit contributions | |
dictators | -8.964 |
hating | -8.937 |
oppressed | -8.553 |
Jews | -8.305 |
Communism | -8.217 |
Token | or |
Token ID | 393 |
Feature activation | -6.91e-01 |
Pos logit contributions | |
Setup | +12.998 |
manually | +12.797 |
updated | +12.577 |
optionally | +12.488 |
annot | +12.234 |
Neg logit contributions | |
dictators | -9.754 |
hating | -9.657 |
oppressed | -9.293 |
Jews | -9.022 |
tyranny | -8.856 |
Token | comments |
Token ID | 3651 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
Setup | +5.414 |
manually | +5.183 |
updated | +5.119 |
optionally | +5.092 |
annot | +4.985 |
Neg logit contributions | |
dictators | -5.278 |
hating | -5.243 |
oppressed | -5.079 |
Jews | -4.942 |
Communism | -4.838 |
Token | regarding |
Token ID | 5115 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
Setup | +14.891 |
manually | +14.811 |
updated | +14.523 |
optionally | +14.425 |
annot | +14.161 |
Neg logit contributions | |
dictators | -11.434 |
hating | -11.330 |
oppressed | -10.911 |
Jews | -10.619 |
tyranny | -10.427 |
Token | your |
Token ID | 534 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
Setup | +13.211 |
manually | +12.907 |
updated | +12.774 |
optionally | +12.587 |
annot | +12.394 |
Neg logit contributions | |
dictators | -8.802 |
hating | -8.647 |
oppressed | -8.384 |
Jews | -8.075 |
Communism | -7.896 |
Token | vote |
Token ID | 3015 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
Setup | +16.666 |
manually | +16.449 |
updated | +16.317 |
optionally | +15.978 |
update | +15.843 |
Neg logit contributions | |
dictators | -9.628 |
hating | -9.541 |
oppressed | -9.189 |
Jews | -8.793 |
Communism | -8.645 |
Token | it |
Token ID | 340 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
Setup | +11.993 |
manually | +11.897 |
updated | +11.698 |
optionally | +11.343 |
annot | +11.293 |
Neg logit contributions | |
dictators | -11.492 |
hating | -11.215 |
oppressed | -10.943 |
dictatorship | -10.413 |
tyranny | -10.412 |
Token | to |
Token ID | 284 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
Setup | +8.140 |
manually | +7.985 |
updated | +7.802 |
optionally | +7.546 |
update | +7.444 |
Neg logit contributions | |
dictators | -12.942 |
hating | -12.701 |
oppressed | -12.488 |
tyranny | -11.977 |
dictatorship | -11.977 |
Token | gr |
Token ID | 1036 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
Setup | +8.977 |
manually | +8.883 |
updated | +8.746 |
optionally | +8.653 |
annot | +8.560 |
Neg logit contributions | |
dictators | -8.154 |
hating | -8.097 |
oppressed | -7.812 |
Jews | -7.563 |
Communism | -7.465 |
Token | ays |
Token ID | 592 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
Setup | +1.956 |
manually | +1.872 |
updated | +1.853 |
optionally | +1.842 |
annot | +1.810 |
Neg logit contributions | |
dictators | -1.636 |
hating | -1.627 |
oppressed | -1.568 |
Jews | -1.510 |
dictatorship | -1.489 |
Token | cale |
Token ID | 38765 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
Setup | +2.225 |
manually | +2.114 |
updated | +2.083 |
optionally | +2.076 |
annot | +2.028 |
Neg logit contributions | |
dictators | -2.467 |
hating | -2.454 |
oppressed | -2.381 |
Jews | -2.324 |
Communism | -2.276 |
Token | image |
Token ID | 2939 |
Feature activation | -2.38e+00 |
Pos logit contributions | |
Setup | +7.280 |
manually | +7.163 |
updated | +7.043 |
optionally | +6.776 |
annot | +6.673 |
Neg logit contributions | |
dictators | -15.253 |
hating | -15.008 |
oppressed | -14.609 |
Jews | -14.311 |
dictatorship | -14.191 |
Token | = |
Token ID | 796 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
Setup | +12.184 |
manually | +10.786 |
updated | +10.756 |
update | +10.087 |
Completed | +10.076 |
Neg logit contributions | |
dictators | -23.023 |
hating | -22.343 |
oppressed | -22.075 |
dictatorship | -21.389 |
tyranny | -21.279 |
Token | c |
Token ID | 269 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
manually | +13.259 |
updated | +13.115 |
Setup | +13.096 |
annot | +12.770 |
optionally | +12.651 |
Neg logit contributions | |
dictators | -18.724 |
hating | -18.519 |
oppressed | -17.708 |
dictatorship | -17.296 |
Jews | -17.277 |
Token | v |
Token ID | 85 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
Setup | +11.692 |
updated | +10.824 |
manually | +10.692 |
update | +10.279 |
annot | +10.202 |
Neg logit contributions | |
dictators | -17.573 |
hating | -17.131 |
oppressed | -16.656 |
tyranny | -16.127 |
bullies | -16.090 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
Setup | +6.822 |
updated | +6.096 |
manually | +6.066 |
update | +5.606 |
annot | +5.588 |
Neg logit contributions | |
dictators | -16.864 |
hating | -16.483 |
oppressed | -16.258 |
dictatorship | -15.775 |
tyranny | -15.692 |
Token | . |
Token ID | 13 |
Feature activation | -2.88e+00 |
Pos logit contributions | |
Setup | +9.815 |
manually | +9.411 |
updated | +9.345 |
annot | +9.047 |
update | +9.044 |
Neg logit contributions | |
dictators | -7.483 |
hating | -7.286 |
oppressed | -7.094 |
dictatorship | -6.716 |
tyranny | -6.699 |
Token | time |
Token ID | 640 |
Feature activation | +6.37e-01 |
Pos logit contributions | |
Setup | +6.446 |
manually | +6.305 |
updated | +6.299 |
optionally | +6.033 |
update | +6.029 |
Neg logit contributions | |
dictators | -9.508 |
hating | -9.438 |
oppressed | -9.180 |
Jews | -8.823 |
martyr | -8.778 |
Token | . |
Token ID | 13 |
Feature activation | +4.23e-01 |
Pos logit contributions | |
dictators | +3.437 |
hating | +3.410 |
oppressed | +3.232 |
Jews | +3.157 |
Communism | +3.028 |
Neg logit contributions | |
Setup | -6.277 |
manually | -5.961 |
updated | -5.921 |
optionally | -5.892 |
annot | -5.799 |
Token |
|
Token ID | 198 |
Feature activation | +6.21e-01 |
Pos logit contributions | |
hating | +2.608 |
dictators | +2.604 |
Jews | +2.527 |
oppressed | +2.477 |
Communism | +2.445 |
Neg logit contributions | |
Setup | -3.829 |
manually | -3.705 |
optionally | -3.657 |
updated | -3.627 |
formatted | -3.587 |
Token |
|
Token ID | 198 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
hating | +3.670 |
dictators | +3.661 |
Jews | +3.553 |
oppressed | +3.497 |
Communism | +3.414 |
Neg logit contributions | |
Setup | -5.679 |
optionally | -5.481 |
manually | -5.468 |
updated | -5.366 |
formatted | -5.357 |
Token | If |
Token ID | 1532 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
Setup | +13.263 |
manually | +11.984 |
updated | +11.951 |
optionally | +11.669 |
annot | +11.656 |
Neg logit contributions | |
dictators | -12.520 |
hating | -12.213 |
oppressed | -12.141 |
dictatorship | -11.492 |
martyr | -11.335 |
Token | Christopher |
Token ID | 12803 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
Setup | +1.381 |
manually | +1.311 |
optionally | +1.294 |
updated | +1.289 |
annot | +1.269 |
Neg logit contributions | |
dictators | -1.098 |
hating | -1.090 |
oppressed | -1.050 |
Jews | -1.027 |
Communism | -0.995 |
Token | is |
Token ID | 318 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
Setup | +2.388 |
manually | +2.286 |
updated | +2.258 |
optionally | +2.253 |
annot | +2.211 |
Neg logit contributions | |
dictators | -1.677 |
hating | -1.664 |
oppressed | -1.600 |
Jews | -1.549 |
Communism | -1.506 |
Token | correct |
Token ID | 3376 |
Feature activation | +8.21e-02 |
Pos logit contributions | |
Setup | +2.479 |
manually | +2.354 |
optionally | +2.331 |
updated | +2.320 |
annot | +2.288 |
Neg logit contributions | |
hating | -1.628 |
dictators | -1.626 |
oppressed | -1.561 |
Jews | -1.511 |
Communism | -1.465 |
Token | , |
Token ID | 11 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
dictators | +0.516 |
hating | +0.509 |
oppressed | +0.490 |
Jews | +0.477 |
Communism | +0.464 |
Neg logit contributions | |
Setup | -0.766 |
manually | -0.727 |
optionally | -0.719 |
updated | -0.717 |
annot | -0.703 |
Token | there |
Token ID | 612 |
Feature activation | -8.52e-01 |
Pos logit contributions | |
dictators | +2.690 |
hating | +2.689 |
oppressed | +2.569 |
Jews | +2.539 |
politicians | +2.453 |
Neg logit contributions | |
Setup | -3.098 |
manually | -2.903 |
optionally | -2.861 |
updated | -2.845 |
annot | -2.801 |
Token | could |
Token ID | 714 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
Setup | +6.426 |
manually | +6.136 |
updated | +6.056 |
optionally | +6.026 |
annot | +5.892 |
Neg logit contributions | |
dictators | -6.739 |
hating | -6.704 |
oppressed | -6.496 |
Jews | -6.324 |
Communism | -6.196 |
Token | eliminate |
Token ID | 11005 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
manually | +19.766 |
Setup | +19.519 |
updated | +19.176 |
optionally | +19.170 |
update | +18.861 |
Neg logit contributions | |
hating | -12.585 |
dictators | -12.453 |
oppressed | -11.727 |
Communism | -11.213 |
dictatorship | -11.180 |
Token | further |
Token ID | 2252 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
Setup | +9.932 |
manually | +9.678 |
updated | +9.506 |
optionally | +9.434 |
annot | +9.272 |
Neg logit contributions | |
dictators | -8.577 |
hating | -8.505 |
oppressed | -8.205 |
Jews | -7.945 |
Communism | -7.810 |
Token | perceived |
Token ID | 11067 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
Setup | +12.389 |
manually | +12.228 |
updated | +11.983 |
optionally | +11.822 |
annot | +11.715 |
Neg logit contributions | |
dictators | -10.405 |
hating | -10.343 |
oppressed | -9.918 |
Jews | -9.591 |
Communism | -9.494 |
Token | motion |
Token ID | 6268 |
Feature activation | -4.36e-01 |
Pos logit contributions | |
Setup | +8.979 |
manually | +8.726 |
updated | +8.581 |
optionally | +8.490 |
annot | +8.339 |
Neg logit contributions | |
dictators | -8.755 |
hating | -8.685 |
oppressed | -8.407 |
Jews | -8.156 |
Communism | -8.030 |
Token | blur |
Token ID | 23671 |
Feature activation | -3.93e-01 |
Pos logit contributions | |
Setup | +2.853 |
manually | +2.660 |
updated | +2.626 |
optionally | +2.618 |
annot | +2.549 |
Neg logit contributions | |
dictators | -3.960 |
hating | -3.946 |
oppressed | -3.832 |
Jews | -3.743 |
tyranny | -3.689 |
Token | and |
Token ID | 290 |
Feature activation | -9.98e-01 |
Pos logit contributions | |
Setup | +3.670 |
manually | +3.490 |
updated | +3.468 |
optionally | +3.451 |
annot | +3.397 |
Neg logit contributions | |
dictators | -2.474 |
hating | -2.451 |
oppressed | -2.356 |
Jews | -2.281 |
tyranny | -2.218 |
Token | works |
Token ID | 2499 |
Feature activation | -2.95e+00 |
Pos logit contributions | |
Setup | +8.009 |
manually | +7.682 |
updated | +7.580 |
optionally | +7.549 |
annot | +7.388 |
Neg logit contributions | |
dictators | -7.431 |
hating | -7.377 |
oppressed | -7.136 |
Jews | -6.934 |
Communism | -6.782 |
Token | well |
Token ID | 880 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
manually | +23.745 |
optionally | +23.364 |
Setup | +23.231 |
updated | +23.199 |
annot | +22.505 |
Neg logit contributions | |
dictators | -16.335 |
hating | -16.186 |
oppressed | -15.592 |
Jews | -14.941 |
Communism | -14.877 |
Token | , |
Token ID | 11 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
Setup | +15.650 |
manually | +15.595 |
optionally | +15.296 |
updated | +15.259 |
annot | +14.776 |
Neg logit contributions | |
dictators | -14.605 |
hating | -14.433 |
oppressed | -13.912 |
Jews | -13.597 |
tyranny | -13.355 |
Token | along |
Token ID | 1863 |
Feature activation | -5.16e-01 |
Pos logit contributions | |
Setup | +11.531 |
manually | +11.271 |
updated | +11.126 |
optionally | +11.120 |
annot | +10.841 |
Neg logit contributions | |
dictators | -8.201 |
hating | -8.075 |
oppressed | -7.819 |
Jews | -7.515 |
dictatorship | -7.358 |
Token | with |
Token ID | 351 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
Setup | +3.763 |
manually | +3.574 |
updated | +3.524 |
optionally | +3.507 |
annot | +3.428 |
Neg logit contributions | |
dictators | -4.250 |
hating | -4.225 |
oppressed | -4.100 |
Jews | -3.998 |
Communism | -3.914 |
Token | , |
Token ID | 11 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
Setup | +0.326 |
manually | +0.308 |
optionally | +0.306 |
updated | +0.303 |
annot | +0.298 |
Neg logit contributions | |
hating | -0.325 |
dictators | -0.323 |
oppressed | -0.311 |
Jews | -0.305 |
Communism | -0.297 |
Token | who |
Token ID | 508 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
Setup | +16.966 |
manually | +16.621 |
updated | +16.588 |
optionally | +16.358 |
annot | +16.170 |
Neg logit contributions | |
dictators | -6.982 |
hating | -6.811 |
oppressed | -6.539 |
Jews | -6.108 |
dictatorship | -5.990 |
Token | provided |
Token ID | 2810 |
Feature activation | -3.81e+00 |
Pos logit contributions | |
Setup | +17.596 |
manually | +17.482 |
updated | +17.453 |
optionally | +17.028 |
annot | +16.870 |
Neg logit contributions | |
dictators | -11.535 |
hating | -11.419 |
oppressed | -10.857 |
Jews | -10.468 |
tyranny | -10.352 |
Token | a |
Token ID | 257 |
Feature activation | -3.51e+00 |
Pos logit contributions | |
updated | +32.647 |
manually | +32.066 |
Setup | +32.046 |
detailed | +31.534 |
update | +31.264 |
Neg logit contributions | |
dictators | -15.301 |
hating | -15.027 |
oppressed | -14.391 |
dictatorship | -13.518 |
tyranny | -13.384 |
Token | very |
Token ID | 845 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
manually | +30.385 |
updated | +30.351 |
Setup | +30.226 |
detailed | +29.752 |
update | +29.447 |
Neg logit contributions | |
dictators | -14.915 |
hating | -14.298 |
oppressed | -13.950 |
Jews | -12.986 |
bullies | -12.937 |
Token | detailed |
Token ID | 6496 |
Feature activation | -3.78e+00 |
Pos logit contributions | |
updated | +27.025 |
manually | +26.608 |
detailed | +26.564 |
Setup | +26.324 |
annot | +25.932 |
Neg logit contributions | |
dictators | -15.474 |
hating | -15.187 |
oppressed | -14.230 |
tyranny | -13.837 |
Jews | -13.800 |
Token | way |
Token ID | 835 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
updated | +31.245 |
Setup | +30.943 |
update | +30.923 |
manually | +30.606 |
detailed | +30.434 |
Neg logit contributions | |
dictators | -16.007 |
hating | -15.034 |
oppressed | -14.649 |
bullies | -13.851 |
Jews | -13.686 |
Token | to |
Token ID | 284 |
Feature activation | -3.10e+00 |
Pos logit contributions | |
Setup | +20.683 |
manually | +20.545 |
updated | +20.010 |
optionally | +19.533 |
update | +19.457 |
Neg logit contributions | |
dictators | -15.678 |
hating | -15.282 |
oppressed | -15.015 |
tyranny | -14.327 |
Jews | -14.226 |
Token | diagnose |
Token ID | 37489 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
manually | +24.695 |
Setup | +23.594 |
update | +23.527 |
updated | +23.493 |
optionally | +23.334 |
Neg logit contributions | |
dictators | -17.348 |
hating | -17.136 |
oppressed | -16.746 |
Jews | -15.726 |
tyranny | -15.688 |
Token | what |
Token ID | 644 |
Feature activation | -7.35e-01 |
Pos logit contributions | |
Setup | +10.447 |
manually | +10.186 |
updated | +10.008 |
optionally | +9.886 |
annot | +9.695 |
Neg logit contributions | |
dictators | -8.592 |
hating | -8.510 |
oppressed | -8.233 |
Jews | -7.948 |
dictatorship | -7.822 |
Token | is |
Token ID | 318 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
Setup | +6.326 |
manually | +6.068 |
updated | +5.995 |
optionally | +5.969 |
annot | +5.855 |
Neg logit contributions | |
dictators | -5.069 |
hating | -5.032 |
oppressed | -4.854 |
Jews | -4.706 |
Communism | -4.592 |
Token | Ranger |
Token ID | 21888 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
Setup | +15.305 |
manually | +14.994 |
updated | +14.847 |
optionally | +14.573 |
annot | +14.519 |
Neg logit contributions | |
dictators | -10.760 |
hating | -10.654 |
oppressed | -10.148 |
Jews | -9.803 |
dictatorship | -9.632 |
Token | 6 |
Token ID | 718 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
Setup | +10.646 |
manually | +10.260 |
updated | +10.143 |
optionally | +10.040 |
annot | +9.882 |
Neg logit contributions | |
dictators | -9.492 |
hating | -9.431 |
oppressed | -9.107 |
Jews | -8.834 |
tyranny | -8.647 |
Token | indicated |
Token ID | 8203 |
Feature activation | -2.36e+00 |
Pos logit contributions | |
Setup | +12.447 |
manually | +12.072 |
updated | +11.925 |
optionally | +11.797 |
annot | +11.616 |
Neg logit contributions | |
dictators | -9.615 |
hating | -9.580 |
oppressed | -9.215 |
Jews | -8.918 |
tyranny | -8.684 |
Token | that |
Token ID | 326 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
Setup | +19.759 |
manually | +19.718 |
updated | +19.330 |
optionally | +19.020 |
annot | +18.799 |
Neg logit contributions | |
dictators | -13.930 |
hating | -13.715 |
oppressed | -13.203 |
Jews | -12.637 |
dictatorship | -12.294 |
Token | it |
Token ID | 340 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
Setup | +10.253 |
manually | +9.911 |
updated | +9.777 |
optionally | +9.719 |
annot | +9.546 |
Neg logit contributions | |
dictators | -7.995 |
hating | -7.919 |
oppressed | -7.636 |
Jews | -7.388 |
dictatorship | -7.212 |
Token | would |
Token ID | 561 |
Feature activation | -2.94e+00 |
Pos logit contributions | |
Setup | +13.769 |
manually | +13.719 |
updated | +13.549 |
optionally | +13.320 |
annot | +13.020 |
Neg logit contributions | |
dictators | -13.684 |
hating | -13.474 |
oppressed | -12.900 |
Jews | -12.549 |
Communism | -12.460 |
Token | miss |
Token ID | 2051 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
manually | +23.531 |
Setup | +22.928 |
optionally | +22.823 |
updated | +22.598 |
update | +22.384 |
Neg logit contributions | |
dictators | -17.120 |
hating | -16.974 |
oppressed | -16.068 |
Jews | -15.362 |
Communism | -15.239 |
Token | the |
Token ID | 262 |
Feature activation | -1.76e+00 |
Pos logit contributions | |
Setup | +15.309 |
manually | +14.930 |
updated | +14.699 |
optionally | +14.581 |
annot | +14.433 |
Neg logit contributions | |
dictators | -10.340 |
hating | -10.122 |
oppressed | -9.749 |
Jews | -9.376 |
dictatorship | -9.217 |
Token | Moon |
Token ID | 6869 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
Setup | +15.831 |
manually | +15.634 |
updated | +15.502 |
optionally | +15.218 |
annot | +15.168 |
Neg logit contributions | |
dictators | -10.245 |
hating | -10.094 |
oppressed | -9.595 |
Jews | -9.249 |
dictatorship | -9.030 |
Token | by |
Token ID | 416 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
hating | +0.873 |
dictators | +0.871 |
oppressed | +0.837 |
Jews | +0.818 |
dictatorship | +0.803 |
Neg logit contributions | |
Setup | -0.928 |
updated | -0.863 |
optionally | -0.853 |
manually | -0.853 |
formatted | -0.837 |
Token | about |
Token ID | 546 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
manually | +16.218 |
Setup | +16.203 |
updated | +15.977 |
optionally | +15.916 |
annot | +15.505 |
Neg logit contributions | |
dictators | -13.728 |
hating | -13.487 |
oppressed | -13.047 |
Jews | -12.527 |
Communism | -12.401 |
Token | into |
Token ID | 656 |
Feature activation | -2.54e+00 |
Pos logit contributions | |
manually | +19.969 |
Setup | +19.930 |
optionally | +19.445 |
updated | +19.442 |
annot | +19.105 |
Neg logit contributions | |
dictators | -15.079 |
hating | -14.823 |
oppressed | -14.438 |
Jews | -13.941 |
tyranny | -13.716 |
Token | the |
Token ID | 262 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
Setup | +21.165 |
manually | +21.003 |
updated | +20.651 |
optionally | +20.548 |
annot | +20.228 |
Neg logit contributions | |
dictators | -14.835 |
hating | -14.691 |
oppressed | -14.008 |
Jews | -13.665 |
dictatorship | -13.481 |
Token | page |
Token ID | 2443 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
Setup | +23.744 |
manually | +23.625 |
updated | +23.519 |
annot | +23.135 |
optionally | +23.097 |
Neg logit contributions | |
dictators | -14.164 |
hating | -13.966 |
oppressed | -13.129 |
Jews | -12.963 |
dictatorship | -12.489 |
Token | . |
Token ID | 13 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
manually | +24.787 |
Setup | +24.640 |
updated | +24.023 |
optionally | +23.898 |
update | +23.807 |
Neg logit contributions | |
dictators | -16.196 |
hating | -15.929 |
oppressed | -15.617 |
Jews | -15.201 |
Communism | -14.612 |
Token | Alternatively |
Token ID | 25929 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
Setup | +19.612 |
manually | +19.003 |
updated | +18.905 |
optionally | +18.713 |
update | +18.534 |
Neg logit contributions | |
dictators | -12.898 |
hating | -12.682 |
oppressed | -12.252 |
tyranny | -11.514 |
dictatorship | -11.493 |
Token | you |
Token ID | 345 |
Feature activation | -3.12e+00 |
Pos logit contributions | |
Setup | +13.428 |
manually | +13.209 |
optionally | +12.987 |
updated | +12.927 |
annot | +12.692 |
Neg logit contributions | |
dictators | -9.910 |
hating | -9.796 |
oppressed | -9.494 |
Jews | -9.117 |
dictatorship | -8.994 |
Token | can |
Token ID | 460 |
Feature activation | -3.92e+00 |
Pos logit contributions | |
manually | +21.250 |
optionally | +20.843 |
updated | +20.288 |
annot | +20.279 |
Setup | +20.198 |
Neg logit contributions | |
hating | -20.977 |
dictators | -20.606 |
oppressed | -19.799 |
Communism | -19.227 |
dictatorship | -19.158 |
Token | include |
Token ID | 2291 |
Feature activation | -3.98e+00 |
Pos logit contributions | |
manually | +31.313 |
optionally | +30.468 |
annot | +29.922 |
update | +29.585 |
Setup | +29.160 |
Neg logit contributions | |
hating | -19.089 |
dictators | -18.947 |
oppressed | -17.894 |
Communism | -17.310 |
Jews | -17.249 |
Token | this |
Token ID | 428 |
Feature activation | -4.16e+00 |
Pos logit contributions | |
manually | +33.293 |
optionally | +32.628 |
updated | +32.606 |
Setup | +32.173 |
annot | +32.086 |
Neg logit contributions | |
dictators | -15.611 |
hating | -15.398 |
oppressed | -14.529 |
Jews | -13.907 |
Communism | -13.760 |
Token | CSS |
Token ID | 17391 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
manually | +34.245 |
updated | +33.472 |
optionally | +33.218 |
annot | +33.149 |
Setup | +32.950 |
Neg logit contributions | |
dictators | -16.161 |
hating | -15.851 |
Jews | -14.846 |
oppressed | -14.810 |
Communism | -14.241 |
Token | hiding |
Token ID | 11816 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
manually | +35.094 |
Setup | +33.810 |
optionally | +33.710 |
update | +33.610 |
updated | +33.580 |
Neg logit contributions | |
dictators | -16.883 |
hating | -16.810 |
oppressed | -16.218 |
Jews | -15.838 |
Communism | -15.390 |
Token | Super |
Token ID | 12442 |
Feature activation | -9.74e-01 |
Pos logit contributions | |
Setup | +21.348 |
updated | +18.799 |
Completed | +18.792 |
manually | +18.790 |
annot | +18.376 |
Neg logit contributions | |
dictators | -18.805 |
hating | -18.094 |
oppressed | -17.897 |
dictatorship | -17.186 |
bullies | -16.746 |
Token | conduct |
Token ID | 36495 |
Feature activation | -8.11e-01 |
Pos logit contributions | |
Setup | +6.478 |
manually | +6.129 |
updated | +6.038 |
optionally | +6.004 |
annot | +5.847 |
Neg logit contributions | |
dictators | -8.583 |
hating | -8.533 |
oppressed | -8.310 |
Jews | -8.102 |
Communism | -7.947 |
Token | ing |
Token ID | 278 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
Setup | +5.212 |
manually | +4.922 |
updated | +4.844 |
optionally | +4.817 |
annot | +4.690 |
Neg logit contributions | |
dictators | -7.356 |
hating | -7.315 |
oppressed | -7.122 |
Jews | -6.954 |
Communism | -6.825 |
Token | magnets |
Token ID | 37446 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Setup | +10.022 |
manually | +9.704 |
updated | +9.575 |
optionally | +9.532 |
annot | +9.325 |
Neg logit contributions | |
dictators | -8.065 |
hating | -8.040 |
oppressed | -7.749 |
Jews | -7.472 |
dictatorship | -7.311 |
Token | are |
Token ID | 389 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
Setup | +14.268 |
manually | +14.188 |
updated | +13.968 |
optionally | +13.868 |
annot | +13.595 |
Neg logit contributions | |
dictators | -11.124 |
hating | -11.078 |
oppressed | -10.580 |
Jews | -10.256 |
Communism | -10.186 |
Token | currently |
Token ID | 3058 |
Feature activation | -2.94e+00 |
Pos logit contributions | |
manually | +21.798 |
updated | +21.507 |
Setup | +21.469 |
optionally | +21.300 |
annot | +20.682 |
Neg logit contributions | |
hating | -12.568 |
dictators | -12.322 |
oppressed | -11.763 |
Jews | -11.267 |
Communism | -11.213 |
Token | used |
Token ID | 973 |
Feature activation | -2.16e+00 |
Pos logit contributions | |
manually | +26.308 |
updated | +26.228 |
Setup | +25.779 |
optionally | +25.688 |
annot | +25.283 |
Neg logit contributions | |
hating | -12.777 |
dictators | -12.756 |
oppressed | -11.742 |
Jews | -11.628 |
tyranny | -11.553 |
Token | in |
Token ID | 287 |
Feature activation | -6.19e-01 |
Pos logit contributions | |
manually | +15.686 |
Setup | +15.671 |
updated | +15.312 |
optionally | +15.272 |
annot | +14.733 |
Neg logit contributions | |
dictators | -15.441 |
hating | -15.404 |
oppressed | -14.884 |
Jews | -14.432 |
Communism | -14.207 |
Token | MRI |
Token ID | 30278 |
Feature activation | -8.02e-01 |
Pos logit contributions | |
Setup | +5.160 |
manually | +4.900 |
updated | +4.836 |
optionally | +4.832 |
annot | +4.733 |
Neg logit contributions | |
dictators | -4.502 |
hating | -4.463 |
oppressed | -4.320 |
Jews | -4.200 |
Communism | -4.100 |
Token | machines |
Token ID | 8217 |
Feature activation | -9.94e-01 |
Pos logit contributions | |
Setup | +6.799 |
manually | +6.510 |
updated | +6.433 |
optionally | +6.407 |
annot | +6.281 |
Neg logit contributions | |
dictators | -5.644 |
hating | -5.604 |
oppressed | -5.411 |
Jews | -5.251 |
Communism | -5.123 |
Token | and |
Token ID | 290 |
Feature activation | -9.47e-01 |
Pos logit contributions | |
Setup | +9.020 |
manually | +8.717 |
updated | +8.620 |
optionally | +8.564 |
annot | +8.418 |
Neg logit contributions | |
dictators | -6.304 |
hating | -6.256 |
oppressed | -6.008 |
Jews | -5.814 |
Communism | -5.677 |
Token | 13 |
Token ID | 1485 |
Feature activation | -8.22e-01 |
Pos logit contributions | |
Setup | +6.180 |
manually | +5.684 |
updated | +5.666 |
optionally | +5.535 |
annot | +5.420 |
Neg logit contributions | |
dictators | -10.007 |
hating | -9.878 |
oppressed | -9.672 |
dictatorship | -9.340 |
Jews | -9.328 |
Token | 45 |
Token ID | 2231 |
Feature activation | +3.71e-01 |
Pos logit contributions | |
Setup | +5.033 |
manually | +4.728 |
updated | +4.662 |
optionally | +4.613 |
annot | +4.489 |
Neg logit contributions | |
dictators | -7.703 |
hating | -7.631 |
oppressed | -7.451 |
Jews | -7.247 |
dictatorship | -7.163 |
Token | , |
Token ID | 11 |
Feature activation | -8.48e-02 |
Pos logit contributions | |
dictators | +2.206 |
hating | +2.203 |
oppressed | +2.106 |
Jews | +2.050 |
Communism | +1.978 |
Neg logit contributions | |
Setup | -3.521 |
manually | -3.386 |
updated | -3.342 |
optionally | -3.341 |
annot | -3.283 |
Token | India |
Token ID | 3794 |
Feature activation | +7.39e-01 |
Pos logit contributions | |
Setup | +0.965 |
manually | +0.933 |
optionally | +0.924 |
updated | +0.923 |
annot | +0.909 |
Neg logit contributions | |
dictators | -0.350 |
hating | -0.346 |
oppressed | -0.325 |
Jews | -0.313 |
Communism | -0.299 |
Token |
|
Token ID | 198 |
Feature activation | -5.52e-03 |
Pos logit contributions | |
hating | +4.388 |
dictators | +4.352 |
Jews | +4.234 |
oppressed | +4.165 |
Communism | +4.086 |
Neg logit contributions | |
Setup | -6.736 |
manually | -6.464 |
optionally | -6.463 |
updated | -6.333 |
annot | -6.288 |
Token |
|
Token ID | 198 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
Setup | +0.049 |
manually | +0.047 |
optionally | +0.046 |
updated | +0.046 |
annot | +0.045 |
Neg logit contributions | |
dictators | -0.037 |
hating | -0.037 |
oppressed | -0.035 |
Jews | -0.034 |
Communism | -0.034 |
Token | Read |
Token ID | 5569 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
Setup | +22.637 |
Completed | +20.250 |
Detailed | +19.371 |
Update | +18.830 |
updated | +18.621 |
Neg logit contributions | |
dictators | -27.526 |
oppressed | -26.794 |
hating | -26.041 |
dictatorship | -25.491 |
bullies | -24.924 |
Token | More |
Token ID | 3125 |
Feature activation | -7.58e-01 |
Pos logit contributions | |
Setup | +14.826 |
updated | +14.546 |
update | +14.005 |
manually | +13.969 |
annot | +13.402 |
Neg logit contributions | |
dictators | -16.518 |
hating | -15.817 |
oppressed | -15.742 |
dictatorship | -14.985 |
tyranny | -14.946 |
Token | About |
Token ID | 7994 |
Feature activation | -7.18e-01 |
Pos logit contributions | |
Setup | +6.869 |
manually | +6.580 |
updated | +6.535 |
optionally | +6.472 |
annot | +6.376 |
Neg logit contributions | |
dictators | -4.869 |
hating | -4.822 |
oppressed | -4.654 |
Jews | -4.445 |
tyranny | -4.372 |
Token | N |
Token ID | 399 |
Feature activation | -4.70e-01 |
Pos logit contributions | |
Setup | +6.085 |
manually | +5.821 |
updated | +5.784 |
optionally | +5.715 |
annot | +5.637 |
Neg logit contributions | |
dictators | -4.992 |
hating | -4.936 |
oppressed | -4.787 |
Jews | -4.548 |
tyranny | -4.515 |
Token | ages |
Token ID | 1095 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
Setup | +2.593 |
manually | +2.425 |
updated | +2.392 |
optionally | +2.369 |
annot | +2.312 |
Neg logit contributions | |
hating | -4.652 |
dictators | -4.646 |
oppressed | -4.538 |
Jews | -4.395 |
Communism | -4.362 |