Token | important |
Token ID | 1593 |
Feature activation | -7.49e-01 |
Pos logit contributions | |
country | +4.536 |
majority | +4.512 |
nation | +4.503 |
inner | +4.309 |
oret | +4.268 |
Neg logit contributions | |
because | -6.444 |
besides | -6.412 |
nonetheless | -6.253 |
regardless | -6.178 |
nevertheless | -6.119 |
Token | theory |
Token ID | 4583 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
majority | +0.615 |
country | +0.614 |
nation | +0.611 |
oret | +0.586 |
inner | +0.581 |
Neg logit contributions | |
because | -0.947 |
besides | -0.939 |
nonetheless | -0.917 |
regardless | -0.902 |
nevertheless | -0.897 |
Token | out |
Token ID | 503 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
because | +12.924 |
besides | +12.601 |
nonetheless | +12.363 |
regardless | +12.082 |
nevertheless | +11.995 |
Neg logit contributions | |
majority | -8.877 |
nation | -8.816 |
country | -8.780 |
oret | -8.685 |
slightest | -8.416 |
Token | of |
Token ID | 286 |
Feature activation | +7.28e+00 |
Pos logit contributions | |
because | +17.116 |
besides | +16.513 |
nonetheless | +15.938 |
regardless | +15.812 |
nevertheless | +15.486 |
Neg logit contributions | |
oret | -14.109 |
majority | -13.618 |
nation | -13.361 |
slightest | -13.343 |
country | -13.263 |
Token | the |
Token ID | 262 |
Feature activation | -7.32e+00 |
Pos logit contributions | |
because | +6.968 |
besides | +6.806 |
nonetheless | +6.639 |
nevertheless | +6.435 |
regardless | +6.413 |
Neg logit contributions | |
oret | -7.632 |
nation | -7.573 |
majority | -7.564 |
country | -7.483 |
slightest | -7.349 |
Token | way |
Token ID | 835 |
Feature activation | +3.03e+01 |
Pos logit contributions | |
country | +7.293 |
majority | +7.238 |
nation | +7.222 |
inner | +6.944 |
oret | +6.936 |
Neg logit contributions | |
because | -7.858 |
besides | -7.806 |
nonetheless | -7.590 |
regardless | -7.457 |
nevertheless | -7.401 |
Token | . |
Token ID | 13 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
because | +31.804 |
nonetheless | +29.700 |
besides | +29.670 |
regardless | +28.708 |
nevertheless | +28.495 |
Neg logit contributions | |
oret | -15.897 |
majority | -15.454 |
slightest | -15.257 |
country | -14.992 |
nation | -14.981 |
Token |
|
Token ID | 198 |
Feature activation | +8.94e+00 |
Pos logit contributions | |
because | +16.956 |
besides | +16.206 |
regardless | +15.478 |
nonetheless | +15.470 |
unless | +15.253 |
Neg logit contributions | |
slightest | -12.281 |
country | -12.274 |
nation | -12.234 |
majority | -11.984 |
inner | -11.922 |
Token |
|
Token ID | 198 |
Feature activation | +5.11e+00 |
Pos logit contributions | |
because | +4.377 |
besides | +4.269 |
nonetheless | +3.992 |
regardless | +3.831 |
nevertheless | +3.757 |
Neg logit contributions | |
majority | -14.219 |
country | -14.217 |
nation | -14.181 |
oret | -13.854 |
inner | -13.851 |
Token | People |
Token ID | 8061 |
Feature activation | +5.40e+00 |
Pos logit contributions | |
because | +5.129 |
besides | +5.011 |
nonetheless | +4.802 |
regardless | +4.734 |
nevertheless | +4.669 |
Neg logit contributions | |
country | -5.473 |
nation | -5.456 |
majority | -5.418 |
inner | -5.266 |
trio | -5.200 |
Token | who |
Token ID | 508 |
Feature activation | +8.17e-01 |
Pos logit contributions | |
because | +5.622 |
besides | +5.580 |
nonetheless | +5.396 |
regardless | +5.301 |
nevertheless | +5.259 |
Neg logit contributions | |
country | -5.560 |
majority | -5.555 |
nation | -5.538 |
oret | -5.400 |
inner | -5.322 |
Token | 41 |
Token ID | 3901 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
because | +5.013 |
besides | +4.872 |
nonetheless | +4.737 |
regardless | +4.653 |
nevertheless | +4.652 |
Neg logit contributions | |
majority | -4.779 |
country | -4.719 |
nation | -4.714 |
oret | -4.639 |
inner | -4.556 |
Token | ] |
Token ID | 60 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
because | +10.339 |
besides | +9.839 |
nonetheless | +9.485 |
regardless | +9.318 |
nevertheless | +9.202 |
Neg logit contributions | |
majority | -12.034 |
nation | -11.824 |
country | -11.745 |
oret | -11.656 |
inner | -11.577 |
Token | and |
Token ID | 290 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
because | +17.950 |
besides | +17.316 |
nonetheless | +16.710 |
regardless | +16.660 |
nevertheless | +16.449 |
Neg logit contributions | |
country | -10.445 |
oret | -10.348 |
nation | -10.290 |
majority | -10.266 |
inner | -10.003 |
Token | Peterson |
Token ID | 18914 |
Feature activation | +8.77e+00 |
Pos logit contributions | |
because | +14.451 |
besides | +14.061 |
nonetheless | +13.761 |
nevertheless | +13.513 |
regardless | +13.495 |
Neg logit contributions | |
oret | -8.174 |
country | -8.173 |
nation | -8.076 |
majority | -8.040 |
inner | -7.739 |
Token | conc |
Token ID | 1673 |
Feature activation | +7.46e+00 |
Pos logit contributions | |
because | +9.684 |
besides | +9.480 |
nonetheless | +9.397 |
nevertheless | +9.196 |
regardless | +9.106 |
Neg logit contributions | |
country | -8.024 |
nation | -7.979 |
majority | -7.964 |
oret | -7.875 |
inner | -7.716 |
Token | urs |
Token ID | 1834 |
Feature activation | +2.99e+01 |
Pos logit contributions | |
because | +8.055 |
besides | +7.913 |
nonetheless | +7.736 |
nevertheless | +7.556 |
regardless | +7.549 |
Neg logit contributions | |
country | -7.030 |
nation | -7.010 |
majority | -6.837 |
inner | -6.629 |
slightest | -6.565 |
Token | that |
Token ID | 326 |
Feature activation | +9.10e+00 |
Pos logit contributions | |
because | +32.482 |
nonetheless | +30.617 |
besides | +30.540 |
regardless | +29.902 |
nevertheless | +29.698 |
Neg logit contributions | |
country | -14.295 |
oret | -14.142 |
nation | -14.115 |
majority | -14.022 |
slightest | -13.855 |
Token | the |
Token ID | 262 |
Feature activation | -1.95e+01 |
Pos logit contributions | |
because | +11.967 |
besides | +11.692 |
nonetheless | +11.459 |
regardless | +11.352 |
nevertheless | +11.239 |
Neg logit contributions | |
oret | -6.430 |
country | -6.373 |
nation | -6.284 |
majority | -6.277 |
inner | -6.068 |
Token | Muslims |
Token ID | 7045 |
Feature activation | +3.40e+00 |
Pos logit contributions | |
majority | +23.956 |
nation | +23.511 |
country | +23.502 |
inner | +22.455 |
remainder | +22.302 |
Neg logit contributions | |
besides | -12.395 |
because | -11.937 |
nonetheless | -11.534 |
regardless | -11.361 |
nevertheless | -11.171 |
Token | wanted |
Token ID | 2227 |
Feature activation | +8.79e+00 |
Pos logit contributions | |
because | +3.224 |
besides | +3.188 |
nonetheless | +3.095 |
regardless | +3.024 |
nevertheless | +3.007 |
Neg logit contributions | |
country | -3.854 |
majority | -3.853 |
nation | -3.838 |
oret | -3.736 |
inner | -3.712 |
Token | to |
Token ID | 284 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
because | +11.194 |
besides | +10.891 |
nonetheless | +10.722 |
regardless | +10.559 |
nevertheless | +10.506 |
Neg logit contributions | |
oret | -6.474 |
country | -6.347 |
nation | -6.312 |
majority | -6.217 |
ses | -6.175 |
Token | es |
Token ID | 274 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
majority | +3.811 |
country | +3.811 |
nation | +3.793 |
oret | +3.630 |
inner | +3.613 |
Neg logit contributions | |
because | -5.916 |
besides | -5.887 |
nonetheless | -5.757 |
regardless | -5.659 |
nevertheless | -5.631 |
Token | can |
Token ID | 460 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
because | +21.040 |
besides | +20.318 |
nonetheless | +20.114 |
nevertheless | +19.726 |
regardless | +19.661 |
Neg logit contributions | |
oret | -11.677 |
majority | -11.505 |
country | -11.426 |
nation | -11.232 |
inner | -10.975 |
Token | also |
Token ID | 635 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
because | +14.189 |
besides | +13.857 |
nonetheless | +13.795 |
nevertheless | +13.641 |
regardless | +13.253 |
Neg logit contributions | |
majority | -11.003 |
country | -10.987 |
nation | -10.970 |
oret | -10.899 |
inner | -10.661 |
Token | hardly |
Token ID | 8941 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
because | +17.426 |
nonetheless | +16.878 |
besides | +16.727 |
nevertheless | +16.674 |
regardless | +16.140 |
Neg logit contributions | |
oret | -12.490 |
majority | -12.376 |
nation | -12.374 |
country | -12.312 |
ses | -12.202 |
Token | be |
Token ID | 307 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
because | +13.808 |
besides | +13.439 |
nonetheless | +13.158 |
nevertheless | +12.955 |
regardless | +12.769 |
Neg logit contributions | |
majority | -10.891 |
oret | -10.734 |
country | -10.718 |
nation | -10.695 |
trio | -10.423 |
Token | doubted |
Token ID | 37104 |
Feature activation | +2.96e+01 |
Pos logit contributions | |
because | +13.533 |
besides | +13.172 |
nonetheless | +12.872 |
nevertheless | +12.605 |
regardless | +12.536 |
Neg logit contributions | |
nation | -9.705 |
country | -9.624 |
majority | -9.539 |
oret | -9.512 |
trio | -9.391 |
Token | ... |
Token ID | 986 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
because | +31.863 |
besides | +29.977 |
nonetheless | +29.472 |
regardless | +29.314 |
unless | +29.307 |
Neg logit contributions | |
majority | -15.169 |
country | -14.990 |
oret | -14.837 |
nation | -14.812 |
trio | -14.632 |
Token |
|
Token ID | 198 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
because | +20.897 |
besides | +20.268 |
nonetheless | +19.855 |
nevertheless | +19.731 |
regardless | +19.610 |
Neg logit contributions | |
country | -10.018 |
nation | -9.902 |
oret | -9.777 |
majority | -9.776 |
inner | -9.642 |
Token |
|
Token ID | 198 |
Feature activation | +8.37e+00 |
Pos logit contributions | |
because | +5.040 |
besides | +4.861 |
nonetheless | +4.527 |
regardless | +4.363 |
nevertheless | +4.262 |
Neg logit contributions | |
majority | -16.055 |
country | -16.054 |
nation | -16.010 |
inner | -15.665 |
oret | -15.634 |
Token | Fund |
Token ID | 24553 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
because | +8.177 |
besides | +7.975 |
nonetheless | +7.720 |
nevertheless | +7.519 |
regardless | +7.497 |
Neg logit contributions | |
country | -8.829 |
nation | -8.757 |
majority | -8.669 |
inner | -8.559 |
slightest | -8.453 |
Token | ament |
Token ID | 3263 |
Feature activation | +6.92e-01 |
Pos logit contributions | |
country | +1.833 |
majority | +1.832 |
nation | +1.825 |
oret | +1.752 |
inner | +1.745 |
Neg logit contributions | |
because | -2.529 |
besides | -2.503 |
nonetheless | -2.444 |
regardless | -2.404 |
nevertheless | -2.389 |
Token | he |
Token ID | 339 |
Feature activation | +2.28e+00 |
Pos logit contributions | |
because | +9.328 |
besides | +9.147 |
nonetheless | +8.962 |
regardless | +8.829 |
nevertheless | +8.718 |
Neg logit contributions | |
majority | -6.137 |
country | -6.106 |
nation | -6.084 |
oret | -5.971 |
inner | -5.853 |
Token | chooses |
Token ID | 19769 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
because | +2.215 |
besides | +2.182 |
nonetheless | +2.122 |
regardless | +2.076 |
nevertheless | +2.063 |
Neg logit contributions | |
country | -2.532 |
majority | -2.530 |
nation | -2.525 |
oret | -2.454 |
inner | -2.445 |
Token | to |
Token ID | 284 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
because | +14.069 |
besides | +13.737 |
nonetheless | +13.466 |
regardless | +13.330 |
nevertheless | +13.089 |
Neg logit contributions | |
oret | -9.567 |
nation | -9.437 |
majority | -9.407 |
country | -9.357 |
inner | -9.107 |
Token | exercise |
Token ID | 5517 |
Feature activation | +7.05e+00 |
Pos logit contributions | |
because | +2.528 |
besides | +2.498 |
nonetheless | +2.446 |
regardless | +2.403 |
nevertheless | +2.391 |
Neg logit contributions | |
majority | -1.712 |
country | -1.709 |
nation | -1.702 |
oret | -1.644 |
inner | -1.628 |
Token | that |
Token ID | 326 |
Feature activation | -5.07e+00 |
Pos logit contributions | |
because | +7.720 |
besides | +7.425 |
nonetheless | +7.423 |
regardless | +7.227 |
nevertheless | +7.157 |
Neg logit contributions | |
country | -6.546 |
nation | -6.534 |
oret | -6.507 |
majority | -6.501 |
inner | -6.287 |
Token | discretion |
Token ID | 14130 |
Feature activation | +2.96e+01 |
Pos logit contributions | |
majority | +3.992 |
country | +3.971 |
nation | +3.940 |
inner | +3.754 |
oret | +3.716 |
Neg logit contributions | |
because | -6.500 |
besides | -6.494 |
nonetheless | -6.321 |
regardless | -6.228 |
nevertheless | -6.200 |
Token | will |
Token ID | 481 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
because | +31.773 |
besides | +31.182 |
nonetheless | +30.726 |
regardless | +30.297 |
nevertheless | +30.296 |
Neg logit contributions | |
subur | -14.614 |
majority | -14.410 |
oret | -14.395 |
ikuman | -14.235 |
ses | -14.077 |
Token | determine |
Token ID | 5004 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
because | +20.087 |
nonetheless | +19.760 |
besides | +19.623 |
nevertheless | +19.408 |
regardless | +19.183 |
Neg logit contributions | |
majority | -11.013 |
ses | -10.913 |
country | -10.853 |
oret | -10.766 |
nation | -10.728 |
Token | Bob |
Token ID | 5811 |
Feature activation | -7.04e+00 |
Pos logit contributions | |
because | +18.538 |
besides | +17.879 |
regardless | +17.696 |
nonetheless | +17.619 |
unless | +17.149 |
Neg logit contributions | |
oret | -10.273 |
majority | -10.180 |
country | -10.081 |
nation | -10.011 |
trio | -9.975 |
Token | McDonnell |
Token ID | 39441 |
Feature activation | +6.00e+00 |
Pos logit contributions | |
majority | +7.087 |
country | +7.085 |
nation | +7.050 |
oret | +6.796 |
inner | +6.741 |
Neg logit contributions | |
besides | -7.269 |
because | -7.240 |
nonetheless | -7.034 |
regardless | -6.880 |
nevertheless | -6.865 |
Token | � |
Token ID | 447 |
Feature activation | -4.34e+00 |
Pos logit contributions | |
because | +5.446 |
besides | +5.234 |
regardless | +5.106 |
nonetheless | +5.100 |
nevertheless | +4.918 |
Neg logit contributions | |
majority | -6.805 |
country | -6.800 |
nation | -6.765 |
oret | -6.693 |
inner | -6.655 |
Token | most |
Token ID | 749 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
majority | +9.360 |
country | +9.307 |
nation | +9.262 |
inner | +8.998 |
oret | +8.884 |
Neg logit contributions | |
besides | -10.210 |
because | -10.157 |
nonetheless | -9.955 |
nevertheless | -9.728 |
regardless | -9.709 |
Token | realistic |
Token ID | 12653 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
because | +0.339 |
besides | +0.336 |
nonetheless | +0.328 |
regardless | +0.324 |
nevertheless | +0.321 |
Neg logit contributions | |
majority | -0.172 |
country | -0.171 |
nation | -0.171 |
oret | -0.163 |
inner | -0.160 |
Token | training |
Token ID | 3047 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
majority | +2.994 |
country | +2.994 |
nation | +2.982 |
inner | +2.877 |
oret | +2.877 |
Neg logit contributions | |
because | -2.767 |
besides | -2.749 |
nonetheless | -2.667 |
regardless | -2.612 |
nevertheless | -2.596 |
Token | experience |
Token ID | 1998 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
because | +19.573 |
besides | +19.183 |
regardless | +18.605 |
nonetheless | +18.529 |
nevertheless | +18.045 |
Neg logit contributions | |
majority | -7.503 |
nation | -7.345 |
country | -7.331 |
oret | -7.243 |
ses | -6.838 |
Token | to |
Token ID | 284 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
because | +27.182 |
besides | +26.549 |
regardless | +25.557 |
nonetheless | +25.139 |
unless | +24.678 |
Neg logit contributions | |
majority | -13.373 |
oret | -12.907 |
nation | -12.844 |
country | -12.818 |
ses | -12.626 |
Token | date |
Token ID | 3128 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
because | +14.554 |
besides | +14.166 |
nonetheless | +13.812 |
regardless | +13.725 |
nevertheless | +13.477 |
Neg logit contributions | |
majority | -8.221 |
nation | -8.009 |
country | -8.007 |
oret | -7.974 |
ses | -7.689 |
Token | ! |
Token ID | 0 |
Feature activation | +1.70e+01 |
Pos logit contributions | |
because | +30.221 |
besides | +28.750 |
regardless | +28.258 |
nonetheless | +27.382 |
unless | +27.215 |
Neg logit contributions | |
majority | -16.952 |
oret | -16.728 |
ses | -16.155 |
country | -16.146 |
nation | -16.083 |
Token |
|
Token ID | 198 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
because | +16.839 |
besides | +16.260 |
regardless | +15.624 |
unless | +15.206 |
nonetheless | +15.051 |
Neg logit contributions | |
slightest | -14.140 |
majority | -14.042 |
country | -13.938 |
nation | -13.888 |
inner | -13.827 |
Token |
|
Token ID | 198 |
Feature activation | +8.33e+00 |
Pos logit contributions | |
because | +5.707 |
besides | +5.461 |
nonetheless | +5.044 |
regardless | +4.912 |
nevertheless | +4.746 |
Neg logit contributions | |
majority | -17.435 |
country | -17.429 |
nation | -17.378 |
inner | -17.039 |
oret | -16.946 |
Token | Just |
Token ID | 5703 |
Feature activation | +7.12e+00 |
Pos logit contributions | |
because | +8.010 |
besides | +7.790 |
nonetheless | +7.341 |
regardless | +7.337 |
unless | +7.140 |
Neg logit contributions | |
country | -9.006 |
majority | -8.995 |
nation | -8.965 |
inner | -8.766 |
slightest | -8.688 |
Token | check |
Token ID | 2198 |
Feature activation | +9.46e+00 |
Pos logit contributions | |
because | +8.708 |
besides | +8.436 |
nonetheless | +8.128 |
regardless | +8.087 |
nevertheless | +7.919 |
Neg logit contributions | |
majority | -6.037 |
nation | -6.024 |
country | -6.015 |
oret | -5.928 |
inner | -5.652 |
Token | taken |
Token ID | 2077 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
because | +11.915 |
besides | +11.664 |
nonetheless | +11.400 |
regardless | +11.251 |
nevertheless | +11.094 |
Neg logit contributions | |
nation | -7.876 |
country | -7.826 |
majority | -7.794 |
oret | -7.714 |
trio | -7.593 |
Token | with |
Token ID | 351 |
Feature activation | +3.96e+00 |
Pos logit contributions | |
because | +20.393 |
besides | +19.508 |
nonetheless | +19.335 |
regardless | +19.302 |
unless | +18.694 |
Neg logit contributions | |
oret | -11.211 |
nation | -11.111 |
country | -11.068 |
ses | -10.934 |
majority | -10.914 |
Token | a |
Token ID | 257 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
because | +3.269 |
besides | +3.148 |
nonetheless | +3.046 |
regardless | +2.998 |
nevertheless | +2.919 |
Neg logit contributions | |
nation | -4.917 |
country | -4.896 |
majority | -4.852 |
oret | -4.849 |
inner | -4.754 |
Token | grain |
Token ID | 13020 |
Feature activation | +7.02e+00 |
Pos logit contributions | |
majority | +9.014 |
country | +8.800 |
nation | +8.669 |
inner | +8.090 |
trio | +8.072 |
Neg logit contributions | |
besides | -14.429 |
because | -14.287 |
nonetheless | -14.144 |
nevertheless | -13.919 |
regardless | -13.803 |
Token | of |
Token ID | 286 |
Feature activation | -2.59e+00 |
Pos logit contributions | |
because | +4.950 |
besides | +4.815 |
nonetheless | +4.635 |
regardless | +4.512 |
nevertheless | +4.429 |
Neg logit contributions | |
majority | -9.590 |
country | -9.587 |
nation | -9.569 |
oret | -9.370 |
inner | -9.329 |
Token | salt |
Token ID | 8268 |
Feature activation | +2.88e+01 |
Pos logit contributions | |
majority | +1.316 |
country | +1.315 |
nation | +1.304 |
oret | +1.251 |
inner | +1.216 |
Neg logit contributions | |
because | -4.107 |
besides | -4.061 |
nonetheless | -3.974 |
regardless | -3.938 |
nevertheless | -3.907 |
Token | for |
Token ID | 329 |
Feature activation | +7.93e+00 |
Pos logit contributions | |
because | +32.741 |
besides | +30.473 |
regardless | +30.161 |
unless | +29.938 |
nonetheless | +29.536 |
Neg logit contributions | |
majority | -13.865 |
slightest | -13.506 |
oret | -13.501 |
country | -13.454 |
nation | -13.451 |
Token | now |
Token ID | 783 |
Feature activation | +2.19e+01 |
Pos logit contributions | |
because | +10.065 |
besides | +9.764 |
nonetheless | +9.660 |
regardless | +9.551 |
nevertheless | +9.402 |
Neg logit contributions | |
nation | -5.904 |
country | -5.901 |
majority | -5.763 |
oret | -5.696 |
inner | -5.607 |
Token | until |
Token ID | 1566 |
Feature activation | +7.63e+00 |
Pos logit contributions | |
because | +25.575 |
besides | +24.008 |
regardless | +23.690 |
nonetheless | +23.399 |
unless | +23.368 |
Neg logit contributions | |
majority | -13.477 |
nation | -13.314 |
country | -13.300 |
oret | -13.202 |
slightest | -13.192 |
Token | more |
Token ID | 517 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
because | +9.348 |
besides | +9.215 |
nonetheless | +8.991 |
regardless | +8.901 |
nevertheless | +8.757 |
Neg logit contributions | |
country | -6.047 |
nation | -6.030 |
majority | -6.009 |
oret | -5.965 |
inner | -5.759 |
Token | reputable |
Token ID | 40300 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
majority | +1.095 |
country | +1.093 |
nation | +1.088 |
oret | +1.042 |
inner | +1.032 |
Neg logit contributions | |
because | -1.866 |
besides | -1.852 |
nonetheless | -1.806 |
regardless | -1.780 |
nevertheless | -1.767 |
Token | that |
Token ID | 326 |
Feature activation | +3.08e+00 |
Pos logit contributions | |
because | +10.685 |
besides | +10.506 |
nonetheless | +10.355 |
regardless | +10.180 |
nevertheless | +10.074 |
Neg logit contributions | |
nation | -7.888 |
country | -7.847 |
majority | -7.830 |
oret | -7.789 |
inner | -7.585 |
Token | this |
Token ID | 428 |
Feature activation | -6.50e+00 |
Pos logit contributions | |
because | +4.099 |
besides | +4.044 |
nonetheless | +3.952 |
regardless | +3.919 |
nevertheless | +3.870 |
Neg logit contributions | |
country | -2.295 |
majority | -2.293 |
nation | -2.289 |
oret | -2.215 |
inner | -2.167 |
Token | is |
Token ID | 318 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
country | +8.007 |
majority | +7.983 |
nation | +7.954 |
inner | +7.689 |
oret | +7.634 |
Neg logit contributions | |
besides | -5.352 |
because | -5.333 |
nonetheless | -5.103 |
regardless | -5.009 |
nevertheless | -4.938 |
Token | not |
Token ID | 407 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
because | +16.145 |
besides | +15.578 |
nonetheless | +15.337 |
regardless | +15.090 |
nevertheless | +15.044 |
Neg logit contributions | |
nation | -11.097 |
ses | -11.087 |
oret | -11.001 |
majority | -10.992 |
country | -10.970 |
Token | the |
Token ID | 262 |
Feature activation | -5.81e+00 |
Pos logit contributions | |
because | +15.919 |
besides | +15.159 |
nonetheless | +14.830 |
regardless | +14.713 |
nevertheless | +14.520 |
Neg logit contributions | |
oret | -11.203 |
nation | -11.152 |
country | -10.925 |
majority | -10.811 |
ses | -10.805 |
Token | case |
Token ID | 1339 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
majority | +1.780 |
country | +1.771 |
nation | +1.740 |
oret | +1.525 |
inner | +1.516 |
Neg logit contributions | |
because | -10.299 |
besides | -10.273 |
nonetheless | -10.091 |
regardless | -9.977 |
nevertheless | -9.937 |
Token | . |
Token ID | 13 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
because | +30.601 |
regardless | +28.398 |
nonetheless | +28.207 |
besides | +28.144 |
unless | +27.855 |
Neg logit contributions | |
oret | -16.203 |
nation | -15.382 |
country | -15.308 |
majority | -15.248 |
ses | -15.061 |
Token | Instead |
Token ID | 5455 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
because | +14.637 |
besides | +13.975 |
regardless | +13.511 |
nonetheless | +13.493 |
unless | +13.225 |
Neg logit contributions | |
slightest | -10.772 |
country | -10.614 |
nation | -10.594 |
majority | -10.544 |
inner | -10.520 |
Token | , |
Token ID | 11 |
Feature activation | +8.93e+00 |
Pos logit contributions | |
because | +20.535 |
besides | +19.736 |
regardless | +19.078 |
although | +18.744 |
nonetheless | +18.694 |
Neg logit contributions | |
slightest | -11.397 |
oret | -11.391 |
nation | -11.369 |
majority | -11.319 |
country | -11.198 |
Token | the |
Token ID | 262 |
Feature activation | -1.79e+01 |
Pos logit contributions | |
because | +11.909 |
besides | +11.603 |
regardless | +11.285 |
nonetheless | +11.265 |
nevertheless | +11.048 |
Neg logit contributions | |
oret | -6.009 |
nation | -5.994 |
majority | -5.973 |
country | -5.941 |
slightest | -5.660 |
Token | greater |
Token ID | 3744 |
Feature activation | -6.75e+00 |
Pos logit contributions | |
majority | +20.930 |
country | +20.602 |
nation | +20.374 |
oret | +19.704 |
inner | +19.650 |
Neg logit contributions | |
besides | -13.609 |
because | -13.054 |
nonetheless | -12.779 |
nevertheless | -12.358 |
regardless | -12.357 |
Token | � |
Token ID | 447 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
because | +0.907 |
besides | +0.898 |
nonetheless | +0.857 |
regardless | +0.831 |
nevertheless | +0.821 |
Neg logit contributions | |
majority | -1.931 |
country | -1.928 |
nation | -1.923 |
oret | -1.871 |
inner | -1.869 |
Token | � |
Token ID | 247 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
majority | +2.346 |
nation | +2.271 |
country | +2.266 |
inner | +2.173 |
oret | +2.123 |
Neg logit contributions | |
besides | -5.233 |
because | -5.203 |
nonetheless | -5.155 |
nevertheless | -5.083 |
regardless | -5.069 |
Token | ve |
Token ID | 303 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
because | +1.641 |
besides | +1.636 |
nonetheless | +1.611 |
regardless | +1.584 |
nevertheless | +1.578 |
Neg logit contributions | |
majority | -0.653 |
country | -0.647 |
nation | -0.639 |
oret | -0.608 |
inner | -0.596 |
Token | done |
Token ID | 1760 |
Feature activation | +4.65e+00 |
Pos logit contributions | |
because | +1.974 |
besides | +1.935 |
nonetheless | +1.847 |
regardless | +1.788 |
nevertheless | +1.767 |
Neg logit contributions | |
country | -4.400 |
majority | -4.399 |
nation | -4.388 |
oret | -4.281 |
inner | -4.267 |
Token | it |
Token ID | 340 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
because | +2.208 |
besides | +2.190 |
nonetheless | +2.057 |
regardless | +1.960 |
nevertheless | +1.934 |
Neg logit contributions | |
majority | -7.497 |
country | -7.493 |
nation | -7.473 |
inner | -7.287 |
oret | -7.278 |
Token | differently |
Token ID | 10338 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
because | +11.873 |
besides | +11.710 |
nonetheless | +11.264 |
regardless | +11.174 |
nevertheless | +10.953 |
Neg logit contributions | |
country | -11.411 |
majority | -11.408 |
nation | -11.389 |
oret | -11.136 |
inner | -10.958 |
Token | . |
Token ID | 13 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
because | +29.668 |
besides | +27.618 |
regardless | +27.347 |
unless | +27.165 |
nonetheless | +26.736 |
Neg logit contributions | |
oret | -15.075 |
majority | -14.812 |
nation | -14.795 |
slightest | -14.639 |
trio | -14.448 |
Token |
|
Token ID | 198 |
Feature activation | +9.00e+00 |
Pos logit contributions | |
because | +12.823 |
besides | +11.939 |
regardless | +11.532 |
unless | +11.408 |
nonetheless | +11.316 |
Neg logit contributions | |
nation | -12.773 |
country | -12.605 |
oret | -12.471 |
majority | -12.452 |
slightest | -12.446 |
Token |
|
Token ID | 198 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
because | +4.465 |
besides | +4.356 |
nonetheless | +4.074 |
regardless | +3.915 |
nevertheless | +3.838 |
Neg logit contributions | |
majority | -14.240 |
country | -14.237 |
nation | -14.202 |
oret | -13.870 |
inner | -13.867 |
Token | Do |
Token ID | 5211 |
Feature activation | +4.19e+00 |
Pos logit contributions | |
because | +4.736 |
besides | +4.641 |
nonetheless | +4.455 |
regardless | +4.376 |
nevertheless | +4.318 |
Neg logit contributions | |
country | -5.490 |
nation | -5.487 |
majority | -5.481 |
inner | -5.330 |
oret | -5.268 |
Token | you |
Token ID | 345 |
Feature activation | +6.17e+00 |
Pos logit contributions | |
because | +3.185 |
besides | +3.093 |
nonetheless | +2.962 |
regardless | +2.897 |
nevertheless | +2.827 |
Neg logit contributions | |
nation | -5.414 |
country | -5.389 |
majority | -5.381 |
oret | -5.325 |
trio | -5.242 |
Token | that |
Token ID | 326 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
because | +20.243 |
besides | +19.469 |
regardless | +18.765 |
nonetheless | +18.748 |
unless | +18.498 |
Neg logit contributions | |
oret | -13.191 |
country | -13.030 |
majority | -13.020 |
nation | -13.012 |
inner | -12.706 |
Token | was |
Token ID | 373 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
because | +10.003 |
besides | +9.678 |
nonetheless | +9.213 |
regardless | +9.070 |
nevertheless | +8.950 |
Neg logit contributions | |
oret | -13.143 |
country | -13.059 |
majority | -13.028 |
nation | -13.001 |
ses | -12.799 |
Token | worth |
Token ID | 2861 |
Feature activation | +3.74e+00 |
Pos logit contributions | |
because | +3.705 |
besides | +3.646 |
nonetheless | +3.502 |
regardless | +3.437 |
nevertheless | +3.387 |
Neg logit contributions | |
country | -4.839 |
nation | -4.815 |
majority | -4.796 |
oret | -4.684 |
inner | -4.663 |
Token | the |
Token ID | 262 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
because | +2.707 |
besides | +2.632 |
nonetheless | +2.501 |
regardless | +2.475 |
nevertheless | +2.395 |
Neg logit contributions | |
country | -5.041 |
nation | -5.021 |
majority | -5.002 |
oret | -4.965 |
inner | -4.880 |
Token | Democratic |
Token ID | 4390 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
majority | +23.847 |
nation | +23.212 |
country | +22.995 |
inner | +22.249 |
primary | +22.042 |
Neg logit contributions | |
besides | -14.359 |
nonetheless | -13.813 |
because | -13.640 |
nevertheless | -13.573 |
regardless | -12.955 |
Token | votes |
Token ID | 5690 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
majority | +19.387 |
nation | +18.671 |
country | +18.620 |
primary | +17.741 |
inner | +17.702 |
Neg logit contributions | |
besides | -15.876 |
nonetheless | -15.237 |
because | -15.082 |
nevertheless | -14.881 |
regardless | -14.780 |
Token | , |
Token ID | 11 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
because | +31.307 |
besides | +29.718 |
regardless | +29.243 |
unless | +28.763 |
nonetheless | +28.579 |
Neg logit contributions | |
oret | -14.061 |
multitude | -13.333 |
country | -13.322 |
ses | -13.263 |
nation | -13.232 |
Token | � |
Token ID | 447 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
because | +22.516 |
besides | +21.992 |
regardless | +21.602 |
nonetheless | +21.070 |
unless | +20.773 |
Neg logit contributions | |
oret | -11.334 |
country | -10.934 |
nation | -10.890 |
majority | -10.641 |
inner | -10.598 |
Token | � |
Token ID | 251 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
because | +4.282 |
besides | +4.239 |
nonetheless | +4.117 |
regardless | +4.073 |
nevertheless | +4.031 |
Neg logit contributions | |
country | -2.615 |
majority | -2.614 |
nation | -2.609 |
oret | -2.498 |
inner | -2.480 |
Token | Evans |
Token ID | 13922 |
Feature activation | +8.77e+00 |
Pos logit contributions | |
because | +11.947 |
besides | +11.592 |
regardless | +11.219 |
nonetheless | +11.154 |
nevertheless | +10.905 |
Neg logit contributions | |
oret | -10.496 |
nation | -10.381 |
country | -10.374 |
majority | -10.208 |
inner | -10.117 |
Token | told |
Token ID | 1297 |
Feature activation | +6.45e+00 |
Pos logit contributions | |
because | +7.944 |
nonetheless | +7.722 |
besides | +7.560 |
nevertheless | +7.500 |
regardless | +7.294 |
Neg logit contributions | |
nation | -9.328 |
country | -9.324 |
majority | -9.257 |
oret | -9.216 |
inner | -9.188 |
Token | is |
Token ID | 318 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
because | +10.342 |
besides | +10.074 |
nonetheless | +9.943 |
nevertheless | +9.694 |
regardless | +9.626 |
Neg logit contributions | |
majority | -10.922 |
country | -10.907 |
nation | -10.891 |
oret | -10.841 |
inner | -10.663 |
Token | for |
Token ID | 329 |
Feature activation | +3.11e+00 |
Pos logit contributions | |
because | +19.940 |
besides | +19.147 |
nonetheless | +18.824 |
regardless | +18.484 |
nevertheless | +18.420 |
Neg logit contributions | |
nation | -9.955 |
country | -9.847 |
majority | -9.845 |
oret | -9.751 |
ses | -9.582 |
Token | making |
Token ID | 1642 |
Feature activation | +6.30e+00 |
Pos logit contributions | |
because | +2.042 |
besides | +1.975 |
nonetheless | +1.889 |
regardless | +1.835 |
nevertheless | +1.796 |
Neg logit contributions | |
majority | -4.412 |
country | -4.411 |
nation | -4.404 |
oret | -4.333 |
inner | -4.288 |
Token | the |
Token ID | 262 |
Feature activation | -1.82e+01 |
Pos logit contributions | |
because | +7.168 |
besides | +6.929 |
nonetheless | +6.860 |
regardless | +6.737 |
nevertheless | +6.660 |
Neg logit contributions | |
majority | -5.673 |
country | -5.645 |
oret | -5.629 |
nation | -5.625 |
inner | -5.442 |
Token | latter |
Token ID | 6846 |
Feature activation | +4.73e+00 |
Pos logit contributions | |
majority | +20.481 |
country | +20.347 |
nation | +20.180 |
oret | +19.210 |
inner | +19.195 |
Neg logit contributions | |
besides | -14.159 |
because | -13.656 |
nonetheless | -13.412 |
nevertheless | -13.094 |
regardless | -13.062 |
Token | argument |
Token ID | 4578 |
Feature activation | +2.85e+01 |
Pos logit contributions | |
because | +6.867 |
besides | +6.725 |
nonetheless | +6.584 |
regardless | +6.546 |
nevertheless | +6.452 |
Neg logit contributions | |
country | -2.869 |
majority | -2.866 |
nation | -2.863 |
oret | -2.794 |
inner | -2.718 |
Token | — |
Token ID | 960 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
because | +32.206 |
besides | +30.576 |
nonetheless | +30.173 |
regardless | +29.875 |
nevertheless | +28.921 |
Neg logit contributions | |
oret | -13.544 |
slightest | -13.513 |
nation | -13.323 |
majority | -13.181 |
country | -13.056 |
Token | that |
Token ID | 5562 |
Feature activation | +7.61e+00 |
Pos logit contributions | |
because | +16.386 |
besides | +15.871 |
nonetheless | +15.484 |
regardless | +15.425 |
nevertheless | +15.024 |
Neg logit contributions | |
majority | -10.891 |
country | -10.823 |
nation | -10.787 |
inner | -10.520 |
trio | -10.462 |
Token | it |
Token ID | 340 |
Feature activation | +4.41e+00 |
Pos logit contributions | |
because | +9.528 |
besides | +9.297 |
nonetheless | +9.070 |
regardless | +9.046 |
nevertheless | +8.868 |
Neg logit contributions | |
country | -5.964 |
nation | -5.947 |
oret | -5.929 |
majority | -5.917 |
inner | -5.721 |
Token | was |
Token ID | 373 |
Feature activation | +4.03e+00 |
Pos logit contributions | |
because | +3.702 |
besides | +3.624 |
nonetheless | +3.537 |
regardless | +3.431 |
nevertheless | +3.421 |
Neg logit contributions | |
majority | -5.432 |
country | -5.431 |
nation | -5.414 |
oret | -5.290 |
inner | -5.266 |
Token | wrong |
Token ID | 2642 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
because | +4.577 |
besides | +4.486 |
nonetheless | +4.392 |
regardless | +4.296 |
nevertheless | +4.287 |
Neg logit contributions | |
country | -3.804 |
majority | -3.803 |
nation | -3.795 |
oret | -3.669 |
inner | -3.650 |
Token | that |
Token ID | 326 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
because | +26.256 |
besides | +25.592 |
nonetheless | +24.162 |
regardless | +23.959 |
although | +23.310 |
Neg logit contributions | |
slightest | -12.993 |
nation | -12.898 |
majority | -12.819 |
country | -12.777 |
oret | -12.268 |
Token | we |
Token ID | 356 |
Feature activation | +3.01e+00 |
Pos logit contributions | |
because | +11.060 |
besides | +10.800 |
nonetheless | +10.446 |
regardless | +10.196 |
nevertheless | +10.177 |
Neg logit contributions | |
majority | -11.138 |
nation | -11.053 |
country | -11.048 |
oret | -10.806 |
ses | -10.729 |
Token | were |
Token ID | 547 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
because | +2.167 |
besides | +2.116 |
nonetheless | +2.024 |
regardless | +1.964 |
nevertheless | +1.943 |
Neg logit contributions | |
majority | -4.109 |
country | -4.091 |
nation | -4.075 |
inner | -3.978 |
oret | -3.975 |
Token | play |
Token ID | 711 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
majority | +1.075 |
country | +1.074 |
nation | +1.069 |
oret | +1.023 |
inner | +1.017 |
Neg logit contributions | |
because | -1.708 |
besides | -1.694 |
nonetheless | -1.653 |
regardless | -1.628 |
nevertheless | -1.618 |
Token | - |
Token ID | 12 |
Feature activation | -5.85e+00 |
Pos logit contributions | |
country | +0.580 |
majority | +0.578 |
nation | +0.574 |
oret | +0.536 |
inner | +0.524 |
Neg logit contributions | |
besides | -1.734 |
because | -1.725 |
nonetheless | -1.707 |
nevertheless | -1.681 |
regardless | -1.680 |
Token | testing |
Token ID | 33407 |
Feature activation | +2.79e+01 |
Pos logit contributions | |
nation | +5.825 |
majority | +5.820 |
country | +5.776 |
oret | +5.711 |
ses | +5.553 |
Neg logit contributions | |
besides | -5.865 |
nonetheless | -5.695 |
because | -5.685 |
nevertheless | -5.592 |
regardless | -5.571 |
Token | . |
Token ID | 13 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
because | +30.820 |
besides | +29.814 |
nonetheless | +28.333 |
regardless | +28.210 |
nevertheless | +27.338 |
Neg logit contributions | |
slightest | -13.760 |
nation | -13.527 |
majority | -13.399 |
ses | -13.348 |
country | -13.346 |
Token | One |
Token ID | 1881 |
Feature activation | +4.46e+00 |
Pos logit contributions | |
because | +11.795 |
besides | +11.179 |
nonetheless | +10.611 |
regardless | +10.543 |
unless | +10.316 |
Neg logit contributions | |
slightest | -12.798 |
country | -12.724 |
nation | -12.715 |
inner | -12.578 |
majority | -12.517 |
Token | was |
Token ID | 373 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
because | +3.353 |
besides | +3.280 |
nonetheless | +3.011 |
regardless | +2.987 |
nevertheless | +2.894 |
Neg logit contributions | |
majority | -5.883 |
nation | -5.846 |
country | -5.838 |
oret | -5.707 |
inner | -5.676 |
Token | a |
Token ID | 257 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
because | +3.222 |
besides | +3.130 |
nonetheless | +2.986 |
regardless | +2.950 |
nevertheless | +2.885 |
Neg logit contributions | |
nation | -4.620 |
majority | -4.612 |
country | -4.602 |
inner | -4.461 |
oret | -4.458 |
Token | Thought |
Token ID | 27522 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
majority | +26.084 |
country | +25.946 |
nation | +25.705 |
trio | +25.218 |
inner | +24.983 |
Neg logit contributions | |
besides | -11.039 |
nonetheless | -10.586 |
because | -10.440 |
nevertheless | -10.325 |
regardless | -10.100 |
Token | choices |
Token ID | 7747 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
country | +8.272 |
nation | +8.234 |
majority | +8.194 |
inner | +7.939 |
oret | +7.798 |
Neg logit contributions | |
besides | -6.258 |
because | -6.218 |
nonetheless | -6.096 |
regardless | -5.915 |
nevertheless | -5.908 |
Token | , |
Token ID | 11 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
because | +16.960 |
besides | +16.365 |
regardless | +15.781 |
nonetheless | +15.593 |
nevertheless | +15.298 |
Neg logit contributions | |
majority | -11.488 |
oret | -11.313 |
country | -11.165 |
slightest | -11.103 |
nation | -11.076 |
Token | this |
Token ID | 428 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
because | +14.411 |
besides | +14.083 |
regardless | +13.752 |
nonetheless | +13.682 |
unless | +13.410 |
Neg logit contributions | |
majority | -7.473 |
oret | -7.464 |
nation | -7.371 |
country | -7.352 |
ses | -7.096 |
Token | raises |
Token ID | 12073 |
Feature activation | +8.44e+00 |
Pos logit contributions | |
country | +4.865 |
majority | +4.857 |
nation | +4.846 |
inner | +4.680 |
oret | +4.676 |
Neg logit contributions | |
because | -3.547 |
besides | -3.530 |
nonetheless | -3.396 |
regardless | -3.325 |
nevertheless | -3.295 |
Token | privacy |
Token ID | 6782 |
Feature activation | +7.37e+00 |
Pos logit contributions | |
because | +10.751 |
besides | +10.531 |
nonetheless | +10.292 |
regardless | +10.172 |
nevertheless | +10.011 |
Neg logit contributions | |
majority | -6.191 |
oret | -6.090 |
nation | -6.083 |
country | -6.056 |
inner | -5.784 |
Token | concerns |
Token ID | 4786 |
Feature activation | +2.79e+01 |
Pos logit contributions | |
because | +7.856 |
besides | +7.608 |
nonetheless | +7.392 |
regardless | +7.359 |
nevertheless | +7.163 |
Neg logit contributions | |
majority | -7.222 |
nation | -7.206 |
country | -7.167 |
oret | -7.049 |
inner | -6.932 |
Token | . |
Token ID | 13 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
because | +31.946 |
besides | +30.252 |
regardless | +30.033 |
nonetheless | +30.019 |
unless | +28.883 |
Neg logit contributions | |
oret | -14.824 |
slightest | -14.627 |
majority | -14.460 |
country | -14.010 |
ses | -14.005 |
Token |
|
Token ID | 198 |
Feature activation | +5.75e+00 |
Pos logit contributions | |
because | +17.188 |
besides | +16.478 |
regardless | +15.938 |
nonetheless | +15.895 |
unless | +15.720 |
Neg logit contributions | |
slightest | -11.806 |
inner | -11.599 |
country | -11.453 |
majority | -11.360 |
nation | -11.346 |
Token |
|
Token ID | 198 |
Feature activation | +4.58e+00 |
Pos logit contributions | |
besides | +3.005 |
because | +2.999 |
nonetheless | +2.859 |
regardless | +2.728 |
nevertheless | +2.709 |
Neg logit contributions | |
majority | -9.012 |
country | -9.007 |
nation | -8.986 |
oret | -8.785 |
inner | -8.730 |
Token | T |
Token ID | 51 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
because | +4.417 |
besides | +4.311 |
nonetheless | +4.145 |
regardless | +4.080 |
nevertheless | +4.014 |
Neg logit contributions | |
country | -5.089 |
majority | -5.072 |
nation | -5.058 |
inner | -4.939 |
slightest | -4.851 |
Token | ests |
Token ID | 3558 |
Feature activation | +9.24e+00 |
Pos logit contributions | |
majority | +14.603 |
country | +14.565 |
nation | +14.507 |
oret | +14.107 |
inner | +13.818 |
Neg logit contributions | |
besides | -12.612 |
nonetheless | -12.391 |
because | -12.042 |
nevertheless | -12.029 |
regardless | -11.909 |
Token | the |
Token ID | 262 |
Feature activation | -2.55e+01 |
Pos logit contributions | |
because | +12.749 |
besides | +12.201 |
regardless | +12.037 |
nonetheless | +11.793 |
nevertheless | +11.576 |
Neg logit contributions | |
oret | -9.798 |
nation | -9.528 |
country | -9.456 |
trio | -9.345 |
majority | -9.312 |
Token | dwelling |
Token ID | 26765 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
majority | +25.623 |
country | +24.877 |
nation | +24.656 |
remainder | +23.863 |
largest | +23.543 |
Neg logit contributions | |
besides | -17.642 |
nonetheless | -16.963 |
because | -16.824 |
nevertheless | -16.436 |
unless | -15.744 |
Token | supply |
Token ID | 5127 |
Feature activation | +6.80e+00 |
Pos logit contributions | |
majority | +8.984 |
country | +8.933 |
nation | +8.718 |
inner | +8.083 |
presence | +7.914 |
Neg logit contributions | |
besides | -17.143 |
nonetheless | -16.975 |
because | -16.696 |
nevertheless | -16.561 |
regardless | -16.413 |
Token | builds |
Token ID | 12188 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
because | +7.249 |
besides | +7.165 |
nonetheless | +6.984 |
regardless | +6.850 |
nevertheless | +6.800 |
Neg logit contributions | |
country | -6.861 |
majority | -6.847 |
nation | -6.833 |
oret | -6.608 |
inner | -6.579 |
Token | over |
Token ID | 625 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
because | +17.604 |
besides | +16.987 |
nonetheless | +16.461 |
regardless | +16.440 |
nevertheless | +15.927 |
Neg logit contributions | |
oret | -14.575 |
slightest | -14.430 |
country | -14.420 |
nation | -14.361 |
trio | -14.325 |
Token | time |
Token ID | 640 |
Feature activation | +2.78e+01 |
Pos logit contributions | |
besides | +2.063 |
because | +2.055 |
nonetheless | +2.020 |
regardless | +1.992 |
nevertheless | +1.983 |
Neg logit contributions | |
country | -0.863 |
majority | -0.855 |
nation | -0.845 |
inner | -0.788 |
oret | -0.784 |
Token | . |
Token ID | 13 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
because | +29.841 |
regardless | +28.070 |
besides | +27.778 |
nonetheless | +27.300 |
unless | +27.258 |
Neg logit contributions | |
oret | -15.260 |
slightest | -15.250 |
majority | -14.631 |
nation | -14.354 |
country | -14.331 |
Token |
|
Token ID | 198 |
Feature activation | +8.68e+00 |
Pos logit contributions | |
because | +17.117 |
besides | +16.335 |
regardless | +15.843 |
nonetheless | +15.705 |
unless | +15.530 |
Neg logit contributions | |
slightest | -13.078 |
country | -12.705 |
inner | -12.700 |
nation | -12.659 |
majority | -12.603 |
Token |
|
Token ID | 198 |
Feature activation | +7.68e+00 |
Pos logit contributions | |
because | +4.331 |
besides | +4.228 |
nonetheless | +3.962 |
regardless | +3.805 |
nevertheless | +3.733 |
Neg logit contributions | |
majority | -13.732 |
country | -13.727 |
nation | -13.693 |
oret | -13.374 |
inner | -13.371 |
Token | If |
Token ID | 1532 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
because | +7.505 |
besides | +7.302 |
nonetheless | +7.038 |
regardless | +6.927 |
nevertheless | +6.838 |
Neg logit contributions | |
country | -8.238 |
nation | -8.213 |
majority | -8.207 |
inner | -8.049 |
slightest | -7.939 |
Token | Christopher |
Token ID | 12803 |
Feature activation | +3.84e+00 |
Pos logit contributions | |
because | +3.583 |
besides | +3.516 |
nonetheless | +3.427 |
regardless | +3.389 |
nevertheless | +3.347 |
Neg logit contributions | |
country | -2.917 |
nation | -2.914 |
majority | -2.908 |
oret | -2.841 |
inner | -2.801 |
Token | of |
Token ID | 286 |
Feature activation | +6.42e+00 |
Pos logit contributions | |
because | +23.124 |
besides | +22.247 |
nonetheless | +21.449 |
unless | +21.352 |
regardless | +21.269 |
Neg logit contributions | |
country | -9.471 |
oret | -9.458 |
nation | -9.309 |
majority | -8.949 |
trio | -8.880 |
Token | major |
Token ID | 1688 |
Feature activation | +4.61e-01 |
Pos logit contributions | |
because | +8.329 |
besides | +8.071 |
nonetheless | +7.890 |
regardless | +7.811 |
unless | +7.772 |
Neg logit contributions | |
country | -4.653 |
majority | -4.578 |
nation | -4.575 |
oret | -4.550 |
trio | -4.354 |
Token |
|
Token ID | 198 |
Feature activation | +3.10e+00 |
Pos logit contributions | |
because | +0.504 |
besides | +0.495 |
nonetheless | +0.481 |
regardless | +0.474 |
nevertheless | +0.469 |
Neg logit contributions | |
country | -0.457 |
majority | -0.457 |
nation | -0.454 |
oret | -0.443 |
inner | -0.438 |
Token |
|
Token ID | 198 |
Feature activation | -6.76e+00 |
Pos logit contributions | |
besides | +1.806 |
nonetheless | +1.747 |
because | +1.745 |
nevertheless | +1.659 |
regardless | +1.656 |
Neg logit contributions | |
majority | -4.675 |
country | -4.672 |
nation | -4.661 |
oret | -4.556 |
inner | -4.505 |
Token | import |
Token ID | 11748 |
Feature activation | +7.21e+00 |
Pos logit contributions | |
country | +5.220 |
majority | +5.213 |
nation | +5.204 |
oret | +5.028 |
inner | +4.904 |
Neg logit contributions | |
besides | -8.621 |
because | -8.589 |
nonetheless | -8.430 |
regardless | -8.257 |
nevertheless | -8.254 |
Token | ance |
Token ID | 590 |
Feature activation | +2.78e+01 |
Pos logit contributions | |
because | +8.453 |
besides | +8.264 |
nonetheless | +7.949 |
regardless | +7.934 |
nevertheless | +7.771 |
Neg logit contributions | |
majority | -6.458 |
country | -6.403 |
nation | -6.392 |
oret | -6.229 |
inner | -6.177 |
Token | for |
Token ID | 329 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
because | +31.520 |
besides | +29.847 |
unless | +29.560 |
regardless | +29.363 |
nonetheless | +29.047 |
Neg logit contributions | |
majority | -14.341 |
oret | -13.725 |
ses | -13.608 |
country | -13.592 |
nation | -13.449 |
Token | the |
Token ID | 262 |
Feature activation | -1.97e+01 |
Pos logit contributions | |
because | +2.981 |
besides | +2.942 |
nonetheless | +2.873 |
regardless | +2.840 |
nevertheless | +2.814 |
Neg logit contributions | |
country | -1.625 |
majority | -1.618 |
nation | -1.614 |
oret | -1.574 |
inner | -1.534 |
Token | applications |
Token ID | 5479 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
majority | +24.379 |
country | +23.835 |
nation | +23.806 |
inner | +23.089 |
oret | +22.786 |
Neg logit contributions | |
besides | -12.008 |
because | -11.566 |
nonetheless | -11.269 |
regardless | -10.865 |
nevertheless | -10.838 |
Token | I |
Token ID | 314 |
Feature activation | +5.85e-01 |
Pos logit contributions | |
because | +17.848 |
besides | +17.623 |
nonetheless | +17.008 |
regardless | +16.865 |
nevertheless | +16.748 |
Neg logit contributions | |
majority | -9.150 |
nation | -9.123 |
country | -9.064 |
oret | -8.772 |
trio | -8.712 |
Token | have |
Token ID | 423 |
Feature activation | +5.71e+00 |
Pos logit contributions | |
because | +0.610 |
besides | +0.605 |
nonetheless | +0.588 |
regardless | +0.577 |
nevertheless | +0.572 |
Neg logit contributions | |
country | -0.608 |
majority | -0.608 |
nation | -0.606 |
oret | -0.583 |
inner | -0.582 |
Token | the |
Token ID | 262 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
country | +14.655 |
majority | +14.616 |
nation | +14.508 |
inner | +14.296 |
primary | +13.799 |
Neg logit contributions | |
besides | -9.484 |
because | -9.343 |
nonetheless | -9.156 |
regardless | -8.898 |
nevertheless | -8.867 |
Token | disease |
Token ID | 4369 |
Feature activation | +4.32e+00 |
Pos logit contributions | |
majority | +30.389 |
country | +30.115 |
nation | +29.694 |
presence | +29.569 |
inner | +29.474 |
Neg logit contributions | |
besides | -13.398 |
because | -12.667 |
nonetheless | -12.562 |
nevertheless | -12.175 |
regardless | -12.168 |
Token | also |
Token ID | 635 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
because | +4.138 |
besides | +4.078 |
nonetheless | +3.972 |
regardless | +3.875 |
nevertheless | +3.863 |
Neg logit contributions | |
majority | -4.830 |
country | -4.818 |
nation | -4.794 |
oret | -4.694 |
inner | -4.645 |
Token | have |
Token ID | 423 |
Feature activation | +4.44e+00 |
Pos logit contributions | |
because | +14.335 |
besides | +14.079 |
nonetheless | +13.815 |
nevertheless | +13.536 |
regardless | +13.452 |
Neg logit contributions | |
majority | -8.611 |
country | -8.522 |
nation | -8.470 |
oret | -8.398 |
trio | -8.128 |
Token | social |
Token ID | 1919 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
because | +5.495 |
besides | +5.422 |
nonetheless | +5.285 |
regardless | +5.185 |
nevertheless | +5.168 |
Neg logit contributions | |
majority | -3.625 |
nation | -3.601 |
country | -3.591 |
oret | -3.542 |
trio | -3.445 |
Token | repercussions |
Token ID | 34056 |
Feature activation | +2.77e+01 |
Pos logit contributions | |
majority | +12.108 |
country | +12.052 |
nation | +12.011 |
inner | +11.638 |
oret | +11.517 |
Neg logit contributions | |
besides | -8.221 |
because | -8.157 |
nonetheless | -7.982 |
nevertheless | -7.768 |
regardless | -7.734 |
Token | . |
Token ID | 13 |
Feature activation | +9.93e+00 |
Pos logit contributions | |
because | +31.332 |
besides | +30.264 |
regardless | +29.399 |
nonetheless | +29.318 |
unless | +28.450 |
Neg logit contributions | |
oret | -14.754 |
slightest | -14.694 |
majority | -14.471 |
trio | -14.319 |
ses | -14.143 |
Token |
|
Token ID | 198 |
Feature activation | +3.41e+00 |
Pos logit contributions | |
because | +12.416 |
besides | +12.020 |
nonetheless | +11.694 |
regardless | +11.633 |
nevertheless | +11.423 |
Neg logit contributions | |
country | -7.526 |
majority | -7.514 |
nation | -7.473 |
slightest | -7.458 |
inner | -7.334 |
Token |
|
Token ID | 198 |
Feature activation | +8.51e-01 |
Pos logit contributions | |
besides | +1.859 |
because | +1.832 |
nonetheless | +1.779 |
regardless | +1.697 |
nevertheless | +1.691 |
Neg logit contributions | |
majority | -5.261 |
country | -5.251 |
nation | -5.239 |
oret | -5.125 |
inner | -5.076 |
Token | In |
Token ID | 818 |
Feature activation | -8.54e+00 |
Pos logit contributions | |
because | +0.861 |
besides | +0.850 |
nonetheless | +0.823 |
regardless | +0.807 |
nevertheless | +0.800 |
Neg logit contributions | |
country | -0.916 |
majority | -0.915 |
nation | -0.912 |
inner | -0.882 |
oret | -0.879 |
Token | extreme |
Token ID | 3257 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
country | +10.038 |
majority | +10.032 |
nation | +9.979 |
inner | +9.627 |
oret | +9.599 |
Neg logit contributions | |
besides | -7.491 |
because | -7.489 |
nonetheless | -7.200 |
regardless | -7.080 |
nevertheless | -6.976 |
Token | removed |
Token ID | 4615 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
because | +15.617 |
besides | +15.073 |
nonetheless | +14.640 |
regardless | +14.609 |
nevertheless | +14.297 |
Neg logit contributions | |
oret | -9.912 |
nation | -9.889 |
majority | -9.839 |
country | -9.807 |
inner | -9.497 |
Token | , |
Token ID | 11 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
because | +18.490 |
besides | +17.495 |
regardless | +17.149 |
nonetheless | +16.946 |
unless | +16.743 |
Neg logit contributions | |
oret | -13.343 |
nation | -13.103 |
country | -13.027 |
majority | -13.007 |
slightest | -12.764 |
Token | and |
Token ID | 290 |
Feature activation | +8.30e+00 |
Pos logit contributions | |
because | +22.286 |
besides | +21.457 |
regardless | +21.269 |
nonetheless | +20.902 |
according | +20.837 |
Neg logit contributions | |
oret | -7.391 |
nation | -6.954 |
majority | -6.947 |
country | -6.869 |
slightest | -6.747 |
Token | the |
Token ID | 262 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
because | +10.819 |
besides | +10.566 |
nonetheless | +10.342 |
regardless | +10.226 |
nevertheless | +10.081 |
Neg logit contributions | |
majority | -6.121 |
nation | -6.104 |
country | -6.083 |
oret | -6.051 |
inner | -5.830 |
Token | judge |
Token ID | 5052 |
Feature activation | +9.92e+00 |
Pos logit contributions | |
country | +20.203 |
majority | +20.137 |
nation | +20.085 |
inner | +19.285 |
remainder | +19.161 |
Neg logit contributions | |
besides | -13.027 |
because | -12.611 |
nonetheless | -12.368 |
nevertheless | -12.090 |
regardless | -12.016 |
Token | agreed |
Token ID | 4987 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
because | +10.895 |
nonetheless | +10.580 |
besides | +10.559 |
nevertheless | +10.299 |
regardless | +10.231 |
Neg logit contributions | |
country | -8.996 |
nation | -8.995 |
majority | -8.929 |
oret | -8.837 |
inner | -8.691 |
Token | . |
Token ID | 13 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
because | +30.946 |
regardless | +29.011 |
nonetheless | +28.902 |
besides | +28.586 |
unless | +27.950 |
Neg logit contributions | |
oret | -14.713 |
ses | -14.189 |
slightest | -14.156 |
nation | -13.926 |
country | -13.881 |
Token |
|
Token ID | 198 |
Feature activation | +9.52e+00 |
Pos logit contributions | |
because | +17.697 |
besides | +16.713 |
regardless | +16.401 |
nonetheless | +16.295 |
nevertheless | +15.977 |
Neg logit contributions | |
slightest | -13.094 |
country | -13.047 |
nation | -12.967 |
oret | -12.934 |
majority | -12.933 |
Token |
|
Token ID | 198 |
Feature activation | +6.33e+00 |
Pos logit contributions | |
because | +4.761 |
besides | +4.620 |
nonetheless | +4.309 |
regardless | +4.154 |
nevertheless | +4.061 |
Neg logit contributions | |
majority | -14.992 |
country | -14.987 |
nation | -14.948 |
inner | -14.612 |
oret | -14.601 |
Token | Now |
Token ID | 3844 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
because | +6.899 |
besides | +6.704 |
nonetheless | +6.493 |
regardless | +6.400 |
nevertheless | +6.306 |
Neg logit contributions | |
country | -6.161 |
majority | -6.140 |
nation | -6.132 |
inner | -5.991 |
slightest | -5.925 |
Token | prosecutors |
Token ID | 11947 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
because | +17.067 |
besides | +16.521 |
regardless | +16.089 |
nonetheless | +15.916 |
unless | +15.738 |
Neg logit contributions | |
majority | -8.308 |
nation | -8.210 |
country | -8.183 |
slightest | -8.143 |
oret | -8.079 |
Token | 'll |
Token ID | 1183 |
Feature activation | +5.13e+00 |
Pos logit contributions | |
because | +2.104 |
besides | +2.073 |
nonetheless | +2.014 |
regardless | +1.963 |
nevertheless | +1.953 |
Neg logit contributions | |
majority | -2.752 |
country | -2.745 |
nation | -2.736 |
oret | -2.671 |
inner | -2.660 |
Token | be |
Token ID | 307 |
Feature activation | +5.00e+00 |
Pos logit contributions | |
because | +5.009 |
besides | +4.867 |
nonetheless | +4.843 |
nevertheless | +4.711 |
regardless | +4.695 |
Neg logit contributions | |
majority | -5.594 |
country | -5.588 |
nation | -5.547 |
oret | -5.503 |
inner | -5.416 |
Token | in |
Token ID | 287 |
Feature activation | -7.20e+00 |
Pos logit contributions | |
because | +3.832 |
besides | +3.691 |
nonetheless | +3.589 |
regardless | +3.520 |
nevertheless | +3.438 |
Neg logit contributions | |
majority | -6.488 |
country | -6.460 |
nation | -6.440 |
oret | -6.398 |
inner | -6.301 |
Token | custody |
Token ID | 10804 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
country | +4.935 |
majority | +4.864 |
nation | +4.845 |
inner | +4.470 |
presence | +4.408 |
Neg logit contributions | |
besides | -9.734 |
because | -9.591 |
nonetheless | -9.392 |
regardless | -9.274 |
nevertheless | -9.244 |
Token | pretty |
Token ID | 2495 |
Feature activation | +3.19e+00 |
Pos logit contributions | |
because | +16.110 |
besides | +15.506 |
regardless | +15.224 |
nonetheless | +14.896 |
unless | +14.729 |
Neg logit contributions | |
majority | -12.629 |
country | -12.236 |
nation | -12.168 |
ses | -12.068 |
inner | -11.923 |
Token | quickly |
Token ID | 2952 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
because | +2.097 |
besides | +2.096 |
nonetheless | +1.974 |
regardless | +1.919 |
nevertheless | +1.900 |
Neg logit contributions | |
country | -4.557 |
majority | -4.555 |
nation | -4.549 |
inner | -4.411 |
oret | -4.389 |
Token | ." |
Token ID | 526 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
because | +30.420 |
regardless | +28.355 |
besides | +27.877 |
unless | +27.831 |
nonetheless | +27.476 |
Neg logit contributions | |
oret | -15.860 |
majority | -15.416 |
slightest | -15.313 |
inner | -15.159 |
trio | -14.980 |
Token |
|
Token ID | 198 |
Feature activation | +8.38e+00 |
Pos logit contributions | |
because | +19.427 |
besides | +18.808 |
regardless | +18.143 |
nonetheless | +17.876 |
unless | +17.770 |
Neg logit contributions | |
majority | -14.808 |
country | -14.579 |
nation | -14.439 |
oret | -14.397 |
inner | -14.263 |
Token |
|
Token ID | 198 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
because | +4.135 |
besides | +4.050 |
nonetheless | +3.793 |
regardless | +3.640 |
nevertheless | +3.573 |
Neg logit contributions | |
majority | -13.302 |
country | -13.297 |
nation | -13.264 |
oret | -12.958 |
inner | -12.946 |
Token | ' |
Token ID | 6 |
Feature activation | -6.71e+00 |
Pos logit contributions | |
because | +2.332 |
besides | +2.294 |
nonetheless | +2.212 |
regardless | +2.175 |
nevertheless | +2.145 |
Neg logit contributions | |
majority | -2.442 |
country | -2.439 |
nation | -2.427 |
inner | -2.357 |
oret | -2.336 |
Token | A |
Token ID | 32 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
majority | +7.718 |
country | +7.698 |
nation | +7.677 |
oret | +7.461 |
inner | +7.325 |
Neg logit contributions | |
besides | -5.885 |
because | -5.852 |
nonetheless | -5.749 |
nevertheless | -5.610 |
regardless | -5.561 |
Token | would |
Token ID | 561 |
Feature activation | +9.76e+00 |
Pos logit contributions | |
because | +4.682 |
besides | +4.637 |
nonetheless | +4.497 |
regardless | +4.377 |
nevertheless | +4.371 |
Neg logit contributions | |
majority | -6.153 |
country | -6.119 |
nation | -6.104 |
oret | -5.967 |
inner | -5.927 |
Token | come |
Token ID | 1282 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
because | +11.317 |
besides | +11.217 |
nonetheless | +11.037 |
nevertheless | +10.827 |
regardless | +10.755 |
Neg logit contributions | |
country | -8.184 |
nation | -8.158 |
majority | -8.150 |
oret | -8.057 |
inner | -7.873 |
Token | to |
Token ID | 284 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
because | +11.017 |
besides | +10.690 |
regardless | +10.348 |
nonetheless | +10.263 |
unless | +9.933 |
Neg logit contributions | |
oret | -11.406 |
majority | -11.237 |
nation | -11.197 |
country | -11.175 |
slightest | -10.887 |
Token | quite |
Token ID | 2407 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
because | +2.132 |
besides | +2.112 |
nonetheless | +2.033 |
regardless | +2.012 |
nevertheless | +1.985 |
Neg logit contributions | |
country | -2.070 |
nation | -2.067 |
majority | -2.055 |
oret | -2.022 |
inner | -1.987 |
Token | different |
Token ID | 1180 |
Feature activation | +3.75e-02 |
Pos logit contributions | |
majority | +1.360 |
country | +1.357 |
nation | +1.351 |
inner | +1.303 |
oret | +1.303 |
Neg logit contributions | |
because | -1.274 |
besides | -1.264 |
nonetheless | -1.228 |
regardless | -1.202 |
nevertheless | -1.194 |
Token | conclusions |
Token ID | 13242 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
because | +0.052 |
besides | +0.051 |
nonetheless | +0.050 |
regardless | +0.050 |
nevertheless | +0.049 |
Neg logit contributions | |
majority | -0.026 |
country | -0.026 |
nation | -0.026 |
oret | -0.025 |
inner | -0.025 |
Token | about |
Token ID | 546 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
because | +30.494 |
besides | +29.522 |
regardless | +28.575 |
nonetheless | +28.417 |
unless | +27.829 |
Neg logit contributions | |
oret | -15.751 |
slightest | -15.500 |
majority | -15.324 |
nation | -15.314 |
country | -15.285 |
Token | this |
Token ID | 428 |
Feature activation | -6.56e+00 |
Pos logit contributions | |
because | +1.439 |
besides | +1.410 |
nonetheless | +1.349 |
regardless | +1.332 |
nevertheless | +1.304 |
Neg logit contributions | |
majority | -2.162 |
nation | -2.161 |
country | -2.159 |
oret | -2.110 |
inner | -2.085 |
Token | pair |
Token ID | 5166 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
country | +9.552 |
majority | +9.500 |
nation | +9.475 |
inner | +9.253 |
oret | +9.198 |
Neg logit contributions | |
besides | -3.811 |
because | -3.787 |
nonetheless | -3.636 |
regardless | -3.500 |
nevertheless | -3.478 |
Token | 's |
Token ID | 338 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
because | +3.790 |
besides | +3.706 |
nonetheless | +3.548 |
regardless | +3.492 |
nevertheless | +3.438 |
Neg logit contributions | |
majority | -4.827 |
country | -4.815 |
nation | -4.800 |
oret | -4.716 |
inner | -4.647 |
Token | shared |
Token ID | 4888 |
Feature activation | -1.47e+01 |
Pos logit contributions | |
country | +18.740 |
majority | +18.526 |
nation | +18.489 |
inner | +18.228 |
presence | +17.862 |
Neg logit contributions | |
besides | -10.901 |
because | -10.622 |
nonetheless | -10.481 |
nevertheless | -10.164 |
regardless | -10.153 |
Token | this |
Token ID | 428 |
Feature activation | -7.08e+00 |
Pos logit contributions | |
because | +4.784 |
besides | +4.657 |
nonetheless | +4.517 |
regardless | +4.466 |
nevertheless | +4.400 |
Neg logit contributions | |
majority | -4.735 |
country | -4.680 |
nation | -4.669 |
oret | -4.612 |
inner | -4.524 |
Token | , |
Token ID | 11 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
country | +11.041 |
nation | +10.950 |
majority | +10.885 |
inner | +10.574 |
trio | +10.467 |
Neg logit contributions | |
besides | -3.340 |
nonetheless | -3.153 |
because | -3.144 |
nevertheless | -2.993 |
regardless | -2.906 |
Token | � |
Token ID | 447 |
Feature activation | +7.94e-01 |
Pos logit contributions | |
because | +19.417 |
besides | +18.290 |
regardless | +17.921 |
nonetheless | +17.768 |
although | +17.343 |
Neg logit contributions | |
oret | -11.904 |
majority | -11.821 |
nation | -11.767 |
country | -11.711 |
slightest | -11.538 |
Token | � |
Token ID | 251 |
Feature activation | +9.65e+00 |
Pos logit contributions | |
because | +1.049 |
besides | +1.035 |
nonetheless | +1.005 |
regardless | +0.995 |
nevertheless | +0.985 |
Neg logit contributions | |
majority | -0.610 |
country | -0.609 |
nation | -0.608 |
oret | -0.585 |
inner | -0.579 |
Token | Todd |
Token ID | 14377 |
Feature activation | +9.32e+00 |
Pos logit contributions | |
because | +10.951 |
besides | +10.581 |
nonetheless | +10.209 |
regardless | +10.202 |
nevertheless | +10.010 |
Neg logit contributions | |
majority | -8.528 |
oret | -8.502 |
nation | -8.485 |
country | -8.479 |
inner | -8.305 |
Token | agreed |
Token ID | 4987 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
because | +8.565 |
besides | +8.190 |
nonetheless | +8.184 |
nevertheless | +7.975 |
regardless | +7.760 |
Neg logit contributions | |
nation | -9.970 |
country | -9.953 |
majority | -9.913 |
oret | -9.836 |
inner | -9.680 |
Token | . |
Token ID | 13 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
because | +28.576 |
besides | +27.017 |
regardless | +26.631 |
nonetheless | +26.585 |
unless | +25.845 |
Neg logit contributions | |
oret | -15.475 |
majority | -15.039 |
nation | -14.902 |
country | -14.878 |
inner | -14.675 |
Token | � |
Token ID | 564 |
Feature activation | -9.24e-02 |
Pos logit contributions | |
because | +17.379 |
besides | +16.504 |
regardless | +16.028 |
nonetheless | +15.944 |
unless | +15.704 |
Neg logit contributions | |
slightest | -11.960 |
inner | -11.936 |
majority | -11.741 |
country | -11.718 |
oret | -11.701 |
Token | � |
Token ID | 250 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
majority | +0.066 |
country | +0.066 |
nation | +0.065 |
oret | +0.062 |
inner | +0.062 |
Neg logit contributions | |
because | -0.125 |
besides | -0.125 |
nonetheless | -0.123 |
regardless | -0.121 |
nevertheless | -0.121 |
Token | That |
Token ID | 2504 |
Feature activation | +7.81e+00 |
Pos logit contributions | |
because | +14.325 |
besides | +13.484 |
nonetheless | +13.011 |
regardless | +12.890 |
nevertheless | +12.680 |
Neg logit contributions | |
country | -14.200 |
nation | -14.199 |
slightest | -14.163 |
inner | -14.160 |
majority | -14.073 |
Token | there |
Token ID | 612 |
Feature activation | +6.39e+00 |
Pos logit contributions | |
because | +10.002 |
besides | +9.718 |
nonetheless | +9.559 |
regardless | +9.445 |
nevertheless | +9.371 |
Neg logit contributions | |
majority | -5.701 |
nation | -5.680 |
oret | -5.678 |
country | -5.644 |
inner | -5.463 |
Token | not |
Token ID | 407 |
Feature activation | +8.87e+00 |
Pos logit contributions | |
because | +15.360 |
besides | +14.752 |
nonetheless | +14.407 |
regardless | +14.186 |
nevertheless | +14.142 |
Neg logit contributions | |
nation | -9.824 |
country | -9.754 |
majority | -9.653 |
oret | -9.464 |
slightest | -9.213 |
Token | do |
Token ID | 466 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
because | +11.688 |
besides | +11.383 |
nonetheless | +11.081 |
regardless | +10.948 |
nevertheless | +10.867 |
Neg logit contributions | |
majority | -6.369 |
nation | -6.328 |
country | -6.310 |
oret | -6.081 |
inner | -5.977 |
Token | the |
Token ID | 262 |
Feature activation | -9.27e+00 |
Pos logit contributions | |
because | +12.825 |
besides | +12.341 |
regardless | +11.879 |
nonetheless | +11.862 |
unless | +11.723 |
Neg logit contributions | |
nation | -9.047 |
oret | -8.988 |
country | -8.928 |
majority | -8.910 |
inner | -8.625 |
Token | sub |
Token ID | 850 |
Feature activation | -5.49e+00 |
Pos logit contributions | |
majority | +6.945 |
country | +6.862 |
nation | +6.766 |
inner | +6.477 |
oret | +6.453 |
Neg logit contributions | |
besides | -12.039 |
because | -11.990 |
nonetheless | -11.865 |
nevertheless | -11.635 |
regardless | -11.567 |
Token | any |
Token ID | 597 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
country | +6.728 |
majority | +6.726 |
nation | +6.674 |
inner | +6.463 |
oret | +6.430 |
Neg logit contributions | |
besides | -4.531 |
because | -4.523 |
nonetheless | -4.392 |
regardless | -4.269 |
nevertheless | -4.258 |
Token | justice |
Token ID | 5316 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
because | +1.887 |
besides | +1.865 |
nonetheless | +1.790 |
regardless | +1.778 |
nevertheless | +1.740 |
Neg logit contributions | |
majority | -1.465 |
country | -1.458 |
nation | -1.452 |
oret | -1.422 |
inner | -1.399 |
Token | . |
Token ID | 13 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
because | +31.971 |
besides | +30.502 |
regardless | +29.364 |
unless | +29.334 |
although | +29.008 |
Neg logit contributions | |
majority | -14.016 |
oret | -13.674 |
nation | -13.592 |
country | -13.306 |
ses | -13.165 |
Token | Get |
Token ID | 3497 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
because | +16.115 |
besides | +15.734 |
nonetheless | +15.061 |
regardless | +14.971 |
unless | +14.912 |
Neg logit contributions | |
nation | -11.201 |
country | -11.036 |
majority | -10.965 |
oret | -10.698 |
slightest | -10.694 |
Token | a |
Token ID | 257 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
because | +2.898 |
besides | +2.833 |
nonetheless | +2.720 |
regardless | +2.678 |
nevertheless | +2.622 |
Neg logit contributions | |
nation | -4.129 |
majority | -4.128 |
country | -4.116 |
oret | -4.015 |
inner | -3.961 |
Token | Monster |
Token ID | 12635 |
Feature activation | -7.19e+00 |
Pos logit contributions | |
country | +17.627 |
majority | +17.560 |
nation | +17.345 |
inner | +16.870 |
trio | +16.735 |
Neg logit contributions | |
besides | -11.589 |
because | -11.350 |
nonetheless | -11.234 |
nevertheless | -10.954 |
regardless | -10.802 |
Token | Bass |
Token ID | 19829 |
Feature activation | +8.87e-01 |
Pos logit contributions | |
country | +9.820 |
majority | +9.811 |
nation | +9.770 |
inner | +9.558 |
oret | +9.467 |
Neg logit contributions | |
besides | -4.842 |
because | -4.796 |
nonetheless | -4.610 |
nevertheless | -4.459 |
regardless | -4.454 |
Token | , |
Token ID | 11 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
because | +19.999 |
besides | +18.805 |
nonetheless | +18.297 |
regardless | +18.064 |
nevertheless | +17.807 |
Neg logit contributions | |
majority | -15.130 |
nation | -14.795 |
country | -14.738 |
multitude | -14.490 |
slightest | -14.458 |
Token | because |
Token ID | 780 |
Feature activation | +6.32e+00 |
Pos logit contributions | |
because | +21.310 |
besides | +20.048 |
regardless | +19.584 |
although | +19.391 |
unless | +19.280 |
Neg logit contributions | |
oret | -12.160 |
majority | -12.150 |
nation | -11.939 |
country | -11.876 |
ses | -11.703 |
Token | the |
Token ID | 262 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
because | +8.477 |
besides | +8.339 |
nonetheless | +8.072 |
regardless | +8.061 |
nevertheless | +7.905 |
Neg logit contributions | |
nation | -4.483 |
country | -4.475 |
majority | -4.464 |
oret | -4.389 |
ses | -4.234 |
Token | sun |
Token ID | 4252 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
majority | +24.806 |
country | +24.427 |
inner | +24.076 |
nation | +24.008 |
oret | +23.612 |
Neg logit contributions | |
besides | -14.325 |
nonetheless | -13.772 |
because | -13.684 |
nevertheless | -13.402 |
regardless | -13.202 |
Token | and |
Token ID | 290 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
majority | +5.872 |
country | +5.866 |
nation | +5.842 |
inner | +5.669 |
oret | +5.650 |
Neg logit contributions | |
because | -3.640 |
besides | -3.621 |
nonetheless | -3.477 |
regardless | -3.413 |
nevertheless | -3.358 |
Token | the |
Token ID | 262 |
Feature activation | -3.42e+01 |
Pos logit contributions | |
majority | +20.949 |
country | +20.788 |
inner | +20.588 |
nation | +20.475 |
largest | +19.926 |
Neg logit contributions | |
besides | -11.788 |
because | -11.608 |
nonetheless | -11.582 |
nevertheless | -11.195 |
regardless | -11.070 |
Token | moon |
Token ID | 8824 |
Feature activation | -3.64e-01 |
Pos logit contributions | |
majority | +35.433 |
inner | +35.278 |
country | +34.496 |
largest | +34.163 |
nation | +33.801 |
Neg logit contributions | |
nonetheless | -15.373 |
besides | -15.361 |
because | -14.912 |
nevertheless | -14.911 |
regardless | -14.689 |
Token | are |
Token ID | 389 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
majority | +0.434 |
country | +0.434 |
nation | +0.432 |
oret | +0.418 |
inner | +0.418 |
Neg logit contributions | |
because | -0.323 |
besides | -0.320 |
nonetheless | -0.310 |
regardless | -0.303 |
nevertheless | -0.300 |
Token | tug |
Token ID | 27762 |
Feature activation | -8.35e-01 |
Pos logit contributions | |
because | +1.031 |
besides | +1.021 |
nonetheless | +0.991 |
regardless | +0.970 |
nevertheless | +0.964 |
Neg logit contributions | |
majority | -1.102 |
country | -1.102 |
nation | -1.099 |
oret | -1.063 |
inner | -1.058 |
Token | ging |
Token ID | 2667 |
Feature activation | +6.93e+00 |
Pos logit contributions | |
majority | +0.581 |
country | +0.580 |
nation | +0.577 |
oret | +0.557 |
inner | +0.546 |
Neg logit contributions | |
because | -1.165 |
besides | -1.147 |
nonetheless | -1.126 |
regardless | -1.109 |
nevertheless | -1.101 |
Token | on |
Token ID | 319 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
because | +7.583 |
besides | +7.410 |
nonetheless | +7.248 |
regardless | +7.057 |
nevertheless | +7.030 |
Neg logit contributions | |
majority | -6.651 |
country | -6.591 |
nation | -6.589 |
oret | -6.564 |
inner | -6.260 |
Token | of |
Token ID | 286 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
country | +9.320 |
majority | +9.280 |
nation | +9.261 |
inner | +8.907 |
oret | +8.833 |
Neg logit contributions | |
besides | -4.440 |
because | -4.332 |
nonetheless | -4.225 |
regardless | -4.057 |
nevertheless | -4.034 |
Token | Bulgaria |
Token ID | 27902 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
majority | +13.821 |
country | +13.702 |
nation | +13.623 |
inner | +13.107 |
largest | +12.887 |
Neg logit contributions | |
besides | -10.203 |
because | -10.050 |
nonetheless | -9.882 |
regardless | -9.625 |
nevertheless | -9.518 |
Token | and |
Token ID | 290 |
Feature activation | -5.90e+00 |
Pos logit contributions | |
country | +6.252 |
majority | +6.239 |
nation | +6.231 |
inner | +6.031 |
oret | +5.994 |
Neg logit contributions | |
besides | -2.169 |
because | -2.132 |
nonetheless | -2.060 |
regardless | -1.978 |
nevertheless | -1.939 |
Token | Romania |
Token ID | 23356 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
country | +6.753 |
majority | +6.751 |
nation | +6.721 |
inner | +6.473 |
oret | +6.359 |
Neg logit contributions | |
because | -5.354 |
besides | -5.329 |
nonetheless | -5.190 |
regardless | -5.065 |
nevertheless | -5.022 |
Token | to |
Token ID | 284 |
Feature activation | -1.60e+01 |
Pos logit contributions | |
because | +1.230 |
besides | +1.217 |
nonetheless | +1.157 |
regardless | +1.117 |
nevertheless | +1.102 |
Neg logit contributions | |
majority | -3.049 |
country | -3.048 |
nation | -3.039 |
oret | -2.959 |
inner | -2.957 |
Token | the |
Token ID | 262 |
Feature activation | -3.33e+01 |
Pos logit contributions | |
majority | +18.289 |
country | +18.027 |
nation | +17.915 |
inner | +17.461 |
largest | +17.083 |
Neg logit contributions | |
besides | -12.580 |
because | -12.361 |
nonetheless | -12.277 |
regardless | -11.820 |
nevertheless | -11.743 |
Token | Union |
Token ID | 4479 |
Feature activation | -6.01e+00 |
Pos logit contributions | |
country | +32.631 |
majority | +32.344 |
nation | +31.970 |
largest | +31.088 |
main | +30.963 |
Neg logit contributions | |
besides | -18.954 |
nonetheless | -18.066 |
because | -17.678 |
nevertheless | -17.436 |
regardless | -17.367 |
Token | in |
Token ID | 287 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
country | +8.600 |
nation | +8.563 |
majority | +8.556 |
inner | +8.245 |
oret | +8.193 |
Neg logit contributions | |
besides | -3.656 |
because | -3.562 |
nonetheless | -3.481 |
regardless | -3.351 |
nevertheless | -3.305 |
Token | 2007 |
Token ID | 4343 |
Feature activation | +8.35e+00 |
Pos logit contributions | |
majority | +10.977 |
country | +10.907 |
nation | +10.770 |
inner | +10.397 |
oret | +10.177 |
Neg logit contributions | |
besides | -10.830 |
because | -10.486 |
nonetheless | -10.433 |
regardless | -10.212 |
nevertheless | -10.105 |
Token | damaged |
Token ID | 9694 |
Feature activation | +2.88e+00 |
Pos logit contributions | |
because | +9.392 |
besides | +9.115 |
nonetheless | +8.954 |
regardless | +8.768 |
nevertheless | +8.766 |
Neg logit contributions | |
country | -7.696 |
nation | -7.691 |
majority | -7.661 |
oret | -7.493 |
inner | -7.405 |
Token | the |
Token ID | 262 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
because | +3.208 |
besides | +3.131 |
nonetheless | +3.068 |
regardless | +3.000 |
nevertheless | +2.998 |
Neg logit contributions | |
majority | -2.762 |
country | -2.739 |
nation | -2.732 |
oret | -2.732 |
inner | -2.640 |
Token | connection |
Token ID | 4637 |
Feature activation | +6.09e+00 |
Pos logit contributions | |
country | +28.101 |
nation | +27.884 |
majority | +27.658 |
inner | +26.744 |
primary | +26.182 |
Neg logit contributions | |
besides | -15.883 |
nonetheless | -15.354 |
because | -15.151 |
nevertheless | -14.812 |
regardless | -14.663 |
Token | between |
Token ID | 1022 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
because | +4.633 |
besides | +4.530 |
nonetheless | +4.289 |
regardless | +4.212 |
nevertheless | +4.115 |
Neg logit contributions | |
majority | -7.889 |
nation | -7.815 |
country | -7.807 |
oret | -7.764 |
inner | -7.635 |
Token | Russian |
Token ID | 3394 |
Feature activation | -2.60e+01 |
Pos logit contributions | |
country | +11.867 |
majority | +11.793 |
nation | +11.772 |
inner | +11.409 |
oret | +11.173 |
Neg logit contributions | |
besides | -9.173 |
because | -9.156 |
nonetheless | -8.930 |
regardless | -8.690 |
nevertheless | -8.642 |
Token | hackers |
Token ID | 17110 |
Feature activation | +9.06e-01 |
Pos logit contributions | |
country | +27.553 |
nation | +27.338 |
majority | +27.005 |
inner | +26.144 |
group | +25.605 |
Neg logit contributions | |
besides | -15.607 |
because | -15.218 |
nonetheless | -15.139 |
nevertheless | -14.537 |
regardless | -14.487 |
Token | and |
Token ID | 290 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
because | +0.639 |
besides | +0.627 |
nonetheless | +0.597 |
regardless | +0.581 |
nevertheless | +0.574 |
Neg logit contributions | |
majority | -1.252 |
country | -1.248 |
nation | -1.246 |
oret | -1.223 |
inner | -1.211 |
Token | the |
Token ID | 262 |
Feature activation | -3.26e+01 |
Pos logit contributions | |
country | +14.145 |
majority | +14.068 |
nation | +14.016 |
inner | +13.657 |
largest | +13.278 |
Neg logit contributions | |
besides | -9.564 |
because | -9.460 |
nonetheless | -9.269 |
regardless | -8.965 |
nevertheless | -8.923 |
Token | DNC |
Token ID | 17824 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
country | +31.448 |
nation | +31.188 |
majority | +30.837 |
inner | +30.453 |
primary | +29.910 |
Neg logit contributions | |
besides | -19.793 |
nonetheless | -18.780 |
because | -18.780 |
regardless | -18.171 |
nevertheless | -17.993 |
Token | leak |
Token ID | 13044 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
country | +11.626 |
majority | +11.588 |
nation | +11.586 |
inner | +11.172 |
oret | +11.001 |
Neg logit contributions | |
because | -8.874 |
besides | -8.861 |
nonetheless | -8.604 |
regardless | -8.383 |
nevertheless | -8.309 |
Token | isn |
Token ID | 2125 |
Feature activation | +8.72e+00 |
Pos logit contributions | |
because | +13.337 |
besides | +12.979 |
nonetheless | +12.606 |
regardless | +12.420 |
nevertheless | +12.347 |
Neg logit contributions | |
majority | -9.438 |
oret | -9.264 |
country | -9.248 |
nation | -9.188 |
inner | -8.986 |
Token | 't |
Token ID | 470 |
Feature activation | +8.63e+00 |
Pos logit contributions | |
because | +7.340 |
besides | +7.183 |
nonetheless | +6.899 |
regardless | +6.758 |
nevertheless | +6.670 |
Neg logit contributions | |
country | -10.757 |
majority | -10.755 |
nation | -10.714 |
inner | -10.418 |
oret | -10.367 |
Token | a |
Token ID | 257 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
because | +12.008 |
besides | +11.642 |
nonetheless | +11.310 |
regardless | +11.279 |
nevertheless | +11.084 |
Neg logit contributions | |
oret | -5.529 |
nation | -5.471 |
majority | -5.468 |
country | -5.427 |
ses | -5.257 |
Token | just |
Token ID | 655 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
country | +2.481 |
majority | +2.479 |
nation | +2.474 |
oret | +2.415 |
inner | +2.406 |
Neg logit contributions | |
because | -1.189 |
besides | -1.169 |
nonetheless | -1.118 |
regardless | -1.085 |
nevertheless | -1.070 |
Token | a |
Token ID | 257 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
country | +1.739 |
majority | +1.737 |
nation | +1.733 |
oret | +1.684 |
inner | +1.675 |
Neg logit contributions | |
because | -1.298 |
besides | -1.280 |
nonetheless | -1.234 |
regardless | -1.209 |
nevertheless | -1.194 |
Token | point |
Token ID | 966 |
Feature activation | +5.95e+00 |
Pos logit contributions | |
majority | +17.598 |
country | +17.344 |
nation | +17.288 |
trio | +16.628 |
inner | +16.412 |
Neg logit contributions | |
besides | -12.868 |
because | -12.631 |
nonetheless | -12.276 |
regardless | -12.088 |
nevertheless | -11.980 |
Token | to |
Token ID | 284 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
because | +6.108 |
besides | +5.995 |
nonetheless | +5.819 |
regardless | +5.737 |
nevertheless | +5.644 |
Neg logit contributions | |
country | -6.179 |
nation | -6.141 |
majority | -6.133 |
oret | -6.016 |
inner | -5.963 |
Token | clinch |
Token ID | 45963 |
Feature activation | -3.96e+00 |
Pos logit contributions | |
majority | +3.870 |
country | +3.855 |
nation | +3.839 |
inner | +3.684 |
oret | +3.634 |
Neg logit contributions | |
besides | -5.231 |
because | -5.225 |
nonetheless | -5.081 |
regardless | -4.994 |
nevertheless | -4.970 |
Token | the |
Token ID | 262 |
Feature activation | -3.26e+01 |
Pos logit contributions | |
majority | +5.155 |
country | +5.147 |
nation | +5.130 |
inner | +4.973 |
oret | +4.965 |
Neg logit contributions | |
because | -3.051 |
besides | -3.028 |
nonetheless | -2.915 |
regardless | -2.826 |
nevertheless | -2.815 |
Token | President |
Token ID | 1992 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
majority | +33.636 |
nation | +33.190 |
country | +32.995 |
remainder | +31.812 |
largest | +31.718 |
Neg logit contributions | |
besides | -16.422 |
because | -15.610 |
nonetheless | -15.530 |
nevertheless | -15.062 |
regardless | -14.376 |
Token | � |
Token ID | 447 |
Feature activation | -1.80e+01 |
Pos logit contributions | |
majority | +15.208 |
nation | +15.164 |
country | +15.135 |
oret | +14.587 |
inner | +14.498 |
Neg logit contributions | |
besides | -7.910 |
because | -7.796 |
nonetheless | -7.623 |
nevertheless | -7.348 |
regardless | -7.219 |
Token | � |
Token ID | 247 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
majority | +12.655 |
nation | +12.251 |
country | +12.038 |
inner | +11.599 |
primary | +11.213 |
Neg logit contributions | |
besides | -20.045 |
because | -19.647 |
nonetheless | -19.599 |
nevertheless | -19.505 |
regardless | -19.191 |
Token | s |
Token ID | 82 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
majority | +15.191 |
country | +14.892 |
nation | +14.858 |
oret | +14.296 |
inner | +14.149 |
Neg logit contributions | |
besides | -12.177 |
because | -12.067 |
nonetheless | -11.876 |
nevertheless | -11.452 |
regardless | -11.426 |
Token | Trophy |
Token ID | 25640 |
Feature activation | +3.57e+00 |
Pos logit contributions | |
majority | +25.060 |
nation | +24.793 |
country | +24.791 |
trio | +23.750 |
largest | +23.736 |
Neg logit contributions | |
besides | -11.915 |
because | -11.499 |
nonetheless | -11.471 |
nevertheless | -11.052 |
regardless | -10.671 |
Token | - |
Token ID | 12 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
country | +9.448 |
majority | +9.427 |
nation | +9.412 |
inner | +9.114 |
oret | +9.076 |
Neg logit contributions | |
besides | -4.987 |
because | -4.983 |
nonetheless | -4.790 |
regardless | -4.643 |
nevertheless | -4.616 |
Token | city |
Token ID | 19205 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
country | +10.441 |
nation | +10.413 |
majority | +10.403 |
inner | +10.003 |
oret | +9.989 |
Neg logit contributions | |
besides | -10.503 |
because | -10.343 |
nonetheless | -10.104 |
regardless | -9.933 |
nevertheless | -9.918 |
Token | of |
Token ID | 286 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
majority | +13.652 |
country | +13.595 |
nation | +13.543 |
inner | +13.148 |
oret | +13.036 |
Neg logit contributions | |
besides | -7.298 |
because | -7.197 |
nonetheless | -6.947 |
regardless | -6.763 |
nevertheless | -6.721 |
Token | Ariel |
Token ID | 33364 |
Feature activation | -7.60e+00 |
Pos logit contributions | |
majority | +18.046 |
nation | +17.843 |
country | +17.836 |
inner | +17.243 |
oret | +17.052 |
Neg logit contributions | |
besides | -13.152 |
nonetheless | -12.656 |
because | -12.487 |
nevertheless | -12.370 |
regardless | -12.230 |
Token | and |
Token ID | 290 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
majority | +10.815 |
country | +10.793 |
nation | +10.758 |
oret | +10.416 |
inner | +10.386 |
Neg logit contributions | |
because | -4.601 |
besides | -4.592 |
nonetheless | -4.449 |
regardless | -4.261 |
nevertheless | -4.251 |
Token | the |
Token ID | 262 |
Feature activation | -3.24e+01 |
Pos logit contributions | |
majority | +14.408 |
country | +14.349 |
nation | +14.251 |
inner | +13.853 |
largest | +13.648 |
Neg logit contributions | |
besides | -8.679 |
because | -8.570 |
nonetheless | -8.389 |
regardless | -8.152 |
nevertheless | -8.147 |
Token | Green |
Token ID | 3469 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
majority | +35.039 |
country | +34.658 |
nation | +34.169 |
largest | +33.568 |
city | +33.507 |
Neg logit contributions | |
besides | -15.176 |
because | -14.045 |
regardless | -13.711 |
nonetheless | -13.628 |
nevertheless | -13.392 |
Token | line |
Token ID | 1627 |
Feature activation | -3.99e-01 |
Pos logit contributions | |
country | +13.860 |
majority | +13.740 |
nation | +13.501 |
inner | +13.010 |
oret | +12.950 |
Neg logit contributions | |
besides | -15.360 |
nonetheless | -14.939 |
because | -14.764 |
nevertheless | -14.676 |
regardless | -14.496 |
Token | is |
Token ID | 318 |
Feature activation | +2.97e+00 |
Pos logit contributions | |
majority | +0.532 |
country | +0.531 |
nation | +0.530 |
oret | +0.516 |
inner | +0.514 |
Neg logit contributions | |
because | -0.301 |
besides | -0.297 |
nonetheless | -0.285 |
regardless | -0.277 |
nevertheless | -0.275 |
Token | a |
Token ID | 257 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
because | +3.080 |
besides | +3.031 |
nonetheless | +2.957 |
nevertheless | +2.875 |
regardless | +2.874 |
Neg logit contributions | |
majority | -3.085 |
country | -3.082 |
nation | -3.079 |
oret | -2.979 |
inner | -2.961 |
Token | new |
Token ID | 649 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
country | +16.522 |
majority | +16.447 |
nation | +16.404 |
inner | +15.630 |
trio | +15.535 |
Neg logit contributions | |
besides | -11.587 |
because | -11.366 |
nonetheless | -11.028 |
regardless | -10.805 |
nevertheless | -10.772 |
Token | a |
Token ID | 257 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
because | +6.995 |
besides | +6.785 |
nonetheless | +6.537 |
regardless | +6.531 |
nevertheless | +6.335 |
Neg logit contributions | |
majority | -6.876 |
nation | -6.802 |
country | -6.783 |
oret | -6.662 |
inner | -6.539 |
Token | video |
Token ID | 2008 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
majority | +19.458 |
country | +19.451 |
nation | +19.241 |
trio | +18.551 |
inner | +18.353 |
Neg logit contributions | |
besides | -12.025 |
nonetheless | -11.588 |
because | -11.504 |
nevertheless | -11.350 |
regardless | -11.025 |
Token | with |
Token ID | 351 |
Feature activation | -3.47e+00 |
Pos logit contributions | |
because | +3.034 |
besides | +2.981 |
nonetheless | +2.878 |
regardless | +2.834 |
nevertheless | +2.786 |
Neg logit contributions | |
majority | -3.632 |
country | -3.624 |
nation | -3.614 |
oret | -3.528 |
inner | -3.497 |
Token | # |
Token ID | 1303 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
country | +4.255 |
majority | +4.255 |
nation | +4.239 |
oret | +4.109 |
inner | +4.104 |
Neg logit contributions | |
because | -2.968 |
besides | -2.944 |
nonetheless | -2.843 |
regardless | -2.772 |
nevertheless | -2.753 |
Token | Ask |
Token ID | 25214 |
Feature activation | -8.59e+00 |
Pos logit contributions | |
country | +11.623 |
nation | +11.484 |
majority | +11.434 |
oret | +11.196 |
ses | +11.020 |
Neg logit contributions | |
besides | -11.811 |
because | -11.709 |
nonetheless | -11.558 |
regardless | -11.314 |
nevertheless | -11.289 |
Token | The |
Token ID | 464 |
Feature activation | -3.21e+01 |
Pos logit contributions | |
country | +11.006 |
majority | +10.972 |
nation | +10.952 |
oret | +10.684 |
inner | +10.612 |
Neg logit contributions | |
because | -6.345 |
besides | -6.342 |
nonetheless | -6.143 |
regardless | -5.969 |
nevertheless | -5.925 |
Token | D |
Token ID | 35 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
country | +24.977 |
nation | +24.954 |
majority | +24.494 |
oret | +24.305 |
ses | +23.362 |
Neg logit contributions | |
nonetheless | -21.602 |
besides | -21.526 |
nevertheless | -21.346 |
because | -21.235 |
regardless | -20.631 |
Token | ubs |
Token ID | 23161 |
Feature activation | +5.52e+00 |
Pos logit contributions | |
oret | +15.016 |
country | +13.599 |
majority | +13.276 |
nation | +13.266 |
ses | +13.182 |
Neg logit contributions | |
nonetheless | -22.613 |
nevertheless | -22.392 |
besides | -22.121 |
insofar | -21.498 |
furthermore | -21.461 |
Token | , |
Token ID | 11 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
because | +5.956 |
besides | +5.807 |
nonetheless | +5.611 |
regardless | +5.585 |
nevertheless | +5.445 |
Neg logit contributions | |
majority | -5.464 |
country | -5.397 |
nation | -5.381 |
oret | -5.283 |
inner | -5.198 |
Token | then |
Token ID | 788 |
Feature activation | +8.73e+00 |
Pos logit contributions | |
because | +14.253 |
besides | +13.662 |
regardless | +13.395 |
nonetheless | +13.106 |
unless | +13.074 |
Neg logit contributions | |
majority | -8.544 |
nation | -8.372 |
country | -8.324 |
oret | -8.319 |
inner | -8.086 |
Token | tune |
Token ID | 14009 |
Feature activation | +6.34e+00 |
Pos logit contributions | |
because | +11.628 |
besides | +11.363 |
regardless | +11.047 |
nonetheless | +11.018 |
nevertheless | +10.778 |
Neg logit contributions | |
majority | -6.060 |
nation | -5.957 |
country | -5.943 |
oret | -5.919 |
inner | -5.708 |
Token | Muslims |
Token ID | 7045 |
Feature activation | +3.72e+00 |
Pos logit contributions | |
majority | +13.631 |
country | +13.559 |
nation | +13.412 |
inner | +12.998 |
trio | +12.665 |
Neg logit contributions | |
besides | -10.020 |
because | -9.856 |
nonetheless | -9.702 |
regardless | -9.458 |
nevertheless | -9.422 |
Token | by |
Token ID | 416 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
because | +3.118 |
besides | +3.075 |
nonetheless | +2.958 |
regardless | +2.892 |
nevertheless | +2.861 |
Neg logit contributions | |
majority | -4.639 |
country | -4.636 |
nation | -4.624 |
oret | -4.508 |
inner | -4.480 |
Token | Buddh |
Token ID | 20921 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
majority | +12.413 |
country | +12.367 |
nation | +12.222 |
inner | +11.799 |
trio | +11.510 |
Neg logit contributions | |
besides | -9.708 |
because | -9.623 |
nonetheless | -9.445 |
regardless | -9.187 |
nevertheless | -9.166 |
Token | ists |
Token ID | 1023 |
Feature activation | +9.32e+00 |
Pos logit contributions | |
majority | +10.736 |
country | +10.361 |
nation | +10.292 |
oret | +10.087 |
inner | +9.915 |
Neg logit contributions | |
besides | -19.907 |
nonetheless | -19.406 |
because | -19.371 |
regardless | -19.284 |
nevertheless | -19.052 |
Token | near |
Token ID | 1474 |
Feature activation | -9.81e+00 |
Pos logit contributions | |
because | +9.878 |
besides | +9.631 |
nonetheless | +9.308 |
regardless | +9.150 |
nevertheless | +9.073 |
Neg logit contributions | |
majority | -9.114 |
country | -9.089 |
nation | -9.077 |
oret | -9.030 |
inner | -8.712 |
Token | the |
Token ID | 262 |
Feature activation | -3.19e+01 |
Pos logit contributions | |
country | +11.895 |
majority | +11.874 |
nation | +11.778 |
inner | +11.437 |
oret | +11.164 |
Neg logit contributions | |
besides | -8.047 |
because | -7.951 |
nonetheless | -7.800 |
regardless | -7.563 |
nevertheless | -7.543 |
Token | border |
Token ID | 4865 |
Feature activation | -8.71e-01 |
Pos logit contributions | |
country | +34.081 |
nation | +33.241 |
majority | +32.369 |
main | +31.695 |
city | +31.545 |
Neg logit contributions | |
besides | -17.581 |
nonetheless | -16.601 |
because | -16.204 |
regardless | -16.194 |
nevertheless | -15.857 |
Token | with |
Token ID | 351 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
majority | +1.508 |
country | +1.505 |
nation | +1.502 |
oret | +1.476 |
inner | +1.471 |
Neg logit contributions | |
because | -0.310 |
besides | -0.300 |
nonetheless | -0.273 |
regardless | -0.258 |
nevertheless | -0.250 |
Token | Bangladesh |
Token ID | 19483 |
Feature activation | +8.14e+00 |
Pos logit contributions | |
country | +10.530 |
majority | +10.501 |
nation | +10.400 |
inner | +9.878 |
oret | +9.652 |
Neg logit contributions | |
besides | -12.948 |
because | -12.918 |
nonetheless | -12.676 |
regardless | -12.422 |
nevertheless | -12.348 |
Token | , |
Token ID | 11 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
because | +7.728 |
besides | +7.447 |
nonetheless | +7.161 |
regardless | +7.078 |
nevertheless | +6.961 |
Neg logit contributions | |
majority | -8.931 |
nation | -8.838 |
country | -8.832 |
oret | -8.829 |
inner | -8.624 |
Token | our |
Token ID | 674 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
because | +18.056 |
besides | +17.574 |
regardless | +17.130 |
nonetheless | +17.113 |
although | +16.871 |
Neg logit contributions | |
oret | -9.296 |
majority | -9.038 |
nation | -8.943 |
country | -8.865 |
ses | -8.599 |
Token | lines |
Token ID | 3951 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
majority | +1.233 |
country | +1.232 |
nation | +1.228 |
oret | +1.198 |
inner | +1.195 |
Neg logit contributions | |
because | -0.603 |
besides | -0.594 |
nonetheless | -0.568 |
regardless | -0.552 |
nevertheless | -0.545 |
Token | between |
Token ID | 1022 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
because | +10.425 |
besides | +10.067 |
nonetheless | +9.827 |
regardless | +9.666 |
nevertheless | +9.582 |
Neg logit contributions | |
majority | -9.899 |
country | -9.892 |
oret | -9.798 |
nation | -9.780 |
inner | -9.559 |
Token | sovereign |
Token ID | 18901 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
country | +15.974 |
nation | +15.946 |
majority | +15.914 |
inner | +15.215 |
oret | +14.942 |
Neg logit contributions | |
besides | -10.190 |
because | -9.982 |
nonetheless | -9.806 |
nevertheless | -9.493 |
regardless | -9.369 |
Token | Israel |
Token ID | 2692 |
Feature activation | -6.07e+00 |
Pos logit contributions | |
nation | +26.573 |
country | +26.490 |
majority | +26.326 |
inner | +24.861 |
presence | +24.476 |
Neg logit contributions | |
besides | -11.836 |
because | -11.182 |
nonetheless | -11.099 |
nevertheless | -10.693 |
regardless | -10.439 |
Token | and |
Token ID | 290 |
Feature activation | -1.79e+01 |
Pos logit contributions | |
country | +8.302 |
majority | +8.299 |
nation | +8.280 |
inner | +8.008 |
oret | +7.993 |
Neg logit contributions | |
because | -4.184 |
besides | -4.179 |
nonetheless | -4.012 |
regardless | -3.855 |
nevertheless | -3.854 |
Token | the |
Token ID | 262 |
Feature activation | -3.19e+01 |
Pos logit contributions | |
majority | +22.033 |
country | +21.966 |
nation | +21.837 |
inner | +20.864 |
remainder | +20.435 |
Neg logit contributions | |
besides | -11.475 |
because | -11.048 |
nonetheless | -10.942 |
nevertheless | -10.541 |
regardless | -10.326 |
Token | settlements |
Token ID | 18573 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
majority | +34.678 |
country | +34.383 |
nation | +33.982 |
remainder | +32.592 |
inner | +32.338 |
Neg logit contributions | |
besides | -14.807 |
nonetheless | -14.267 |
nevertheless | -13.894 |
because | -13.859 |
regardless | -13.180 |
Token | in |
Token ID | 287 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
country | +2.885 |
majority | +2.884 |
nation | +2.880 |
inner | +2.788 |
oret | +2.784 |
Neg logit contributions | |
because | -1.459 |
besides | -1.454 |
nonetheless | -1.395 |
regardless | -1.349 |
nevertheless | -1.340 |
Token | the |
Token ID | 262 |
Feature activation | -2.95e+01 |
Pos logit contributions | |
majority | +19.499 |
country | +19.435 |
nation | +19.256 |
inner | +18.823 |
oret | +18.402 |
Neg logit contributions | |
besides | -11.545 |
nonetheless | -11.286 |
because | -11.153 |
nevertheless | -10.918 |
regardless | -10.523 |
Token | territories |
Token ID | 16771 |
Feature activation | +3.10e+00 |
Pos logit contributions | |
country | +30.913 |
majority | +30.605 |
nation | +30.163 |
inner | +29.198 |
city | +28.598 |
Neg logit contributions | |
besides | -17.580 |
nonetheless | -17.238 |
nevertheless | -16.906 |
because | -16.438 |
regardless | -15.965 |
Token | ended |
Token ID | 4444 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
because | +2.709 |
besides | +2.667 |
nonetheless | +2.562 |
regardless | +2.519 |
nevertheless | +2.482 |
Neg logit contributions | |
country | -3.728 |
majority | -3.723 |
nation | -3.711 |
oret | -3.621 |
inner | -3.605 |
Token | and |
Token ID | 290 |
Feature activation | +4.95e+00 |
Pos logit contributions | |
because | +21.865 |
besides | +21.464 |
regardless | +20.634 |
nonetheless | +20.379 |
unless | +20.324 |
Neg logit contributions | |
oret | -10.861 |
majority | -10.792 |
country | -10.403 |
nation | -10.396 |
slightest | -10.125 |
Token | even |
Token ID | 772 |
Feature activation | +4.26e+00 |
Pos logit contributions | |
because | +5.977 |
besides | +5.910 |
nonetheless | +5.715 |
regardless | +5.648 |
nevertheless | +5.600 |
Neg logit contributions | |
majority | -4.228 |
country | -4.186 |
nation | -4.185 |
oret | -4.179 |
inner | -4.004 |
Token | " |
Token ID | 366 |
Feature activation | -4.17e+00 |
Pos logit contributions | |
because | +5.030 |
besides | +4.978 |
nonetheless | +4.810 |
regardless | +4.738 |
nevertheless | +4.703 |
Neg logit contributions | |
majority | -3.781 |
country | -3.741 |
nation | -3.739 |
oret | -3.700 |
inner | -3.580 |
Token | to |
Token ID | 1462 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
country | +3.698 |
majority | +3.682 |
nation | +3.677 |
oret | +3.520 |
inner | +3.508 |
Neg logit contributions | |
because | -4.911 |
besides | -4.887 |
nonetheless | -4.778 |
regardless | -4.698 |
nevertheless | -4.659 |
Token | seize |
Token ID | 21031 |
Feature activation | -7.96e+00 |
Pos logit contributions | |
country | +11.711 |
nation | +11.624 |
majority | +11.598 |
inner | +11.246 |
oret | +10.914 |
Neg logit contributions | |
besides | -9.673 |
because | -9.610 |
nonetheless | -9.358 |
regardless | -9.231 |
nevertheless | -8.962 |
Token | the |
Token ID | 262 |
Feature activation | -3.18e+01 |
Pos logit contributions | |
country | +10.185 |
majority | +10.167 |
nation | +10.114 |
inner | +9.833 |
oret | +9.696 |
Neg logit contributions | |
because | -6.013 |
besides | -5.988 |
nonetheless | -5.835 |
regardless | -5.636 |
nevertheless | -5.578 |
Token | Lub |
Token ID | 40753 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
country | +35.058 |
majority | +34.339 |
nation | +34.244 |
city | +33.392 |
inner | +33.140 |
Neg logit contributions | |
nonetheless | -14.076 |
besides | -13.938 |
because | -13.613 |
regardless | -13.502 |
nevertheless | -12.944 |
Token | lin |
Token ID | 2815 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
oret | +16.636 |
majority | +16.563 |
nation | +16.463 |
country | +16.337 |
ses | +16.068 |
Neg logit contributions | |
besides | -17.612 |
nonetheless | -17.275 |
because | -17.203 |
regardless | -16.935 |
nevertheless | -16.648 |
Token | region |
Token ID | 3814 |
Feature activation | +6.98e+00 |
Pos logit contributions | |
country | +24.938 |
nation | +24.533 |
majority | +24.391 |
inner | +23.630 |
city | +23.542 |
Neg logit contributions | |
besides | -10.411 |
nonetheless | -10.347 |
because | -10.228 |
regardless | -9.743 |
nevertheless | -9.710 |
Token | by |
Token ID | 416 |
Feature activation | -8.60e+00 |
Pos logit contributions | |
because | +6.923 |
besides | +6.777 |
nonetheless | +6.522 |
regardless | +6.456 |
nevertheless | +6.364 |
Neg logit contributions | |
majority | -7.327 |
country | -7.271 |
nation | -7.261 |
oret | -7.169 |
inner | -7.008 |
Token | the |
Token ID | 262 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
country | +10.325 |
majority | +10.279 |
nation | +10.250 |
inner | +9.949 |
oret | +9.819 |
Neg logit contributions | |
because | -7.219 |
besides | -7.203 |
nonetheless | -6.975 |
regardless | -6.801 |
nevertheless | -6.724 |
Token | decision |
Token ID | 2551 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
country | +23.232 |
majority | +23.112 |
nation | +22.789 |
trio | +22.005 |
largest | +21.786 |
Neg logit contributions | |
besides | -14.952 |
because | -14.676 |
nonetheless | -14.295 |
regardless | -13.938 |
nevertheless | -13.921 |
Token | to |
Token ID | 284 |
Feature activation | -4.89e+00 |
Pos logit contributions | |
because | +11.200 |
besides | +10.813 |
nonetheless | +10.646 |
nevertheless | +10.404 |
regardless | +10.371 |
Neg logit contributions | |
majority | -10.304 |
country | -10.263 |
nation | -10.244 |
oret | -10.199 |
inner | -10.002 |
Token | drop |
Token ID | 4268 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
country | +5.055 |
majority | +5.024 |
nation | +5.017 |
inner | +4.770 |
oret | +4.725 |
Neg logit contributions | |
besides | -4.985 |
because | -4.962 |
nonetheless | -4.803 |
regardless | -4.753 |
nevertheless | -4.672 |
Token | Russia |
Token ID | 3284 |
Feature activation | -6.05e+00 |
Pos logit contributions | |
majority | +4.025 |
country | +4.023 |
nation | +4.010 |
oret | +3.894 |
inner | +3.882 |
Neg logit contributions | |
because | -2.870 |
besides | -2.840 |
nonetheless | -2.741 |
regardless | -2.679 |
nevertheless | -2.654 |
Token | from |
Token ID | 422 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
majority | +9.406 |
country | +9.370 |
nation | +9.343 |
inner | +9.037 |
trio | +8.985 |
Neg logit contributions | |
besides | -2.895 |
because | -2.862 |
nonetheless | -2.745 |
regardless | -2.597 |
nevertheless | -2.579 |
Token | the |
Token ID | 262 |
Feature activation | -3.18e+01 |
Pos logit contributions | |
majority | +16.852 |
country | +16.728 |
nation | +16.539 |
inner | +16.006 |
group | +15.904 |
Neg logit contributions | |
besides | -11.016 |
because | -10.972 |
nonetheless | -10.737 |
nevertheless | -10.346 |
regardless | -10.344 |
Token | group |
Token ID | 1448 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
group | +32.843 |
country | +32.711 |
majority | +32.656 |
nation | +31.906 |
trio | +31.432 |
Neg logit contributions | |
besides | -16.725 |
nonetheless | -16.095 |
because | -15.713 |
nevertheless | -15.401 |
regardless | -15.136 |
Token | was |
Token ID | 373 |
Feature activation | +7.37e+00 |
Pos logit contributions | |
because | +0.130 |
besides | +0.129 |
nonetheless | +0.124 |
regardless | +0.120 |
nevertheless | +0.119 |
Neg logit contributions | |
majority | -0.217 |
country | -0.217 |
nation | -0.216 |
oret | -0.210 |
inner | -0.210 |
Token | taken |
Token ID | 2077 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
because | +8.498 |
besides | +8.266 |
nonetheless | +8.178 |
nevertheless | +8.005 |
regardless | +7.911 |
Neg logit contributions | |
majority | -6.582 |
nation | -6.572 |
country | -6.551 |
oret | -6.477 |
inner | -6.348 |
Token | by |
Token ID | 416 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
because | +13.584 |
besides | +12.935 |
nonetheless | +12.724 |
regardless | +12.565 |
nevertheless | +12.390 |
Neg logit contributions | |
majority | -9.935 |
country | -9.928 |
nation | -9.898 |
oret | -9.761 |
inner | -9.623 |
Token | its |
Token ID | 663 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
majority | +3.575 |
country | +3.574 |
nation | +3.562 |
oret | +3.451 |
inner | +3.437 |
Neg logit contributions | |
because | -3.227 |
besides | -3.196 |
nonetheless | -3.100 |
regardless | -3.038 |
nevertheless | -3.014 |
Token | of |
Token ID | 286 |
Feature activation | -8.45e+00 |
Pos logit contributions | |
because | +0.450 |
besides | +0.441 |
nonetheless | +0.429 |
regardless | +0.418 |
nevertheless | +0.414 |
Neg logit contributions | |
majority | -0.580 |
country | -0.579 |
nation | -0.578 |
oret | -0.562 |
inner | -0.559 |
Token | wider |
Token ID | 10595 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
majority | +11.158 |
country | +11.119 |
nation | +11.078 |
inner | +10.815 |
oret | +10.683 |
Neg logit contributions | |
because | -6.120 |
besides | -6.119 |
nonetheless | -5.885 |
nevertheless | -5.707 |
regardless | -5.700 |
Token | approaches |
Token ID | 10581 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
country | +16.377 |
majority | +16.287 |
nation | +16.145 |
inner | +15.840 |
oret | +15.397 |
Neg logit contributions | |
besides | -10.446 |
because | -10.271 |
nonetheless | -9.989 |
nevertheless | -9.836 |
regardless | -9.785 |
Token | running |
Token ID | 2491 |
Feature activation | -7.68e-01 |
Pos logit contributions | |
because | +11.629 |
besides | +11.468 |
nonetheless | +11.047 |
regardless | +10.842 |
nevertheless | +10.738 |
Neg logit contributions | |
majority | -9.996 |
country | -9.926 |
nation | -9.894 |
oret | -9.665 |
inner | -9.513 |
Token | under |
Token ID | 739 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
majority | +1.100 |
country | +1.100 |
nation | +1.096 |
oret | +1.067 |
inner | +1.067 |
Neg logit contributions | |
because | -0.499 |
besides | -0.493 |
nonetheless | -0.471 |
regardless | -0.455 |
nevertheless | -0.451 |
Token | the |
Token ID | 262 |
Feature activation | -3.17e+01 |
Pos logit contributions | |
country | +14.942 |
majority | +14.882 |
nation | +14.764 |
inner | +14.432 |
oret | +14.192 |
Neg logit contributions | |
besides | -8.806 |
because | -8.772 |
nonetheless | -8.522 |
nevertheless | -8.273 |
regardless | -8.221 |
Token | bridge |
Token ID | 7696 |
Feature activation | +3.13e+00 |
Pos logit contributions | |
majority | +33.427 |
country | +33.359 |
nation | +32.932 |
main | +32.520 |
inner | +32.479 |
Neg logit contributions | |
besides | -15.241 |
because | -14.618 |
nonetheless | -14.403 |
nevertheless | -14.172 |
regardless | -13.941 |
Token | would |
Token ID | 561 |
Feature activation | +7.76e+00 |
Pos logit contributions | |
because | +2.616 |
besides | +2.578 |
nonetheless | +2.485 |
regardless | +2.424 |
nevertheless | +2.402 |
Neg logit contributions | |
majority | -3.900 |
country | -3.894 |
nation | -3.882 |
oret | -3.783 |
inner | -3.766 |
Token | allow |
Token ID | 1249 |
Feature activation | +2.44e+00 |
Pos logit contributions | |
because | +9.241 |
besides | +9.100 |
nonetheless | +8.971 |
nevertheless | +8.769 |
regardless | +8.697 |
Neg logit contributions | |
majority | -6.618 |
country | -6.604 |
nation | -6.552 |
oret | -6.363 |
inner | -6.278 |
Token | the |
Token ID | 262 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
because | +2.964 |
besides | +2.913 |
nonetheless | +2.843 |
regardless | +2.800 |
nevertheless | +2.768 |
Neg logit contributions | |
nation | -2.094 |
country | -2.091 |
majority | -2.086 |
oret | -2.050 |
trio | -1.971 |
Token | Park |
Token ID | 3250 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
majority | +26.234 |
country | +25.882 |
nation | +25.681 |
inner | +25.108 |
city | +24.874 |
Neg logit contributions | |
besides | -14.010 |
because | -13.651 |
nonetheless | -13.270 |
nevertheless | -13.076 |
regardless | -12.917 |
Token | speak |
Token ID | 2740 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
because | +2.099 |
besides | +2.084 |
nonetheless | +2.030 |
regardless | +1.995 |
nevertheless | +1.982 |
Neg logit contributions | |
majority | -1.672 |
country | -1.671 |
nation | -1.664 |
oret | -1.599 |
inner | -1.594 |
Token | about |
Token ID | 546 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
because | +11.984 |
besides | +11.649 |
nonetheless | +11.182 |
regardless | +11.135 |
unless | +10.966 |
Neg logit contributions | |
majority | -9.313 |
nation | -9.281 |
country | -9.278 |
oret | -9.134 |
inner | -9.004 |
Token | how |
Token ID | 703 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
majority | +0.128 |
country | +0.127 |
nation | +0.127 |
oret | +0.124 |
inner | +0.123 |
Neg logit contributions | |
because | -0.091 |
besides | -0.089 |
nonetheless | -0.086 |
regardless | -0.084 |
nevertheless | -0.083 |
Token | anybody |
Token ID | 9599 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
because | +0.290 |
besides | +0.287 |
nonetheless | +0.278 |
regardless | +0.273 |
nevertheless | +0.270 |
Neg logit contributions | |
majority | -0.303 |
country | -0.303 |
nation | -0.303 |
oret | -0.293 |
inner | -0.291 |
Token | on |
Token ID | 319 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
because | +0.090 |
besides | +0.089 |
nonetheless | +0.086 |
regardless | +0.083 |
nevertheless | +0.083 |
Neg logit contributions | |
country | -0.171 |
majority | -0.171 |
nation | -0.170 |
inner | -0.165 |
oret | -0.165 |
Token | the |
Token ID | 262 |
Feature activation | -3.14e+01 |
Pos logit contributions | |
country | +15.203 |
majority | +15.166 |
nation | +15.011 |
inner | +14.705 |
oret | +14.369 |
Neg logit contributions | |
besides | -9.262 |
because | -9.224 |
nonetheless | -9.108 |
nevertheless | -8.772 |
regardless | -8.613 |
Token | left |
Token ID | 1364 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
majority | +31.605 |
country | +31.600 |
nation | +31.124 |
inner | +30.727 |
main | +29.919 |
Neg logit contributions | |
besides | -17.626 |
nonetheless | -17.498 |
nevertheless | -17.002 |
because | -16.854 |
regardless | -16.153 |
Token | is |
Token ID | 318 |
Feature activation | +2.54e+00 |
Pos logit contributions | |
because | +2.265 |
besides | +2.244 |
nonetheless | +2.155 |
regardless | +2.115 |
nevertheless | +2.089 |
Neg logit contributions | |
majority | -3.052 |
country | -3.048 |
nation | -3.039 |
oret | -2.957 |
inner | -2.940 |
Token | sexist |
Token ID | 24651 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
because | +2.953 |
besides | +2.920 |
nonetheless | +2.838 |
regardless | +2.797 |
nevertheless | +2.773 |
Neg logit contributions | |
country | -2.335 |
nation | -2.333 |
majority | -2.333 |
oret | -2.254 |
inner | -2.233 |
Token | or |
Token ID | 393 |
Feature activation | -8.54e+00 |
Pos logit contributions | |
because | +9.594 |
besides | +9.176 |
regardless | +8.825 |
nonetheless | +8.783 |
unless | +8.617 |
Neg logit contributions | |
majority | -10.826 |
nation | -10.795 |
country | -10.790 |
oret | -10.633 |
inner | -10.539 |
Token | racist |
Token ID | 9811 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
majority | +8.624 |
country | +8.612 |
nation | +8.554 |
inner | +8.192 |
oret | +8.064 |
Neg logit contributions | |
besides | -8.516 |
because | -8.396 |
nonetheless | -8.330 |
nevertheless | -8.129 |
regardless | -8.024 |
Token | doctrine |
Token ID | 13115 |
Feature activation | +6.11e+00 |
Pos logit contributions | |
country | +28.101 |
nation | +27.801 |
majority | +27.533 |
group | +26.163 |
trio | +26.063 |
Neg logit contributions | |
besides | -13.687 |
nonetheless | -13.017 |
because | -12.819 |
nevertheless | -12.650 |
regardless | -12.398 |
Token | which |
Token ID | 543 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
because | +5.809 |
besides | +5.700 |
nonetheless | +5.502 |
regardless | +5.386 |
nevertheless | +5.335 |
Neg logit contributions | |
nation | -6.681 |
country | -6.678 |
majority | -6.660 |
oret | -6.616 |
inner | -6.457 |
Token | mixes |
Token ID | 33237 |
Feature activation | -7.27e+00 |
Pos logit contributions | |
majority | +1.877 |
country | +1.875 |
nation | +1.868 |
inner | +1.796 |
oret | +1.796 |
Neg logit contributions | |
because | -1.900 |
besides | -1.887 |
nonetheless | -1.832 |
regardless | -1.799 |
nevertheless | -1.784 |
Token | Marxism |
Token ID | 30634 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
country | +7.148 |
majority | +7.143 |
nation | +7.118 |
inner | +6.824 |
oret | +6.803 |
Neg logit contributions | |
because | -7.929 |
besides | -7.887 |
nonetheless | -7.678 |
regardless | -7.525 |
nevertheless | -7.490 |
Token | with |
Token ID | 351 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
country | +4.069 |
majority | +4.063 |
nation | +4.043 |
inner | +3.950 |
oret | +3.911 |
Neg logit contributions | |
besides | -0.672 |
because | -0.649 |
nonetheless | -0.624 |
nevertheless | -0.573 |
regardless | -0.548 |
Token | the |
Token ID | 262 |
Feature activation | -3.14e+01 |
Pos logit contributions | |
country | +14.359 |
majority | +14.290 |
nation | +14.255 |
inner | +13.780 |
oret | +13.541 |
Neg logit contributions | |
besides | -9.332 |
because | -9.286 |
nonetheless | -8.965 |
regardless | -8.737 |
nevertheless | -8.673 |
Token | worship |
Token ID | 11892 |
Feature activation | -4.18e+00 |
Pos logit contributions | |
country | +33.300 |
nation | +32.997 |
majority | +32.664 |
inner | +30.918 |
presence | +30.810 |
Neg logit contributions | |
besides | -17.179 |
because | -16.412 |
nonetheless | -15.825 |
unless | -15.778 |
regardless | -15.768 |
Token | of |
Token ID | 286 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
country | +5.280 |
nation | +5.275 |
majority | +5.248 |
inner | +5.036 |
oret | +4.946 |
Neg logit contributions | |
besides | -3.207 |
nonetheless | -3.134 |
because | -3.126 |
nevertheless | -3.067 |
regardless | -3.009 |
Token | North |
Token ID | 2258 |
Feature activation | -1.95e+01 |
Pos logit contributions | |
country | +14.976 |
nation | +14.840 |
majority | +14.811 |
inner | +14.211 |
oret | +13.718 |
Neg logit contributions | |
besides | -12.738 |
because | -12.571 |
nonetheless | -12.342 |
nevertheless | -11.995 |
regardless | -11.945 |
Token | Korea |
Token ID | 4969 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
country | +18.254 |
nation | +17.785 |
majority | +17.405 |
inner | +16.964 |
family | +16.515 |
Neg logit contributions | |
besides | -15.868 |
nonetheless | -15.567 |
nevertheless | -15.490 |
regardless | -15.191 |
because | -14.890 |
Token | 's |
Token ID | 338 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
majority | +2.084 |
country | +2.079 |
nation | +2.072 |
oret | +2.018 |
inner | +2.004 |
Neg logit contributions | |
because | -1.720 |
besides | -1.699 |
nonetheless | -1.642 |
regardless | -1.612 |
nevertheless | -1.595 |
Token | don |
Token ID | 836 |
Feature activation | +3.98e+00 |
Pos logit contributions | |
majority | +1.648 |
country | +1.645 |
nation | +1.641 |
oret | +1.587 |
inner | +1.587 |
Neg logit contributions | |
because | -1.160 |
besides | -1.153 |
nonetheless | -1.114 |
regardless | -1.087 |
nevertheless | -1.078 |
Token | � |
Token ID | 447 |
Feature activation | -4.38e+00 |
Pos logit contributions | |
because | +3.149 |
besides | +3.138 |
nonetheless | +3.030 |
regardless | +2.945 |
nevertheless | +2.925 |
Neg logit contributions | |
majority | -5.148 |
country | -5.137 |
nation | -5.127 |
oret | -4.983 |
inner | -4.958 |
Token | � |
Token ID | 247 |
Feature activation | -7.82e-01 |
Pos logit contributions | |
majority | +2.964 |
nation | +2.925 |
country | +2.916 |
inner | +2.741 |
oret | +2.731 |
Neg logit contributions | |
because | -6.092 |
besides | -6.074 |
nonetheless | -5.971 |
regardless | -5.878 |
nevertheless | -5.861 |
Token | t |
Token ID | 83 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
country | +0.630 |
majority | +0.628 |
nation | +0.627 |
oret | +0.599 |
inner | +0.597 |
Neg logit contributions | |
because | -1.000 |
besides | -0.991 |
nonetheless | -0.968 |
regardless | -0.954 |
nevertheless | -0.948 |
Token | enter |
Token ID | 3802 |
Feature activation | -4.69e+00 |
Pos logit contributions | |
because | +1.259 |
besides | +1.252 |
nonetheless | +1.218 |
regardless | +1.194 |
nevertheless | +1.187 |
Neg logit contributions | |
majority | -1.190 |
country | -1.189 |
nation | -1.184 |
oret | -1.140 |
inner | -1.139 |
Token | the |
Token ID | 262 |
Feature activation | -3.14e+01 |
Pos logit contributions | |
country | +6.122 |
majority | +6.120 |
nation | +6.095 |
inner | +5.923 |
oret | +5.888 |
Neg logit contributions | |
because | -3.548 |
besides | -3.542 |
nonetheless | -3.414 |
regardless | -3.310 |
nevertheless | -3.296 |
Token | fast |
Token ID | 3049 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
majority | +34.237 |
country | +34.195 |
nation | +33.734 |
inner | +32.819 |
main | +32.363 |
Neg logit contributions | |
besides | -13.395 |
nonetheless | -12.645 |
because | -12.405 |
nevertheless | -12.397 |
regardless | -11.918 |
Token | ed |
Token ID | 276 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
country | +15.598 |
nation | +15.505 |
majority | +15.234 |
inner | +14.857 |
group | +14.224 |
Neg logit contributions | |
besides | -13.326 |
nonetheless | -13.150 |
nevertheless | -12.925 |
regardless | -12.377 |
because | -12.346 |
Token | state |
Token ID | 1181 |
Feature activation | +9.21e+00 |
Pos logit contributions | |
country | +18.650 |
majority | +18.572 |
nation | +18.548 |
inner | +17.908 |
oret | +17.595 |
Neg logit contributions | |
besides | -10.575 |
because | -10.199 |
nonetheless | -10.154 |
nevertheless | -9.840 |
regardless | -9.618 |
Token | until |
Token ID | 1566 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
because | +10.978 |
besides | +10.601 |
nonetheless | +10.262 |
regardless | +10.246 |
unless | +10.119 |
Neg logit contributions | |
country | -7.870 |
majority | -7.816 |
nation | -7.809 |
oret | -7.611 |
trio | -7.452 |
Token | 12 |
Token ID | 1105 |
Feature activation | -5.54e+00 |
Pos logit contributions | |
country | +0.431 |
majority | +0.431 |
nation | +0.430 |
oret | +0.418 |
inner | +0.416 |
Neg logit contributions | |
because | -0.315 |
besides | -0.311 |
nonetheless | -0.300 |
regardless | -0.294 |
nevertheless | -0.291 |
Token | the |
Token ID | 262 |
Feature activation | -2.58e+01 |
Pos logit contributions | |
country | +6.997 |
majority | +6.986 |
nation | +6.963 |
inner | +6.704 |
oret | +6.661 |
Neg logit contributions | |
besides | -5.200 |
because | -5.199 |
nonetheless | -5.020 |
regardless | -4.930 |
nevertheless | -4.868 |
Token | seas |
Token ID | 21547 |
Feature activation | -5.28e+00 |
Pos logit contributions | |
country | +28.673 |
majority | +28.379 |
nation | +28.351 |
largest | +27.348 |
inner | +26.790 |
Neg logit contributions | |
besides | -17.164 |
because | -16.021 |
nonetheless | -15.832 |
regardless | -15.657 |
nevertheless | -15.387 |
Token | had |
Token ID | 550 |
Feature activation | -1.92e+00 |
Pos logit contributions | |
country | +6.616 |
nation | +6.611 |
majority | +6.606 |
oret | +6.412 |
inner | +6.383 |
Neg logit contributions | |
because | -4.226 |
besides | -4.219 |
nonetheless | -4.108 |
regardless | -3.997 |
nevertheless | -3.952 |
Token | risen |
Token ID | 17450 |
Feature activation | +5.72e+00 |
Pos logit contributions | |
majority | +2.025 |
country | +2.022 |
nation | +2.016 |
oret | +1.943 |
inner | +1.939 |
Neg logit contributions | |
because | -1.958 |
besides | -1.953 |
nonetheless | -1.889 |
regardless | -1.866 |
nevertheless | -1.836 |
Token | and |
Token ID | 290 |
Feature activation | -3.25e+00 |
Pos logit contributions | |
because | +6.070 |
besides | +5.939 |
nonetheless | +5.763 |
regardless | +5.649 |
nevertheless | +5.615 |
Neg logit contributions | |
majority | -5.782 |
country | -5.778 |
nation | -5.742 |
oret | -5.637 |
inner | -5.529 |
Token | the |
Token ID | 262 |
Feature activation | -3.13e+01 |
Pos logit contributions | |
country | +3.878 |
majority | +3.873 |
nation | +3.860 |
inner | +3.734 |
oret | +3.725 |
Neg logit contributions | |
because | -2.862 |
besides | -2.845 |
nonetheless | -2.757 |
regardless | -2.690 |
nevertheless | -2.671 |
Token | cave |
Token ID | 11527 |
Feature activation | -9.89e+00 |
Pos logit contributions | |
country | +33.660 |
majority | +33.218 |
nation | +33.128 |
world | +31.903 |
largest | +31.859 |
Neg logit contributions | |
besides | -16.668 |
nonetheless | -15.937 |
because | -15.406 |
nevertheless | -15.233 |
regardless | -15.182 |
Token | system |
Token ID | 1080 |
Feature activation | -2.95e+00 |
Pos logit contributions | |
country | +12.722 |
nation | +12.683 |
majority | +12.649 |
inner | +12.237 |
oret | +12.125 |
Neg logit contributions | |
besides | -7.195 |
because | -7.190 |
nonetheless | -6.976 |
regardless | -6.800 |
nevertheless | -6.694 |
Token | had |
Token ID | 550 |
Feature activation | -4.25e+00 |
Pos logit contributions | |
majority | +3.785 |
country | +3.781 |
nation | +3.772 |
inner | +3.658 |
oret | +3.649 |
Neg logit contributions | |
because | -2.308 |
besides | -2.296 |
nonetheless | -2.217 |
regardless | -2.166 |
nevertheless | -2.136 |
Token | filled |
Token ID | 5901 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
majority | +4.694 |
country | +4.677 |
nation | +4.662 |
inner | +4.498 |
oret | +4.488 |
Neg logit contributions | |
besides | -4.046 |
because | -4.029 |
nonetheless | -3.894 |
regardless | -3.851 |
nevertheless | -3.777 |
Token | with |
Token ID | 351 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
because | +0.634 |
besides | +0.615 |
nonetheless | +0.580 |
regardless | +0.555 |
nevertheless | +0.546 |
Neg logit contributions | |
majority | -1.955 |
country | -1.951 |
nation | -1.949 |
oret | -1.908 |
inner | -1.900 |
Token | people |
Token ID | 15332 |
Feature activation | +4.66e+00 |
Pos logit contributions | |
majority | +3.335 |
country | +3.333 |
nation | +3.319 |
oret | +3.193 |
inner | +3.184 |
Neg logit contributions | |
because | -3.685 |
besides | -3.676 |
nonetheless | -3.586 |
regardless | -3.505 |
nevertheless | -3.496 |
Token | don |
Token ID | 836 |
Feature activation | +7.83e+00 |
Pos logit contributions | |
because | +4.489 |
besides | +4.446 |
nonetheless | +4.291 |
regardless | +4.227 |
nevertheless | +4.177 |
Neg logit contributions | |
country | -5.177 |
nation | -5.161 |
majority | -5.153 |
oret | -5.012 |
inner | -4.974 |
Token | 't |
Token ID | 470 |
Feature activation | +7.10e+00 |
Pos logit contributions | |
because | +6.692 |
besides | +6.598 |
nonetheless | +6.359 |
regardless | +6.217 |
nevertheless | +6.152 |
Neg logit contributions | |
country | -9.591 |
majority | -9.590 |
nation | -9.557 |
inner | -9.268 |
oret | -9.265 |
Token | know |
Token ID | 760 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
because | +7.672 |
besides | +7.549 |
nonetheless | +7.306 |
regardless | +7.223 |
nevertheless | +7.136 |
Neg logit contributions | |
majority | -6.931 |
country | -6.931 |
nation | -6.926 |
oret | -6.740 |
inner | -6.633 |
Token | who |
Token ID | 508 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
because | +10.922 |
besides | +10.635 |
regardless | +10.190 |
nonetheless | +10.170 |
unless | +10.032 |
Neg logit contributions | |
country | -9.590 |
nation | -9.574 |
oret | -9.552 |
majority | -9.515 |
ses | -9.293 |
Token | the |
Token ID | 262 |
Feature activation | -3.13e+01 |
Pos logit contributions | |
majority | +5.854 |
country | +5.853 |
nation | +5.835 |
oret | +5.678 |
inner | +5.663 |
Neg logit contributions | |
because | -3.348 |
besides | -3.309 |
nonetheless | -3.176 |
regardless | -3.093 |
nevertheless | -3.060 |
Token | Koch |
Token ID | 17009 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
majority | +32.401 |
nation | +31.907 |
country | +31.866 |
inner | +30.815 |
largest | +30.805 |
Neg logit contributions | |
nonetheless | -17.069 |
besides | -16.945 |
nevertheless | -16.490 |
because | -16.412 |
regardless | -16.117 |
Token | brothers |
Token ID | 9397 |
Feature activation | +4.72e-01 |
Pos logit contributions | |
majority | +21.163 |
nation | +20.589 |
country | +20.530 |
inner | +20.162 |
family | +20.133 |
Neg logit contributions | |
besides | -16.537 |
nonetheless | -16.447 |
because | -16.393 |
nevertheless | -15.973 |
regardless | -15.864 |
Token | are |
Token ID | 389 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
because | +0.310 |
besides | +0.305 |
nonetheless | +0.286 |
regardless | +0.278 |
nevertheless | +0.275 |
Neg logit contributions | |
country | -0.673 |
nation | -0.672 |
majority | -0.671 |
oret | -0.661 |
inner | -0.654 |
Token | ." |
Token ID | 526 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
because | +9.905 |
besides | +9.613 |
regardless | +9.100 |
nonetheless | +9.046 |
unless | +8.955 |
Neg logit contributions | |
country | -11.068 |
nation | -11.011 |
majority | -10.981 |
oret | -10.927 |
inner | -10.698 |
Token | It |
Token ID | 632 |
Feature activation | +7.49e+00 |
Pos logit contributions | |
because | +20.361 |
besides | +19.408 |
nonetheless | +18.887 |
regardless | +18.797 |
nevertheless | +18.523 |
Neg logit contributions | |
slightest | -13.690 |
inner | -13.496 |
country | -13.449 |
nation | -13.236 |
subur | -13.179 |
Token | Ext |
Token ID | 5683 |
Feature activation | -4.85e+00 |
Pos logit contributions | |
because | +14.705 |
besides | +14.227 |
regardless | +13.604 |
nonetheless | +13.488 |
unless | +13.337 |
Neg logit contributions | |
country | -11.433 |
nation | -11.343 |
slightest | -11.319 |
majority | -11.274 |
inner | -11.145 |
Token | ending |
Token ID | 1571 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
majority | +3.742 |
country | +3.732 |
nation | +3.709 |
oret | +3.551 |
inner | +3.533 |
Neg logit contributions | |
because | -6.316 |
besides | -6.289 |
nonetheless | -6.160 |
regardless | -6.056 |
nevertheless | -6.034 |
Token | your |
Token ID | 534 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
because | +2.889 |
besides | +2.831 |
nonetheless | +2.742 |
regardless | +2.692 |
nevertheless | +2.648 |
Neg logit contributions | |
majority | -3.489 |
country | -3.489 |
nation | -3.483 |
oret | -3.397 |
inner | -3.346 |
Token | time |
Token ID | 640 |
Feature activation | +8.43e+00 |
Pos logit contributions | |
country | +23.637 |
majority | +23.579 |
nation | +23.355 |
inner | +22.962 |
presence | +22.678 |
Neg logit contributions | |
besides | -11.646 |
nonetheless | -11.211 |
because | -11.187 |
nevertheless | -10.990 |
regardless | -10.672 |
Token | in |
Token ID | 287 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
because | +8.611 |
besides | +8.393 |
nonetheless | +8.107 |
regardless | +8.070 |
nevertheless | +7.813 |
Neg logit contributions | |
country | -8.631 |
majority | -8.626 |
nation | -8.612 |
oret | -8.406 |
trio | -8.252 |
Token | the |
Token ID | 262 |
Feature activation | -3.13e+01 |
Pos logit contributions | |
country | +15.839 |
majority | +15.789 |
nation | +15.662 |
inner | +15.333 |
oret | +15.009 |
Neg logit contributions | |
besides | -9.719 |
because | -9.621 |
nonetheless | -9.442 |
nevertheless | -9.138 |
regardless | -8.998 |
Token | fast |
Token ID | 3049 |
Feature activation | -1.47e+01 |
Pos logit contributions | |
country | +34.479 |
majority | +34.439 |
nation | +34.188 |
presence | +32.981 |
inner | +32.977 |
Neg logit contributions | |
besides | -13.082 |
nonetheless | -12.596 |
because | -12.507 |
nevertheless | -12.323 |
regardless | -11.487 |
Token | ed |
Token ID | 276 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
country | +12.841 |
nation | +12.687 |
majority | +12.491 |
inner | +12.026 |
oret | +11.617 |
Neg logit contributions | |
besides | -14.645 |
nonetheless | -14.354 |
because | -14.126 |
nevertheless | -14.107 |
regardless | -13.864 |
Token | state |
Token ID | 1181 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
country | +18.249 |
nation | +18.097 |
majority | +18.055 |
inner | +17.433 |
oret | +17.142 |
Neg logit contributions | |
besides | -11.896 |
because | -11.612 |
nonetheless | -11.466 |
nevertheless | -11.174 |
regardless | -10.948 |
Token | is |
Token ID | 318 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
because | +18.274 |
besides | +17.818 |
nonetheless | +17.296 |
regardless | +17.242 |
nevertheless | +16.864 |
Neg logit contributions | |
country | -10.758 |
majority | -10.691 |
nation | -10.675 |
oret | -10.363 |
slightest | -10.195 |
Token | actually |
Token ID | 1682 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
because | +14.850 |
besides | +14.394 |
nonetheless | +14.073 |
regardless | +13.873 |
nevertheless | +13.793 |
Neg logit contributions | |
nation | -7.815 |
country | -7.810 |
majority | -7.737 |
oret | -7.555 |
slightest | -7.526 |
Token |
|
Token ID | 198 |
Feature activation | +4.83e+00 |
Pos logit contributions | |
because | +10.719 |
besides | +10.377 |
regardless | +10.067 |
nonetheless | +10.010 |
unless | +9.867 |
Neg logit contributions | |
majority | -8.696 |
country | -8.668 |
slightest | -8.646 |
nation | -8.621 |
inner | -8.476 |
Token |
|
Token ID | 198 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
besides | +2.652 |
because | +2.613 |
nonetheless | +2.550 |
nevertheless | +2.426 |
regardless | +2.422 |
Neg logit contributions | |
majority | -7.469 |
country | -7.461 |
nation | -7.447 |
oret | -7.273 |
inner | -7.205 |
Token | Moving |
Token ID | 33622 |
Feature activation | -4.81e+00 |
Pos logit contributions | |
majority | +0.382 |
country | +0.382 |
nation | +0.380 |
oret | +0.365 |
inner | +0.365 |
Neg logit contributions | |
because | -0.429 |
besides | -0.425 |
nonetheless | -0.413 |
regardless | -0.406 |
nevertheless | -0.403 |
Token | ash |
Token ID | 12530 |
Feature activation | +3.80e+00 |
Pos logit contributions | |
majority | +4.013 |
country | +4.008 |
nation | +3.988 |
oret | +3.807 |
inner | +3.804 |
Neg logit contributions | |
because | -5.994 |
besides | -5.957 |
nonetheless | -5.815 |
regardless | -5.720 |
nevertheless | -5.689 |
Token | from |
Token ID | 422 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
because | +2.411 |
besides | +2.342 |
nonetheless | +2.210 |
regardless | +2.176 |
nevertheless | +2.096 |
Neg logit contributions | |
majority | -5.474 |
country | -5.459 |
nation | -5.452 |
oret | -5.356 |
inner | -5.300 |
Token | the |
Token ID | 262 |
Feature activation | -3.12e+01 |
Pos logit contributions | |
majority | +13.782 |
country | +13.745 |
nation | +13.643 |
inner | +13.359 |
oret | +13.082 |
Neg logit contributions | |
besides | -8.628 |
because | -8.607 |
nonetheless | -8.455 |
nevertheless | -8.168 |
regardless | -8.087 |
Token | Asheville |
Token ID | 49362 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
majority | +33.847 |
country | +33.602 |
nation | +33.300 |
inner | +32.794 |
largest | +32.590 |
Neg logit contributions | |
besides | -14.070 |
nonetheless | -13.717 |
because | -13.372 |
nevertheless | -13.207 |
regardless | -12.907 |
Token | plant |
Token ID | 4618 |
Feature activation | -3.45e+00 |
Pos logit contributions | |
country | +27.784 |
nation | +27.701 |
majority | +27.694 |
inner | +27.125 |
largest | +26.866 |
Neg logit contributions | |
besides | -11.568 |
nonetheless | -11.202 |
because | -10.890 |
nevertheless | -10.822 |
regardless | -10.546 |
Token | to |
Token ID | 284 |
Feature activation | -6.42e+00 |
Pos logit contributions | |
country | +5.036 |
majority | +5.036 |
nation | +5.020 |
inner | +4.895 |
oret | +4.888 |
Neg logit contributions | |
because | -2.111 |
besides | -2.092 |
nonetheless | -1.995 |
regardless | -1.920 |
nevertheless | -1.909 |
Token | a |
Token ID | 257 |
Feature activation | -2.42e+01 |
Pos logit contributions | |
majority | +7.922 |
country | +7.913 |
nation | +7.870 |
inner | +7.683 |
oret | +7.595 |
Neg logit contributions | |
because | -5.274 |
besides | -5.263 |
nonetheless | -5.091 |
regardless | -4.937 |
nevertheless | -4.927 |
Token | lined |
Token ID | 16566 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
majority | +28.183 |
country | +27.900 |
nation | +27.833 |
inner | +27.259 |
trio | +27.011 |
Neg logit contributions | |
besides | -12.993 |
because | -12.397 |
nonetheless | -12.256 |
nevertheless | -11.985 |
regardless | -11.683 |
Token | University |
Token ID | 2059 |
Feature activation | +4.74e+00 |
Pos logit contributions | |
majority | +5.183 |
country | +5.181 |
nation | +5.163 |
oret | +5.010 |
inner | +4.999 |
Neg logit contributions | |
because | -3.579 |
besides | -3.547 |
nonetheless | -3.422 |
regardless | -3.341 |
nevertheless | -3.311 |
Token | . |
Token ID | 13 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
because | +5.743 |
besides | +5.562 |
nonetheless | +5.403 |
regardless | +5.344 |
nevertheless | +5.264 |
Neg logit contributions | |
majority | -4.069 |
nation | -4.042 |
country | -4.019 |
oret | -3.867 |
inner | -3.845 |
Token | The |
Token ID | 383 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
because | +13.841 |
besides | +13.266 |
nonetheless | +12.686 |
regardless | +12.638 |
unless | +12.466 |
Neg logit contributions | |
slightest | -10.316 |
majority | -10.263 |
nation | -10.209 |
country | -10.202 |
inner | -9.942 |
Token | sun |
Token ID | 4252 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
majority | +26.318 |
country | +25.872 |
inner | +25.599 |
nation | +25.491 |
oret | +25.478 |
Neg logit contributions | |
besides | -14.357 |
nonetheless | -13.860 |
because | -13.748 |
regardless | -13.454 |
nevertheless | -13.385 |
Token | and |
Token ID | 290 |
Feature activation | -1.45e+01 |
Pos logit contributions | |
majority | +3.410 |
country | +3.410 |
nation | +3.398 |
oret | +3.298 |
inner | +3.295 |
Neg logit contributions | |
because | -2.197 |
besides | -2.176 |
nonetheless | -2.095 |
regardless | -2.048 |
nevertheless | -2.024 |
Token | the |
Token ID | 262 |
Feature activation | -3.11e+01 |
Pos logit contributions | |
majority | +16.764 |
country | +16.704 |
nation | +16.515 |
inner | +16.354 |
largest | +15.892 |
Neg logit contributions | |
besides | -11.514 |
because | -11.401 |
nonetheless | -11.212 |
regardless | -10.899 |
nevertheless | -10.882 |
Token | solar |
Token ID | 6591 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
majority | +33.285 |
inner | +32.741 |
country | +32.462 |
largest | +32.089 |
nation | +31.997 |
Neg logit contributions | |
besides | -15.883 |
nonetheless | -15.605 |
because | -15.371 |
regardless | -15.130 |
nevertheless | -15.126 |
Token | system |
Token ID | 1080 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
majority | +19.279 |
country | +19.107 |
inner | +18.920 |
nation | +18.844 |
largest | +18.419 |
Neg logit contributions | |
nonetheless | -16.759 |
because | -16.637 |
besides | -16.608 |
nevertheless | -16.342 |
regardless | -16.226 |
Token | appear |
Token ID | 1656 |
Feature activation | +5.38e+00 |
Pos logit contributions | |
because | +1.712 |
besides | +1.698 |
nonetheless | +1.642 |
regardless | +1.604 |
nevertheless | +1.596 |
Neg logit contributions | |
majority | -1.982 |
country | -1.977 |
nation | -1.970 |
oret | -1.918 |
inner | -1.902 |
Token | to |
Token ID | 284 |
Feature activation | -3.51e-01 |
Pos logit contributions | |
because | +5.894 |
besides | +5.753 |
nonetheless | +5.584 |
regardless | +5.507 |
nevertheless | +5.426 |
Neg logit contributions | |
majority | -5.221 |
nation | -5.203 |
country | -5.191 |
oret | -5.104 |
ses | -4.949 |
Token | be |
Token ID | 307 |
Feature activation | +9.30e-01 |
Pos logit contributions | |
majority | +0.342 |
country | +0.341 |
nation | +0.340 |
oret | +0.329 |
inner | +0.326 |
Neg logit contributions | |
because | -0.390 |
besides | -0.386 |
nonetheless | -0.376 |
regardless | -0.368 |
nevertheless | -0.367 |
Token | whether |
Token ID | 1771 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
country | +13.597 |
nation | +13.534 |
majority | +13.510 |
inner | +13.011 |
largest | +12.777 |
Neg logit contributions | |
besides | -6.334 |
because | -6.207 |
nonetheless | -6.029 |
nevertheless | -5.765 |
regardless | -5.681 |
Token | the |
Token ID | 262 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
majority | +3.187 |
country | +3.182 |
nation | +3.176 |
oret | +3.124 |
inner | +3.095 |
Neg logit contributions | |
because | -1.503 |
besides | -1.470 |
nonetheless | -1.400 |
regardless | -1.371 |
nevertheless | -1.343 |
Token | UK |
Token ID | 3482 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
country | +26.599 |
nation | +26.030 |
majority | +25.387 |
remainder | +23.810 |
inner | +23.743 |
Neg logit contributions | |
besides | -18.981 |
nonetheless | -18.234 |
because | -17.984 |
nevertheless | -17.722 |
regardless | -16.872 |
Token | remains |
Token ID | 3793 |
Feature activation | -2.96e+00 |
Pos logit contributions | |
country | +18.213 |
nation | +18.116 |
majority | +17.979 |
inner | +17.178 |
largest | +16.934 |
Neg logit contributions | |
because | -7.826 |
besides | -7.760 |
nonetheless | -7.437 |
regardless | -7.094 |
nevertheless | -7.006 |
Token | in |
Token ID | 287 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
majority | +4.124 |
country | +4.119 |
nation | +4.103 |
inner | +3.978 |
oret | +3.959 |
Neg logit contributions | |
because | -2.029 |
besides | -2.019 |
nonetheless | -1.933 |
regardless | -1.865 |
nevertheless | -1.853 |
Token | the |
Token ID | 262 |
Feature activation | -3.11e+01 |
Pos logit contributions | |
majority | +19.570 |
country | +19.491 |
nation | +19.172 |
inner | +18.816 |
primary | +18.453 |
Neg logit contributions | |
besides | -11.202 |
nonetheless | -10.789 |
because | -10.752 |
nevertheless | -10.303 |
regardless | -10.129 |
Token | EU |
Token ID | 4576 |
Feature activation | -3.25e+00 |
Pos logit contributions | |
country | +30.411 |
majority | +29.541 |
nation | +29.269 |
group | +28.268 |
inner | +28.239 |
Neg logit contributions | |
besides | -20.424 |
nonetheless | -19.768 |
nevertheless | -19.216 |
because | -19.193 |
regardless | -18.241 |
Token | - |
Token ID | 532 |
Feature activation | +7.42e+00 |
Pos logit contributions | |
country | +5.318 |
majority | +5.303 |
nation | +5.301 |
inner | +5.148 |
oret | +5.117 |
Neg logit contributions | |
besides | -1.408 |
because | -1.405 |
nonetheless | -1.316 |
regardless | -1.229 |
nevertheless | -1.226 |
Token | a |
Token ID | 257 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
because | +8.025 |
besides | +7.831 |
regardless | +7.588 |
nonetheless | +7.576 |
nevertheless | +7.390 |
Neg logit contributions | |
nation | -7.220 |
majority | -7.219 |
country | -7.213 |
oret | -7.105 |
inner | -6.958 |
Token | so |
Token ID | 523 |
Feature activation | -3.57e-01 |
Pos logit contributions | |
country | +16.707 |
majority | +16.632 |
nation | +16.388 |
trio | +15.390 |
inner | +15.364 |
Neg logit contributions | |
besides | -13.132 |
because | -12.470 |
nonetheless | -12.236 |
regardless | -11.948 |
nevertheless | -11.930 |
Token | - |
Token ID | 12 |
Feature activation | +6.77e+00 |
Pos logit contributions | |
nation | +0.223 |
majority | +0.222 |
country | +0.220 |
oret | +0.210 |
inner | +0.209 |
Neg logit contributions | |
because | -0.526 |
besides | -0.517 |
nonetheless | -0.505 |
regardless | -0.501 |
nevertheless | -0.496 |
Token | confront |
Token ID | 7239 |
Feature activation | -4.28e+00 |
Pos logit contributions | |
majority | +8.367 |
country | +8.309 |
nation | +8.278 |
inner | +7.944 |
primary | +7.811 |
Neg logit contributions | |
besides | -6.925 |
because | -6.744 |
nonetheless | -6.514 |
regardless | -6.484 |
nevertheless | -6.360 |
Token | one |
Token ID | 530 |
Feature activation | -9.49e+00 |
Pos logit contributions | |
majority | +5.363 |
country | +5.341 |
nation | +5.328 |
inner | +5.168 |
oret | +5.124 |
Neg logit contributions | |
besides | -3.465 |
because | -3.448 |
nonetheless | -3.323 |
regardless | -3.222 |
nevertheless | -3.222 |
Token | 's |
Token ID | 338 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
country | +11.453 |
majority | +11.437 |
nation | +11.432 |
inner | +11.002 |
oret | +10.877 |
Neg logit contributions | |
besides | -7.679 |
because | -7.651 |
nonetheless | -7.448 |
nevertheless | -7.235 |
regardless | -7.185 |
Token | accuser |
Token ID | 43738 |
Feature activation | +9.98e+00 |
Pos logit contributions | |
country | +21.424 |
majority | +21.240 |
nation | +21.194 |
inner | +20.843 |
primary | +20.294 |
Neg logit contributions | |
besides | -14.802 |
nonetheless | -13.964 |
because | -13.867 |
nevertheless | -13.835 |
regardless | -13.310 |
Token | is |
Token ID | 318 |
Feature activation | +7.34e+00 |
Pos logit contributions | |
because | +10.986 |
besides | +10.678 |
nonetheless | +10.454 |
regardless | +10.364 |
nevertheless | +10.155 |
Neg logit contributions | |
country | -9.368 |
majority | -9.333 |
nation | -9.271 |
oret | -9.172 |
inner | -9.001 |
Token | important |
Token ID | 1593 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
because | +9.486 |
besides | +9.250 |
nonetheless | +9.218 |
regardless | +9.016 |
nevertheless | +8.999 |
Neg logit contributions | |
country | -5.576 |
nation | -5.518 |
majority | -5.491 |
oret | -5.355 |
inner | -5.268 |
Token | not |
Token ID | 407 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
because | +20.898 |
regardless | +19.761 |
besides | +19.741 |
nonetheless | +19.684 |
nevertheless | +19.039 |
Neg logit contributions | |
oret | -11.508 |
country | -11.296 |
ses | -11.222 |
nation | -11.165 |
majority | -11.156 |
Token | merely |
Token ID | 6974 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
because | +17.353 |
regardless | +15.667 |
besides | +15.476 |
nonetheless | +15.406 |
unless | +15.161 |
Neg logit contributions | |
country | -12.037 |
oret | -11.975 |
nation | -11.890 |
ses | -11.889 |
trio | -11.772 |
Token | because |
Token ID | 780 |
Feature activation | +8.40e+00 |
Pos logit contributions | |
because | +17.827 |
besides | +16.358 |
regardless | +16.119 |
nonetheless | +15.957 |
unless | +15.588 |
Neg logit contributions | |
country | -12.743 |
majority | -12.716 |
oret | -12.633 |
nation | -12.631 |
trio | -12.484 |
Token | it |
Token ID | 340 |
Feature activation | +3.04e+00 |
Pos logit contributions | |
because | +10.307 |
besides | +9.990 |
nonetheless | +9.782 |
regardless | +9.737 |
nevertheless | +9.552 |
Neg logit contributions | |
country | -6.630 |
oret | -6.605 |
nation | -6.558 |
majority | -6.535 |
inner | -6.281 |
Token | aids |
Token ID | 31378 |
Feature activation | +2.86e+00 |
Pos logit contributions | |
because | +2.826 |
besides | +2.788 |
nonetheless | +2.708 |
regardless | +2.644 |
nevertheless | +2.628 |
Neg logit contributions | |
majority | -3.490 |
country | -3.487 |
nation | -3.476 |
oret | -3.378 |
inner | -3.360 |
Token | . |
Token ID | 13 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
because | +12.708 |
besides | +12.121 |
nonetheless | +11.900 |
regardless | +11.854 |
nevertheless | +11.572 |
Neg logit contributions | |
oret | -8.857 |
majority | -8.763 |
country | -8.706 |
nation | -8.665 |
slightest | -8.611 |
Token |
|
Token ID | 198 |
Feature activation | +8.26e+00 |
Pos logit contributions | |
because | +15.742 |
besides | +15.184 |
nonetheless | +14.749 |
regardless | +14.694 |
nevertheless | +14.477 |
Neg logit contributions | |
slightest | -11.441 |
inner | -11.218 |
oret | -11.183 |
majority | -11.062 |
country | -11.037 |
Token |
|
Token ID | 198 |
Feature activation | +4.49e+00 |
Pos logit contributions | |
because | +4.113 |
besides | +4.033 |
nonetheless | +3.784 |
regardless | +3.630 |
nevertheless | +3.566 |
Neg logit contributions | |
majority | -13.094 |
country | -13.090 |
nation | -13.057 |
oret | -12.759 |
inner | -12.742 |
Token | Hug |
Token ID | 48098 |
Feature activation | -5.65e+00 |
Pos logit contributions | |
because | +4.620 |
besides | +4.521 |
nonetheless | +4.382 |
regardless | +4.304 |
nevertheless | +4.252 |
Neg logit contributions | |
country | -4.646 |
majority | -4.646 |
nation | -4.631 |
inner | -4.546 |
slightest | -4.470 |
Token | hes |
Token ID | 956 |
Feature activation | +8.19e+00 |
Pos logit contributions | |
majority | +4.133 |
country | +4.108 |
nation | +4.104 |
inner | +3.755 |
ses | +3.708 |
Neg logit contributions | |
besides | -7.349 |
because | -7.341 |
nonetheless | -7.223 |
regardless | -7.155 |
nevertheless | -7.003 |
Token | said |
Token ID | 531 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
because | +8.312 |
besides | +8.130 |
nonetheless | +8.092 |
nevertheless | +7.860 |
regardless | +7.751 |
Neg logit contributions | |
majority | -8.139 |
country | -8.129 |
nation | -8.101 |
inner | -7.920 |
oret | -7.900 |
Token | the |
Token ID | 262 |
Feature activation | -1.89e+01 |
Pos logit contributions | |
because | +19.833 |
besides | +19.294 |
nonetheless | +18.835 |
regardless | +18.831 |
unless | +18.548 |
Neg logit contributions | |
oret | -7.067 |
ses | -6.960 |
slightest | -6.937 |
majority | -6.933 |
nation | -6.864 |
Token | � |
Token ID | 564 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
country | +22.732 |
majority | +22.495 |
nation | +22.364 |
largest | +21.321 |
oret | +21.273 |
Neg logit contributions | |
besides | -13.145 |
because | -12.553 |
nonetheless | -12.221 |
regardless | -12.102 |
nevertheless | -11.864 |
Token | � |
Token ID | 250 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
majority | +13.584 |
country | +13.317 |
nation | +13.184 |
oret | +12.951 |
inner | +12.677 |
Neg logit contributions | |
besides | -17.939 |
nonetheless | -17.672 |
because | -17.599 |
regardless | -17.362 |
nevertheless | -17.307 |
Token | aston |
Token ID | 45966 |
Feature activation | -5.41e+00 |
Pos logit contributions | |
majority | +13.351 |
country | +13.320 |
nation | +13.154 |
oret | +12.858 |
ses | +12.533 |
Neg logit contributions | |
besides | -10.788 |
because | -10.631 |
nonetheless | -10.377 |
regardless | -10.219 |
nevertheless | -10.101 |
Token | ishing |
Token ID | 3929 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
majority | +3.561 |
country | +3.559 |
nation | +3.538 |
oret | +3.342 |
inner | +3.328 |
Neg logit contributions | |
because | -7.704 |
besides | -7.656 |
nonetheless | -7.496 |
regardless | -7.392 |
nevertheless | -7.354 |
Token | more |
Token ID | 517 |
Feature activation | +4.06e+00 |
Pos logit contributions | |
because | +7.268 |
besides | +7.068 |
nonetheless | +6.929 |
regardless | +6.817 |
nevertheless | +6.696 |
Neg logit contributions | |
majority | -7.411 |
nation | -7.380 |
country | -7.307 |
oret | -7.204 |
inner | -7.071 |
Token | and |
Token ID | 290 |
Feature activation | +8.41e+00 |
Pos logit contributions | |
because | +4.354 |
besides | +4.293 |
nonetheless | +4.131 |
regardless | +4.082 |
nevertheless | +4.008 |
Neg logit contributions | |
majority | -4.123 |
nation | -4.097 |
country | -4.054 |
oret | -3.994 |
inner | -3.927 |
Token | more |
Token ID | 517 |
Feature activation | +8.37e+00 |
Pos logit contributions | |
because | +9.986 |
besides | +9.880 |
nonetheless | +9.428 |
regardless | +9.405 |
nevertheless | +9.210 |
Neg logit contributions | |
majority | -7.144 |
nation | -7.136 |
country | -7.060 |
oret | -6.964 |
inner | -6.809 |
Token | of |
Token ID | 286 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
because | +10.735 |
besides | +10.524 |
nonetheless | +10.174 |
regardless | +10.152 |
unless | +9.930 |
Neg logit contributions | |
majority | -6.417 |
nation | -6.319 |
oret | -6.231 |
country | -6.173 |
inner | -6.011 |
Token | it |
Token ID | 340 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
because | +0.095 |
besides | +0.093 |
nonetheless | +0.088 |
regardless | +0.085 |
nevertheless | +0.083 |
Neg logit contributions | |
majority | -0.246 |
nation | -0.245 |
country | -0.244 |
oret | -0.240 |
inner | -0.238 |
Token | . |
Token ID | 13 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
because | +14.219 |
besides | +13.830 |
regardless | +13.394 |
nonetheless | +13.319 |
unless | +12.995 |
Neg logit contributions | |
majority | -11.310 |
nation | -11.032 |
country | -10.941 |
oret | -10.924 |
inner | -10.707 |
Token | Everyone |
Token ID | 11075 |
Feature activation | +4.75e+00 |
Pos logit contributions | |
because | +17.213 |
besides | +16.592 |
regardless | +15.941 |
nonetheless | +15.901 |
unless | +15.707 |
Neg logit contributions | |
slightest | -11.768 |
nation | -11.616 |
majority | -11.566 |
inner | -11.521 |
country | -11.456 |
Token | who |
Token ID | 508 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
because | +5.032 |
besides | +4.992 |
nonetheless | +4.804 |
regardless | +4.755 |
nevertheless | +4.679 |
Neg logit contributions | |
majority | -4.823 |
country | -4.818 |
nation | -4.811 |
oret | -4.687 |
inner | -4.626 |
Token | was |
Token ID | 373 |
Feature activation | -3.33e+00 |
Pos logit contributions | |
majority | +2.574 |
country | +2.572 |
nation | +2.561 |
inner | +2.481 |
oret | +2.471 |
Neg logit contributions | |
because | -1.698 |
besides | -1.685 |
nonetheless | -1.624 |
regardless | -1.587 |
nevertheless | -1.570 |
Token | at |
Token ID | 379 |
Feature activation | -8.38e+00 |
Pos logit contributions | |
country | +5.152 |
majority | +5.133 |
nation | +5.115 |
inner | +4.998 |
oret | +4.958 |
Neg logit contributions | |
because | -1.701 |
besides | -1.690 |
nonetheless | -1.611 |
regardless | -1.542 |
nevertheless | -1.530 |
Token | The |
Token ID | 383 |
Feature activation | -2.42e+01 |
Pos logit contributions | |
country | +10.963 |
majority | +10.863 |
nation | +10.822 |
inner | +10.532 |
oret | +10.460 |
Neg logit contributions | |
besides | -6.101 |
because | -6.074 |
nonetheless | -5.901 |
regardless | -5.701 |
nevertheless | -5.683 |
Token | . |
Token ID | 13 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
because | +3.120 |
besides | +3.020 |
nonetheless | +2.867 |
regardless | +2.833 |
nevertheless | +2.762 |
Neg logit contributions | |
country | -5.687 |
majority | -5.681 |
nation | -5.656 |
oret | -5.581 |
inner | -5.532 |
Token | It |
Token ID | 632 |
Feature activation | +5.91e+00 |
Pos logit contributions | |
because | +15.351 |
besides | +14.636 |
regardless | +14.219 |
unless | +13.995 |
nonetheless | +13.936 |
Neg logit contributions | |
slightest | -11.789 |
country | -11.754 |
inner | -11.738 |
majority | -11.682 |
nation | -11.674 |
Token | would |
Token ID | 561 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
because | +5.038 |
besides | +4.846 |
nonetheless | +4.720 |
regardless | +4.619 |
nevertheless | +4.575 |
Neg logit contributions | |
majority | -7.095 |
nation | -7.074 |
country | -7.073 |
oret | -6.993 |
inner | -6.888 |
Token | be |
Token ID | 307 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
because | +13.188 |
nonetheless | +12.749 |
besides | +12.721 |
nevertheless | +12.438 |
regardless | +12.373 |
Neg logit contributions | |
majority | -10.534 |
country | -10.464 |
oret | -10.378 |
nation | -10.375 |
inner | -10.163 |
Token | too |
Token ID | 1165 |
Feature activation | +5.59e+00 |
Pos logit contributions | |
because | +16.538 |
besides | +15.976 |
nonetheless | +15.598 |
regardless | +15.472 |
nevertheless | +15.213 |
Neg logit contributions | |
oret | -8.302 |
majority | -8.186 |
nation | -8.103 |
country | -8.076 |
inner | -7.892 |
Token | easy |
Token ID | 2562 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
because | +7.401 |
besides | +7.242 |
nonetheless | +7.050 |
regardless | +6.990 |
nevertheless | +6.879 |
Neg logit contributions | |
majority | -4.073 |
nation | -4.042 |
country | -4.027 |
oret | -4.011 |
inner | -3.881 |
Token | if |
Token ID | 611 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
because | +25.033 |
besides | +23.599 |
nonetheless | +23.304 |
regardless | +23.117 |
unless | +22.760 |
Neg logit contributions | |
oret | -13.886 |
majority | -13.466 |
nation | -13.344 |
slightest | -13.206 |
country | -13.194 |
Token | that |
Token ID | 326 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
because | +11.942 |
besides | +11.643 |
nonetheless | +11.238 |
regardless | +11.179 |
nevertheless | +11.020 |
Neg logit contributions | |
oret | -8.246 |
majority | -8.163 |
nation | -8.129 |
country | -8.066 |
trio | -7.962 |
Token | were |
Token ID | 547 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
because | +1.047 |
besides | +1.026 |
nonetheless | +0.992 |
regardless | +0.977 |
nevertheless | +0.965 |
Neg logit contributions | |
majority | -1.125 |
country | -1.119 |
nation | -1.117 |
oret | -1.108 |
inner | -1.086 |
Token | the |
Token ID | 262 |
Feature activation | -9.98e+00 |
Pos logit contributions | |
because | +14.173 |
besides | +13.654 |
nonetheless | +13.232 |
regardless | +13.018 |
nevertheless | +12.948 |
Neg logit contributions | |
oret | -10.382 |
nation | -10.376 |
majority | -10.319 |
country | -10.270 |
trio | -10.207 |
Token | goal |
Token ID | 3061 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
majority | +9.617 |
country | +9.593 |
nation | +9.522 |
oret | +9.128 |
inner | +9.117 |
Neg logit contributions | |
besides | -10.822 |
because | -10.740 |
nonetheless | -10.537 |
nevertheless | -10.309 |
regardless | -10.279 |
Token | got |
Token ID | 1392 |
Feature activation | -3.77e+00 |
Pos logit contributions | |
country | +10.298 |
majority | +10.297 |
nation | +10.246 |
inner | +10.031 |
oret | +9.857 |
Neg logit contributions | |
besides | -5.718 |
because | -5.675 |
nonetheless | -5.462 |
regardless | -5.397 |
nevertheless | -5.306 |
Token | cha |
Token ID | 11693 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
majority | +2.863 |
country | +2.861 |
nation | +2.848 |
oret | +2.713 |
inner | +2.699 |
Neg logit contributions | |
because | -4.995 |
besides | -4.958 |
nonetheless | -4.845 |
regardless | -4.776 |
nevertheless | -4.747 |
Token | 's |
Token ID | 338 |
Feature activation | +8.91e+00 |
Pos logit contributions | |
because | +2.128 |
besides | +2.089 |
nonetheless | +2.050 |
regardless | +2.010 |
nevertheless | +2.000 |
Neg logit contributions | |
majority | -1.332 |
nation | -1.326 |
country | -1.324 |
oret | -1.290 |
inner | -1.244 |
Token | I |
Token ID | 314 |
Feature activation | +4.68e+00 |
Pos logit contributions | |
because | +8.383 |
besides | +8.193 |
nonetheless | +7.872 |
regardless | +7.721 |
nevertheless | +7.568 |
Neg logit contributions | |
majority | -9.885 |
nation | -9.856 |
country | -9.826 |
oret | -9.693 |
inner | -9.444 |
Token | encountered |
Token ID | 12956 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
because | +4.392 |
besides | +4.330 |
nonetheless | +4.210 |
nevertheless | +4.089 |
regardless | +4.088 |
Neg logit contributions | |
majority | -5.319 |
country | -5.295 |
nation | -5.287 |
oret | -5.166 |
inner | -5.102 |
Token | . |
Token ID | 13 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
because | +19.358 |
besides | +18.734 |
nonetheless | +18.214 |
regardless | +17.965 |
nevertheless | +17.686 |
Neg logit contributions | |
majority | -12.537 |
nation | -12.447 |
oret | -12.404 |
country | -12.298 |
slightest | -11.875 |
Token | Assuming |
Token ID | 33238 |
Feature activation | +9.16e+00 |
Pos logit contributions | |
because | +16.228 |
besides | +15.468 |
nonetheless | +14.897 |
regardless | +14.740 |
nevertheless | +14.677 |
Neg logit contributions | |
nation | -13.362 |
slightest | -13.323 |
country | -13.260 |
majority | -13.020 |
inner | -12.889 |
Token | you |
Token ID | 345 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
because | +9.648 |
besides | +9.432 |
nonetheless | +9.149 |
regardless | +9.050 |
nevertheless | +8.889 |
Neg logit contributions | |
nation | -8.745 |
country | -8.661 |
majority | -8.541 |
oret | -8.505 |
trio | -8.273 |
Token | already |
Token ID | 1541 |
Feature activation | +3.62e+00 |
Pos logit contributions | |
because | +2.892 |
besides | +2.860 |
nonetheless | +2.769 |
regardless | +2.705 |
nevertheless | +2.686 |
Neg logit contributions | |
majority | -3.682 |
country | -3.676 |
nation | -3.667 |
oret | -3.558 |
inner | -3.545 |
Token | know |
Token ID | 760 |
Feature activation | +9.82e+00 |
Pos logit contributions | |
because | +3.891 |
besides | +3.844 |
nonetheless | +3.735 |
regardless | +3.662 |
nevertheless | +3.637 |
Neg logit contributions | |
majority | -3.635 |
nation | -3.622 |
country | -3.621 |
oret | -3.512 |
inner | -3.466 |
Token | your |
Token ID | 534 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
because | +11.618 |
besides | +11.369 |
nonetheless | +10.896 |
regardless | +10.887 |
nevertheless | +10.654 |
Neg logit contributions | |
nation | -8.041 |
country | -7.973 |
oret | -7.956 |
majority | -7.880 |
trio | -7.583 |
Token | � |
Token ID | 250 |
Feature activation | +8.17e+00 |
Pos logit contributions | |
majority | +3.888 |
country | +3.883 |
nation | +3.863 |
oret | +3.664 |
inner | +3.653 |
Neg logit contributions | |
because | -7.353 |
besides | -7.310 |
nonetheless | -7.148 |
regardless | -7.046 |
nevertheless | -7.007 |
Token | ins |
Token ID | 1040 |
Feature activation | -4.44e+00 |
Pos logit contributions | |
because | +10.957 |
besides | +10.723 |
nonetheless | +10.442 |
regardless | +10.428 |
nevertheless | +10.289 |
Neg logit contributions | |
majority | -5.345 |
country | -5.315 |
nation | -5.279 |
trio | -5.089 |
oret | -5.069 |
Token | pection |
Token ID | 14978 |
Feature activation | +4.82e+00 |
Pos logit contributions | |
majority | +4.315 |
country | +4.310 |
nation | +4.287 |
oret | +4.135 |
inner | +4.116 |
Neg logit contributions | |
because | -4.866 |
besides | -4.864 |
nonetheless | -4.730 |
regardless | -4.639 |
nevertheless | -4.613 |
Token | � |
Token ID | 447 |
Feature activation | -5.82e-01 |
Pos logit contributions | |
because | +5.304 |
besides | +5.150 |
nonetheless | +5.021 |
regardless | +4.988 |
nevertheless | +4.878 |
Neg logit contributions | |
majority | -4.666 |
country | -4.596 |
nation | -4.588 |
oret | -4.492 |
inner | -4.466 |
Token | � |
Token ID | 251 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
country | +0.453 |
majority | +0.452 |
nation | +0.449 |
oret | +0.431 |
inner | +0.425 |
Neg logit contributions | |
because | -0.765 |
besides | -0.757 |
nonetheless | -0.738 |
regardless | -0.729 |
nevertheless | -0.722 |
Token | if |
Token ID | 611 |
Feature activation | +6.98e+00 |
Pos logit contributions | |
because | +17.160 |
besides | +16.703 |
regardless | +16.299 |
nonetheless | +16.216 |
nevertheless | +15.938 |
Neg logit contributions | |
majority | -7.992 |
country | -7.790 |
nation | -7.778 |
oret | -7.679 |
trio | -7.553 |
Token | there |
Token ID | 612 |
Feature activation | +2.85e+00 |
Pos logit contributions | |
because | +8.151 |
besides | +7.952 |
nonetheless | +7.823 |
regardless | +7.690 |
nevertheless | +7.643 |
Neg logit contributions | |
majority | -6.018 |
nation | -5.951 |
country | -5.931 |
oret | -5.848 |
trio | -5.740 |
Token | is |
Token ID | 318 |
Feature activation | -8.75e-01 |
Pos logit contributions | |
because | +2.151 |
besides | +2.113 |
nonetheless | +2.026 |
regardless | +1.979 |
nevertheless | +1.955 |
Neg logit contributions | |
majority | -3.762 |
country | -3.742 |
nation | -3.735 |
oret | -3.702 |
inner | -3.648 |
Token | any |
Token ID | 597 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
majority | +1.056 |
country | +1.056 |
nation | +1.053 |
oret | +1.025 |
inner | +1.019 |
Neg logit contributions | |
because | -0.767 |
besides | -0.757 |
nonetheless | -0.734 |
regardless | -0.716 |
nevertheless | -0.711 |
Token | . |
Token ID | 13 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
country | +12.903 |
nation | +12.803 |
majority | +12.774 |
inner | +12.390 |
oret | +12.252 |
Neg logit contributions | |
besides | -7.817 |
because | -7.743 |
nonetheless | -7.506 |
nevertheless | -7.284 |
regardless | -7.265 |
Token | A |
Token ID | 317 |
Feature activation | -1.78e+01 |
Pos logit contributions | |
because | +15.918 |
besides | +15.476 |
nonetheless | +14.928 |
regardless | +14.858 |
nevertheless | +14.678 |
Neg logit contributions | |
majority | -10.266 |
country | -10.183 |
nation | -10.118 |
slightest | -10.014 |
inner | -9.963 |
Token | that |
Token ID | 326 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
because | +7.429 |
besides | +7.240 |
nonetheless | +6.966 |
regardless | +6.936 |
nevertheless | +6.805 |
Neg logit contributions | |
nation | -5.689 |
country | -5.633 |
majority | -5.601 |
oret | -5.476 |
trio | -5.349 |
Token | these |
Token ID | 777 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
majority | +2.292 |
country | +2.290 |
nation | +2.282 |
oret | +2.219 |
inner | +2.218 |
Neg logit contributions | |
because | -1.227 |
besides | -1.216 |
nonetheless | -1.169 |
regardless | -1.133 |
nevertheless | -1.125 |
Token | mushrooms |
Token ID | 23452 |
Feature activation | +4.92e+00 |
Pos logit contributions | |
majority | +17.419 |
country | +17.337 |
nation | +17.129 |
inner | +16.905 |
oret | +16.661 |
Neg logit contributions | |
besides | -11.093 |
because | -10.908 |
nonetheless | -10.805 |
regardless | -10.468 |
nevertheless | -10.417 |
Token | cause |
Token ID | 2728 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
because | +5.403 |
besides | +5.335 |
nonetheless | +5.152 |
regardless | +5.077 |
nevertheless | +5.031 |
Neg logit contributions | |
country | -4.783 |
majority | -4.774 |
nation | -4.767 |
oret | -4.600 |
inner | -4.555 |
Token | some |
Token ID | 617 |
Feature activation | -8.26e+00 |
Pos logit contributions | |
country | +1.518 |
majority | +1.517 |
nation | +1.513 |
oret | +1.467 |
inner | +1.450 |
Neg logit contributions | |
because | -1.655 |
besides | -1.636 |
nonetheless | -1.588 |
regardless | -1.562 |
nevertheless | -1.548 |
Token | nausea |
Token ID | 32122 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
country | +9.584 |
majority | +9.580 |
nation | +9.555 |
inner | +9.311 |
oret | +9.108 |
Neg logit contributions | |
because | -7.179 |
besides | -7.167 |
nonetheless | -7.033 |
nevertheless | -6.835 |
regardless | -6.807 |
Token | . |
Token ID | 13 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
because | +13.999 |
besides | +13.605 |
regardless | +13.020 |
nonetheless | +12.921 |
unless | +12.646 |
Neg logit contributions | |
majority | -11.496 |
nation | -11.487 |
country | -11.473 |
oret | -11.335 |
trio | -11.181 |
Token | suggest |
Token ID | 47811 |
Feature activation | +4.52e+00 |
Pos logit contributions | |
because | +13.029 |
besides | +12.625 |
regardless | +12.062 |
nonetheless | +12.015 |
unless | +11.891 |
Neg logit contributions | |
nation | -10.363 |
country | -10.329 |
inner | -10.069 |
majority | -10.061 |
slightest | -9.993 |
Token | s |
Token ID | 82 |
Feature activation | +8.87e+00 |
Pos logit contributions | |
because | +5.242 |
besides | +5.127 |
nonetheless | +5.001 |
regardless | +4.946 |
nevertheless | +4.873 |
Neg logit contributions | |
country | -4.112 |
nation | -4.110 |
majority | -4.082 |
oret | -3.979 |
inner | -3.933 |
Token | the |
Token ID | 262 |
Feature activation | -1.62e+01 |
Pos logit contributions | |
because | +10.373 |
besides | +10.137 |
nonetheless | +9.810 |
regardless | +9.680 |
nevertheless | +9.580 |
Neg logit contributions | |
nation | -7.516 |
country | -7.455 |
majority | -7.387 |
oret | -7.197 |
inner | -7.103 |
Token | use |
Token ID | 779 |
Feature activation | +4.27e+00 |
Pos logit contributions | |
majority | +20.354 |
country | +19.869 |
nation | +19.737 |
oret | +19.466 |
inner | +19.410 |
Neg logit contributions | |
besides | -11.017 |
because | -10.823 |
nonetheless | -10.797 |
nevertheless | -10.380 |
regardless | -10.324 |
Token | seizures |
Token ID | 24715 |
Feature activation | +2.87e+00 |
Pos logit contributions | |
majority | +16.474 |
country | +16.347 |
nation | +16.270 |
inner | +16.103 |
primary | +15.597 |
Neg logit contributions | |
besides | -9.967 |
because | -9.649 |
nonetheless | -9.615 |
nevertheless | -9.281 |
regardless | -9.229 |
Token | and |
Token ID | 290 |
Feature activation | -4.89e+00 |
Pos logit contributions | |
because | +2.007 |
besides | +1.962 |
nonetheless | +1.868 |
regardless | +1.819 |
nevertheless | +1.792 |
Neg logit contributions | |
country | -3.977 |
majority | -3.975 |
nation | -3.961 |
oret | -3.884 |
inner | -3.854 |
Token | the |
Token ID | 262 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
majority | +6.182 |
country | +6.166 |
nation | +6.144 |
inner | +5.982 |
oret | +5.948 |
Neg logit contributions | |
because | -3.912 |
besides | -3.906 |
nonetheless | -3.762 |
regardless | -3.657 |
nevertheless | -3.638 |
Token | best |
Token ID | 1266 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
majority | +26.832 |
country | +26.307 |
nation | +26.223 |
inner | +26.191 |
presence | +25.680 |
Neg logit contributions | |
besides | -14.203 |
because | -13.243 |
nonetheless | -13.083 |
nevertheless | -12.764 |
regardless | -12.735 |
Token | surgical |
Token ID | 21998 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
country | +10.822 |
majority | +10.812 |
nation | +10.738 |
inner | +10.415 |
oret | +10.321 |
Neg logit contributions | |
besides | -9.526 |
because | -9.377 |
nonetheless | -9.155 |
regardless | -8.965 |
nevertheless | -8.917 |
Token | path |
Token ID | 3108 |
Feature activation | +8.48e+00 |
Pos logit contributions | |
majority | +10.489 |
country | +10.429 |
nation | +10.396 |
inner | +9.983 |
oret | +9.935 |
Neg logit contributions | |
besides | -10.454 |
because | -10.258 |
nonetheless | -10.093 |
nevertheless | -9.863 |
regardless | -9.856 |
Token | to |
Token ID | 284 |
Feature activation | -3.75e+00 |
Pos logit contributions | |
because | +9.465 |
besides | +9.240 |
nonetheless | +8.885 |
regardless | +8.847 |
nevertheless | +8.673 |
Neg logit contributions | |
country | -7.778 |
nation | -7.722 |
majority | -7.706 |
slightest | -7.463 |
oret | -7.453 |
Token | the |
Token ID | 262 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
majority | +3.477 |
country | +3.470 |
nation | +3.453 |
inner | +3.317 |
oret | +3.294 |
Neg logit contributions | |
because | -4.284 |
besides | -4.280 |
nonetheless | -4.165 |
regardless | -4.088 |
nevertheless | -4.066 |
Token | part |
Token ID | 636 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
majority | +24.425 |
nation | +24.140 |
country | +24.122 |
inner | +23.690 |
largest | +23.082 |
Neg logit contributions | |
besides | -14.549 |
because | -13.939 |
nonetheless | -13.759 |
nevertheless | -13.320 |
regardless | -13.050 |
Token | of |
Token ID | 286 |
Feature activation | -9.19e+00 |
Pos logit contributions | |
because | +1.841 |
besides | +1.796 |
nonetheless | +1.696 |
regardless | +1.671 |
nevertheless | +1.624 |
Neg logit contributions | |
country | -3.705 |
majority | -3.697 |
nation | -3.689 |
oret | -3.611 |
inner | -3.579 |
Token | the |
Token ID | 262 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
country | +11.531 |
majority | +11.483 |
nation | +11.452 |
inner | +11.184 |
oret | +10.972 |
Neg logit contributions | |
besides | -7.248 |
because | -7.210 |
nonetheless | -6.995 |
nevertheless | -6.758 |
regardless | -6.755 |
Token | Though |
Token ID | 10915 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
because | +4.738 |
besides | +4.671 |
nonetheless | +4.468 |
regardless | +4.377 |
nevertheless | +4.347 |
Neg logit contributions | |
country | -4.683 |
nation | -4.678 |
majority | -4.664 |
inner | -4.559 |
slightest | -4.526 |
Token | not |
Token ID | 407 |
Feature activation | +2.07e+00 |
Pos logit contributions | |
because | +4.257 |
besides | +4.218 |
nonetheless | +4.099 |
nevertheless | +4.018 |
regardless | +4.015 |
Neg logit contributions | |
nation | -2.996 |
country | -2.989 |
majority | -2.964 |
oret | -2.930 |
inner | -2.878 |
Token | a |
Token ID | 257 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
because | +1.946 |
besides | +1.916 |
nonetheless | +1.840 |
regardless | +1.808 |
nevertheless | +1.787 |
Neg logit contributions | |
country | -2.356 |
nation | -2.349 |
majority | -2.346 |
oret | -2.307 |
inner | -2.280 |
Token | full |
Token ID | 1336 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
majority | +22.729 |
country | +22.395 |
nation | +22.216 |
primary | +21.355 |
main | +21.118 |
Neg logit contributions | |
besides | -13.451 |
nonetheless | -12.889 |
because | -12.881 |
regardless | -12.631 |
nevertheless | -12.475 |
Token | acquisition |
Token ID | 12673 |
Feature activation | +6.14e+00 |
Pos logit contributions | |
majority | +16.324 |
country | +16.222 |
nation | +16.009 |
inner | +15.453 |
trio | +15.197 |
Neg logit contributions | |
besides | -11.811 |
because | -11.615 |
nonetheless | -11.532 |
nevertheless | -11.171 |
regardless | -11.083 |
Token | , |
Token ID | 11 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
because | +8.115 |
besides | +7.927 |
nonetheless | +7.708 |
regardless | +7.666 |
nevertheless | +7.564 |
Neg logit contributions | |
country | -4.438 |
majority | -4.420 |
oret | -4.395 |
nation | -4.395 |
ses | -4.299 |
Token | Fol |
Token ID | 30938 |
Feature activation | -8.10e+00 |
Pos logit contributions | |
because | +13.810 |
besides | +13.610 |
nonetheless | +13.191 |
regardless | +13.021 |
nevertheless | +12.992 |
Neg logit contributions | |
oret | -6.750 |
nation | -6.680 |
country | -6.593 |
majority | -6.557 |
slightest | -6.515 |
Token | lett |
Token ID | 15503 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
majority | +7.041 |
country | +6.998 |
nation | +6.993 |
oret | +6.744 |
inner | +6.669 |
Neg logit contributions | |
besides | -9.587 |
because | -9.581 |
nonetheless | -9.302 |
regardless | -9.170 |
nevertheless | -9.095 |
Token | made |
Token ID | 925 |
Feature activation | +5.64e+00 |
Pos logit contributions | |
country | +2.610 |
majority | +2.608 |
nation | +2.602 |
oret | +2.528 |
inner | +2.521 |
Neg logit contributions | |
because | -1.806 |
besides | -1.785 |
nonetheless | -1.727 |
regardless | -1.681 |
nevertheless | -1.672 |
Token | an |
Token ID | 281 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
because | +7.321 |
besides | +7.179 |
nonetheless | +7.111 |
nevertheless | +6.966 |
regardless | +6.924 |
Neg logit contributions | |
nation | -4.119 |
country | -4.081 |
oret | -4.061 |
majority | -4.037 |
ses | -3.893 |
Token | investment |
Token ID | 4896 |
Feature activation | +8.21e+00 |
Pos logit contributions | |
majority | +14.796 |
inner | +14.494 |
country | +14.433 |
nation | +14.387 |
largest | +14.109 |
Neg logit contributions | |
because | -10.473 |
besides | -10.446 |
nonetheless | -9.836 |
regardless | -9.757 |
nevertheless | -9.573 |
Token | final |
Token ID | 2457 |
Feature activation | -5.37e+00 |
Pos logit contributions | |
majority | +19.419 |
country | +19.181 |
nation | +19.180 |
inner | +18.421 |
fifth | +18.297 |
Neg logit contributions | |
besides | -14.148 |
because | -14.038 |
nonetheless | -13.374 |
regardless | -13.164 |
nevertheless | -13.055 |
Token | period |
Token ID | 2278 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
majority | +4.830 |
country | +4.820 |
nation | +4.800 |
inner | +4.597 |
oret | +4.587 |
Neg logit contributions | |
because | -6.304 |
besides | -6.276 |
nonetheless | -6.121 |
regardless | -6.012 |
nevertheless | -5.984 |
Token | , |
Token ID | 11 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
because | +12.969 |
besides | +12.424 |
nonetheless | +12.310 |
regardless | +12.158 |
nevertheless | +11.850 |
Neg logit contributions | |
country | -10.288 |
majority | -10.191 |
nation | -10.152 |
oret | -10.056 |
slightest | -9.915 |
Token | plus |
Token ID | 5556 |
Feature activation | +7.59e+00 |
Pos logit contributions | |
because | +14.812 |
besides | +14.334 |
nonetheless | +14.115 |
regardless | +13.995 |
nevertheless | +13.737 |
Neg logit contributions | |
country | -9.606 |
nation | -9.547 |
majority | -9.534 |
oret | -9.468 |
slightest | -9.143 |
Token | two |
Token ID | 734 |
Feature activation | -3.89e+00 |
Pos logit contributions | |
because | +9.470 |
besides | +9.276 |
nonetheless | +9.067 |
regardless | +8.938 |
nevertheless | +8.841 |
Neg logit contributions | |
nation | -5.834 |
majority | -5.818 |
country | -5.812 |
oret | -5.588 |
inner | -5.554 |
Token | others |
Token ID | 1854 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
majority | +4.667 |
country | +4.665 |
nation | +4.647 |
oret | +4.502 |
inner | +4.498 |
Neg logit contributions | |
because | -3.396 |
besides | -3.371 |
nonetheless | -3.259 |
regardless | -3.186 |
nevertheless | -3.164 |
Token | , |
Token ID | 11 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
because | +16.761 |
besides | +16.454 |
nonetheless | +16.187 |
regardless | +15.787 |
nevertheless | +15.623 |
Neg logit contributions | |
majority | -10.559 |
country | -10.500 |
nation | -10.442 |
oret | -10.335 |
inner | -10.091 |
Token | as |
Token ID | 355 |
Feature activation | +3.57e+00 |
Pos logit contributions | |
because | +16.674 |
besides | +16.204 |
nonetheless | +15.890 |
regardless | +15.676 |
nevertheless | +15.406 |
Neg logit contributions | |
country | -10.363 |
nation | -10.286 |
majority | -10.257 |
oret | -10.202 |
slightest | -10.012 |
Token | the |
Token ID | 262 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
because | +4.073 |
besides | +4.015 |
nonetheless | +3.896 |
regardless | +3.856 |
nevertheless | +3.796 |
Neg logit contributions | |
country | -3.305 |
nation | -3.298 |
majority | -3.296 |
oret | -3.209 |
inner | -3.171 |
Token | Caps |
Token ID | 23534 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
majority | +27.169 |
country | +26.646 |
nation | +26.601 |
trio | +26.083 |
remainder | +25.627 |
Neg logit contributions | |
besides | -14.742 |
because | -14.351 |
nonetheless | -14.223 |
nevertheless | -13.761 |
regardless | -13.347 |
Token | ran |
Token ID | 4966 |
Feature activation | +6.19e+00 |
Pos logit contributions | |
majority | +1.625 |
country | +1.623 |
nation | +1.619 |
oret | +1.568 |
inner | +1.566 |
Neg logit contributions | |
because | -1.110 |
besides | -1.102 |
nonetheless | -1.059 |
regardless | -1.036 |
nevertheless | -1.025 |
Token | among |
Token ID | 1871 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
country | +2.750 |
majority | +2.750 |
nation | +2.740 |
oret | +2.685 |
inner | +2.678 |
Neg logit contributions | |
because | -0.915 |
besides | -0.900 |
nonetheless | -0.838 |
regardless | -0.811 |
nevertheless | -0.790 |
Token | guards |
Token ID | 10942 |
Feature activation | +7.97e+00 |
Pos logit contributions | |
country | +17.118 |
majority | +17.064 |
nation | +17.061 |
inner | +16.543 |
trio | +16.243 |
Neg logit contributions | |
because | -13.224 |
besides | -13.099 |
nonetheless | -12.720 |
nevertheless | -12.499 |
regardless | -12.396 |
Token | ) |
Token ID | 8 |
Feature activation | +9.86e+00 |
Pos logit contributions | |
because | +7.380 |
besides | +7.268 |
regardless | +6.867 |
nonetheless | +6.724 |
unless | +6.711 |
Neg logit contributions | |
nation | -8.616 |
majority | -8.594 |
country | -8.577 |
inner | -8.435 |
slightest | -8.396 |
Token |
|
Token ID | 198 |
Feature activation | +6.69e+00 |
Pos logit contributions | |
because | +9.491 |
besides | +9.314 |
regardless | +8.867 |
unless | +8.700 |
nonetheless | +8.696 |
Neg logit contributions | |
nation | -9.988 |
country | -9.966 |
majority | -9.908 |
oret | -9.719 |
inner | -9.635 |
Token |
|
Token ID | 198 |
Feature activation | -2.56e+00 |
Pos logit contributions | |
because | +3.450 |
besides | +3.447 |
nonetheless | +3.271 |
regardless | +3.122 |
nevertheless | +3.096 |
Neg logit contributions | |
majority | -10.518 |
country | -10.516 |
nation | -10.488 |
oret | -10.254 |
inner | -10.198 |
Token | Total |
Token ID | 14957 |
Feature activation | -8.18e+00 |
Pos logit contributions | |
majority | +2.521 |
country | +2.515 |
nation | +2.505 |
oret | +2.422 |
inner | +2.403 |
Neg logit contributions | |
because | -2.796 |
besides | -2.778 |
nonetheless | -2.706 |
regardless | -2.655 |
nevertheless | -2.641 |
Token | guaranteed |
Token ID | 11462 |
Feature activation | +4.34e+00 |
Pos logit contributions | |
majority | +8.531 |
country | +8.499 |
nation | +8.438 |
oret | +8.168 |
inner | +8.106 |
Neg logit contributions | |
because | -8.287 |
besides | -8.233 |
nonetheless | -8.040 |
regardless | -7.850 |
nevertheless | -7.837 |
Token | at |
Token ID | 379 |
Feature activation | -7.53e+00 |
Pos logit contributions | |
because | +3.178 |
besides | +3.095 |
nonetheless | +2.899 |
regardless | +2.889 |
nevertheless | +2.794 |
Neg logit contributions | |
nation | -5.787 |
country | -5.784 |
majority | -5.766 |
oret | -5.675 |
inner | -5.641 |
Token | signing |
Token ID | 8415 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
majority | +6.032 |
country | +6.013 |
nation | +5.982 |
oret | +5.680 |
inner | +5.676 |
Neg logit contributions | |
because | -9.575 |
besides | -9.529 |
nonetheless | -9.307 |
regardless | -9.153 |
nevertheless | -9.116 |
Token | : |
Token ID | 25 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
because | +8.468 |
besides | +8.217 |
nonetheless | +7.783 |
regardless | +7.715 |
nevertheless | +7.470 |
Neg logit contributions | |
country | -13.828 |
majority | -13.819 |
nation | -13.813 |
inner | -13.553 |
slightest | -13.497 |
Token | $ |
Token ID | 720 |
Feature activation | -3.25e+00 |
Pos logit contributions | |
because | +1.566 |
besides | +1.550 |
nonetheless | +1.512 |
regardless | +1.495 |
nevertheless | +1.480 |
Neg logit contributions | |
country | -0.842 |
nation | -0.839 |
majority | -0.830 |
inner | -0.801 |
oret | -0.798 |
Token | gang |
Token ID | 7706 |
Feature activation | -9.68e+00 |
Pos logit contributions | |
country | +27.910 |
nation | +27.792 |
majority | +27.754 |
inner | +26.342 |
group | +26.285 |
Neg logit contributions | |
besides | -15.310 |
nonetheless | -14.717 |
because | -14.607 |
nevertheless | -14.341 |
regardless | -13.973 |
Token | � |
Token ID | 447 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
majority | +11.432 |
country | +11.381 |
nation | +11.339 |
inner | +10.912 |
oret | +10.871 |
Neg logit contributions | |
besides | -8.315 |
because | -8.311 |
nonetheless | -8.066 |
regardless | -7.877 |
nevertheless | -7.827 |
Token | � |
Token ID | 247 |
Feature activation | -8.79e+00 |
Pos logit contributions | |
majority | +5.944 |
nation | +5.903 |
country | +5.846 |
inner | +5.336 |
largest | +5.043 |
Neg logit contributions | |
besides | -14.579 |
because | -14.483 |
nonetheless | -14.402 |
regardless | -14.217 |
nevertheless | -14.194 |
Token | s |
Token ID | 82 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
majority | +8.314 |
country | +8.298 |
nation | +8.261 |
oret | +7.888 |
inner | +7.879 |
Neg logit contributions | |
because | -9.708 |
besides | -9.698 |
nonetheless | -9.473 |
regardless | -9.275 |
nevertheless | -9.240 |
Token | leadership |
Token ID | 5531 |
Feature activation | +4.56e+00 |
Pos logit contributions | |
majority | +13.543 |
country | +13.409 |
nation | +13.361 |
inner | +12.921 |
oret | +12.715 |
Neg logit contributions | |
besides | -9.476 |
because | -9.395 |
nonetheless | -9.200 |
nevertheless | -8.924 |
regardless | -8.911 |
Token | in |
Token ID | 287 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
because | +5.032 |
besides | +4.954 |
nonetheless | +4.809 |
regardless | +4.705 |
nevertheless | +4.702 |
Neg logit contributions | |
majority | -4.378 |
country | -4.373 |
nation | -4.356 |
oret | -4.281 |
inner | -4.221 |
Token | the |
Token ID | 262 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
country | +13.835 |
majority | +13.746 |
nation | +13.723 |
inner | +13.343 |
oret | +12.980 |
Neg logit contributions | |
besides | -9.686 |
because | -9.641 |
nonetheless | -9.435 |
nevertheless | -9.160 |
regardless | -9.158 |
Token | early |
Token ID | 1903 |
Feature activation | -1.79e+01 |
Pos logit contributions | |
country | +29.970 |
nation | +29.532 |
majority | +29.253 |
inner | +28.391 |
city | +27.888 |
Neg logit contributions | |
besides | -16.011 |
because | -15.326 |
nonetheless | -15.315 |
nevertheless | -15.004 |
regardless | -14.882 |
Token | 1980 |
Token ID | 7169 |
Feature activation | -7.85e+00 |
Pos logit contributions | |
country | +20.860 |
majority | +20.794 |
nation | +20.585 |
inner | +19.996 |
city | +19.418 |
Neg logit contributions | |
besides | -13.083 |
nonetheless | -12.738 |
because | -12.412 |
nevertheless | -12.363 |
regardless | -12.162 |
Token | s |
Token ID | 82 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
country | +5.948 |
nation | +5.886 |
majority | +5.869 |
inner | +5.429 |
oret | +5.346 |
Neg logit contributions | |
besides | -9.916 |
because | -9.698 |
nonetheless | -9.672 |
nevertheless | -9.484 |
regardless | -9.464 |
Token | led |
Token ID | 2957 |
Feature activation | +7.51e+00 |
Pos logit contributions | |
because | +11.526 |
besides | +11.254 |
nonetheless | +11.041 |
nevertheless | +10.799 |
regardless | +10.705 |
Neg logit contributions | |
majority | -9.036 |
country | -8.946 |
nation | -8.909 |
oret | -8.865 |
slightest | -8.709 |
Token | . |
Token ID | 13 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
because | +6.706 |
besides | +6.585 |
nonetheless | +6.368 |
regardless | +6.265 |
nevertheless | +6.212 |
Neg logit contributions | |
majority | -6.965 |
country | -6.919 |
nation | -6.879 |
oret | -6.777 |
inner | -6.673 |
Token |
|
Token ID | 198 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
because | +14.333 |
besides | +13.838 |
nonetheless | +13.375 |
regardless | +13.292 |
nevertheless | +13.139 |
Neg logit contributions | |
slightest | -9.707 |
country | -9.640 |
inner | -9.551 |
majority | -9.542 |
nation | -9.513 |
Token |
|
Token ID | 198 |
Feature activation | +2.89e+00 |
Pos logit contributions | |
besides | +2.138 |
because | +2.133 |
nonetheless | +2.035 |
regardless | +1.945 |
nevertheless | +1.930 |
Neg logit contributions | |
majority | -6.360 |
country | -6.357 |
nation | -6.342 |
oret | -6.191 |
inner | -6.161 |
Token | 1994 |
Token ID | 22666 |
Feature activation | +8.91e-01 |
Pos logit contributions | |
because | +2.756 |
besides | +2.699 |
nonetheless | +2.605 |
regardless | +2.550 |
nevertheless | +2.527 |
Neg logit contributions | |
country | -3.263 |
majority | -3.257 |
nation | -3.245 |
inner | -3.162 |
oret | -3.119 |
Token | Roger |
Token ID | 13637 |
Feature activation | -5.38e+00 |
Pos logit contributions | |
because | +0.757 |
besides | +0.740 |
nonetheless | +0.720 |
regardless | +0.697 |
nevertheless | +0.694 |
Neg logit contributions | |
majority | -1.102 |
nation | -1.098 |
country | -1.098 |
oret | -1.072 |
inner | -1.068 |
Token | Po |
Token ID | 7695 |
Feature activation | -4.30e+00 |
Pos logit contributions | |
country | +4.851 |
majority | +4.843 |
nation | +4.827 |
oret | +4.632 |
inner | +4.601 |
Neg logit contributions | |
because | -6.319 |
besides | -6.289 |
nonetheless | -6.129 |
regardless | -6.025 |
nevertheless | -5.985 |
Token | isson |
Token ID | 30927 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
country | +3.394 |
majority | +3.390 |
nation | +3.377 |
oret | +3.225 |
inner | +3.209 |
Neg logit contributions | |
because | -5.544 |
besides | -5.513 |
nonetheless | -5.383 |
regardless | -5.306 |
nevertheless | -5.271 |
Token | admits |
Token ID | 15534 |
Feature activation | +7.98e+00 |
Pos logit contributions | |
majority | +4.289 |
country | +4.286 |
nation | +4.274 |
oret | +4.156 |
inner | +4.147 |
Neg logit contributions | |
because | -2.391 |
besides | -2.366 |
nonetheless | -2.270 |
regardless | -2.211 |
nevertheless | -2.186 |
Token | to |
Token ID | 284 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
because | +9.411 |
besides | +9.197 |
nonetheless | +8.957 |
regardless | +8.819 |
nevertheless | +8.756 |
Neg logit contributions | |
majority | -6.695 |
country | -6.644 |
nation | -6.635 |
oret | -6.576 |
inner | -6.366 |
Token | fabric |
Token ID | 9664 |
Feature activation | -4.92e+00 |
Pos logit contributions | |
majority | +3.354 |
country | +3.353 |
nation | +3.342 |
oret | +3.244 |
inner | +3.236 |
Neg logit contributions | |
because | -2.345 |
besides | -2.321 |
nonetheless | -2.240 |
regardless | -2.187 |
nevertheless | -2.168 |
Token | ating |
Token ID | 803 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
majority | +3.885 |
country | +3.881 |
nation | +3.859 |
oret | +3.678 |
inner | +3.672 |
Neg logit contributions | |
because | -6.341 |
besides | -6.318 |
nonetheless | -6.166 |
regardless | -6.074 |
nevertheless | -6.042 |
Token | words |
Token ID | 2456 |
Feature activation | +9.89e+00 |
Pos logit contributions | |
because | +1.967 |
besides | +1.938 |
nonetheless | +1.889 |
regardless | +1.868 |
nevertheless | +1.849 |
Neg logit contributions | |
country | -1.329 |
majority | -1.328 |
nation | -1.321 |
oret | -1.282 |
inner | -1.258 |
Token | that |
Token ID | 326 |
Feature activation | +5.35e+00 |
Pos logit contributions | |
because | +10.402 |
besides | +10.075 |
nonetheless | +9.793 |
regardless | +9.700 |
nevertheless | +9.482 |
Neg logit contributions | |
majority | -9.786 |
country | -9.771 |
nation | -9.675 |
oret | -9.548 |
slightest | -9.330 |
Token | equate |
Token ID | 45423 |
Feature activation | +2.54e+00 |
Pos logit contributions | |
because | +6.505 |
besides | +6.404 |
nonetheless | +6.287 |
regardless | +6.161 |
nevertheless | +6.153 |
Neg logit contributions | |
majority | -4.543 |
country | -4.535 |
nation | -4.506 |
oret | -4.378 |
inner | -4.281 |
Token | the |
Token ID | 262 |
Feature activation | -2.38e+01 |
Pos logit contributions | |
because | +3.391 |
besides | +3.343 |
nonetheless | +3.260 |
regardless | +3.232 |
nevertheless | +3.190 |
Neg logit contributions | |
majority | -1.890 |
country | -1.883 |
nation | -1.873 |
oret | -1.836 |
inner | -1.765 |
Token | inward |
Token ID | 29879 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
majority | +28.803 |
nation | +28.689 |
country | +28.568 |
inner | +28.199 |
presence | +27.491 |
Neg logit contributions | |
besides | -12.063 |
nonetheless | -11.470 |
because | -11.466 |
nevertheless | -11.153 |
regardless | -10.872 |
Token | - |
Token ID | 12 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
country | +22.742 |
nation | +22.594 |
majority | +22.586 |
inner | +22.255 |
presence | +22.099 |
Neg logit contributions | |
besides | -7.788 |
because | -7.346 |
nonetheless | -7.307 |
nevertheless | -6.946 |
regardless | -6.872 |
Token | looking |
Token ID | 11534 |
Feature activation | -1.71e+01 |
Pos logit contributions | |
country | +15.071 |
nation | +14.877 |
majority | +14.816 |
inner | +14.735 |
oret | +14.486 |
Neg logit contributions | |
besides | -13.110 |
because | -12.740 |
nonetheless | -12.615 |
regardless | -12.282 |
nevertheless | -12.260 |
Token | good |
Token ID | 922 |
Feature activation | -5.03e+00 |
Pos logit contributions | |
nation | +23.644 |
majority | +23.574 |
country | +23.500 |
inner | +23.098 |
presence | +22.685 |
Neg logit contributions | |
besides | -7.905 |
nonetheless | -7.299 |
because | -7.256 |
nevertheless | -7.026 |
regardless | -6.800 |
Token | with |
Token ID | 351 |
Feature activation | -9.32e+00 |
Pos logit contributions | |
majority | +8.609 |
country | +8.598 |
nation | +8.583 |
inner | +8.395 |
oret | +8.377 |
Neg logit contributions | |
because | -1.809 |
besides | -1.799 |
nonetheless | -1.638 |
regardless | -1.533 |
nevertheless | -1.509 |
Token | evil |
Token ID | 6181 |
Feature activation | +6.48e+00 |
Pos logit contributions | |
country | +11.491 |
majority | +11.488 |
nation | +11.449 |
inner | +11.324 |
oret | +10.908 |
Neg logit contributions | |
besides | -7.280 |
because | -7.153 |
nonetheless | -6.950 |
regardless | -6.754 |
nevertheless | -6.718 |
Token | and |
Token ID | 290 |
Feature activation | +2.59e+00 |
Pos logit contributions | |
because | +6.068 |
besides | +5.809 |
nonetheless | +5.659 |
regardless | +5.599 |
nevertheless | +5.467 |
Neg logit contributions | |
majority | -7.335 |
country | -7.322 |
nation | -7.287 |
oret | -7.239 |
inner | -6.989 |
Token | border |
Token ID | 4865 |
Feature activation | +8.29e+00 |
Pos logit contributions | |
country | +25.315 |
nation | +24.905 |
majority | +24.372 |
inner | +23.661 |
city | +23.400 |
Neg logit contributions | |
besides | -14.399 |
nonetheless | -13.894 |
because | -13.803 |
regardless | -13.485 |
nevertheless | -13.436 |
Token | and |
Token ID | 290 |
Feature activation | -3.45e+00 |
Pos logit contributions | |
because | +8.480 |
besides | +8.238 |
nonetheless | +8.010 |
regardless | +7.904 |
nevertheless | +7.737 |
Neg logit contributions | |
majority | -8.467 |
nation | -8.333 |
country | -8.320 |
oret | -8.306 |
inner | -8.176 |
Token | Turkish |
Token ID | 9663 |
Feature activation | -2.29e+01 |
Pos logit contributions | |
country | +4.330 |
majority | +4.325 |
nation | +4.312 |
inner | +4.176 |
oret | +4.165 |
Neg logit contributions | |
because | -2.841 |
besides | -2.816 |
nonetheless | -2.717 |
regardless | -2.645 |
nevertheless | -2.630 |
Token | fighter |
Token ID | 10543 |
Feature activation | -6.13e+00 |
Pos logit contributions | |
country | +26.735 |
majority | +26.541 |
nation | +26.514 |
presence | +26.152 |
inner | +25.544 |
Neg logit contributions | |
besides | -13.278 |
because | -12.761 |
nonetheless | -12.161 |
regardless | -11.910 |
nevertheless | -11.845 |
Token | planes |
Token ID | 13016 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
country | +4.760 |
majority | +4.751 |
nation | +4.731 |
inner | +4.483 |
oret | +4.469 |
Neg logit contributions | |
because | -7.934 |
besides | -7.906 |
nonetheless | -7.711 |
regardless | -7.597 |
nevertheless | -7.553 |
Token | over |
Token ID | 625 |
Feature activation | -5.31e+00 |
Pos logit contributions | |
because | +15.200 |
besides | +14.851 |
nonetheless | +14.648 |
regardless | +14.391 |
nevertheless | +14.238 |
Neg logit contributions | |
majority | -8.737 |
oret | -8.695 |
country | -8.623 |
nation | -8.623 |
inner | -8.344 |
Token | flying |
Token ID | 45928 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
country | +6.505 |
majority | +6.502 |
nation | +6.478 |
oret | +6.276 |
inner | +6.272 |
Neg logit contributions | |
because | -4.544 |
besides | -4.506 |
nonetheless | -4.342 |
regardless | -4.243 |
nevertheless | -4.204 |
Token | Syrian |
Token ID | 6318 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
because | +1.845 |
besides | +1.818 |
nonetheless | +1.781 |
regardless | +1.752 |
nevertheless | +1.738 |
Neg logit contributions | |
majority | -1.153 |
nation | -1.148 |
country | -1.147 |
oret | -1.122 |
inner | -1.093 |
Token | territory |
Token ID | 7674 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
country | +25.937 |
nation | +25.507 |
majority | +25.230 |
city | +24.352 |
army | +24.272 |
Neg logit contributions | |
besides | -13.576 |
because | -12.893 |
nonetheless | -12.532 |
regardless | -12.231 |
nevertheless | -12.222 |
Token | . |
Token ID | 13 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
because | +15.845 |
besides | +15.286 |
nonetheless | +15.004 |
regardless | +14.822 |
unless | +14.498 |
Neg logit contributions | |
majority | -12.162 |
nation | -12.046 |
oret | -12.033 |
country | -11.981 |
inner | -11.649 |
Token | He |
Token ID | 679 |
Feature activation | +5.62e+00 |
Pos logit contributions | |
because | +18.646 |
besides | +18.083 |
nonetheless | +17.415 |
regardless | +17.322 |
nevertheless | +17.042 |
Neg logit contributions | |
slightest | -11.851 |
inner | -11.575 |
majority | -11.479 |
country | -11.438 |
nation | -11.382 |
Token | . |
Token ID | 13 |
Feature activation | +1.57e+01 |
Pos logit contributions | |
because | +20.802 |
besides | +19.685 |
nonetheless | +19.010 |
regardless | +19.004 |
nevertheless | +18.580 |
Neg logit contributions | |
majority | -12.359 |
oret | -12.323 |
slightest | -12.058 |
nation | -12.038 |
country | -11.997 |
Token |
|
Token ID | 198 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
because | +16.206 |
besides | +15.446 |
regardless | +14.758 |
although | +14.618 |
nonetheless | +14.576 |
Neg logit contributions | |
slightest | -13.137 |
oret | -12.840 |
inner | -12.769 |
majority | -12.741 |
nation | -12.673 |
Token |
|
Token ID | 198 |
Feature activation | +6.80e+00 |
Pos logit contributions | |
because | +5.854 |
besides | +5.639 |
nonetheless | +5.246 |
regardless | +5.100 |
nevertheless | +4.963 |
Neg logit contributions | |
majority | -16.587 |
country | -16.563 |
nation | -16.524 |
inner | -16.188 |
oret | -16.127 |
Token | MORE |
Token ID | 23346 |
Feature activation | +8.20e+00 |
Pos logit contributions | |
because | +6.521 |
besides | +6.329 |
nonetheless | +6.022 |
regardless | +5.959 |
nevertheless | +5.831 |
Neg logit contributions | |
country | -7.425 |
majority | -7.419 |
nation | -7.416 |
inner | -7.285 |
slightest | -7.216 |
Token | : |
Token ID | 25 |
Feature activation | -4.17e+00 |
Pos logit contributions | |
because | +5.248 |
besides | +5.138 |
nonetheless | +4.843 |
regardless | +4.727 |
nevertheless | +4.623 |
Neg logit contributions | |
majority | -11.759 |
country | -11.738 |
nation | -11.713 |
oret | -11.453 |
inner | -11.426 |
Token | The |
Token ID | 383 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
country | +4.351 |
majority | +4.349 |
nation | +4.331 |
oret | +4.174 |
inner | +4.158 |
Neg logit contributions | |
because | -4.306 |
besides | -4.284 |
nonetheless | -4.172 |
regardless | -4.080 |
nevertheless | -4.063 |
Token | 10 |
Token ID | 838 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
country | +27.517 |
majority | +27.469 |
nation | +27.347 |
inner | +26.503 |
oret | +26.324 |
Neg logit contributions | |
besides | -13.700 |
nonetheless | -13.218 |
because | -12.962 |
nevertheless | -12.780 |
regardless | -12.574 |
Token | best |
Token ID | 1266 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
country | +17.820 |
majority | +17.685 |
nation | +17.627 |
inner | +17.149 |
largest | +17.057 |
Neg logit contributions | |
besides | -10.933 |
because | -10.708 |
nonetheless | -10.680 |
nevertheless | -10.399 |
regardless | -10.328 |
Token | things |
Token ID | 1243 |
Feature activation | +5.98e+00 |
Pos logit contributions | |
country | +13.369 |
nation | +13.229 |
majority | +13.209 |
inner | +12.810 |
oret | +12.650 |
Neg logit contributions | |
besides | -9.074 |
because | -8.945 |
nonetheless | -8.833 |
nevertheless | -8.573 |
regardless | -8.521 |
Token | about |
Token ID | 546 |
Feature activation | -7.88e+00 |
Pos logit contributions | |
because | +6.829 |
besides | +6.697 |
nonetheless | +6.379 |
regardless | +6.355 |
nevertheless | +6.210 |
Neg logit contributions | |
majority | -5.384 |
nation | -5.376 |
oret | -5.338 |
country | -5.307 |
inner | -5.137 |
Token | being |
Token ID | 852 |
Feature activation | -8.39e+00 |
Pos logit contributions | |
country | +9.501 |
majority | +9.446 |
nation | +9.404 |
inner | +9.143 |
oret | +9.022 |
Neg logit contributions | |
besides | -6.655 |
because | -6.629 |
nonetheless | -6.479 |
nevertheless | -6.272 |
regardless | -6.271 |
Token | a |
Token ID | 257 |
Feature activation | -2.04e+01 |
Pos logit contributions | |
country | +13.064 |
majority | +13.004 |
nation | +12.944 |
inner | +12.622 |
oret | +12.367 |
Neg logit contributions | |
besides | -9.388 |
because | -9.358 |
nonetheless | -9.130 |
regardless | -8.845 |
nevertheless | -8.837 |
Token | cathedral |
Token ID | 41756 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
country | +24.591 |
nation | +24.163 |
majority | +24.029 |
inner | +22.966 |
multitude | +22.884 |
Neg logit contributions | |
besides | -13.863 |
because | -13.418 |
nonetheless | -13.351 |
regardless | -12.910 |
nevertheless | -12.892 |
Token | , |
Token ID | 11 |
Feature activation | +8.27e+00 |
Pos logit contributions | |
majority | +0.164 |
country | +0.164 |
nation | +0.164 |
oret | +0.160 |
inner | +0.159 |
Neg logit contributions | |
because | -0.073 |
besides | -0.072 |
nonetheless | -0.068 |
regardless | -0.066 |
nevertheless | -0.065 |
Token | and |
Token ID | 290 |
Feature activation | +6.63e+00 |
Pos logit contributions | |
because | +9.766 |
besides | +9.473 |
regardless | +9.214 |
nonetheless | +9.207 |
nevertheless | +9.019 |
Neg logit contributions | |
country | -6.757 |
majority | -6.744 |
oret | -6.735 |
nation | -6.720 |
slightest | -6.412 |
Token | over |
Token ID | 625 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
because | +7.653 |
besides | +7.487 |
nonetheless | +7.303 |
regardless | +7.215 |
nevertheless | +7.147 |
Neg logit contributions | |
country | -5.857 |
majority | -5.856 |
nation | -5.829 |
oret | -5.791 |
inner | -5.578 |
Token | the |
Token ID | 262 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
majority | +1.539 |
nation | +1.535 |
country | +1.533 |
oret | +1.505 |
inner | +1.481 |
Neg logit contributions | |
because | -1.417 |
besides | -1.387 |
nonetheless | -1.350 |
regardless | -1.329 |
nevertheless | -1.312 |
Token | background |
Token ID | 4469 |
Feature activation | +5.60e+00 |
Pos logit contributions | |
country | +21.054 |
majority | +20.886 |
nation | +20.875 |
inner | +19.865 |
remainder | +19.770 |
Neg logit contributions | |
besides | -15.604 |
because | -15.337 |
nonetheless | -15.057 |
regardless | -14.626 |
nevertheless | -14.590 |
Token | noise |
Token ID | 7838 |
Feature activation | +7.46e+00 |
Pos logit contributions | |
because | +7.008 |
besides | +6.882 |
nonetheless | +6.691 |
regardless | +6.617 |
nevertheless | +6.551 |
Neg logit contributions | |
majority | -4.358 |
oret | -4.339 |
nation | -4.329 |
country | -4.306 |
inner | -4.154 |
Token | of |
Token ID | 286 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
because | +7.737 |
besides | +7.522 |
nonetheless | +7.252 |
regardless | +7.187 |
nevertheless | +7.024 |
Neg logit contributions | |
oret | -7.344 |
majority | -7.341 |
nation | -7.327 |
country | -7.304 |
inner | -7.036 |
Token | pagan |
Token ID | 36164 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
country | +12.813 |
majority | +12.751 |
nation | +12.717 |
inner | +12.324 |
oret | +12.068 |
Neg logit contributions | |
besides | -9.260 |
because | -9.188 |
nonetheless | -8.946 |
regardless | -8.730 |
nevertheless | -8.663 |
Token | priests |
Token ID | 17345 |
Feature activation | +5.71e+00 |
Pos logit contributions | |
country | +24.655 |
nation | +24.433 |
majority | +24.301 |
inner | +23.690 |
presence | +22.914 |
Neg logit contributions | |
besides | -12.728 |
because | -12.454 |
nonetheless | -12.152 |
regardless | -11.972 |
nevertheless | -11.725 |
Token |
|
Token ID | 198 |
Feature activation | +5.89e+00 |
Pos logit contributions | |
because | +13.076 |
besides | +12.701 |
nonetheless | +12.277 |
regardless | +12.110 |
nevertheless | +12.021 |
Neg logit contributions | |
nation | -9.570 |
country | -9.518 |
majority | -9.498 |
slightest | -9.188 |
oret | -9.115 |
Token |
|
Token ID | 198 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
besides | +3.093 |
because | +3.079 |
nonetheless | +2.938 |
regardless | +2.809 |
nevertheless | +2.783 |
Neg logit contributions | |
majority | -9.215 |
country | -9.211 |
nation | -9.188 |
oret | -8.983 |
inner | -8.929 |
Token | 4 |
Token ID | 19 |
Feature activation | +3.67e+00 |
Pos logit contributions | |
because | +1.356 |
besides | +1.337 |
nonetheless | +1.291 |
regardless | +1.262 |
nevertheless | +1.254 |
Neg logit contributions | |
country | -1.527 |
majority | -1.526 |
nation | -1.524 |
inner | -1.468 |
oret | -1.461 |
Token | . |
Token ID | 13 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
besides | +1.582 |
because | +1.573 |
nonetheless | +1.482 |
regardless | +1.402 |
nevertheless | +1.396 |
Neg logit contributions | |
majority | -6.086 |
country | -6.076 |
nation | -6.055 |
oret | -5.940 |
inner | -5.901 |
Token | Xen |
Token ID | 21173 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
majority | +12.585 |
country | +12.537 |
nation | +12.480 |
inner | +12.150 |
oret | +12.089 |
Neg logit contributions | |
besides | -9.881 |
because | -9.847 |
nonetheless | -9.646 |
regardless | -9.378 |
nevertheless | -9.349 |
Token | H |
Token ID | 367 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
majority | +19.863 |
country | +19.811 |
nation | +19.737 |
inner | +19.361 |
oret | +19.163 |
Neg logit contributions | |
besides | -10.724 |
because | -10.631 |
nonetheless | -10.375 |
regardless | -10.137 |
nevertheless | -10.019 |
Token | VM |
Token ID | 15996 |
Feature activation | -6.05e+00 |
Pos logit contributions | |
oret | +20.513 |
country | +20.405 |
majority | +20.333 |
nation | +20.145 |
inner | +19.981 |
Neg logit contributions | |
nonetheless | -14.012 |
besides | -13.925 |
nevertheless | -13.638 |
regardless | -13.511 |
because | -13.475 |
Token | 4 |
Token ID | 604 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
country | +6.215 |
majority | +6.215 |
nation | +6.183 |
inner | +5.972 |
oret | +5.945 |
Neg logit contributions | |
because | -6.250 |
besides | -6.216 |
nonetheless | -6.060 |
regardless | -5.930 |
nevertheless | -5.901 |
Token | . |
Token ID | 13 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
majority | +0.940 |
country | +0.940 |
nation | +0.939 |
oret | +0.920 |
inner | +0.915 |
Neg logit contributions | |
because | -0.225 |
besides | -0.217 |
nonetheless | -0.201 |
regardless | -0.191 |
nevertheless | -0.186 |
Token | 0 |
Token ID | 15 |
Feature activation | +5.58e+00 |
Pos logit contributions | |
majority | +1.313 |
country | +1.311 |
nation | +1.306 |
oret | +1.261 |
inner | +1.256 |
Neg logit contributions | |
because | -1.355 |
besides | -1.349 |
nonetheless | -1.313 |
regardless | -1.287 |
nevertheless | -1.279 |
Token | . |
Token ID | 13 |
Feature activation | +5.32e-01 |
Pos logit contributions | |
because | +4.962 |
besides | +4.820 |
nonetheless | +4.601 |
regardless | +4.545 |
nevertheless | +4.468 |
Neg logit contributions | |
nation | -6.474 |
majority | -6.429 |
country | -6.421 |
oret | -6.276 |
slightest | -6.162 |
Token | interested |
Token ID | 4609 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
country | +1.539 |
majority | +1.536 |
nation | +1.530 |
inner | +1.482 |
oret | +1.480 |
Neg logit contributions | |
because | -1.028 |
besides | -1.022 |
nonetheless | -0.987 |
regardless | -0.963 |
nevertheless | -0.955 |
Token | in |
Token ID | 287 |
Feature activation | -3.30e+00 |
Pos logit contributions | |
because | +16.982 |
besides | +16.254 |
nonetheless | +15.722 |
regardless | +15.509 |
nevertheless | +15.289 |
Neg logit contributions | |
majority | -12.732 |
nation | -12.412 |
country | -12.187 |
ses | -12.183 |
oret | -12.182 |
Token | ob |
Token ID | 909 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
country | +4.319 |
majority | +4.299 |
nation | +4.294 |
inner | +4.164 |
oret | +4.154 |
Neg logit contributions | |
because | -2.539 |
besides | -2.525 |
nonetheless | -2.431 |
regardless | -2.366 |
nevertheless | -2.344 |
Token | vi |
Token ID | 8903 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
country | +13.750 |
nation | +13.627 |
majority | +13.499 |
oret | +13.210 |
inner | +12.937 |
Neg logit contributions | |
besides | -11.418 |
because | -11.294 |
nonetheless | -11.239 |
regardless | -10.907 |
nevertheless | -10.866 |
Token | ating |
Token ID | 803 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
because | +2.931 |
besides | +2.879 |
nonetheless | +2.759 |
regardless | +2.746 |
nevertheless | +2.695 |
Neg logit contributions | |
majority | -2.018 |
country | -2.018 |
nation | -2.005 |
inner | -1.936 |
oret | -1.910 |
Token | a |
Token ID | 257 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
majority | +3.547 |
country | +3.545 |
nation | +3.535 |
oret | +3.442 |
inner | +3.435 |
Neg logit contributions | |
because | -1.827 |
besides | -1.805 |
nonetheless | -1.728 |
regardless | -1.679 |
nevertheless | -1.660 |
Token | star |
Token ID | 3491 |
Feature activation | -8.87e+00 |
Pos logit contributions | |
country | +28.181 |
nation | +27.899 |
majority | +27.776 |
inner | +26.291 |
primary | +26.225 |
Neg logit contributions | |
besides | -13.652 |
nonetheless | -13.009 |
nevertheless | -12.512 |
regardless | -12.495 |
because | -12.427 |
Token | system |
Token ID | 1080 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
country | +11.442 |
nation | +11.381 |
majority | +11.370 |
inner | +10.949 |
oret | +10.909 |
Neg logit contributions | |
besides | -6.487 |
because | -6.405 |
nonetheless | -6.292 |
nevertheless | -6.069 |
regardless | -6.046 |
Token | , |
Token ID | 11 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
because | +11.678 |
besides | +11.296 |
nonetheless | +10.858 |
regardless | +10.802 |
nevertheless | +10.636 |
Neg logit contributions | |
majority | -9.340 |
nation | -9.235 |
country | -9.234 |
oret | -9.165 |
inner | -8.882 |
Token | you |
Token ID | 345 |
Feature activation | +6.63e+00 |
Pos logit contributions | |
because | +19.227 |
besides | +18.713 |
regardless | +18.063 |
nonetheless | +18.001 |
nevertheless | +17.748 |
Neg logit contributions | |
oret | -9.451 |
majority | -9.382 |
nation | -9.222 |
country | -9.060 |
trio | -8.937 |
Token | might |
Token ID | 1244 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
because | +6.832 |
besides | +6.726 |
nonetheless | +6.552 |
regardless | +6.406 |
nevertheless | +6.390 |
Neg logit contributions | |
majority | -6.866 |
country | -6.818 |
nation | -6.810 |
oret | -6.631 |
inner | -6.568 |
Token | you |
Token ID | 345 |
Feature activation | +8.26e-01 |
Pos logit contributions | |
because | +1.047 |
besides | +1.034 |
nonetheless | +0.995 |
regardless | +0.969 |
nevertheless | +0.961 |
Neg logit contributions | |
majority | -1.707 |
country | -1.705 |
nation | -1.701 |
oret | -1.656 |
inner | -1.652 |
Token | want |
Token ID | 765 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
because | +0.798 |
besides | +0.791 |
nonetheless | +0.767 |
regardless | +0.751 |
nevertheless | +0.745 |
Neg logit contributions | |
majority | -0.924 |
country | -0.923 |
nation | -0.920 |
oret | -0.890 |
inner | -0.887 |
Token | to |
Token ID | 284 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
because | +14.059 |
besides | +13.584 |
regardless | +13.157 |
nonetheless | +13.106 |
nevertheless | +12.778 |
Neg logit contributions | |
majority | -10.341 |
nation | -10.257 |
slightest | -10.133 |
country | -10.021 |
inner | -10.003 |
Token | read |
Token ID | 1100 |
Feature activation | +8.98e+00 |
Pos logit contributions | |
country | +1.230 |
majority | +1.222 |
nation | +1.219 |
inner | +1.159 |
oret | +1.159 |
Neg logit contributions | |
because | -1.854 |
besides | -1.850 |
nonetheless | -1.803 |
regardless | -1.776 |
nevertheless | -1.764 |
Token | on |
Token ID | 319 |
Feature activation | -5.90e+00 |
Pos logit contributions | |
because | +9.450 |
besides | +9.213 |
regardless | +8.879 |
nonetheless | +8.848 |
nevertheless | +8.639 |
Neg logit contributions | |
majority | -8.945 |
nation | -8.876 |
country | -8.841 |
oret | -8.609 |
inner | -8.592 |
Token | the |
Token ID | 262 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
country | +7.032 |
majority | +7.015 |
nation | +6.974 |
inner | +6.763 |
oret | +6.755 |
Neg logit contributions | |
because | -5.101 |
besides | -5.079 |
nonetheless | -4.952 |
nevertheless | -4.790 |
regardless | -4.768 |
Token | Kindle |
Token ID | 27114 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
country | +24.045 |
majority | +23.922 |
nation | +23.639 |
inner | +23.233 |
largest | +23.034 |
Neg logit contributions | |
besides | -14.610 |
because | -14.505 |
nonetheless | -14.248 |
nevertheless | -13.874 |
regardless | -13.515 |
Token | , |
Token ID | 11 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
majority | +3.056 |
country | +3.056 |
nation | +3.047 |
oret | +2.971 |
inner | +2.966 |
Neg logit contributions | |
because | -1.301 |
besides | -1.286 |
nonetheless | -1.226 |
regardless | -1.183 |
nevertheless | -1.171 |
Token | but |
Token ID | 475 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
because | +12.790 |
besides | +12.514 |
regardless | +12.128 |
nonetheless | +12.044 |
nevertheless | +11.825 |
Neg logit contributions | |
nation | -9.518 |
majority | -9.503 |
country | -9.476 |
oret | -9.272 |
trio | -9.066 |
Token | they |
Token ID | 484 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
because | +11.321 |
besides | +11.042 |
nonetheless | +10.726 |
regardless | +10.548 |
nevertheless | +10.526 |
Neg logit contributions | |
nation | -9.270 |
majority | -9.170 |
country | -9.138 |
oret | -9.003 |
trio | -8.809 |
Token | won |
Token ID | 1839 |
Feature activation | +3.93e+00 |
Pos logit contributions | |
because | +1.164 |
besides | +1.145 |
nonetheless | +1.104 |
regardless | +1.075 |
nevertheless | +1.068 |
Neg logit contributions | |
country | -1.844 |
majority | -1.844 |
nation | -1.840 |
oret | -1.790 |
inner | -1.788 |