Token | and |
Token ID | 290 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
ullivan | +3.799 |
Hera | +3.786 |
asma | +3.766 |
enhagen | +3.710 |
eda | +3.701 |
Neg logit contributions | |
MX | -4.188 |
ovie | -3.874 |
oir | -3.712 |
resp | -3.514 |
butt | -3.479 |
Token | head |
Token ID | 1182 |
Feature activation | +9.25e-03 |
Pos logit contributions | |
ullivan | +3.866 |
asma | +3.830 |
enhagen | +3.818 |
Hera | +3.809 |
eda | +3.715 |
Neg logit contributions | |
MX | -4.046 |
ovie | -3.772 |
oir | -3.583 |
resp | -3.381 |
butt | -3.371 |
Token | of |
Token ID | 286 |
Feature activation | -5.54e-02 |
Pos logit contributions | |
ullivan | +0.107 |
enhagen | +0.105 |
asma | +0.103 |
Hera | +0.101 |
eda | +0.101 |
Neg logit contributions | |
MX | -0.105 |
ovie | -0.098 |
oir | -0.094 |
resp | -0.088 |
butt | -0.087 |
Token | the |
Token ID | 262 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
MX | +0.600 |
ovie | +0.560 |
oir | +0.531 |
resp | +0.497 |
butt | +0.496 |
Neg logit contributions | |
ullivan | -0.671 |
enhagen | -0.659 |
asma | -0.650 |
eda | -0.636 |
Hera | -0.635 |
Token | main |
Token ID | 1388 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
ullivan | +4.311 |
Hera | +4.270 |
enhagen | +4.259 |
asma | +4.242 |
eda | +4.160 |
Neg logit contributions | |
MX | -4.181 |
ovie | -3.857 |
oir | -3.739 |
resp | -3.492 |
butt | -3.467 |
Token | ruling |
Token ID | 6922 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
ullivan | +4.027 |
enhagen | +4.005 |
asma | +3.983 |
Hera | +3.965 |
eda | +3.896 |
Neg logit contributions | |
MX | -3.377 |
ovie | -3.104 |
oir | -2.979 |
resp | -2.761 |
butt | -2.742 |
Token | VM |
Token ID | 16990 |
Feature activation | +4.77e-01 |
Pos logit contributions | |
Hera | +12.670 |
asma | +12.095 |
ullivan | +11.632 |
Kol | +11.562 |
eda | +11.499 |
Neg logit contributions | |
MX | -13.774 |
ovie | -13.237 |
resp | -12.588 |
oir | -12.297 |
sburgh | -11.960 |
Token | RO |
Token ID | 13252 |
Feature activation | +9.57e-01 |
Pos logit contributions | |
Hera | +3.557 |
asma | +3.552 |
ullivan | +3.530 |
eda | +3.403 |
enhagen | +3.311 |
Neg logit contributions | |
MX | -6.815 |
ovie | -6.702 |
oir | -6.371 |
resp | -6.214 |
sburgh | -6.161 |
Token | D |
Token ID | 360 |
Feature activation | +3.88e-01 |
Pos logit contributions | |
asma | +10.182 |
Hera | +10.042 |
ullivan | +9.748 |
eda | +9.709 |
zl | +9.450 |
Neg logit contributions | |
MX | -9.030 |
ovie | -8.775 |
oir | -8.470 |
resp | -8.042 |
butt | -7.894 |
Token | PM |
Token ID | 5868 |
Feature activation | +2.80e-01 |
Pos logit contributions | |
asma | +4.732 |
ullivan | +4.685 |
eda | +4.641 |
enhagen | +4.511 |
Hera | +4.463 |
Neg logit contributions | |
MX | -3.942 |
ovie | -3.665 |
oir | -3.456 |
resp | -3.299 |
sburgh | -3.255 |
Token | NE |
Token ID | 12161 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
ullivan | +2.819 |
asma | +2.743 |
Hera | +2.702 |
enhagen | +2.685 |
eda | +2.616 |
Neg logit contributions | |
MX | -3.510 |
ovie | -3.344 |
oir | -3.159 |
sburgh | -3.059 |
resp | -3.033 |
Token | to |
Token ID | 284 |
Feature activation | +8.26e-02 |
Pos logit contributions | |
Hera | +5.507 |
ullivan | +5.477 |
asma | +5.476 |
eda | +5.415 |
enhagen | +5.389 |
Neg logit contributions | |
MX | -7.030 |
ovie | -6.430 |
oir | -6.119 |
sburgh | -5.873 |
resp | -5.817 |
Token | slay |
Token ID | 42596 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
ullivan | +0.923 |
enhagen | +0.907 |
asma | +0.896 |
Hera | +0.883 |
eda | +0.879 |
Neg logit contributions | |
MX | -0.968 |
ovie | -0.903 |
oir | -0.860 |
resp | -0.808 |
butt | -0.808 |
Token | , |
Token ID | 11 |
Feature activation | +7.28e-01 |
Pos logit contributions | |
ullivan | +2.792 |
enhagen | +2.744 |
asma | +2.710 |
Hera | +2.707 |
eda | +2.693 |
Neg logit contributions | |
MX | -2.932 |
ovie | -2.695 |
oir | -2.556 |
resp | -2.404 |
sburgh | -2.400 |
Token | even |
Token ID | 772 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
Hera | +7.206 |
eda | +6.994 |
ullivan | +6.982 |
asma | +6.797 |
enhagen | +6.670 |
Neg logit contributions | |
MX | -8.679 |
ovie | -7.942 |
oir | -7.538 |
sburgh | -7.134 |
butt | -7.072 |
Token | if |
Token ID | 611 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
ullivan | +1.220 |
enhagen | +1.200 |
asma | +1.186 |
Hera | +1.177 |
eda | +1.171 |
Neg logit contributions | |
MX | -1.083 |
ovie | -1.004 |
oir | -0.952 |
resp | -0.889 |
butt | -0.886 |
Token | I |
Token ID | 314 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
Hera | +4.001 |
ullivan | +3.999 |
asma | +3.906 |
enhagen | +3.897 |
eda | +3.892 |
Neg logit contributions | |
MX | -4.576 |
ovie | -4.273 |
oir | -4.027 |
resp | -3.800 |
butt | -3.787 |
Token | myself |
Token ID | 3589 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
Hera | +10.993 |
eda | +10.606 |
asma | +10.013 |
lication | +9.840 |
ullivan | +9.811 |
Neg logit contributions | |
MX | -16.157 |
ovie | -14.065 |
oir | -13.537 |
ーテ | -13.150 |
butt | -12.836 |
Token | am |
Token ID | 716 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
Hera | +9.327 |
eda | +8.921 |
ullivan | +8.664 |
asma | +8.603 |
lication | +8.442 |
Neg logit contributions | |
MX | -12.478 |
ovie | -11.172 |
oir | -10.509 |
sburgh | -10.110 |
resp | -9.920 |
Token | slain |
Token ID | 27029 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
ullivan | +0.270 |
enhagen | +0.266 |
asma | +0.262 |
Hera | +0.257 |
eda | +0.256 |
Neg logit contributions | |
MX | -0.294 |
ovie | -0.275 |
oir | -0.262 |
resp | -0.247 |
butt | -0.246 |
Token | . |
Token ID | 13 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
ullivan | +2.769 |
enhagen | +2.727 |
asma | +2.683 |
Hera | +2.679 |
eda | +2.656 |
Neg logit contributions | |
MX | -2.890 |
ovie | -2.661 |
oir | -2.510 |
resp | -2.389 |
sburgh | -2.364 |
Token |
|
Token ID | 198 |
Feature activation | -3.87e-02 |
Pos logit contributions | |
ullivan | +2.106 |
Hera | +2.069 |
asma | +2.063 |
enhagen | +2.051 |
eda | +2.037 |
Neg logit contributions | |
MX | -2.196 |
ovie | -2.054 |
oir | -1.942 |
resp | -1.825 |
butt | -1.825 |
Token | get |
Token ID | 651 |
Feature activation | +5.47e-01 |
Pos logit contributions | |
ullivan | +3.270 |
asma | +3.195 |
enhagen | +3.187 |
eda | +3.134 |
Hera | +3.083 |
Neg logit contributions | |
MX | -3.671 |
ovie | -3.436 |
oir | -3.247 |
resp | -3.067 |
butt | -3.033 |
Token | your |
Token ID | 534 |
Feature activation | +5.30e-01 |
Pos logit contributions | |
Hera | +5.305 |
enhagen | +5.292 |
asma | +5.279 |
eda | +5.262 |
ullivan | +5.234 |
Neg logit contributions | |
MX | -6.592 |
ovie | -6.152 |
oir | -5.925 |
sburgh | -5.648 |
resp | -5.546 |
Token | hands |
Token ID | 2832 |
Feature activation | +3.23e-01 |
Pos logit contributions | |
asma | +5.354 |
ullivan | +5.209 |
Hera | +5.176 |
enhagen | +5.130 |
eda | +5.064 |
Neg logit contributions | |
MX | -6.382 |
ovie | -5.924 |
oir | -5.692 |
resp | -5.386 |
sburgh | -5.349 |
Token | on |
Token ID | 319 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
ullivan | +3.573 |
enhagen | +3.514 |
asma | +3.478 |
eda | +3.384 |
Hera | +3.368 |
Neg logit contributions | |
MX | -3.765 |
ovie | -3.437 |
oir | -3.308 |
resp | -3.112 |
sburgh | -3.107 |
Token | a |
Token ID | 257 |
Feature activation | +7.48e-01 |
Pos logit contributions | |
ullivan | +3.639 |
enhagen | +3.603 |
asma | +3.538 |
eda | +3.517 |
Hera | +3.496 |
Neg logit contributions | |
MX | -3.912 |
ovie | -3.675 |
oir | -3.468 |
sburgh | -3.321 |
resp | -3.290 |
Token | beta |
Token ID | 12159 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
asma | +7.269 |
ullivan | +7.224 |
enhagen | +7.043 |
Hera | +7.020 |
eda | +7.016 |
Neg logit contributions | |
MX | -8.618 |
ovie | -8.179 |
oir | -7.772 |
sburgh | -7.424 |
butt | -7.379 |
Token | key |
Token ID | 1994 |
Feature activation | +4.40e-01 |
Pos logit contributions | |
asma | +12.167 |
ullivan | +12.010 |
eda | +11.780 |
enhagen | +11.590 |
Hera | +11.204 |
Neg logit contributions | |
MX | -13.507 |
ovie | -12.381 |
sburgh | -11.974 |
oir | -11.915 |
butt | -11.631 |
Token | yet |
Token ID | 1865 |
Feature activation | +4.58e-01 |
Pos logit contributions | |
ullivan | +4.680 |
enhagen | +4.600 |
eda | +4.498 |
asma | +4.473 |
Hera | +4.435 |
Neg logit contributions | |
MX | -5.219 |
ovie | -4.771 |
oir | -4.543 |
sburgh | -4.352 |
resp | -4.272 |
Token | you |
Token ID | 345 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
ullivan | +4.864 |
enhagen | +4.807 |
asma | +4.700 |
eda | +4.643 |
Hera | +4.599 |
Neg logit contributions | |
MX | -5.340 |
ovie | -4.956 |
oir | -4.696 |
resp | -4.500 |
butt | -4.481 |
Token | can |
Token ID | 460 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
ullivan | +1.730 |
enhagen | +1.707 |
asma | +1.687 |
eda | +1.646 |
Hera | +1.638 |
Neg logit contributions | |
MX | -1.935 |
ovie | -1.805 |
oir | -1.717 |
butt | -1.619 |
resp | -1.619 |
Token | still |
Token ID | 991 |
Feature activation | +6.13e-02 |
Pos logit contributions | |
MX | +2.276 |
ovie | +2.149 |
oir | +2.074 |
resp | +1.948 |
butt | +1.946 |
Neg logit contributions | |
ullivan | -1.826 |
enhagen | -1.811 |
asma | -1.763 |
Hera | -1.724 |
lication | -1.721 |
Token | � |
Token ID | 247 |
Feature activation | -6.25e-02 |
Pos logit contributions | |
MX | +0.231 |
ovie | +0.216 |
oir | +0.205 |
resp | +0.192 |
butt | +0.191 |
Neg logit contributions | |
ullivan | -0.251 |
enhagen | -0.248 |
asma | -0.244 |
Hera | -0.239 |
eda | -0.239 |
Token | t |
Token ID | 83 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
MX | +0.596 |
ovie | +0.549 |
oir | +0.521 |
resp | +0.479 |
butt | +0.478 |
Neg logit contributions | |
ullivan | -0.836 |
enhagen | -0.829 |
asma | -0.814 |
Hera | -0.802 |
eda | -0.797 |
Token | the |
Token ID | 262 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
MX | +1.987 |
ovie | +1.852 |
oir | +1.772 |
butt | +1.640 |
resp | +1.640 |
Neg logit contributions | |
ullivan | -2.214 |
enhagen | -2.181 |
asma | -2.135 |
eda | -2.093 |
Hera | -2.087 |
Token | be |
Token ID | 307 |
Feature activation | -6.63e-02 |
Pos logit contributions | |
MX | +2.582 |
ovie | +2.398 |
oir | +2.295 |
resp | +2.128 |
butt | +2.109 |
Neg logit contributions | |
ullivan | -2.962 |
enhagen | -2.908 |
asma | -2.871 |
eda | -2.807 |
lication | -2.791 |
Token | all |
Token ID | 477 |
Feature activation | +7.49e-01 |
Pos logit contributions | |
MX | +0.717 |
ovie | +0.669 |
oir | +0.637 |
resp | +0.597 |
butt | +0.593 |
Neg logit contributions | |
ullivan | -0.801 |
enhagen | -0.790 |
asma | -0.776 |
Hera | -0.761 |
eda | -0.760 |
Token | and |
Token ID | 290 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
ullivan | +7.265 |
enhagen | +6.961 |
eda | +6.948 |
Hera | +6.896 |
asma | +6.771 |
Neg logit contributions | |
MX | -9.009 |
ovie | -8.489 |
oir | -7.858 |
resp | -7.820 |
sburgh | -7.554 |
Token | end |
Token ID | 886 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
Hera | +9.064 |
eda | +8.330 |
ullivan | +8.214 |
asma | +7.825 |
aza | +7.725 |
Neg logit contributions | |
MX | -17.532 |
ovie | -17.077 |
resp | -15.620 |
sburgh | -15.430 |
oir | -15.407 |
Token | all |
Token ID | 477 |
Feature activation | +3.39e-01 |
Pos logit contributions | |
ullivan | +8.399 |
eda | +8.007 |
asma | +7.896 |
Hera | +7.757 |
enhagen | +7.341 |
Neg logit contributions | |
MX | -16.472 |
ovie | -15.152 |
sburgh | -14.541 |
resp | -14.025 |
oir | -13.666 |
Token | . |
Token ID | 13 |
Feature activation | -6.92e-02 |
Pos logit contributions | |
ullivan | +3.591 |
enhagen | +3.547 |
asma | +3.485 |
Hera | +3.450 |
eda | +3.420 |
Neg logit contributions | |
MX | -4.017 |
ovie | -3.756 |
oir | -3.590 |
resp | -3.409 |
sburgh | -3.378 |
Token | It |
Token ID | 632 |
Feature activation | +4.98e-02 |
Pos logit contributions | |
MX | +0.777 |
ovie | +0.726 |
oir | +0.692 |
resp | +0.646 |
butt | +0.644 |
Neg logit contributions | |
ullivan | -0.811 |
enhagen | -0.800 |
asma | -0.783 |
eda | -0.768 |
Hera | -0.766 |
Token | is |
Token ID | 318 |
Feature activation | -5.24e-02 |
Pos logit contributions | |
ullivan | +0.630 |
enhagen | +0.623 |
asma | +0.613 |
eda | +0.602 |
Hera | +0.602 |
Neg logit contributions | |
MX | -0.512 |
ovie | -0.473 |
oir | -0.446 |
resp | -0.416 |
butt | -0.414 |
Token | s |
Token ID | 264 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
MX | +1.339 |
ovie | +1.224 |
oir | +1.163 |
resp | +1.067 |
butt | +1.063 |
Neg logit contributions | |
ullivan | -1.948 |
enhagen | -1.925 |
asma | -1.903 |
eda | -1.861 |
Hera | -1.853 |
Token | . |
Token ID | 13 |
Feature activation | +2.50e-02 |
Pos logit contributions | |
ullivan | +1.673 |
asma | +1.629 |
enhagen | +1.609 |
eda | +1.605 |
Hera | +1.602 |
Neg logit contributions | |
MX | -1.583 |
ovie | -1.491 |
oir | -1.410 |
resp | -1.317 |
butt | -1.308 |
Token | t |
Token ID | 83 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
ullivan | +0.327 |
enhagen | +0.321 |
asma | +0.318 |
eda | +0.312 |
Hera | +0.312 |
Neg logit contributions | |
MX | -0.245 |
ovie | -0.227 |
oir | -0.214 |
resp | -0.198 |
butt | -0.196 |
Token | . |
Token ID | 13 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
ullivan | +2.687 |
asma | +2.634 |
Hera | +2.598 |
eda | +2.591 |
enhagen | +2.548 |
Neg logit contributions | |
MX | -2.726 |
ovie | -2.589 |
oir | -2.444 |
resp | -2.287 |
butt | -2.275 |
Token | F |
Token ID | 376 |
Feature activation | -4.52e-01 |
Pos logit contributions | |
MX | +3.206 |
ovie | +2.893 |
oir | +2.747 |
resp | +2.567 |
butt | +2.564 |
Neg logit contributions | |
ullivan | -3.982 |
enhagen | -3.949 |
asma | -3.847 |
eda | -3.761 |
lication | -3.758 |
Token | RA |
Token ID | 3861 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
MX | +3.267 |
ovie | +2.655 |
oir | +2.630 |
resp | +2.302 |
butt | +2.194 |
Neg logit contributions | |
enhagen | -7.218 |
ullivan | -7.054 |
asma | -6.889 |
lication | -6.849 |
Hera | -6.802 |
Token | 19 |
Token ID | 678 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
enhagen | +8.649 |
Hera | +8.118 |
ullivan | +7.774 |
eda | +7.577 |
lication | +7.553 |
Neg logit contributions | |
ovie | -16.189 |
MX | -15.862 |
oir | -15.517 |
iaries | -15.273 |
resp | -15.134 |
Token | William |
Token ID | 3977 |
Feature activation | -6.43e-02 |
Pos logit contributions | |
ullivan | +1.425 |
enhagen | +1.397 |
asma | +1.388 |
Hera | +1.381 |
eda | +1.365 |
Neg logit contributions | |
MX | -1.417 |
ovie | -1.328 |
oir | -1.262 |
resp | -1.190 |
butt | -1.181 |
Token | Bon |
Token ID | 7979 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
MX | +0.756 |
ovie | +0.711 |
oir | +0.684 |
resp | +0.638 |
butt | +0.637 |
Neg logit contributions | |
ullivan | -0.716 |
enhagen | -0.706 |
asma | -0.691 |
Hera | -0.674 |
eda | -0.672 |
Token | net |
Token ID | 3262 |
Feature activation | -4.21e-02 |
Pos logit contributions | |
ullivan | +1.475 |
enhagen | +1.454 |
asma | +1.420 |
eda | +1.418 |
Hera | +1.389 |
Neg logit contributions | |
MX | -1.658 |
ovie | -1.536 |
oir | -1.451 |
resp | -1.385 |
butt | -1.380 |
Token | ( |
Token ID | 357 |
Feature activation | -2.99e-03 |
Pos logit contributions | |
MX | +0.446 |
ovie | +0.415 |
oir | +0.395 |
resp | +0.367 |
butt | +0.366 |
Neg logit contributions | |
ullivan | -0.521 |
enhagen | -0.512 |
asma | -0.505 |
Hera | -0.495 |
eda | -0.495 |
Token |
|
Token ID | 198 |
Feature activation | +5.03e-01 |
Pos logit contributions | |
MX | +1.918 |
ovie | +1.740 |
oir | +1.657 |
resp | +1.560 |
butt | +1.551 |
Neg logit contributions | |
enhagen | -2.371 |
ullivan | -2.355 |
asma | -2.259 |
Hera | -2.218 |
eda | -2.205 |
Token | ADVERTISEMENT |
Token ID | 19053 |
Feature activation | +4.55e-01 |
Pos logit contributions | |
ullivan | +5.508 |
asma | +5.457 |
eda | +5.402 |
lication | +5.288 |
enhagen | +5.171 |
Neg logit contributions | |
MX | -5.308 |
ovie | -5.186 |
oir | -4.865 |
sburgh | -4.679 |
iaries | -4.505 |
Token |
|
Token ID | 198 |
Feature activation | +6.65e-02 |
Pos logit contributions | |
ullivan | +4.653 |
asma | +4.619 |
enhagen | +4.603 |
Hera | +4.561 |
eda | +4.422 |
Neg logit contributions | |
MX | -5.345 |
ovie | -5.086 |
oir | -4.770 |
resp | -4.592 |
butt | -4.570 |
Token |
|
Token ID | 198 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
ullivan | +0.768 |
enhagen | +0.748 |
asma | +0.748 |
Hera | +0.735 |
eda | +0.734 |
Neg logit contributions | |
MX | -0.748 |
ovie | -0.704 |
oir | -0.668 |
resp | -0.625 |
butt | -0.622 |
Token | � |
Token ID | 447 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
ullivan | +6.665 |
asma | +6.641 |
eda | +6.510 |
lication | +6.424 |
zl | +6.249 |
Neg logit contributions | |
MX | -7.066 |
ovie | -6.994 |
oir | -6.498 |
sburgh | -6.375 |
iaries | -6.200 |
Token | � |
Token ID | 250 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
ullivan | +1.985 |
enhagen | +1.938 |
asma | +1.896 |
eda | +1.876 |
Hera | +1.857 |
Neg logit contributions | |
MX | -2.525 |
ovie | -2.394 |
oir | -2.280 |
resp | -2.144 |
butt | -2.139 |
Token | What |
Token ID | 2061 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
eda | +11.373 |
ullivan | +11.367 |
asma | +11.292 |
lication | +11.246 |
zl | +11.073 |
Neg logit contributions | |
MX | -12.474 |
ovie | -12.461 |
oir | -11.364 |
sburgh | -11.351 |
arcity | -11.225 |
Token | � |
Token ID | 447 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
asma | +6.070 |
ullivan | +6.058 |
eda | +6.031 |
enhagen | +6.002 |
Hera | +5.901 |
Neg logit contributions | |
MX | -7.103 |
ovie | -6.648 |
oir | -6.228 |
resp | -6.031 |
sburgh | -5.891 |
Token | � |
Token ID | 247 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
ullivan | +1.318 |
enhagen | +1.292 |
asma | +1.268 |
eda | +1.253 |
Hera | +1.237 |
Neg logit contributions | |
MX | -1.756 |
ovie | -1.660 |
oir | -1.581 |
resp | -1.497 |
butt | -1.492 |
Token | s |
Token ID | 82 |
Feature activation | +4.79e-01 |
Pos logit contributions | |
ullivan | +4.245 |
enhagen | +4.219 |
eda | +4.167 |
asma | +4.147 |
Hera | +4.064 |
Neg logit contributions | |
MX | -4.138 |
ovie | -3.819 |
oir | -3.614 |
resp | -3.405 |
butt | -3.351 |
Token | important |
Token ID | 1593 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
ullivan | +5.131 |
enhagen | +5.007 |
asma | +4.984 |
Hera | +4.901 |
eda | +4.856 |
Neg logit contributions | |
MX | -5.511 |
ovie | -5.162 |
oir | -4.911 |
sburgh | -4.692 |
resp | -4.668 |
Token | – |
Token ID | 784 |
Feature activation | +9.06e-02 |
Pos logit contributions | |
MX | +0.606 |
ovie | +0.567 |
oir | +0.541 |
resp | +0.507 |
butt | +0.505 |
Neg logit contributions | |
ullivan | -0.621 |
enhagen | -0.610 |
asma | -0.600 |
Hera | -0.588 |
eda | -0.586 |
Token | who |
Token ID | 508 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
ullivan | +1.050 |
enhagen | +1.033 |
asma | +1.019 |
Hera | +1.004 |
eda | +0.999 |
Neg logit contributions | |
MX | -1.019 |
ovie | -0.952 |
oir | -0.908 |
resp | -0.853 |
butt | -0.847 |
Token | comes |
Token ID | 2058 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
MX | +1.507 |
ovie | +1.410 |
oir | +1.342 |
resp | +1.255 |
butt | +1.252 |
Neg logit contributions | |
ullivan | -1.655 |
enhagen | -1.632 |
asma | -1.591 |
eda | -1.560 |
Hera | -1.553 |
Token | from |
Token ID | 422 |
Feature activation | +4.80e-01 |
Pos logit contributions | |
MX | +2.959 |
ovie | +2.743 |
oir | +2.628 |
butt | +2.438 |
resp | +2.424 |
Neg logit contributions | |
ullivan | -3.629 |
enhagen | -3.579 |
asma | -3.516 |
eda | -3.442 |
lication | -3.432 |
Token | the |
Token ID | 262 |
Feature activation | +7.95e-01 |
Pos logit contributions | |
Hera | +5.106 |
ullivan | +5.012 |
asma | +4.948 |
enhagen | +4.941 |
eda | +4.905 |
Neg logit contributions | |
MX | -5.573 |
ovie | -5.199 |
oir | -5.045 |
resp | -4.737 |
butt | -4.652 |
Token | opposition |
Token ID | 5471 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
Hera | +8.378 |
asma | +8.034 |
ullivan | +7.948 |
eda | +7.917 |
enhagen | +7.860 |
Neg logit contributions | |
MX | -8.678 |
ovie | -8.086 |
oir | -7.951 |
resp | -7.400 |
butt | -7.347 |
Token | – |
Token ID | 784 |
Feature activation | -6.79e-02 |
Pos logit contributions | |
Hera | +12.392 |
asma | +11.703 |
ullivan | +11.543 |
eda | +11.158 |
enhagen | +10.787 |
Neg logit contributions | |
MX | -13.017 |
ovie | -12.823 |
oir | -12.321 |
resp | -11.805 |
butt | -11.512 |
Token | later |
Token ID | 1568 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
MX | +0.770 |
ovie | +0.720 |
oir | +0.687 |
resp | +0.644 |
butt | +0.643 |
Neg logit contributions | |
ullivan | -0.786 |
enhagen | -0.773 |
asma | -0.760 |
eda | -0.743 |
Hera | -0.743 |
Token | clarified |
Token ID | 28464 |
Feature activation | -1.44e-01 |
Pos logit contributions | |
ullivan | +0.210 |
enhagen | +0.207 |
asma | +0.204 |
Hera | +0.200 |
eda | +0.199 |
Neg logit contributions | |
MX | -0.214 |
ovie | -0.200 |
oir | -0.191 |
resp | -0.180 |
butt | -0.179 |
Token | that |
Token ID | 326 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
MX | +1.598 |
ovie | +1.492 |
oir | +1.418 |
butt | +1.333 |
resp | +1.327 |
Neg logit contributions | |
ullivan | -1.696 |
enhagen | -1.671 |
asma | -1.635 |
eda | -1.599 |
lication | -1.587 |
Token | the |
Token ID | 262 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
ullivan | +1.241 |
enhagen | +1.214 |
asma | +1.204 |
Hera | +1.194 |
eda | +1.182 |
Neg logit contributions | |
MX | -1.248 |
ovie | -1.163 |
oir | -1.114 |
resp | -1.043 |
butt | -1.035 |
Token | was |
Token ID | 373 |
Feature activation | -7.49e-01 |
Pos logit contributions | |
MX | +4.954 |
ovie | +4.689 |
oir | +4.534 |
butt | +4.181 |
sburgh | +4.094 |
Neg logit contributions | |
ullivan | -6.301 |
asma | -6.144 |
enhagen | -6.129 |
lication | -5.945 |
eda | -5.873 |
Token | bad |
Token ID | 2089 |
Feature activation | -9.46e-01 |
Pos logit contributions | |
MX | +7.339 |
ovie | +6.978 |
oir | +6.740 |
butt | +6.064 |
pa | +5.995 |
Neg logit contributions | |
ullivan | -8.789 |
enhagen | -8.738 |
asma | -8.668 |
lication | -8.544 |
rocal | -8.241 |
Token | , |
Token ID | 11 |
Feature activation | -2.88e-01 |
Pos logit contributions | |
MX | +8.485 |
ovie | +8.106 |
oir | +7.530 |
butt | +7.404 |
pa | +7.350 |
Neg logit contributions | |
ullivan | -11.004 |
enhagen | -10.979 |
asma | -10.855 |
lication | -10.763 |
rocal | -10.667 |
Token | but |
Token ID | 475 |
Feature activation | -3.29e-01 |
Pos logit contributions | |
MX | +3.020 |
ovie | +2.834 |
oir | +2.690 |
butt | +2.513 |
resp | +2.479 |
Neg logit contributions | |
ullivan | -3.529 |
enhagen | -3.505 |
asma | -3.458 |
lication | -3.359 |
eda | -3.333 |
Token | he |
Token ID | 339 |
Feature activation | -3.57e-01 |
Pos logit contributions | |
MX | +3.403 |
ovie | +3.204 |
oir | +3.055 |
butt | +2.859 |
resp | +2.791 |
Neg logit contributions | |
ullivan | -4.042 |
enhagen | -3.994 |
asma | -3.939 |
lication | -3.813 |
eda | -3.785 |
Token | p |
Token ID | 279 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
MX | +3.648 |
ovie | +3.433 |
oir | +3.309 |
resp | +3.074 |
butt | +3.057 |
Neg logit contributions | |
ullivan | -4.395 |
enhagen | -4.347 |
asma | -4.266 |
lication | -4.140 |
Hera | -4.128 |
Token | ales |
Token ID | 2040 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
eda | +13.826 |
enhagen | +13.543 |
ullivan | +13.384 |
asma | +13.326 |
lication | +12.713 |
Neg logit contributions | |
MX | -11.863 |
ovie | -10.768 |
sburgh | -9.518 |
oir | -9.470 |
resp | -9.244 |
Token | in |
Token ID | 287 |
Feature activation | +8.63e-02 |
Pos logit contributions | |
ullivan | +2.081 |
enhagen | +2.029 |
asma | +2.005 |
eda | +1.982 |
Hera | +1.970 |
Neg logit contributions | |
MX | -2.041 |
ovie | -1.887 |
oir | -1.803 |
resp | -1.705 |
butt | -1.699 |
Token | com |
Token ID | 401 |
Feature activation | -3.25e-01 |
Pos logit contributions | |
ullivan | +0.988 |
enhagen | +0.970 |
asma | +0.952 |
Hera | +0.935 |
eda | +0.934 |
Neg logit contributions | |
MX | -0.991 |
ovie | -0.924 |
oir | -0.879 |
resp | -0.830 |
butt | -0.826 |
Token | |
Token ID | 3907 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
MX | +3.418 |
ovie | +3.259 |
oir | +3.122 |
resp | +2.923 |
butt | +2.811 |
Neg logit contributions | |
ullivan | -3.915 |
enhagen | -3.829 |
asma | -3.804 |
Hera | -3.783 |
eda | -3.669 |
Token | par |
Token ID | 1845 |
Feature activation | -5.37e-01 |
Pos logit contributions | |
MX | +1.173 |
ovie | +1.088 |
oir | +1.039 |
resp | +0.969 |
butt | +0.968 |
Neg logit contributions | |
ullivan | -1.397 |
enhagen | -1.365 |
asma | -1.356 |
Hera | -1.336 |
eda | -1.328 |
Token | , |
Token ID | 11 |
Feature activation | -6.34e-02 |
Pos logit contributions | |
ullivan | +0.288 |
enhagen | +0.284 |
asma | +0.280 |
Hera | +0.275 |
eda | +0.275 |
Neg logit contributions | |
MX | -0.259 |
ovie | -0.241 |
oir | -0.229 |
resp | -0.215 |
butt | -0.214 |
Token | and |
Token ID | 290 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
MX | +0.682 |
ovie | +0.634 |
oir | +0.601 |
resp | +0.562 |
butt | +0.559 |
Neg logit contributions | |
ullivan | -0.774 |
enhagen | -0.762 |
asma | -0.750 |
Hera | -0.734 |
eda | -0.733 |
Token | Ambassador |
Token ID | 20656 |
Feature activation | -6.09e-01 |
Pos logit contributions | |
MX | +5.461 |
ovie | +4.999 |
oir | +4.727 |
resp | +4.404 |
butt | +4.367 |
Neg logit contributions | |
enhagen | -7.033 |
ullivan | -7.025 |
asma | -6.747 |
lication | -6.676 |
eda | -6.546 |
Token | Sand |
Token ID | 3837 |
Feature activation | -4.05e-01 |
Pos logit contributions | |
MX | +4.535 |
ovie | +4.174 |
oir | +3.986 |
resp | +3.571 |
butt | +3.473 |
Neg logit contributions | |
ullivan | -8.798 |
enhagen | -8.765 |
asma | -8.533 |
eda | -8.516 |
lication | -8.386 |
Token | erson |
Token ID | 882 |
Feature activation | -4.52e-01 |
Pos logit contributions | |
MX | +3.663 |
ovie | +3.335 |
oir | +3.293 |
butt | +3.083 |
resp | +3.030 |
Neg logit contributions | |
ullivan | -5.436 |
enhagen | -5.414 |
Hera | -5.301 |
asma | -5.271 |
lication | -5.172 |
Token | ab |
Token ID | 450 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
MX | +4.506 |
ovie | +4.327 |
oir | +4.076 |
butt | +3.807 |
sburgh | +3.746 |
Neg logit contributions | |
ullivan | -5.597 |
enhagen | -5.447 |
asma | -5.354 |
Hera | -5.278 |
lication | -5.226 |
Token | et |
Token ID | 316 |
Feature activation | +1.90e-01 |
Pos logit contributions | |
eda | +11.241 |
ullivan | +10.917 |
asma | +10.567 |
enhagen | +10.473 |
Hera | +9.832 |
Neg logit contributions | |
MX | -14.303 |
ovie | -13.676 |
sburgh | -13.178 |
oir | -12.452 |
ーテ | -12.180 |
Token | ted |
Token ID | 1513 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
ullivan | +1.205 |
enhagen | +1.159 |
eda | +1.134 |
asma | +1.128 |
Hera | +1.117 |
Neg logit contributions | |
MX | -3.128 |
ovie | -2.971 |
oir | -2.866 |
resp | -2.750 |
butt | -2.731 |
Token | U |
Token ID | 471 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
MX | +3.739 |
ovie | +3.486 |
oir | +3.279 |
butt | +3.071 |
resp | +3.064 |
Neg logit contributions | |
ullivan | -4.442 |
enhagen | -4.416 |
asma | -4.303 |
eda | -4.189 |
lication | -4.187 |
Token | . |
Token ID | 13 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
ullivan | +1.493 |
asma | +1.456 |
enhagen | +1.447 |
eda | +1.439 |
Hera | +1.426 |
Neg logit contributions | |
MX | -1.377 |
ovie | -1.304 |
oir | -1.229 |
resp | -1.149 |
butt | -1.139 |
Token | S |
Token ID | 50 |
Feature activation | +4.32e-02 |
Pos logit contributions | |
MX | +1.269 |
ovie | +1.152 |
oir | +1.097 |
resp | +1.026 |
butt | +1.024 |
Neg logit contributions | |
ullivan | -1.560 |
enhagen | -1.555 |
asma | -1.514 |
Hera | -1.474 |
eda | -1.472 |
Token | you |
Token ID | 345 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
ullivan | +0.117 |
enhagen | +0.115 |
asma | +0.113 |
Hera | +0.111 |
eda | +0.111 |
Neg logit contributions | |
MX | -0.105 |
ovie | -0.098 |
oir | -0.093 |
resp | -0.087 |
butt | -0.087 |
Token | have |
Token ID | 423 |
Feature activation | +5.34e-02 |
Pos logit contributions | |
ullivan | +2.307 |
asma | +2.256 |
enhagen | +2.251 |
Hera | +2.214 |
eda | +2.211 |
Neg logit contributions | |
MX | -2.342 |
ovie | -2.176 |
oir | -2.074 |
resp | -1.959 |
butt | -1.938 |
Token | a |
Token ID | 257 |
Feature activation | +5.21e-01 |
Pos logit contributions | |
ullivan | +0.548 |
enhagen | +0.537 |
asma | +0.530 |
Hera | +0.519 |
eda | +0.516 |
Neg logit contributions | |
MX | -0.675 |
ovie | -0.637 |
oir | -0.609 |
resp | -0.578 |
butt | -0.573 |
Token | moment |
Token ID | 2589 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
ullivan | +6.164 |
asma | +6.040 |
Hera | +5.999 |
enhagen | +5.891 |
eda | +5.835 |
Neg logit contributions | |
MX | -5.248 |
ovie | -5.103 |
oir | -4.702 |
resp | -4.449 |
butt | -4.323 |
Token | , |
Token ID | 11 |
Feature activation | +7.06e-01 |
Pos logit contributions | |
ullivan | +1.184 |
enhagen | +1.169 |
asma | +1.153 |
Hera | +1.129 |
eda | +1.123 |
Neg logit contributions | |
MX | -1.163 |
ovie | -1.084 |
oir | -1.031 |
resp | -0.970 |
butt | -0.968 |
Token | please |
Token ID | 3387 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
ullivan | +6.845 |
Hera | +6.784 |
asma | +6.600 |
enhagen | +6.562 |
eda | +6.547 |
Neg logit contributions | |
MX | -8.219 |
ovie | -7.880 |
oir | -7.534 |
resp | -7.132 |
butt | -6.995 |
Token | help |
Token ID | 1037 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
Hera | +10.010 |
ullivan | +9.990 |
eda | +9.810 |
asma | +9.207 |
cone | +9.157 |
Neg logit contributions | |
MX | -14.457 |
ovie | -13.967 |
oir | -13.185 |
resp | -12.792 |
ャ | -12.573 |
Token | spread |
Token ID | 4104 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
MX | +2.702 |
ovie | +2.440 |
oir | +2.339 |
butt | +2.171 |
resp | +2.122 |
Neg logit contributions | |
ullivan | -3.831 |
enhagen | -3.768 |
asma | -3.700 |
lication | -3.659 |
eda | -3.617 |
Token | the |
Token ID | 262 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
MX | +0.131 |
ovie | +0.122 |
oir | +0.116 |
resp | +0.108 |
butt | +0.108 |
Neg logit contributions | |
ullivan | -0.143 |
enhagen | -0.141 |
asma | -0.139 |
Hera | -0.136 |
eda | -0.136 |
Token | word |
Token ID | 1573 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
MX | +3.142 |
ovie | +2.786 |
oir | +2.612 |
butt | +2.463 |
sburgh | +2.379 |
Neg logit contributions | |
ullivan | -5.821 |
enhagen | -5.753 |
asma | -5.638 |
eda | -5.589 |
lication | -5.523 |
Token | about |
Token ID | 546 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
MX | +0.235 |
ovie | +0.219 |
oir | +0.209 |
resp | +0.195 |
butt | +0.195 |
Neg logit contributions | |
ullivan | -0.251 |
enhagen | -0.247 |
asma | -0.244 |
Hera | -0.239 |
eda | -0.239 |
Token | members |
Token ID | 1866 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
ullivan | +3.372 |
asma | +3.325 |
eda | +3.306 |
enhagen | +3.285 |
Hera | +3.268 |
Neg logit contributions | |
MX | -3.819 |
ovie | -3.625 |
oir | -3.510 |
resp | -3.261 |
sburgh | -3.229 |
Token | a |
Token ID | 257 |
Feature activation | +5.65e-01 |
Pos logit contributions | |
ullivan | +2.924 |
enhagen | +2.866 |
asma | +2.814 |
eda | +2.794 |
Hera | +2.788 |
Neg logit contributions | |
MX | -2.757 |
ovie | -2.589 |
oir | -2.476 |
resp | -2.296 |
sburgh | -2.279 |
Token | one |
Token ID | 530 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
ullivan | +5.763 |
Hera | +5.614 |
enhagen | +5.586 |
asma | +5.518 |
eda | +5.475 |
Neg logit contributions | |
MX | -6.586 |
ovie | -6.267 |
oir | -5.995 |
sburgh | -5.543 |
resp | -5.536 |
Token | - |
Token ID | 12 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
ullivan | +1.711 |
enhagen | +1.682 |
asma | +1.658 |
Hera | +1.634 |
eda | +1.628 |
Neg logit contributions | |
MX | -1.694 |
ovie | -1.586 |
oir | -1.523 |
butt | -1.408 |
resp | -1.406 |
Token | month |
Token ID | 8424 |
Feature activation | +7.92e-01 |
Pos logit contributions | |
ullivan | +2.772 |
enhagen | +2.733 |
asma | +2.707 |
eda | +2.670 |
Hera | +2.646 |
Neg logit contributions | |
MX | -2.705 |
ovie | -2.516 |
oir | -2.432 |
resp | -2.206 |
sburgh | -2.202 |
Token | free |
Token ID | 1479 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
Hera | +7.132 |
lication | +7.051 |
ullivan | +6.996 |
eda | +6.991 |
enhagen | +6.796 |
Neg logit contributions | |
MX | -9.450 |
ovie | -9.007 |
oir | -8.597 |
iaries | -8.037 |
resp | -7.872 |
Token | trial |
Token ID | 4473 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
Hera | +8.360 |
lication | +8.306 |
ullivan | +8.297 |
asma | +7.965 |
eda | +7.902 |
Neg logit contributions | |
MX | -15.896 |
ovie | -15.095 |
oir | -14.955 |
iaries | -13.926 |
sburgh | -13.712 |
Token | of |
Token ID | 286 |
Feature activation | +4.26e-01 |
Pos logit contributions | |
Hera | +8.705 |
eda | +8.503 |
ullivan | +8.486 |
lication | +8.198 |
enhagen | +8.045 |
Neg logit contributions | |
MX | -13.426 |
ovie | -12.858 |
oir | -12.352 |
sburgh | -11.762 |
resp | -11.683 |
Token | S |
Token ID | 311 |
Feature activation | +9.48e-01 |
Pos logit contributions | |
ullivan | +4.256 |
enhagen | +4.203 |
Hera | +4.151 |
eda | +4.114 |
asma | +4.055 |
Neg logit contributions | |
MX | -5.211 |
ovie | -4.837 |
oir | -4.734 |
resp | -4.435 |
butt | -4.420 |
Token | ling |
Token ID | 1359 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
eda | +5.560 |
ullivan | +5.405 |
lication | +5.221 |
asma | +5.204 |
cone | +5.141 |
Neg logit contributions | |
MX | -13.863 |
ovie | -13.089 |
oir | -12.850 |
ーテ | -12.835 |
� | -12.621 |
Token | TV |
Token ID | 3195 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
ullivan | +2.967 |
enhagen | +2.927 |
asma | +2.918 |
Hera | +2.868 |
eda | +2.864 |
Neg logit contributions | |
MX | -4.455 |
ovie | -4.202 |
oir | -4.100 |
resp | -3.916 |
butt | -3.851 |
Token | harm |
Token ID | 4419 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
Hera | +4.506 |
ullivan | +4.444 |
asma | +4.403 |
lication | +4.342 |
eda | +4.312 |
Neg logit contributions | |
MX | -6.008 |
ovie | -5.647 |
oir | -5.315 |
butt | -4.919 |
resp | -4.869 |
Token | but |
Token ID | 475 |
Feature activation | +6.15e-01 |
Pos logit contributions | |
ullivan | +1.421 |
enhagen | +1.408 |
asma | +1.382 |
Hera | +1.364 |
eda | +1.363 |
Neg logit contributions | |
MX | -1.376 |
ovie | -1.278 |
oir | -1.219 |
resp | -1.137 |
butt | -1.134 |
Token | this |
Token ID | 428 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
eda | +6.143 |
Hera | +6.006 |
ullivan | +5.993 |
enhagen | +5.931 |
asma | +5.773 |
Neg logit contributions | |
MX | -7.411 |
ovie | -6.789 |
oir | -6.582 |
sburgh | -6.131 |
resp | -6.092 |
Token | charge |
Token ID | 3877 |
Feature activation | +9.54e-02 |
Pos logit contributions | |
ullivan | +2.657 |
enhagen | +2.608 |
asma | +2.587 |
Hera | +2.567 |
eda | +2.564 |
Neg logit contributions | |
MX | -2.633 |
ovie | -2.441 |
oir | -2.331 |
resp | -2.182 |
sburgh | -2.163 |
Token | was |
Token ID | 373 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
ullivan | +1.070 |
enhagen | +1.056 |
asma | +1.039 |
Hera | +1.023 |
eda | +1.022 |
Neg logit contributions | |
MX | -1.113 |
ovie | -1.037 |
oir | -0.988 |
resp | -0.925 |
butt | -0.923 |
Token | later |
Token ID | 1568 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
Hera | +8.107 |
eda | +7.905 |
ullivan | +7.722 |
enhagen | +7.389 |
asma | +7.195 |
Neg logit contributions | |
MX | -13.637 |
ovie | -12.766 |
oir | -12.163 |
resp | -12.031 |
sburgh | -11.800 |
Token | dismissed |
Token ID | 11126 |
Feature activation | -1.38e-02 |
Pos logit contributions | |
eda | +8.204 |
Hera | +8.142 |
ullivan | +7.790 |
enhagen | +7.678 |
cone | +7.414 |
Neg logit contributions | |
MX | -16.196 |
ovie | -15.254 |
oir | -14.763 |
resp | -14.318 |
sburgh | -14.269 |
Token | by |
Token ID | 416 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
MX | +0.152 |
ovie | +0.142 |
oir | +0.135 |
resp | +0.126 |
butt | +0.126 |
Neg logit contributions | |
ullivan | -0.164 |
enhagen | -0.162 |
asma | -0.159 |
Hera | -0.156 |
eda | -0.156 |
Token | the |
Token ID | 262 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
ullivan | +4.855 |
enhagen | +4.752 |
Hera | +4.679 |
eda | +4.679 |
asma | +4.662 |
Neg logit contributions | |
MX | -5.125 |
ovie | -4.713 |
oir | -4.542 |
resp | -4.317 |
sburgh | -4.223 |
Token | Judge |
Token ID | 8974 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
ullivan | +6.165 |
enhagen | +6.088 |
Hera | +6.046 |
asma | +5.984 |
eda | +5.921 |
Neg logit contributions | |
MX | -6.162 |
ovie | -5.642 |
oir | -5.366 |
resp | -5.074 |
butt | -5.058 |
Token | due |
Token ID | 2233 |
Feature activation | -3.68e-01 |
Pos logit contributions | |
ullivan | +2.941 |
enhagen | +2.880 |
asma | +2.834 |
eda | +2.828 |
Hera | +2.805 |
Neg logit contributions | |
MX | -2.952 |
ovie | -2.722 |
oir | -2.627 |
resp | -2.465 |
butt | -2.452 |
Token | " |
Token ID | 1 |
Feature activation | +5.82e-01 |
Pos logit contributions | |
enhagen | +3.615 |
ullivan | +3.599 |
asma | +3.576 |
eda | +3.542 |
Hera | +3.521 |
Neg logit contributions | |
MX | -3.665 |
ovie | -3.418 |
oir | -3.288 |
resp | -3.121 |
butt | -3.070 |
Token | Blu |
Token ID | 12391 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
ullivan | +6.097 |
Hera | +6.029 |
eda | +6.019 |
enhagen | +6.016 |
asma | +5.951 |
Neg logit contributions | |
MX | -6.481 |
ovie | -5.927 |
oir | -5.920 |
resp | -5.564 |
butt | -5.503 |
Token | - |
Token ID | 12 |
Feature activation | -5.77e-02 |
Pos logit contributions | |
ullivan | +1.627 |
enhagen | +1.600 |
asma | +1.585 |
eda | +1.554 |
Hera | +1.549 |
Neg logit contributions | |
MX | -1.558 |
ovie | -1.449 |
oir | -1.380 |
butt | -1.302 |
resp | -1.302 |
Token | Ray |
Token ID | 19591 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
MX | +0.180 |
ovie | +0.135 |
oir | +0.108 |
resp | +0.072 |
butt | +0.069 |
Neg logit contributions | |
ullivan | -1.144 |
enhagen | -1.134 |
asma | -1.122 |
Hera | -1.109 |
eda | -1.108 |
Token | : |
Token ID | 25 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
ullivan | +2.825 |
enhagen | +2.797 |
asma | +2.741 |
Hera | +2.738 |
eda | +2.735 |
Neg logit contributions | |
MX | -2.954 |
ovie | -2.769 |
oir | -2.664 |
resp | -2.520 |
butt | -2.490 |
Token | Sky |
Token ID | 5274 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
enhagen | +4.159 |
ullivan | +4.138 |
asma | +4.046 |
Hera | +4.043 |
eda | +4.013 |
Neg logit contributions | |
MX | -4.285 |
ovie | -4.025 |
oir | -3.897 |
resp | -3.637 |
sburgh | -3.627 |
Token | fall |
Token ID | 7207 |
Feature activation | +6.20e-01 |
Pos logit contributions | |
enhagen | +7.116 |
asma | +6.657 |
Hera | +6.643 |
eda | +6.421 |
ullivan | +6.341 |
Neg logit contributions | |
MX | -17.159 |
ovie | -16.698 |
oir | -15.636 |
resp | -15.356 |
sburgh | -15.234 |
Token | ( |
Token ID | 357 |
Feature activation | +8.10e-02 |
Pos logit contributions | |
enhagen | +6.617 |
asma | +6.443 |
eda | +6.432 |
Hera | +6.369 |
ullivan | +6.358 |
Neg logit contributions | |
MX | -6.759 |
ovie | -6.200 |
oir | -6.155 |
resp | -5.810 |
butt | -5.713 |
Token | Blu |
Token ID | 38676 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
ullivan | +0.936 |
enhagen | +0.926 |
asma | +0.910 |
eda | +0.895 |
Hera | +0.893 |
Neg logit contributions | |
MX | -0.908 |
ovie | -0.850 |
oir | -0.813 |
resp | -0.759 |
butt | -0.756 |
Token | - |
Token ID | 12 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
ullivan | +2.245 |
enhagen | +2.212 |
asma | +2.194 |
eda | +2.159 |
Hera | +2.134 |
Neg logit contributions | |
MX | -2.186 |
ovie | -2.025 |
oir | -1.932 |
resp | -1.832 |
butt | -1.825 |
Token | ray |
Token ID | 2433 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
MX | +0.639 |
ovie | +0.492 |
oir | +0.404 |
resp | +0.289 |
butt | +0.274 |
Neg logit contributions | |
ullivan | -3.677 |
enhagen | -3.641 |
asma | -3.596 |
Hera | -3.562 |
eda | -3.541 |
Token | slowly |
Token ID | 6364 |
Feature activation | +2.19e-01 |
Pos logit contributions | |
ullivan | +0.597 |
enhagen | +0.586 |
asma | +0.578 |
Hera | +0.568 |
eda | +0.566 |
Neg logit contributions | |
MX | -0.578 |
ovie | -0.541 |
oir | -0.514 |
resp | -0.483 |
butt | -0.481 |
Token | along |
Token ID | 1863 |
Feature activation | +4.54e-01 |
Pos logit contributions | |
ullivan | +2.454 |
enhagen | +2.430 |
asma | +2.407 |
Hera | +2.385 |
eda | +2.361 |
Neg logit contributions | |
MX | -2.525 |
ovie | -2.362 |
oir | -2.267 |
resp | -2.119 |
butt | -2.092 |
Token | the |
Token ID | 262 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
enhagen | +4.827 |
ullivan | +4.816 |
asma | +4.804 |
Hera | +4.753 |
eda | +4.719 |
Neg logit contributions | |
MX | -5.221 |
ovie | -5.006 |
oir | -4.644 |
resp | -4.388 |
butt | -4.388 |
Token | city |
Token ID | 1748 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
ullivan | +1.691 |
enhagen | +1.674 |
asma | +1.653 |
Hera | +1.626 |
eda | +1.618 |
Neg logit contributions | |
MX | -1.533 |
ovie | -1.436 |
oir | -1.355 |
butt | -1.270 |
resp | -1.264 |
Token | 's |
Token ID | 338 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
ullivan | +1.652 |
enhagen | +1.645 |
asma | +1.623 |
Hera | +1.597 |
eda | +1.590 |
Neg logit contributions | |
MX | -1.523 |
ovie | -1.426 |
oir | -1.349 |
resp | -1.261 |
butt | -1.256 |
Token | broad |
Token ID | 3154 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
ullivan | +6.575 |
asma | +6.537 |
Hera | +6.530 |
enhagen | +6.498 |
eda | +6.393 |
Neg logit contributions | |
MX | -6.553 |
ovie | -6.362 |
oir | -5.770 |
butt | -5.500 |
resp | -5.396 |
Token | bou |
Token ID | 35833 |
Feature activation | +7.35e-01 |
Pos logit contributions | |
asma | +11.857 |
eda | +11.737 |
enhagen | +11.424 |
aza | +11.419 |
ullivan | +11.227 |
Neg logit contributions | |
MX | -12.525 |
ovie | -12.142 |
oir | -10.859 |
iaries | -10.620 |
resp | -10.513 |
Token | lev |
Token ID | 2768 |
Feature activation | -1.38e-02 |
Pos logit contributions | |
eda | +6.163 |
asma | +6.158 |
enhagen | +6.003 |
cone | +5.925 |
rocal | +5.843 |
Neg logit contributions | |
MX | -9.967 |
ovie | -9.454 |
oir | -8.638 |
sburgh | -8.631 |
iaries | -8.176 |
Token | ards |
Token ID | 1371 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
MX | +0.164 |
ovie | +0.154 |
oir | +0.147 |
resp | +0.138 |
butt | +0.138 |
Neg logit contributions | |
ullivan | -0.153 |
enhagen | -0.150 |
asma | -0.148 |
Hera | -0.145 |
eda | -0.145 |
Token | in |
Token ID | 287 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
MX | +2.732 |
ovie | +2.535 |
oir | +2.414 |
resp | +2.258 |
butt | +2.249 |
Neg logit contributions | |
ullivan | -3.371 |
enhagen | -3.282 |
asma | -3.232 |
Hera | -3.164 |
eda | -3.153 |
Token | support |
Token ID | 1104 |
Feature activation | -3.00e-01 |
Pos logit contributions | |
ullivan | +2.618 |
asma | +2.564 |
enhagen | +2.563 |
Hera | +2.525 |
eda | +2.511 |
Neg logit contributions | |
MX | -2.380 |
ovie | -2.218 |
oir | -2.107 |
butt | -1.970 |
resp | -1.968 |
Token | of |
Token ID | 286 |
Feature activation | +8.81e-02 |
Pos logit contributions | |
MX | +0.161 |
ovie | +0.151 |
oir | +0.144 |
resp | +0.135 |
butt | +0.134 |
Neg logit contributions | |
ullivan | -0.166 |
enhagen | -0.164 |
asma | -0.161 |
Hera | -0.158 |
eda | -0.158 |
Token | workers |
Token ID | 3259 |
Feature activation | -6.62e-02 |
Pos logit contributions | |
ullivan | +1.022 |
enhagen | +1.005 |
asma | +0.991 |
Hera | +0.982 |
eda | +0.973 |
Neg logit contributions | |
MX | -0.993 |
ovie | -0.926 |
oir | -0.878 |
resp | -0.827 |
butt | -0.826 |
Token | , |
Token ID | 11 |
Feature activation | -7.31e-02 |
Pos logit contributions | |
MX | +0.714 |
ovie | +0.665 |
oir | +0.633 |
resp | +0.591 |
butt | +0.588 |
Neg logit contributions | |
ullivan | -0.805 |
enhagen | -0.791 |
asma | -0.780 |
Hera | -0.764 |
eda | -0.762 |
Token | politicians |
Token ID | 7602 |
Feature activation | +3.04e-02 |
Pos logit contributions | |
MX | +0.817 |
ovie | +0.762 |
oir | +0.727 |
resp | +0.681 |
butt | +0.676 |
Neg logit contributions | |
ullivan | -0.860 |
enhagen | -0.846 |
asma | -0.833 |
Hera | -0.815 |
eda | -0.815 |
Token | who |
Token ID | 508 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
ullivan | +0.348 |
enhagen | +0.343 |
asma | +0.337 |
Hera | +0.331 |
eda | +0.331 |
Neg logit contributions | |
MX | -0.349 |
ovie | -0.326 |
oir | -0.311 |
resp | -0.292 |
butt | -0.291 |
Token | p |
Token ID | 279 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ullivan | +2.170 |
enhagen | +2.119 |
asma | +2.111 |
eda | +2.077 |
Hera | +2.074 |
Neg logit contributions | |
MX | -2.289 |
ovie | -2.121 |
oir | -2.031 |
resp | -1.907 |
butt | -1.900 |
Token | ander |
Token ID | 4066 |
Feature activation | +2.62e-01 |
Pos logit contributions | |
ullivan | +10.192 |
eda | +10.141 |
asma | +10.052 |
enhagen | +10.027 |
rocal | +9.246 |
Neg logit contributions | |
MX | -14.440 |
ovie | -12.782 |
ーテ | -12.542 |
oir | -12.375 |
sburgh | -12.318 |
Token | to |
Token ID | 284 |
Feature activation | +4.82e-01 |
Pos logit contributions | |
ullivan | +2.754 |
enhagen | +2.713 |
asma | +2.675 |
Hera | +2.631 |
eda | +2.613 |
Neg logit contributions | |
MX | -3.184 |
ovie | -2.995 |
oir | -2.801 |
resp | -2.713 |
butt | -2.651 |
Token | donors |
Token ID | 13334 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
ullivan | +5.012 |
Hera | +4.970 |
eda | +4.856 |
enhagen | +4.818 |
asma | +4.813 |
Neg logit contributions | |
MX | -5.694 |
ovie | -5.206 |
oir | -4.931 |
resp | -4.903 |
butt | -4.793 |
Token | not |
Token ID | 407 |
Feature activation | -4.52e-03 |
Pos logit contributions | |
ullivan | +2.229 |
enhagen | +2.205 |
asma | +2.166 |
Hera | +2.131 |
eda | +2.129 |
Neg logit contributions | |
MX | -2.305 |
ovie | -2.150 |
oir | -2.045 |
resp | -1.939 |
butt | -1.918 |
Token | voters |
Token ID | 4446 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
MX | +0.052 |
ovie | +0.049 |
oir | +0.046 |
resp | +0.044 |
butt | +0.043 |
Neg logit contributions | |
ullivan | -0.052 |
enhagen | -0.051 |
asma | -0.050 |
Hera | -0.049 |
eda | -0.049 |
Token | One |
Token ID | 3198 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
ullivan | +2.189 |
enhagen | +2.148 |
asma | +2.130 |
Hera | +2.103 |
eda | +2.093 |
Neg logit contributions | |
MX | -2.128 |
ovie | -2.000 |
oir | -1.905 |
resp | -1.810 |
butt | -1.782 |
Token | which |
Token ID | 543 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
ullivan | +1.525 |
enhagen | +1.509 |
asma | +1.487 |
eda | +1.466 |
Hera | +1.458 |
Neg logit contributions | |
MX | -1.500 |
ovie | -1.408 |
oir | -1.336 |
resp | -1.265 |
butt | -1.252 |
Token | is |
Token ID | 318 |
Feature activation | -5.78e-02 |
Pos logit contributions | |
MX | +1.558 |
ovie | +1.463 |
oir | +1.392 |
resp | +1.298 |
butt | +1.297 |
Neg logit contributions | |
ullivan | -1.638 |
enhagen | -1.612 |
asma | -1.578 |
eda | -1.540 |
Hera | -1.539 |
Token | almost |
Token ID | 2048 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
MX | +0.655 |
ovie | +0.613 |
oir | +0.583 |
resp | +0.545 |
butt | +0.545 |
Neg logit contributions | |
ullivan | -0.672 |
enhagen | -0.661 |
asma | -0.650 |
eda | -0.636 |
Hera | -0.635 |
Token | universally |
Token ID | 26208 |
Feature activation | +8.55e-02 |
Pos logit contributions | |
ullivan | +1.344 |
enhagen | +1.327 |
asma | +1.310 |
Hera | +1.293 |
eda | +1.286 |
Neg logit contributions | |
MX | -1.343 |
ovie | -1.259 |
oir | -1.203 |
resp | -1.130 |
butt | -1.124 |
Token | p |
Token ID | 279 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ullivan | +0.944 |
enhagen | +0.930 |
asma | +0.917 |
Hera | +0.902 |
eda | +0.898 |
Neg logit contributions | |
MX | -1.012 |
ovie | -0.946 |
oir | -0.903 |
resp | -0.854 |
butt | -0.846 |
Token | anned |
Token ID | 3577 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
enhagen | +10.620 |
eda | +10.376 |
asma | +10.347 |
ullivan | +9.874 |
lication | +9.792 |
Neg logit contributions | |
MX | -14.209 |
ovie | -13.093 |
oir | -12.201 |
resp | -11.725 |
ーテ | -11.631 |
Token | by |
Token ID | 416 |
Feature activation | +7.53e-02 |
Pos logit contributions | |
MX | +1.466 |
ovie | +1.373 |
oir | +1.301 |
butt | +1.207 |
resp | +1.204 |
Neg logit contributions | |
ullivan | -1.696 |
enhagen | -1.668 |
asma | -1.635 |
Hera | -1.603 |
eda | -1.600 |
Token | Indian |
Token ID | 3942 |
Feature activation | -4.75e-01 |
Pos logit contributions | |
ullivan | +0.895 |
enhagen | +0.883 |
asma | +0.871 |
Hera | +0.856 |
eda | +0.854 |
Neg logit contributions | |
MX | -0.827 |
ovie | -0.766 |
oir | -0.730 |
resp | -0.689 |
butt | -0.683 |
Token | critics |
Token ID | 9188 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
MX | +4.698 |
ovie | +4.388 |
oir | +4.194 |
butt | +3.823 |
sburgh | +3.749 |
Neg logit contributions | |
ullivan | -6.072 |
enhagen | -5.941 |
asma | -5.732 |
rocal | -5.722 |
lication | -5.649 |
Token | for |
Token ID | 329 |
Feature activation | -3.64e-02 |
Pos logit contributions | |
ullivan | +1.612 |
enhagen | +1.591 |
asma | +1.568 |
Hera | +1.545 |
eda | +1.542 |
Neg logit contributions | |
MX | -1.551 |
ovie | -1.434 |
oir | -1.367 |
resp | -1.294 |
butt | -1.285 |
Token | t |
Token ID | 83 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
MX | +0.596 |
ovie | +0.549 |
oir | +0.521 |
resp | +0.479 |
butt | +0.478 |
Neg logit contributions | |
ullivan | -0.836 |
enhagen | -0.829 |
asma | -0.814 |
Hera | -0.802 |
eda | -0.797 |
Token | the |
Token ID | 262 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
MX | +1.987 |
ovie | +1.852 |
oir | +1.772 |
butt | +1.640 |
resp | +1.640 |
Neg logit contributions | |
ullivan | -2.214 |
enhagen | -2.181 |
asma | -2.135 |
eda | -2.093 |
Hera | -2.087 |
Token | be |
Token ID | 307 |
Feature activation | -6.63e-02 |
Pos logit contributions | |
MX | +2.582 |
ovie | +2.398 |
oir | +2.295 |
resp | +2.128 |
butt | +2.109 |
Neg logit contributions | |
ullivan | -2.962 |
enhagen | -2.908 |
asma | -2.871 |
eda | -2.807 |
lication | -2.791 |
Token | all |
Token ID | 477 |
Feature activation | +7.49e-01 |
Pos logit contributions | |
MX | +0.717 |
ovie | +0.669 |
oir | +0.637 |
resp | +0.597 |
butt | +0.593 |
Neg logit contributions | |
ullivan | -0.801 |
enhagen | -0.790 |
asma | -0.776 |
Hera | -0.761 |
eda | -0.760 |
Token | and |
Token ID | 290 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
ullivan | +7.265 |
enhagen | +6.961 |
eda | +6.948 |
Hera | +6.896 |
asma | +6.771 |
Neg logit contributions | |
MX | -9.009 |
ovie | -8.489 |
oir | -7.858 |
resp | -7.820 |
sburgh | -7.554 |
Token | end |
Token ID | 886 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
Hera | +9.064 |
eda | +8.330 |
ullivan | +8.214 |
asma | +7.825 |
aza | +7.725 |
Neg logit contributions | |
MX | -17.532 |
ovie | -17.077 |
resp | -15.620 |
sburgh | -15.430 |
oir | -15.407 |
Token | all |
Token ID | 477 |
Feature activation | +3.39e-01 |
Pos logit contributions | |
ullivan | +8.399 |
eda | +8.007 |
asma | +7.896 |
Hera | +7.757 |
enhagen | +7.341 |
Neg logit contributions | |
MX | -16.472 |
ovie | -15.152 |
sburgh | -14.541 |
resp | -14.025 |
oir | -13.666 |
Token | . |
Token ID | 13 |
Feature activation | -6.92e-02 |
Pos logit contributions | |
ullivan | +3.591 |
enhagen | +3.547 |
asma | +3.485 |
Hera | +3.450 |
eda | +3.420 |
Neg logit contributions | |
MX | -4.017 |
ovie | -3.756 |
oir | -3.590 |
resp | -3.409 |
sburgh | -3.378 |
Token | It |
Token ID | 632 |
Feature activation | +4.98e-02 |
Pos logit contributions | |
MX | +0.777 |
ovie | +0.726 |
oir | +0.692 |
resp | +0.646 |
butt | +0.644 |
Neg logit contributions | |
ullivan | -0.811 |
enhagen | -0.800 |
asma | -0.783 |
eda | -0.768 |
Hera | -0.766 |
Token | is |
Token ID | 318 |
Feature activation | -5.24e-02 |
Pos logit contributions | |
ullivan | +0.630 |
enhagen | +0.623 |
asma | +0.613 |
eda | +0.602 |
Hera | +0.602 |
Neg logit contributions | |
MX | -0.512 |
ovie | -0.473 |
oir | -0.446 |
resp | -0.416 |
butt | -0.414 |
Token | a |
Token ID | 257 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
MX | +0.564 |
ovie | +0.526 |
oir | +0.501 |
resp | +0.466 |
butt | +0.465 |
Neg logit contributions | |
ullivan | -0.637 |
enhagen | -0.626 |
asma | -0.617 |
Hera | -0.606 |
eda | -0.604 |
Token | Sh |
Token ID | 911 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
MX | +0.668 |
ovie | +0.621 |
oir | +0.590 |
resp | +0.544 |
butt | +0.543 |
Neg logit contributions | |
ullivan | -0.898 |
enhagen | -0.884 |
asma | -0.871 |
Hera | -0.856 |
eda | -0.852 |
Token | atter |
Token ID | 1436 |
Feature activation | -7.49e-03 |
Pos logit contributions | |
MX | +1.532 |
ovie | +1.447 |
oir | +1.376 |
resp | +1.282 |
butt | +1.269 |
Neg logit contributions | |
ullivan | -1.815 |
enhagen | -1.803 |
asma | -1.760 |
Hera | -1.755 |
eda | -1.726 |
Token | gone |
Token ID | 3750 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
MX | +0.093 |
ovie | +0.087 |
oir | +0.084 |
resp | +0.079 |
butt | +0.079 |
Neg logit contributions | |
ullivan | -0.079 |
enhagen | -0.077 |
asma | -0.076 |
Hera | -0.074 |
eda | -0.074 |
Token | through |
Token ID | 832 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
MX | +1.981 |
ovie | +1.861 |
oir | +1.770 |
butt | +1.647 |
resp | +1.644 |
Neg logit contributions | |
ullivan | -2.201 |
enhagen | -2.167 |
asma | -2.135 |
Hera | -2.096 |
lication | -2.093 |
Token | the |
Token ID | 262 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
ullivan | +1.217 |
enhagen | +1.197 |
asma | +1.174 |
Hera | +1.159 |
eda | +1.155 |
Neg logit contributions | |
MX | -1.198 |
ovie | -1.116 |
oir | -1.071 |
resp | -1.004 |
butt | -0.991 |
Token | washing |
Token ID | 20518 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
ullivan | +2.950 |
enhagen | +2.856 |
asma | +2.845 |
Hera | +2.816 |
eda | +2.800 |
Neg logit contributions | |
MX | -3.029 |
ovie | -2.825 |
oir | -2.691 |
resp | -2.574 |
butt | -2.525 |
Token | machine |
Token ID | 4572 |
Feature activation | +5.63e-01 |
Pos logit contributions | |
ullivan | +7.865 |
cone | +7.554 |
Hera | +7.400 |
eda | +7.276 |
asma | +7.260 |
Neg logit contributions | |
MX | -16.224 |
ovie | -15.623 |
oir | -15.062 |
resp | -14.571 |
sburgh | -14.132 |
Token | a |
Token ID | 257 |
Feature activation | +9.92e-02 |
Pos logit contributions | |
ullivan | +5.769 |
enhagen | +5.745 |
asma | +5.640 |
Hera | +5.601 |
eda | +5.501 |
Neg logit contributions | |
MX | -6.656 |
ovie | -6.128 |
oir | -5.774 |
resp | -5.599 |
sburgh | -5.510 |
Token | few |
Token ID | 1178 |
Feature activation | +4.06e-03 |
Pos logit contributions | |
ullivan | +1.103 |
enhagen | +1.074 |
asma | +1.068 |
Hera | +1.045 |
eda | +1.045 |
Neg logit contributions | |
MX | -1.168 |
ovie | -1.098 |
oir | -1.044 |
resp | -0.985 |
butt | -0.981 |
Token | too |
Token ID | 1165 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
ullivan | +0.052 |
enhagen | +0.051 |
asma | +0.050 |
Hera | +0.049 |
eda | +0.049 |
Neg logit contributions | |
MX | -0.041 |
ovie | -0.038 |
oir | -0.036 |
resp | -0.034 |
butt | -0.034 |
Token | many |
Token ID | 867 |
Feature activation | -6.76e-02 |
Pos logit contributions | |
MX | +2.798 |
ovie | +2.645 |
oir | +2.533 |
resp | +2.359 |
butt | +2.335 |
Neg logit contributions | |
enhagen | -2.849 |
ullivan | -2.827 |
asma | -2.794 |
Hera | -2.712 |
lication | -2.707 |
Token | seen |
Token ID | 1775 |
Feature activation | -9.46e-02 |
Pos logit contributions | |
enhagen | +3.822 |
ullivan | +3.801 |
asma | +3.690 |
eda | +3.671 |
Hera | +3.631 |
Neg logit contributions | |
MX | -3.692 |
ovie | -3.441 |
oir | -3.289 |
resp | -3.104 |
butt | -3.051 |
Token | is |
Token ID | 318 |
Feature activation | -7.69e-03 |
Pos logit contributions | |
MX | +1.048 |
ovie | +0.979 |
oir | +0.931 |
resp | +0.871 |
butt | +0.870 |
Neg logit contributions | |
ullivan | -1.119 |
enhagen | -1.100 |
asma | -1.085 |
Hera | -1.062 |
eda | -1.061 |
Token | a |
Token ID | 257 |
Feature activation | -5.64e-02 |
Pos logit contributions | |
MX | +0.087 |
ovie | +0.082 |
oir | +0.078 |
resp | +0.073 |
butt | +0.073 |
Neg logit contributions | |
ullivan | -0.089 |
enhagen | -0.088 |
asma | -0.086 |
Hera | -0.084 |
eda | -0.084 |
Token | willingness |
Token ID | 16826 |
Feature activation | +7.29e-02 |
Pos logit contributions | |
MX | +0.659 |
ovie | +0.615 |
oir | +0.588 |
resp | +0.553 |
butt | +0.551 |
Neg logit contributions | |
ullivan | -0.635 |
enhagen | -0.625 |
asma | -0.614 |
eda | -0.601 |
Hera | -0.600 |
Token | to |
Token ID | 284 |
Feature activation | +3.50e-01 |
Pos logit contributions | |
ullivan | +0.825 |
enhagen | +0.814 |
asma | +0.800 |
Hera | +0.783 |
eda | +0.781 |
Neg logit contributions | |
MX | -0.842 |
ovie | -0.790 |
oir | -0.751 |
resp | -0.710 |
butt | -0.701 |
Token | p |
Token ID | 279 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
ullivan | +3.746 |
asma | +3.657 |
enhagen | +3.633 |
Hera | +3.594 |
eda | +3.551 |
Neg logit contributions | |
MX | -4.148 |
ovie | -3.869 |
oir | -3.704 |
resp | -3.484 |
sburgh | -3.437 |
Token | ander |
Token ID | 4066 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
asma | +10.390 |
eda | +10.247 |
ullivan | +10.150 |
enhagen | +10.056 |
rocal | +9.415 |
Neg logit contributions | |
MX | -13.746 |
ovie | -12.089 |
oir | -11.914 |
sburgh | -11.788 |
ーテ | -11.656 |
Token | without |
Token ID | 1231 |
Feature activation | +4.00e-01 |
Pos logit contributions | |
ullivan | +2.599 |
enhagen | +2.572 |
asma | +2.538 |
Hera | +2.477 |
eda | +2.473 |
Neg logit contributions | |
MX | -2.866 |
ovie | -2.685 |
oir | -2.534 |
resp | -2.431 |
sburgh | -2.363 |
Token | constraint |
Token ID | 32315 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
asma | +4.239 |
ullivan | +4.233 |
enhagen | +4.229 |
Hera | +4.197 |
lication | +4.086 |
Neg logit contributions | |
MX | -4.708 |
ovie | -4.380 |
oir | -4.224 |
butt | -3.955 |
resp | -3.938 |
Token | or |
Token ID | 393 |
Feature activation | +6.08e-01 |
Pos logit contributions | |
ullivan | +2.513 |
enhagen | +2.507 |
asma | +2.459 |
eda | +2.410 |
Hera | +2.404 |
Neg logit contributions | |
MX | -2.655 |
ovie | -2.484 |
oir | -2.346 |
resp | -2.237 |
butt | -2.192 |
Token | embarrassment |
Token ID | 24655 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
Hera | +6.312 |
asma | +6.237 |
enhagen | +6.140 |
ullivan | +6.104 |
lication | +6.098 |
Neg logit contributions | |
MX | -6.961 |
ovie | -6.518 |
oir | -6.248 |
butt | -5.841 |
sburgh | -5.822 |
Token | the |
Token ID | 262 |
Feature activation | +2.05e-01 |
Pos logit contributions | |
ullivan | +3.470 |
enhagen | +3.460 |
asma | +3.352 |
Hera | +3.351 |
eda | +3.287 |
Neg logit contributions | |
MX | -5.587 |
ovie | -5.345 |
oir | -5.119 |
resp | -4.995 |
sburgh | -4.890 |
Token | empty |
Token ID | 6565 |
Feature activation | +4.29e-01 |
Pos logit contributions | |
ullivan | +2.171 |
enhagen | +2.143 |
asma | +2.109 |
Hera | +2.097 |
eda | +2.063 |
Neg logit contributions | |
MX | -2.453 |
ovie | -2.303 |
oir | -2.218 |
resp | -2.095 |
butt | -2.081 |
Token | holder |
Token ID | 15762 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
ullivan | +4.419 |
enhagen | +4.314 |
asma | +4.303 |
Hera | +4.267 |
lication | +4.184 |
Neg logit contributions | |
MX | -5.141 |
ovie | -4.716 |
oir | -4.554 |
resp | -4.346 |
butt | -4.317 |
Token | designated |
Token ID | 11032 |
Feature activation | +7.64e-02 |
Pos logit contributions | |
ullivan | +1.801 |
enhagen | +1.778 |
asma | +1.737 |
Hera | +1.718 |
eda | +1.704 |
Neg logit contributions | |
MX | -1.883 |
ovie | -1.761 |
oir | -1.682 |
resp | -1.583 |
butt | -1.570 |
Token | " |
Token ID | 366 |
Feature activation | +4.61e-01 |
Pos logit contributions | |
ullivan | +0.857 |
enhagen | +0.844 |
asma | +0.830 |
Hera | +0.817 |
eda | +0.812 |
Neg logit contributions | |
MX | -0.889 |
ovie | -0.832 |
oir | -0.797 |
resp | -0.747 |
butt | -0.745 |
Token | Sky |
Token ID | 22308 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
ullivan | +5.022 |
enhagen | +4.965 |
asma | +4.962 |
Hera | +4.920 |
eda | +4.916 |
Neg logit contributions | |
MX | -4.926 |
ovie | -4.717 |
oir | -4.571 |
sburgh | -4.250 |
resp | -4.146 |
Token | fall |
Token ID | 7207 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
enhagen | +7.249 |
Hera | +6.980 |
asma | +6.888 |
ullivan | +6.818 |
eda | +6.741 |
Neg logit contributions | |
MX | -15.960 |
ovie | -15.338 |
oir | -14.551 |
sburgh | -14.069 |
resp | -14.052 |
Token | " |
Token ID | 1 |
Feature activation | +4.02e-01 |
Pos logit contributions | |
ullivan | +1.541 |
enhagen | +1.527 |
asma | +1.505 |
eda | +1.480 |
Hera | +1.479 |
Neg logit contributions | |
MX | -1.454 |
ovie | -1.357 |
oir | -1.298 |
resp | -1.218 |
butt | -1.210 |
Token | --- |
Token ID | 6329 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
ullivan | +4.293 |
enhagen | +4.279 |
asma | +4.149 |
Hera | +4.140 |
eda | +4.088 |
Neg logit contributions | |
MX | -4.609 |
ovie | -4.324 |
oir | -4.253 |
butt | -3.943 |
resp | -3.932 |
Token | Now |
Token ID | 2735 |
Feature activation | +3.43e-01 |
Pos logit contributions | |
ullivan | +1.640 |
enhagen | +1.620 |
asma | +1.591 |
Hera | +1.568 |
eda | +1.561 |
Neg logit contributions | |
MX | -1.657 |
ovie | -1.547 |
oir | -1.486 |
butt | -1.391 |
resp | -1.390 |
Token | your |
Token ID | 534 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
ullivan | +3.708 |
enhagen | +3.676 |
Hera | +3.629 |
asma | +3.612 |
eda | +3.600 |
Neg logit contributions | |
MX | -3.960 |
ovie | -3.691 |
oir | -3.546 |
resp | -3.321 |
butt | -3.282 |
Token | an |
Token ID | 281 |
Feature activation | -4.57e-01 |
Pos logit contributions | |
MX | +1.900 |
ovie | +1.758 |
oir | +1.673 |
resp | +1.523 |
butt | +1.512 |
Neg logit contributions | |
ullivan | -2.720 |
enhagen | -2.706 |
asma | -2.632 |
lication | -2.563 |
eda | -2.550 |
Token | Introduction |
Token ID | 22395 |
Feature activation | -6.73e-02 |
Pos logit contributions | |
MX | +4.283 |
ovie | +4.019 |
oir | +3.925 |
resp | +3.556 |
butt | +3.370 |
Neg logit contributions | |
ullivan | -5.951 |
asma | -5.865 |
enhagen | -5.790 |
lication | -5.571 |
zl | -5.548 |
Token | by |
Token ID | 416 |
Feature activation | -6.24e-01 |
Pos logit contributions | |
MX | +0.745 |
ovie | +0.695 |
oir | +0.663 |
resp | +0.620 |
butt | +0.615 |
Neg logit contributions | |
ullivan | -0.799 |
enhagen | -0.784 |
asma | -0.774 |
Hera | -0.757 |
eda | -0.751 |
Token | Prof |
Token ID | 4415 |
Feature activation | -6.23e-02 |
Pos logit contributions | |
MX | +3.719 |
oir | +3.389 |
ovie | +3.367 |
pa | +2.788 |
resp | +2.663 |
Neg logit contributions | |
enhagen | -10.187 |
ullivan | -10.114 |
asma | -9.707 |
cone | -9.696 |
rocal | -9.637 |
Token | . |
Token ID | 13 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
MX | +0.640 |
ovie | +0.599 |
oir | +0.565 |
resp | +0.526 |
butt | +0.520 |
Neg logit contributions | |
ullivan | -0.785 |
enhagen | -0.774 |
asma | -0.760 |
Hera | -0.748 |
eda | -0.746 |
Token | George |
Token ID | 4502 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
ullivan | +1.048 |
enhagen | +1.028 |
asma | +1.019 |
Hera | +0.999 |
eda | +0.988 |
Neg logit contributions | |
MX | -1.415 |
ovie | -1.330 |
oir | -1.277 |
butt | -1.211 |
resp | -1.199 |
Token | W |
Token ID | 370 |
Feature activation | -3.51e-01 |
Pos logit contributions | |
MX | +7.209 |
ovie | +6.920 |
oir | +6.306 |
¯ | +5.976 |
resp | +5.854 |
Neg logit contributions | |
nown | -22.027 |
ullivan | -20.420 |
enhagen | -20.261 |
cone | -19.896 |
eda | -19.886 |
Token | . |
Token ID | 13 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
MX | +3.158 |
ovie | +2.927 |
oir | +2.858 |
resp | +2.600 |
butt | +2.516 |
Neg logit contributions | |
enhagen | -4.690 |
ullivan | -4.682 |
Hera | -4.615 |
lication | -4.569 |
asma | -4.556 |
Token | Carey |
Token ID | 31612 |
Feature activation | -4.10e-01 |
Pos logit contributions | |
MX | +2.204 |
ovie | +1.995 |
oir | +1.911 |
resp | +1.745 |
butt | +1.711 |
Neg logit contributions | |
ullivan | -3.463 |
enhagen | -3.408 |
lication | -3.375 |
asma | -3.374 |
Hera | -3.317 |
Token | , |
Token ID | 11 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
MX | +3.850 |
ovie | +3.375 |
oir | +3.325 |
resp | +3.114 |
butt | +2.995 |
Neg logit contributions | |
ullivan | -5.491 |
asma | -5.322 |
enhagen | -5.278 |
Hera | -5.256 |
eda | -5.181 |
Token | a |
Token ID | 257 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
MX | +1.781 |
ovie | +1.638 |
oir | +1.589 |
resp | +1.492 |
butt | +1.433 |
Neg logit contributions | |
ullivan | -2.220 |
enhagen | -2.182 |
asma | -2.125 |
Hera | -2.093 |
eda | -2.064 |
Token | break |
Token ID | 2270 |
Feature activation | +3.61e-02 |
Pos logit contributions | |
ullivan | +0.114 |
enhagen | +0.112 |
asma | +0.110 |
Hera | +0.108 |
eda | +0.108 |
Neg logit contributions | |
MX | -0.115 |
ovie | -0.107 |
oir | -0.103 |
resp | -0.096 |
butt | -0.096 |
Token | through |
Token ID | 832 |
Feature activation | -2.22e-02 |
Pos logit contributions | |
ullivan | +0.418 |
enhagen | +0.411 |
asma | +0.405 |
Hera | +0.398 |
eda | +0.397 |
Neg logit contributions | |
MX | -0.408 |
ovie | -0.381 |
oir | -0.364 |
resp | -0.341 |
butt | -0.338 |
Token | the |
Token ID | 262 |
Feature activation | -8.31e-01 |
Pos logit contributions | |
MX | +0.255 |
ovie | +0.238 |
oir | +0.227 |
resp | +0.213 |
butt | +0.212 |
Neg logit contributions | |
ullivan | -0.255 |
enhagen | -0.251 |
asma | -0.247 |
Hera | -0.242 |
eda | -0.241 |
Token | 30 |
Token ID | 1542 |
Feature activation | -1.98e-01 |
Pos logit contributions | |
MX | +8.498 |
ovie | +8.080 |
sburgh | +7.755 |
oir | +7.702 |
butt | +7.150 |
Neg logit contributions | |
ullivan | -9.200 |
enhagen | -8.951 |
rocal | -8.557 |
asma | -8.493 |
lication | -8.412 |
Token | - |
Token ID | 12 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
MX | +2.102 |
ovie | +1.937 |
oir | +1.854 |
resp | +1.742 |
butt | +1.738 |
Neg logit contributions | |
ullivan | -2.424 |
enhagen | -2.392 |
asma | -2.335 |
eda | -2.312 |
Hera | -2.283 |
Token | point |
Token ID | 4122 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
MX | +2.129 |
ovie | +1.967 |
oir | +1.876 |
butt | +1.786 |
resp | +1.777 |
Neg logit contributions | |
ullivan | -2.550 |
enhagen | -2.495 |
asma | -2.455 |
eda | -2.412 |
Hera | -2.409 |
Token | barrier |
Token ID | 13054 |
Feature activation | -5.33e-01 |
Pos logit contributions | |
MX | +11.151 |
sburgh | +10.482 |
oir | +10.453 |
ovie | +9.701 |
waves | +9.399 |
Neg logit contributions | |
ullivan | -15.458 |
enhagen | -15.351 |
rocal | -15.338 |
lication | -14.644 |
nown | -14.357 |
Token | for |
Token ID | 329 |
Feature activation | +2.00e-01 |
Pos logit contributions | |
MX | +4.910 |
ovie | +4.453 |
oir | +4.235 |
sburgh | +3.970 |
butt | +3.969 |
Neg logit contributions | |
ullivan | -7.055 |
enhagen | -6.891 |
asma | -6.676 |
rocal | -6.632 |
lication | -6.555 |
Token | the |
Token ID | 262 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
ullivan | +2.225 |
enhagen | +2.190 |
asma | +2.159 |
Hera | +2.144 |
eda | +2.120 |
Neg logit contributions | |
MX | -2.349 |
ovie | -2.179 |
oir | -2.106 |
resp | -1.976 |
butt | -1.951 |
Token | third |
Token ID | 2368 |
Feature activation | +4.71e-01 |
Pos logit contributions | |
MX | +0.240 |
ovie | +0.226 |
oir | +0.216 |
resp | +0.204 |
butt | +0.204 |
Neg logit contributions | |
ullivan | -0.195 |
enhagen | -0.192 |
asma | -0.188 |
Hera | -0.184 |
eda | -0.184 |
Token | successive |
Token ID | 25175 |
Feature activation | +3.06e-02 |
Pos logit contributions | |
ullivan | +4.949 |
Hera | +4.935 |
enhagen | +4.875 |
asma | +4.833 |
eda | +4.718 |
Neg logit contributions | |
MX | -5.416 |
ovie | -5.190 |
oir | -4.868 |
resp | -4.630 |
butt | -4.495 |
Token | 's |
Token ID | 338 |
Feature activation | +2.99e-02 |
Pos logit contributions | |
ullivan | +0.231 |
enhagen | +0.227 |
asma | +0.224 |
Hera | +0.219 |
eda | +0.219 |
Neg logit contributions | |
MX | -0.211 |
ovie | -0.196 |
oir | -0.186 |
resp | -0.175 |
butt | -0.174 |
Token | headquarters |
Token ID | 10043 |
Feature activation | -8.29e-02 |
Pos logit contributions | |
ullivan | +0.385 |
enhagen | +0.379 |
asma | +0.374 |
Hera | +0.368 |
eda | +0.367 |
Neg logit contributions | |
MX | -0.302 |
ovie | -0.279 |
oir | -0.264 |
resp | -0.246 |
butt | -0.245 |
Token | in |
Token ID | 287 |
Feature activation | -2.15e-01 |
Pos logit contributions | |
MX | +0.890 |
ovie | +0.831 |
oir | +0.789 |
resp | +0.736 |
butt | +0.734 |
Neg logit contributions | |
ullivan | -1.010 |
enhagen | -0.994 |
asma | -0.977 |
eda | -0.958 |
Hera | -0.955 |
Token | Hawth |
Token ID | 41457 |
Feature activation | -6.53e-02 |
Pos logit contributions | |
MX | +2.687 |
ovie | +2.562 |
oir | +2.438 |
butt | +2.321 |
resp | +2.309 |
Neg logit contributions | |
ullivan | -2.222 |
enhagen | -2.169 |
asma | -2.132 |
eda | -2.056 |
lication | -2.037 |
Token | orne |
Token ID | 8553 |
Feature activation | -4.14e-01 |
Pos logit contributions | |
MX | +0.829 |
ovie | +0.783 |
oir | +0.752 |
resp | +0.709 |
butt | +0.706 |
Neg logit contributions | |
ullivan | -0.669 |
enhagen | -0.653 |
asma | -0.639 |
Hera | -0.628 |
eda | -0.623 |
Token | , |
Token ID | 11 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
MX | +3.927 |
ovie | +3.576 |
oir | +3.351 |
butt | +3.144 |
resp | +3.140 |
Neg logit contributions | |
ullivan | -5.545 |
enhagen | -5.337 |
asma | -5.322 |
eda | -5.158 |
Hera | -5.155 |
Token | California |
Token ID | 3442 |
Feature activation | -4.54e-01 |
Pos logit contributions | |
MX | +9.064 |
ovie | +7.540 |
butt | +6.909 |
oir | +6.536 |
Tex | +6.468 |
Neg logit contributions | |
ullivan | -19.706 |
enhagen | -18.437 |
asma | -18.256 |
eda | -17.403 |
zl | -17.320 |
Token | , |
Token ID | 11 |
Feature activation | -8.14e-02 |
Pos logit contributions | |
MX | +4.362 |
ovie | +4.049 |
oir | +3.823 |
resp | +3.480 |
butt | +3.463 |
Neg logit contributions | |
ullivan | -5.888 |
enhagen | -5.703 |
asma | -5.659 |
eda | -5.616 |
Hera | -5.602 |
Token | to |
Token ID | 284 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
MX | +0.894 |
ovie | +0.833 |
oir | +0.791 |
resp | +0.742 |
butt | +0.738 |
Neg logit contributions | |
ullivan | -0.974 |
enhagen | -0.956 |
asma | -0.943 |
eda | -0.924 |
Hera | -0.921 |
Token | perform |
Token ID | 1620 |
Feature activation | -7.02e-03 |
Pos logit contributions | |
MX | +0.176 |
ovie | +0.165 |
oir | +0.157 |
resp | +0.147 |
butt | +0.147 |
Neg logit contributions | |
ullivan | -0.183 |
enhagen | -0.181 |
asma | -0.178 |
Hera | -0.174 |
eda | -0.174 |
Token | a |
Token ID | 257 |
Feature activation | +4.80e-02 |
Pos logit contributions | |
MX | +0.077 |
ovie | +0.072 |
oir | +0.068 |
resp | +0.064 |
butt | +0.063 |
Neg logit contributions | |
ullivan | -0.084 |
enhagen | -0.083 |
asma | -0.082 |
Hera | -0.080 |
eda | -0.080 |
Token | vot |
Token ID | 1993 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
MX | +1.698 |
ovie | +1.581 |
oir | +1.519 |
resp | +1.413 |
butt | +1.394 |
Neg logit contributions | |
ullivan | -1.793 |
enhagen | -1.780 |
asma | -1.741 |
Hera | -1.698 |
eda | -1.696 |
Token | re |
Token ID | 260 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
MX | +1.009 |
ovie | +0.929 |
oir | +0.889 |
resp | +0.817 |
butt | +0.805 |
Neg logit contributions | |
ullivan | -1.401 |
enhagen | -1.379 |
asma | -1.357 |
Hera | -1.336 |
eda | -1.329 |
Token | p |
Token ID | 279 |
Feature activation | +3.04e-01 |
Pos logit contributions | |
MX | +2.343 |
ovie | +2.180 |
oir | +2.099 |
resp | +1.965 |
butt | +1.950 |
Neg logit contributions | |
ullivan | -2.442 |
enhagen | -2.422 |
asma | -2.358 |
eda | -2.303 |
lication | -2.278 |
Token | ère |
Token ID | 35979 |
Feature activation | -7.86e-02 |
Pos logit contributions | |
ullivan | +3.244 |
enhagen | +3.226 |
asma | +3.180 |
eda | +3.144 |
lication | +3.114 |
Neg logit contributions | |
MX | -3.618 |
ovie | -3.364 |
oir | -3.155 |
butt | -3.061 |
sburgh | -3.033 |
Token | , |
Token ID | 11 |
Feature activation | -3.72e-01 |
Pos logit contributions | |
MX | +0.882 |
ovie | +0.823 |
oir | +0.788 |
resp | +0.737 |
butt | +0.731 |
Neg logit contributions | |
ullivan | -0.923 |
enhagen | -0.909 |
asma | -0.893 |
Hera | -0.872 |
eda | -0.872 |
Token | v |
Token ID | 410 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
MX | +4.202 |
ovie | +3.890 |
oir | +3.767 |
resp | +3.514 |
butt | +3.423 |
Neg logit contributions | |
ullivan | -4.266 |
enhagen | -4.248 |
asma | -4.137 |
eda | -4.002 |
Hera | -3.943 |
Token | ous |
Token ID | 516 |
Feature activation | -2.25e-01 |
Pos logit contributions | |
oir | +13.675 |
MX | +13.040 |
ovie | +12.295 |
resp | +11.524 |
ie | +11.268 |
Neg logit contributions | |
ullivan | -13.425 |
Hera | -13.341 |
enhagen | -13.299 |
�� | -13.002 |
asma | -12.109 |
Token | , |
Token ID | 11 |
Feature activation | -7.00e-03 |
Pos logit contributions | |
MX | +2.506 |
ovie | +2.330 |
oir | +2.270 |
resp | +2.096 |
butt | +2.076 |
Neg logit contributions | |
ullivan | -2.620 |
enhagen | -2.593 |
asma | -2.541 |
eda | -2.467 |
Hera | -2.456 |
Token | le |
Token ID | 443 |
Feature activation | +5.89e-02 |
Pos logit contributions | |
MX | +0.080 |
ovie | +0.074 |
oir | +0.071 |
resp | +0.066 |
butt | +0.066 |
Neg logit contributions | |
ullivan | -0.081 |
enhagen | -0.080 |
asma | -0.078 |
Hera | -0.077 |
eda | -0.077 |
Token | S |
Token ID | 311 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
ullivan | +0.691 |
enhagen | +0.678 |
asma | +0.671 |
Hera | +0.661 |
eda | +0.658 |
Neg logit contributions | |
MX | -0.657 |
ovie | -0.614 |
oir | -0.582 |
resp | -0.546 |
butt | -0.545 |
Token | é |
Token ID | 2634 |
Feature activation | -5.39e-01 |
Pos logit contributions | |
ullivan | +2.562 |
enhagen | +2.520 |
asma | +2.501 |
eda | +2.475 |
lication | +2.407 |
Neg logit contributions | |
MX | -2.456 |
ovie | -2.291 |
oir | -2.158 |
butt | -2.085 |
sburgh | -2.046 |
Token | J |
Token ID | 449 |
Feature activation | -7.94e-01 |
Pos logit contributions | |
MX | +6.148 |
ovie | +5.454 |
oir | +5.320 |
resp | +4.983 |
butt | +4.802 |
Neg logit contributions | |
enhagen | -6.309 |
ullivan | -6.300 |
asma | -6.091 |
eda | -5.809 |
rocal | -5.757 |
Token | ' |
Token ID | 6 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
MX | +7.861 |
ovie | +7.123 |
oir | +7.038 |
resp | +6.322 |
\' | +6.105 |
Neg logit contributions | |
ullivan | -9.629 |
enhagen | -9.514 |
Hera | -9.425 |
asma | -9.002 |
lication | -8.937 |
Token | esp |
Token ID | 9774 |
Feature activation | -2.45e-01 |
Pos logit contributions | |
MX | +1.994 |
ovie | +1.886 |
oir | +1.822 |
resp | +1.727 |
butt | +1.704 |
Neg logit contributions | |
ullivan | -1.420 |
enhagen | -1.404 |
asma | -1.372 |
Hera | -1.361 |
lication | -1.323 |
Token | ère |
Token ID | 35979 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
MX | +2.179 |
ovie | +2.082 |
oir | +2.000 |
resp | +1.814 |
butt | +1.751 |
Neg logit contributions | |
ullivan | -3.362 |
enhagen | -3.336 |
Hera | -3.294 |
asma | -3.266 |
eda | -3.174 |
Token | que |
Token ID | 8358 |
Feature activation | -3.81e-01 |
Pos logit contributions | |
MX | +1.550 |
ovie | +1.446 |
oir | +1.396 |
resp | +1.301 |
butt | +1.289 |
Neg logit contributions | |
ullivan | -1.563 |
enhagen | -1.543 |
asma | -1.513 |
eda | -1.471 |
Hera | -1.469 |
Token | v |
Token ID | 410 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
MX | +4.206 |
ovie | +3.918 |
oir | +3.808 |
resp | +3.524 |
butt | +3.454 |
Neg logit contributions | |
ullivan | -4.447 |
enhagen | -4.411 |
asma | -4.282 |
eda | -4.130 |
lication | -4.076 |
Token | ous |
Token ID | 516 |
Feature activation | -2.44e-01 |
Pos logit contributions | |
oir | +12.220 |
MX | +11.502 |
ovie | +10.748 |
resp | +10.097 |
ie | +9.951 |
Neg logit contributions | |
ullivan | -14.983 |
Hera | -14.904 |
enhagen | -14.861 |
�� | -14.366 |
asma | -13.658 |
Token | comp |
Token ID | 552 |
Feature activation | +2.23e-01 |
Pos logit contributions | |
MX | +2.721 |
ovie | +2.528 |
oir | +2.458 |
resp | +2.270 |
butt | +2.246 |
Neg logit contributions | |
ullivan | -2.852 |
enhagen | -2.833 |
asma | -2.771 |
eda | -2.684 |
Hera | -2.670 |
Token | rend |
Token ID | 10920 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
ullivan | +2.584 |
enhagen | +2.543 |
eda | +2.512 |
asma | +2.501 |
lication | +2.463 |
Neg logit contributions | |
MX | -2.520 |
ovie | -2.298 |
oir | -2.169 |
butt | -2.080 |
resp | -2.049 |
Token | rez |
Token ID | 21107 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
MX | +2.688 |
ovie | +2.510 |
oir | +2.440 |
resp | +2.245 |
butt | +2.164 |
Neg logit contributions | |
ullivan | -3.185 |
enhagen | -3.132 |
asma | -3.072 |
Hera | -3.012 |
eda | -2.985 |
Token | que |
Token ID | 8358 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
MX | +3.417 |
ovie | +3.178 |
oir | +3.089 |
resp | +2.857 |
butt | +2.793 |
Neg logit contributions | |
ullivan | -3.692 |
enhagen | -3.642 |
asma | -3.553 |
eda | -3.436 |
Hera | -3.433 |
Token | the |
Token ID | 262 |
Feature activation | +6.26e-01 |
Pos logit contributions | |
ullivan | +1.038 |
enhagen | +1.024 |
asma | +1.006 |
Hera | +0.990 |
eda | +0.987 |
Neg logit contributions | |
MX | -0.997 |
ovie | -0.937 |
oir | -0.889 |
resp | -0.832 |
butt | -0.831 |
Token | most |
Token ID | 749 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
ullivan | +5.065 |
asma | +5.057 |
Hera | +5.004 |
enhagen | +4.967 |
eda | +4.956 |
Neg logit contributions | |
MX | -8.525 |
ovie | -8.068 |
oir | -7.648 |
butt | -7.465 |
sburgh | -7.410 |
Token | , |
Token ID | 11 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
ullivan | +1.862 |
enhagen | +1.842 |
asma | +1.799 |
Hera | +1.768 |
eda | +1.767 |
Neg logit contributions | |
MX | -1.829 |
ovie | -1.715 |
oir | -1.626 |
resp | -1.531 |
butt | -1.518 |
Token | took |
Token ID | 1718 |
Feature activation | -5.49e-01 |
Pos logit contributions | |
MX | +1.181 |
ovie | +1.100 |
oir | +1.048 |
resp | +0.988 |
butt | +0.982 |
Neg logit contributions | |
ullivan | -1.242 |
enhagen | -1.219 |
asma | -1.197 |
Hera | -1.172 |
eda | -1.170 |
Token | a |
Token ID | 257 |
Feature activation | -7.36e-01 |
Pos logit contributions | |
MX | +5.682 |
ovie | +5.051 |
oir | +4.815 |
butt | +4.648 |
resp | +4.621 |
Neg logit contributions | |
enhagen | -6.624 |
ullivan | -6.531 |
asma | -6.384 |
lication | -6.282 |
eda | -6.080 |
Token | good |
Token ID | 922 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
MX | +7.652 |
ovie | +6.664 |
oir | +6.515 |
resp | +6.226 |
butt | +6.040 |
Neg logit contributions | |
enhagen | -8.719 |
ullivan | -8.456 |
lication | -8.090 |
asma | -8.072 |
eda | -7.864 |
Token | - |
Token ID | 12 |
Feature activation | -6.10e-01 |
Pos logit contributions | |
MX | +12.232 |
ovie | +11.158 |
oir | +11.038 |
ie | +10.270 |
ray | +10.222 |
Neg logit contributions | |
enhagen | -14.608 |
ullivan | -13.846 |
asma | -13.568 |
lication | -13.532 |
eda | -13.282 |
Token | guy |
Token ID | 22932 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
MX | +5.479 |
ovie | +5.160 |
butt | +4.821 |
oir | +4.819 |
resp | +4.605 |
Neg logit contributions | |
enhagen | -7.929 |
ullivan | -7.923 |
asma | -7.754 |
Hera | -7.641 |
lication | -7.494 |
Token | - |
Token ID | 12 |
Feature activation | -2.55e-02 |
Pos logit contributions | |
MX | +3.585 |
ovie | +3.323 |
oir | +3.181 |
butt | +2.996 |
resp | +2.996 |
Neg logit contributions | |
ullivan | -3.503 |
enhagen | -3.501 |
asma | -3.381 |
eda | -3.301 |
lication | -3.292 |
Token | vers |
Token ID | 690 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
MX | +0.282 |
ovie | +0.263 |
oir | +0.250 |
resp | +0.235 |
butt | +0.234 |
Neg logit contributions | |
ullivan | -0.304 |
enhagen | -0.299 |
asma | -0.294 |
Hera | -0.289 |
eda | -0.288 |
Token | us |
Token ID | 385 |
Feature activation | -5.98e-02 |
Pos logit contributions | |
ullivan | +3.979 |
asma | +3.852 |
enhagen | +3.844 |
eda | +3.788 |
Hera | +3.704 |
Neg logit contributions | |
MX | -3.415 |
ovie | -3.145 |
oir | -2.943 |
butt | -2.804 |
resp | -2.725 |
Token | - |
Token ID | 12 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
MX | +1.572 |
ovie | +1.464 |
oir | +1.411 |
resp | +1.310 |
butt | +1.298 |
Neg logit contributions | |
ullivan | -1.790 |
enhagen | -1.766 |
asma | -1.735 |
eda | -1.701 |
Hera | -1.700 |
Token | than |
Token ID | 14813 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
ullivan | +1.735 |
enhagen | +1.690 |
asma | +1.682 |
eda | +1.640 |
Hera | +1.623 |
Neg logit contributions | |
MX | -2.614 |
ovie | -2.478 |
oir | -2.363 |
sburgh | -2.229 |
butt | -2.223 |
Token | - |
Token ID | 12 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
ullivan | +2.478 |
enhagen | +2.394 |
asma | +2.374 |
Hera | +2.332 |
eda | +2.321 |
Neg logit contributions | |
MX | -2.488 |
ovie | -2.337 |
oir | -2.194 |
resp | -2.071 |
butt | -2.063 |
Token | opt |
Token ID | 8738 |
Feature activation | -1.34e-02 |
Pos logit contributions | |
ullivan | +1.335 |
enhagen | +1.304 |
asma | +1.289 |
eda | +1.259 |
Hera | +1.251 |
Neg logit contributions | |
MX | -1.725 |
ovie | -1.634 |
oir | -1.552 |
butt | -1.460 |
resp | -1.460 |
Token | imal |
Token ID | 4402 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
MX | +0.168 |
ovie | +0.158 |
oir | +0.152 |
resp | +0.143 |
butt | +0.143 |
Neg logit contributions | |
ullivan | -0.139 |
enhagen | -0.137 |
asma | -0.134 |
Hera | -0.132 |
eda | -0.131 |
Token | v |
Token ID | 410 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
MX | +1.777 |
ovie | +1.653 |
oir | +1.579 |
resp | +1.471 |
butt | +1.451 |
Neg logit contributions | |
ullivan | -2.133 |
enhagen | -2.109 |
asma | -2.059 |
eda | -2.023 |
lication | -2.011 |
Token | int |
Token ID | 600 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
MX | +9.658 |
oir | +9.293 |
ovie | +8.867 |
resp | +8.298 |
inas | +8.256 |
Neg logit contributions | |
Hera | -17.188 |
ullivan | -17.026 |
�� | -16.588 |
asma | -16.314 |
rocal | -15.901 |
Token | ages |
Token ID | 1095 |
Feature activation | -4.34e-02 |
Pos logit contributions | |
MX | +4.030 |
ovie | +3.796 |
oir | +3.725 |
resp | +3.512 |
butt | +3.470 |
Neg logit contributions | |
ullivan | -2.752 |
enhagen | -2.622 |
asma | -2.617 |
Hera | -2.590 |
eda | -2.500 |
Token | . |
Token ID | 13 |
Feature activation | +2.76e-01 |
Pos logit contributions | |
MX | +0.487 |
ovie | +0.454 |
oir | +0.433 |
resp | +0.406 |
butt | +0.404 |
Neg logit contributions | |
ullivan | -0.510 |
enhagen | -0.501 |
asma | -0.494 |
Hera | -0.483 |
eda | -0.483 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e-01 |
Pos logit contributions | |
ullivan | +3.146 |
enhagen | +3.070 |
asma | +3.026 |
Hera | +3.005 |
eda | +2.964 |
Neg logit contributions | |
MX | -3.104 |
ovie | -2.870 |
oir | -2.746 |
resp | -2.615 |
butt | -2.587 |
Token |
|
Token ID | 198 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
MX | +1.532 |
ovie | +1.404 |
oir | +1.341 |
resp | +1.255 |
butt | +1.255 |
Neg logit contributions | |
enhagen | -1.872 |
ullivan | -1.867 |
asma | -1.803 |
Hera | -1.761 |
eda | -1.756 |
Token | his |
Token ID | 465 |
Feature activation | -6.72e-01 |
Pos logit contributions | |
MX | +1.962 |
ovie | +1.830 |
oir | +1.751 |
resp | +1.641 |
butt | +1.621 |
Neg logit contributions | |
ullivan | -2.255 |
enhagen | -2.222 |
asma | -2.193 |
eda | -2.125 |
Hera | -2.116 |
Token | new |
Token ID | 649 |
Feature activation | -6.46e-01 |
Pos logit contributions | |
MX | +7.328 |
ovie | +6.766 |
oir | +6.574 |
resp | +6.336 |
butt | +6.186 |
Neg logit contributions | |
enhagen | -7.203 |
ullivan | -7.176 |
asma | -6.922 |
lication | -6.708 |
eda | -6.696 |
Token | brother |
Token ID | 3956 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
MX | +6.904 |
ovie | +6.441 |
oir | +6.267 |
resp | +6.021 |
butt | +5.817 |
Neg logit contributions | |
ullivan | -7.129 |
enhagen | -7.052 |
asma | -6.902 |
Hera | -6.663 |
lication | -6.615 |
Token | - |
Token ID | 12 |
Feature activation | -5.21e-01 |
Pos logit contributions | |
ullivan | +1.939 |
enhagen | +1.904 |
asma | +1.881 |
Hera | +1.868 |
eda | +1.855 |
Neg logit contributions | |
MX | -1.810 |
ovie | -1.681 |
oir | -1.596 |
resp | -1.488 |
butt | -1.484 |
Token | in |
Token ID | 259 |
Feature activation | -5.54e-01 |
Pos logit contributions | |
MX | +3.509 |
ovie | +3.084 |
oir | +2.959 |
resp | +2.725 |
butt | +2.716 |
Neg logit contributions | |
ullivan | -8.127 |
enhagen | -8.088 |
asma | -7.962 |
Hera | -7.821 |
lication | -7.711 |
Token | - |
Token ID | 12 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
MX | +4.743 |
ovie | +4.384 |
oir | +4.224 |
resp | +3.974 |
butt | +3.918 |
Neg logit contributions | |
enhagen | -7.540 |
ullivan | -7.419 |
asma | -7.190 |
Hera | -6.996 |
lication | -6.994 |
Token | law |
Token ID | 6270 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
MX | +11.431 |
butt | +10.763 |
oir | +10.504 |
pa | +10.316 |
ovie | +10.311 |
Neg logit contributions | |
ullivan | -15.360 |
enhagen | -14.987 |
�� | -14.857 |
asma | -14.316 |
Hera | -14.157 |
Token | , |
Token ID | 11 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
MX | +2.034 |
ovie | +1.901 |
oir | +1.810 |
resp | +1.694 |
butt | +1.684 |
Neg logit contributions | |
ullivan | -2.389 |
enhagen | -2.357 |
asma | -2.309 |
eda | -2.250 |
Hera | -2.246 |
Token | E |
Token ID | 412 |
Feature activation | +8.35e-02 |
Pos logit contributions | |
MX | +0.154 |
ovie | +0.143 |
oir | +0.136 |
resp | +0.128 |
butt | +0.127 |
Neg logit contributions | |
ullivan | -0.171 |
enhagen | -0.168 |
asma | -0.165 |
Hera | -0.162 |
eda | -0.162 |
Token | ad |
Token ID | 324 |
Feature activation | +7.66e-02 |
Pos logit contributions | |
ullivan | +0.995 |
enhagen | +0.979 |
asma | +0.970 |
eda | +0.953 |
Hera | +0.939 |
Neg logit contributions | |
MX | -0.921 |
ovie | -0.852 |
oir | -0.805 |
resp | -0.755 |
butt | -0.752 |
Token | gar |
Token ID | 4563 |
Feature activation | -2.28e-01 |
Pos logit contributions | |
ullivan | +1.052 |
enhagen | +1.032 |
asma | +1.024 |
eda | +1.007 |
Hera | +1.002 |
Neg logit contributions | |
MX | -0.710 |
ovie | -0.648 |
oir | -0.608 |
resp | -0.559 |
butt | -0.556 |
Token | , |
Token ID | 11 |
Feature activation | -9.19e-02 |
Pos logit contributions | |
MX | +3.809 |
ovie | +3.661 |
oir | +3.348 |
butt | +3.122 |
sburgh | +3.079 |
Neg logit contributions | |
ullivan | -4.929 |
enhagen | -4.825 |
asma | -4.780 |
lication | -4.676 |
Hera | -4.674 |
Token | and |
Token ID | 290 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
MX | +0.985 |
ovie | +0.921 |
oir | +0.870 |
butt | +0.813 |
resp | +0.811 |
Neg logit contributions | |
ullivan | -1.119 |
enhagen | -1.101 |
asma | -1.087 |
eda | -1.064 |
Hera | -1.060 |
Token | I |
Token ID | 314 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
MX | +1.103 |
ovie | +1.035 |
oir | +0.977 |
butt | +0.914 |
resp | +0.908 |
Neg logit contributions | |
ullivan | -1.249 |
enhagen | -1.226 |
asma | -1.211 |
eda | -1.182 |
Hera | -1.179 |
Token | think |
Token ID | 892 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
MX | +3.258 |
ovie | +3.112 |
oir | +2.915 |
sburgh | +2.724 |
butt | +2.720 |
Neg logit contributions | |
ullivan | -4.214 |
enhagen | -4.097 |
asma | -4.054 |
Hera | -3.906 |
lication | -3.901 |
Token | he |
Token ID | 339 |
Feature activation | -7.76e-01 |
Pos logit contributions | |
MX | +1.270 |
ovie | +1.189 |
oir | +1.123 |
butt | +1.053 |
resp | +1.044 |
Neg logit contributions | |
ullivan | -1.452 |
enhagen | -1.429 |
asma | -1.407 |
eda | -1.376 |
Hera | -1.372 |
Token | 's |
Token ID | 338 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
MX | +5.939 |
ovie | +5.855 |
oir | +5.620 |
sburgh | +5.225 |
\' | +5.147 |
Neg logit contributions | |
ullivan | -10.875 |
enhagen | -9.987 |
asma | -9.985 |
rocal | -9.879 |
lication | -9.812 |
Token | going |
Token ID | 1016 |
Feature activation | -7.02e-01 |
Pos logit contributions | |
MX | +9.212 |
ovie | +8.652 |
oir | +7.992 |
butt | +7.527 |
pa | +7.144 |
Neg logit contributions | |
ullivan | -17.218 |
rocal | -16.126 |
enhagen | -16.125 |
�� | -16.063 |
asma | -16.054 |
Token | to |
Token ID | 284 |
Feature activation | -4.76e-01 |
Pos logit contributions | |
MX | +5.889 |
ovie | +5.504 |
oir | +5.257 |
butt | +4.998 |
sburgh | +4.790 |
Neg logit contributions | |
ullivan | -9.342 |
enhagen | -9.191 |
lication | -8.876 |
asma | -8.866 |
eda | -8.833 |
Token | have |
Token ID | 423 |
Feature activation | -5.27e-01 |
Pos logit contributions | |
MX | +4.827 |
ovie | +4.573 |
oir | +4.468 |
sburgh | +4.139 |
butt | +4.134 |
Neg logit contributions | |
ullivan | -5.805 |
enhagen | -5.694 |
asma | -5.561 |
lication | -5.493 |
eda | -5.423 |
Token | a |
Token ID | 257 |
Feature activation | -4.67e-02 |
Pos logit contributions | |
MX | +4.866 |
ovie | +4.452 |
oir | +4.315 |
butt | +3.969 |
sburgh | +3.922 |
Neg logit contributions | |
ullivan | -6.841 |
enhagen | -6.651 |
eda | -6.436 |
asma | -6.434 |
lication | -6.388 |
Token | big |
Token ID | 1263 |
Feature activation | -5.16e-01 |
Pos logit contributions | |
MX | +0.539 |
ovie | +0.504 |
oir | +0.482 |
resp | +0.452 |
butt | +0.451 |
Neg logit contributions | |
ullivan | -0.532 |
enhagen | -0.524 |
asma | -0.513 |
eda | -0.503 |
Hera | -0.503 |
Token | fractured |
Token ID | 34051 |
Feature activation | -2.05e-01 |
Pos logit contributions | |
MX | +0.387 |
ovie | +0.362 |
oir | +0.346 |
resp | +0.325 |
butt | +0.324 |
Neg logit contributions | |
ullivan | -0.377 |
enhagen | -0.372 |
asma | -0.364 |
eda | -0.357 |
Hera | -0.357 |
Token | collar |
Token ID | 19908 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
MX | +2.308 |
ovie | +2.143 |
oir | +2.060 |
butt | +1.950 |
resp | +1.920 |
Neg logit contributions | |
ullivan | -2.393 |
enhagen | -2.364 |
asma | -2.278 |
eda | -2.236 |
lication | -2.225 |
Token | bone |
Token ID | 9970 |
Feature activation | +1.57e-01 |
Pos logit contributions | |
ullivan | +1.576 |
asma | +1.550 |
enhagen | +1.546 |
eda | +1.502 |
Hera | +1.495 |
Neg logit contributions | |
MX | -3.130 |
ovie | -2.990 |
oir | -2.855 |
sburgh | -2.741 |
resp | -2.727 |
Token | in |
Token ID | 287 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
ullivan | +1.732 |
enhagen | +1.711 |
asma | +1.706 |
Hera | +1.682 |
eda | +1.665 |
Neg logit contributions | |
MX | -1.817 |
ovie | -1.709 |
oir | -1.631 |
resp | -1.532 |
sburgh | -1.513 |
Token | Foot |
Token ID | 7870 |
Feature activation | +2.59e-01 |
Pos logit contributions | |
ullivan | +3.352 |
Hera | +3.287 |
asma | +3.267 |
enhagen | +3.256 |
eda | +3.204 |
Neg logit contributions | |
MX | -3.667 |
ovie | -3.378 |
oir | -3.299 |
resp | -3.078 |
butt | -3.014 |
Token | sc |
Token ID | 1416 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
enhagen | +2.851 |
ullivan | +2.850 |
asma | +2.813 |
Hera | +2.813 |
eda | +2.768 |
Neg logit contributions | |
MX | -2.999 |
ovie | -2.751 |
oir | -2.629 |
resp | -2.479 |
sburgh | -2.437 |
Token | ray |
Token ID | 2433 |
Feature activation | -6.62e-02 |
Pos logit contributions | |
ray | +6.886 |
ovie | +6.347 |
oir | +5.625 |
MX | +5.208 |
butt | +4.504 |
Neg logit contributions | |
enhagen | -20.737 |
ullivan | -20.208 |
Hera | -19.986 |
�� | -19.769 |
lication | -19.373 |
Token | � |
Token ID | 447 |
Feature activation | -3.67e-02 |
Pos logit contributions | |
MX | +0.695 |
ovie | +0.647 |
oir | +0.614 |
butt | +0.573 |
resp | +0.572 |
Neg logit contributions | |
ullivan | -0.824 |
enhagen | -0.811 |
asma | -0.797 |
Hera | -0.783 |
eda | -0.780 |
Token | � |
Token ID | 247 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
MX | +0.464 |
ovie | +0.436 |
oir | +0.418 |
resp | +0.396 |
butt | +0.394 |
Neg logit contributions | |
ullivan | -0.378 |
enhagen | -0.372 |
asma | -0.364 |
Hera | -0.357 |
eda | -0.356 |
Token | s |
Token ID | 82 |
Feature activation | +3.14e-01 |
Pos logit contributions | |
ullivan | +2.810 |
asma | +2.766 |
enhagen | +2.762 |
eda | +2.705 |
Hera | +2.693 |
Neg logit contributions | |
MX | -2.736 |
ovie | -2.535 |
oir | -2.431 |
resp | -2.271 |
butt | -2.215 |
Token | win |
Token ID | 1592 |
Feature activation | +5.50e-03 |
Pos logit contributions | |
ullivan | +3.468 |
asma | +3.353 |
Hera | +3.345 |
enhagen | +3.322 |
eda | +3.272 |
Neg logit contributions | |
MX | -3.658 |
ovie | -3.374 |
oir | -3.234 |
resp | -3.029 |
sburgh | -3.003 |
Token | , |
Token ID | 11 |
Feature activation | +8.54e-02 |
Pos logit contributions | |
ullivan | +2.491 |
enhagen | +2.479 |
asma | +2.428 |
Hera | +2.409 |
eda | +2.381 |
Neg logit contributions | |
MX | -2.693 |
ovie | -2.483 |
oir | -2.401 |
resp | -2.260 |
butt | -2.225 |
Token | The |
Token ID | 383 |
Feature activation | +3.09e-01 |
Pos logit contributions | |
ullivan | +1.009 |
enhagen | +0.991 |
asma | +0.975 |
Hera | +0.962 |
eda | +0.956 |
Neg logit contributions | |
MX | -0.949 |
ovie | -0.883 |
oir | -0.845 |
resp | -0.789 |
butt | -0.785 |
Token | Daily |
Token ID | 6714 |
Feature activation | +8.20e-02 |
Pos logit contributions | |
ullivan | +3.320 |
enhagen | +3.258 |
asma | +3.194 |
eda | +3.178 |
Hera | +3.161 |
Neg logit contributions | |
MX | -3.708 |
ovie | -3.462 |
oir | -3.325 |
butt | -3.122 |
resp | -3.114 |
Token | Caller |
Token ID | 10244 |
Feature activation | -2.48e-01 |
Pos logit contributions | |
ullivan | +0.701 |
enhagen | +0.687 |
asma | +0.677 |
Hera | +0.660 |
eda | +0.658 |
Neg logit contributions | |
MX | -1.172 |
ovie | -1.112 |
oir | -1.074 |
resp | -1.022 |
butt | -1.013 |
Token | co |
Token ID | 763 |
Feature activation | -3.61e-01 |
Pos logit contributions | |
MX | +2.506 |
ovie | +2.312 |
oir | +2.183 |
butt | +2.036 |
resp | +2.029 |
Neg logit contributions | |
ullivan | -3.183 |
enhagen | -3.094 |
asma | -3.057 |
Hera | -3.015 |
lication | -3.001 |
Token | - |
Token ID | 12 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
MX | +3.501 |
ovie | +3.288 |
oir | +3.102 |
butt | +2.908 |
resp | +2.874 |
Neg logit contributions | |
ullivan | -4.613 |
enhagen | -4.542 |
asma | -4.492 |
Hera | -4.458 |
eda | -4.438 |
Token | founder |
Token ID | 15454 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
MX | +8.313 |
ovie | +7.182 |
pa | +7.015 |
butt | +6.994 |
resp | +6.948 |
Neg logit contributions | |
ullivan | -17.380 |
�� | -16.976 |
rocal | -16.726 |
Hera | -16.584 |
enhagen | -16.519 |
Token | said |
Token ID | 531 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
MX | +1.790 |
ovie | +1.672 |
oir | +1.586 |
resp | +1.474 |
butt | +1.474 |
Neg logit contributions | |
ullivan | -2.068 |
enhagen | -2.046 |
asma | -2.007 |
eda | -1.965 |
lication | -1.957 |
Token | , |
Token ID | 11 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
ullivan | +1.707 |
enhagen | +1.676 |
asma | +1.649 |
Hera | +1.628 |
eda | +1.621 |
Neg logit contributions | |
MX | -1.713 |
ovie | -1.591 |
oir | -1.526 |
resp | -1.430 |
butt | -1.416 |
Token | � |
Token ID | 564 |
Feature activation | +8.85e-02 |
Pos logit contributions | |
ullivan | +2.704 |
enhagen | +2.635 |
asma | +2.574 |
Hera | +2.559 |
eda | +2.531 |
Neg logit contributions | |
MX | -2.928 |
ovie | -2.733 |
oir | -2.625 |
resp | -2.449 |
butt | -2.435 |
Token | � |
Token ID | 250 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
ullivan | +1.216 |
enhagen | +1.190 |
asma | +1.180 |
eda | +1.163 |
Hera | +1.161 |
Neg logit contributions | |
MX | -0.813 |
ovie | -0.750 |
oir | -0.703 |
resp | -0.644 |
butt | -0.643 |
Token | dev |
Token ID | 1614 |
Feature activation | -9.24e-01 |
Pos logit contributions | |
MX | +1.282 |
ovie | +1.197 |
oir | +1.150 |
resp | +1.075 |
butt | +1.066 |
Neg logit contributions | |
ullivan | -1.279 |
enhagen | -1.267 |
asma | -1.241 |
eda | -1.212 |
Hera | -1.209 |
Token | oir |
Token ID | 10840 |
Feature activation | -5.91e-01 |
Pos logit contributions | |
oir | +9.296 |
MX | +8.898 |
ovie | +8.118 |
resp | +7.678 |
pa | +7.400 |
Neg logit contributions | |
Hera | -10.454 |
ullivan | -10.316 |
enhagen | -10.250 |
asma | -10.101 |
�� | -9.829 |
Token | s |
Token ID | 82 |
Feature activation | -3.66e-01 |
Pos logit contributions | |
MX | +5.783 |
ovie | +5.326 |
oir | +5.325 |
resp | +4.784 |
butt | +4.587 |
Neg logit contributions | |
ullivan | -7.328 |
enhagen | -7.275 |
asma | -7.099 |
Hera | -6.895 |
eda | -6.886 |
Token | en |
Token ID | 551 |
Feature activation | -2.99e-02 |
Pos logit contributions | |
MX | +3.961 |
ovie | +3.664 |
oir | +3.577 |
resp | +3.290 |
butt | +3.208 |
Neg logit contributions | |
enhagen | -4.348 |
ullivan | -4.345 |
asma | -4.236 |
eda | -4.109 |
Hera | -4.097 |
Token | vers |
Token ID | 690 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
MX | +0.338 |
ovie | +0.315 |
oir | +0.301 |
resp | +0.282 |
butt | +0.281 |
Neg logit contributions | |
ullivan | -0.348 |
enhagen | -0.342 |
asma | -0.337 |
Hera | -0.330 |
eda | -0.329 |
Token | v |
Token ID | 410 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
MX | +2.093 |
ovie | +1.947 |
oir | +1.882 |
resp | +1.744 |
butt | +1.710 |
Neg logit contributions | |
ullivan | -2.218 |
enhagen | -2.211 |
asma | -2.159 |
Hera | -2.111 |
eda | -2.102 |
Token | ous |
Token ID | 516 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
oir | +13.579 |
MX | +13.312 |
ovie | +12.478 |
resp | +11.532 |
pa | +11.505 |
Neg logit contributions | |
ullivan | -12.219 |
Hera | -12.081 |
enhagen | -12.021 |
�� | -11.411 |
asma | -11.207 |
Token | et |
Token ID | 2123 |
Feature activation | -4.66e-01 |
Pos logit contributions | |
MX | +2.857 |
ovie | +2.649 |
oir | +2.578 |
resp | +2.385 |
butt | +2.345 |
Neg logit contributions | |
ullivan | -3.018 |
enhagen | -3.006 |
asma | -2.936 |
eda | -2.843 |
Hera | -2.827 |
Token | vot |
Token ID | 1993 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
MX | +5.079 |
ovie | +4.680 |
oir | +4.621 |
resp | +4.313 |
butt | +4.155 |
Neg logit contributions | |
ullivan | -5.426 |
enhagen | -5.362 |
asma | -5.222 |
eda | -5.079 |
Hera | -5.031 |
Token | re |
Token ID | 260 |
Feature activation | -7.95e-02 |
Pos logit contributions | |
MX | +1.479 |
ovie | +1.358 |
oir | +1.314 |
resp | +1.197 |
butt | +1.169 |
Neg logit contributions | |
ullivan | -2.121 |
enhagen | -2.088 |
asma | -2.050 |
Hera | -2.017 |
eda | -2.009 |
Token | dé |
Token ID | 39073 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
MX | +0.902 |
ovie | +0.843 |
oir | +0.807 |
resp | +0.756 |
butt | +0.752 |
Neg logit contributions | |
ullivan | -0.921 |
enhagen | -0.911 |
asma | -0.892 |
eda | -0.873 |
Hera | -0.870 |
Token | Times |
Token ID | 3782 |
Feature activation | -5.22e-01 |
Pos logit contributions | |
MX | +2.242 |
ovie | +2.095 |
oir | +2.014 |
butt | +1.907 |
resp | +1.893 |
Neg logit contributions | |
enhagen | -1.815 |
ullivan | -1.814 |
asma | -1.738 |
eda | -1.696 |
lication | -1.694 |
Token | 's |
Token ID | 338 |
Feature activation | -4.87e-01 |
Pos logit contributions | |
MX | +4.357 |
ovie | +3.832 |
oir | +3.740 |
butt | +3.520 |
\' | +3.505 |
Neg logit contributions | |
enhagen | -7.525 |
ullivan | -7.500 |
lication | -7.064 |
Hera | -6.969 |
asma | -6.943 |
Token | products |
Token ID | 3186 |
Feature activation | +2.28e-02 |
Pos logit contributions | |
MX | +5.820 |
ovie | +5.270 |
oir | +5.207 |
resp | +4.902 |
butt | +4.886 |
Neg logit contributions | |
enhagen | -5.334 |
ullivan | -5.101 |
asma | -4.969 |
lication | -4.899 |
eda | -4.896 |
Token | and |
Token ID | 290 |
Feature activation | -1.96e-02 |
Pos logit contributions | |
ullivan | +0.268 |
enhagen | +0.263 |
asma | +0.260 |
Hera | +0.256 |
eda | +0.255 |
Neg logit contributions | |
MX | -0.254 |
ovie | -0.237 |
oir | -0.226 |
resp | -0.211 |
butt | -0.211 |
Token | services |
Token ID | 2594 |
Feature activation | -3.72e-01 |
Pos logit contributions | |
MX | +0.303 |
ovie | +0.289 |
oir | +0.279 |
resp | +0.267 |
butt | +0.266 |
Neg logit contributions | |
ullivan | -0.147 |
enhagen | -0.144 |
asma | -0.140 |
Hera | -0.135 |
eda | -0.135 |
Token | . |
Token ID | 13 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
MX | +3.426 |
ovie | +3.064 |
oir | +2.863 |
butt | +2.700 |
resp | +2.665 |
Neg logit contributions | |
enhagen | -5.185 |
ullivan | -5.107 |
asma | -4.912 |
lication | -4.849 |
Hera | -4.754 |
Token | Thank |
Token ID | 6952 |
Feature activation | -7.53e-01 |
Pos logit contributions | |
MX | +5.587 |
resp | +4.017 |
� | +3.745 |
ovie | +3.700 |
pa | +3.210 |
Neg logit contributions | |
enhagen | -21.519 |
ullivan | -20.470 |
asma | -20.051 |
lication | -19.785 |
livest | -19.718 |
Token | you |
Token ID | 345 |
Feature activation | -6.07e-01 |
Pos logit contributions | |
MX | +5.583 |
ovie | +4.794 |
oir | +4.657 |
resp | +4.494 |
butt | +4.327 |
Neg logit contributions | |
enhagen | -11.053 |
ullivan | -10.855 |
lication | -10.343 |
asma | -10.327 |
Hera | -9.948 |
Token | for |
Token ID | 329 |
Feature activation | +3.68e-02 |
Pos logit contributions | |
MX | +5.239 |
ovie | +4.749 |
oir | +4.409 |
butt | +4.219 |
resp | +4.194 |
Neg logit contributions | |
enhagen | -8.486 |
ullivan | -8.412 |
asma | -7.996 |
lication | -7.971 |
Hera | -7.914 |
Token | subscribing |
Token ID | 18412 |
Feature activation | -6.68e-01 |
Pos logit contributions | |
ullivan | +0.343 |
enhagen | +0.336 |
asma | +0.330 |
Hera | +0.323 |
eda | +0.322 |
Neg logit contributions | |
MX | -0.499 |
ovie | -0.473 |
oir | -0.455 |
resp | -0.430 |
butt | -0.429 |
Token | . |
Token ID | 13 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
MX | +5.281 |
oir | +4.353 |
ovie | +4.343 |
butt | +3.829 |
sburgh | +3.826 |
Neg logit contributions | |
enhagen | -10.204 |
ullivan | -9.863 |
lication | -9.523 |
asma | -9.304 |
Hera | -9.164 |
Token | and |
Token ID | 290 |
Feature activation | +4.57e-02 |
Pos logit contributions | |
MX | +3.647 |
ovie | +3.359 |
oir | +3.216 |
resp | +2.999 |
butt | +2.974 |
Neg logit contributions | |
ullivan | -4.312 |
enhagen | -4.187 |
asma | -4.110 |
Hera | -4.063 |
eda | -3.999 |
Token | Google |
Token ID | 3012 |
Feature activation | -4.40e-01 |
Pos logit contributions | |
ullivan | +0.514 |
enhagen | +0.505 |
asma | +0.497 |
Hera | +0.489 |
eda | +0.487 |
Neg logit contributions | |
MX | -0.532 |
ovie | -0.498 |
oir | -0.475 |
resp | -0.447 |
butt | -0.445 |
Token | are |
Token ID | 389 |
Feature activation | -5.16e-02 |
Pos logit contributions | |
MX | +4.623 |
ovie | +4.353 |
oir | +4.086 |
butt | +3.946 |
resp | +3.864 |
Neg logit contributions | |
ullivan | -5.276 |
enhagen | -5.133 |
asma | -5.066 |
Hera | -4.940 |
eda | -4.887 |
Token | taking |
Token ID | 2263 |
Feature activation | -3.44e-01 |
Pos logit contributions | |
MX | +0.592 |
ovie | +0.553 |
oir | +0.527 |
resp | +0.494 |
butt | +0.494 |
Neg logit contributions | |
ullivan | -0.592 |
enhagen | -0.583 |
asma | -0.573 |
eda | -0.561 |
Hera | -0.560 |
Token | a |
Token ID | 257 |
Feature activation | -7.13e-01 |
Pos logit contributions | |
MX | +3.680 |
ovie | +3.400 |
oir | +3.247 |
resp | +3.078 |
butt | +3.070 |
Neg logit contributions | |
ullivan | -4.143 |
enhagen | -4.086 |
asma | -3.964 |
eda | -3.878 |
lication | -3.864 |
Token | tougher |
Token ID | 20516 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
MX | +7.210 |
ovie | +6.487 |
oir | +6.379 |
resp | +5.969 |
butt | +5.819 |
Neg logit contributions | |
enhagen | -8.421 |
ullivan | -8.413 |
lication | -8.000 |
asma | -7.996 |
eda | -7.907 |
Token | stance |
Token ID | 12046 |
Feature activation | -3.35e-01 |
Pos logit contributions | |
MX | +9.022 |
ovie | +8.541 |
oir | +7.239 |
butt | +7.198 |
resp | +7.153 |
Neg logit contributions | |
enhagen | -15.916 |
ullivan | -15.608 |
lication | -15.359 |
rocal | -15.234 |
�� | -15.199 |
Token | against |
Token ID | 1028 |
Feature activation | -2.66e-01 |
Pos logit contributions | |
MX | +3.313 |
ovie | +3.157 |
oir | +2.922 |
butt | +2.731 |
resp | +2.726 |
Neg logit contributions | |
ullivan | -4.279 |
enhagen | -4.201 |
asma | -4.122 |
eda | -4.031 |
Hera | -4.019 |
Token | nudity |
Token ID | 42156 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
MX | +2.940 |
ovie | +2.769 |
oir | +2.628 |
resp | +2.505 |
butt | +2.461 |
Neg logit contributions | |
ullivan | -3.114 |
enhagen | -3.048 |
asma | -3.018 |
eda | -2.955 |
lication | -2.927 |
Token | to |
Token ID | 284 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
MX | +3.192 |
ovie | +2.949 |
oir | +2.828 |
resp | +2.662 |
butt | +2.630 |
Neg logit contributions | |
ullivan | -3.986 |
enhagen | -3.916 |
asma | -3.785 |
Hera | -3.724 |
eda | -3.721 |
Token | prevent |
Token ID | 2948 |
Feature activation | -5.57e-02 |
Pos logit contributions | |
MX | +1.285 |
ovie | +1.200 |
oir | +1.149 |
butt | +1.073 |
resp | +1.073 |
Neg logit contributions | |
ullivan | -1.350 |
enhagen | -1.324 |
asma | -1.305 |
Hera | -1.276 |
eda | -1.273 |
Token | Nov |
Token ID | 5267 |
Feature activation | -6.83e-01 |
Pos logit contributions | |
MX | +1.693 |
ovie | +1.583 |
oir | +1.504 |
butt | +1.399 |
resp | +1.396 |
Neg logit contributions | |
ullivan | -1.930 |
enhagen | -1.898 |
asma | -1.863 |
eda | -1.807 |
Hera | -1.800 |
Token | . |
Token ID | 13 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
MX | +5.147 |
ovie | +4.734 |
oir | +4.386 |
resp | +4.033 |
pa | +4.023 |
Neg logit contributions | |
enhagen | -10.037 |
ullivan | -9.856 |
asma | -9.423 |
Hera | -9.267 |
lication | -9.154 |
Token | 8 |
Token ID | 807 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
MX | +3.194 |
ovie | +2.907 |
oir | +2.772 |
butt | +2.605 |
resp | +2.599 |
Neg logit contributions | |
enhagen | -3.779 |
ullivan | -3.777 |
asma | -3.613 |
lication | -3.511 |
eda | -3.496 |
Token | in |
Token ID | 287 |
Feature activation | -4.66e-02 |
Pos logit contributions | |
MX | +3.011 |
ovie | +2.844 |
oir | +2.654 |
butt | +2.466 |
resp | +2.463 |
Neg logit contributions | |
ullivan | -4.083 |
enhagen | -3.995 |
asma | -3.970 |
Hera | -3.815 |
eda | -3.794 |
Token | Vaughan |
Token ID | 47451 |
Feature activation | -8.47e-01 |
Pos logit contributions | |
MX | +0.562 |
ovie | +0.528 |
oir | +0.504 |
resp | +0.475 |
butt | +0.474 |
Neg logit contributions | |
ullivan | -0.506 |
enhagen | -0.497 |
asma | -0.489 |
Hera | -0.477 |
eda | -0.477 |
Token | , |
Token ID | 11 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
MX | +6.638 |
ovie | +5.968 |
oir | +5.801 |
sburgh | +5.486 |
butt | +5.396 |
Neg logit contributions | |
ullivan | -12.021 |
asma | -11.100 |
enhagen | -11.079 |
Hera | -10.897 |
rocal | -10.820 |
Token | Ont |
Token ID | 9463 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
MX | +10.614 |
butt | +9.195 |
ovie | +9.186 |
pa | +8.759 |
sburgh | +8.431 |
Neg logit contributions | |
ullivan | -15.226 |
enhagen | -14.348 |
asma | -14.212 |
lication | -13.340 |
eda | -13.252 |
Token | . |
Token ID | 13 |
Feature activation | +2.05e-02 |
Pos logit contributions | |
MX | +1.989 |
ovie | +1.851 |
oir | +1.744 |
resp | +1.584 |
butt | +1.555 |
Neg logit contributions | |
ullivan | -3.347 |
enhagen | -3.254 |
asma | -3.224 |
Hera | -3.207 |
eda | -3.151 |
Token | The |
Token ID | 383 |
Feature activation | -2.54e-01 |
Pos logit contributions | |
ullivan | +0.242 |
enhagen | +0.238 |
asma | +0.234 |
Hera | +0.230 |
eda | +0.230 |
Neg logit contributions | |
MX | -0.229 |
ovie | -0.213 |
oir | -0.203 |
resp | -0.190 |
butt | -0.189 |
Token | three |
Token ID | 1115 |
Feature activation | -6.40e-01 |
Pos logit contributions | |
MX | +2.837 |
ovie | +2.651 |
oir | +2.515 |
butt | +2.362 |
resp | +2.354 |
Neg logit contributions | |
ullivan | -2.953 |
enhagen | -2.882 |
asma | -2.862 |
eda | -2.771 |
lication | -2.760 |
Token | players |
Token ID | 1938 |
Feature activation | -3.71e-01 |
Pos logit contributions | |
MX | +6.454 |
ovie | +5.929 |
oir | +5.635 |
butt | +5.428 |
sburgh | +5.370 |
Neg logit contributions | |
ullivan | -7.678 |
enhagen | -7.339 |
asma | -7.309 |
lication | -7.197 |
eda | -7.102 |
Token | make |
Token ID | 787 |
Feature activation | +3.04e-01 |
Pos logit contributions | |
ullivan | +1.725 |
enhagen | +1.683 |
asma | +1.672 |
Hera | +1.655 |
eda | +1.641 |
Neg logit contributions | |
MX | -2.271 |
ovie | -2.149 |
oir | -2.054 |
resp | -1.945 |
butt | -1.930 |
Token | the |
Token ID | 262 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
ullivan | +3.383 |
enhagen | +3.311 |
asma | +3.283 |
Hera | +3.257 |
eda | +3.194 |
Neg logit contributions | |
MX | -3.521 |
ovie | -3.292 |
oir | -3.132 |
sburgh | -2.930 |
butt | -2.921 |
Token | noise |
Token ID | 7838 |
Feature activation | -4.77e-01 |
Pos logit contributions | |
ullivan | +1.354 |
enhagen | +1.328 |
asma | +1.312 |
Hera | +1.293 |
eda | +1.286 |
Neg logit contributions | |
MX | -1.282 |
ovie | -1.194 |
oir | -1.132 |
resp | -1.062 |
butt | -1.060 |
Token | with |
Token ID | 351 |
Feature activation | -1.43e-02 |
Pos logit contributions | |
MX | +4.863 |
ovie | +4.403 |
oir | +4.224 |
resp | +3.944 |
butt | +3.931 |
Neg logit contributions | |
ullivan | -5.913 |
enhagen | -5.777 |
asma | -5.747 |
eda | -5.586 |
lication | -5.506 |
Token | a |
Token ID | 257 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
MX | +0.168 |
ovie | +0.158 |
oir | +0.151 |
resp | +0.142 |
butt | +0.141 |
Neg logit contributions | |
ullivan | -0.160 |
enhagen | -0.158 |
asma | -0.155 |
Hera | -0.152 |
eda | -0.152 |
Token | sound |
Token ID | 2128 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
MX | +1.171 |
ovie | +1.089 |
oir | +1.042 |
resp | +0.977 |
butt | +0.976 |
Neg logit contributions | |
ullivan | -1.176 |
enhagen | -1.162 |
asma | -1.138 |
eda | -1.114 |
Hera | -1.112 |
Token | board |
Token ID | 3526 |
Feature activation | +7.96e-02 |
Pos logit contributions | |
MX | +12.298 |
ovie | +11.091 |
oir | +10.792 |
butt | +10.689 |
pa | +10.507 |
Neg logit contributions | |
enhagen | -13.073 |
ullivan | -12.902 |
asma | -12.356 |
rocal | -12.029 |
eda | -11.852 |
Token | or |
Token ID | 393 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
ullivan | +0.933 |
enhagen | +0.919 |
asma | +0.907 |
Hera | +0.891 |
eda | +0.887 |
Neg logit contributions | |
MX | -0.886 |
ovie | -0.826 |
oir | -0.784 |
resp | -0.738 |
butt | -0.733 |
Token | your |
Token ID | 534 |
Feature activation | +4.98e-02 |
Pos logit contributions | |
MX | +1.451 |
ovie | +1.352 |
oir | +1.289 |
resp | +1.205 |
butt | +1.204 |
Neg logit contributions | |
ullivan | -1.514 |
enhagen | -1.493 |
asma | -1.464 |
eda | -1.431 |
Hera | -1.429 |
Token | own |
Token ID | 898 |
Feature activation | -9.38e-02 |
Pos logit contributions | |
ullivan | +0.551 |
enhagen | +0.540 |
asma | +0.533 |
Hera | +0.522 |
eda | +0.521 |
Neg logit contributions | |
MX | -0.591 |
ovie | -0.554 |
oir | -0.528 |
resp | -0.498 |
butt | -0.495 |
Token | effects |
Token ID | 3048 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
MX | +1.050 |
ovie | +0.980 |
oir | +0.935 |
resp | +0.873 |
butt | +0.873 |
Neg logit contributions | |
ullivan | -1.099 |
enhagen | -1.090 |
asma | -1.065 |
eda | -1.042 |
Hera | -1.040 |
Token | la |
Token ID | 8591 |
Feature activation | -5.00e-02 |
Pos logit contributions | |
MX | +4.797 |
ovie | +4.457 |
oir | +4.418 |
resp | +4.029 |
butt | +3.928 |
Neg logit contributions | |
ullivan | -5.054 |
enhagen | -5.020 |
asma | -4.869 |
Hera | -4.730 |
eda | -4.694 |
Token | corporation |
Token ID | 12017 |
Feature activation | -3.77e-02 |
Pos logit contributions | |
MX | +0.573 |
ovie | +0.535 |
oir | +0.511 |
resp | +0.479 |
butt | +0.476 |
Neg logit contributions | |
ullivan | -0.575 |
enhagen | -0.566 |
asma | -0.556 |
Hera | -0.544 |
eda | -0.543 |
Token | , |
Token ID | 11 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
MX | +0.420 |
ovie | +0.392 |
oir | +0.374 |
resp | +0.350 |
butt | +0.348 |
Neg logit contributions | |
ullivan | -0.445 |
enhagen | -0.438 |
asma | -0.431 |
Hera | -0.422 |
eda | -0.422 |
Token | s |
Token ID | 264 |
Feature activation | -4.10e-01 |
Pos logit contributions | |
MX | +2.734 |
ovie | +2.530 |
oir | +2.435 |
resp | +2.277 |
butt | +2.239 |
Neg logit contributions | |
ullivan | -2.737 |
enhagen | -2.714 |
asma | -2.654 |
eda | -2.578 |
Hera | -2.573 |
Token | es |
Token ID | 274 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
MX | +4.145 |
ovie | +3.927 |
oir | +3.829 |
resp | +3.440 |
butt | +3.298 |
Neg logit contributions | |
ullivan | -5.173 |
enhagen | -5.075 |
Hera | -5.038 |
asma | -4.932 |
eda | -4.772 |
Token | v |
Token ID | 410 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
MX | +1.477 |
ovie | +1.375 |
oir | +1.321 |
resp | +1.238 |
butt | +1.227 |
Neg logit contributions | |
ullivan | -1.463 |
enhagen | -1.451 |
asma | -1.418 |
eda | -1.384 |
Hera | -1.378 |
Token | ale |
Token ID | 1000 |
Feature activation | -6.74e-02 |
Pos logit contributions | |
oir | +13.058 |
MX | +12.676 |
ovie | +11.949 |
resp | +11.201 |
ie | +11.008 |
Neg logit contributions | |
ullivan | -12.069 |
Hera | -11.929 |
enhagen | -11.600 |
�� | -11.476 |
asma | -11.254 |
Token | urs |
Token ID | 1834 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
MX | +0.560 |
ovie | +0.509 |
oir | +0.480 |
resp | +0.437 |
butt | +0.431 |
Neg logit contributions | |
ullivan | -0.985 |
enhagen | -0.974 |
asma | -0.961 |
Hera | -0.945 |
eda | -0.942 |
Token | et |
Token ID | 2123 |
Feature activation | -4.50e-01 |
Pos logit contributions | |
MX | +3.862 |
ovie | +3.576 |
oir | +3.492 |
resp | +3.233 |
butt | +3.151 |
Neg logit contributions | |
enhagen | -4.076 |
ullivan | -4.054 |
asma | -3.947 |
eda | -3.815 |
lication | -3.787 |
Token | le |
Token ID | 443 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
MX | +5.005 |
ovie | +4.630 |
oir | +4.556 |
resp | +4.241 |
butt | +4.092 |
Neg logit contributions | |
ullivan | -5.157 |
enhagen | -5.091 |
asma | -4.951 |
eda | -4.779 |
Hera | -4.770 |
Token | urs |
Token ID | 1834 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
MX | +1.202 |
ovie | +1.117 |
oir | +1.067 |
resp | +0.995 |
butt | +0.988 |
Neg logit contributions | |
ullivan | -1.376 |
enhagen | -1.363 |
asma | -1.333 |
eda | -1.304 |
Hera | -1.301 |
Token | the |
Token ID | 262 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
MX | +6.116 |
ovie | +5.701 |
oir | +5.351 |
sburgh | +4.913 |
butt | +4.806 |
Neg logit contributions | |
ullivan | -8.521 |
enhagen | -8.396 |
asma | -8.065 |
lication | -7.958 |
rocal | -7.832 |
Token | new |
Token ID | 649 |
Feature activation | -4.99e-01 |
Pos logit contributions | |
MX | +0.118 |
ovie | +0.110 |
oir | +0.104 |
resp | +0.097 |
butt | +0.097 |
Neg logit contributions | |
ullivan | -0.134 |
enhagen | -0.132 |
asma | -0.130 |
Hera | -0.127 |
eda | -0.127 |
Token | Secretary |
Token ID | 4986 |
Feature activation | -6.07e-01 |
Pos logit contributions | |
MX | +4.569 |
ovie | +4.223 |
oir | +3.985 |
sburgh | +3.679 |
resp | +3.635 |
Neg logit contributions | |
ullivan | -6.595 |
enhagen | -6.545 |
asma | -6.403 |
lication | -6.278 |
eda | -6.253 |
Token | of |
Token ID | 286 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
MX | +5.601 |
ovie | +5.327 |
oir | +4.860 |
butt | +4.551 |
pa | +4.468 |
Neg logit contributions | |
enhagen | -7.838 |
ullivan | -7.810 |
asma | -7.619 |
eda | -7.391 |
Hera | -7.316 |
Token | Energy |
Token ID | 6682 |
Feature activation | -7.97e-01 |
Pos logit contributions | |
MX | +6.406 |
ovie | +6.156 |
oir | +5.442 |
pa | +5.061 |
sburgh | +5.052 |
Neg logit contributions | |
ullivan | -14.373 |
enhagen | -14.181 |
asma | -13.981 |
eda | -13.340 |
lication | -13.307 |
Token | , |
Token ID | 11 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
MX | +6.783 |
ovie | +6.638 |
oir | +5.840 |
butt | +5.486 |
pa | +5.469 |
Neg logit contributions | |
ullivan | -10.435 |
enhagen | -10.273 |
asma | -9.976 |
rocal | -9.844 |
lication | -9.703 |
Token | Ernest |
Token ID | 34705 |
Feature activation | -3.95e-01 |
Pos logit contributions | |
MX | +9.690 |
ovie | +9.057 |
pa | +8.509 |
sburgh | +8.410 |
oir | +8.217 |
Neg logit contributions | |
ullivan | -14.763 |
enhagen | -14.438 |
asma | -13.858 |
rocal | -13.507 |
lication | -13.285 |
Token | Mon |
Token ID | 2892 |
Feature activation | +4.85e-02 |
Pos logit contributions | |
MX | +3.727 |
ovie | +3.450 |
oir | +3.415 |
butt | +3.056 |
resp | +3.043 |
Neg logit contributions | |
ullivan | -5.326 |
enhagen | -5.176 |
asma | -5.035 |
rocal | -4.897 |
lication | -4.886 |
Token | iz |
Token ID | 528 |
Feature activation | +9.68e-02 |
Pos logit contributions | |
ullivan | +0.478 |
enhagen | +0.470 |
asma | +0.467 |
eda | +0.455 |
Hera | +0.451 |
Neg logit contributions | |
MX | -0.633 |
ovie | -0.594 |
oir | -0.569 |
resp | -0.541 |
butt | -0.538 |
Token | . |
Token ID | 13 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
ullivan | +1.156 |
enhagen | +1.136 |
asma | +1.121 |
eda | +1.103 |
Hera | +1.101 |
Neg logit contributions | |
MX | -1.059 |
ovie | -0.984 |
oir | -0.939 |
resp | -0.884 |
butt | -0.876 |
Token |
|
Token ID | 198 |
Feature activation | +8.21e-02 |
Pos logit contributions | |
MX | +3.801 |
ovie | +3.447 |
oir | +3.294 |
butt | +3.034 |
resp | +3.009 |
Neg logit contributions | |
enhagen | -4.926 |
ullivan | -4.925 |
asma | -4.733 |
eda | -4.665 |
lication | -4.637 |
Token | , |
Token ID | 11 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
MX | +3.508 |
ovie | +3.028 |
oir | +2.873 |
butt | +2.754 |
resp | +2.711 |
Neg logit contributions | |
enhagen | -4.878 |
ullivan | -4.800 |
asma | -4.631 |
Hera | -4.576 |
eda | -4.573 |
Token | local |
Token ID | 1957 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
ullivan | +2.073 |
asma | +2.032 |
enhagen | +1.964 |
Hera | +1.948 |
eda | +1.920 |
Neg logit contributions | |
MX | -3.104 |
ovie | -2.963 |
oir | -2.825 |
butt | -2.716 |
resp | -2.707 |
Token | independent |
Token ID | 4795 |
Feature activation | -7.75e-01 |
Pos logit contributions | |
MX | +3.154 |
ovie | +2.149 |
oir | +1.225 |
iary | +0.992 |
pa | +0.959 |
Neg logit contributions | |
enhagen | -20.076 |
lication | -19.015 |
ullivan | -18.771 |
zl | -18.174 |
�� | -18.166 |
Token | journalism |
Token ID | 14033 |
Feature activation | -6.50e-01 |
Pos logit contributions | |
MX | +5.937 |
ovie | +5.357 |
sburgh | +4.798 |
iary | +4.600 |
oir | +4.556 |
Neg logit contributions | |
enhagen | -11.582 |
ullivan | -11.562 |
eda | -10.871 |
rocal | -10.798 |
cone | -10.693 |
Token | in |
Token ID | 287 |
Feature activation | -4.89e-01 |
Pos logit contributions | |
MX | +5.590 |
ovie | +4.827 |
oir | +4.591 |
resp | +4.336 |
butt | +4.284 |
Neg logit contributions | |
ullivan | -9.315 |
enhagen | -8.947 |
asma | -8.677 |
lication | -8.646 |
rocal | -8.359 |
Token | South |
Token ID | 2520 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
MX | +2.774 |
ovie | +2.344 |
pa | +1.940 |
resp | +1.913 |
oir | +1.904 |
Neg logit contributions | |
enhagen | -8.359 |
ullivan | -8.306 |
Hera | -8.162 |
asma | -8.154 |
lication | -8.005 |
Token | Australia |
Token ID | 4505 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
MX | +6.782 |
butt | +5.007 |
pa | +4.722 |
oir | +4.636 |
resp | +4.448 |
Neg logit contributions | |
ullivan | -20.495 |
enhagen | -19.441 |
rocal | -18.968 |
lication | -18.567 |
�� | -18.549 |
Token | . |
Token ID | 13 |
Feature activation | -6.74e-01 |
Pos logit contributions | |
MX | +4.438 |
ovie | +4.003 |
oir | +3.889 |
resp | +3.681 |
butt | +3.641 |
Neg logit contributions | |
ullivan | -8.458 |
enhagen | -8.215 |
asma | -8.116 |
lication | -8.005 |
Hera | -7.957 |
Token | As |
Token ID | 1081 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
MX | +5.387 |
oir | +4.615 |
ovie | +4.492 |
butt | +4.403 |
sburgh | +4.338 |
Neg logit contributions | |
enhagen | -9.965 |
ullivan | -9.814 |
lication | -9.422 |
cone | -9.363 |
asma | -9.101 |
Token | a |
Token ID | 257 |
Feature activation | -6.64e-01 |
Pos logit contributions | |
MX | +6.456 |
oir | +6.155 |
ovie | +6.132 |
pa | +5.272 |
resp | +5.159 |
Neg logit contributions | |
ullivan | -15.119 |
enhagen | -14.739 |
lication | -14.593 |
cone | -14.413 |
asma | -14.250 |
Token | news |
Token ID | 1705 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
MX | +4.351 |
oir | +3.751 |
ovie | +3.434 |
pa | +3.222 |
resp | +3.183 |
Neg logit contributions | |
enhagen | -10.665 |
ullivan | -10.400 |
cone | -9.946 |
asma | -9.850 |
zl | -9.774 |
Token | test |
Token ID | 1332 |
Feature activation | -6.73e-02 |
Pos logit contributions | |
MX | +1.839 |
ovie | +1.716 |
oir | +1.638 |
resp | +1.543 |
butt | +1.541 |
Neg logit contributions | |
ullivan | -1.873 |
enhagen | -1.848 |
asma | -1.805 |
lication | -1.778 |
Hera | -1.772 |
Token | methods |
Token ID | 5050 |
Feature activation | -9.77e-02 |
Pos logit contributions | |
MX | +0.722 |
ovie | +0.672 |
oir | +0.638 |
resp | +0.596 |
butt | +0.594 |
Neg logit contributions | |
ullivan | -0.819 |
enhagen | -0.807 |
asma | -0.795 |
Hera | -0.778 |
eda | -0.778 |
Token | to |
Token ID | 284 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
MX | +1.074 |
ovie | +1.002 |
oir | +0.950 |
resp | +0.890 |
butt | +0.889 |
Neg logit contributions | |
ullivan | -1.165 |
enhagen | -1.145 |
asma | -1.123 |
eda | -1.103 |
Hera | -1.103 |
Token | measure |
Token ID | 3953 |
Feature activation | -4.49e-01 |
Pos logit contributions | |
MX | +2.828 |
ovie | +2.630 |
oir | +2.499 |
butt | +2.358 |
resp | +2.353 |
Neg logit contributions | |
ullivan | -3.008 |
enhagen | -2.980 |
asma | -2.885 |
lication | -2.875 |
eda | -2.849 |
Token | weak |
Token ID | 4939 |
Feature activation | -6.02e-01 |
Pos logit contributions | |
MX | +4.404 |
ovie | +4.073 |
oir | +3.870 |
resp | +3.552 |
sburgh | +3.537 |
Neg logit contributions | |
ullivan | -5.692 |
enhagen | -5.590 |
asma | -5.440 |
lication | -5.418 |
eda | -5.340 |
Token | gravitational |
Token ID | 29973 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
MX | +6.502 |
ovie | +6.107 |
oir | +5.774 |
butt | +5.476 |
pa | +5.444 |
Neg logit contributions | |
ullivan | -6.932 |
enhagen | -6.542 |
lication | -6.403 |
eda | -6.359 |
asma | -6.344 |
Token | lens |
Token ID | 10317 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
waves | +10.324 |
MX | +10.030 |
ovie | +9.428 |
oir | +9.311 |
pa | +8.484 |
Neg logit contributions | |
ullivan | -15.098 |
enhagen | -14.350 |
lication | -14.257 |
nown | -13.981 |
eda | -13.706 |
Token | ing |
Token ID | 278 |
Feature activation | -4.97e-01 |
Pos logit contributions | |
MX | +1.439 |
ovie | +1.351 |
oir | +1.287 |
resp | +1.202 |
butt | +1.193 |
Neg logit contributions | |
ullivan | -1.556 |
enhagen | -1.530 |
asma | -1.500 |
Hera | -1.466 |
eda | -1.465 |
Token | , |
Token ID | 11 |
Feature activation | -5.31e-01 |
Pos logit contributions | |
MX | +4.901 |
ovie | +4.561 |
oir | +4.347 |
resp | +3.975 |
pa | +3.972 |
Neg logit contributions | |
ullivan | -6.374 |
enhagen | -6.128 |
asma | -5.923 |
lication | -5.865 |
eda | -5.834 |
Token | another |
Token ID | 1194 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
MX | +5.137 |
ovie | +4.825 |
oir | +4.441 |
butt | +4.210 |
resp | +4.199 |
Neg logit contributions | |
ullivan | -6.666 |
enhagen | -6.542 |
asma | -6.419 |
eda | -6.331 |
lication | -6.329 |
Token | way |
Token ID | 835 |
Feature activation | -4.33e-01 |
Pos logit contributions | |
MX | +2.746 |
ovie | +2.584 |
oir | +2.461 |
butt | +2.310 |
resp | +2.282 |
Neg logit contributions | |
ullivan | -2.750 |
enhagen | -2.714 |
asma | -2.649 |
eda | -2.584 |
lication | -2.577 |
Token | well |
Token ID | 880 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
MX | +2.176 |
ovie | +2.012 |
oir | +1.945 |
resp | +1.811 |
butt | +1.806 |
Neg logit contributions | |
enhagen | -2.498 |
ullivan | -2.489 |
asma | -2.412 |
lication | -2.382 |
Hera | -2.359 |
Token | , |
Token ID | 11 |
Feature activation | +6.32e-02 |
Pos logit contributions | |
MX | +1.317 |
ovie | +1.225 |
oir | +1.169 |
butt | +1.085 |
resp | +1.080 |
Neg logit contributions | |
ullivan | -1.571 |
enhagen | -1.547 |
asma | -1.528 |
Hera | -1.495 |
eda | -1.493 |
Token | it |
Token ID | 340 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
ullivan | +0.749 |
enhagen | +0.737 |
asma | +0.725 |
Hera | +0.714 |
eda | +0.711 |
Neg logit contributions | |
MX | -0.698 |
ovie | -0.652 |
oir | -0.618 |
resp | -0.582 |
butt | -0.577 |
Token | will |
Token ID | 481 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
enhagen | +3.688 |
ullivan | +3.678 |
asma | +3.621 |
Hera | +3.559 |
eda | +3.547 |
Neg logit contributions | |
MX | -4.931 |
ovie | -4.585 |
oir | -4.334 |
resp | -4.141 |
butt | -4.080 |
Token | automatically |
Token ID | 6338 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
ullivan | +1.903 |
enhagen | +1.859 |
asma | +1.852 |
Hera | +1.817 |
eda | +1.808 |
Neg logit contributions | |
MX | -2.032 |
ovie | -1.896 |
oir | -1.784 |
resp | -1.694 |
butt | -1.674 |
Token | begin |
Token ID | 2221 |
Feature activation | +7.32e-01 |
Pos logit contributions | |
ullivan | +3.963 |
asma | +3.879 |
enhagen | +3.828 |
Hera | +3.813 |
eda | +3.739 |
Neg logit contributions | |
MX | -4.211 |
ovie | -3.910 |
oir | -3.706 |
resp | -3.494 |
butt | -3.448 |
Token | another |
Token ID | 1194 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
ullivan | +6.929 |
asma | +6.837 |
enhagen | +6.832 |
Hera | +6.825 |
eda | +6.645 |
Neg logit contributions | |
MX | -8.732 |
ovie | -8.107 |
oir | -7.776 |
resp | -7.340 |
butt | -7.281 |
Token | drawing |
Token ID | 8263 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
ullivan | +4.645 |
enhagen | +4.489 |
Hera | +4.470 |
asma | +4.393 |
lication | +4.332 |
Neg logit contributions | |
MX | -5.271 |
ovie | -4.897 |
oir | -4.712 |
resp | -4.465 |
butt | -4.408 |
Token | or |
Token ID | 393 |
Feature activation | -3.79e-02 |
Pos logit contributions | |
ullivan | +3.623 |
enhagen | +3.574 |
asma | +3.442 |
lication | +3.440 |
Hera | +3.439 |
Neg logit contributions | |
MX | -3.826 |
ovie | -3.533 |
oir | -3.347 |
resp | -3.207 |
butt | -3.163 |
Token | poem |
Token ID | 21247 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
MX | +0.404 |
ovie | +0.376 |
oir | +0.358 |
resp | +0.333 |
butt | +0.331 |
Neg logit contributions | |
ullivan | -0.466 |
enhagen | -0.459 |
asma | -0.452 |
eda | -0.443 |
Hera | -0.443 |
Token | shortly |
Token ID | 8972 |
Feature activation | -4.44e-02 |
Pos logit contributions | |
ullivan | +1.932 |
enhagen | +1.915 |
asma | +1.868 |
Hera | +1.845 |
eda | +1.834 |
Neg logit contributions | |
MX | -1.885 |
ovie | -1.748 |
oir | -1.654 |
resp | -1.575 |
butt | -1.560 |
Token |
|
Token ID | 198 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
ullivan | +3.248 |
asma | +3.223 |
Hera | +3.183 |
eda | +3.168 |
enhagen | +3.032 |
Neg logit contributions | |
MX | -3.933 |
ovie | -3.792 |
oir | -3.576 |
resp | -3.353 |
sburgh | -3.348 |
Token | Free |
Token ID | 11146 |
Feature activation | +7.81e-01 |
Pos logit contributions | |
asma | +4.176 |
ullivan | +4.157 |
eda | +4.022 |
enhagen | +3.972 |
Hera | +3.909 |
Neg logit contributions | |
MX | -5.246 |
ovie | -5.151 |
oir | -4.955 |
sburgh | -4.642 |
butt | -4.570 |
Token | Sync |
Token ID | 28985 |
Feature activation | +4.35e-01 |
Pos logit contributions | |
asma | +7.231 |
enhagen | +7.144 |
ullivan | +7.034 |
Hera | +6.973 |
eda | +6.800 |
Neg logit contributions | |
ovie | -9.070 |
MX | -9.037 |
oir | -8.639 |
sburgh | -8.243 |
butt | -8.129 |
Token | Please |
Token ID | 4222 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
ullivan | +4.579 |
asma | +4.564 |
enhagen | +4.535 |
Hera | +4.507 |
eda | +4.425 |
Neg logit contributions | |
MX | -5.025 |
ovie | -4.857 |
oir | -4.590 |
resp | -4.334 |
butt | -4.297 |
Token | have |
Token ID | 423 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
ullivan | +3.585 |
enhagen | +3.562 |
eda | +3.501 |
Hera | +3.501 |
asma | +3.501 |
Neg logit contributions | |
MX | -3.143 |
ovie | -2.960 |
oir | -2.808 |
resp | -2.644 |
butt | -2.588 |
Token | a |
Token ID | 257 |
Feature activation | +7.45e-01 |
Pos logit contributions | |
ullivan | +3.406 |
asma | +3.360 |
enhagen | +3.352 |
eda | +3.301 |
Hera | +3.288 |
Neg logit contributions | |
MX | -3.731 |
ovie | -3.549 |
oir | -3.356 |
resp | -3.207 |
sburgh | -3.130 |
Token | read |
Token ID | 1100 |
Feature activation | +6.04e-01 |
Pos logit contributions | |
asma | +7.082 |
ullivan | +6.978 |
Hera | +6.764 |
enhagen | +6.569 |
eda | +6.500 |
Neg logit contributions | |
MX | -8.987 |
ovie | -8.524 |
oir | -8.139 |
resp | -7.785 |
sburgh | -7.681 |
Token | of |
Token ID | 286 |
Feature activation | +8.30e-01 |
Pos logit contributions | |
ullivan | +5.971 |
enhagen | +5.834 |
Hera | +5.758 |
asma | +5.750 |
eda | +5.726 |
Neg logit contributions | |
MX | -7.309 |
ovie | -6.799 |
oir | -6.551 |
resp | -6.193 |
sburgh | -6.171 |
Token | our |
Token ID | 674 |
Feature activation | +8.29e-01 |
Pos logit contributions | |
enhagen | +7.804 |
asma | +7.767 |
Hera | +7.666 |
eda | +7.630 |
ullivan | +7.609 |
Neg logit contributions | |
MX | -9.761 |
ovie | -9.176 |
oir | -9.048 |
sburgh | -8.518 |
butt | -8.510 |
Token | detailed |
Token ID | 6496 |
Feature activation | +9.66e-01 |
Pos logit contributions | |
ullivan | +8.260 |
enhagen | +8.225 |
asma | +8.224 |
Hera | +8.011 |
eda | +7.892 |
Neg logit contributions | |
MX | -9.199 |
ovie | -8.878 |
oir | -8.592 |
sburgh | -8.032 |
butt | -8.001 |
Token | article |
Token ID | 2708 |
Feature activation | +4.04e-01 |
Pos logit contributions | |
asma | +9.043 |
enhagen | +8.933 |
ullivan | +8.853 |
Hera | +8.827 |
eda | +8.669 |
Neg logit contributions | |
MX | -10.772 |
ovie | -10.385 |
oir | -10.189 |
sburgh | -9.536 |
butt | -9.370 |
Token | medical |
Token ID | 3315 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
MX | +0.100 |
ovie | +0.093 |
oir | +0.089 |
resp | +0.084 |
butt | +0.084 |
Neg logit contributions | |
ullivan | -0.092 |
enhagen | -0.090 |
asma | -0.089 |
Hera | -0.087 |
eda | -0.087 |
Token | industry |
Token ID | 2831 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
MX | +3.686 |
ovie | +3.379 |
oir | +3.280 |
butt | +3.008 |
resp | +2.978 |
Neg logit contributions | |
ullivan | -4.724 |
enhagen | -4.663 |
asma | -4.517 |
Hera | -4.382 |
eda | -4.376 |
Token | such |
Token ID | 884 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
MX | +2.517 |
ovie | +2.337 |
oir | +2.241 |
butt | +2.069 |
resp | +2.060 |
Neg logit contributions | |
ullivan | -3.040 |
enhagen | -2.980 |
asma | -2.939 |
Hera | -2.871 |
eda | -2.861 |
Token | that |
Token ID | 326 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
ullivan | +2.210 |
enhagen | +2.151 |
asma | +2.135 |
eda | +2.103 |
Hera | +2.084 |
Neg logit contributions | |
MX | -2.532 |
ovie | -2.379 |
oir | -2.263 |
resp | -2.164 |
butt | -2.127 |
Token | the |
Token ID | 262 |
Feature activation | +6.44e-02 |
Pos logit contributions | |
MX | +1.213 |
ovie | +1.129 |
oir | +1.082 |
butt | +1.009 |
resp | +1.007 |
Neg logit contributions | |
ullivan | -1.273 |
enhagen | -1.252 |
asma | -1.231 |
Hera | -1.199 |
eda | -1.199 |
Token | very |
Token ID | 845 |
Feature activation | +6.96e-01 |
Pos logit contributions | |
ullivan | +0.725 |
enhagen | +0.714 |
asma | +0.703 |
Hera | +0.691 |
eda | +0.689 |
Neg logit contributions | |
MX | -0.748 |
ovie | -0.701 |
oir | -0.667 |
resp | -0.629 |
butt | -0.625 |
Token | definition |
Token ID | 6770 |
Feature activation | -3.25e-02 |
Pos logit contributions | |
Hera | +6.658 |
ullivan | +6.657 |
eda | +6.566 |
asma | +6.558 |
enhagen | +6.551 |
Neg logit contributions | |
MX | -8.381 |
ovie | -7.898 |
oir | -7.331 |
resp | -7.041 |
sburgh | -7.038 |
Token | of |
Token ID | 286 |
Feature activation | +6.69e-02 |
Pos logit contributions | |
MX | +0.365 |
ovie | +0.341 |
oir | +0.325 |
resp | +0.305 |
butt | +0.304 |
Neg logit contributions | |
ullivan | -0.381 |
enhagen | -0.374 |
asma | -0.368 |
Hera | -0.361 |
eda | -0.360 |
Token | � |
Token ID | 564 |
Feature activation | +7.53e-03 |
Pos logit contributions | |
ullivan | +0.757 |
enhagen | +0.744 |
asma | +0.733 |
Hera | +0.722 |
eda | +0.719 |
Neg logit contributions | |
MX | -0.776 |
ovie | -0.727 |
oir | -0.691 |
resp | -0.650 |
butt | -0.648 |
Token | � |
Token ID | 250 |
Feature activation | -3.65e-02 |
Pos logit contributions | |
ullivan | +0.077 |
enhagen | +0.076 |
asma | +0.074 |
Hera | +0.073 |
eda | +0.073 |
Neg logit contributions | |
MX | -0.095 |
ovie | -0.090 |
oir | -0.086 |
resp | -0.081 |
butt | -0.081 |
Token | med |
Token ID | 1150 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
MX | +0.354 |
ovie | +0.326 |
oir | +0.308 |
resp | +0.286 |
butt | +0.285 |
Neg logit contributions | |
ullivan | -0.485 |
enhagen | -0.478 |
asma | -0.471 |
Hera | -0.462 |
eda | -0.462 |
Token | just |
Token ID | 655 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
MX | +2.311 |
ovie | +2.169 |
oir | +2.045 |
resp | +1.927 |
butt | +1.913 |
Neg logit contributions | |
ullivan | -2.538 |
enhagen | -2.481 |
asma | -2.434 |
Hera | -2.374 |
lication | -2.373 |
Token | for |
Token ID | 329 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
ullivan | +1.362 |
enhagen | +1.339 |
asma | +1.325 |
Hera | +1.305 |
eda | +1.298 |
Neg logit contributions | |
MX | -1.346 |
ovie | -1.261 |
oir | -1.205 |
resp | -1.128 |
butt | -1.118 |
Token | yourself |
Token ID | 3511 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
ullivan | +1.793 |
enhagen | +1.777 |
asma | +1.746 |
Hera | +1.720 |
eda | +1.707 |
Neg logit contributions | |
MX | -1.880 |
ovie | -1.752 |
oir | -1.686 |
resp | -1.586 |
butt | -1.567 |
Token | , |
Token ID | 11 |
Feature activation | +7.86e-02 |
Pos logit contributions | |
ullivan | +2.768 |
enhagen | +2.725 |
asma | +2.676 |
Hera | +2.649 |
eda | +2.620 |
Neg logit contributions | |
MX | -2.868 |
ovie | -2.648 |
oir | -2.542 |
resp | -2.403 |
butt | -2.355 |
Token | but |
Token ID | 475 |
Feature activation | +4.99e-01 |
Pos logit contributions | |
ullivan | +0.926 |
enhagen | +0.911 |
asma | +0.896 |
Hera | +0.886 |
eda | +0.882 |
Neg logit contributions | |
MX | -0.872 |
ovie | -0.811 |
oir | -0.776 |
resp | -0.726 |
butt | -0.718 |
Token | for |
Token ID | 329 |
Feature activation | +7.59e-01 |
Pos logit contributions | |
ullivan | +5.153 |
enhagen | +5.107 |
Hera | +5.047 |
asma | +5.042 |
eda | +5.028 |
Neg logit contributions | |
MX | -5.871 |
ovie | -5.518 |
oir | -5.226 |
resp | -5.007 |
sburgh | -4.956 |
Token | a |
Token ID | 257 |
Feature activation | +5.32e-01 |
Pos logit contributions | |
enhagen | +7.286 |
eda | +7.197 |
ullivan | +7.149 |
Hera | +7.134 |
asma | +7.099 |
Neg logit contributions | |
MX | -8.819 |
ovie | -8.372 |
oir | -7.863 |
resp | -7.699 |
sburgh | -7.454 |
Token | few |
Token ID | 1178 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
ullivan | +5.455 |
asma | +5.417 |
Hera | +5.283 |
eda | +5.277 |
enhagen | +5.260 |
Neg logit contributions | |
MX | -6.131 |
ovie | -5.917 |
oir | -5.550 |
resp | -5.382 |
butt | -5.290 |
Token | different |
Token ID | 1180 |
Feature activation | +4.39e-01 |
Pos logit contributions | |
enhagen | +3.577 |
ullivan | +3.577 |
asma | +3.571 |
eda | +3.508 |
Hera | +3.481 |
Neg logit contributions | |
MX | -3.958 |
ovie | -3.775 |
oir | -3.573 |
resp | -3.402 |
butt | -3.360 |
Token | content |
Token ID | 2695 |
Feature activation | +3.11e-01 |
Pos logit contributions | |
ullivan | +4.345 |
asma | +4.294 |
enhagen | +4.292 |
eda | +4.291 |
Hera | +4.244 |
Neg logit contributions | |
MX | -5.321 |
ovie | -5.006 |
oir | -4.780 |
resp | -4.568 |
butt | -4.523 |
Token | spots |
Token ID | 10222 |
Feature activation | +5.94e-02 |
Pos logit contributions | |
ullivan | +3.263 |
enhagen | +3.186 |
asma | +3.182 |
Hera | +3.139 |
eda | +3.108 |
Neg logit contributions | |
MX | -3.731 |
ovie | -3.513 |
oir | -3.386 |
resp | -3.186 |
butt | -3.181 |
Token | country |
Token ID | 1499 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
ullivan | +2.574 |
enhagen | +2.537 |
asma | +2.511 |
Hera | +2.477 |
eda | +2.462 |
Neg logit contributions | |
MX | -3.450 |
ovie | -3.304 |
oir | -3.104 |
butt | -2.968 |
resp | -2.960 |
Token | . |
Token ID | 13 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
ullivan | +1.391 |
enhagen | +1.378 |
asma | +1.353 |
eda | +1.330 |
Hera | +1.327 |
Neg logit contributions | |
MX | -1.273 |
ovie | -1.181 |
oir | -1.122 |
resp | -1.054 |
butt | -1.045 |
Token |
|
Token ID | 198 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
ullivan | +4.047 |
asma | +3.975 |
enhagen | +3.960 |
Hera | +3.941 |
eda | +3.877 |
Neg logit contributions | |
MX | -4.415 |
ovie | -4.172 |
oir | -3.901 |
resp | -3.742 |
butt | -3.707 |
Token |
|
Token ID | 198 |
Feature activation | +2.59e-01 |
Pos logit contributions | |
MX | +1.397 |
ovie | +1.283 |
oir | +1.227 |
resp | +1.150 |
butt | +1.147 |
Neg logit contributions | |
ullivan | -1.679 |
enhagen | -1.678 |
asma | -1.619 |
Hera | -1.584 |
eda | -1.581 |
Token | Read |
Token ID | 5569 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
ullivan | +2.948 |
asma | +2.870 |
enhagen | +2.855 |
eda | +2.843 |
lication | +2.795 |
Neg logit contributions | |
MX | -2.858 |
ovie | -2.727 |
oir | -2.568 |
sburgh | -2.415 |
resp | -2.395 |
Token | full |
Token ID | 1336 |
Feature activation | +7.52e-01 |
Pos logit contributions | |
ullivan | +1.745 |
enhagen | +1.726 |
asma | +1.678 |
Hera | +1.669 |
eda | +1.666 |
Neg logit contributions | |
MX | -1.902 |
ovie | -1.803 |
oir | -1.701 |
resp | -1.612 |
butt | -1.610 |
Token | story |
Token ID | 1621 |
Feature activation | +1.14e-01 |
Pos logit contributions | |
ullivan | +7.590 |
enhagen | +7.431 |
Hera | +7.295 |
eda | +7.198 |
lication | +7.032 |
Neg logit contributions | |
MX | -8.628 |
ovie | -8.215 |
oir | -7.823 |
resp | -7.733 |
sburgh | -7.269 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +9.59e-03 |
Pos logit contributions | |
ullivan | +1.386 |
enhagen | +1.364 |
asma | +1.343 |
Hera | +1.329 |
eda | +1.323 |
Neg logit contributions | |
MX | -1.219 |
ovie | -1.139 |
oir | -1.080 |
resp | -1.012 |
butt | -1.001 |
Token | Asia |
Token ID | 38555 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
ullivan | +0.111 |
enhagen | +0.109 |
asma | +0.107 |
Hera | +0.105 |
eda | +0.105 |
Neg logit contributions | |
MX | -0.109 |
ovie | -0.102 |
oir | -0.097 |
resp | -0.091 |
butt | -0.091 |
Token | Health |
Token ID | 3893 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
MX | +0.188 |
ovie | +0.176 |
oir | +0.168 |
resp | +0.157 |
butt | +0.157 |
Neg logit contributions | |
ullivan | -0.190 |
enhagen | -0.187 |
asma | -0.184 |
Hera | -0.180 |
eda | -0.180 |
Token | Correspond |
Token ID | 34428 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
MX | +1.682 |
ovie | +1.568 |
oir | +1.501 |
butt | +1.405 |
resp | +1.401 |
Neg logit contributions | |
ullivan | -1.754 |
enhagen | -1.714 |
asma | -1.677 |
Hera | -1.641 |
eda | -1.631 |
Token | relatives |
Token ID | 12772 |
Feature activation | -9.32e-02 |
Pos logit contributions | |
ullivan | +0.384 |
enhagen | +0.376 |
asma | +0.370 |
Hera | +0.362 |
eda | +0.361 |
Neg logit contributions | |
MX | -0.495 |
ovie | -0.467 |
oir | -0.447 |
resp | -0.424 |
butt | -0.422 |
Token | would |
Token ID | 561 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
MX | +1.021 |
ovie | +0.956 |
oir | +0.910 |
butt | +0.849 |
resp | +0.847 |
Neg logit contributions | |
ullivan | -1.108 |
enhagen | -1.095 |
asma | -1.075 |
Hera | -1.050 |
eda | -1.050 |
Token | make |
Token ID | 787 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
ullivan | +4.383 |
asma | +4.187 |
enhagen | +4.153 |
Hera | +4.135 |
eda | +4.104 |
Neg logit contributions | |
MX | -5.714 |
ovie | -5.272 |
oir | -4.929 |
resp | -4.861 |
butt | -4.718 |
Token | were |
Token ID | 547 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
MX | +1.667 |
ovie | +1.562 |
oir | +1.491 |
butt | +1.397 |
resp | +1.389 |
Neg logit contributions | |
ullivan | -1.870 |
enhagen | -1.843 |
asma | -1.811 |
eda | -1.769 |
Hera | -1.765 |
Token | generally |
Token ID | 4143 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
MX | +1.976 |
ovie | +1.844 |
oir | +1.754 |
butt | +1.638 |
resp | +1.626 |
Neg logit contributions | |
ullivan | -2.194 |
enhagen | -2.164 |
asma | -2.127 |
Hera | -2.074 |
eda | -2.073 |
Token | by |
Token ID | 416 |
Feature activation | +3.43e-01 |
Pos logit contributions | |
MX | +2.600 |
ovie | +2.420 |
oir | +2.307 |
butt | +2.170 |
resp | +2.152 |
Neg logit contributions | |
ullivan | -2.762 |
enhagen | -2.754 |
asma | -2.683 |
eda | -2.627 |
Hera | -2.603 |
Token | the |
Token ID | 262 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
ullivan | +3.972 |
enhagen | +3.827 |
Hera | +3.802 |
asma | +3.759 |
eda | +3.726 |
Neg logit contributions | |
MX | -3.819 |
ovie | -3.521 |
oir | -3.358 |
resp | -3.182 |
butt | -3.162 |
Token | book |
Token ID | 1492 |
Feature activation | +2.62e-01 |
Pos logit contributions | |
ullivan | +2.558 |
enhagen | +2.488 |
asma | +2.476 |
Hera | +2.454 |
eda | +2.429 |
Neg logit contributions | |
MX | -2.585 |
ovie | -2.441 |
oir | -2.307 |
resp | -2.184 |
butt | -2.161 |
Token | C |
Token ID | 327 |
Feature activation | -3.66e-01 |
Pos logit contributions | |
ullivan | +3.026 |
enhagen | +2.936 |
asma | +2.908 |
eda | +2.871 |
Hera | +2.863 |
Neg logit contributions | |
MX | -2.921 |
ovie | -2.730 |
oir | -2.570 |
resp | -2.449 |
butt | -2.400 |
Token | aj |
Token ID | 1228 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
MX | +3.560 |
ovie | +3.344 |
oir | +3.136 |
resp | +2.957 |
butt | +2.813 |
Neg logit contributions | |
enhagen | -4.746 |
ullivan | -4.719 |
asma | -4.604 |
Hera | -4.589 |
lication | -4.476 |
Token | un |
Token ID | 403 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
MX | +3.568 |
ovie | +3.408 |
oir | +3.203 |
resp | +2.893 |
butt | +2.889 |
Neg logit contributions | |
enhagen | -5.303 |
ullivan | -5.285 |
Hera | -5.203 |
asma | -5.126 |
eda | -5.019 |
Token | a |
Token ID | 257 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
ullivan | +2.248 |
enhagen | +2.209 |
Hera | +2.166 |
asma | +2.153 |
eda | +2.136 |
Neg logit contributions | |
MX | -2.278 |
ovie | -2.127 |
oir | -2.039 |
resp | -1.910 |
butt | -1.910 |
Token | long |
Token ID | 890 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
ullivan | +4.171 |
enhagen | +4.064 |
Hera | +4.026 |
asma | +3.956 |
eda | +3.950 |
Neg logit contributions | |
MX | -4.368 |
ovie | -4.100 |
oir | -3.913 |
butt | -3.756 |
resp | -3.653 |
Token | weekend |
Token ID | 5041 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
ullivan | +1.806 |
enhagen | +1.787 |
asma | +1.733 |
Hera | +1.718 |
eda | +1.718 |
Neg logit contributions | |
MX | -1.811 |
ovie | -1.682 |
oir | -1.594 |
resp | -1.503 |
butt | -1.502 |
Token | . |
Token ID | 13 |
Feature activation | +3.63e-02 |
Pos logit contributions | |
ullivan | +1.366 |
enhagen | +1.350 |
asma | +1.321 |
Hera | +1.306 |
eda | +1.304 |
Neg logit contributions | |
MX | -1.292 |
ovie | -1.201 |
oir | -1.142 |
resp | -1.072 |
butt | -1.070 |
Token |
|
Token ID | 198 |
Feature activation | +8.50e-02 |
Pos logit contributions | |
ullivan | +0.418 |
enhagen | +0.411 |
asma | +0.405 |
Hera | +0.399 |
eda | +0.397 |
Neg logit contributions | |
MX | -0.413 |
ovie | -0.387 |
oir | -0.368 |
resp | -0.346 |
butt | -0.345 |
Token |
|
Token ID | 198 |
Feature activation | +2.41e-02 |
Pos logit contributions | |
ullivan | +0.974 |
asma | +0.949 |
enhagen | +0.948 |
Hera | +0.933 |
eda | +0.932 |
Neg logit contributions | |
MX | -0.963 |
ovie | -0.907 |
oir | -0.860 |
resp | -0.804 |
butt | -0.801 |
Token | The |
Token ID | 464 |
Feature activation | -1.93e-01 |
Pos logit contributions | |
ullivan | +0.269 |
enhagen | +0.264 |
asma | +0.261 |
eda | +0.255 |
Hera | +0.255 |
Neg logit contributions | |
MX | -0.281 |
ovie | -0.264 |
oir | -0.252 |
resp | -0.236 |
butt | -0.236 |
Token | trip |
Token ID | 5296 |
Feature activation | -1.42e-01 |
Pos logit contributions | |
MX | +2.227 |
ovie | +2.085 |
oir | +2.002 |
resp | +1.866 |
butt | +1.856 |
Neg logit contributions | |
ullivan | -2.178 |
enhagen | -2.126 |
asma | -2.110 |
eda | -2.050 |
lication | -2.037 |
Token | not |
Token ID | 407 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
MX | +1.594 |
ovie | +1.500 |
oir | +1.418 |
butt | +1.332 |
resp | +1.324 |
Neg logit contributions | |
ullivan | -1.672 |
enhagen | -1.628 |
asma | -1.610 |
Hera | -1.573 |
eda | -1.567 |
Token | only |
Token ID | 691 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
MX | +1.502 |
ovie | +1.403 |
oir | +1.317 |
resp | +1.225 |
butt | +1.208 |
Neg logit contributions | |
ullivan | -1.979 |
enhagen | -1.931 |
asma | -1.915 |
Hera | -1.879 |
eda | -1.864 |
Token | includes |
Token ID | 3407 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
enhagen | +2.547 |
ullivan | +2.537 |
asma | +2.497 |
Hera | +2.462 |
eda | +2.462 |
Neg logit contributions | |
MX | -2.793 |
ovie | -2.612 |
oir | -2.489 |
resp | -2.349 |
butt | -2.326 |
Token | d |
Token ID | 288 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
MX | +1.243 |
ovie | +1.162 |
oir | +1.113 |
resp | +1.042 |
butt | +1.038 |
Neg logit contributions | |
ullivan | -1.243 |
enhagen | -1.225 |
asma | -1.200 |
Hera | -1.176 |
eda | -1.174 |
Token | row |
Token ID | 808 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
ullivan | +2.460 |
asma | +2.393 |
enhagen | +2.392 |
eda | +2.362 |
lication | +2.309 |
Neg logit contributions | |
MX | -2.239 |
ovie | -2.060 |
oir | -1.934 |
butt | -1.827 |
resp | -1.822 |
Token | sy |
Token ID | 1837 |
Feature activation | +2.14e-01 |
Pos logit contributions | |
ullivan | +0.370 |
enhagen | +0.365 |
asma | +0.361 |
Hera | +0.355 |
eda | +0.355 |
Neg logit contributions | |
MX | -0.202 |
ovie | -0.184 |
oir | -0.171 |
resp | -0.155 |
butt | -0.154 |
Token | and |
Token ID | 290 |
Feature activation | +8.18e-02 |
Pos logit contributions | |
ullivan | +2.455 |
enhagen | +2.425 |
asma | +2.375 |
eda | +2.333 |
Hera | +2.313 |
Neg logit contributions | |
MX | -2.429 |
ovie | -2.271 |
oir | -2.143 |
resp | -2.030 |
sburgh | -2.014 |
Token | the |
Token ID | 262 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
ullivan | +0.929 |
enhagen | +0.911 |
asma | +0.898 |
Hera | +0.884 |
eda | +0.881 |
Neg logit contributions | |
MX | -0.944 |
ovie | -0.885 |
oir | -0.840 |
resp | -0.791 |
butt | -0.788 |
Token | moments |
Token ID | 7188 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
MX | +2.290 |
ovie | +2.140 |
oir | +2.060 |
resp | +1.913 |
butt | +1.901 |
Neg logit contributions | |
ullivan | -2.424 |
enhagen | -2.402 |
asma | -2.352 |
eda | -2.302 |
Hera | -2.289 |
Token | of |
Token ID | 286 |
Feature activation | +3.69e-01 |
Pos logit contributions | |
ullivan | +1.295 |
enhagen | +1.270 |
asma | +1.254 |
Hera | +1.229 |
eda | +1.229 |
Neg logit contributions | |
MX | -1.361 |
ovie | -1.271 |
oir | -1.208 |
resp | -1.140 |
butt | -1.138 |
Token | heightened |
Token ID | 25556 |
Feature activation | +6.25e-01 |
Pos logit contributions | |
ullivan | +4.013 |
asma | +3.924 |
Hera | +3.920 |
enhagen | +3.918 |
eda | +3.815 |
Neg logit contributions | |
MX | -4.310 |
ovie | -4.029 |
oir | -3.777 |
butt | -3.598 |
resp | -3.565 |
Token | attention |
Token ID | 3241 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
Hera | +6.355 |
asma | +6.308 |
ullivan | +6.292 |
enhagen | +6.160 |
eda | +6.070 |
Neg logit contributions | |
MX | -7.267 |
ovie | -6.832 |
oir | -6.270 |
butt | -6.039 |
sburgh | -5.996 |
Token | like |
Token ID | 588 |
Feature activation | +3.04e-01 |
Pos logit contributions | |
MX | +0.132 |
ovie | +0.123 |
oir | +0.118 |
resp | +0.111 |
butt | +0.110 |
Neg logit contributions | |
ullivan | -0.129 |
enhagen | -0.126 |
asma | -0.124 |
Hera | -0.122 |
eda | -0.122 |
Token | o |
Token ID | 267 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
ullivan | +3.428 |
asma | +3.349 |
enhagen | +3.329 |
Hera | +3.310 |
eda | +3.268 |
Neg logit contributions | |
MX | -3.482 |
ovie | -3.239 |
oir | -3.063 |
resp | -2.905 |
butt | -2.870 |
Token | or |
Token ID | 393 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
ullivan | +3.707 |
enhagen | +3.670 |
Hera | +3.611 |
asma | +3.590 |
eda | +3.542 |
Neg logit contributions | |
MX | -3.799 |
ovie | -3.574 |
oir | -3.367 |
butt | -3.173 |
resp | -3.170 |
Token | Rh |
Token ID | 10323 |
Feature activation | +8.98e-03 |
Pos logit contributions | |
ullivan | +3.504 |
enhagen | +3.463 |
Hera | +3.418 |
asma | +3.402 |
eda | +3.360 |
Neg logit contributions | |
MX | -3.316 |
ovie | -3.089 |
oir | -2.895 |
resp | -2.748 |
butt | -2.744 |
Token | ulic |
Token ID | 28575 |
Feature activation | +5.26e-01 |
Pos logit contributions | |
ullivan | +0.111 |
enhagen | +0.109 |
asma | +0.108 |
eda | +0.106 |
Hera | +0.105 |
Neg logit contributions | |
MX | -0.095 |
ovie | -0.088 |
oir | -0.084 |
resp | -0.078 |
butt | -0.078 |
Token | soldiers |
Token ID | 5795 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
ullivan | +5.908 |
Hera | +5.807 |
asma | +5.787 |
enhagen | +5.765 |
eda | +5.723 |
Neg logit contributions | |
MX | -5.765 |
ovie | -5.270 |
oir | -4.909 |
butt | -4.719 |
resp | -4.652 |
Token | , |
Token ID | 11 |
Feature activation | +2.64e-01 |
Pos logit contributions | |
ullivan | +1.728 |
enhagen | +1.707 |
asma | +1.681 |
Hera | +1.661 |
eda | +1.655 |
Neg logit contributions | |
MX | -1.745 |
ovie | -1.628 |
oir | -1.547 |
resp | -1.463 |
butt | -1.453 |
Token | and |
Token ID | 290 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
ullivan | +2.972 |
enhagen | +2.916 |
Hera | +2.877 |
asma | +2.864 |
eda | +2.827 |
Neg logit contributions | |
MX | -3.010 |
ovie | -2.822 |
oir | -2.680 |
resp | -2.519 |
butt | -2.509 |
Token | certainly |
Token ID | 3729 |
Feature activation | +4.63e-01 |
Pos logit contributions | |
ullivan | +1.234 |
enhagen | +1.216 |
asma | +1.198 |
Hera | +1.185 |
eda | +1.180 |
Neg logit contributions | |
MX | -1.193 |
ovie | -1.116 |
oir | -1.057 |
resp | -0.994 |
butt | -0.993 |
Token | not |
Token ID | 407 |
Feature activation | +5.07e-02 |
Pos logit contributions | |
enhagen | +4.431 |
ullivan | +4.418 |
Hera | +4.380 |
eda | +4.357 |
asma | +4.321 |
Neg logit contributions | |
MX | -5.750 |
ovie | -5.411 |
oir | -5.126 |
resp | -4.939 |
butt | -4.885 |
Token | all |
Token ID | 477 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
ullivan | +0.583 |
enhagen | +0.574 |
asma | +0.565 |
Hera | +0.558 |
eda | +0.555 |
Neg logit contributions | |
MX | -0.577 |
ovie | -0.540 |
oir | -0.513 |
resp | -0.483 |
butt | -0.481 |
Token | of |
Token ID | 286 |
Feature activation | -7.07e-03 |
Pos logit contributions | |
ullivan | +1.762 |
enhagen | +1.746 |
asma | +1.709 |
Hera | +1.693 |
eda | +1.684 |
Neg logit contributions | |
MX | -1.765 |
ovie | -1.656 |
oir | -1.567 |
butt | -1.473 |
resp | -1.472 |
Token | them |
Token ID | 606 |
Feature activation | +7.13e-02 |
Pos logit contributions | |
MX | +0.084 |
ovie | +0.078 |
oir | +0.075 |
resp | +0.070 |
butt | +0.070 |
Neg logit contributions | |
ullivan | -0.078 |
enhagen | -0.077 |
asma | -0.076 |
Hera | -0.074 |
eda | -0.074 |
Token | anyway |
Token ID | 6949 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
ullivan | +4.243 |
enhagen | +4.141 |
Hera | +4.107 |
asma | +4.075 |
eda | +4.028 |
Neg logit contributions | |
MX | -4.669 |
ovie | -4.292 |
oir | -4.082 |
sburgh | -3.887 |
resp | -3.873 |
Token | . |
Token ID | 13 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
ullivan | +3.076 |
enhagen | +3.007 |
asma | +2.968 |
Hera | +2.934 |
eda | +2.926 |
Neg logit contributions | |
MX | -3.108 |
ovie | -2.840 |
oir | -2.715 |
resp | -2.574 |
sburgh | -2.555 |
Token | We |
Token ID | 775 |
Feature activation | -2.81e-02 |
Pos logit contributions | |
Hera | +3.901 |
ullivan | +3.869 |
asma | +3.801 |
eda | +3.762 |
enhagen | +3.703 |
Neg logit contributions | |
MX | -4.471 |
ovie | -4.185 |
oir | -3.968 |
butt | -3.743 |
resp | -3.743 |
Token | usually |
Token ID | 3221 |
Feature activation | +2.55e-01 |
Pos logit contributions | |
MX | +0.316 |
ovie | +0.296 |
oir | +0.282 |
resp | +0.265 |
butt | +0.263 |
Neg logit contributions | |
ullivan | -0.327 |
enhagen | -0.321 |
asma | -0.316 |
Hera | -0.310 |
eda | -0.309 |
Token | handle |
Token ID | 5412 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
ullivan | +2.851 |
enhagen | +2.808 |
asma | +2.796 |
Hera | +2.770 |
eda | +2.745 |
Neg logit contributions | |
MX | -2.950 |
ovie | -2.737 |
oir | -2.567 |
resp | -2.425 |
butt | -2.414 |
Token | textbooks |
Token ID | 31814 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
ullivan | +1.721 |
enhagen | +1.691 |
asma | +1.666 |
Hera | +1.653 |
eda | +1.637 |
Neg logit contributions | |
MX | -1.817 |
ovie | -1.704 |
oir | -1.615 |
resp | -1.515 |
butt | -1.513 |
Token | and |
Token ID | 290 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
MX | +0.138 |
ovie | +0.129 |
oir | +0.123 |
resp | +0.115 |
butt | +0.115 |
Neg logit contributions | |
ullivan | -0.149 |
enhagen | -0.147 |
asma | -0.145 |
Hera | -0.142 |
eda | -0.142 |
Token | other |
Token ID | 584 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
MX | +2.715 |
ovie | +2.517 |
oir | +2.449 |
butt | +2.261 |
resp | +2.246 |
Neg logit contributions | |
ullivan | -2.971 |
enhagen | -2.938 |
asma | -2.857 |
lication | -2.786 |
eda | -2.781 |
Token | light |
Token ID | 1657 |
Feature activation | +7.46e-02 |
Pos logit contributions | |
MX | +3.320 |
ovie | +3.044 |
oir | +2.984 |
resp | +2.775 |
butt | +2.769 |
Neg logit contributions | |
enhagen | -3.730 |
ullivan | -3.720 |
asma | -3.614 |
lication | -3.506 |
eda | -3.480 |
Token | modern |
Token ID | 3660 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
ullivan | +0.881 |
enhagen | +0.866 |
asma | +0.853 |
eda | +0.840 |
Hera | +0.837 |
Neg logit contributions | |
MX | -0.830 |
ovie | -0.774 |
oir | -0.734 |
resp | -0.688 |
butt | -0.684 |
Token | reference |
Token ID | 4941 |
Feature activation | -5.03e-01 |
Pos logit contributions | |
MX | +4.432 |
oir | +4.082 |
ovie | +4.067 |
resp | +3.690 |
iary | +3.649 |
Neg logit contributions | |
ullivan | -5.235 |
enhagen | -5.197 |
asma | -5.026 |
lication | -4.896 |
Hera | -4.886 |
Token | treated |
Token ID | 5716 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
MX | +2.122 |
ovie | +2.002 |
oir | +1.913 |
resp | +1.808 |
butt | +1.798 |
Neg logit contributions | |
ullivan | -2.049 |
enhagen | -2.009 |
asma | -1.959 |
eda | -1.907 |
Hera | -1.900 |
Token | as |
Token ID | 355 |
Feature activation | -3.05e-01 |
Pos logit contributions | |
ullivan | +1.276 |
enhagen | +1.252 |
asma | +1.240 |
Hera | +1.223 |
eda | +1.218 |
Neg logit contributions | |
MX | -1.290 |
ovie | -1.200 |
oir | -1.146 |
butt | -1.071 |
resp | -1.066 |
Token | Israeli |
Token ID | 6085 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
MX | +3.091 |
ovie | +2.897 |
oir | +2.734 |
resp | +2.620 |
butt | +2.544 |
Neg logit contributions | |
ullivan | -3.841 |
enhagen | -3.769 |
asma | -3.670 |
eda | -3.602 |
lication | -3.593 |
Token | spies |
Token ID | 28801 |
Feature activation | -4.66e-01 |
Pos logit contributions | |
MX | +1.743 |
ovie | +1.621 |
oir | +1.546 |
resp | +1.470 |
butt | +1.440 |
Neg logit contributions | |
ullivan | -1.802 |
enhagen | -1.767 |
asma | -1.730 |
eda | -1.695 |
Hera | -1.687 |
Token | . |
Token ID | 13 |
Feature activation | -2.91e-01 |
Pos logit contributions | |
MX | +4.312 |
ovie | +4.181 |
oir | +3.902 |
resp | +3.623 |
butt | +3.595 |
Neg logit contributions | |
ullivan | -6.145 |
enhagen | -5.944 |
asma | -5.903 |
Hera | -5.744 |
eda | -5.723 |
Token |
|
Token ID | 198 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
MX | +2.941 |
ovie | +2.746 |
oir | +2.602 |
resp | +2.414 |
butt | +2.381 |
Neg logit contributions | |
ullivan | -3.703 |
enhagen | -3.658 |
asma | -3.532 |
eda | -3.472 |
lication | -3.434 |
Token |
|
Token ID | 198 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
MX | +3.214 |
ovie | +2.877 |
oir | +2.765 |
resp | +2.590 |
butt | +2.587 |
Neg logit contributions | |
enhagen | -4.721 |
ullivan | -4.629 |
asma | -4.415 |
lication | -4.338 |
eda | -4.295 |
Token | But |
Token ID | 1537 |
Feature activation | -3.28e-01 |
Pos logit contributions | |
MX | +3.543 |
ovie | +3.213 |
oir | +3.053 |
resp | +2.913 |
butt | +2.882 |
Neg logit contributions | |
enhagen | -3.821 |
ullivan | -3.808 |
asma | -3.632 |
Hera | -3.592 |
eda | -3.520 |
Token | the |
Token ID | 262 |
Feature activation | -2.03e-01 |
Pos logit contributions | |
MX | +3.401 |
ovie | +3.214 |
oir | +3.035 |
resp | +2.834 |
butt | +2.822 |
Neg logit contributions | |
ullivan | -3.999 |
enhagen | -3.947 |
asma | -3.850 |
lication | -3.738 |
Hera | -3.737 |
Token | government |
Token ID | 1230 |
Feature activation | +2.56e-01 |
Pos logit contributions | |
MX | +2.263 |
ovie | +2.132 |
oir | +2.021 |
resp | +1.908 |
butt | +1.867 |
Neg logit contributions | |
ullivan | -2.387 |
enhagen | -2.334 |
asma | -2.289 |
Hera | -2.237 |
eda | -2.232 |
Token | appears |
Token ID | 3568 |
Feature activation | +2.85e-02 |
Pos logit contributions | |
ullivan | +2.798 |
enhagen | +2.778 |
asma | +2.731 |
Hera | +2.691 |
eda | +2.689 |
Neg logit contributions | |
MX | -2.998 |
ovie | -2.800 |
oir | -2.667 |
resp | -2.505 |
butt | -2.499 |
Token | to |
Token ID | 284 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
ullivan | +0.652 |
enhagen | +0.643 |
asma | +0.633 |
Hera | +0.620 |
eda | +0.618 |
Neg logit contributions | |
MX | -0.673 |
ovie | -0.630 |
oir | -0.601 |
resp | -0.565 |
butt | -0.562 |
Token | make |
Token ID | 787 |
Feature activation | -3.65e-04 |
Pos logit contributions | |
ullivan | +3.367 |
asma | +3.244 |
enhagen | +3.234 |
Hera | +3.234 |
eda | +3.179 |
Neg logit contributions | |
MX | -4.066 |
ovie | -3.874 |
oir | -3.651 |
resp | -3.420 |
butt | -3.411 |
Token | the |
Token ID | 262 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
MX | +0.004 |
ovie | +0.004 |
oir | +0.004 |
resp | +0.003 |
butt | +0.003 |
Neg logit contributions | |
ullivan | -0.004 |
enhagen | -0.004 |
asma | -0.004 |
Hera | -0.004 |
eda | -0.004 |
Token | chair |
Token ID | 5118 |
Feature activation | +4.52e-01 |
Pos logit contributions | |
ullivan | +2.570 |
enhagen | +2.489 |
asma | +2.475 |
Hera | +2.466 |
eda | +2.412 |
Neg logit contributions | |
MX | -2.840 |
ovie | -2.685 |
oir | -2.575 |
butt | -2.384 |
resp | -2.373 |
Token | move |
Token ID | 1445 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
ullivan | +4.883 |
Hera | +4.660 |
enhagen | +4.635 |
asma | +4.626 |
eda | +4.583 |
Neg logit contributions | |
MX | -5.274 |
ovie | -4.986 |
oir | -4.744 |
resp | -4.337 |
sburgh | -4.289 |
Token | in |
Token ID | 287 |
Feature activation | -8.73e-02 |
Pos logit contributions | |
ullivan | +1.193 |
enhagen | +1.173 |
asma | +1.153 |
Hera | +1.136 |
eda | +1.134 |
Neg logit contributions | |
MX | -1.146 |
ovie | -1.073 |
oir | -1.017 |
resp | -0.952 |
butt | -0.946 |
Token | a |
Token ID | 257 |
Feature activation | +6.10e-02 |
Pos logit contributions | |
MX | +0.940 |
ovie | +0.871 |
oir | +0.828 |
resp | +0.777 |
butt | +0.772 |
Neg logit contributions | |
ullivan | -1.063 |
enhagen | -1.048 |
asma | -1.029 |
eda | -1.010 |
Hera | -1.007 |
Token | forward |
Token ID | 2651 |
Feature activation | +5.51e-01 |
Pos logit contributions | |
ullivan | +0.693 |
enhagen | +0.678 |
asma | +0.670 |
Hera | +0.660 |
eda | +0.655 |
Neg logit contributions | |
MX | -0.704 |
ovie | -0.662 |
oir | -0.630 |
resp | -0.590 |
butt | -0.589 |
Token | direction |
Token ID | 4571 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
ullivan | +5.213 |
Hera | +5.054 |
asma | +5.039 |
enhagen | +4.961 |
eda | +4.953 |
Neg logit contributions | |
MX | -6.869 |
ovie | -6.559 |
oir | -6.281 |
sburgh | -5.883 |
butt | -5.850 |
Token | to |
Token ID | 284 |
Feature activation | -3.94e-02 |
Pos logit contributions | |
MX | +2.171 |
ovie | +2.023 |
oir | +1.916 |
resp | +1.792 |
butt | +1.786 |
Neg logit contributions | |
ullivan | -2.617 |
enhagen | -2.574 |
asma | -2.543 |
eda | -2.483 |
Hera | -2.481 |
Token | reach |
Token ID | 3151 |
Feature activation | -3.24e-01 |
Pos logit contributions | |
MX | +0.453 |
ovie | +0.423 |
oir | +0.404 |
resp | +0.380 |
butt | +0.378 |
Neg logit contributions | |
ullivan | -0.452 |
enhagen | -0.444 |
asma | -0.437 |
eda | -0.427 |
Hera | -0.427 |
Token |
|
Token ID | 198 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
ullivan | +1.088 |
asma | +1.061 |
enhagen | +1.054 |
Hera | +1.041 |
eda | +1.039 |
Neg logit contributions | |
MX | -1.088 |
ovie | -1.023 |
oir | -0.970 |
resp | -0.907 |
butt | -0.903 |
Token | Sch |
Token ID | 14874 |
Feature activation | +5.47e-02 |
Pos logit contributions | |
ullivan | +3.110 |
asma | +2.997 |
eda | +2.932 |
enhagen | +2.921 |
Hera | +2.868 |
Neg logit contributions | |
MX | -3.263 |
ovie | -3.110 |
oir | -2.945 |
sburgh | -2.726 |
resp | -2.718 |
Token | w |
Token ID | 86 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
ullivan | +0.652 |
enhagen | +0.640 |
asma | +0.633 |
eda | +0.619 |
Hera | +0.616 |
Neg logit contributions | |
MX | -0.602 |
ovie | -0.559 |
oir | -0.531 |
resp | -0.499 |
butt | -0.496 |
Token | artz |
Token ID | 13636 |
Feature activation | +3.93e-01 |
Pos logit contributions | |
enhagen | +3.617 |
ullivan | +3.592 |
eda | +3.544 |
asma | +3.540 |
Hera | +3.356 |
Neg logit contributions | |
MX | -3.710 |
ovie | -3.415 |
oir | -3.214 |
butt | -3.078 |
resp | -3.052 |
Token | , |
Token ID | 11 |
Feature activation | -5.88e-02 |
Pos logit contributions | |
ullivan | +4.344 |
enhagen | +4.337 |
asma | +4.198 |
eda | +4.183 |
Hera | +4.079 |
Neg logit contributions | |
MX | -4.493 |
ovie | -4.201 |
oir | -4.003 |
resp | -3.803 |
butt | -3.683 |
Token | D |
Token ID | 360 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
MX | +0.692 |
ovie | +0.645 |
oir | +0.617 |
resp | +0.580 |
butt | +0.579 |
Neg logit contributions | |
ullivan | -0.658 |
enhagen | -0.650 |
asma | -0.635 |
eda | -0.620 |
Hera | -0.617 |
Token | ., |
Token ID | 1539 |
Feature activation | +6.28e-03 |
Pos logit contributions | |
MX | +1.951 |
ovie | +1.820 |
oir | +1.713 |
resp | +1.576 |
butt | +1.559 |
Neg logit contributions | |
ullivan | -2.810 |
enhagen | -2.790 |
asma | -2.739 |
Hera | -2.735 |
eda | -2.679 |
Token | Dodge |
Token ID | 26048 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
ullivan | +0.071 |
enhagen | +0.070 |
asma | +0.069 |
Hera | +0.067 |
eda | +0.067 |
Neg logit contributions | |
MX | -0.073 |
ovie | -0.068 |
oir | -0.065 |
resp | -0.061 |
butt | -0.061 |
Token | , |
Token ID | 11 |
Feature activation | -4.56e-02 |
Pos logit contributions | |
ullivan | +2.690 |
enhagen | +2.656 |
asma | +2.600 |
eda | +2.558 |
Hera | +2.537 |
Neg logit contributions | |
MX | -2.616 |
ovie | -2.437 |
oir | -2.299 |
resp | -2.177 |
butt | -2.134 |
Token | K |
Token ID | 509 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
MX | +0.538 |
ovie | +0.502 |
oir | +0.480 |
resp | +0.451 |
butt | +0.450 |
Neg logit contributions | |
ullivan | -0.510 |
enhagen | -0.503 |
asma | -0.492 |
eda | -0.481 |
Hera | -0.479 |
Token | . |
Token ID | 13 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
MX | +1.666 |
ovie | +1.536 |
oir | +1.458 |
resp | +1.333 |
butt | +1.319 |
Neg logit contributions | |
ullivan | -2.511 |
enhagen | -2.488 |
asma | -2.450 |
Hera | -2.434 |
eda | -2.405 |
Token | unk |
Token ID | 2954 |
Feature activation | -5.57e-01 |
Pos logit contributions | |
MX | +5.742 |
ovie | +5.616 |
oir | +5.403 |
resp | +4.822 |
butt | +4.657 |
Neg logit contributions | |
Hera | -8.781 |
ullivan | -8.733 |
enhagen | -8.570 |
asma | -8.307 |
rocal | -8.202 |
Token | lost |
Token ID | 2626 |
Feature activation | -8.07e-02 |
Pos logit contributions | |
MX | +5.779 |
ovie | +5.417 |
oir | +5.228 |
sburgh | +4.850 |
butt | +4.845 |
Neg logit contributions | |
ullivan | -6.663 |
enhagen | -6.330 |
asma | -6.217 |
Hera | -6.189 |
rocal | -6.154 |
Token | the |
Token ID | 262 |
Feature activation | -2.05e-02 |
Pos logit contributions | |
MX | +0.846 |
ovie | +0.786 |
oir | +0.750 |
resp | +0.695 |
butt | +0.694 |
Neg logit contributions | |
ullivan | -1.004 |
enhagen | -0.987 |
asma | -0.971 |
Hera | -0.953 |
eda | -0.953 |
Token | public |
Token ID | 1171 |
Feature activation | -8.98e-02 |
Pos logit contributions | |
MX | +0.238 |
ovie | +0.223 |
oir | +0.213 |
resp | +0.200 |
butt | +0.199 |
Neg logit contributions | |
ullivan | -0.231 |
enhagen | -0.227 |
asma | -0.224 |
Hera | -0.219 |
eda | -0.219 |
Token | view |
Token ID | 1570 |
Feature activation | -3.15e-01 |
Pos logit contributions | |
MX | +0.950 |
ovie | +0.886 |
oir | +0.846 |
butt | +0.785 |
resp | +0.784 |
Neg logit contributions | |
ullivan | -1.106 |
enhagen | -1.087 |
asma | -1.066 |
eda | -1.049 |
Hera | -1.048 |
Token | through |
Token ID | 832 |
Feature activation | -3.75e-01 |
Pos logit contributions | |
MX | +3.255 |
ovie | +3.057 |
oir | +2.939 |
butt | +2.725 |
resp | +2.675 |
Neg logit contributions | |
ullivan | -3.906 |
enhagen | -3.805 |
asma | -3.777 |
Hera | -3.684 |
eda | -3.680 |
Token | the |
Token ID | 262 |
Feature activation | -6.80e-02 |
Pos logit contributions | |
MX | +3.850 |
ovie | +3.674 |
oir | +3.389 |
butt | +3.146 |
resp | +3.142 |
Neg logit contributions | |
ullivan | -4.661 |
enhagen | -4.538 |
asma | -4.474 |
eda | -4.410 |
Hera | -4.390 |
Token | late |
Token ID | 2739 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
MX | +0.789 |
ovie | +0.740 |
oir | +0.705 |
resp | +0.661 |
butt | +0.659 |
Neg logit contributions | |
ullivan | -0.771 |
enhagen | -0.757 |
asma | -0.744 |
Hera | -0.729 |
eda | -0.729 |
Token | 1970 |
Token ID | 8069 |
Feature activation | +9.18e-03 |
Pos logit contributions | |
MX | +2.266 |
ovie | +2.120 |
oir | +2.019 |
butt | +1.883 |
resp | +1.879 |
Neg logit contributions | |
ullivan | -2.415 |
enhagen | -2.364 |
asma | -2.321 |
eda | -2.269 |
Hera | -2.265 |
Token | s |
Token ID | 82 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
ullivan | +0.114 |
enhagen | +0.113 |
asma | +0.111 |
Hera | +0.109 |
eda | +0.109 |
Neg logit contributions | |
MX | -0.096 |
ovie | -0.089 |
oir | -0.085 |
resp | -0.079 |
butt | -0.079 |
Token | and |
Token ID | 290 |
Feature activation | -2.15e-01 |
Pos logit contributions | |
ullivan | +0.257 |
enhagen | +0.253 |
asma | +0.249 |
Hera | +0.244 |
eda | +0.244 |
Neg logit contributions | |
MX | -0.236 |
ovie | -0.220 |
oir | -0.210 |
resp | -0.196 |
butt | -0.195 |
Token | two |
Token ID | 734 |
Feature activation | -5.01e-01 |
Pos logit contributions | |
MX | +4.168 |
ovie | +3.869 |
oir | +3.621 |
resp | +3.422 |
butt | +3.385 |
Neg logit contributions | |
ullivan | -5.465 |
enhagen | -5.384 |
asma | -5.287 |
lication | -5.124 |
Hera | -5.011 |
Token | major |
Token ID | 1688 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
MX | +4.907 |
ovie | +4.486 |
oir | +4.338 |
resp | +4.053 |
butt | +3.975 |
Neg logit contributions | |
enhagen | -6.368 |
ullivan | -6.309 |
asma | -6.106 |
lication | -5.913 |
eda | -5.793 |
Token | laws |
Token ID | 3657 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
MX | +6.051 |
ovie | +5.543 |
oir | +5.394 |
resp | +5.112 |
pa | +4.972 |
Neg logit contributions | |
enhagen | -7.588 |
ullivan | -7.429 |
asma | -7.252 |
lication | -7.016 |
Hera | -6.829 |
Token | that |
Token ID | 326 |
Feature activation | -4.67e-02 |
Pos logit contributions | |
ullivan | +0.204 |
enhagen | +0.200 |
asma | +0.197 |
Hera | +0.194 |
eda | +0.193 |
Neg logit contributions | |
MX | -0.197 |
ovie | -0.184 |
oir | -0.175 |
resp | -0.164 |
butt | -0.164 |
Token | address |
Token ID | 2209 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
MX | +0.523 |
ovie | +0.489 |
oir | +0.465 |
resp | +0.437 |
butt | +0.435 |
Neg logit contributions | |
ullivan | -0.547 |
enhagen | -0.538 |
asma | -0.529 |
Hera | -0.519 |
eda | -0.517 |
Token | how |
Token ID | 703 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
MX | +1.788 |
ovie | +1.669 |
oir | +1.603 |
resp | +1.502 |
butt | +1.479 |
Neg logit contributions | |
ullivan | -1.970 |
enhagen | -1.931 |
asma | -1.893 |
Hera | -1.850 |
eda | -1.847 |
Token | guns |
Token ID | 6541 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
MX | +1.722 |
ovie | +1.604 |
oir | +1.540 |
resp | +1.441 |
butt | +1.421 |
Neg logit contributions | |
ullivan | -1.908 |
enhagen | -1.870 |
asma | -1.825 |
eda | -1.796 |
Hera | -1.790 |
Token | are |
Token ID | 389 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
MX | +3.327 |
ovie | +3.153 |
oir | +2.979 |
resp | +2.834 |
butt | +2.793 |
Neg logit contributions | |
ullivan | -3.729 |
enhagen | -3.638 |
asma | -3.555 |
Hera | -3.495 |
lication | -3.475 |
Token | carried |
Token ID | 5281 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
MX | +1.345 |
ovie | +1.256 |
oir | +1.203 |
resp | +1.127 |
butt | +1.118 |
Neg logit contributions | |
ullivan | -1.390 |
enhagen | -1.360 |
asma | -1.325 |
Hera | -1.306 |
eda | -1.305 |
Token | in |
Token ID | 287 |
Feature activation | -4.20e-01 |
Pos logit contributions | |
ullivan | +2.434 |
enhagen | +2.426 |
asma | +2.368 |
Hera | +2.349 |
eda | +2.343 |
Neg logit contributions | |
MX | -2.551 |
ovie | -2.406 |
oir | -2.255 |
butt | -2.109 |
resp | -2.107 |
Token | America |
Token ID | 2253 |
Feature activation | -2.76e-01 |
Pos logit contributions | |
MX | +4.824 |
ovie | +4.484 |
oir | +4.454 |
resp | +4.204 |
butt | +4.084 |
Neg logit contributions | |
ullivan | -4.604 |
enhagen | -4.482 |
asma | -4.354 |
eda | -4.276 |
lication | -4.228 |
Token | protect |
Token ID | 1805 |
Feature activation | -4.39e-02 |
Pos logit contributions | |
MX | +5.017 |
ovie | +4.565 |
oir | +4.434 |
butt | +4.224 |
resp | +4.139 |
Neg logit contributions | |
ullivan | -6.373 |
enhagen | -6.253 |
asma | -6.163 |
lication | -6.039 |
eda | -5.954 |
Token | Oklahoma |
Token ID | 10433 |
Feature activation | -1.77e-01 |
Pos logit contributions | |
MX | +0.490 |
ovie | +0.458 |
oir | +0.437 |
resp | +0.409 |
butt | +0.407 |
Neg logit contributions | |
ullivan | -0.516 |
enhagen | -0.508 |
asma | -0.500 |
Hera | -0.490 |
eda | -0.489 |
Token | residents |
Token ID | 5085 |
Feature activation | -9.75e-02 |
Pos logit contributions | |
MX | +1.896 |
ovie | +1.753 |
oir | +1.699 |
resp | +1.575 |
butt | +1.548 |
Neg logit contributions | |
ullivan | -2.155 |
enhagen | -2.118 |
asma | -2.092 |
Hera | -2.051 |
eda | -2.031 |
Token | impacted |
Token ID | 20755 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
MX | +1.080 |
ovie | +1.009 |
oir | +0.963 |
resp | +0.903 |
butt | +0.897 |
Neg logit contributions | |
ullivan | -1.154 |
enhagen | -1.136 |
asma | -1.117 |
Hera | -1.092 |
eda | -1.090 |
Token | by |
Token ID | 416 |
Feature activation | -6.66e-02 |
Pos logit contributions | |
MX | +1.635 |
ovie | +1.518 |
oir | +1.451 |
butt | +1.350 |
resp | +1.349 |
Neg logit contributions | |
ullivan | -1.822 |
enhagen | -1.795 |
asma | -1.775 |
Hera | -1.730 |
eda | -1.722 |
Token | sw |
Token ID | 1509 |
Feature activation | -7.66e-01 |
Pos logit contributions | |
MX | +0.715 |
ovie | +0.666 |
oir | +0.634 |
resp | +0.592 |
butt | +0.589 |
Neg logit contributions | |
ullivan | -0.811 |
enhagen | -0.797 |
asma | -0.786 |
Hera | -0.770 |
eda | -0.769 |
Token | arms |
Token ID | 8357 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
MX | +6.886 |
oir | +6.525 |
ovie | +6.500 |
resp | +5.647 |
ission | +5.596 |
Neg logit contributions | |
ullivan | -9.645 |
Hera | -9.590 |
enhagen | -9.587 |
asma | -9.143 |
cone | -9.112 |
Token | of |
Token ID | 286 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
ullivan | +1.394 |
enhagen | +1.377 |
asma | +1.356 |
Hera | +1.326 |
eda | +1.323 |
Neg logit contributions | |
MX | -1.460 |
ovie | -1.366 |
oir | -1.299 |
resp | -1.220 |
butt | -1.217 |
Token | fracking |
Token ID | 25441 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
ullivan | +1.299 |
enhagen | +1.272 |
asma | +1.258 |
Hera | +1.236 |
eda | +1.228 |
Neg logit contributions | |
MX | -1.330 |
ovie | -1.253 |
oir | -1.184 |
resp | -1.113 |
butt | -1.112 |
Token | - |
Token ID | 12 |
Feature activation | -5.28e-01 |
Pos logit contributions | |
MX | +2.030 |
ovie | +1.884 |
oir | +1.830 |
resp | +1.703 |
butt | +1.697 |
Neg logit contributions | |
ullivan | -2.079 |
enhagen | -2.060 |
asma | -1.999 |
eda | -1.961 |
Hera | -1.952 |
Token | induced |
Token ID | 17223 |
Feature activation | -4.04e-01 |
Pos logit contributions | |
MX | +4.314 |
ovie | +3.901 |
oir | +3.830 |
butt | +3.610 |
resp | +3.531 |
Neg logit contributions | |
ullivan | -7.522 |
enhagen | -7.480 |
asma | -7.292 |
Hera | -7.214 |
rocal | -7.014 |
Token |
|
Token ID | 198 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
MX | +0.363 |
ovie | +0.339 |
oir | +0.323 |
resp | +0.304 |
butt | +0.303 |
Neg logit contributions | |
ullivan | -0.360 |
enhagen | -0.355 |
asma | -0.348 |
Hera | -0.341 |
eda | -0.341 |
Token |
|
Token ID | 198 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
ullivan | +1.378 |
asma | +1.344 |
enhagen | +1.331 |
Hera | +1.324 |
eda | +1.321 |
Neg logit contributions | |
MX | -1.405 |
ovie | -1.327 |
oir | -1.261 |
resp | -1.179 |
butt | -1.170 |
Token | But |
Token ID | 1537 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
ullivan | +2.328 |
asma | +2.277 |
enhagen | +2.251 |
eda | +2.234 |
lication | +2.184 |
Neg logit contributions | |
MX | -2.447 |
ovie | -2.352 |
oir | -2.253 |
sburgh | -2.089 |
resp | -2.076 |
Token | at |
Token ID | 379 |
Feature activation | -1.86e-01 |
Pos logit contributions | |
MX | +1.310 |
ovie | +1.217 |
oir | +1.153 |
resp | +1.081 |
butt | +1.079 |
Neg logit contributions | |
ullivan | -1.479 |
enhagen | -1.457 |
asma | -1.434 |
Hera | -1.407 |
eda | -1.398 |
Token | the |
Token ID | 262 |
Feature activation | -6.44e-02 |
Pos logit contributions | |
MX | +1.979 |
ovie | +1.835 |
oir | +1.752 |
resp | +1.654 |
butt | +1.636 |
Neg logit contributions | |
ullivan | -2.258 |
enhagen | -2.210 |
asma | -2.194 |
Hera | -2.136 |
eda | -2.128 |
Token | Conservative |
Token ID | 11132 |
Feature activation | -8.57e-01 |
Pos logit contributions | |
MX | +0.747 |
ovie | +0.698 |
oir | +0.665 |
resp | +0.628 |
butt | +0.624 |
Neg logit contributions | |
ullivan | -0.730 |
enhagen | -0.717 |
asma | -0.705 |
Hera | -0.690 |
eda | -0.689 |
Token | Political |
Token ID | 14611 |
Feature activation | -3.10e-01 |
Pos logit contributions | |
MX | +4.917 |
ovie | +3.995 |
oir | +3.625 |
sburgh | +3.337 |
pa | +3.299 |
Neg logit contributions | |
ullivan | -13.725 |
asma | -13.237 |
lication | -13.179 |
enhagen | -13.081 |
zl | -13.021 |
Token | Action |
Token ID | 7561 |
Feature activation | -4.28e-01 |
Pos logit contributions | |
MX | +2.739 |
ovie | +2.455 |
oir | +2.306 |
sburgh | +2.122 |
butt | +2.099 |
Neg logit contributions | |
ullivan | -4.394 |
enhagen | -4.294 |
asma | -4.237 |
eda | -4.191 |
rocal | -4.111 |
Token | Conference |
Token ID | 8785 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
MX | +3.988 |
ovie | +3.625 |
oir | +3.476 |
butt | +3.218 |
sburgh | +3.206 |
Neg logit contributions | |
ullivan | -5.827 |
enhagen | -5.627 |
asma | -5.451 |
eda | -5.431 |
rocal | -5.430 |
Token | in |
Token ID | 287 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
MX | +4.732 |
ovie | +4.368 |
oir | +4.200 |
butt | +3.878 |
sburgh | +3.870 |
Neg logit contributions | |
ullivan | -6.333 |
enhagen | -6.121 |
asma | -6.120 |
Hera | -6.012 |
lication | -5.941 |
Token | February |
Token ID | 3945 |
Feature activation | +8.51e-02 |
Pos logit contributions | |
MX | +2.445 |
ovie | +2.273 |
oir | +2.139 |
resp | +2.025 |
butt | +2.011 |
Neg logit contributions | |
ullivan | -2.954 |
enhagen | -2.906 |
asma | -2.850 |
lication | -2.789 |
eda | -2.773 |
Token | city |
Token ID | 1748 |
Feature activation | -4.21e-01 |
Pos logit contributions | |
ullivan | +0.488 |
enhagen | +0.480 |
asma | +0.474 |
eda | +0.464 |
Hera | +0.462 |
Neg logit contributions | |
MX | -0.486 |
ovie | -0.455 |
oir | -0.431 |
resp | -0.406 |
butt | -0.404 |
Token | and |
Token ID | 290 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
MX | +3.887 |
ovie | +3.429 |
oir | +3.355 |
butt | +3.228 |
resp | +3.204 |
Neg logit contributions | |
enhagen | -5.619 |
ullivan | -5.608 |
asma | -5.390 |
lication | -5.367 |
Hera | -5.355 |
Token | state |
Token ID | 1181 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
MX | +2.500 |
ovie | +2.327 |
oir | +2.243 |
butt | +2.045 |
sburgh | +2.029 |
Neg logit contributions | |
ullivan | -3.727 |
enhagen | -3.677 |
asma | -3.601 |
Hera | -3.546 |
lication | -3.466 |
Token | for |
Token ID | 329 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
MX | +1.874 |
ovie | +1.692 |
oir | +1.650 |
resp | +1.532 |
butt | +1.517 |
Neg logit contributions | |
ullivan | -2.337 |
enhagen | -2.333 |
asma | -2.249 |
lication | -2.216 |
Hera | -2.203 |
Token | free |
Token ID | 1479 |
Feature activation | +4.63e-01 |
Pos logit contributions | |
MX | +1.384 |
ovie | +1.277 |
oir | +1.215 |
resp | +1.136 |
butt | +1.125 |
Neg logit contributions | |
ullivan | -1.737 |
enhagen | -1.717 |
asma | -1.669 |
Hera | -1.654 |
eda | -1.647 |
Token | . |
Token ID | 13 |
Feature activation | -8.11e-01 |
Pos logit contributions | |
ullivan | +4.766 |
asma | +4.706 |
eda | +4.640 |
enhagen | +4.604 |
Hera | +4.429 |
Neg logit contributions | |
MX | -5.496 |
oir | -5.064 |
ovie | -5.059 |
butt | -4.732 |
resp | -4.629 |
Token | Any |
Token ID | 4377 |
Feature activation | -9.20e-01 |
Pos logit contributions | |
MX | +7.419 |
ovie | +6.585 |
oir | +6.422 |
butt | +6.215 |
sburgh | +5.921 |
Neg logit contributions | |
enhagen | -11.301 |
ullivan | -10.762 |
cone | -10.067 |
lication | -10.044 |
Hera | -9.896 |
Token | contribution |
Token ID | 10156 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
MX | +7.462 |
oir | +6.192 |
resp | +5.696 |
butt | +5.487 |
ovie | +5.313 |
Neg logit contributions | |
enhagen | -13.526 |
ullivan | -13.387 |
Hera | -12.999 |
eda | -12.471 |
lication | -12.370 |
Token | to |
Token ID | 284 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
MX | +1.980 |
ovie | +1.789 |
oir | +1.749 |
resp | +1.616 |
butt | +1.615 |
Neg logit contributions | |
ullivan | -2.254 |
enhagen | -2.198 |
asma | -2.145 |
eda | -2.132 |
Hera | -2.114 |
Token | help |
Token ID | 1037 |
Feature activation | -7.25e-01 |
Pos logit contributions | |
MX | +1.579 |
ovie | +1.456 |
oir | +1.417 |
butt | +1.349 |
resp | +1.318 |
Neg logit contributions | |
ullivan | -1.549 |
enhagen | -1.530 |
asma | -1.483 |
eda | -1.463 |
lication | -1.458 |
Token | fund |
Token ID | 1814 |
Feature activation | -4.25e-01 |
Pos logit contributions | |
MX | +5.486 |
oir | +4.490 |
butt | +4.198 |
ovie | +4.166 |
iary | +4.138 |
Neg logit contributions | |
ullivan | -11.139 |
lication | -10.791 |
enhagen | -10.559 |
Hera | -10.400 |
rocal | -10.296 |
Token | line |
Token ID | 1627 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
ullivan | +2.760 |
enhagen | +2.687 |
asma | +2.671 |
Hera | +2.647 |
eda | +2.623 |
Neg logit contributions | |
MX | -2.806 |
ovie | -2.681 |
oir | -2.481 |
resp | -2.355 |
butt | -2.339 |
Token | of |
Token ID | 286 |
Feature activation | -2.80e-03 |
Pos logit contributions | |
ullivan | +3.495 |
enhagen | +3.443 |
asma | +3.381 |
Hera | +3.337 |
eda | +3.301 |
Neg logit contributions | |
MX | -3.989 |
ovie | -3.756 |
oir | -3.571 |
sburgh | -3.385 |
resp | -3.365 |
Token | credit |
Token ID | 3884 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
MX | +0.026 |
ovie | +0.024 |
oir | +0.023 |
resp | +0.021 |
butt | +0.021 |
Neg logit contributions | |
ullivan | -0.038 |
enhagen | -0.038 |
asma | -0.037 |
Hera | -0.036 |
eda | -0.036 |
Token | at |
Token ID | 379 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
ullivan | +2.778 |
enhagen | +2.745 |
asma | +2.712 |
Hera | +2.702 |
eda | +2.639 |
Neg logit contributions | |
MX | -2.865 |
ovie | -2.743 |
oir | -2.561 |
resp | -2.416 |
butt | -2.413 |
Token | Republic |
Token ID | 2066 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
MX | +0.194 |
ovie | +0.181 |
oir | +0.172 |
resp | +0.161 |
butt | +0.160 |
Neg logit contributions | |
ullivan | -0.214 |
enhagen | -0.210 |
asma | -0.207 |
Hera | -0.203 |
eda | -0.203 |
Token | National |
Token ID | 2351 |
Feature activation | -8.90e-01 |
Pos logit contributions | |
MX | +0.199 |
ovie | +0.185 |
oir | +0.176 |
resp | +0.164 |
butt | +0.163 |
Neg logit contributions | |
ullivan | -0.238 |
enhagen | -0.234 |
asma | -0.231 |
Hera | -0.226 |
eda | -0.226 |
Token | Bank |
Token ID | 5018 |
Feature activation | +3.12e-01 |
Pos logit contributions | |
MX | +7.801 |
oir | +7.366 |
ovie | +6.930 |
pa | +6.470 |
butt | +6.440 |
Neg logit contributions | |
ullivan | -11.776 |
enhagen | -11.130 |
lication | -10.576 |
asma | -10.534 |
Hera | -10.386 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e-02 |
Pos logit contributions | |
enhagen | +3.430 |
ullivan | +3.397 |
asma | +3.363 |
Hera | +3.308 |
eda | +3.307 |
Neg logit contributions | |
MX | -3.551 |
ovie | -3.391 |
oir | -3.152 |
resp | -2.990 |
butt | -2.979 |
Token | A |
Token ID | 317 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
MX | +1.110 |
ovie | +1.029 |
oir | +0.987 |
resp | +0.923 |
butt | +0.922 |
Neg logit contributions | |
ullivan | -1.152 |
enhagen | -1.137 |
asma | -1.109 |
eda | -1.085 |
Hera | -1.076 |
Token | decade |
Token ID | 5707 |
Feature activation | +3.71e-01 |
Pos logit contributions | |
ullivan | +1.491 |
enhagen | +1.462 |
asma | +1.446 |
Hera | +1.419 |
eda | +1.414 |
Neg logit contributions | |
MX | -1.593 |
ovie | -1.504 |
oir | -1.418 |
resp | -1.340 |
butt | -1.336 |
Token | - |
Token ID | 12 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
enhagen | +3.541 |
ullivan | +3.529 |
asma | +3.447 |
Hera | +3.413 |
eda | +3.397 |
Neg logit contributions | |
MX | -4.734 |
ovie | -4.466 |
oir | -4.226 |
butt | -4.004 |
sburgh | -3.984 |
Token | comedian |
Token ID | 23139 |
Feature activation | -8.20e-02 |
Pos logit contributions | |
ullivan | +3.613 |
enhagen | +3.497 |
Hera | +3.487 |
asma | +3.479 |
eda | +3.435 |
Neg logit contributions | |
MX | -3.649 |
ovie | -3.429 |
oir | -3.259 |
resp | -3.064 |
butt | -2.997 |
Token | has |
Token ID | 468 |
Feature activation | -1.42e-01 |
Pos logit contributions | |
MX | +0.904 |
ovie | +0.842 |
oir | +0.804 |
butt | +0.750 |
resp | +0.749 |
Neg logit contributions | |
ullivan | -0.976 |
enhagen | -0.961 |
asma | -0.942 |
eda | -0.925 |
Hera | -0.921 |
Token | long |
Token ID | 890 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
MX | +1.538 |
ovie | +1.431 |
oir | +1.368 |
butt | +1.281 |
resp | +1.267 |
Neg logit contributions | |
ullivan | -1.708 |
enhagen | -1.682 |
asma | -1.648 |
eda | -1.617 |
Hera | -1.611 |
Token | been |
Token ID | 587 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
ullivan | +1.266 |
enhagen | +1.252 |
asma | +1.228 |
Hera | +1.207 |
eda | +1.205 |
Neg logit contributions | |
MX | -1.276 |
ovie | -1.194 |
oir | -1.134 |
resp | -1.068 |
butt | -1.056 |
Token | on |
Token ID | 319 |
Feature activation | +3.99e-02 |
Pos logit contributions | |
MX | +2.656 |
ovie | +2.474 |
oir | +2.366 |
butt | +2.220 |
resp | +2.177 |
Neg logit contributions | |
ullivan | -2.797 |
enhagen | -2.748 |
asma | -2.689 |
lication | -2.648 |
eda | -2.635 |
Token | the |
Token ID | 262 |
Feature activation | -7.58e-01 |
Pos logit contributions | |
ullivan | +0.458 |
enhagen | +0.452 |
asma | +0.443 |
Hera | +0.437 |
eda | +0.434 |
Neg logit contributions | |
MX | -0.456 |
ovie | -0.425 |
oir | -0.405 |
resp | -0.381 |
butt | -0.378 |
Token | periphery |
Token ID | 46628 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
MX | +7.436 |
ovie | +7.130 |
oir | +6.619 |
resp | +6.208 |
butt | +6.097 |
Neg logit contributions | |
ullivan | -9.224 |
lication | -8.729 |
asma | -8.662 |
enhagen | -8.645 |
eda | -8.609 |
Token | of |
Token ID | 286 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
MX | +2.827 |
ovie | +2.653 |
oir | +2.535 |
butt | +2.371 |
resp | +2.325 |
Neg logit contributions | |
ullivan | -3.404 |
enhagen | -3.329 |
asma | -3.299 |
eda | -3.252 |
Hera | -3.208 |
Token | mainstream |
Token ID | 8661 |
Feature activation | +9.61e-02 |
Pos logit contributions | |
ullivan | +4.061 |
enhagen | +4.005 |
asma | +3.917 |
Hera | +3.905 |
eda | +3.839 |
Neg logit contributions | |
MX | -4.280 |
ovie | -3.957 |
oir | -3.783 |
resp | -3.584 |
sburgh | -3.485 |
Token | success |
Token ID | 1943 |
Feature activation | +2.90e-02 |
Pos logit contributions | |
ullivan | +1.057 |
enhagen | +1.037 |
asma | +1.025 |
Hera | +1.008 |
eda | +1.003 |
Neg logit contributions | |
MX | -1.142 |
ovie | -1.074 |
oir | -1.021 |
resp | -0.964 |
butt | -0.954 |
Token | , |
Token ID | 11 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
ullivan | +0.347 |
enhagen | +0.341 |
asma | +0.336 |
Hera | +0.330 |
eda | +0.329 |
Neg logit contributions | |
MX | -0.319 |
ovie | -0.297 |
oir | -0.282 |
resp | -0.264 |
butt | -0.263 |