Token | one |
Token ID | 530 |
Feature activation | +7.84e+00 |
Pos logit contributions | |
yles | +3.596 |
roth | +3.193 |
hap | +2.964 |
estate | +2.867 |
heid | +2.798 |
Neg logit contributions | |
Attention | -3.190 |
anticipation | -2.854 |
haste | -2.556 |
hurry | -2.469 |
)", | -2.440 |
Token | who |
Token ID | 508 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
yles | +7.244 |
roth | +6.397 |
hap | +5.912 |
hood | +5.749 |
estate | +5.706 |
Neg logit contributions | |
Attention | -6.435 |
anticipation | -5.680 |
haste | -5.136 |
hurry | -4.952 |
)", | -4.905 |
Token | had |
Token ID | 550 |
Feature activation | +1.49e-02 |
Pos logit contributions | |
yles | +10.213 |
roth | +9.128 |
hap | +8.393 |
hood | +8.183 |
heid | +8.000 |
Neg logit contributions | |
Attention | -9.339 |
anticipation | -8.252 |
haste | -7.417 |
hurry | -6.997 |
)", | -6.986 |
Token | carried |
Token ID | 5281 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
yles | +0.015 |
roth | +0.014 |
hap | +0.013 |
estate | +0.013 |
heid | +0.012 |
Neg logit contributions | |
Attention | -0.012 |
anticipation | -0.010 |
haste | -0.009 |
hurry | -0.009 |
Action | -0.009 |
Token | them |
Token ID | 606 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
yles | +11.281 |
roth | +10.138 |
hood | +9.182 |
hap | +9.078 |
ods | +9.036 |
Neg logit contributions | |
Attention | -8.799 |
anticipation | -7.867 |
haste | -7.155 |
hurry | -6.824 |
)", | -6.808 |
Token | to |
Token ID | 284 |
Feature activation | +3.49e+01 |
Pos logit contributions | |
yles | +12.074 |
roth | +10.878 |
hood | +10.019 |
hap | +9.981 |
estate | +9.643 |
Neg logit contributions | |
Attention | -11.794 |
anticipation | -10.206 |
haste | -9.400 |
)", | -9.169 |
Begin | -8.889 |
Token | an |
Token ID | 281 |
Feature activation | +2.08e+01 |
Pos logit contributions | |
yles | +22.201 |
roth | +20.999 |
podium | +19.588 |
Memorial | +19.480 |
hood | +19.333 |
Neg logit contributions | |
Attention | -16.645 |
anticipation | -14.037 |
)", | -13.466 |
actionGroup | -13.060 |
ÃÂ | -12.816 |
Token | upset |
Token ID | 9247 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
yles | +16.647 |
roth | +15.240 |
onym | +14.276 |
oles | +13.852 |
hap | +13.836 |
Neg logit contributions | |
Attention | -13.125 |
anticipation | -11.342 |
haste | -10.690 |
)", | -10.231 |
hurry | -10.061 |
Token | victory |
Token ID | 5373 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
yles | +11.595 |
roth | +10.519 |
hood | +9.387 |
hap | +9.252 |
heid | +9.147 |
Neg logit contributions | |
Attention | -12.251 |
anticipation | -10.591 |
haste | -9.659 |
)", | -9.466 |
hurry | -9.217 |
Token | over |
Token ID | 625 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
yles | +11.469 |
roth | +10.443 |
hap | +9.237 |
hood | +9.153 |
heid | +8.889 |
Neg logit contributions | |
Attention | -12.037 |
anticipation | -10.594 |
haste | -9.757 |
hurry | -9.380 |
)", | -9.224 |
Token | Titan |
Token ID | 11977 |
Feature activation | +6.90e+00 |
Pos logit contributions | |
yles | +13.062 |
roth | +12.069 |
hap | +11.020 |
ods | +10.637 |
hood | +10.598 |
Neg logit contributions | |
Attention | -10.978 |
anticipation | -9.615 |
haste | -8.680 |
)", | -8.437 |
hurry | -8.313 |
Token | ojure |
Token ID | 32511 |
Feature activation | +5.03e+00 |
Pos logit contributions | |
yles | +3.866 |
roth | +3.409 |
hap | +3.181 |
estate | +3.056 |
hood | +2.998 |
Neg logit contributions | |
Attention | -3.355 |
anticipation | -2.985 |
haste | -2.654 |
hurry | -2.558 |
Action | -2.549 |
Token | . |
Token ID | 13 |
Feature activation | -5.09e+00 |
Pos logit contributions | |
yles | +4.329 |
roth | +3.757 |
hap | +3.498 |
estate | +3.396 |
heid | +3.317 |
Neg logit contributions | |
Attention | -4.656 |
anticipation | -4.212 |
haste | -3.797 |
hurry | -3.710 |
)", | -3.648 |
Token | test |
Token ID | 9288 |
Feature activation | +5.67e-01 |
Pos logit contributions | |
Attention | +5.049 |
anticipation | +4.646 |
haste | +4.222 |
Action | +4.131 |
hurry | +4.072 |
Neg logit contributions | |
yles | -4.020 |
roth | -3.378 |
hap | -3.025 |
estate | -3.008 |
heid | -2.906 |
Token | was |
Token ID | 373 |
Feature activation | +9.97e+00 |
Pos logit contributions | |
yles | +0.506 |
roth | +0.439 |
hap | +0.408 |
estate | +0.395 |
heid | +0.381 |
Neg logit contributions | |
Attention | -0.522 |
anticipation | -0.476 |
haste | -0.428 |
hurry | -0.416 |
Action | -0.413 |
Token | by |
Token ID | 416 |
Feature activation | -5.36e+00 |
Pos logit contributions | |
yles | +9.345 |
roth | +8.467 |
hap | +8.035 |
estate | +7.824 |
hood | +7.636 |
Neg logit contributions | |
Attention | -7.530 |
anticipation | -6.669 |
haste | -5.853 |
hurry | -5.720 |
)", | -5.607 |
Token | far |
Token ID | 1290 |
Feature activation | +3.31e+01 |
Pos logit contributions | |
Attention | +4.317 |
anticipation | +3.903 |
haste | +3.480 |
Action | +3.367 |
hurry | +3.349 |
Neg logit contributions | |
yles | -5.311 |
roth | -4.694 |
hap | -4.374 |
estate | -4.291 |
heid | -4.206 |
Token | the |
Token ID | 262 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
yles | +20.445 |
roth | +18.716 |
hood | +18.314 |
hap | +17.782 |
outwe | +16.968 |
Neg logit contributions | |
Attention | -18.141 |
anticipation | -15.872 |
hurry | -14.275 |
)", | -14.015 |
urgency | -13.876 |
Token | most |
Token ID | 749 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
yles | +13.392 |
roth | +12.059 |
hood | +10.890 |
hap | +10.836 |
iest | +10.750 |
Neg logit contributions | |
Attention | -14.911 |
anticipation | -13.263 |
)=( | -11.912 |
haste | -11.884 |
)", | -11.795 |
Token | used |
Token ID | 973 |
Feature activation | -3.46e-01 |
Pos logit contributions | |
yles | +2.020 |
roth | +1.746 |
hap | +1.629 |
estate | +1.586 |
hood | +1.531 |
Neg logit contributions | |
Attention | -2.115 |
anticipation | -1.925 |
haste | -1.731 |
hurry | -1.687 |
Action | -1.668 |
Token | . |
Token ID | 13 |
Feature activation | +3.46e+00 |
Pos logit contributions | |
Attention | +0.298 |
anticipation | +0.271 |
haste | +0.241 |
hurry | +0.234 |
Action | +0.233 |
Neg logit contributions | |
yles | -0.328 |
roth | -0.288 |
hap | -0.268 |
estate | -0.261 |
heid | -0.253 |
Token |
|
Token ID | 198 |
Feature activation | +8.09e-01 |
Pos logit contributions | |
yles | +3.353 |
roth | +2.965 |
hap | +2.780 |
estate | +2.700 |
hood | +2.629 |
Neg logit contributions | |
Attention | -2.815 |
anticipation | -2.563 |
haste | -2.278 |
hurry | -2.216 |
)", | -2.162 |
Token | Na |
Token ID | 11013 |
Feature activation | +3.13e-01 |
Pos logit contributions | |
yles | +8.070 |
roth | +7.218 |
hap | +6.661 |
heid | +6.445 |
hood | +6.381 |
Neg logit contributions | |
Attention | -7.311 |
anticipation | -6.530 |
haste | -5.850 |
)", | -5.691 |
hurry | -5.594 |
Token | ` |
Token ID | 63 |
Feature activation | +2.45e+00 |
Pos logit contributions | |
yles | +0.395 |
roth | +0.358 |
hap | +0.341 |
estate | +0.334 |
heid | +0.327 |
Neg logit contributions | |
Attention | -0.172 |
anticipation | -0.147 |
haste | -0.120 |
hurry | -0.113 |
Action | -0.111 |
Token | Vi |
Token ID | 38432 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
yles | +2.320 |
roth | +2.050 |
hap | +1.904 |
estate | +1.860 |
hood | +1.795 |
Neg logit contributions | |
Attention | -2.104 |
anticipation | -1.894 |
haste | -1.692 |
hurry | -1.637 |
Action | -1.621 |
Token | team |
Token ID | 1074 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
yles | +9.009 |
roth | +8.089 |
hap | +7.446 |
estate | +7.145 |
hood | +7.103 |
Neg logit contributions | |
Attention | -8.821 |
anticipation | -7.859 |
haste | -7.011 |
)", | -6.895 |
hurry | -6.744 |
Token | fresh |
Token ID | 4713 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
yles | +9.038 |
roth | +8.065 |
hap | +7.487 |
estate | +7.178 |
hood | +7.142 |
Neg logit contributions | |
Attention | -8.786 |
anticipation | -7.762 |
haste | -6.903 |
)", | -6.731 |
hurry | -6.680 |
Token | off |
Token ID | 572 |
Feature activation | +3.29e+01 |
Pos logit contributions | |
Attention | +0.733 |
anticipation | +0.641 |
haste | +0.538 |
hurry | +0.512 |
Action | +0.508 |
Neg logit contributions | |
yles | -1.387 |
roth | -1.249 |
hap | -1.186 |
estate | -1.162 |
heid | -1.131 |
Token | of |
Token ID | 286 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
yles | +21.159 |
roth | +20.129 |
ebin | +18.024 |
hap | +18.016 |
Memorial | +17.886 |
Neg logit contributions | |
Attention | -17.616 |
anticipation | -14.539 |
haste | -13.429 |
)", | -13.300 |
hurry | -13.149 |
Token | travel |
Token ID | 3067 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
yles | +19.427 |
roth | +18.272 |
hap | +17.111 |
acles | +16.578 |
ods | +16.562 |
Neg logit contributions | |
Attention | -16.363 |
anticipation | -13.850 |
haste | -12.971 |
hurry | -12.463 |
)", | -12.323 |
Token | from |
Token ID | 422 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
yles | +11.408 |
roth | +10.019 |
hap | +9.177 |
estate | +9.004 |
hood | +8.943 |
Neg logit contributions | |
Attention | -10.892 |
anticipation | -9.394 |
)", | -8.610 |
haste | -8.421 |
hurry | -8.297 |
Token | Down |
Token ID | 5588 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
yles | +14.558 |
roth | +13.324 |
hap | +12.483 |
oles | +12.089 |
hood | +11.975 |
Neg logit contributions | |
Attention | -10.619 |
anticipation | -8.920 |
haste | -8.214 |
)", | -7.986 |
Begin | -7.633 |
Token | Under |
Token ID | 4698 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
yles | +9.855 |
roth | +8.692 |
hap | +8.167 |
heid | +7.954 |
estate | +7.768 |
Neg logit contributions | |
Attention | -9.374 |
anticipation | -8.508 |
haste | -7.891 |
hurry | -7.387 |
)", | -7.349 |
Token | upside |
Token ID | 17196 |
Feature activation | +6.59e+00 |
Pos logit contributions | |
yles | +7.409 |
roth | +6.594 |
hap | +6.166 |
estate | +5.937 |
hood | +5.900 |
Neg logit contributions | |
Attention | -6.025 |
anticipation | -5.266 |
haste | -4.686 |
)", | -4.660 |
hurry | -4.518 |
Token | doesn |
Token ID | 1595 |
Feature activation | -7.27e+00 |
Pos logit contributions | |
yles | +5.980 |
roth | +5.292 |
hap | +4.895 |
estate | +4.817 |
hood | +4.668 |
Neg logit contributions | |
Attention | -5.639 |
anticipation | -4.968 |
haste | -4.500 |
)", | -4.365 |
Action | -4.332 |
Token | � |
Token ID | 447 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
Attention | +2.864 |
anticipation | +2.278 |
haste | +1.677 |
)", | +1.600 |
Action | +1.588 |
Neg logit contributions | |
yles | -10.109 |
roth | -9.079 |
hap | -8.708 |
estate | -8.581 |
onyms | -8.483 |
Token | � |
Token ID | 247 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
Attention | +1.397 |
anticipation | +1.262 |
haste | +1.107 |
hurry | +1.076 |
Action | +1.066 |
Neg logit contributions | |
yles | -1.670 |
roth | -1.476 |
hap | -1.378 |
estate | -1.342 |
heid | -1.316 |
Token | t |
Token ID | 83 |
Feature activation | +1.87e+01 |
Pos logit contributions | |
Attention | +1.093 |
anticipation | +1.007 |
haste | +0.902 |
hurry | +0.885 |
Action | +0.875 |
Neg logit contributions | |
yles | -0.950 |
roth | -0.814 |
hap | -0.753 |
estate | -0.727 |
heid | -0.708 |
Token | seem |
Token ID | 1283 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
yles | +13.657 |
roth | +12.545 |
hap | +12.169 |
estate | +11.029 |
hood | +10.998 |
Neg logit contributions | |
Attention | -15.374 |
anticipation | -13.076 |
ラン | -11.832 |
haste | -11.690 |
;;;;;;;; | -11.375 |
Token | to |
Token ID | 284 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
yles | +20.257 |
roth | +19.427 |
hap | +17.839 |
hood | +17.581 |
outwe | +17.495 |
Neg logit contributions | |
Attention | -19.337 |
anticipation | -16.353 |
)", | -15.264 |
ラン | -14.619 |
haste | -14.547 |
Token | be |
Token ID | 307 |
Feature activation | +2.89e+01 |
Pos logit contributions | |
yles | +13.266 |
roth | +12.270 |
hap | +11.544 |
estate | +10.641 |
hood | +10.532 |
Neg logit contributions | |
Attention | -15.487 |
anticipation | -13.293 |
haste | -12.006 |
ラン | -11.915 |
Action | -11.867 |
Token | significantly |
Token ID | 5566 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
yles | +19.544 |
roth | +18.636 |
hood | +17.290 |
outwe | +17.268 |
estate | +17.206 |
Neg logit contributions | |
Attention | -17.509 |
anticipation | -14.348 |
ラン | -13.811 |
haste | -13.501 |
Begin | -13.365 |
Token | better |
Token ID | 1365 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
yles | +13.555 |
roth | +12.281 |
hood | +11.730 |
outwe | +11.696 |
hap | +11.390 |
Neg logit contributions | |
Attention | -13.487 |
anticipation | -11.370 |
haste | -10.463 |
ラン | -10.102 |
Begin | -10.069 |
Token | as |
Token ID | 355 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
yles | +2.110 |
roth | +1.852 |
hap | +1.719 |
estate | +1.670 |
hood | +1.612 |
Neg logit contributions | |
Attention | -2.117 |
anticipation | -1.907 |
haste | -1.726 |
hurry | -1.667 |
Action | -1.658 |
Token | , |
Token ID | 11 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
yles | +9.771 |
roth | +8.753 |
hap | +7.985 |
hood | +7.772 |
estate | +7.701 |
Neg logit contributions | |
Attention | -10.289 |
anticipation | -8.995 |
haste | -8.337 |
)", | -8.175 |
hurry | -8.056 |
Token | and |
Token ID | 290 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
yles | +10.292 |
roth | +9.189 |
hap | +8.518 |
hood | +8.322 |
estate | +8.184 |
Neg logit contributions | |
Attention | -9.215 |
anticipation | -7.710 |
haste | -7.070 |
)", | -7.065 |
hurry | -6.854 |
Token | falling |
Token ID | 7463 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
yles | +12.335 |
roth | +11.119 |
hap | +10.290 |
hood | +10.178 |
enshr | +9.937 |
Neg logit contributions | |
Attention | -11.727 |
anticipation | -9.648 |
haste | -9.026 |
)", | -8.750 |
Begin | -8.588 |
Token | just |
Token ID | 655 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
yles | +10.826 |
roth | +9.563 |
hap | +8.937 |
hood | +8.759 |
estate | +8.686 |
Neg logit contributions | |
Attention | -9.048 |
anticipation | -7.705 |
haste | -6.935 |
)", | -6.848 |
Begin | -6.639 |
Token | short |
Token ID | 1790 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
yles | +12.981 |
roth | +11.620 |
hap | +10.969 |
hood | +10.818 |
ods | +10.741 |
Neg logit contributions | |
Attention | -8.012 |
anticipation | -6.599 |
haste | -5.875 |
)", | -5.782 |
Begin | -5.434 |
Token | of |
Token ID | 286 |
Feature activation | +3.25e+01 |
Pos logit contributions | |
yles | +11.531 |
roth | +10.376 |
hood | +9.465 |
hap | +9.392 |
estate | +8.891 |
Neg logit contributions | |
Attention | -13.344 |
anticipation | -11.596 |
)", | -10.842 |
haste | -10.650 |
hurry | -10.197 |
Token | the |
Token ID | 262 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
yles | +20.714 |
roth | +19.191 |
hood | +18.713 |
enshr | +18.622 |
Memorial | +18.362 |
Neg logit contributions | |
Attention | -18.129 |
)", | -14.748 |
actionGroup | -14.725 |
anticipation | -14.415 |
Begin | -14.205 |
Token | Stanley |
Token ID | 14167 |
Feature activation | +8.33e+00 |
Pos logit contributions | |
yles | +12.903 |
roth | +11.691 |
hap | +10.766 |
hood | +10.496 |
Memorial | +10.206 |
Neg logit contributions | |
Attention | -10.519 |
anticipation | -9.182 |
)", | -8.500 |
haste | -8.255 |
hurry | -7.979 |
Token | Cup |
Token ID | 5454 |
Feature activation | +7.96e+00 |
Pos logit contributions | |
yles | +4.859 |
roth | +3.974 |
hap | +3.499 |
hood | +3.296 |
estate | +3.235 |
Neg logit contributions | |
Attention | -9.697 |
anticipation | -9.039 |
haste | -8.469 |
hurry | -8.220 |
)", | -8.215 |
Token | Finals |
Token ID | 19705 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
yles | +6.475 |
roth | +5.659 |
hood | +4.948 |
hap | +4.941 |
estate | +4.886 |
Neg logit contributions | |
Attention | -7.504 |
anticipation | -6.739 |
haste | -6.250 |
)", | -6.127 |
hurry | -5.986 |
Token | by |
Token ID | 416 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
yles | +9.006 |
roth | +7.900 |
hap | +7.361 |
hood | +7.065 |
estate | +6.947 |
Neg logit contributions | |
Attention | -8.782 |
anticipation | -7.723 |
haste | -7.225 |
)", | -7.108 |
hurry | -6.916 |
Token | : |
Token ID | 1058 |
Feature activation | +2.97e+00 |
Pos logit contributions | |
yles | +11.633 |
roth | +10.623 |
hap | +10.032 |
estate | +9.664 |
hood | +9.635 |
Neg logit contributions | |
Attention | -10.368 |
anticipation | -9.467 |
haste | -8.400 |
)", | -8.134 |
hurry | -8.112 |
Token | Bh |
Token ID | 16581 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
yles | +3.006 |
roth | +2.675 |
hap | +2.514 |
estate | +2.443 |
hood | +2.381 |
Neg logit contributions | |
Attention | -2.294 |
anticipation | -2.085 |
haste | -1.832 |
hurry | -1.771 |
)", | -1.722 |
Token | air |
Token ID | 958 |
Feature activation | +7.78e+00 |
Pos logit contributions | |
yles | +1.326 |
roth | +1.137 |
hap | +1.051 |
estate | +1.009 |
heid | +0.971 |
Neg logit contributions | |
Attention | -1.652 |
anticipation | -1.520 |
haste | -1.381 |
hurry | -1.345 |
Action | -1.334 |
Token | ava |
Token ID | 4170 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
yles | +4.517 |
roth | +3.749 |
hap | +3.291 |
estate | +3.184 |
hood | +3.036 |
Neg logit contributions | |
Attention | -9.205 |
anticipation | -8.622 |
haste | -7.948 |
hurry | -7.766 |
)", | -7.614 |
Token | is |
Token ID | 318 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
yles | +10.698 |
roth | +9.560 |
hap | +9.076 |
hood | +8.773 |
estate | +8.606 |
Neg logit contributions | |
Attention | -10.134 |
anticipation | -9.321 |
haste | -8.276 |
hurry | -8.056 |
)", | -8.033 |
Token | considered |
Token ID | 3177 |
Feature activation | +3.18e+01 |
Pos logit contributions | |
yles | +12.957 |
roth | +12.024 |
hap | +11.427 |
enshr | +10.966 |
hood | +10.791 |
Neg logit contributions | |
Attention | -12.450 |
anticipation | -11.401 |
haste | -9.910 |
;;;;;;;; | -9.779 |
hurry | -9.749 |
Token | as |
Token ID | 355 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
yles | +20.020 |
roth | +19.126 |
hap | +18.714 |
enshr | +18.134 |
memorial | +18.047 |
Neg logit contributions | |
Attention | -16.954 |
anticipation | -15.480 |
;;;;;;;; | -13.559 |
Begin | -13.415 |
ÃÂ | -13.309 |
Token | a |
Token ID | 257 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
yles | +18.719 |
roth | +17.077 |
hap | +16.845 |
enshr | +16.412 |
memorial | +16.263 |
Neg logit contributions | |
Attention | -15.450 |
anticipation | -13.768 |
haste | -12.009 |
Begin | -11.931 |
;;;;;;;; | -11.913 |
Token | form |
Token ID | 1296 |
Feature activation | +5.04e+00 |
Pos logit contributions | |
yles | +13.826 |
roth | +12.342 |
hap | +11.704 |
memorial | +11.393 |
hood | +11.298 |
Neg logit contributions | |
Attention | -12.325 |
anticipation | -10.943 |
haste | -9.467 |
)", | -9.420 |
Begin | -9.293 |
Token | of |
Token ID | 286 |
Feature activation | +5.83e+00 |
Pos logit contributions | |
yles | +4.675 |
roth | +4.115 |
hap | +3.819 |
estate | +3.703 |
hood | +3.637 |
Neg logit contributions | |
Attention | -4.338 |
anticipation | -3.935 |
haste | -3.490 |
hurry | -3.395 |
Action | -3.356 |
Token | Shiva |
Token ID | 33995 |
Feature activation | +5.39e+00 |
Pos logit contributions | |
yles | +5.450 |
roth | +4.842 |
hap | +4.594 |
estate | +4.345 |
hood | +4.301 |
Neg logit contributions | |
Attention | -4.737 |
anticipation | -4.269 |
haste | -3.761 |
)", | -3.687 |
hurry | -3.682 |
Token | witnesses |
Token ID | 11432 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
yles | +6.035 |
roth | +5.391 |
hap | +5.126 |
estate | +4.972 |
hood | +4.783 |
Neg logit contributions | |
Attention | -5.282 |
anticipation | -4.642 |
haste | -4.177 |
hurry | -4.071 |
)", | -4.041 |
Token | range |
Token ID | 2837 |
Feature activation | +6.43e+00 |
Pos logit contributions | |
yles | +9.229 |
roth | +8.440 |
hap | +7.973 |
estate | +7.691 |
hood | +7.619 |
Neg logit contributions | |
Attention | -8.859 |
anticipation | -7.750 |
haste | -6.984 |
;;;;;;;; | -6.785 |
)", | -6.702 |
Token | from |
Token ID | 422 |
Feature activation | +1.81e+01 |
Pos logit contributions | |
yles | +6.499 |
roth | +5.841 |
hap | +5.535 |
estate | +5.346 |
hood | +5.220 |
Neg logit contributions | |
Attention | -4.841 |
anticipation | -4.291 |
haste | -3.776 |
hurry | -3.641 |
)", | -3.639 |
Token | several |
Token ID | 1811 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
yles | +12.936 |
roth | +11.229 |
hap | +10.759 |
hood | +10.429 |
memorial | +10.376 |
Neg logit contributions | |
Attention | -14.191 |
anticipation | -12.593 |
ÃÂ | -11.971 |
;;;;;;;; | -11.916 |
)", | -11.782 |
Token | hundred |
Token ID | 3470 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
yles | +10.798 |
roth | +9.414 |
hap | +8.777 |
hood | +8.404 |
onyms | +8.102 |
Neg logit contributions | |
Attention | -13.338 |
anticipation | -11.917 |
haste | -10.950 |
)", | -10.905 |
;;;;;;;; | -10.695 |
Token | to |
Token ID | 284 |
Feature activation | +3.14e+01 |
Pos logit contributions | |
yles | +3.012 |
roth | +2.633 |
hap | +2.421 |
estate | +2.314 |
hood | +2.271 |
Neg logit contributions | |
Attention | -3.330 |
anticipation | -3.038 |
haste | -2.767 |
hurry | -2.670 |
)", | -2.647 |
Token | several |
Token ID | 1811 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
yles | +18.711 |
roth | +16.650 |
hap | +16.239 |
memorial | +15.908 |
hood | +15.671 |
Neg logit contributions | |
Attention | -18.983 |
ÃÂ | -16.821 |
anticipation | -16.617 |
)", | -16.342 |
;;;;;;;; | -16.080 |
Token | thousand |
Token ID | 7319 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
yles | +13.570 |
roth | +11.916 |
hap | +11.566 |
hood | +10.922 |
ods | +10.495 |
Neg logit contributions | |
Attention | -17.307 |
anticipation | -15.382 |
)", | -14.539 |
haste | -14.346 |
Begin | -14.056 |
Token | . |
Token ID | 13 |
Feature activation | +9.11e+00 |
Pos logit contributions | |
Attention | +2.464 |
anticipation | +2.241 |
haste | +1.976 |
hurry | +1.927 |
Action | +1.919 |
Neg logit contributions | |
yles | -2.712 |
roth | -2.374 |
hap | -2.201 |
estate | -2.177 |
heid | -2.097 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
yles | +6.838 |
roth | +5.928 |
hap | +5.452 |
estate | +5.233 |
hood | +5.193 |
Neg logit contributions | |
Attention | -8.409 |
anticipation | -8.036 |
haste | -7.578 |
hurry | -7.332 |
)", | -7.069 |
Token | Ped |
Token ID | 43468 |
Feature activation | +3.78e+00 |
Pos logit contributions | |
yles | +1.874 |
roth | +1.651 |
hap | +1.546 |
estate | +1.504 |
heid | +1.455 |
Neg logit contributions | |
Attention | -1.684 |
anticipation | -1.527 |
haste | -1.362 |
hurry | -1.323 |
Action | -1.303 |
Token | women |
Token ID | 1466 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
yles | +12.096 |
roth | +10.362 |
hood | +10.193 |
hap | +9.681 |
enshr | +9.658 |
Neg logit contributions | |
Attention | -10.196 |
anticipation | -9.259 |
haste | -8.192 |
)", | -8.061 |
;;;;;;;; | -7.834 |
Token | together |
Token ID | 1978 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
yles | +11.753 |
roth | +10.226 |
hood | +10.140 |
enshr | +9.780 |
memorial | +9.553 |
Neg logit contributions | |
Attention | -12.428 |
anticipation | -11.293 |
haste | -10.086 |
)", | -9.662 |
hurry | -9.634 |
Token | , |
Token ID | 11 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
yles | +15.384 |
roth | +13.277 |
hood | +13.192 |
enshr | +12.992 |
memorial | +12.839 |
Neg logit contributions | |
Attention | -14.749 |
anticipation | -13.440 |
haste | -12.111 |
hurry | -11.661 |
Begin | -11.266 |
Token | as |
Token ID | 355 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
yles | +13.862 |
roth | +12.501 |
enshr | +12.078 |
hood | +12.073 |
hap | +12.001 |
Neg logit contributions | |
Attention | -10.272 |
anticipation | -8.999 |
)", | -7.964 |
;;;;;;;; | -7.856 |
haste | -7.846 |
Token | well |
Token ID | 880 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
yles | +12.982 |
roth | +11.407 |
hap | +10.838 |
hood | +10.659 |
memorial | +10.622 |
Neg logit contributions | |
Attention | -10.211 |
anticipation | -8.836 |
haste | -8.082 |
)", | -7.793 |
hurry | -7.680 |
Token | as |
Token ID | 355 |
Feature activation | +3.11e+01 |
Pos logit contributions | |
yles | +10.548 |
roth | +9.165 |
hap | +8.604 |
estate | +8.274 |
hood | +8.179 |
Neg logit contributions | |
Attention | -14.374 |
anticipation | -12.925 |
haste | -12.013 |
)", | -11.987 |
hurry | -11.793 |
Token | the |
Token ID | 262 |
Feature activation | +1.76e+01 |
Pos logit contributions | |
yles | +21.370 |
memorial | +19.430 |
roth | +18.879 |
hood | +18.627 |
hap | +18.624 |
Neg logit contributions | |
Attention | -16.070 |
anticipation | -13.512 |
)", | -12.651 |
haste | -12.353 |
actionGroup | -12.293 |
Token | only |
Token ID | 691 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
yles | +13.377 |
roth | +11.647 |
memorial | +10.955 |
hap | +10.882 |
hood | +10.520 |
Neg logit contributions | |
Attention | -13.364 |
anticipation | -11.770 |
haste | -10.822 |
)", | -10.681 |
;;;;;;;; | -10.380 |
Token | one |
Token ID | 530 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
yles | +13.534 |
roth | +11.759 |
memorial | +11.707 |
enshr | +11.296 |
hood | +11.256 |
Neg logit contributions | |
Attention | -12.840 |
anticipation | -11.459 |
haste | -10.213 |
)", | -10.211 |
Begin | -9.845 |
Token | of |
Token ID | 286 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
yles | +13.797 |
roth | +12.388 |
memorial | +11.971 |
enshr | +11.865 |
hood | +11.812 |
Neg logit contributions | |
Attention | -12.219 |
anticipation | -10.931 |
haste | -9.522 |
)", | -9.360 |
hurry | -9.278 |
Token | Keller |
Token ID | 35999 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
yles | +2.167 |
roth | +1.923 |
hap | +1.808 |
estate | +1.757 |
hood | +1.714 |
Neg logit contributions | |
Attention | -1.633 |
anticipation | -1.458 |
haste | -1.279 |
hurry | -1.236 |
Action | -1.225 |
Token | would |
Token ID | 561 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
yles | +12.777 |
roth | +11.617 |
hap | +10.761 |
estate | +10.547 |
hood | +10.514 |
Neg logit contributions | |
Attention | -9.100 |
anticipation | -8.045 |
haste | -6.837 |
)", | -6.730 |
;;;;;;;; | -6.505 |
Token | much |
Token ID | 881 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
yles | +12.400 |
roth | +11.293 |
hap | +10.698 |
estate | +10.217 |
hood | +10.145 |
Neg logit contributions | |
Attention | -9.588 |
anticipation | -8.549 |
haste | -7.359 |
)", | -7.245 |
Action | -7.039 |
Token | prefer |
Token ID | 4702 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
yles | +3.250 |
roth | +2.876 |
hap | +2.694 |
estate | +2.650 |
hood | +2.556 |
Neg logit contributions | |
Attention | -2.586 |
anticipation | -2.297 |
haste | -2.027 |
hurry | -1.959 |
Action | -1.952 |
Token | the |
Token ID | 262 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
yles | +17.605 |
roth | +16.282 |
estate | +15.087 |
hap | +14.961 |
hood | +14.678 |
Neg logit contributions | |
Attention | -13.522 |
anticipation | -11.783 |
)", | -10.384 |
haste | -10.199 |
Begin | -10.154 |
Token | lower |
Token ID | 2793 |
Feature activation | +2.31e+01 |
Pos logit contributions | |
yles | +12.685 |
roth | +11.460 |
estate | +10.791 |
hap | +10.679 |
hood | +10.405 |
Neg logit contributions | |
Attention | -10.752 |
anticipation | -9.387 |
)", | -8.290 |
haste | -8.229 |
Begin | -8.187 |
Token | res |
Token ID | 581 |
Feature activation | +3.10e+01 |
Pos logit contributions | |
yles | +16.616 |
roth | +15.105 |
estate | +15.078 |
hap | +14.288 |
hood | +14.181 |
Neg logit contributions | |
Attention | -15.085 |
anticipation | -13.006 |
;;;;;;;; | -11.702 |
)", | -11.587 |
Begin | -11.571 |
Token | without |
Token ID | 1231 |
Feature activation | +2.35e+01 |
Pos logit contributions | |
yles | +20.752 |
roth | +19.357 |
hap | +18.439 |
estate | +18.384 |
hood | +18.010 |
Neg logit contributions | |
Attention | -16.811 |
anticipation | -14.364 |
Begin | -13.146 |
ÃÂ | -12.754 |
ラン | -12.548 |
Token | screen |
Token ID | 3159 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
yles | +18.176 |
roth | +16.511 |
hap | +15.560 |
hood | +15.380 |
detrim | +15.137 |
Neg logit contributions | |
Attention | -13.618 |
anticipation | -12.076 |
Begin | -11.150 |
ÃÂ | -10.997 |
)", | -10.967 |
Token | door |
Token ID | 3420 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
yles | +8.824 |
roth | +7.473 |
hap | +6.828 |
hood | +6.583 |
estate | +6.471 |
Neg logit contributions | |
Attention | -12.523 |
anticipation | -11.198 |
hurry | -10.185 |
;;;;;;;; | -10.147 |
)", | -10.113 |
Token | effect |
Token ID | 1245 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
yles | +11.446 |
roth | +10.349 |
hap | +9.802 |
estate | +9.750 |
hood | +9.599 |
Neg logit contributions | |
Attention | -6.432 |
anticipation | -5.359 |
haste | -4.593 |
hurry | -4.551 |
)", | -4.536 |
Token | . |
Token ID | 13 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
yles | +17.699 |
roth | +15.922 |
hap | +15.198 |
estate | +15.125 |
hood | +14.942 |
Neg logit contributions | |
Attention | -13.132 |
anticipation | -11.385 |
)", | -10.085 |
haste | -10.070 |
hurry | -9.966 |
Token | t |
Token ID | 83 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
yles | +1.044 |
roth | +0.889 |
hap | +0.813 |
estate | +0.785 |
heid | +0.750 |
Neg logit contributions | |
Attention | -1.395 |
anticipation | -1.284 |
haste | -1.171 |
hurry | -1.140 |
Action | -1.134 |
Token | think |
Token ID | 892 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
yles | +11.916 |
roth | +10.848 |
hap | +9.763 |
hood | +9.429 |
estate | +9.424 |
Neg logit contributions | |
Attention | -14.095 |
anticipation | -12.401 |
haste | -11.010 |
;;;;;;;; | -10.940 |
)", | -10.760 |
Token | it |
Token ID | 340 |
Feature activation | +2.28e+01 |
Pos logit contributions | |
yles | +10.465 |
roth | +9.253 |
hap | +8.588 |
estate | +8.546 |
heid | +8.483 |
Neg logit contributions | |
Attention | -7.736 |
anticipation | -6.693 |
haste | -5.983 |
hurry | -5.731 |
)", | -5.696 |
Token | � |
Token ID | 447 |
Feature activation | +2.73e+00 |
Pos logit contributions | |
yles | +17.463 |
roth | +15.288 |
hood | +14.230 |
hap | +13.929 |
heid | +13.732 |
Neg logit contributions | |
Attention | -15.918 |
anticipation | -13.706 |
haste | -12.514 |
hurry | -12.049 |
)", | -11.961 |
Token | � |
Token ID | 247 |
Feature activation | +8.45e+00 |
Pos logit contributions | |
yles | +2.387 |
roth | +2.096 |
hap | +1.930 |
estate | +1.888 |
hood | +1.823 |
Neg logit contributions | |
Attention | -2.537 |
anticipation | -2.307 |
haste | -2.069 |
hurry | -2.024 |
Action | -1.998 |
Token | s |
Token ID | 82 |
Feature activation | +3.07e+01 |
Pos logit contributions | |
yles | +6.942 |
roth | +5.906 |
hap | +5.487 |
estate | +5.343 |
hood | +5.290 |
Neg logit contributions | |
Attention | -8.000 |
anticipation | -7.234 |
haste | -6.596 |
hurry | -6.399 |
Action | -6.345 |
Token | had |
Token ID | 550 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
yles | +20.280 |
roth | +18.180 |
hood | +17.741 |
memorial | +17.728 |
hap | +17.358 |
Neg logit contributions | |
Attention | -17.049 |
anticipation | -14.236 |
ラン | -13.621 |
Begin | -13.033 |
haste | -12.746 |
Token | an |
Token ID | 281 |
Feature activation | +5.81e+00 |
Pos logit contributions | |
yles | +10.168 |
roth | +8.901 |
hap | +8.353 |
estate | +8.298 |
hood | +7.970 |
Neg logit contributions | |
Attention | -9.623 |
anticipation | -8.441 |
haste | -7.693 |
)", | -7.612 |
hurry | -7.519 |
Token | entertainment |
Token ID | 9739 |
Feature activation | +8.64e+00 |
Pos logit contributions | |
yles | +5.586 |
roth | +4.901 |
estate | +4.588 |
hap | +4.573 |
hood | +4.408 |
Neg logit contributions | |
Attention | -4.608 |
anticipation | -4.018 |
haste | -3.703 |
hurry | -3.546 |
)", | -3.492 |
Token | concept |
Token ID | 3721 |
Feature activation | +7.80e+00 |
Pos logit contributions | |
yles | +8.148 |
roth | +7.263 |
estate | +6.739 |
hap | +6.650 |
hood | +6.517 |
Neg logit contributions | |
Attention | -6.698 |
anticipation | -5.787 |
haste | -5.339 |
)", | -5.074 |
hurry | -5.063 |
Token | that |
Token ID | 326 |
Feature activation | +9.29e+00 |
Pos logit contributions | |
yles | +6.870 |
roth | +6.032 |
hap | +5.482 |
estate | +5.443 |
hood | +5.364 |
Neg logit contributions | |
Attention | -6.723 |
anticipation | -5.999 |
haste | -5.499 |
)", | -5.293 |
hurry | -5.250 |
Token | this |
Token ID | 428 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
Attention | +0.443 |
anticipation | +0.395 |
haste | +0.343 |
hurry | +0.330 |
Action | +0.328 |
Neg logit contributions | |
yles | -0.641 |
roth | -0.571 |
hap | -0.535 |
estate | -0.524 |
heid | -0.510 |
Token | temple |
Token ID | 12505 |
Feature activation | +7.31e+00 |
Pos logit contributions | |
yles | +10.464 |
roth | +8.896 |
hap | +8.723 |
memorial | +8.316 |
estate | +8.268 |
Neg logit contributions | |
Attention | -12.250 |
anticipation | -10.947 |
haste | -9.895 |
)", | -9.871 |
;;;;;;;; | -9.828 |
Token | , |
Token ID | 11 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
yles | +6.812 |
roth | +5.992 |
hap | +5.695 |
estate | +5.500 |
hood | +5.358 |
Neg logit contributions | |
Attention | -5.911 |
anticipation | -5.365 |
haste | -4.767 |
)", | -4.575 |
hurry | -4.553 |
Token | 14 |
Token ID | 1478 |
Feature activation | +8.82e+00 |
Pos logit contributions | |
yles | +1.772 |
roth | +1.574 |
hap | +1.485 |
estate | +1.443 |
heid | +1.401 |
Neg logit contributions | |
Attention | -1.314 |
anticipation | -1.177 |
haste | -1.034 |
hurry | -0.996 |
Action | -0.981 |
Token | are |
Token ID | 389 |
Feature activation | +6.26e+00 |
Pos logit contributions | |
yles | +8.412 |
roth | +7.537 |
hap | +7.147 |
estate | +6.821 |
hood | +6.654 |
Neg logit contributions | |
Attention | -6.778 |
anticipation | -6.093 |
haste | -5.415 |
hurry | -5.141 |
)", | -5.108 |
Token | considered |
Token ID | 3177 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
yles | +5.894 |
roth | +5.190 |
hap | +4.940 |
estate | +4.678 |
heid | +4.589 |
Neg logit contributions | |
Attention | -5.088 |
anticipation | -4.589 |
haste | -4.073 |
hurry | -3.967 |
)", | -3.925 |
Token | unique |
Token ID | 3748 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
yles | +21.074 |
hap | +19.192 |
roth | +19.100 |
memorial | +18.759 |
enshr | +18.340 |
Neg logit contributions | |
Attention | -15.735 |
anticipation | -14.388 |
Begin | -12.469 |
ÃÂ | -12.222 |
;;;;;;;; | -12.213 |
Token | . |
Token ID | 13 |
Feature activation | +8.17e+00 |
Pos logit contributions | |
yles | +12.321 |
roth | +10.637 |
hap | +10.268 |
onyms | +9.700 |
estate | +9.555 |
Neg logit contributions | |
Attention | -11.901 |
anticipation | -10.832 |
haste | -9.863 |
hurry | -9.579 |
)", | -9.537 |
Token | In |
Token ID | 554 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
yles | +7.624 |
roth | +6.777 |
hap | +6.361 |
estate | +6.135 |
hood | +6.066 |
Neg logit contributions | |
Attention | -6.164 |
anticipation | -5.841 |
haste | -5.296 |
hurry | -5.119 |
)", | -4.877 |
Token | some |
Token ID | 617 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
Attention | +8.275 |
anticipation | +7.855 |
haste | +6.814 |
Action | +6.564 |
hurry | +6.437 |
Neg logit contributions | |
yles | -10.387 |
roth | -8.942 |
estate | -8.287 |
hap | -8.126 |
heid | -8.004 |
Token | of |
Token ID | 286 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
yles | +10.677 |
roth | +9.202 |
hap | +8.895 |
estate | +8.358 |
memorial | +8.209 |
Neg logit contributions | |
Attention | -10.438 |
anticipation | -8.916 |
Action | -8.023 |
;;;;;;;; | -7.987 |
)", | -7.964 |
Token | when |
Token ID | 618 |
Feature activation | +4.71e+00 |
Pos logit contributions | |
yles | +6.400 |
roth | +5.624 |
hap | +5.138 |
estate | +5.056 |
hood | +5.037 |
Neg logit contributions | |
Attention | -5.939 |
anticipation | -5.278 |
haste | -4.691 |
)", | -4.642 |
hurry | -4.545 |
Token | over |
Token ID | 625 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
yles | +4.119 |
roth | +3.554 |
hap | +3.278 |
estate | +3.193 |
hood | +3.160 |
Neg logit contributions | |
Attention | -4.265 |
anticipation | -3.815 |
haste | -3.453 |
)", | -3.371 |
hurry | -3.357 |
Token | the |
Token ID | 262 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
yles | +9.182 |
roth | +8.306 |
hap | +7.553 |
estate | +7.523 |
hood | +7.452 |
Neg logit contributions | |
Attention | -8.885 |
anticipation | -7.892 |
hurry | -6.984 |
haste | -6.960 |
)", | -6.816 |
Token | cap |
Token ID | 1451 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
yles | +8.423 |
roth | +7.623 |
hap | +6.744 |
hood | +6.674 |
estate | +6.598 |
Neg logit contributions | |
Attention | -9.448 |
anticipation | -8.494 |
)", | -7.627 |
haste | -7.601 |
hurry | -7.483 |
Token | , |
Token ID | 11 |
Feature activation | +2.43e+01 |
Pos logit contributions | |
yles | +13.889 |
roth | +12.527 |
hood | +11.361 |
hap | +11.221 |
estate | +11.134 |
Neg logit contributions | |
Attention | -12.710 |
anticipation | -11.148 |
)", | -10.230 |
haste | -9.852 |
;;;;;;;; | -9.790 |
Token | functionally |
Token ID | 48410 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
yles | +18.544 |
roth | +16.642 |
outwe | +15.880 |
estate | +15.778 |
enshr | +15.692 |
Neg logit contributions | |
Attention | -14.916 |
anticipation | -12.590 |
)", | -11.963 |
ラン | -11.563 |
;;;;;;;; | -11.420 |
Token | useless |
Token ID | 13894 |
Feature activation | +8.85e+00 |
Pos logit contributions | |
yles | +21.659 |
enshr | +18.841 |
roth | +18.525 |
outwe | +18.359 |
estate | +18.195 |
Neg logit contributions | |
Attention | -17.420 |
anticipation | -14.688 |
ÃÂ | -13.720 |
;;;;;;;; | -13.123 |
)", | -12.994 |
Token | . |
Token ID | 13 |
Feature activation | +8.54e+00 |
Pos logit contributions | |
yles | +7.749 |
roth | +6.772 |
hap | +6.172 |
estate | +6.156 |
hood | +6.141 |
Neg logit contributions | |
Attention | -7.523 |
anticipation | -6.735 |
)", | -6.139 |
haste | -6.060 |
hurry | -5.870 |
Token |
|
Token ID | 198 |
Feature activation | +7.38e-01 |
Pos logit contributions | |
yles | +7.316 |
roth | +6.398 |
hap | +5.802 |
hood | +5.801 |
estate | +5.788 |
Neg logit contributions | |
Attention | -6.994 |
anticipation | -6.674 |
haste | -6.163 |
hurry | -5.912 |
)", | -5.836 |
Token |
|
Token ID | 198 |
Feature activation | +6.65e+00 |
Pos logit contributions | |
yles | +0.570 |
roth | +0.484 |
hap | +0.443 |
estate | +0.427 |
heid | +0.410 |
Neg logit contributions | |
Attention | -0.766 |
anticipation | -0.706 |
haste | -0.643 |
hurry | -0.628 |
Action | -0.622 |
Token | The |
Token ID | 464 |
Feature activation | +7.29e+00 |
Pos logit contributions | |
yles | +6.002 |
roth | +5.376 |
hap | +4.983 |
estate | +4.944 |
hood | +4.808 |
Neg logit contributions | |
Attention | -5.713 |
anticipation | -5.237 |
haste | -4.721 |
hurry | -4.574 |
Action | -4.433 |
Token |
|
Token ID | 198 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
yles | +6.068 |
roth | +5.336 |
hap | +4.889 |
estate | +4.732 |
heid | +4.635 |
Neg logit contributions | |
Attention | -6.817 |
anticipation | -6.435 |
haste | -5.808 |
hurry | -5.664 |
)", | -5.475 |
Token |
|
Token ID | 198 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
Attention | +1.233 |
anticipation | +1.130 |
haste | +1.026 |
Action | +0.998 |
hurry | +0.997 |
Neg logit contributions | |
yles | -0.990 |
roth | -0.841 |
hap | -0.775 |
estate | -0.749 |
onyms | -0.714 |
Token | So |
Token ID | 2396 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
yles | +1.022 |
roth | +0.898 |
hap | +0.839 |
estate | +0.816 |
heid | +0.790 |
Neg logit contributions | |
Attention | -0.922 |
anticipation | -0.836 |
haste | -0.745 |
hurry | -0.723 |
Action | -0.714 |
Token | , |
Token ID | 11 |
Feature activation | -4.69e+00 |
Pos logit contributions | |
Attention | +1.470 |
anticipation | +1.328 |
haste | +1.174 |
hurry | +1.143 |
Action | +1.132 |
Neg logit contributions | |
yles | -1.762 |
roth | -1.550 |
hap | -1.452 |
estate | -1.421 |
heid | -1.371 |
Token | after |
Token ID | 706 |
Feature activation | +2.09e+01 |
Pos logit contributions | |
Attention | +3.851 |
anticipation | +3.483 |
haste | +3.069 |
hurry | +3.004 |
Action | +2.976 |
Neg logit contributions | |
yles | -4.653 |
roth | -4.073 |
hap | -3.816 |
estate | -3.725 |
heid | -3.616 |
Token | almost |
Token ID | 2048 |
Feature activation | +3.04e+01 |
Pos logit contributions | |
yles | +16.690 |
roth | +15.052 |
hap | +14.291 |
hood | +13.939 |
memorial | +13.710 |
Neg logit contributions | |
Attention | -13.193 |
anticipation | -10.861 |
)", | -10.434 |
haste | -10.326 |
;;;;;;;; | -9.981 |
Token | a |
Token ID | 257 |
Feature activation | +1.98e+01 |
Pos logit contributions | |
yles | +18.765 |
hood | +17.292 |
roth | +17.223 |
memorial | +16.490 |
Memorial | +16.209 |
Neg logit contributions | |
Attention | -18.430 |
ÃÂ | -15.159 |
;;;;;;;; | -14.355 |
anticipation | -14.239 |
)=( | -14.158 |
Token | week |
Token ID | 1285 |
Feature activation | -5.57e+00 |
Pos logit contributions | |
yles | +12.022 |
roth | +9.848 |
hap | +9.202 |
hood | +8.970 |
memorial | +8.768 |
Neg logit contributions | |
Attention | -17.895 |
anticipation | -15.593 |
)", | -14.562 |
haste | -14.543 |
;;;;;;;; | -14.511 |
Token | of |
Token ID | 286 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
Attention | +4.268 |
anticipation | +3.950 |
haste | +3.411 |
Action | +3.295 |
hurry | +3.280 |
Neg logit contributions | |
yles | -5.670 |
roth | -5.015 |
hap | -4.765 |
estate | -4.664 |
heid | -4.432 |
Token | researching |
Token ID | 24114 |
Feature activation | +4.22e+00 |
Pos logit contributions | |
Attention | +4.369 |
anticipation | +4.112 |
haste | +3.576 |
Action | +3.471 |
hurry | +3.469 |
Neg logit contributions | |
yles | -4.584 |
roth | -3.977 |
hap | -3.745 |
estate | -3.661 |
heid | -3.521 |
Token | , |
Token ID | 11 |
Feature activation | +6.32e+00 |
Pos logit contributions | |
yles | +4.107 |
roth | +3.605 |
hap | +3.382 |
estate | +3.282 |
hood | +3.219 |
Neg logit contributions | |
Attention | -3.406 |
anticipation | -3.041 |
haste | -2.727 |
hurry | -2.636 |
)", | -2.624 |
Token | relatively |
Token ID | 5365 |
Feature activation | +5.42e+00 |
Pos logit contributions | |
yles | +4.295 |
roth | +3.764 |
hap | +3.564 |
estate | +3.453 |
hood | +3.382 |
Neg logit contributions | |
Attention | -3.778 |
anticipation | -3.349 |
haste | -3.015 |
hurry | -2.907 |
)", | -2.861 |
Token | morph |
Token ID | 17488 |
Feature activation | +8.70e+00 |
Pos logit contributions | |
yles | +5.131 |
roth | +4.418 |
hap | +4.195 |
estate | +4.081 |
hood | +3.995 |
Neg logit contributions | |
Attention | -4.590 |
anticipation | -4.053 |
haste | -3.631 |
hurry | -3.517 |
Action | -3.465 |
Token | ologically |
Token ID | 13437 |
Feature activation | +3.00e+00 |
Pos logit contributions | |
yles | +3.982 |
roth | +2.845 |
hap | +2.412 |
estate | +2.258 |
onyms | +2.199 |
Neg logit contributions | |
Attention | -11.626 |
anticipation | -10.788 |
haste | -10.207 |
hurry | -9.901 |
Action | -9.820 |
Token | unchanged |
Token ID | 21588 |
Feature activation | +2.88e+00 |
Pos logit contributions | |
yles | +2.892 |
roth | +2.530 |
hap | +2.390 |
estate | +2.304 |
heid | +2.253 |
Neg logit contributions | |
Attention | -2.530 |
anticipation | -2.258 |
haste | -2.022 |
hurry | -1.950 |
Action | -1.921 |
Token | for |
Token ID | 329 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
yles | +2.961 |
roth | +2.624 |
hap | +2.486 |
estate | +2.404 |
heid | +2.353 |
Neg logit contributions | |
Attention | -2.230 |
anticipation | -1.979 |
haste | -1.748 |
hurry | -1.682 |
Action | -1.657 |
Token | over |
Token ID | 625 |
Feature activation | +2.98e+01 |
Pos logit contributions | |
yles | +13.029 |
roth | +11.215 |
hap | +10.797 |
hood | +10.382 |
estate | +10.209 |
Neg logit contributions | |
Attention | -13.015 |
anticipation | -11.566 |
haste | -10.729 |
;;;;;;;; | -10.602 |
)", | -10.413 |
Token | a |
Token ID | 257 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
yles | +17.775 |
hap | +15.371 |
roth | +15.333 |
heid | +14.511 |
hood | +14.446 |
Neg logit contributions | |
Attention | -19.635 |
anticipation | -17.266 |
;;;;;;;; | -16.075 |
haste | -15.956 |
)", | -15.305 |
Token | million |
Token ID | 1510 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
yles | +7.965 |
roth | +6.463 |
hap | +6.255 |
oles | +5.675 |
heid | +5.631 |
Neg logit contributions | |
Attention | -12.301 |
anticipation | -11.098 |
haste | -10.344 |
Action | -9.925 |
)", | -9.911 |
Token | years |
Token ID | 812 |
Feature activation | +5.45e+00 |
Pos logit contributions | |
yles | +5.635 |
roth | +4.348 |
hap | +4.093 |
heid | +3.633 |
hood | +3.525 |
Neg logit contributions | |
Attention | -13.165 |
anticipation | -12.025 |
haste | -11.334 |
hurry | -11.050 |
;;;;;;;; | -10.915 |
Token | . |
Token ID | 13 |
Feature activation | -5.33e+00 |
Pos logit contributions | |
yles | +5.320 |
roth | +4.712 |
hap | +4.451 |
estate | +4.271 |
heid | +4.230 |
Neg logit contributions | |
Attention | -4.395 |
anticipation | -3.914 |
haste | -3.511 |
hurry | -3.383 |
)", | -3.302 |
Token | By |
Token ID | 2750 |
Feature activation | +4.60e+00 |
Pos logit contributions | |
Attention | +4.345 |
anticipation | +3.799 |
Action | +3.362 |
haste | +3.275 |
)", | +3.165 |
Neg logit contributions | |
yles | -5.348 |
roth | -4.713 |
hap | -4.414 |
estate | -4.356 |
onyms | -4.191 |
Token | didn |
Token ID | 1422 |
Feature activation | -9.26e+00 |
Pos logit contributions | |
yles | +5.232 |
roth | +4.540 |
hap | +4.283 |
estate | +4.129 |
hood | +4.104 |
Neg logit contributions | |
Attention | -5.052 |
anticipation | -4.552 |
haste | -4.049 |
)", | -3.925 |
hurry | -3.902 |
Token | 't |
Token ID | 470 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
Attention | +3.435 |
anticipation | +2.632 |
)", | +1.911 |
Action | +1.888 |
haste | +1.785 |
Neg logit contributions | |
yles | -12.861 |
roth | -11.623 |
hap | -11.205 |
estate | -11.065 |
detrim | -10.993 |
Token | get |
Token ID | 651 |
Feature activation | -6.16e+00 |
Pos logit contributions | |
yles | +10.336 |
roth | +8.989 |
hap | +8.782 |
hood | +8.345 |
memorial | +8.214 |
Neg logit contributions | |
Attention | -11.106 |
anticipation | -10.001 |
;;;;;;;; | -8.902 |
ラン | -8.706 |
haste | -8.602 |
Token | to |
Token ID | 284 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
Attention | +4.772 |
anticipation | +4.212 |
haste | +3.717 |
hurry | +3.597 |
Action | +3.590 |
Neg logit contributions | |
yles | -6.339 |
roth | -5.701 |
estate | -5.265 |
hap | -5.251 |
heid | -5.016 |
Token | know |
Token ID | 760 |
Feature activation | -7.79e+00 |
Pos logit contributions | |
yles | +11.334 |
roth | +10.206 |
hap | +9.725 |
hood | +9.350 |
heid | +9.170 |
Neg logit contributions | |
Attention | -8.917 |
anticipation | -8.099 |
haste | -6.901 |
;;;;;;;; | -6.823 |
)", | -6.726 |
Token | him |
Token ID | 683 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
Attention | +3.564 |
anticipation | +2.947 |
haste | +2.313 |
Action | +2.217 |
hurry | +2.200 |
Neg logit contributions | |
yles | -10.207 |
roth | -9.444 |
hap | -8.941 |
estate | -8.860 |
onyms | -8.551 |
Token | missed |
Token ID | 6825 |
Feature activation | -7.99e+00 |
Pos logit contributions | |
yles | +18.937 |
hood | +17.168 |
hap | +16.473 |
roth | +16.468 |
memorial | +16.420 |
Neg logit contributions | |
Attention | -18.926 |
anticipation | -16.190 |
ラン | -15.670 |
)=( | -15.117 |
ÃÂ | -14.851 |
Token | out |
Token ID | 503 |
Feature activation | +7.48e+00 |
Pos logit contributions | |
Attention | +5.068 |
anticipation | +4.371 |
haste | +3.670 |
Action | +3.622 |
hurry | +3.508 |
Neg logit contributions | |
yles | -9.095 |
roth | -8.211 |
estate | -7.802 |
hap | -7.538 |
heid | -7.448 |
Token | on |
Token ID | 319 |
Feature activation | +7.28e+00 |
Pos logit contributions | |
yles | +6.942 |
roth | +6.168 |
hap | +5.845 |
hood | +5.557 |
estate | +5.515 |
Neg logit contributions | |
Attention | -6.262 |
anticipation | -5.527 |
haste | -4.952 |
)", | -4.781 |
hurry | -4.754 |
Token | a |
Token ID | 257 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
yles | +8.195 |
roth | +7.356 |
hap | +7.079 |
hood | +6.817 |
estate | +6.729 |
Neg logit contributions | |
Attention | -4.487 |
anticipation | -3.840 |
haste | -3.336 |
)", | -3.184 |
hurry | -3.167 |
Token | wonderful |
Token ID | 7932 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
yles | +11.391 |
roth | +9.719 |
hap | +9.388 |
hood | +9.258 |
memorial | +9.077 |
Neg logit contributions | |
Attention | -11.139 |
anticipation | -9.762 |
)", | -8.823 |
haste | -8.685 |
)=( | -8.503 |
Token | Being |
Token ID | 11204 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
yles | +9.513 |
roth | +8.356 |
hap | +7.867 |
hood | +7.559 |
heid | +7.483 |
Neg logit contributions | |
Attention | -8.521 |
anticipation | -8.049 |
haste | -7.494 |
hurry | -7.253 |
)", | -7.108 |
Token | on |
Token ID | 319 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
yles | +13.987 |
roth | +12.694 |
hap | +11.633 |
enshr | +11.314 |
estate | +11.296 |
Neg logit contributions | |
Attention | -11.677 |
anticipation | -10.181 |
haste | -9.201 |
)", | -8.878 |
;;;;;;;; | -8.702 |
Token | the |
Token ID | 262 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
yles | +15.643 |
roth | +13.827 |
hap | +13.343 |
ods | +12.934 |
estate | +12.723 |
Neg logit contributions | |
Attention | -13.098 |
anticipation | -11.534 |
)", | -10.227 |
;;;;;;;; | -10.161 |
haste | -9.964 |
Token | sidelines |
Token ID | 29394 |
Feature activation | +2.06e+01 |
Pos logit contributions | |
yles | +10.152 |
roth | +8.978 |
hap | +8.366 |
ods | +8.120 |
estate | +8.092 |
Neg logit contributions | |
Attention | -9.290 |
anticipation | -8.191 |
)", | -7.449 |
haste | -7.427 |
;;;;;;;; | -7.210 |
Token | and |
Token ID | 290 |
Feature activation | +8.15e+00 |
Pos logit contributions | |
yles | +15.330 |
roth | +13.227 |
hap | +13.161 |
outwe | +12.812 |
hood | +12.702 |
Neg logit contributions | |
Attention | -14.862 |
anticipation | -12.275 |
ラン | -11.498 |
Begin | -11.300 |
haste | -11.278 |
Token | not |
Token ID | 407 |
Feature activation | +2.90e+01 |
Pos logit contributions | |
yles | +7.839 |
roth | +6.909 |
hap | +6.576 |
hood | +6.292 |
estate | +6.264 |
Neg logit contributions | |
Attention | -6.238 |
anticipation | -5.355 |
haste | -4.883 |
hurry | -4.652 |
Action | -4.645 |
Token | being |
Token ID | 852 |
Feature activation | +2.25e+01 |
Pos logit contributions | |
yles | +19.124 |
priv | +17.377 |
roth | +17.287 |
hood | +17.116 |
memorial | +16.913 |
Neg logit contributions | |
Attention | -16.956 |
anticipation | -13.500 |
ÃÂ | -13.203 |
haste | -13.152 |
ラン | -13.080 |
Token | able |
Token ID | 1498 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
yles | +15.821 |
roth | +14.408 |
priv | +13.941 |
hood | +13.677 |
memorial | +13.659 |
Neg logit contributions | |
Attention | -15.033 |
anticipation | -13.024 |
ラン | -12.067 |
haste | -11.982 |
ÃÂ | -11.968 |
Token | to |
Token ID | 284 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
yles | +10.285 |
roth | +8.922 |
hood | +8.109 |
hap | +8.076 |
ods | +7.584 |
Neg logit contributions | |
Attention | -19.052 |
anticipation | -17.277 |
ÃÂ | -16.172 |
;;;;;;;; | -15.738 |
haste | -15.520 |
Token | do |
Token ID | 466 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
yles | +12.480 |
roth | +11.442 |
hap | +10.730 |
memorial | +10.474 |
hood | +10.413 |
Neg logit contributions | |
Attention | -8.756 |
anticipation | -7.301 |
haste | -6.386 |
;;;;;;;; | -6.197 |
)", | -6.095 |
Token | anything |
Token ID | 1997 |
Feature activation | +9.77e-01 |
Pos logit contributions | |
yles | +8.784 |
roth | +7.576 |
hap | +7.214 |
estate | +6.860 |
hood | +6.838 |
Neg logit contributions | |
Attention | -8.267 |
anticipation | -7.425 |
haste | -6.685 |
)", | -6.503 |
hurry | -6.503 |
Token | . |
Token ID | 13 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
yles | +2.072 |
roth | +1.824 |
hap | +1.705 |
estate | +1.652 |
hood | +1.607 |
Neg logit contributions | |
Attention | -1.868 |
anticipation | -1.687 |
haste | -1.504 |
hurry | -1.455 |
Action | -1.438 |
Token |
|
Token ID | 198 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
yles | +11.240 |
roth | +9.917 |
hood | +9.123 |
hap | +9.042 |
estate | +8.823 |
Neg logit contributions | |
Attention | -10.569 |
anticipation | -10.464 |
haste | -9.983 |
hurry | -9.439 |
)", | -9.191 |
Token |
|
Token ID | 198 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
yles | +1.400 |
roth | +1.191 |
hap | +1.086 |
estate | +1.042 |
hood | +1.007 |
Neg logit contributions | |
Attention | -1.979 |
anticipation | -1.830 |
haste | -1.669 |
hurry | -1.633 |
Action | -1.608 |
Token | Twitter |
Token ID | 14254 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
yles | +9.580 |
roth | +8.632 |
hap | +8.097 |
estate | +7.990 |
hood | +7.981 |
Neg logit contributions | |
Attention | -10.284 |
anticipation | -9.550 |
haste | -8.820 |
hurry | -8.661 |
ÃÂ | -8.194 |
Token | was |
Token ID | 373 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
yles | +10.850 |
roth | +9.672 |
hap | +8.987 |
estate | +8.789 |
hood | +8.682 |
Neg logit contributions | |
Attention | -9.788 |
anticipation | -8.944 |
)", | -8.145 |
haste | -8.069 |
hurry | -7.722 |
Token | deemed |
Token ID | 10762 |
Feature activation | +2.90e+01 |
Pos logit contributions | |
yles | +13.077 |
roth | +12.319 |
hap | +11.493 |
hood | +11.084 |
estate | +11.062 |
Neg logit contributions | |
Attention | -10.947 |
anticipation | -9.821 |
)", | -8.719 |
;;;;;;;; | -8.580 |
haste | -8.499 |
Token | cooler |
Token ID | 19346 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
yles | +19.365 |
roth | +17.810 |
hood | +17.449 |
hap | +17.225 |
tops | +16.467 |
Neg logit contributions | |
Attention | -15.353 |
anticipation | -14.222 |
)", | -12.936 |
Begin | -12.516 |
ラン | -12.337 |
Token | than |
Token ID | 621 |
Feature activation | +4.62e+00 |
Pos logit contributions | |
yles | +10.273 |
roth | +9.225 |
hap | +8.564 |
hood | +8.239 |
estate | +8.230 |
Neg logit contributions | |
Attention | -10.228 |
anticipation | -9.033 |
)", | -8.492 |
haste | -8.274 |
;;;;;;;; | -7.940 |
Token | in |
Token ID | 287 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
yles | +4.597 |
roth | +4.055 |
hap | +3.826 |
estate | +3.683 |
hood | +3.649 |
Neg logit contributions | |
Attention | -3.629 |
anticipation | -3.213 |
haste | -2.865 |
)", | -2.752 |
hurry | -2.752 |
Token | the |
Token ID | 262 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
yles | +0.318 |
roth | +0.282 |
hap | +0.265 |
estate | +0.259 |
heid | +0.251 |
Neg logit contributions | |
Attention | -0.239 |
anticipation | -0.214 |
haste | -0.188 |
hurry | -0.181 |
Action | -0.180 |
Token | past |
Token ID | 1613 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
yles | +9.492 |
roth | +8.433 |
hap | +7.843 |
hood | +7.440 |
oles | +7.178 |
Neg logit contributions | |
Attention | -10.629 |
anticipation | -9.443 |
)", | -8.764 |
haste | -8.552 |
;;;;;;;; | -8.539 |
Token | � |
Token ID | 447 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
Attention | +2.864 |
anticipation | +2.278 |
haste | +1.677 |
)", | +1.600 |
Action | +1.588 |
Neg logit contributions | |
yles | -10.109 |
roth | -9.079 |
hap | -8.708 |
estate | -8.581 |
onyms | -8.483 |
Token | � |
Token ID | 247 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
Attention | +1.397 |
anticipation | +1.262 |
haste | +1.107 |
hurry | +1.076 |
Action | +1.066 |
Neg logit contributions | |
yles | -1.670 |
roth | -1.476 |
hap | -1.378 |
estate | -1.342 |
heid | -1.316 |
Token | t |
Token ID | 83 |
Feature activation | +1.87e+01 |
Pos logit contributions | |
Attention | +1.093 |
anticipation | +1.007 |
haste | +0.902 |
hurry | +0.885 |
Action | +0.875 |
Neg logit contributions | |
yles | -0.950 |
roth | -0.814 |
hap | -0.753 |
estate | -0.727 |
heid | -0.708 |
Token | seem |
Token ID | 1283 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
yles | +13.657 |
roth | +12.545 |
hap | +12.169 |
estate | +11.029 |
hood | +10.998 |
Neg logit contributions | |
Attention | -15.374 |
anticipation | -13.076 |
ラン | -11.832 |
haste | -11.690 |
;;;;;;;; | -11.375 |
Token | to |
Token ID | 284 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
yles | +20.257 |
roth | +19.427 |
hap | +17.839 |
hood | +17.581 |
outwe | +17.495 |
Neg logit contributions | |
Attention | -19.337 |
anticipation | -16.353 |
)", | -15.264 |
ラン | -14.619 |
haste | -14.547 |
Token | be |
Token ID | 307 |
Feature activation | +2.89e+01 |
Pos logit contributions | |
yles | +13.266 |
roth | +12.270 |
hap | +11.544 |
estate | +10.641 |
hood | +10.532 |
Neg logit contributions | |
Attention | -15.487 |
anticipation | -13.293 |
haste | -12.006 |
ラン | -11.915 |
Action | -11.867 |
Token | significantly |
Token ID | 5566 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
yles | +19.544 |
roth | +18.636 |
hood | +17.290 |
outwe | +17.268 |
estate | +17.206 |
Neg logit contributions | |
Attention | -17.509 |
anticipation | -14.348 |
ラン | -13.811 |
haste | -13.501 |
Begin | -13.365 |
Token | better |
Token ID | 1365 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
yles | +13.555 |
roth | +12.281 |
hood | +11.730 |
outwe | +11.696 |
hap | +11.390 |
Neg logit contributions | |
Attention | -13.487 |
anticipation | -11.370 |
haste | -10.463 |
ラン | -10.102 |
Begin | -10.069 |
Token | as |
Token ID | 355 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
yles | +2.110 |
roth | +1.852 |
hap | +1.719 |
estate | +1.670 |
hood | +1.612 |
Neg logit contributions | |
Attention | -2.117 |
anticipation | -1.907 |
haste | -1.726 |
hurry | -1.667 |
Action | -1.658 |
Token | Domin |
Token ID | 11817 |
Feature activation | +7.44e+00 |
Pos logit contributions | |
yles | +10.403 |
roth | +9.293 |
hap | +8.487 |
hood | +8.130 |
estate | +8.116 |
Neg logit contributions | |
Attention | -10.324 |
anticipation | -8.936 |
haste | -8.346 |
)", | -8.064 |
hurry | -8.024 |
Token | ik |
Token ID | 1134 |
Feature activation | +6.26e+00 |
Pos logit contributions | |
yles | +5.211 |
roth | +4.501 |
hap | +4.040 |
hood | +3.845 |
estate | +3.803 |
Neg logit contributions | |
Attention | -7.921 |
anticipation | -7.256 |
haste | -6.819 |
hurry | -6.586 |
Action | -6.462 |
Token | He |
Token ID | 679 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
Attention | +4.835 |
anticipation | +4.172 |
Action | +3.674 |
haste | +3.515 |
hurry | +3.417 |
Neg logit contributions | |
yles | -6.923 |
roth | -6.103 |
hap | -5.756 |
estate | -5.744 |
onyms | -5.519 |
Token | � |
Token ID | 447 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
yles | +1.430 |
roth | +1.259 |
hap | +1.173 |
estate | +1.138 |
heid | +1.105 |
Neg logit contributions | |
Attention | -1.275 |
anticipation | -1.148 |
haste | -1.021 |
hurry | -0.988 |
Action | -0.978 |
Token | � |
Token ID | 247 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
Attention | +2.072 |
anticipation | +1.872 |
haste | +1.657 |
hurry | +1.602 |
Action | +1.591 |
Neg logit contributions | |
yles | -2.459 |
roth | -2.158 |
hap | -2.019 |
estate | -1.966 |
heid | -1.913 |
Token | s |
Token ID | 82 |
Feature activation | +5.86e+00 |
Pos logit contributions | |
Attention | +2.158 |
anticipation | +1.956 |
haste | +1.730 |
hurry | +1.676 |
Action | +1.665 |
Neg logit contributions | |
yles | -2.483 |
roth | -2.182 |
hap | -2.045 |
estate | -1.993 |
heid | -1.941 |
Token | quite |
Token ID | 2407 |
Feature activation | +7.24e+00 |
Pos logit contributions | |
yles | +5.535 |
roth | +4.913 |
hap | +4.607 |
estate | +4.420 |
hood | +4.372 |
Neg logit contributions | |
Attention | -4.796 |
anticipation | -4.264 |
haste | -3.767 |
)", | -3.657 |
hurry | -3.649 |
Token | possibly |
Token ID | 5457 |
Feature activation | +2.88e+01 |
Pos logit contributions | |
yles | +6.616 |
roth | +5.953 |
hap | +5.618 |
estate | +5.326 |
hood | +5.294 |
Neg logit contributions | |
Attention | -5.956 |
anticipation | -5.260 |
haste | -4.672 |
hurry | -4.581 |
Action | -4.577 |
Token | the |
Token ID | 262 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
yles | +20.069 |
roth | +18.024 |
hap | +17.449 |
hood | +17.361 |
enshr | +17.144 |
Neg logit contributions | |
Attention | -16.464 |
anticipation | -14.334 |
)", | -13.086 |
haste | -12.968 |
ラン | -12.694 |
Token | best |
Token ID | 1266 |
Feature activation | -9.46e+00 |
Pos logit contributions | |
yles | +9.439 |
roth | +8.278 |
hap | +7.524 |
hood | +7.147 |
ods | +7.123 |
Neg logit contributions | |
Attention | -11.003 |
anticipation | -9.861 |
haste | -9.050 |
)", | -8.967 |
;;;;;;;; | -8.736 |
Token | in |
Token ID | 287 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
Attention | +8.268 |
anticipation | +7.746 |
haste | +6.888 |
hurry | +6.781 |
Action | +6.659 |
Neg logit contributions | |
yles | -8.228 |
roth | -7.157 |
hap | -6.792 |
estate | -6.605 |
onyms | -6.540 |
Token | baseball |
Token ID | 9283 |
Feature activation | -6.78e+00 |
Pos logit contributions | |
Attention | +2.868 |
anticipation | +2.616 |
haste | +2.287 |
hurry | +2.202 |
Action | +2.200 |
Neg logit contributions | |
yles | -3.695 |
roth | -3.286 |
hap | -3.056 |
estate | -3.023 |
heid | -2.951 |
Token | at |
Token ID | 379 |
Feature activation | -5.78e+00 |
Pos logit contributions | |
Attention | +5.376 |
anticipation | +4.954 |
haste | +4.290 |
hurry | +4.213 |
Action | +4.178 |
Neg logit contributions | |
yles | -6.680 |
roth | -5.858 |
hap | -5.462 |
estate | -5.333 |
heid | -5.222 |
Token | ` |
Token ID | 63 |
Feature activation | +2.45e+00 |
Pos logit contributions | |
yles | +0.395 |
roth | +0.358 |
hap | +0.341 |
estate | +0.334 |
heid | +0.327 |
Neg logit contributions | |
Attention | -0.172 |
anticipation | -0.147 |
haste | -0.120 |
hurry | -0.113 |
Action | -0.111 |
Token | Vi |
Token ID | 38432 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
yles | +2.320 |
roth | +2.050 |
hap | +1.904 |
estate | +1.860 |
hood | +1.795 |
Neg logit contributions | |
Attention | -2.104 |
anticipation | -1.894 |
haste | -1.692 |
hurry | -1.637 |
Action | -1.621 |
Token | team |
Token ID | 1074 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
yles | +9.009 |
roth | +8.089 |
hap | +7.446 |
estate | +7.145 |
hood | +7.103 |
Neg logit contributions | |
Attention | -8.821 |
anticipation | -7.859 |
haste | -7.011 |
)", | -6.895 |
hurry | -6.744 |
Token | fresh |
Token ID | 4713 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
yles | +9.038 |
roth | +8.065 |
hap | +7.487 |
estate | +7.178 |
hood | +7.142 |
Neg logit contributions | |
Attention | -8.786 |
anticipation | -7.762 |
haste | -6.903 |
)", | -6.731 |
hurry | -6.680 |
Token | off |
Token ID | 572 |
Feature activation | +3.29e+01 |
Pos logit contributions | |
Attention | +0.733 |
anticipation | +0.641 |
haste | +0.538 |
hurry | +0.512 |
Action | +0.508 |
Neg logit contributions | |
yles | -1.387 |
roth | -1.249 |
hap | -1.186 |
estate | -1.162 |
heid | -1.131 |
Token | of |
Token ID | 286 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
yles | +21.159 |
roth | +20.129 |
ebin | +18.024 |
hap | +18.016 |
Memorial | +17.886 |
Neg logit contributions | |
Attention | -17.616 |
anticipation | -14.539 |
haste | -13.429 |
)", | -13.300 |
hurry | -13.149 |
Token | travel |
Token ID | 3067 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
yles | +19.427 |
roth | +18.272 |
hap | +17.111 |
acles | +16.578 |
ods | +16.562 |
Neg logit contributions | |
Attention | -16.363 |
anticipation | -13.850 |
haste | -12.971 |
hurry | -12.463 |
)", | -12.323 |
Token | from |
Token ID | 422 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
yles | +11.408 |
roth | +10.019 |
hap | +9.177 |
estate | +9.004 |
hood | +8.943 |
Neg logit contributions | |
Attention | -10.892 |
anticipation | -9.394 |
)", | -8.610 |
haste | -8.421 |
hurry | -8.297 |
Token | Down |
Token ID | 5588 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
yles | +14.558 |
roth | +13.324 |
hap | +12.483 |
oles | +12.089 |
hood | +11.975 |
Neg logit contributions | |
Attention | -10.619 |
anticipation | -8.920 |
haste | -8.214 |
)", | -7.986 |
Begin | -7.633 |
Token | Under |
Token ID | 4698 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
yles | +9.855 |
roth | +8.692 |
hap | +8.167 |
heid | +7.954 |
estate | +7.768 |
Neg logit contributions | |
Attention | -9.374 |
anticipation | -8.508 |
haste | -7.891 |
hurry | -7.387 |
)", | -7.349 |
Token | ? |
Token ID | 30 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
yles | +12.057 |
roth | +10.810 |
hap | +10.069 |
hood | +9.677 |
heid | +9.629 |
Neg logit contributions | |
Attention | -11.130 |
anticipation | -10.015 |
haste | -9.084 |
)", | -9.014 |
hurry | -8.577 |
Token | being |
Token ID | 852 |
Feature activation | -3.18e+00 |
Pos logit contributions | |
Attention | +7.474 |
anticipation | +6.939 |
directed | +6.217 |
haste | +6.198 |
Action | +5.948 |
Neg logit contributions | |
yles | -8.850 |
roth | -8.038 |
hap | -7.310 |
estate | -7.250 |
onyms | -7.020 |
Token | planned |
Token ID | 6027 |
Feature activation | -2.67e+00 |
Pos logit contributions | |
Attention | +2.346 |
anticipation | +2.111 |
haste | +1.850 |
hurry | +1.782 |
Action | +1.756 |
Neg logit contributions | |
yles | -3.386 |
roth | -3.040 |
hap | -2.842 |
estate | -2.781 |
onyms | -2.716 |
Token | and |
Token ID | 290 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
Attention | +2.198 |
anticipation | +1.995 |
haste | +1.762 |
hurry | +1.707 |
Action | +1.703 |
Neg logit contributions | |
yles | -2.623 |
roth | -2.310 |
hap | -2.158 |
estate | -2.109 |
heid | -2.042 |
Token | the |
Token ID | 262 |
Feature activation | -7.60e+00 |
Pos logit contributions | |
Attention | +8.251 |
anticipation | +7.534 |
haste | +6.760 |
Action | +6.586 |
directed | +6.434 |
Neg logit contributions | |
yles | -10.204 |
roth | -9.195 |
hap | -8.459 |
estate | -8.430 |
heid | -8.059 |
Token | investigation |
Token ID | 3645 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
Attention | +6.676 |
anticipation | +6.200 |
haste | +5.594 |
Action | +5.430 |
hurry | +5.399 |
Neg logit contributions | |
yles | -6.775 |
roth | -5.987 |
hap | -5.561 |
estate | -5.506 |
heid | -5.348 |
Token | had |
Token ID | 550 |
Feature activation | -3.56e+01 |
Pos logit contributions | |
Attention | +9.394 |
anticipation | +8.786 |
haste | +7.920 |
directed | +7.704 |
hurry | +7.664 |
Neg logit contributions | |
yles | -12.193 |
roth | -11.052 |
hap | -10.374 |
estate | -10.034 |
onyms | -9.715 |
Token | been |
Token ID | 587 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
Attention | +18.764 |
anticipation | +17.937 |
directed | +17.569 |
focused | +17.547 |
aimed | +17.169 |
Neg logit contributions | |
yles | -24.734 |
roth | -21.053 |
estate | -19.655 |
heid | -19.133 |
onyms | -19.093 |
Token | priorit |
Token ID | 19086 |
Feature activation | -8.65e+00 |
Pos logit contributions | |
Attention | +9.834 |
anticipation | +9.544 |
directed | +9.050 |
haste | +8.513 |
aimed | +8.429 |
Neg logit contributions | |
yles | -14.644 |
roth | -13.024 |
hap | -12.094 |
onyms | -11.857 |
heid | -11.746 |
Token | ised |
Token ID | 1417 |
Feature activation | -9.47e+00 |
Pos logit contributions | |
Attention | +5.267 |
anticipation | +4.758 |
haste | +3.963 |
Action | +3.941 |
hurry | +3.852 |
Neg logit contributions | |
yles | -9.896 |
roth | -8.751 |
hap | -8.291 |
estate | -8.052 |
heid | -8.037 |
Token | accordingly |
Token ID | 16062 |
Feature activation | -2.41e+00 |
Pos logit contributions | |
Attention | +6.978 |
anticipation | +6.387 |
haste | +5.646 |
hurry | +5.479 |
Action | +5.425 |
Neg logit contributions | |
yles | -9.549 |
roth | -8.450 |
estate | -7.880 |
hap | -7.875 |
heid | -7.601 |
Token | , |
Token ID | 11 |
Feature activation | -9.48e-01 |
Pos logit contributions | |
Attention | +2.082 |
anticipation | +1.879 |
haste | +1.678 |
Action | +1.629 |
hurry | +1.625 |
Neg logit contributions | |
yles | -2.284 |
roth | -2.004 |
hap | -1.861 |
estate | -1.826 |
heid | -1.754 |
Token | his |
Token ID | 465 |
Feature activation | -6.39e+00 |
Pos logit contributions | |
Attention | +11.100 |
anticipation | +10.032 |
Action | +8.885 |
haste | +8.856 |
action | +8.643 |
Neg logit contributions | |
yles | -12.998 |
roth | -11.347 |
hap | -10.582 |
estate | -10.472 |
heid | -10.164 |
Token | first |
Token ID | 717 |
Feature activation | -5.04e+00 |
Pos logit contributions | |
Attention | +5.062 |
anticipation | +4.564 |
haste | +4.018 |
Action | +3.949 |
hurry | +3.902 |
Neg logit contributions | |
yles | -6.447 |
roth | -5.616 |
hap | -5.311 |
estate | -5.182 |
onyms | -4.995 |
Token | programming |
Token ID | 8300 |
Feature activation | -7.60e+00 |
Pos logit contributions | |
Attention | +4.273 |
anticipation | +3.856 |
haste | +3.421 |
Action | +3.376 |
hurry | +3.348 |
Neg logit contributions | |
yles | -4.830 |
roth | -4.249 |
hap | -3.945 |
estate | -3.855 |
onyms | -3.698 |
Token | class |
Token ID | 1398 |
Feature activation | -7.55e-01 |
Pos logit contributions | |
Attention | +5.114 |
anticipation | +4.534 |
haste | +3.930 |
Action | +3.825 |
hurry | +3.800 |
Neg logit contributions | |
yles | -8.366 |
roth | -7.468 |
hap | -7.169 |
estate | -6.935 |
onyms | -6.762 |
Token | ( |
Token ID | 357 |
Feature activation | -8.13e+00 |
Pos logit contributions | |
Attention | +0.647 |
anticipation | +0.585 |
haste | +0.520 |
hurry | +0.505 |
Action | +0.502 |
Neg logit contributions | |
yles | -0.721 |
roth | -0.633 |
hap | -0.592 |
estate | -0.576 |
heid | -0.556 |
Token | in |
Token ID | 259 |
Feature activation | -3.40e+01 |
Pos logit contributions | |
Attention | +7.640 |
anticipation | +7.001 |
haste | +6.301 |
Action | +6.213 |
)", | +6.141 |
Neg logit contributions | |
yles | -6.657 |
roth | -5.591 |
hap | -5.154 |
estate | -4.920 |
heid | -4.783 |
Token | the |
Token ID | 262 |
Feature activation | -1.47e+01 |
Pos logit contributions | |
Attention | +21.736 |
anticipation | +21.502 |
Action | +19.411 |
earnest | +18.805 |
haste | +18.579 |
Neg logit contributions | |
yles | -22.263 |
roth | -18.398 |
estate | -16.760 |
hap | -16.549 |
heid | -15.804 |
Token | wrong |
Token ID | 2642 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
Attention | +11.817 |
anticipation | +10.784 |
Action | +9.770 |
haste | +9.697 |
hurry | +9.419 |
Neg logit contributions | |
yles | -12.872 |
roth | -10.971 |
estate | -10.306 |
hap | -10.161 |
heid | -9.836 |
Token | language |
Token ID | 3303 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
Attention | +11.182 |
anticipation | +10.270 |
hurry | +9.336 |
haste | +9.295 |
Action | +8.802 |
Neg logit contributions | |
yles | -12.364 |
roth | -11.120 |
hap | -10.327 |
estate | -9.820 |
onyms | -9.673 |
Token | !) |
Token ID | 8133 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
Attention | +7.523 |
anticipation | +6.664 |
haste | +5.738 |
)", | +5.691 |
Action | +5.587 |
Neg logit contributions | |
yles | -13.153 |
roth | -11.664 |
hap | -11.204 |
estate | -10.883 |
heid | -10.455 |
Token | to |
Token ID | 284 |
Feature activation | +9.28e+00 |
Pos logit contributions | |
yles | +2.110 |
roth | +1.836 |
hap | +1.696 |
estate | +1.646 |
hood | +1.601 |
Neg logit contributions | |
Attention | -2.188 |
anticipation | -1.990 |
haste | -1.795 |
hurry | -1.742 |
)", | -1.718 |
Token | of |
Token ID | 286 |
Feature activation | -2.54e+00 |
Pos logit contributions | |
yles | +6.449 |
roth | +5.463 |
hap | +5.085 |
estate | +4.976 |
hood | +4.961 |
Neg logit contributions | |
Attention | -6.347 |
anticipation | -5.647 |
haste | -5.116 |
hurry | -4.986 |
)", | -4.976 |
Token | gun |
Token ID | 2485 |
Feature activation | +3.95e+00 |
Pos logit contributions | |
Attention | +2.006 |
anticipation | +1.816 |
haste | +1.595 |
hurry | +1.544 |
Action | +1.533 |
Neg logit contributions | |
yles | -2.579 |
roth | -2.301 |
hap | -2.151 |
estate | -2.099 |
heid | -2.036 |
Token | owners |
Token ID | 4393 |
Feature activation | +3.28e+00 |
Pos logit contributions | |
yles | +3.096 |
roth | +2.597 |
hap | +2.364 |
estate | +2.298 |
hood | +2.268 |
Neg logit contributions | |
Attention | -4.051 |
anticipation | -3.678 |
haste | -3.358 |
hurry | -3.278 |
)", | -3.243 |
Token | — |
Token ID | 960 |
Feature activation | -4.25e+00 |
Pos logit contributions | |
yles | +3.058 |
roth | +2.668 |
hap | +2.497 |
estate | +2.419 |
hood | +2.385 |
Neg logit contributions | |
Attention | -2.873 |
anticipation | -2.569 |
haste | -2.306 |
hurry | -2.230 |
Action | -2.200 |
Token | it |
Token ID | 270 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
Attention | +4.176 |
anticipation | +3.870 |
haste | +3.509 |
Action | +3.412 |
hurry | +3.386 |
Neg logit contributions | |
yles | -3.452 |
roth | -2.903 |
hap | -2.667 |
estate | -2.546 |
heid | -2.486 |
Token | has |
Token ID | 468 |
Feature activation | -3.36e+01 |
Pos logit contributions | |
Attention | +12.519 |
anticipation | +12.511 |
directed | +12.052 |
aimed | +11.513 |
action | +11.490 |
Neg logit contributions | |
yles | -15.207 |
roth | -13.088 |
hap | -11.899 |
ebin | -11.783 |
estate | -11.733 |
Token | expanded |
Token ID | 9902 |
Feature activation | +2.73e+00 |
Pos logit contributions | |
directed | +22.640 |
aimed | +21.593 |
Attention | +21.290 |
anticipation | +20.865 |
action | +20.796 |
Neg logit contributions | |
yles | -19.553 |
roth | -16.214 |
onyms | -14.873 |
ulia | -14.416 |
estate | -14.238 |
Token | them |
Token ID | 606 |
Feature activation | +8.19e+00 |
Pos logit contributions | |
yles | +2.726 |
roth | +2.384 |
hap | +2.252 |
estate | +2.192 |
hood | +2.145 |
Neg logit contributions | |
Attention | -2.209 |
anticipation | -1.968 |
haste | -1.740 |
hurry | -1.694 |
)", | -1.667 |
Token | , |
Token ID | 11 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
yles | +6.864 |
roth | +5.854 |
hap | +5.548 |
hood | +5.388 |
estate | +5.341 |
Neg logit contributions | |
Attention | -7.580 |
anticipation | -6.661 |
haste | -6.037 |
)", | -5.916 |
hurry | -5.897 |
Token | including |
Token ID | 1390 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
Attention | +13.940 |
anticipation | +13.541 |
directed | +12.863 |
haste | +12.383 |
aimed | +12.341 |
Neg logit contributions | |
yles | -12.560 |
roth | -11.042 |
hap | -9.747 |
estate | -9.507 |
onyms | -9.404 |
Token | allowing |
Token ID | 5086 |
Feature activation | -4.32e+00 |
Pos logit contributions | |
yles | +2.291 |
roth | +1.997 |
hap | +1.879 |
estate | +1.831 |
hood | +1.778 |
Neg logit contributions | |
Attention | -2.034 |
anticipation | -1.828 |
haste | -1.629 |
hurry | -1.585 |
)", | -1.560 |
Token | " |
Token ID | 366 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
Attention | +0.433 |
anticipation | +0.385 |
haste | +0.335 |
hurry | +0.323 |
Action | +0.321 |
Neg logit contributions | |
yles | -0.621 |
roth | -0.554 |
hap | -0.521 |
estate | -0.509 |
heid | -0.495 |
Token | He |
Token ID | 1544 |
Feature activation | -6.83e+00 |
Pos logit contributions | |
Attention | +8.469 |
anticipation | +7.202 |
Begin | +6.456 |
Action | +6.374 |
Action | +6.272 |
Neg logit contributions | |
yles | -12.287 |
roth | -10.579 |
hap | -9.867 |
onyms | -9.794 |
estate | -9.742 |
Token | 's |
Token ID | 338 |
Feature activation | -5.76e+00 |
Pos logit contributions | |
Attention | +5.003 |
anticipation | +4.707 |
haste | +4.159 |
hurry | +4.075 |
directed | +3.993 |
Neg logit contributions | |
yles | -6.934 |
roth | -6.166 |
hap | -5.808 |
estate | -5.724 |
onyms | -5.516 |
Token | not |
Token ID | 407 |
Feature activation | +4.50e+00 |
Pos logit contributions | |
Attention | +4.612 |
anticipation | +4.220 |
haste | +3.723 |
hurry | +3.642 |
Action | +3.559 |
Neg logit contributions | |
yles | -5.801 |
roth | -5.070 |
hap | -4.775 |
estate | -4.654 |
onyms | -4.625 |
Token | flashy |
Token ID | 43115 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
yles | +4.346 |
roth | +3.889 |
hap | +3.615 |
estate | +3.503 |
hood | +3.464 |
Neg logit contributions | |
Attention | -3.650 |
anticipation | -3.251 |
haste | -2.842 |
)", | -2.767 |
Action | -2.753 |
Token | , |
Token ID | 11 |
Feature activation | -3.35e+01 |
Pos logit contributions | |
Attention | +7.580 |
anticipation | +6.991 |
haste | +6.152 |
hurry | +6.057 |
Action | +5.861 |
Neg logit contributions | |
yles | -10.495 |
roth | -9.061 |
hap | -8.772 |
estate | -8.499 |
onyms | -8.344 |
Token | he |
Token ID | 339 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
Attention | +17.610 |
anticipation | +17.329 |
hurry | +15.788 |
haste | +15.546 |
action | +15.240 |
Neg logit contributions | |
yles | -24.235 |
roth | -21.170 |
hap | -20.224 |
estate | -20.179 |
onyms | -19.838 |
Token | just |
Token ID | 655 |
Feature activation | -9.17e+00 |
Pos logit contributions | |
anticipation | +10.762 |
Attention | +10.472 |
hurry | +9.634 |
haste | +9.622 |
directed | +9.602 |
Neg logit contributions | |
yles | -19.447 |
roth | -17.621 |
estate | -16.956 |
hap | -16.538 |
ebin | -15.984 |
Token | does |
Token ID | 857 |
Feature activation | -1.52e+01 |
Pos logit contributions | |
Attention | +6.858 |
anticipation | +6.564 |
haste | +5.810 |
hurry | +5.765 |
directed | +5.567 |
Neg logit contributions | |
yles | -9.034 |
roth | -8.010 |
hap | -7.418 |
estate | -7.406 |
onyms | -7.201 |
Token | all |
Token ID | 477 |
Feature activation | -2.64e-01 |
Pos logit contributions | |
Attention | +9.820 |
anticipation | +9.057 |
haste | +7.932 |
hurry | +7.657 |
action | +7.550 |
Neg logit contributions | |
yles | -15.560 |
roth | -13.859 |
estate | -12.871 |
heid | -12.829 |
hap | -12.825 |
Token | the |
Token ID | 262 |
Feature activation | -3.40e+00 |
Pos logit contributions | |
Attention | +0.220 |
anticipation | +0.199 |
haste | +0.177 |
hurry | +0.171 |
Action | +0.170 |
Neg logit contributions | |
yles | -0.257 |
roth | -0.227 |
hap | -0.212 |
estate | -0.206 |
heid | -0.200 |
Token | 15 |
Token ID | 1315 |
Feature activation | -6.44e+00 |
Pos logit contributions | |
Attention | +5.960 |
anticipation | +5.440 |
haste | +4.769 |
Action | +4.685 |
hurry | +4.660 |
Neg logit contributions | |
yles | -6.214 |
roth | -5.466 |
hap | -5.101 |
estate | -4.965 |
heid | -4.829 |
Token | years |
Token ID | 812 |
Feature activation | -7.68e+00 |
Pos logit contributions | |
Attention | +6.514 |
anticipation | +6.038 |
haste | +5.468 |
Action | +5.389 |
hurry | +5.380 |
Neg logit contributions | |
yles | -4.881 |
roth | -4.182 |
hap | -3.869 |
estate | -3.732 |
onyms | -3.512 |
Token | . |
Token ID | 13 |
Feature activation | -6.57e+00 |
Pos logit contributions | |
Attention | +5.972 |
anticipation | +5.491 |
haste | +4.770 |
Action | +4.712 |
hurry | +4.666 |
Neg logit contributions | |
yles | -7.502 |
roth | -6.670 |
hap | -6.199 |
estate | -6.020 |
heid | -5.798 |
Token | The |
Token ID | 383 |
Feature activation | -3.10e+00 |
Pos logit contributions | |
Attention | +5.836 |
anticipation | +5.125 |
Action | +4.624 |
haste | +4.446 |
)", | +4.351 |
Neg logit contributions | |
yles | -6.111 |
roth | -5.306 |
hap | -4.970 |
estate | -4.851 |
onyms | -4.656 |
Token | event |
Token ID | 1785 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
Attention | +2.680 |
anticipation | +2.457 |
haste | +2.169 |
hurry | +2.109 |
Action | +2.102 |
Neg logit contributions | |
yles | -2.936 |
roth | -2.561 |
hap | -2.403 |
estate | -2.337 |
heid | -2.259 |
Token | in |
Token ID | 287 |
Feature activation | -3.28e+01 |
Pos logit contributions | |
Attention | +8.127 |
anticipation | +7.559 |
haste | +6.558 |
Action | +6.398 |
hurry | +6.369 |
Neg logit contributions | |
yles | -9.784 |
roth | -8.701 |
hap | -8.214 |
estate | -7.934 |
heid | -7.791 |
Token | Am |
Token ID | 1703 |
Feature activation | +6.37e-01 |
Pos logit contributions | |
anticipation | +21.993 |
Attention | +21.904 |
Action | +18.789 |
earnest | +18.528 |
response | +18.403 |
Neg logit contributions | |
yles | -20.919 |
roth | -17.984 |
estate | -16.981 |
hap | -16.393 |
heid | -15.876 |
Token | her |
Token ID | 372 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
yles | +0.528 |
roth | +0.453 |
hap | +0.418 |
estate | +0.404 |
heid | +0.388 |
Neg logit contributions | |
Attention | -0.626 |
anticipation | -0.574 |
haste | -0.519 |
hurry | -0.506 |
Action | -0.502 |
Token | st |
Token ID | 301 |
Feature activation | -8.54e+00 |
Pos logit contributions | |
yles | +1.045 |
roth | +0.864 |
hap | +0.778 |
estate | +0.744 |
heid | +0.707 |
Neg logit contributions | |
Attention | -1.767 |
anticipation | -1.640 |
haste | -1.510 |
hurry | -1.476 |
Action | -1.465 |
Token | was |
Token ID | 373 |
Feature activation | -6.29e+00 |
Pos logit contributions | |
Attention | +6.830 |
anticipation | +6.242 |
Action | +5.476 |
haste | +5.415 |
hurry | +5.271 |
Neg logit contributions | |
yles | -7.945 |
roth | -7.094 |
hap | -6.751 |
estate | -6.435 |
onyms | -6.276 |
Token | the |
Token ID | 262 |
Feature activation | -5.35e+00 |
Pos logit contributions | |
Attention | +4.980 |
anticipation | +4.613 |
haste | +4.038 |
Action | +3.924 |
hurry | +3.866 |
Neg logit contributions | |
yles | -6.252 |
roth | -5.500 |
hap | -5.114 |
estate | -4.970 |
onyms | -4.919 |
Token | Tour |
Token ID | 9852 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
Attention | +6.913 |
anticipation | +5.923 |
Action | +5.392 |
haste | +5.186 |
hurry | +5.087 |
Neg logit contributions | |
yles | -8.331 |
roth | -7.272 |
hap | -6.829 |
estate | -6.638 |
onyms | -6.489 |
Token | for |
Token ID | 329 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
Attention | +9.121 |
anticipation | +8.371 |
Action | +7.493 |
haste | +7.152 |
directed | +6.964 |
Neg logit contributions | |
yles | -11.736 |
roth | -10.134 |
hap | -9.791 |
estate | -9.141 |
onyms | -9.118 |
Token | the |
Token ID | 262 |
Feature activation | -5.80e+00 |
Pos logit contributions | |
Attention | +8.696 |
anticipation | +7.985 |
Action | +7.000 |
haste | +6.973 |
hurry | +6.635 |
Neg logit contributions | |
yles | -10.259 |
roth | -9.044 |
hap | -8.458 |
estate | -8.296 |
heid | -7.964 |
Token | Food |
Token ID | 7318 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
Attention | +4.772 |
anticipation | +4.401 |
haste | +3.880 |
Action | +3.792 |
hurry | +3.733 |
Neg logit contributions | |
yles | -5.628 |
roth | -4.938 |
hap | -4.628 |
estate | -4.522 |
onyms | -4.362 |
Token | Network |
Token ID | 7311 |
Feature activation | -9.82e+00 |
Pos logit contributions | |
Attention | +2.527 |
anticipation | +2.286 |
Action | +2.028 |
haste | +2.026 |
hurry | +1.974 |
Neg logit contributions | |
yles | -2.440 |
roth | -2.143 |
hap | -1.994 |
estate | -1.921 |
onyms | -1.848 |
Token | in |
Token ID | 287 |
Feature activation | -3.27e+01 |
Pos logit contributions | |
Attention | +7.233 |
anticipation | +6.505 |
Action | +5.840 |
haste | +5.514 |
hurry | +5.411 |
Neg logit contributions | |
yles | -9.810 |
roth | -8.679 |
hap | -8.235 |
estate | -8.008 |
onyms | -7.823 |
Token | 2000 |
Token ID | 4751 |
Feature activation | -7.58e+00 |
Pos logit contributions | |
anticipation | +18.319 |
Attention | +17.878 |
earnest | +15.830 |
Action | +15.312 |
haste | +15.077 |
Neg logit contributions | |
yles | -25.091 |
roth | -21.603 |
estate | -20.648 |
hap | -20.488 |
onyms | -19.909 |
Token | . |
Token ID | 13 |
Feature activation | -8.48e+00 |
Pos logit contributions | |
Attention | +5.990 |
anticipation | +5.471 |
haste | +4.746 |
Action | +4.695 |
hurry | +4.603 |
Neg logit contributions | |
yles | -7.397 |
roth | -6.416 |
hap | -6.064 |
estate | -5.963 |
onyms | -5.671 |
Token | He |
Token ID | 679 |
Feature activation | +2.25e+00 |
Pos logit contributions | |
Attention | +6.526 |
anticipation | +5.631 |
Action | +5.042 |
Focus | +4.698 |
haste | +4.685 |
Neg logit contributions | |
yles | -8.721 |
roth | -7.592 |
hap | -7.284 |
estate | -7.199 |
onyms | -6.847 |
Token | is |
Token ID | 318 |
Feature activation | +3.49e+00 |
Pos logit contributions | |
yles | +2.110 |
roth | +1.853 |
hap | +1.719 |
estate | +1.670 |
hood | +1.622 |
Neg logit contributions | |
Attention | -1.971 |
anticipation | -1.780 |
haste | -1.588 |
hurry | -1.537 |
Action | -1.518 |
Token | fiercely |
Token ID | 33285 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
yles | +3.343 |
roth | +2.968 |
hap | +2.773 |
estate | +2.687 |
hood | +2.609 |
Neg logit contributions | |
Attention | -2.915 |
anticipation | -2.630 |
haste | -2.331 |
hurry | -2.259 |
Action | -2.225 |
Token | letters |
Token ID | 7475 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
yles | +1.169 |
roth | +1.029 |
hap | +0.964 |
estate | +0.937 |
heid | +0.909 |
Neg logit contributions | |
Attention | -0.993 |
anticipation | -0.894 |
haste | -0.793 |
hurry | -0.767 |
Action | -0.760 |
Token | to |
Token ID | 284 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
Attention | +3.644 |
anticipation | +3.311 |
haste | +2.965 |
hurry | +2.862 |
Action | +2.846 |
Neg logit contributions | |
yles | -4.216 |
roth | -3.688 |
hap | -3.429 |
estate | -3.373 |
heid | -3.279 |
Token | a |
Token ID | 257 |
Feature activation | -8.00e+00 |
Pos logit contributions | |
Attention | +3.588 |
anticipation | +3.254 |
haste | +2.894 |
hurry | +2.830 |
Action | +2.829 |
Neg logit contributions | |
yles | -3.877 |
roth | -3.358 |
hap | -3.153 |
estate | -3.055 |
heid | -3.020 |
Token | nonprofit |
Token ID | 15346 |
Feature activation | -7.26e+00 |
Pos logit contributions | |
Attention | +6.534 |
anticipation | +5.949 |
haste | +5.346 |
hurry | +5.284 |
Action | +5.112 |
Neg logit contributions | |
yles | -7.405 |
roth | -6.541 |
hap | -6.211 |
estate | -5.989 |
onyms | -5.961 |
Token | group |
Token ID | 1448 |
Feature activation | -9.64e+00 |
Pos logit contributions | |
Attention | +6.067 |
anticipation | +5.616 |
haste | +4.948 |
Action | +4.918 |
hurry | +4.771 |
Neg logit contributions | |
yles | -6.722 |
roth | -5.980 |
hap | -5.551 |
estate | -5.395 |
onyms | -5.285 |
Token | in |
Token ID | 287 |
Feature activation | -3.26e+01 |
Pos logit contributions | |
Attention | +7.540 |
anticipation | +6.970 |
haste | +6.227 |
Action | +6.117 |
directed | +5.978 |
Neg logit contributions | |
yles | -9.112 |
roth | -8.073 |
hap | -7.459 |
estate | -7.338 |
heid | -7.212 |
Token | order |
Token ID | 1502 |
Feature activation | -9.89e-01 |
Pos logit contributions | |
anticipation | +21.057 |
Attention | +20.233 |
response | +18.077 |
haste | +17.880 |
earnest | +17.225 |
Neg logit contributions | |
yles | -21.827 |
roth | -19.178 |
estate | -18.284 |
hap | -18.238 |
heid | -17.938 |
Token | to |
Token ID | 284 |
Feature activation | -4.46e+00 |
Pos logit contributions | |
Attention | +0.882 |
anticipation | +0.806 |
haste | +0.722 |
hurry | +0.704 |
Action | +0.694 |
Neg logit contributions | |
yles | -0.903 |
roth | -0.791 |
hap | -0.735 |
estate | -0.717 |
heid | -0.692 |
Token | throw |
Token ID | 3714 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
Attention | +3.823 |
anticipation | +3.512 |
haste | +3.182 |
hurry | +3.161 |
Action | +3.029 |
Neg logit contributions | |
yles | -4.198 |
roth | -3.647 |
hap | -3.417 |
estate | -3.352 |
heid | -3.278 |
Token | up |
Token ID | 510 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
Attention | +8.812 |
anticipation | +8.151 |
haste | +7.095 |
hurry | +6.595 |
Action | +6.546 |
Neg logit contributions | |
yles | -12.300 |
roth | -10.883 |
hap | -10.552 |
estate | -10.206 |
heid | -10.136 |
Token | a |
Token ID | 257 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
yles | +4.895 |
roth | +4.348 |
hap | +4.076 |
estate | +3.959 |
hood | +3.871 |
Neg logit contributions | |
Attention | -3.890 |
anticipation | -3.452 |
haste | -3.036 |
)", | -2.980 |
hurry | -2.944 |
Token | founded |
Token ID | 9393 |
Feature activation | +8.48e-02 |
Pos logit contributions | |
yles | +7.210 |
roth | +6.424 |
hap | +5.942 |
estate | +5.758 |
hood | +5.754 |
Neg logit contributions | |
Attention | -6.594 |
anticipation | -5.916 |
haste | -5.258 |
hurry | -5.045 |
)", | -4.984 |
Token | the |
Token ID | 262 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
yles | +0.082 |
roth | +0.072 |
hap | +0.068 |
estate | +0.066 |
heid | +0.064 |
Neg logit contributions | |
Attention | -0.071 |
anticipation | -0.064 |
haste | -0.057 |
hurry | -0.055 |
Action | -0.055 |
Token | Ag |
Token ID | 2449 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
Attention | +1.478 |
anticipation | +1.329 |
haste | +1.171 |
Action | +1.134 |
hurry | +1.132 |
Neg logit contributions | |
yles | -1.807 |
roth | -1.594 |
hap | -1.493 |
estate | -1.459 |
heid | -1.410 |
Token | ora |
Token ID | 5799 |
Feature activation | -4.80e+00 |
Pos logit contributions | |
yles | +1.355 |
roth | +1.146 |
hap | +1.038 |
estate | +1.005 |
heid | +0.957 |
Neg logit contributions | |
Attention | -1.928 |
anticipation | -1.788 |
haste | -1.637 |
hurry | -1.597 |
Action | -1.574 |
Token | Foundation |
Token ID | 5693 |
Feature activation | -8.23e+00 |
Pos logit contributions | |
Attention | +3.933 |
anticipation | +3.504 |
Action | +3.082 |
haste | +3.045 |
hurry | +2.975 |
Neg logit contributions | |
yles | -4.748 |
roth | -4.163 |
hap | -3.909 |
estate | -3.767 |
heid | -3.680 |
Token | in |
Token ID | 287 |
Feature activation | -3.20e+01 |
Pos logit contributions | |
Attention | +6.310 |
anticipation | +5.672 |
Action | +5.060 |
haste | +4.888 |
)", | +4.857 |
Neg logit contributions | |
yles | -8.120 |
roth | -7.094 |
hap | -6.744 |
estate | -6.513 |
heid | -6.310 |
Token | New |
Token ID | 968 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
anticipation | +19.891 |
Attention | +19.667 |
response | +16.778 |
Action | +16.720 |
earnest | +16.487 |
Neg logit contributions | |
yles | -22.870 |
roth | -20.381 |
hap | -19.090 |
estate | -18.666 |
onyms | -18.477 |
Token | York |
Token ID | 1971 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
Attention | +7.865 |
anticipation | +6.494 |
Action | +5.726 |
haste | +5.215 |
)", | +5.211 |
Neg logit contributions | |
yles | -13.718 |
roth | -12.091 |
hap | -11.941 |
estate | -11.592 |
heid | -11.464 |
Token | with |
Token ID | 351 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
Attention | +9.706 |
anticipation | +8.839 |
Action | +7.976 |
directed | +7.580 |
)", | +7.534 |
Neg logit contributions | |
yles | -14.439 |
roth | -12.778 |
hap | -12.158 |
heid | -11.701 |
estate | -11.519 |
Token | the |
Token ID | 262 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
Attention | +10.586 |
anticipation | +9.633 |
haste | +8.479 |
Action | +8.320 |
action | +7.910 |
Neg logit contributions | |
yles | -12.993 |
roth | -11.365 |
estate | -10.862 |
hap | -10.577 |
heid | -10.155 |
Token | aid |
Token ID | 6133 |
Feature activation | -3.81e+00 |
Pos logit contributions | |
Attention | +12.023 |
anticipation | +11.445 |
haste | +9.726 |
Action | +9.403 |
earnest | +9.214 |
Neg logit contributions | |
yles | -15.085 |
roth | -13.067 |
estate | -12.415 |
heid | -11.997 |
hap | -11.968 |
Token | s |
Token ID | 82 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
Attention | +9.340 |
anticipation | +8.497 |
directed | +7.500 |
aimed | +7.355 |
Action | +7.322 |
Neg logit contributions | |
yles | -13.335 |
roth | -12.048 |
estate | -11.147 |
hap | -11.112 |
onyms | -10.905 |
Token | against |
Token ID | 1028 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
Attention | +12.105 |
anticipation | +10.763 |
directed | +10.127 |
aimed | +10.107 |
action | +9.580 |
Neg logit contributions | |
yles | -17.378 |
roth | -15.374 |
estate | -14.009 |
hap | -13.912 |
heid | -13.850 |
Token | the |
Token ID | 262 |
Feature activation | +6.69e-01 |
Pos logit contributions | |
Attention | +0.263 |
anticipation | +0.237 |
haste | +0.207 |
hurry | +0.200 |
Action | +0.198 |
Neg logit contributions | |
yles | -0.354 |
roth | -0.314 |
hap | -0.295 |
estate | -0.288 |
heid | -0.280 |
Token | protest |
Token ID | 5402 |
Feature activation | -4.30e+00 |
Pos logit contributions | |
yles | +0.695 |
roth | +0.617 |
hap | +0.580 |
estate | +0.565 |
heid | +0.549 |
Neg logit contributions | |
Attention | -0.517 |
anticipation | -0.463 |
haste | -0.406 |
hurry | -0.392 |
Action | -0.388 |
Token | movement |
Token ID | 3356 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
Attention | +3.266 |
anticipation | +2.966 |
haste | +2.579 |
Action | +2.519 |
hurry | +2.509 |
Neg logit contributions | |
yles | -4.433 |
roth | -3.948 |
hap | -3.709 |
estate | -3.621 |
heid | -3.489 |
Token | have |
Token ID | 423 |
Feature activation | -3.14e+01 |
Pos logit contributions | |
Attention | +12.519 |
anticipation | +11.164 |
Action | +10.086 |
hurry | +9.905 |
aimed | +9.905 |
Neg logit contributions | |
yles | -16.577 |
roth | -14.418 |
hap | -13.446 |
estate | -13.316 |
heid | -13.057 |
Token | come |
Token ID | 1282 |
Feature activation | -1.60e+01 |
Pos logit contributions | |
Attention | +17.480 |
aimed | +16.714 |
focused | +16.639 |
directed | +16.377 |
anticipation | +16.218 |
Neg logit contributions | |
yles | -22.275 |
roth | -19.461 |
estate | -18.770 |
onyms | -18.452 |
heid | -17.370 |
Token | in |
Token ID | 287 |
Feature activation | -2.25e+01 |
Pos logit contributions | |
Attention | +9.780 |
anticipation | +9.056 |
directed | +7.662 |
haste | +7.596 |
hurry | +7.561 |
Neg logit contributions | |
yles | -15.966 |
roth | -14.712 |
hap | -13.823 |
estate | -13.474 |
heid | -13.046 |
Token | border |
Token ID | 4865 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
anticipation | +15.292 |
Attention | +14.482 |
haste | +13.276 |
response | +13.048 |
earnest | +12.978 |
Neg logit contributions | |
yles | -19.189 |
roth | -17.262 |
hap | -16.419 |
estate | -16.181 |
onyms | -15.062 |
Token | cities |
Token ID | 4736 |
Feature activation | -8.88e+00 |
Pos logit contributions | |
yles | +0.025 |
roth | +0.022 |
hap | +0.020 |
estate | +0.020 |
heid | +0.019 |
Neg logit contributions | |
Attention | -0.022 |
anticipation | -0.020 |
haste | -0.018 |
hurry | -0.017 |
Action | -0.017 |
Token | , |
Token ID | 11 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
Attention | +6.598 |
anticipation | +6.062 |
haste | +5.244 |
Action | +5.208 |
hurry | +5.197 |
Neg logit contributions | |
yles | -8.864 |
roth | -7.785 |
hap | -7.346 |
estate | -7.205 |
heid | -7.025 |
Token | been |
Token ID | 587 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
Attention | +9.235 |
anticipation | +8.516 |
haste | +7.914 |
hurry | +7.522 |
directed | +7.492 |
Neg logit contributions | |
yles | -11.400 |
roth | -9.823 |
estate | -9.242 |
hap | -9.126 |
onyms | -8.788 |
Token | terrified |
Token ID | 22144 |
Feature activation | -1.92e+00 |
Pos logit contributions | |
yles | +1.559 |
roth | +1.382 |
hap | +1.296 |
estate | +1.260 |
hood | +1.221 |
Neg logit contributions | |
Attention | -1.254 |
anticipation | -1.123 |
haste | -0.990 |
hurry | -0.955 |
Action | -0.949 |
Token | even |
Token ID | 772 |
Feature activation | +6.85e+00 |
Pos logit contributions | |
Attention | +1.569 |
anticipation | +1.428 |
haste | +1.264 |
hurry | +1.224 |
Action | +1.210 |
Neg logit contributions | |
yles | -1.908 |
roth | -1.672 |
hap | -1.567 |
estate | -1.541 |
heid | -1.480 |
Token | if |
Token ID | 611 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
yles | +6.688 |
roth | +6.063 |
hap | +5.674 |
hood | +5.476 |
estate | +5.413 |
Neg logit contributions | |
Attention | -5.334 |
anticipation | -4.650 |
haste | -4.067 |
)", | -3.970 |
hurry | -3.945 |
Token | he |
Token ID | 339 |
Feature activation | -6.86e+00 |
Pos logit contributions | |
Attention | +7.870 |
anticipation | +7.062 |
haste | +6.170 |
Action | +5.875 |
hurry | +5.861 |
Neg logit contributions | |
yles | -12.809 |
roth | -11.462 |
estate | -10.824 |
hap | -10.518 |
onyms | -10.274 |
Token | had |
Token ID | 550 |
Feature activation | -3.14e+01 |
Pos logit contributions | |
Attention | +5.610 |
anticipation | +5.165 |
haste | +4.714 |
hurry | +4.616 |
directed | +4.601 |
Neg logit contributions | |
yles | -6.512 |
roth | -5.665 |
estate | -5.251 |
hap | -5.239 |
onyms | -4.991 |
Token | not |
Token ID | 407 |
Feature activation | -1.78e+01 |
Pos logit contributions | |
Attention | +18.382 |
directed | +18.087 |
anticipation | +17.168 |
haste | +16.757 |
aimed | +16.516 |
Neg logit contributions | |
yles | -22.478 |
roth | -19.045 |
estate | -18.066 |
onyms | -17.915 |
inctions | -16.706 |
Token | been |
Token ID | 587 |
Feature activation | +8.69e-01 |
Pos logit contributions | |
Attention | +12.923 |
directed | +11.860 |
anticipation | +11.843 |
haste | +11.328 |
hurry | +11.243 |
Neg logit contributions | |
yles | -15.537 |
roth | -13.190 |
estate | -12.210 |
onyms | -12.202 |
hap | -11.638 |
Token | the |
Token ID | 262 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
yles | +0.887 |
roth | +0.785 |
hap | +0.737 |
estate | +0.718 |
heid | +0.697 |
Neg logit contributions | |
Attention | -0.687 |
anticipation | -0.616 |
haste | -0.542 |
hurry | -0.523 |
Action | -0.518 |
Token | manager |
Token ID | 4706 |
Feature activation | -8.13e+00 |
Pos logit contributions | |
Attention | +1.290 |
anticipation | +1.177 |
haste | +1.050 |
hurry | +1.023 |
Action | +1.011 |
Neg logit contributions | |
yles | -1.383 |
roth | -1.201 |
hap | -1.122 |
estate | -1.095 |
heid | -1.058 |
Token | . |
Token ID | 13 |
Feature activation | -8.94e+00 |
Pos logit contributions | |
Attention | +6.113 |
anticipation | +5.576 |
haste | +4.993 |
hurry | +4.881 |
Action | +4.810 |
Neg logit contributions | |
yles | -8.222 |
roth | -7.149 |
hap | -6.691 |
estate | -6.620 |
heid | -6.414 |
Token | fracking |
Token ID | 25441 |
Feature activation | -1.00e+01 |
Pos logit contributions | |
Attention | +0.749 |
anticipation | +0.682 |
haste | +0.604 |
hurry | +0.586 |
Action | +0.581 |
Neg logit contributions | |
yles | -0.850 |
roth | -0.746 |
hap | -0.698 |
estate | -0.677 |
heid | -0.658 |
Token | the |
Token ID | 262 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
Attention | +7.720 |
anticipation | +7.340 |
haste | +6.268 |
Action | +6.210 |
hurry | +6.201 |
Neg logit contributions | |
yles | -9.402 |
roth | -8.446 |
hap | -8.013 |
estate | -7.676 |
heid | -7.594 |
Token | Barnett |
Token ID | 38174 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
yles | +0.116 |
roth | +0.101 |
hap | +0.095 |
estate | +0.092 |
heid | +0.089 |
Neg logit contributions | |
Attention | -0.109 |
anticipation | -0.099 |
haste | -0.088 |
hurry | -0.086 |
Action | -0.085 |
Token | in |
Token ID | 287 |
Feature activation | -2.99e+01 |
Pos logit contributions | |
yles | +1.774 |
roth | +1.550 |
hap | +1.445 |
estate | +1.409 |
hood | +1.365 |
Neg logit contributions | |
Attention | -1.616 |
anticipation | -1.460 |
haste | -1.311 |
hurry | -1.261 |
)", | -1.247 |
Token | earnest |
Token ID | 23176 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
anticipation | +20.688 |
Attention | +18.840 |
earnest | +18.307 |
haste | +17.377 |
response | +17.206 |
Neg logit contributions | |
yles | -20.577 |
roth | -18.655 |
hap | -18.131 |
estate | -17.809 |
heid | -16.408 |
Token | in |
Token ID | 287 |
Feature activation | -3.13e+01 |
Pos logit contributions | |
Attention | +7.910 |
anticipation | +7.382 |
haste | +6.354 |
hurry | +6.226 |
Action | +6.220 |
Neg logit contributions | |
yles | -10.473 |
roth | -9.286 |
hap | -8.822 |
estate | -8.452 |
heid | -8.256 |
Token | 2000 |
Token ID | 4751 |
Feature activation | -6.97e+00 |
Pos logit contributions | |
anticipation | +20.031 |
Attention | +18.322 |
earnest | +17.780 |
response | +16.727 |
haste | +16.546 |
Neg logit contributions | |
yles | -22.885 |
roth | -20.155 |
hap | -19.747 |
estate | -18.985 |
heid | -18.208 |
Token | . |
Token ID | 13 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
Attention | +5.571 |
anticipation | +5.146 |
haste | +4.468 |
hurry | +4.385 |
Action | +4.380 |
Neg logit contributions | |
yles | -6.789 |
roth | -5.913 |
hap | -5.582 |
estate | -5.455 |
heid | -5.230 |
Token | Suddenly |
Token ID | 24975 |
Feature activation | -9.36e+00 |
Pos logit contributions | |
Attention | +13.259 |
anticipation | +10.456 |
Action | +10.273 |
Focus | +9.674 |
Intent | +9.414 |
Neg logit contributions | |
yles | -19.147 |
roth | -16.850 |
hap | -16.630 |
estate | -16.274 |
ebin | -15.991 |
Token | every |
Token ID | 790 |
Feature activation | -9.82e+00 |
Pos logit contributions | |
Attention | +7.193 |
anticipation | +6.671 |
haste | +5.715 |
hurry | +5.675 |
Action | +5.565 |
Neg logit contributions | |
yles | -9.110 |
roth | -8.162 |
hap | -7.718 |
estate | -7.422 |
heid | -7.288 |
Token | well |
Token ID | 880 |
Feature activation | -2.73e+00 |
Pos logit contributions | |
Attention | +8.150 |
anticipation | +7.752 |
hurry | +6.726 |
haste | +6.675 |
action | +6.525 |
Neg logit contributions | |
yles | -8.907 |
roth | -7.972 |
hap | -7.450 |
estate | -7.038 |
heid | -6.999 |
Token | with |
Token ID | 351 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
Attention | +3.531 |
anticipation | +3.210 |
haste | +2.855 |
hurry | +2.786 |
Action | +2.717 |
Neg logit contributions | |
yles | -4.224 |
roth | -3.727 |
hap | -3.500 |
estate | -3.427 |
heid | -3.295 |
Token | a |
Token ID | 257 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
Attention | +14.016 |
anticipation | +13.043 |
haste | +11.552 |
hurry | +11.142 |
Action | +10.838 |
Neg logit contributions | |
yles | -18.366 |
roth | -15.608 |
estate | -15.205 |
hap | -14.896 |
oles | -14.297 |
Token | lady |
Token ID | 10846 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
Attention | +11.712 |
anticipation | +10.760 |
hurry | +9.905 |
haste | +9.825 |
directed | +9.289 |
Neg logit contributions | |
yles | -14.635 |
roth | -12.579 |
hap | -12.115 |
estate | -11.960 |
onyms | -11.661 |
Token | , |
Token ID | 11 |
Feature activation | -9.33e+00 |
Pos logit contributions | |
Attention | +7.946 |
anticipation | +7.396 |
haste | +6.607 |
hurry | +6.439 |
earnest | +6.211 |
Neg logit contributions | |
yles | -10.656 |
roth | -9.371 |
hap | -8.819 |
estate | -8.658 |
heid | -8.338 |
Token | should |
Token ID | 815 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
Attention | +7.010 |
anticipation | +6.291 |
haste | +5.605 |
hurry | +5.455 |
earnest | +5.232 |
Neg logit contributions | |
yles | -9.363 |
roth | -8.253 |
hap | -7.717 |
estate | -7.707 |
heid | -7.366 |
Token | pay |
Token ID | 1414 |
Feature activation | -3.12e+01 |
Pos logit contributions | |
Attention | +13.589 |
anticipation | +12.126 |
hurry | +11.928 |
haste | +11.571 |
earnest | +11.134 |
Neg logit contributions | |
yles | -15.690 |
roth | -13.608 |
estate | -12.761 |
hap | -12.402 |
onyms | -12.371 |
Token | almost |
Token ID | 2048 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
Attention | +21.944 |
anticipation | +18.611 |
attention | +17.946 |
haste | +16.758 |
earnest | +16.314 |
Neg logit contributions | |
yles | -23.014 |
roth | -19.810 |
estate | -18.703 |
hap | -18.117 |
ramid | -17.657 |
Token | exclusive |
Token ID | 8568 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
Attention | +10.015 |
anticipation | +8.395 |
haste | +7.709 |
hurry | +7.141 |
attention | +7.104 |
Neg logit contributions | |
yles | -13.309 |
roth | -11.206 |
estate | -10.684 |
hap | -10.527 |
onyms | -10.287 |
Token | attention |
Token ID | 3241 |
Feature activation | -9.60e+00 |
Pos logit contributions | |
Attention | +10.888 |
anticipation | +8.219 |
attention | +7.546 |
haste | +6.922 |
hurry | +5.999 |
Neg logit contributions | |
yles | -21.784 |
roth | -19.514 |
hap | -18.613 |
estate | -18.475 |
igham | -17.797 |
Token | to |
Token ID | 284 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
Attention | +7.497 |
anticipation | +6.622 |
haste | +5.856 |
hurry | +5.708 |
Action | +5.548 |
Neg logit contributions | |
yles | -9.293 |
roth | -8.136 |
hap | -7.602 |
estate | -7.568 |
heid | -7.255 |
Token | her |
Token ID | 607 |
Feature activation | -8.86e+00 |
Pos logit contributions | |
Attention | +8.784 |
anticipation | +7.938 |
haste | +6.814 |
hurry | +6.621 |
action | +6.113 |
Neg logit contributions | |
yles | -13.744 |
roth | -12.441 |
estate | -11.600 |
hap | -11.516 |
heid | -11.364 |
Token | in |
Token ID | 287 |
Feature activation | -1.84e+01 |
Pos logit contributions | |
Attention | +3.288 |
anticipation | +3.007 |
haste | +2.630 |
Action | +2.600 |
hurry | +2.550 |
Neg logit contributions | |
yles | -3.977 |
roth | -3.485 |
hap | -3.300 |
estate | -3.225 |
heid | -3.110 |
Token | a |
Token ID | 257 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
Attention | +12.085 |
anticipation | +11.965 |
Action | +10.568 |
action | +10.522 |
haste | +10.129 |
Neg logit contributions | |
yles | -16.861 |
roth | -14.427 |
estate | -14.310 |
hap | -14.242 |
heid | -13.659 |
Token | new |
Token ID | 649 |
Feature activation | -6.92e+00 |
Pos logit contributions | |
Attention | +9.242 |
anticipation | +8.580 |
hurry | +7.982 |
haste | +7.815 |
Action | +7.630 |
Neg logit contributions | |
yles | -10.043 |
roth | -8.700 |
estate | -8.350 |
hap | -8.254 |
onyms | -8.166 |
Token | direction |
Token ID | 4571 |
Feature activation | -7.37e+00 |
Pos logit contributions | |
Attention | +5.018 |
anticipation | +4.530 |
haste | +3.934 |
hurry | +3.911 |
Action | +3.849 |
Neg logit contributions | |
yles | -7.226 |
roth | -6.434 |
hap | -6.087 |
estate | -6.060 |
onyms | -5.893 |
Token | that |
Token ID | 326 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
Attention | +5.708 |
anticipation | +5.207 |
haste | +4.573 |
Action | +4.460 |
hurry | +4.455 |
Neg logit contributions | |
yles | -7.270 |
roth | -6.370 |
hap | -6.008 |
estate | -5.958 |
heid | -5.746 |
Token | sees |
Token ID | 7224 |
Feature activation | -3.10e+01 |
Pos logit contributions | |
Attention | +10.508 |
anticipation | +9.965 |
haste | +8.722 |
Action | +8.689 |
hurry | +8.379 |
Neg logit contributions | |
yles | -11.770 |
roth | -10.397 |
estate | -9.837 |
hap | -9.834 |
heid | -9.523 |
Token | him |
Token ID | 683 |
Feature activation | -7.76e+00 |
Pos logit contributions | |
Attention | +19.751 |
anticipation | +18.847 |
Action | +17.100 |
action | +16.846 |
him | +16.533 |
Neg logit contributions | |
yles | -19.994 |
estate | -18.161 |
roth | -17.654 |
hap | -17.386 |
heid | -17.075 |
Token | struggle |
Token ID | 6531 |
Feature activation | -7.51e+00 |
Pos logit contributions | |
Attention | +6.422 |
anticipation | +5.986 |
hurry | +5.392 |
haste | +5.387 |
Action | +5.166 |
Neg logit contributions | |
yles | -7.108 |
roth | -6.230 |
hap | -5.802 |
estate | -5.689 |
heid | -5.567 |
Token | with |
Token ID | 351 |
Feature activation | -9.76e+00 |
Pos logit contributions | |
Attention | +5.745 |
anticipation | +5.318 |
haste | +4.556 |
hurry | +4.464 |
Action | +4.442 |
Neg logit contributions | |
yles | -7.420 |
roth | -6.655 |
estate | -6.238 |
hap | -6.186 |
heid | -5.816 |
Token | the |
Token ID | 262 |
Feature activation | -3.46e+00 |
Pos logit contributions | |
Attention | +7.885 |
anticipation | +7.175 |
haste | +6.259 |
Action | +6.096 |
hurry | +6.056 |
Neg logit contributions | |
yles | -9.191 |
roth | -8.170 |
hap | -7.688 |
estate | -7.662 |
heid | -7.285 |
Token | aftermath |
Token ID | 16280 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
Attention | +3.107 |
anticipation | +2.838 |
haste | +2.536 |
hurry | +2.452 |
Action | +2.446 |
Neg logit contributions | |
yles | -3.159 |
roth | -2.765 |
hap | -2.583 |
estate | -2.542 |
heid | -2.418 |
Token | air |
Token ID | 1633 |
Feature activation | -4.78e+00 |
Pos logit contributions | |
Attention | +4.744 |
anticipation | +4.429 |
haste | +3.896 |
hurry | +3.844 |
Action | +3.762 |
Neg logit contributions | |
yles | -5.485 |
roth | -4.770 |
hap | -4.470 |
estate | -4.334 |
onyms | -4.251 |
Token | , |
Token ID | 11 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
Attention | +3.930 |
anticipation | +3.642 |
haste | +3.223 |
hurry | +3.152 |
Action | +3.094 |
Neg logit contributions | |
yles | -4.604 |
roth | -4.015 |
hap | -3.760 |
estate | -3.673 |
heid | -3.590 |
Token | attacking |
Token ID | 9274 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
Attention | +10.495 |
anticipation | +10.338 |
haste | +9.097 |
hurry | +8.950 |
directed | +8.658 |
Neg logit contributions | |
yles | -11.847 |
roth | -10.505 |
hap | -9.822 |
estate | -9.619 |
onyms | -9.440 |
Token | every |
Token ID | 790 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
Attention | +9.953 |
anticipation | +9.594 |
hurry | +8.071 |
haste | +8.043 |
action | +7.790 |
Neg logit contributions | |
yles | -13.066 |
roth | -11.614 |
estate | -11.125 |
hap | -11.040 |
onyms | -10.758 |
Token | pass |
Token ID | 1208 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
Attention | +10.552 |
anticipation | +10.328 |
action | +9.052 |
hurry | +9.048 |
haste | +8.862 |
Neg logit contributions | |
yles | -12.158 |
roth | -10.964 |
hap | -10.081 |
onyms | -10.048 |
heid | -9.811 |
Token | with |
Token ID | 351 |
Feature activation | -3.09e+01 |
Pos logit contributions | |
Attention | +8.401 |
anticipation | +8.326 |
haste | +7.140 |
hurry | +7.059 |
Action | +6.897 |
Neg logit contributions | |
yles | -11.586 |
roth | -10.155 |
hap | -9.685 |
estate | -9.403 |
onyms | -9.368 |
Token | the |
Token ID | 262 |
Feature activation | -1.78e+01 |
Pos logit contributions | |
anticipation | +22.005 |
Attention | +20.265 |
haste | +19.138 |
urgency | +18.277 |
hurry | +17.869 |
Neg logit contributions | |
yles | -19.332 |
roth | -17.707 |
estate | -17.186 |
hap | -16.466 |
heid | -16.012 |
Token | certainty |
Token ID | 18979 |
Feature activation | -2.42e+00 |
Pos logit contributions | |
anticipation | +14.041 |
Attention | +13.821 |
haste | +11.884 |
hurry | +11.585 |
urgency | +11.438 |
Neg logit contributions | |
yles | -14.639 |
roth | -13.113 |
hap | -12.527 |
estate | -12.336 |
onyms | -12.018 |
Token | that |
Token ID | 326 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
Attention | +2.012 |
anticipation | +1.839 |
haste | +1.621 |
hurry | +1.567 |
Action | +1.545 |
Neg logit contributions | |
yles | -2.351 |
roth | -2.078 |
hap | -1.950 |
estate | -1.902 |
heid | -1.838 |
Token | it |
Token ID | 340 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
Attention | +11.952 |
anticipation | +11.684 |
haste | +9.891 |
hurry | +9.872 |
action | +9.480 |
Neg logit contributions | |
yles | -15.826 |
roth | -14.223 |
hap | -13.478 |
estate | -13.254 |
heid | -12.986 |
Token | � |
Token ID | 447 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
Attention | +9.148 |
anticipation | +8.759 |
haste | +7.757 |
hurry | +7.519 |
directed | +7.407 |
Neg logit contributions | |
yles | -12.794 |
roth | -10.981 |
hap | -10.374 |
estate | -10.334 |
onyms | -9.880 |
Token | the |
Token ID | 262 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
yles | +2.550 |
roth | +2.256 |
hap | +2.106 |
estate | +2.030 |
hood | +1.988 |
Neg logit contributions | |
Attention | -2.202 |
anticipation | -1.991 |
haste | -1.775 |
hurry | -1.717 |
)", | -1.699 |
Token | Occupy |
Token ID | 25551 |
Feature activation | -8.74e+00 |
Pos logit contributions | |
yles | +1.968 |
roth | +1.722 |
hap | +1.603 |
estate | +1.548 |
heid | +1.506 |
Neg logit contributions | |
Attention | -1.867 |
anticipation | -1.693 |
haste | -1.520 |
hurry | -1.474 |
)", | -1.458 |
Token | Wall |
Token ID | 5007 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
Attention | +7.740 |
anticipation | +6.975 |
Action | +6.338 |
haste | +6.212 |
action | +6.012 |
Neg logit contributions | |
yles | -7.807 |
roth | -6.755 |
hap | -6.468 |
estate | -6.196 |
onyms | -5.843 |
Token | Street |
Token ID | 3530 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
Attention | +0.920 |
anticipation | +0.817 |
haste | +0.710 |
Action | +0.686 |
hurry | +0.685 |
Neg logit contributions | |
yles | -1.296 |
roth | -1.147 |
hap | -1.082 |
estate | -1.058 |
heid | -1.022 |
Token | protests |
Token ID | 8536 |
Feature activation | -5.02e+00 |
Pos logit contributions | |
Attention | +10.924 |
anticipation | +10.143 |
Action | +9.277 |
action | +9.027 |
haste | +8.862 |
Neg logit contributions | |
yles | -12.275 |
roth | -10.668 |
hap | -10.381 |
estate | -9.966 |
onyms | -9.506 |
Token | in |
Token ID | 287 |
Feature activation | -3.09e+01 |
Pos logit contributions | |
Attention | +4.030 |
anticipation | +3.667 |
haste | +3.200 |
Action | +3.145 |
hurry | +3.116 |
Neg logit contributions | |
yles | -5.013 |
roth | -4.406 |
hap | -4.107 |
estate | -4.060 |
heid | -3.915 |
Token | Wednesday |
Token ID | 3583 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
anticipation | +20.291 |
Attention | +19.627 |
earnest | +17.989 |
Action | +17.760 |
action | +17.591 |
Neg logit contributions | |
yles | -22.107 |
estate | -19.399 |
roth | -18.794 |
hap | -17.893 |
onyms | -17.527 |
Token | night |
Token ID | 1755 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
Attention | +9.388 |
anticipation | +8.863 |
Action | +7.623 |
haste | +7.572 |
action | +7.445 |
Neg logit contributions | |
yles | -12.234 |
roth | -10.585 |
estate | -9.888 |
hap | -9.787 |
heid | -9.390 |
Token | 's |
Token ID | 338 |
Feature activation | -7.54e+00 |
Pos logit contributions | |
Attention | +8.259 |
anticipation | +7.755 |
Action | +6.498 |
action | +6.340 |
haste | +6.145 |
Neg logit contributions | |
yles | -17.210 |
roth | -15.189 |
hap | -14.320 |
estate | -14.272 |
onyms | -14.011 |
Token | episode |
Token ID | 4471 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
Attention | +6.057 |
anticipation | +5.575 |
haste | +4.839 |
Action | +4.823 |
hurry | +4.706 |
Neg logit contributions | |
yles | -7.410 |
roth | -6.534 |
hap | -6.122 |
estate | -6.096 |
onyms | -5.884 |
Token | , |
Token ID | 11 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
Attention | +7.914 |
anticipation | +7.319 |
haste | +6.285 |
directed | +6.220 |
Action | +6.187 |
Neg logit contributions | |
yles | -11.522 |
roth | -10.240 |
hap | -9.825 |
estate | -9.549 |
heid | -9.314 |
Token | a |
Token ID | 257 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
Attention | +7.921 |
anticipation | +7.544 |
Action | +6.369 |
haste | +6.325 |
action | +6.288 |
Neg logit contributions | |
yles | -11.381 |
roth | -10.092 |
estate | -9.589 |
hap | -9.495 |
onyms | -9.078 |
Token | crash |
Token ID | 7014 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
Attention | +2.346 |
anticipation | +2.124 |
haste | +1.885 |
hurry | +1.843 |
Action | +1.808 |
Neg logit contributions | |
yles | -2.893 |
roth | -2.559 |
hap | -2.406 |
estate | -2.365 |
onyms | -2.287 |
Token | on |
Token ID | 319 |
Feature activation | +4.49e-01 |
Pos logit contributions | |
Attention | +1.317 |
anticipation | +1.190 |
haste | +1.047 |
hurry | +1.016 |
Action | +1.010 |
Neg logit contributions | |
yles | -1.627 |
roth | -1.441 |
hap | -1.350 |
estate | -1.318 |
heid | -1.278 |
Token | a |
Token ID | 257 |
Feature activation | -6.86e+00 |
Pos logit contributions | |
yles | +0.434 |
roth | +0.382 |
hap | +0.357 |
estate | +0.347 |
heid | +0.336 |
Neg logit contributions | |
Attention | -0.378 |
anticipation | -0.341 |
haste | -0.303 |
hurry | -0.294 |
Action | -0.291 |
Token | rally |
Token ID | 7903 |
Feature activation | -4.16e+00 |
Pos logit contributions | |
Attention | +5.661 |
anticipation | +5.201 |
haste | +4.606 |
hurry | +4.560 |
Action | +4.436 |
Neg logit contributions | |
yles | -6.504 |
roth | -5.786 |
hap | -5.482 |
estate | -5.331 |
onyms | -5.204 |
Token | in |
Token ID | 287 |
Feature activation | -3.07e+01 |
Pos logit contributions | |
Attention | +3.530 |
anticipation | +3.226 |
haste | +2.867 |
hurry | +2.800 |
Action | +2.767 |
Neg logit contributions | |
yles | -3.923 |
roth | -3.486 |
hap | -3.253 |
estate | -3.157 |
onyms | -3.078 |
Token | Italy |
Token ID | 8031 |
Feature activation | -2.69e+00 |
Pos logit contributions | |
Attention | +17.023 |
anticipation | +17.012 |
Action | +14.187 |
earnest | +14.176 |
action | +13.982 |
Neg logit contributions | |
yles | -25.118 |
roth | -21.798 |
estate | -21.205 |
hap | -21.073 |
onyms | -20.391 |
Token | last |
Token ID | 938 |
Feature activation | -6.13e+00 |
Pos logit contributions | |
Attention | +2.336 |
anticipation | +2.131 |
haste | +1.894 |
Action | +1.850 |
hurry | +1.832 |
Neg logit contributions | |
yles | -2.513 |
roth | -2.186 |
hap | -2.048 |
estate | -1.989 |
heid | -1.930 |
Token | Sunday |
Token ID | 3502 |
Feature activation | +6.78e+00 |
Pos logit contributions | |
Attention | +5.096 |
anticipation | +4.747 |
haste | +4.185 |
hurry | +4.083 |
Action | +4.039 |
Neg logit contributions | |
yles | -5.824 |
roth | -5.146 |
hap | -4.792 |
estate | -4.677 |
heid | -4.576 |
Token | . |
Token ID | 13 |
Feature activation | +1.65e-01 |
Pos logit contributions | |
yles | +5.421 |
roth | +4.711 |
hap | +4.357 |
estate | +4.138 |
hood | +4.080 |
Neg logit contributions | |
Attention | -6.571 |
anticipation | -5.911 |
haste | -5.400 |
)", | -5.245 |
hurry | -5.237 |
Token | We |
Token ID | 775 |
Feature activation | -9.40e+00 |
Pos logit contributions | |
yles | +0.143 |
roth | +0.124 |
hap | +0.114 |
estate | +0.111 |
heid | +0.107 |
Neg logit contributions | |
Attention | -0.156 |
anticipation | -0.143 |
haste | -0.129 |
hurry | -0.125 |
Action | -0.124 |
Token | an |
Token ID | 281 |
Feature activation | -7.37e+00 |
Pos logit contributions | |
anticipation | +14.714 |
Attention | +14.356 |
response | +12.442 |
haste | +12.384 |
Action | +12.170 |
Neg logit contributions | |
yles | -18.617 |
roth | -16.120 |
estate | -15.690 |
hap | -15.255 |
hood | -14.464 |
Token | interview |
Token ID | 2720 |
Feature activation | +6.92e-01 |
Pos logit contributions | |
Attention | +7.160 |
anticipation | +6.672 |
haste | +5.992 |
Action | +5.910 |
hurry | +5.850 |
Neg logit contributions | |
yles | -5.996 |
roth | -5.135 |
hap | -4.777 |
estate | -4.610 |
heid | -4.407 |
Token | with |
Token ID | 351 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
yles | +0.649 |
roth | +0.568 |
hap | +0.529 |
estate | +0.514 |
heid | +0.499 |
Neg logit contributions | |
Attention | -0.604 |
anticipation | -0.547 |
haste | -0.488 |
hurry | -0.474 |
Action | -0.468 |
Token | the |
Token ID | 262 |
Feature activation | -7.19e+00 |
Pos logit contributions | |
Attention | +2.910 |
anticipation | +2.639 |
haste | +2.350 |
Action | +2.335 |
hurry | +2.283 |
Neg logit contributions | |
yles | -3.036 |
roth | -2.636 |
hap | -2.448 |
estate | -2.405 |
hood | -2.304 |
Token | Daily |
Token ID | 6714 |
Feature activation | -5.27e+00 |
Pos logit contributions | |
Attention | +5.597 |
anticipation | +5.049 |
Action | +4.452 |
haste | +4.371 |
hurry | +4.274 |
Neg logit contributions | |
yles | -7.201 |
roth | -6.307 |
hap | -5.934 |
estate | -5.859 |
onyms | -5.623 |
Token | in |
Token ID | 287 |
Feature activation | -3.06e+01 |
Pos logit contributions | |
Attention | +3.856 |
anticipation | +3.339 |
Action | +2.933 |
haste | +2.844 |
hurry | +2.782 |
Neg logit contributions | |
yles | -5.704 |
roth | -5.110 |
hap | -4.723 |
estate | -4.714 |
heid | -4.551 |
Token | November |
Token ID | 3389 |
Feature activation | -2.42e+00 |
Pos logit contributions | |
anticipation | +19.824 |
Attention | +19.263 |
response | +17.132 |
haste | +17.050 |
Action | +16.699 |
Neg logit contributions | |
yles | -21.561 |
roth | -18.535 |
estate | -18.376 |
hap | -17.520 |
inctions | -16.351 |
Token | that |
Token ID | 326 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
Attention | +2.067 |
anticipation | +1.892 |
haste | +1.675 |
Action | +1.631 |
hurry | +1.623 |
Neg logit contributions | |
yles | -2.309 |
roth | -2.016 |
hap | -1.890 |
estate | -1.844 |
heid | -1.768 |
Token | his |
Token ID | 465 |
Feature activation | -6.35e+00 |
Pos logit contributions | |
Attention | +8.471 |
anticipation | +7.789 |
Action | +6.686 |
haste | +6.534 |
hurry | +6.400 |
Neg logit contributions | |
yles | -11.868 |
roth | -10.552 |
hap | -10.023 |
estate | -9.764 |
onyms | -9.339 |
Token | campaign |
Token ID | 1923 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
Attention | +5.329 |
anticipation | +4.948 |
haste | +4.374 |
hurry | +4.283 |
Action | +4.252 |
Neg logit contributions | |
yles | -6.033 |
roth | -5.231 |
hap | -4.993 |
estate | -4.790 |
onyms | -4.647 |
Token | does |
Token ID | 857 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
Attention | +8.500 |
anticipation | +7.915 |
haste | +6.765 |
Action | +6.756 |
directed | +6.687 |
Neg logit contributions | |
yles | -10.227 |
roth | -8.939 |
hap | -8.608 |
estate | -8.212 |
onyms | -8.067 |
Token | as |
Token ID | 355 |
Feature activation | +6.90e+00 |
Pos logit contributions | |
yles | +10.602 |
roth | +9.228 |
hood | +8.636 |
hap | +8.568 |
heid | +8.303 |
Neg logit contributions | |
Attention | -14.017 |
anticipation | -12.603 |
)", | -11.474 |
Action | -11.314 |
haste | -11.048 |
Token | a |
Token ID | 257 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
yles | +6.405 |
roth | +5.644 |
hap | +5.289 |
estate | +5.094 |
heid | +5.086 |
Neg logit contributions | |
Attention | -5.669 |
anticipation | -5.120 |
haste | -4.462 |
Action | -4.375 |
)", | -4.337 |
Token | violent |
Token ID | 6590 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
yles | +1.667 |
roth | +1.462 |
hap | +1.365 |
estate | +1.322 |
heid | +1.292 |
Neg logit contributions | |
Attention | -1.524 |
anticipation | -1.379 |
haste | -1.223 |
hurry | -1.184 |
Action | -1.180 |
Token | extremist |
Token ID | 20440 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
Attention | +1.809 |
anticipation | +1.656 |
haste | +1.500 |
hurry | +1.463 |
Action | +1.450 |
Neg logit contributions | |
yles | -1.711 |
roth | -1.474 |
hap | -1.364 |
estate | -1.331 |
onyms | -1.267 |
Token | . |
Token ID | 13 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
yles | +0.208 |
roth | +0.181 |
hap | +0.169 |
estate | +0.164 |
heid | +0.159 |
Neg logit contributions | |
Attention | -0.204 |
anticipation | -0.185 |
haste | -0.166 |
hurry | -0.161 |
Action | -0.160 |
Token | In |
Token ID | 554 |
Feature activation | -3.06e+01 |
Pos logit contributions | |
Attention | +9.115 |
anticipation | +7.608 |
Action | +6.983 |
Intent | +6.503 |
haste | +6.347 |
Neg logit contributions | |
yles | -13.212 |
roth | -11.516 |
hap | -11.158 |
estate | -10.749 |
onyms | -10.407 |
Token | April |
Token ID | 3035 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
anticipation | +20.209 |
Attention | +18.580 |
response | +17.470 |
haste | +17.351 |
action | +16.257 |
Neg logit contributions | |
yles | -22.325 |
roth | -18.235 |
estate | -17.563 |
hap | -17.291 |
ebin | -16.566 |
Token | 1961 |
Token ID | 20510 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
Attention | +2.717 |
anticipation | +2.414 |
haste | +1.975 |
Action | +1.866 |
hurry | +1.861 |
Neg logit contributions | |
yles | -5.840 |
roth | -5.248 |
hap | -4.996 |
estate | -4.899 |
heid | -4.750 |
Token | , |
Token ID | 11 |
Feature activation | -6.97e+00 |
Pos logit contributions | |
Attention | +1.388 |
anticipation | +1.264 |
haste | +1.123 |
hurry | +1.089 |
Action | +1.081 |
Neg logit contributions | |
yles | -1.544 |
roth | -1.353 |
hap | -1.263 |
estate | -1.229 |
heid | -1.183 |
Token | the |
Token ID | 262 |
Feature activation | +3.89e+00 |
Pos logit contributions | |
Attention | +5.405 |
anticipation | +5.003 |
haste | +4.333 |
Action | +4.190 |
hurry | +4.171 |
Neg logit contributions | |
yles | -7.048 |
roth | -6.209 |
hap | -5.809 |
estate | -5.662 |
onyms | -5.418 |
Token | government |
Token ID | 1230 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
yles | +3.629 |
roth | +3.198 |
hap | +2.986 |
estate | +2.870 |
heid | +2.836 |
Neg logit contributions | |
Attention | -3.306 |
anticipation | -2.959 |
haste | -2.643 |
hurry | -2.558 |
)", | -2.552 |
Token | advanced |
Token ID | 6190 |
Feature activation | -3.19e+00 |
Pos logit contributions | |
Attention | +1.495 |
anticipation | +1.353 |
haste | +1.202 |
hurry | +1.160 |
Action | +1.156 |
Neg logit contributions | |
yles | -1.731 |
roth | -1.515 |
hap | -1.420 |
estate | -1.388 |
heid | -1.338 |
Token | calculus |
Token ID | 41443 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
Attention | +2.620 |
anticipation | +2.370 |
haste | +2.100 |
hurry | +2.012 |
Action | +2.001 |
Neg logit contributions | |
yles | -3.183 |
roth | -2.777 |
hap | -2.636 |
estate | -2.575 |
heid | -2.454 |
Token | . |
Token ID | 13 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
Attention | +3.768 |
anticipation | +3.406 |
haste | +3.034 |
hurry | +2.954 |
Action | +2.914 |
Neg logit contributions | |
yles | -4.407 |
roth | -3.881 |
hap | -3.631 |
estate | -3.559 |
heid | -3.442 |
Token |
|
Token ID | 198 |
Feature activation | -3.07e+00 |
Pos logit contributions | |
Attention | +10.156 |
anticipation | +8.363 |
Action | +8.017 |
Focus | +7.530 |
haste | +7.309 |
Neg logit contributions | |
yles | -11.205 |
roth | -9.715 |
hap | -9.291 |
estate | -9.172 |
onyms | -8.643 |
Token |
|
Token ID | 198 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
Attention | +2.958 |
anticipation | +2.693 |
haste | +2.436 |
Action | +2.389 |
hurry | +2.364 |
Neg logit contributions | |
yles | -2.627 |
roth | -2.233 |
hap | -2.065 |
estate | -2.013 |
onyms | -1.937 |
Token | In |
Token ID | 818 |
Feature activation | -3.06e+01 |
Pos logit contributions | |
Attention | +11.054 |
anticipation | +9.489 |
Begin | +9.113 |
Action | +8.785 |
Action | +8.484 |
Neg logit contributions | |
yles | -14.005 |
roth | -11.604 |
hap | -10.907 |
onyms | -10.734 |
estate | -10.650 |
Token | : |
Token ID | 25 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
Attention | +21.474 |
anticipation | +20.741 |
Action | +19.126 |
response | +18.472 |
action | +18.376 |
Neg logit contributions | |
yles | -19.878 |
roth | -15.460 |
hap | -14.965 |
ebin | -14.247 |
estate | -13.878 |
Token | " |
Token ID | 366 |
Feature activation | -7.88e+00 |
Pos logit contributions | |
Attention | +8.102 |
anticipation | +6.829 |
Action | +6.369 |
haste | +5.929 |
Focus | +5.761 |
Neg logit contributions | |
yles | -10.014 |
roth | -8.680 |
hap | -8.296 |
estate | -8.067 |
onyms | -7.713 |
Token | R |
Token ID | 49 |
Feature activation | +8.98e-01 |
Pos logit contributions | |
Attention | +6.679 |
anticipation | +5.841 |
Action | +5.253 |
haste | +5.203 |
Begin | +5.049 |
Neg logit contributions | |
yles | -7.418 |
roth | -6.317 |
hap | -5.944 |
estate | -5.743 |
onyms | -5.658 |
Token | acial |
Token ID | 18150 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
yles | +0.706 |
roth | +0.601 |
hap | +0.551 |
estate | +0.532 |
heid | +0.510 |
Neg logit contributions | |
Attention | -0.921 |
anticipation | -0.848 |
haste | -0.772 |
hurry | -0.753 |
Action | -0.747 |
Token | profiling |
Token ID | 31582 |
Feature activation | -4.26e+00 |
Pos logit contributions | |
Attention | +0.201 |
anticipation | +0.181 |
haste | +0.161 |
hurry | +0.156 |
Action | +0.155 |
Neg logit contributions | |
yles | -0.229 |
roth | -0.201 |
hap | -0.188 |
estate | -0.183 |
heid | -0.177 |
Token | itarian |
Token ID | 8353 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
Attention | +4.009 |
anticipation | +3.599 |
haste | +3.195 |
Action | +3.191 |
hurry | +3.126 |
Neg logit contributions | |
yles | -4.200 |
roth | -3.623 |
hap | -3.464 |
estate | -3.294 |
heid | -3.162 |
Token | Movement |
Token ID | 15477 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
Attention | +8.342 |
anticipation | +7.295 |
Action | +7.091 |
haste | +6.301 |
action | +6.261 |
Neg logit contributions | |
yles | -9.881 |
roth | -8.579 |
hap | -8.228 |
estate | -7.954 |
onyms | -7.444 |
Token | ( |
Token ID | 357 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
Attention | +9.272 |
anticipation | +8.113 |
Action | +7.573 |
directed | +7.024 |
haste | +7.009 |
Neg logit contributions | |
yles | -11.421 |
roth | -10.043 |
hap | -9.558 |
estate | -9.232 |
onyms | -8.745 |
Token | AK |
Token ID | 10206 |
Feature activation | -5.25e+00 |
Pos logit contributions | |
yles | +1.796 |
roth | +1.561 |
hap | +1.458 |
estate | +1.407 |
heid | +1.368 |
Neg logit contributions | |
Attention | -1.847 |
anticipation | -1.682 |
haste | -1.515 |
hurry | -1.477 |
Action | -1.447 |
Token | ) |
Token ID | 8 |
Feature activation | -9.44e+00 |
Pos logit contributions | |
Attention | +4.029 |
anticipation | +3.620 |
Action | +3.155 |
haste | +3.106 |
)", | +3.061 |
Neg logit contributions | |
yles | -5.361 |
roth | -4.748 |
estate | -4.435 |
hap | -4.419 |
heid | -4.233 |
Token | in |
Token ID | 287 |
Feature activation | -3.06e+01 |
Pos logit contributions | |
Attention | +7.522 |
anticipation | +6.722 |
Action | +6.072 |
haste | +5.851 |
directed | +5.682 |
Neg logit contributions | |
yles | -9.141 |
roth | -7.994 |
hap | -7.517 |
estate | -7.322 |
onyms | -6.976 |
Token | relation |
Token ID | 8695 |
Feature activation | +6.08e+00 |
Pos logit contributions | |
Attention | +20.212 |
anticipation | +20.185 |
Action | +18.622 |
action | +18.035 |
response | +17.500 |
Neg logit contributions | |
yles | -22.077 |
roth | -18.642 |
estate | -18.202 |
igham | -17.423 |
hap | -16.791 |
Token | to |
Token ID | 284 |
Feature activation | -3.22e+00 |
Pos logit contributions | |
yles | +4.838 |
roth | +4.225 |
hap | +3.839 |
estate | +3.706 |
heid | +3.658 |
Neg logit contributions | |
Attention | -5.866 |
anticipation | -5.330 |
haste | -4.835 |
hurry | -4.702 |
)", | -4.673 |
Token | the |
Token ID | 262 |
Feature activation | +8.90e-01 |
Pos logit contributions | |
Attention | +2.535 |
anticipation | +2.295 |
haste | +2.009 |
Action | +1.944 |
hurry | +1.928 |
Neg logit contributions | |
yles | -3.304 |
roth | -2.920 |
hap | -2.737 |
estate | -2.686 |
heid | -2.598 |
Token | present |
Token ID | 1944 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
yles | +0.862 |
roth | +0.758 |
hap | +0.709 |
estate | +0.689 |
heid | +0.669 |
Neg logit contributions | |
Attention | -0.748 |
anticipation | -0.674 |
haste | -0.599 |
hurry | -0.580 |
Action | -0.573 |
Token | political |
Token ID | 1964 |
Feature activation | +6.49e+00 |
Pos logit contributions | |
yles | +1.924 |
roth | +1.649 |
hap | +1.523 |
estate | +1.473 |
heid | +1.430 |
Neg logit contributions | |
Attention | -2.228 |
anticipation | -2.030 |
haste | -1.832 |
hurry | -1.786 |
Action | -1.773 |
Token | cancer |
Token ID | 4890 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
yles | +3.747 |
roth | +3.265 |
hap | +3.079 |
estate | +2.956 |
hood | +2.876 |
Neg logit contributions | |
Attention | -3.571 |
anticipation | -3.249 |
haste | -2.920 |
hurry | -2.815 |
)", | -2.782 |
Token | and |
Token ID | 290 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
yles | +1.486 |
roth | +1.299 |
hap | +1.209 |
estate | +1.174 |
hood | +1.137 |
Neg logit contributions | |
Attention | -1.440 |
anticipation | -1.304 |
haste | -1.172 |
hurry | -1.137 |
Action | -1.118 |
Token | one |
Token ID | 530 |
Feature activation | +6.80e+00 |
Pos logit contributions | |
yles | +11.661 |
roth | +10.366 |
hap | +10.030 |
hood | +9.633 |
estate | +9.499 |
Neg logit contributions | |
Attention | -9.535 |
anticipation | -8.314 |
haste | -7.856 |
;;;;;;;; | -7.368 |
hurry | -7.365 |
Token | of |
Token ID | 286 |
Feature activation | +7.72e+00 |
Pos logit contributions | |
yles | +5.946 |
roth | +5.114 |
hap | +4.850 |
estate | +4.683 |
hood | +4.671 |
Neg logit contributions | |
Attention | -6.039 |
anticipation | -5.358 |
haste | -4.867 |
)", | -4.691 |
hurry | -4.662 |
Token | the |
Token ID | 262 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
yles | +6.714 |
roth | +5.825 |
hap | +5.552 |
estate | +5.155 |
hood | +5.119 |
Neg logit contributions | |
Attention | -6.670 |
anticipation | -5.999 |
haste | -5.426 |
hurry | -5.321 |
)", | -5.184 |
Token | hardest |
Token ID | 17612 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
yles | +14.251 |
roth | +12.104 |
memorial | +11.857 |
hap | +11.286 |
hood | +11.280 |
Neg logit contributions | |
Attention | -14.554 |
anticipation | -12.380 |
haste | -11.573 |
ÃÂ | -11.427 |
)", | -11.411 |
Token | things |
Token ID | 1243 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
yles | +14.238 |
hood | +11.133 |
roth | +10.925 |
memorial | +10.893 |
hap | +10.888 |
Neg logit contributions | |
Attention | -15.759 |
anticipation | -13.671 |
haste | -12.672 |
Begin | -12.378 |
hurry | -12.315 |
Token | I |
Token ID | 314 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
yles | +11.395 |
roth | +9.677 |
hood | +9.166 |
hap | +9.080 |
estate | +8.704 |
Neg logit contributions | |
Attention | -11.213 |
anticipation | -9.915 |
haste | -9.224 |
hurry | -8.836 |
Begin | -8.475 |
Token | have |
Token ID | 423 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
yles | +10.728 |
roth | +9.037 |
hap | +8.717 |
hood | +8.526 |
estate | +8.200 |
Neg logit contributions | |
Attention | -13.067 |
anticipation | -11.524 |
haste | -10.420 |
;;;;;;;; | -10.062 |
Begin | -9.973 |
Token | dealt |
Token ID | 11829 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
yles | +1.750 |
roth | +1.510 |
hap | +1.404 |
estate | +1.350 |
hood | +1.315 |
Neg logit contributions | |
Attention | -1.937 |
anticipation | -1.759 |
haste | -1.586 |
hurry | -1.544 |
Action | -1.531 |
Token | with |
Token ID | 351 |
Feature activation | +7.08e+00 |
Pos logit contributions | |
yles | +8.836 |
roth | +7.279 |
hap | +6.592 |
estate | +6.541 |
hood | +6.484 |
Neg logit contributions | |
Attention | -11.773 |
anticipation | -10.753 |
haste | -10.073 |
hurry | -9.901 |
Action | -9.643 |
Token | salary |
Token ID | 9588 |
Feature activation | +2.73e+00 |
Pos logit contributions | |
yles | +7.834 |
roth | +6.860 |
hap | +6.315 |
estate | +6.301 |
hood | +6.290 |
Neg logit contributions | |
Attention | -7.363 |
anticipation | -6.603 |
)", | -5.980 |
haste | -5.976 |
Action | -5.743 |
Token | , |
Token ID | 11 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
yles | +2.491 |
roth | +2.173 |
hap | +2.004 |
estate | +1.962 |
hood | +1.916 |
Neg logit contributions | |
Attention | -2.426 |
anticipation | -2.184 |
haste | -1.968 |
hurry | -1.907 |
)", | -1.899 |
Token | making |
Token ID | 1642 |
Feature activation | -3.17e+00 |
Pos logit contributions | |
yles | +0.393 |
roth | +0.348 |
hap | +0.327 |
estate | +0.319 |
heid | +0.310 |
Neg logit contributions | |
Attention | -0.295 |
anticipation | -0.264 |
haste | -0.232 |
hurry | -0.224 |
Action | -0.221 |
Token | their |
Token ID | 511 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
Attention | +2.300 |
anticipation | +2.087 |
haste | +1.816 |
hurry | +1.736 |
Action | +1.705 |
Neg logit contributions | |
yles | -3.416 |
roth | -3.062 |
hap | -2.895 |
estate | -2.806 |
heid | -2.764 |
Token | Bird |
Token ID | 14506 |
Feature activation | +4.73e+00 |
Pos logit contributions | |
yles | +1.122 |
roth | +0.986 |
hap | +0.919 |
estate | +0.896 |
hood | +0.865 |
Neg logit contributions | |
Attention | -0.996 |
anticipation | -0.898 |
haste | -0.799 |
hurry | -0.773 |
Action | -0.769 |
Token | Rights |
Token ID | 6923 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
yles | +4.048 |
roth | +3.518 |
hap | +3.219 |
estate | +3.162 |
hood | +3.093 |
Neg logit contributions | |
Attention | -4.405 |
anticipation | -4.021 |
haste | -3.665 |
hurry | -3.560 |
)", | -3.544 |
Token | , |
Token ID | 11 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
yles | +14.900 |
roth | +13.183 |
hood | +12.437 |
estate | +12.330 |
enshr | +12.290 |
Neg logit contributions | |
Attention | -11.874 |
anticipation | -10.421 |
)", | -9.692 |
haste | -9.190 |
ラン | -9.074 |
Token | rights |
Token ID | 2489 |
Feature activation | +7.36e+00 |
Pos logit contributions | |
Attention | +0.853 |
anticipation | +0.769 |
haste | +0.679 |
hurry | +0.656 |
Action | +0.653 |
Neg logit contributions | |
yles | -1.035 |
roth | -0.911 |
hap | -0.855 |
estate | -0.832 |
heid | -0.809 |
Token | that |
Token ID | 326 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
yles | +6.284 |
roth | +5.439 |
hap | +4.976 |
estate | +4.879 |
hood | +4.866 |
Neg logit contributions | |
Attention | -6.660 |
anticipation | -5.916 |
haste | -5.358 |
)", | -5.339 |
hurry | -5.320 |
Token | allow |
Token ID | 1249 |
Feature activation | -4.16e+00 |
Pos logit contributions | |
yles | +2.245 |
roth | +1.969 |
hap | +1.841 |
estate | +1.800 |
hood | +1.747 |
Neg logit contributions | |
Attention | -1.940 |
anticipation | -1.739 |
haste | -1.547 |
hurry | -1.492 |
)", | -1.480 |
Token | the |
Token ID | 262 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
Attention | +2.977 |
anticipation | +2.690 |
haste | +2.315 |
hurry | +2.228 |
Action | +2.213 |
Neg logit contributions | |
yles | -4.478 |
roth | -4.033 |
hap | -3.847 |
estate | -3.711 |
heid | -3.618 |
Token | heard |
Token ID | 2982 |
Feature activation | +8.84e+00 |
Pos logit contributions | |
Attention | +2.437 |
anticipation | +2.219 |
haste | +2.001 |
hurry | +1.952 |
Action | +1.939 |
Neg logit contributions | |
yles | -2.405 |
roth | -2.069 |
hap | -1.924 |
estate | -1.880 |
heid | -1.809 |
Token | that |
Token ID | 326 |
Feature activation | +9.50e+00 |
Pos logit contributions | |
yles | +7.994 |
roth | +7.077 |
hap | +6.640 |
hood | +6.395 |
estate | +6.374 |
Neg logit contributions | |
Attention | -7.148 |
anticipation | -6.396 |
haste | -5.670 |
)", | -5.604 |
hurry | -5.443 |
Token | can |
Token ID | 460 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
yles | +8.818 |
roth | +7.813 |
hap | +7.370 |
estate | +7.137 |
hood | +7.044 |
Neg logit contributions | |
Attention | -7.413 |
anticipation | -6.669 |
haste | -5.905 |
)", | -5.720 |
hurry | -5.551 |
Token | equal |
Token ID | 4961 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
yles | +12.482 |
roth | +10.934 |
hap | +10.403 |
hood | +9.762 |
estate | +9.750 |
Neg logit contributions | |
Attention | -11.754 |
anticipation | -10.343 |
haste | -9.169 |
)", | -8.987 |
Action | -8.617 |
Token | or |
Token ID | 393 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
yles | +11.821 |
roth | +10.471 |
hap | +9.983 |
hood | +9.475 |
estate | +9.356 |
Neg logit contributions | |
Attention | -10.493 |
anticipation | -9.310 |
haste | -8.481 |
)", | -8.322 |
hurry | -8.264 |
Token | exceed |
Token ID | 7074 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
yles | +10.298 |
roth | +8.799 |
hap | +8.114 |
estate | +7.665 |
hood | +7.492 |
Neg logit contributions | |
Attention | -11.909 |
anticipation | -10.383 |
haste | -9.485 |
)", | -9.283 |
Action | -9.281 |
Token | the |
Token ID | 262 |
Feature activation | +7.88e+00 |
Pos logit contributions | |
yles | +15.571 |
roth | +13.801 |
hap | +13.396 |
hood | +12.648 |
enshr | +12.328 |
Neg logit contributions | |
Attention | -12.626 |
anticipation | -11.182 |
)", | -10.171 |
hurry | -10.121 |
haste | -10.097 |
Token | Silver |
Token ID | 7698 |
Feature activation | +5.50e+00 |
Pos logit contributions | |
yles | +7.358 |
roth | +6.513 |
hap | +6.111 |
estate | +5.856 |
hood | +5.820 |
Neg logit contributions | |
Attention | -6.232 |
anticipation | -5.568 |
haste | -4.988 |
)", | -4.934 |
hurry | -4.924 |
Token | Phant |
Token ID | 38699 |
Feature activation | +3.95e+00 |
Pos logit contributions | |
yles | +5.832 |
roth | +5.265 |
hap | +4.912 |
estate | +4.768 |
hood | +4.743 |
Neg logit contributions | |
Attention | -3.883 |
anticipation | -3.451 |
haste | -3.059 |
hurry | -2.941 |
)", | -2.847 |
Token | oms |
Token ID | 3150 |
Feature activation | +3.86e+00 |
Pos logit contributions | |
yles | +2.498 |
roth | +2.036 |
hap | +1.795 |
hood | +1.699 |
estate | +1.682 |
Neg logit contributions | |
Attention | -4.656 |
anticipation | -4.316 |
haste | -4.002 |
hurry | -3.923 |
Action | -3.851 |
Token | � |
Token ID | 447 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
yles | +3.771 |
roth | +3.363 |
hap | +3.140 |
estate | +3.026 |
hood | +2.968 |
Neg logit contributions | |
Attention | -3.134 |
anticipation | -2.818 |
haste | -2.519 |
hurry | -2.425 |
)", | -2.415 |
Token | last |
Token ID | 938 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
Attention | +3.465 |
anticipation | +3.168 |
haste | +2.786 |
hurry | +2.677 |
Action | +2.655 |
Neg logit contributions | |
yles | -4.536 |
roth | -4.031 |
hap | -3.724 |
estate | -3.683 |
heid | -3.586 |
Token | count |
Token ID | 954 |
Feature activation | -4.10e+00 |
Pos logit contributions | |
yles | +1.394 |
roth | +1.212 |
hap | +1.136 |
estate | +1.102 |
hood | +1.063 |
Neg logit contributions | |
Attention | -1.360 |
anticipation | -1.230 |
haste | -1.102 |
hurry | -1.069 |
Action | -1.058 |
Token | -- |
Token ID | 1377 |
Feature activation | +7.53e+00 |
Pos logit contributions | |
Attention | +3.293 |
anticipation | +3.010 |
haste | +2.651 |
Action | +2.559 |
hurry | +2.533 |
Neg logit contributions | |
yles | -4.085 |
roth | -3.590 |
hap | -3.371 |
estate | -3.293 |
heid | -3.180 |
Token | held |
Token ID | 2714 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
yles | +6.570 |
roth | +5.776 |
hap | +5.416 |
estate | +5.279 |
hood | +5.196 |
Neg logit contributions | |
Attention | -6.656 |
anticipation | -5.906 |
haste | -5.332 |
hurry | -5.149 |
)", | -5.120 |
Token | at |
Token ID | 379 |
Feature activation | +6.70e+00 |
Pos logit contributions | |
yles | +3.316 |
roth | +2.946 |
hap | +2.739 |
estate | +2.679 |
hood | +2.608 |
Neg logit contributions | |
Attention | -2.728 |
anticipation | -2.425 |
haste | -2.165 |
hurry | -2.098 |
)", | -2.081 |
Token | least |
Token ID | 1551 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
yles | +4.970 |
roth | +4.292 |
hap | +3.882 |
estate | +3.767 |
hood | +3.632 |
Neg logit contributions | |
Attention | -6.724 |
anticipation | -6.133 |
haste | -5.652 |
)", | -5.537 |
hurry | -5.504 |
Token | five |
Token ID | 1936 |
Feature activation | -9.77e-01 |
Pos logit contributions | |
yles | +12.146 |
roth | +11.025 |
hood | +9.995 |
estate | +9.989 |
hap | +9.850 |
Neg logit contributions | |
Attention | -14.115 |
anticipation | -12.380 |
)", | -11.879 |
;;;;;;;; | -11.672 |
ラン | -11.609 |
Token | restaurants |
Token ID | 10808 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
Attention | +0.818 |
anticipation | +0.741 |
haste | +0.656 |
hurry | +0.636 |
Action | +0.630 |
Neg logit contributions | |
yles | -0.953 |
roth | -0.837 |
hap | -0.786 |
estate | -0.762 |
heid | -0.740 |
Token | prior |
Token ID | 3161 |
Feature activation | +7.97e+00 |
Pos logit contributions | |
Attention | +1.166 |
anticipation | +1.058 |
haste | +0.934 |
hurry | +0.905 |
Action | +0.899 |
Neg logit contributions | |
yles | -1.397 |
roth | -1.229 |
hap | -1.150 |
estate | -1.121 |
heid | -1.087 |
Token | . |
Token ID | 13 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
yles | +6.498 |
roth | +5.549 |
hap | +5.199 |
estate | +4.998 |
hood | +4.863 |
Neg logit contributions | |
Attention | -7.544 |
anticipation | -6.806 |
haste | -6.206 |
)", | -6.081 |
hurry | -6.053 |
Token | That |
Token ID | 1320 |
Feature activation | -4.27e-01 |
Pos logit contributions | |
yles | +2.420 |
roth | +2.127 |
hap | +1.971 |
estate | +1.909 |
heid | +1.856 |
Neg logit contributions | |
Attention | -2.387 |
anticipation | -2.195 |
haste | -1.981 |
hurry | -1.926 |
)", | -1.888 |
Token | bigger |
Token ID | 5749 |
Feature activation | +8.29e+00 |
Pos logit contributions | |
yles | +7.134 |
roth | +6.294 |
hap | +5.921 |
hood | +5.659 |
estate | +5.595 |
Neg logit contributions | |
Attention | -6.047 |
anticipation | -5.400 |
haste | -4.679 |
)", | -4.565 |
Action | -4.515 |
Token | problem |
Token ID | 1917 |
Feature activation | +7.02e+00 |
Pos logit contributions | |
yles | +7.027 |
roth | +6.060 |
hap | +5.721 |
hood | +5.529 |
estate | +5.481 |
Neg logit contributions | |
Attention | -7.241 |
anticipation | -6.476 |
haste | -5.816 |
)", | -5.707 |
Begin | -5.636 |
Token | . |
Token ID | 13 |
Feature activation | +7.09e+00 |
Pos logit contributions | |
yles | +6.000 |
roth | +5.232 |
hap | +4.924 |
estate | +4.730 |
hood | +4.683 |
Neg logit contributions | |
Attention | -6.307 |
anticipation | -5.668 |
haste | -5.097 |
Action | -4.922 |
hurry | -4.848 |
Token | I |
Token ID | 314 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
yles | +6.788 |
roth | +6.035 |
hap | +5.704 |
hood | +5.519 |
heid | +5.506 |
Neg logit contributions | |
Attention | -5.205 |
anticipation | -4.958 |
haste | -4.419 |
hurry | -4.239 |
)", | -4.023 |
Token | don |
Token ID | 836 |
Feature activation | -7.76e+00 |
Pos logit contributions | |
yles | +11.777 |
roth | +10.745 |
hap | +10.259 |
estate | +9.720 |
hood | +9.659 |
Neg logit contributions | |
Attention | -12.641 |
anticipation | -11.092 |
haste | -9.746 |
;;;;;;;; | -9.741 |
ラン | -9.539 |
Token | 't |
Token ID | 470 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
Attention | +2.997 |
anticipation | +2.431 |
haste | +1.794 |
)", | +1.729 |
Action | +1.683 |
Neg logit contributions | |
yles | -10.744 |
roth | -9.712 |
hap | -9.251 |
estate | -9.155 |
onyms | -9.009 |
Token | think |
Token ID | 892 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
yles | +12.185 |
roth | +11.270 |
hap | +10.847 |
hood | +10.036 |
estate | +9.896 |
Neg logit contributions | |
Attention | -16.646 |
anticipation | -14.520 |
ラン | -13.378 |
;;;;;;;; | -13.259 |
ÃÂ | -13.169 |
Token | you |
Token ID | 345 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
yles | +13.611 |
roth | +11.885 |
hap | +11.493 |
hood | +11.179 |
enshr | +11.131 |
Neg logit contributions | |
Attention | -11.138 |
anticipation | -9.946 |
ラン | -8.987 |
ÃÂ | -8.861 |
;;;;;;;; | -8.632 |
Token | can |
Token ID | 460 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
yles | +12.263 |
roth | +11.204 |
hap | +10.738 |
enshr | +10.143 |
hood | +10.080 |
Neg logit contributions | |
Attention | -14.419 |
anticipation | -12.866 |
ラン | -11.740 |
;;;;;;;; | -11.512 |
Action | -11.209 |
Token | start |
Token ID | 923 |
Feature activation | +1.84e+01 |
Pos logit contributions | |
yles | +16.303 |
roth | +14.654 |
hap | +14.573 |
memorial | +13.827 |
acles | +13.377 |
Neg logit contributions | |
Attention | -15.938 |
anticipation | -13.269 |
ラン | -12.163 |
ÃÂ | -12.012 |
;;;;;;;; | -11.760 |
Token | blaming |
Token ID | 24630 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
yles | +14.563 |
roth | +12.838 |
hap | +12.449 |
hood | +12.057 |
heid | +12.036 |
Neg logit contributions | |
Attention | -13.379 |
anticipation | -11.266 |
Begin | -10.349 |
ÃÂ | -10.237 |
;;;;;;;; | -10.236 |
Token | to |
Token ID | 284 |
Feature activation | +5.49e+00 |
Pos logit contributions | |
yles | +4.952 |
roth | +4.304 |
hap | +4.002 |
estate | +3.920 |
hood | +3.859 |
Neg logit contributions | |
Attention | -4.916 |
anticipation | -4.360 |
haste | -3.965 |
Action | -3.847 |
hurry | -3.803 |
Token | vac |
Token ID | 6658 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
yles | +4.938 |
roth | +4.348 |
hap | +4.034 |
estate | +3.936 |
hood | +3.852 |
Neg logit contributions | |
Attention | -4.837 |
anticipation | -4.321 |
haste | -3.830 |
Action | -3.760 |
)", | -3.727 |
Token | ate |
Token ID | 378 |
Feature activation | +9.35e+00 |
Pos logit contributions | |
yles | +0.328 |
roth | +0.274 |
hap | +0.248 |
estate | +0.238 |
heid | +0.227 |
Neg logit contributions | |
Attention | -0.510 |
anticipation | -0.472 |
haste | -0.433 |
hurry | -0.423 |
Action | -0.420 |
Token | the |
Token ID | 262 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
yles | +8.777 |
roth | +7.730 |
hap | +7.323 |
estate | +7.241 |
hood | +7.009 |
Neg logit contributions | |
Attention | -7.339 |
anticipation | -6.427 |
haste | -5.762 |
)", | -5.648 |
hurry | -5.540 |
Token | White |
Token ID | 2635 |
Feature activation | +7.09e+00 |
Pos logit contributions | |
yles | +9.227 |
roth | +8.091 |
hap | +7.405 |
estate | +7.237 |
hood | +6.986 |
Neg logit contributions | |
Attention | -9.861 |
anticipation | -8.841 |
haste | -8.022 |
)", | -8.003 |
Begin | -7.769 |
Token | House |
Token ID | 2097 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
yles | +5.703 |
roth | +4.943 |
hap | +4.492 |
estate | +4.399 |
hood | +4.381 |
Neg logit contributions | |
Attention | -6.552 |
anticipation | -6.137 |
haste | -5.615 |
hurry | -5.472 |
)", | -5.292 |
Token | for |
Token ID | 329 |
Feature activation | +5.23e-02 |
Pos logit contributions | |
yles | +3.084 |
roth | +2.707 |
hap | +2.544 |
estate | +2.471 |
hood | +2.381 |
Neg logit contributions | |
Attention | -2.760 |
anticipation | -2.481 |
haste | -2.215 |
)", | -2.137 |
hurry | -2.131 |
Token | another |
Token ID | 1194 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
yles | +0.051 |
roth | +0.045 |
hap | +0.042 |
estate | +0.041 |
heid | +0.039 |
Neg logit contributions | |
Attention | -0.044 |
anticipation | -0.040 |
haste | -0.035 |
hurry | -0.034 |
Action | -0.034 |
Token | half |
Token ID | 2063 |
Feature activation | +1.88e+01 |
Pos logit contributions | |
yles | +9.833 |
roth | +8.402 |
hap | +7.876 |
estate | +7.853 |
hood | +7.488 |
Neg logit contributions | |
Attention | -9.540 |
anticipation | -8.305 |
haste | -7.449 |
)", | -7.381 |
Action | -7.258 |
Token | - |
Token ID | 12 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
yles | +13.560 |
roth | +11.305 |
hood | +10.828 |
estate | +10.678 |
hap | +10.584 |
Neg logit contributions | |
Attention | -15.709 |
anticipation | -13.611 |
)", | -12.875 |
;;;;;;;; | -12.543 |
ÃÂ | -12.083 |
Token | month |
Token ID | 8424 |
Feature activation | -3.94e+00 |
Pos logit contributions | |
yles | +8.959 |
roth | +7.583 |
estate | +7.223 |
hap | +6.894 |
hood | +6.672 |
Neg logit contributions | |
Attention | -13.532 |
anticipation | -12.388 |
haste | -11.337 |
)", | -11.300 |
;;;;;;;; | -11.265 |
Token |
|
Token ID | 198 |
Feature activation | -7.37e+00 |
Pos logit contributions | |
yles | +4.018 |
roth | +3.437 |
hap | +3.110 |
estate | +3.034 |
heid | +2.937 |
Neg logit contributions | |
Attention | -5.334 |
anticipation | -4.938 |
haste | -4.518 |
hurry | -4.394 |
)", | -4.374 |
Token |
|
Token ID | 198 |
Feature activation | -3.88e+00 |
Pos logit contributions | |
Attention | +6.405 |
anticipation | +5.763 |
haste | +5.141 |
Action | +5.125 |
hurry | +4.968 |
Neg logit contributions | |
yles | -6.835 |
roth | -5.798 |
hap | -5.466 |
estate | -5.354 |
onyms | -5.239 |
Token | Good |
Token ID | 10248 |
Feature activation | +6.41e+00 |
Pos logit contributions | |
Attention | +3.274 |
anticipation | +2.977 |
haste | +2.637 |
hurry | +2.547 |
Action | +2.540 |
Neg logit contributions | |
yles | -3.707 |
roth | -3.199 |
hap | -2.980 |
estate | -2.889 |
heid | -2.820 |
Token | updates |
Token ID | 5992 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
yles | +5.623 |
roth | +4.875 |
hap | +4.472 |
estate | +4.409 |
hood | +4.320 |
Neg logit contributions | |
Attention | -5.671 |
anticipation | -5.020 |
haste | -4.553 |
)", | -4.451 |
hurry | -4.447 |
Token | ? |
Token ID | 30 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
Attention | +8.367 |
anticipation | +7.567 |
haste | +6.534 |
hurry | +6.450 |
Action | +6.163 |
Neg logit contributions | |
yles | -15.905 |
roth | -13.944 |
hap | -13.476 |
estate | -12.999 |
onyms | -12.816 |
Token | No |
Token ID | 1400 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
Attention | +5.229 |
anticipation | +3.742 |
Action | +3.307 |
Focus | +2.888 |
haste | +2.832 |
Neg logit contributions | |
yles | -15.878 |
roth | -14.261 |
hap | -13.894 |
estate | -13.576 |
onyms | -13.265 |
Token | more |
Token ID | 517 |
Feature activation | -3.99e+00 |
Pos logit contributions | |
yles | +2.514 |
roth | +2.168 |
hap | +2.025 |
estate | +1.948 |
hood | +1.940 |
Neg logit contributions | |
Attention | -2.706 |
anticipation | -2.443 |
haste | -2.177 |
)", | -2.151 |
Action | -2.120 |
Token | bad |
Token ID | 2089 |
Feature activation | +4.41e+00 |
Pos logit contributions | |
Attention | +2.731 |
anticipation | +2.477 |
haste | +2.165 |
hurry | +2.096 |
Action | +2.019 |
Neg logit contributions | |
yles | -4.440 |
roth | -3.956 |
hap | -3.787 |
estate | -3.711 |
heid | -3.649 |
Token | news |
Token ID | 1705 |
Feature activation | +6.55e+00 |
Pos logit contributions | |
yles | +3.572 |
roth | +3.104 |
hap | +2.854 |
hood | +2.813 |
estate | +2.759 |
Neg logit contributions | |
Attention | -4.269 |
anticipation | -3.783 |
haste | -3.403 |
)", | -3.354 |
Action | -3.349 |
Token | pl |
Token ID | 458 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
yles | +5.742 |
roth | +5.057 |
hap | +4.728 |
estate | +4.618 |
hood | +4.542 |
Neg logit contributions | |
Attention | -5.722 |
anticipation | -4.985 |
haste | -4.422 |
Action | -4.417 |
;;;;;;;; | -4.323 |
Token | s |
Token ID | 82 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
Attention | +0.947 |
anticipation | +0.857 |
haste | +0.767 |
hurry | +0.743 |
Action | +0.735 |
Neg logit contributions | |
yles | -1.047 |
roth | -0.917 |
hap | -0.855 |
estate | -0.832 |
heid | -0.808 |
Token | marijuana |
Token ID | 5727 |
Feature activation | -5.10e+00 |
Pos logit contributions | |
Attention | +3.738 |
anticipation | +3.357 |
haste | +2.887 |
hurry | +2.809 |
Action | +2.792 |
Neg logit contributions | |
yles | -5.242 |
roth | -4.706 |
hap | -4.414 |
estate | -4.365 |
heid | -4.231 |
Token | . |
Token ID | 13 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
Attention | +3.981 |
anticipation | +3.613 |
haste | +3.160 |
Action | +3.066 |
hurry | +3.051 |
Neg logit contributions | |
yles | -5.141 |
roth | -4.601 |
hap | -4.339 |
estate | -4.178 |
heid | -4.105 |
Token |
|
Token ID | 198 |
Feature activation | +9.42e-01 |
Pos logit contributions | |
Attention | +0.724 |
anticipation | +0.661 |
haste | +0.594 |
hurry | +0.579 |
Action | +0.577 |
Neg logit contributions | |
yles | -0.663 |
roth | -0.573 |
hap | -0.531 |
estate | -0.514 |
heid | -0.495 |
Token |
|
Token ID | 198 |
Feature activation | -4.03e+00 |
Pos logit contributions | |
yles | +0.724 |
roth | +0.616 |
hap | +0.563 |
estate | +0.543 |
heid | +0.521 |
Neg logit contributions | |
Attention | -0.979 |
anticipation | -0.903 |
haste | -0.823 |
hurry | -0.804 |
Action | -0.795 |
Token | H |
Token ID | 39 |
Feature activation | -3.21e-02 |
Pos logit contributions | |
Attention | +3.331 |
anticipation | +3.002 |
haste | +2.635 |
Action | +2.582 |
)", | +2.573 |
Neg logit contributions | |
yles | -3.934 |
roth | -3.397 |
hap | -3.157 |
estate | -3.070 |
onyms | -3.010 |
Token | emp |
Token ID | 45787 |
Feature activation | +2.94e-01 |
Pos logit contributions | |
Attention | +0.023 |
anticipation | +0.021 |
haste | +0.018 |
hurry | +0.017 |
Action | +0.017 |
Neg logit contributions | |
yles | -0.035 |
roth | -0.031 |
hap | -0.029 |
estate | -0.029 |
heid | -0.028 |
Token | Supporters |
Token ID | 39995 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
yles | +0.279 |
roth | +0.245 |
hap | +0.228 |
estate | +0.222 |
heid | +0.215 |
Neg logit contributions | |
Attention | -0.253 |
anticipation | -0.229 |
haste | -0.204 |
hurry | -0.198 |
Action | -0.196 |
Token | State |
Token ID | 1812 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
yles | +0.207 |
roth | +0.183 |
hap | +0.172 |
estate | +0.168 |
heid | +0.163 |
Neg logit contributions | |
Attention | -0.161 |
anticipation | -0.144 |
haste | -0.127 |
hurry | -0.123 |
Action | -0.121 |
Token | Senators |
Token ID | 22195 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
Attention | +3.843 |
anticipation | +3.424 |
Action | +3.048 |
haste | +3.020 |
hurry | +2.964 |
Neg logit contributions | |
yles | -4.186 |
roth | -3.638 |
hap | -3.424 |
estate | -3.353 |
heid | -3.223 |
Token | Russell |
Token ID | 11563 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
yles | +1.525 |
roth | +1.346 |
hap | +1.259 |
estate | +1.223 |
heid | +1.186 |
Neg logit contributions | |
Attention | -1.298 |
anticipation | -1.173 |
haste | -1.043 |
hurry | -1.006 |
Action | -0.991 |
Token | Rud |
Token ID | 17421 |
Feature activation | +6.70e+00 |
Pos logit contributions | |
yles | +1.414 |
roth | +1.259 |
hap | +1.176 |
estate | +1.132 |
heid | +1.114 |
Neg logit contributions | |
Attention | -1.172 |
anticipation | -1.066 |
haste | -0.949 |
hurry | -0.912 |
)", | -0.897 |
Token |
|
Token ID | 198 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
yles | +10.141 |
roth | +8.668 |
hood | +7.897 |
hap | +7.853 |
ods | +7.777 |
Neg logit contributions | |
Attention | -10.203 |
anticipation | -9.814 |
haste | -9.141 |
hurry | -8.760 |
)", | -8.708 |
Token |
|
Token ID | 198 |
Feature activation | +6.33e+00 |
Pos logit contributions | |
yles | +1.108 |
roth | +0.942 |
hap | +0.860 |
estate | +0.827 |
hood | +0.796 |
Neg logit contributions | |
Attention | -1.532 |
anticipation | -1.415 |
haste | -1.290 |
hurry | -1.259 |
Action | -1.245 |
Token | That |
Token ID | 2504 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
yles | +5.834 |
roth | +5.298 |
hap | +4.901 |
estate | +4.734 |
hood | +4.728 |
Neg logit contributions | |
Attention | -5.272 |
anticipation | -4.836 |
haste | -4.374 |
hurry | -4.253 |
Action | -4.012 |
Token | is |
Token ID | 318 |
Feature activation | +8.25e+00 |
Pos logit contributions | |
yles | +2.140 |
roth | +1.901 |
hap | +1.784 |
estate | +1.738 |
hood | +1.695 |
Neg logit contributions | |
Attention | -1.638 |
anticipation | -1.455 |
haste | -1.287 |
hurry | -1.240 |
Action | -1.224 |
Token | something |
Token ID | 1223 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
yles | +7.511 |
roth | +6.664 |
hap | +6.257 |
hood | +6.042 |
ods | +5.892 |
Neg logit contributions | |
Attention | -6.767 |
anticipation | -5.935 |
haste | -5.410 |
)", | -5.150 |
hurry | -5.135 |
Token | they |
Token ID | 484 |
Feature activation | +3.36e+00 |
Pos logit contributions | |
yles | +10.182 |
roth | +8.919 |
hap | +8.149 |
hood | +8.109 |
oles | +7.802 |
Neg logit contributions | |
Attention | -10.379 |
anticipation | -9.062 |
haste | -8.255 |
)", | -8.117 |
hurry | -7.872 |
Token | all |
Token ID | 477 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
yles | +3.348 |
roth | +2.974 |
hap | +2.774 |
estate | +2.700 |
hood | +2.639 |
Neg logit contributions | |
Attention | -2.705 |
anticipation | -2.410 |
haste | -2.136 |
hurry | -2.035 |
Action | -2.031 |
Token | feel |
Token ID | 1254 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
yles | +10.562 |
roth | +9.189 |
hap | +8.464 |
hood | +8.463 |
estate | +8.170 |
Neg logit contributions | |
Attention | -10.310 |
anticipation | -8.979 |
haste | -8.025 |
)", | -7.853 |
Action | -7.793 |
Token | guilty |
Token ID | 6717 |
Feature activation | +6.85e+00 |
Pos logit contributions | |
yles | +9.365 |
roth | +8.118 |
hap | +7.670 |
hood | +7.573 |
estate | +7.347 |
Neg logit contributions | |
Attention | -8.908 |
anticipation | -7.704 |
haste | -7.050 |
)", | -6.933 |
hurry | -6.768 |
Token | about |
Token ID | 546 |
Feature activation | +9.91e+00 |
Pos logit contributions | |
yles | +6.791 |
roth | +5.969 |
hap | +5.566 |
hood | +5.530 |
estate | +5.485 |
Neg logit contributions | |
Attention | -5.294 |
anticipation | -4.568 |
haste | -4.133 |
)", | -3.983 |
hurry | -3.927 |
Token | — |
Token ID | 851 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
yles | +8.002 |
roth | +6.893 |
hap | +6.418 |
hood | +6.320 |
estate | +6.238 |
Neg logit contributions | |
Attention | -9.005 |
anticipation | -8.061 |
)", | -7.317 |
haste | -7.295 |
hurry | -7.035 |
Token | your |
Token ID | 534 |
Feature activation | +2.98e+00 |
Pos logit contributions | |
yles | +0.226 |
roth | +0.201 |
hap | +0.189 |
estate | +0.185 |
heid | +0.180 |
Neg logit contributions | |
Attention | -0.157 |
anticipation | -0.140 |
haste | -0.122 |
hurry | -0.117 |
Action | -0.116 |
Token | different |
Token ID | 1180 |
Feature activation | +9.86e+00 |
Pos logit contributions | |
yles | +2.691 |
roth | +2.337 |
hap | +2.178 |
estate | +2.111 |
hood | +2.048 |
Neg logit contributions | |
Attention | -2.669 |
anticipation | -2.416 |
haste | -2.170 |
hurry | -2.095 |
)", | -2.089 |
Token | media |
Token ID | 2056 |
Feature activation | +8.35e+00 |
Pos logit contributions | |
yles | +8.648 |
roth | +7.394 |
hap | +6.964 |
estate | +6.747 |
hood | +6.746 |
Neg logit contributions | |
Attention | -8.252 |
anticipation | -7.409 |
haste | -6.614 |
)", | -6.577 |
;;;;;;;; | -6.483 |
Token | outlets |
Token ID | 12527 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
yles | +6.936 |
roth | +5.931 |
hap | +5.553 |
hood | +5.378 |
estate | +5.341 |
Neg logit contributions | |
Attention | -7.526 |
anticipation | -6.700 |
)", | -6.093 |
haste | -6.058 |
hurry | -5.879 |
Token | . |
Token ID | 13 |
Feature activation | -8.14e+00 |
Pos logit contributions | |
Attention | +1.248 |
anticipation | +1.135 |
haste | +1.015 |
hurry | +0.985 |
Action | +0.977 |
Neg logit contributions | |
yles | -1.352 |
roth | -1.183 |
hap | -1.099 |
estate | -1.070 |
heid | -1.038 |
Token | Pixel |
Token ID | 11349 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
Attention | +6.239 |
anticipation | +5.295 |
Action | +4.862 |
haste | +4.533 |
Focus | +4.510 |
Neg logit contributions | |
yles | -8.539 |
roth | -7.457 |
hap | -7.097 |
estate | -6.896 |
onyms | -6.713 |
Token | pipe |
Token ID | 34360 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
yles | +0.893 |
roth | +0.760 |
hap | +0.697 |
estate | +0.671 |
hood | +0.639 |
Neg logit contributions | |
Attention | -1.274 |
anticipation | -1.170 |
haste | -1.071 |
hurry | -1.045 |
Action | -1.037 |
Token | supports |
Token ID | 6971 |
Feature activation | -5.00e+00 |
Pos logit contributions | |
Attention | +1.577 |
anticipation | +1.428 |
haste | +1.274 |
hurry | +1.234 |
Action | +1.231 |
Neg logit contributions | |
yles | -1.820 |
roth | -1.595 |
hap | -1.494 |
estate | -1.451 |
heid | -1.409 |
Token | over |
Token ID | 625 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
Attention | +4.358 |
anticipation | +3.972 |
haste | +3.554 |
Action | +3.490 |
hurry | +3.473 |
Neg logit contributions | |
yles | -4.633 |
roth | -4.057 |
hap | -3.784 |
estate | -3.695 |
heid | -3.614 |
Token | 110 |
Token ID | 9796 |
Feature activation | -2.81e+00 |
Pos logit contributions | |
yles | +9.404 |
roth | +8.111 |
hap | +7.427 |
hood | +7.110 |
heid | +7.012 |
Neg logit contributions | |
Attention | -12.894 |
anticipation | -11.928 |
haste | -10.833 |
)", | -10.660 |
;;;;;;;; | -10.638 |
Token | services |
Token ID | 2594 |
Feature activation | -8.69e+00 |
Pos logit contributions | |
Attention | +2.355 |
anticipation | +2.138 |
haste | +1.901 |
hurry | +1.851 |
Action | +1.849 |
Neg logit contributions | |
yles | -2.711 |
roth | -2.395 |
hap | -2.237 |
estate | -2.183 |
heid | -2.117 |
Token | . |
Token ID | 13 |
Feature activation | -3.30e+00 |
Pos logit contributions | |
yles | +2.222 |
roth | +1.945 |
hap | +1.815 |
estate | +1.758 |
hood | +1.703 |
Neg logit contributions | |
Attention | -2.084 |
anticipation | -1.879 |
haste | -1.676 |
hurry | -1.625 |
)", | -1.607 |
Token |
|
Token ID | 198 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
Attention | +2.769 |
anticipation | +2.470 |
haste | +2.165 |
Action | +2.155 |
hurry | +2.087 |
Neg logit contributions | |
yles | -3.248 |
roth | -2.857 |
hap | -2.681 |
estate | -2.621 |
heid | -2.514 |
Token |
|
Token ID | 198 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
Attention | +1.968 |
anticipation | +1.800 |
haste | +1.634 |
Action | +1.594 |
hurry | +1.586 |
Neg logit contributions | |
yles | -1.660 |
roth | -1.413 |
hap | -1.306 |
estate | -1.267 |
onyms | -1.214 |
Token | SF |
Token ID | 20802 |
Feature activation | -9.21e+00 |
Pos logit contributions | |
Attention | +2.274 |
anticipation | +2.061 |
haste | +1.824 |
Action | +1.778 |
hurry | +1.752 |
Neg logit contributions | |
yles | -2.579 |
roth | -2.238 |
hap | -2.087 |
estate | -2.031 |
onyms | -1.969 |
Token | PD |
Token ID | 5760 |
Feature activation | -1.52e+01 |
Pos logit contributions | |
Attention | +6.277 |
anticipation | +5.665 |
haste | +4.849 |
Action | +4.849 |
hurry | +4.606 |
Neg logit contributions | |
yles | -9.673 |
roth | -8.715 |
hap | -8.096 |
estate | -8.060 |
heid | -7.866 |
Token | and |
Token ID | 290 |
Feature activation | -3.87e+00 |
Pos logit contributions | |
Attention | +11.693 |
anticipation | +10.783 |
Action | +10.046 |
directed | +9.363 |
haste | +9.229 |
Neg logit contributions | |
yles | -13.551 |
roth | -11.476 |
estate | -10.882 |
hap | -10.833 |
heid | -10.652 |
Token | SF |
Token ID | 14362 |
Feature activation | -7.79e+00 |
Pos logit contributions | |
Attention | +2.970 |
anticipation | +2.689 |
haste | +2.342 |
Action | +2.292 |
hurry | +2.239 |
Neg logit contributions | |
yles | -4.028 |
roth | -3.564 |
hap | -3.335 |
estate | -3.270 |
heid | -3.176 |
Token | M |
Token ID | 44 |
Feature activation | -4.25e+00 |
Pos logit contributions | |
Attention | +5.991 |
anticipation | +5.419 |
Action | +4.744 |
haste | +4.742 |
hurry | +4.501 |
Neg logit contributions | |
yles | -7.701 |
roth | -6.844 |
hap | -6.313 |
estate | -6.297 |
onyms | -6.087 |
Token | TA |
Token ID | 5603 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
Attention | +2.739 |
anticipation | +2.385 |
haste | +2.027 |
Action | +1.986 |
hurry | +1.926 |
Neg logit contributions | |
yles | -4.884 |
roth | -4.415 |
hap | -4.175 |
estate | -4.110 |
onyms | -4.011 |
Token | parking |
Token ID | 7647 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
Attention | +13.987 |
anticipation | +12.907 |
Action | +12.177 |
directed | +11.337 |
action | +11.212 |
Neg logit contributions | |
yles | -16.532 |
roth | -14.055 |
heid | -13.183 |
estate | -13.006 |
hap | -12.981 |
Token | enforcement |
Token ID | 5394 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
Attention | +3.893 |
anticipation | +3.590 |
haste | +3.141 |
hurry | +3.037 |
Action | +3.032 |
Neg logit contributions | |
yles | -4.981 |
roth | -4.433 |
hap | -4.175 |
estate | -4.068 |
heid | -3.925 |
Token | the |
Token ID | 262 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
Attention | +0.065 |
anticipation | +0.058 |
haste | +0.051 |
hurry | +0.049 |
Action | +0.049 |
Neg logit contributions | |
yles | -0.084 |
roth | -0.075 |
hap | -0.070 |
estate | -0.068 |
heid | -0.066 |
Token | country |
Token ID | 1499 |
Feature activation | -3.08e+00 |
Pos logit contributions | |
Attention | +1.181 |
anticipation | +1.068 |
haste | +0.938 |
hurry | +0.909 |
Action | +0.905 |
Neg logit contributions | |
yles | -1.434 |
roth | -1.267 |
hap | -1.191 |
estate | -1.153 |
onyms | -1.121 |
Token | and |
Token ID | 290 |
Feature activation | -7.51e+00 |
Pos logit contributions | |
Attention | +2.588 |
anticipation | +2.373 |
haste | +2.092 |
hurry | +2.042 |
Action | +2.022 |
Neg logit contributions | |
yles | -2.970 |
roth | -2.616 |
hap | -2.445 |
estate | -2.348 |
heid | -2.299 |
Token | have |
Token ID | 423 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
Attention | +6.356 |
anticipation | +5.866 |
haste | +5.127 |
hurry | +5.098 |
Action | +4.980 |
Neg logit contributions | |
yles | -7.012 |
roth | -6.148 |
hap | -5.801 |
estate | -5.443 |
heid | -5.436 |
Token | been |
Token ID | 587 |
Feature activation | +8.74e-01 |
Pos logit contributions | |
Attention | +11.413 |
anticipation | +10.614 |
haste | +9.335 |
directed | +9.150 |
action | +8.960 |
Neg logit contributions | |
yles | -13.347 |
roth | -11.692 |
hap | -11.097 |
onyms | -10.779 |
estate | -10.632 |
Token | a |
Token ID | 257 |
Feature activation | -2.93e+00 |
Pos logit contributions | |
yles | +0.815 |
roth | +0.712 |
hap | +0.664 |
estate | +0.645 |
heid | +0.624 |
Neg logit contributions | |
Attention | -0.768 |
anticipation | -0.697 |
haste | -0.623 |
hurry | -0.604 |
Action | -0.599 |
Token | company |
Token ID | 1664 |
Feature activation | -5.98e+00 |
Pos logit contributions | |
Attention | +2.653 |
anticipation | +2.427 |
haste | +2.166 |
hurry | +2.132 |
Action | +2.088 |
Neg logit contributions | |
yles | -2.646 |
roth | -2.314 |
hap | -2.161 |
estate | -2.095 |
onyms | -2.020 |
Token | symbol |
Token ID | 6194 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
Attention | +5.353 |
anticipation | +4.941 |
haste | +4.365 |
hurry | +4.293 |
Action | +4.251 |
Neg logit contributions | |
yles | -5.348 |
roth | -4.714 |
hap | -4.406 |
estate | -4.260 |
onyms | -4.144 |
Token | for |
Token ID | 329 |
Feature activation | -1.86e-01 |
Pos logit contributions | |
yles | +1.169 |
roth | +1.040 |
hap | +0.979 |
estate | +0.956 |
hood | +0.928 |
Neg logit contributions | |
Attention | -0.819 |
anticipation | -0.728 |
haste | -0.637 |
hurry | -0.612 |
Action | -0.604 |
Token | 80 |
Token ID | 4019 |
Feature activation | -3.03e+00 |
Pos logit contributions | |
Attention | +0.170 |
anticipation | +0.155 |
haste | +0.139 |
hurry | +0.135 |
Action | +0.134 |
Neg logit contributions | |
yles | -0.167 |
roth | -0.145 |
hap | -0.135 |
estate | -0.131 |
heid | -0.126 |
Token | years |
Token ID | 812 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
Attention | +3.211 |
anticipation | +2.976 |
haste | +2.711 |
hurry | +2.663 |
Action | +2.654 |
Neg logit contributions | |
yles | -2.237 |
roth | -1.912 |
hap | -1.746 |
estate | -1.668 |
onyms | -1.589 |
Token | reason |
Token ID | 1738 |
Feature activation | +2.80e+00 |
Pos logit contributions | |
Attention | +1.318 |
anticipation | +1.180 |
haste | +1.034 |
hurry | +0.997 |
Action | +0.991 |
Neg logit contributions | |
yles | -1.810 |
roth | -1.611 |
hap | -1.504 |
estate | -1.473 |
heid | -1.430 |
Token | Cal |
Token ID | 2199 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
yles | +2.907 |
roth | +2.583 |
hap | +2.443 |
estate | +2.379 |
hood | +2.321 |
Neg logit contributions | |
Attention | -2.126 |
anticipation | -1.892 |
haste | -1.657 |
hurry | -1.586 |
)", | -1.585 |
Token | Quant |
Token ID | 16972 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
yles | +3.084 |
roth | +2.690 |
hap | +2.486 |
estate | +2.421 |
heid | +2.324 |
Neg logit contributions | |
Attention | -3.038 |
anticipation | -2.766 |
haste | -2.498 |
hurry | -2.414 |
Action | -2.374 |
Token | rill |
Token ID | 20190 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
yles | +1.112 |
roth | +0.958 |
hap | +0.883 |
estate | +0.857 |
heid | +0.822 |
Neg logit contributions | |
Attention | -1.275 |
anticipation | -1.167 |
haste | -1.058 |
hurry | -1.028 |
Action | -1.018 |
Token | had |
Token ID | 550 |
Feature activation | -1.89e+01 |
Pos logit contributions | |
Attention | +0.944 |
anticipation | +0.856 |
haste | +0.760 |
hurry | +0.738 |
Action | +0.734 |
Neg logit contributions | |
yles | -1.092 |
roth | -0.955 |
hap | -0.896 |
estate | -0.872 |
heid | -0.846 |
Token | to |
Token ID | 284 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
Attention | +13.020 |
anticipation | +12.394 |
haste | +11.033 |
hurry | +10.936 |
directed | +10.802 |
Neg logit contributions | |
yles | -17.215 |
roth | -14.620 |
onyms | -13.565 |
hap | -13.539 |
heid | -13.307 |
Token | stress |
Token ID | 5503 |
Feature activation | -5.07e+00 |
Pos logit contributions | |
Attention | +1.202 |
anticipation | +1.094 |
haste | +0.983 |
hurry | +0.962 |
Action | +0.940 |
Neg logit contributions | |
yles | -1.309 |
roth | -1.140 |
hap | -1.066 |
estate | -1.039 |
heid | -1.007 |
Token | even |
Token ID | 772 |
Feature activation | +8.39e+00 |
Pos logit contributions | |
Attention | +3.885 |
anticipation | +3.515 |
haste | +3.095 |
hurry | +2.976 |
Action | +2.947 |
Neg logit contributions | |
yles | -5.229 |
roth | -4.615 |
hap | -4.372 |
estate | -4.261 |
heid | -4.159 |
Token | just |
Token ID | 655 |
Feature activation | +4.23e+00 |
Pos logit contributions | |
yles | +8.095 |
roth | +7.240 |
hap | +6.771 |
estate | +6.664 |
hood | +6.617 |
Neg logit contributions | |
Attention | -6.351 |
anticipation | -5.595 |
haste | -4.936 |
)", | -4.838 |
hurry | -4.743 |
Token | his |
Token ID | 465 |
Feature activation | -3.55e+00 |
Pos logit contributions | |
yles | +4.051 |
roth | +3.565 |
hap | +3.360 |
estate | +3.283 |
hood | +3.183 |
Neg logit contributions | |
Attention | -3.469 |
anticipation | -3.090 |
haste | -2.749 |
)", | -2.663 |
hurry | -2.656 |
Token | first |
Token ID | 717 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
Attention | +3.063 |
anticipation | +2.815 |
haste | +2.509 |
hurry | +2.426 |
Action | +2.390 |
Neg logit contributions | |
yles | -3.380 |
roth | -2.954 |
hap | -2.768 |
estate | -2.683 |
heid | -2.597 |
Token | books |
Token ID | 3835 |
Feature activation | -4.67e+00 |
Pos logit contributions | |
yles | +2.677 |
roth | +2.349 |
hap | +2.192 |
estate | +2.127 |
hood | +2.070 |
Neg logit contributions | |
Attention | -2.491 |
anticipation | -2.238 |
haste | -2.011 |
hurry | -1.953 |
)", | -1.932 |
Token | take |
Token ID | 1011 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
Attention | +3.858 |
anticipation | +3.496 |
haste | +3.065 |
hurry | +2.981 |
Action | +2.974 |
Neg logit contributions | |
yles | -4.554 |
roth | -3.979 |
hap | -3.725 |
estate | -3.617 |
heid | -3.551 |
Token | the |
Token ID | 262 |
Feature activation | -6.36e+00 |
Pos logit contributions | |
Attention | +13.184 |
anticipation | +12.458 |
action | +10.840 |
haste | +10.720 |
Action | +10.526 |
Neg logit contributions | |
yles | -14.243 |
roth | -12.887 |
heid | -11.966 |
estate | -11.916 |
hap | -11.828 |
Token | reader |
Token ID | 9173 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
Attention | +5.724 |
anticipation | +5.337 |
haste | +4.674 |
hurry | +4.597 |
Action | +4.553 |
Neg logit contributions | |
yles | -5.634 |
roth | -4.942 |
hap | -4.655 |
estate | -4.496 |
heid | -4.371 |
Token | beyond |
Token ID | 3675 |
Feature activation | +8.87e+00 |
Pos logit contributions | |
Attention | +7.764 |
anticipation | +7.193 |
hurry | +6.123 |
Action | +6.093 |
haste | +6.059 |
Neg logit contributions | |
yles | -10.912 |
roth | -9.447 |
hap | -9.044 |
estate | -8.899 |
heid | -8.622 |
Token | falling |
Token ID | 7463 |
Feature activation | -3.78e+00 |
Pos logit contributions | |
yles | +8.322 |
roth | +7.366 |
hap | +6.921 |
hood | +6.652 |
estate | +6.612 |
Neg logit contributions | |
Attention | -6.958 |
anticipation | -6.026 |
haste | -5.531 |
)", | -5.350 |
hurry | -5.291 |
Token | in |
Token ID | 287 |
Feature activation | -4.65e+00 |
Pos logit contributions | |
Attention | +2.845 |
anticipation | +2.591 |
haste | +2.231 |
hurry | +2.179 |
Action | +2.155 |
Neg logit contributions | |
yles | -3.953 |
roth | -3.509 |
hap | -3.289 |
estate | -3.256 |
heid | -3.173 |
Token | love |
Token ID | 1842 |
Feature activation | +4.02e+00 |
Pos logit contributions | |
Attention | +2.762 |
anticipation | +2.463 |
haste | +2.050 |
hurry | +1.958 |
Action | +1.880 |
Neg logit contributions | |
yles | -5.616 |
roth | -5.047 |
hap | -4.768 |
estate | -4.722 |
heid | -4.639 |
Token | and |
Token ID | 290 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
yles | +3.601 |
roth | +3.156 |
hap | +2.900 |
estate | +2.793 |
hood | +2.761 |
Neg logit contributions | |
Attention | -3.634 |
anticipation | -3.256 |
haste | -2.961 |
hurry | -2.859 |
)", | -2.836 |
Token | into |
Token ID | 656 |
Feature activation | +2.71e+00 |
Pos logit contributions | |
yles | +1.557 |
roth | +1.369 |
hap | +1.280 |
estate | +1.242 |
hood | +1.204 |
Neg logit contributions | |
Attention | -1.381 |
anticipation | -1.242 |
haste | -1.110 |
hurry | -1.073 |
Action | -1.066 |
Token | the |
Token ID | 262 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
yles | +2.617 |
roth | +2.320 |
hap | +2.168 |
estate | +2.086 |
hood | +2.046 |
Neg logit contributions | |
Attention | -2.265 |
anticipation | -2.010 |
haste | -1.806 |
hurry | -1.737 |
Action | -1.726 |
Token | booth |
Token ID | 18600 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
yles | +7.107 |
roth | +6.149 |
hap | +5.697 |
estate | +5.677 |
hood | +5.520 |
Neg logit contributions | |
Attention | -8.268 |
anticipation | -7.146 |
haste | -6.639 |
)", | -6.476 |
hurry | -6.449 |
Token | or |
Token ID | 393 |
Feature activation | +3.03e+00 |
Pos logit contributions | |
Attention | +0.163 |
anticipation | +0.148 |
haste | +0.132 |
hurry | +0.128 |
Action | +0.127 |
Neg logit contributions | |
yles | -0.172 |
roth | -0.151 |
hap | -0.140 |
estate | -0.136 |
heid | -0.132 |
Token | queue |
Token ID | 16834 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
yles | +2.865 |
roth | +2.526 |
hap | +2.361 |
estate | +2.302 |
hood | +2.238 |
Neg logit contributions | |
Attention | -2.559 |
anticipation | -2.291 |
haste | -2.047 |
hurry | -1.966 |
Action | -1.962 |
Token | line |
Token ID | 1627 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
Attention | +1.382 |
anticipation | +1.259 |
haste | +1.105 |
hurry | +1.070 |
Action | +1.054 |
Neg logit contributions | |
yles | -1.748 |
roth | -1.553 |
hap | -1.449 |
estate | -1.416 |
heid | -1.375 |
Token | , |
Token ID | 11 |
Feature activation | -4.25e+00 |
Pos logit contributions | |
yles | +1.074 |
roth | +0.938 |
hap | +0.875 |
estate | +0.850 |
heid | +0.821 |
Neg logit contributions | |
Attention | -1.031 |
anticipation | -0.932 |
haste | -0.835 |
hurry | -0.810 |
Action | -0.803 |
Token | but |
Token ID | 475 |
Feature activation | -6.44e-01 |
Pos logit contributions | |
Attention | +3.102 |
anticipation | +2.816 |
haste | +2.437 |
hurry | +2.363 |
Action | +2.311 |
Neg logit contributions | |
yles | -4.572 |
roth | -4.081 |
hap | -3.827 |
estate | -3.734 |
heid | -3.658 |
Token | in |
Token ID | 287 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
Attention | +0.501 |
anticipation | +0.450 |
haste | +0.395 |
hurry | +0.382 |
Action | +0.378 |
Neg logit contributions | |
yles | -0.667 |
roth | -0.591 |
hap | -0.555 |
estate | -0.542 |
heid | -0.526 |
Token | the |
Token ID | 262 |
Feature activation | -8.92e-01 |
Pos logit contributions | |
Attention | +9.880 |
anticipation | +9.479 |
haste | +8.092 |
Action | +7.974 |
hurry | +7.686 |
Neg logit contributions | |
yles | -13.143 |
roth | -11.385 |
hap | -10.555 |
estate | -10.525 |
onyms | -10.465 |
Token | 21 |
Token ID | 2310 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
Attention | +0.770 |
anticipation | +0.700 |
haste | +0.624 |
hurry | +0.605 |
Action | +0.599 |
Neg logit contributions | |
yles | -0.851 |
roth | -0.743 |
hap | -0.696 |
estate | -0.677 |
heid | -0.654 |
Token | st |
Token ID | 301 |
Feature activation | +6.52e+00 |
Pos logit contributions | |
Attention | +2.887 |
anticipation | +2.671 |
haste | +2.456 |
hurry | +2.398 |
Action | +2.384 |
Neg logit contributions | |
yles | -1.895 |
roth | -1.590 |
hap | -1.441 |
estate | -1.376 |
heid | -1.313 |
Token | century |
Token ID | 4289 |
Feature activation | +2.67e+00 |
Pos logit contributions | |
yles | +4.105 |
roth | +3.210 |
hap | +2.865 |
estate | +2.814 |
hood | +2.738 |
Neg logit contributions | |
Attention | -7.488 |
anticipation | -6.914 |
haste | -6.366 |
)", | -6.244 |
hurry | -6.194 |
Token | F |
Token ID | 376 |
Feature activation | -4.65e+00 |
Pos logit contributions | |
Attention | +3.522 |
anticipation | +3.102 |
Action | +2.684 |
haste | +2.682 |
hurry | +2.638 |
Neg logit contributions | |
yles | -4.548 |
roth | -4.031 |
hap | -3.862 |
estate | -3.713 |
onyms | -3.604 |
Token | inc |
Token ID | 1939 |
Feature activation | -2.26e+00 |
Pos logit contributions | |
Attention | +3.963 |
anticipation | +3.614 |
haste | +3.183 |
Action | +3.104 |
hurry | +3.071 |
Neg logit contributions | |
yles | -4.205 |
roth | -3.744 |
hap | -3.517 |
heid | -3.422 |
estate | -3.373 |
Token | her |
Token ID | 372 |
Feature activation | -2.04e+01 |
Pos logit contributions | |
Attention | +1.955 |
anticipation | +1.771 |
haste | +1.567 |
Action | +1.534 |
hurry | +1.526 |
Neg logit contributions | |
yles | -2.125 |
roth | -1.851 |
hap | -1.741 |
estate | -1.699 |
onyms | -1.637 |
Token | � |
Token ID | 447 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
Attention | +12.570 |
anticipation | +11.496 |
Action | +10.581 |
directed | +10.355 |
action | +9.993 |
Neg logit contributions | |
yles | -18.659 |
roth | -16.100 |
hap | -15.931 |
estate | -15.279 |
heid | -14.951 |
Token | � |
Token ID | 247 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
Attention | +0.966 |
anticipation | +0.874 |
haste | +0.778 |
hurry | +0.752 |
Action | +0.747 |
Neg logit contributions | |
yles | -1.092 |
roth | -0.957 |
hap | -0.896 |
estate | -0.871 |
heid | -0.845 |
Token | s |
Token ID | 82 |
Feature activation | -1.88e+01 |
Pos logit contributions | |
Attention | +16.011 |
anticipation | +14.924 |
directed | +13.732 |
Action | +13.316 |
action | +13.089 |
Neg logit contributions | |
yles | -17.110 |
roth | -14.430 |
hap | -13.962 |
onyms | -13.748 |
estate | -13.322 |
Token | forthcoming |
Token ID | 21220 |
Feature activation | -2.09e+01 |
Pos logit contributions | |
Attention | +14.434 |
anticipation | +13.494 |
Action | +12.267 |
action | +12.012 |
directed | +11.691 |
Neg logit contributions | |
yles | -15.258 |
roth | -12.919 |
estate | -12.186 |
hap | -12.030 |
onyms | -11.887 |
Token | Netflix |
Token ID | 12074 |
Feature activation | -1.70e+01 |
Pos logit contributions | |
Attention | +15.340 |
anticipation | +14.537 |
Action | +13.256 |
action | +13.201 |
directed | +12.827 |
Neg logit contributions | |
yles | -16.487 |
roth | -14.124 |
estate | -13.623 |
hap | -13.409 |
onyms | -12.733 |
Token | series |
Token ID | 2168 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
Attention | +11.370 |
anticipation | +10.269 |
action | +9.449 |
Action | +9.441 |
directed | +9.009 |
Neg logit contributions | |
yles | -15.987 |
roth | -14.529 |
hap | -13.664 |
estate | -13.551 |
onyms | -12.956 |
Token | , |
Token ID | 11 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
Attention | +9.665 |
anticipation | +8.495 |
Action | +7.539 |
directed | +7.241 |
haste | +7.095 |
Neg logit contributions | |
yles | -11.629 |
roth | -10.169 |
hap | -9.591 |
estate | -9.499 |
onyms | -9.094 |
Token | Mind |
Token ID | 10175 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
Attention | +11.754 |
anticipation | +10.398 |
Action | +9.410 |
directed | +9.174 |
haste | +8.721 |
Neg logit contributions | |
yles | -13.308 |
roth | -11.621 |
hap | -10.889 |
estate | -10.735 |
heid | -10.198 |
Token | arms |
Token ID | 5101 |
Feature activation | -6.94e-01 |
Pos logit contributions | |
Attention | +9.476 |
anticipation | +8.823 |
haste | +7.969 |
hurry | +7.757 |
Action | +7.582 |
Neg logit contributions | |
yles | -11.840 |
roth | -10.292 |
estate | -9.838 |
hap | -9.697 |
onyms | -9.237 |
Token | above |
Token ID | 2029 |
Feature activation | -6.28e+00 |
Pos logit contributions | |
Attention | +0.604 |
anticipation | +0.550 |
haste | +0.491 |
hurry | +0.477 |
Action | +0.472 |
Neg logit contributions | |
yles | -0.653 |
roth | -0.571 |
hap | -0.532 |
estate | -0.518 |
heid | -0.501 |
Token | his |
Token ID | 465 |
Feature activation | -7.56e+00 |
Pos logit contributions | |
Attention | +3.121 |
anticipation | +2.737 |
haste | +2.163 |
hurry | +2.020 |
Action | +1.980 |
Neg logit contributions | |
yles | -8.106 |
roth | -7.331 |
estate | -6.963 |
hap | -6.962 |
heid | -6.715 |
Token | head |
Token ID | 1182 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
Attention | +4.957 |
anticipation | +4.497 |
haste | +3.928 |
hurry | +3.745 |
Action | +3.660 |
Neg logit contributions | |
yles | -8.481 |
roth | -7.481 |
estate | -7.211 |
hap | -7.194 |
onyms | -6.846 |
Token | in |
Token ID | 287 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
yles | +1.347 |
roth | +1.174 |
hap | +1.091 |
estate | +1.057 |
heid | +1.024 |
Neg logit contributions | |
Attention | -1.359 |
anticipation | -1.230 |
haste | -1.106 |
hurry | -1.071 |
Action | -1.064 |
Token | disgusted |
Token ID | 36943 |
Feature activation | -2.30e+01 |
Pos logit contributions | |
anticipation | +17.278 |
Attention | +15.836 |
haste | +14.851 |
response | +14.088 |
hurry | +13.843 |
Neg logit contributions | |
yles | -18.720 |
roth | -16.231 |
estate | -15.384 |
hap | -15.146 |
heid | -14.457 |
Token | frustration |
Token ID | 14285 |
Feature activation | -7.30e+00 |
Pos logit contributions | |
anticipation | +16.960 |
Attention | +16.112 |
haste | +15.064 |
hurry | +13.759 |
response | +13.698 |
Neg logit contributions | |
yles | -18.739 |
roth | -16.237 |
estate | -15.644 |
hap | -15.412 |
onyms | -14.348 |
Token | . |
Token ID | 13 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
Attention | +5.781 |
anticipation | +5.409 |
haste | +4.738 |
hurry | +4.637 |
Action | +4.516 |
Neg logit contributions | |
yles | -7.183 |
roth | -6.268 |
hap | -5.844 |
estate | -5.796 |
heid | -5.539 |
Token |
|
Token ID | 198 |
Feature activation | -2.83e+00 |
Pos logit contributions | |
Attention | +9.317 |
anticipation | +7.975 |
Action | +7.284 |
haste | +6.862 |
Intent | +6.752 |
Neg logit contributions | |
yles | -10.580 |
roth | -9.156 |
hap | -8.730 |
estate | -8.675 |
onyms | -8.289 |
Token |
|
Token ID | 198 |
Feature activation | -7.53e+00 |
Pos logit contributions | |
Attention | +2.760 |
anticipation | +2.521 |
haste | +2.283 |
Action | +2.237 |
hurry | +2.204 |
Neg logit contributions | |
yles | -2.383 |
roth | -2.024 |
hap | -1.878 |
estate | -1.813 |
onyms | -1.745 |
Token | A |
Token ID | 32 |
Feature activation | -6.74e+00 |
Pos logit contributions | |
Attention | +6.027 |
anticipation | +5.406 |
haste | +4.759 |
Begin | +4.691 |
Action | +4.687 |
Neg logit contributions | |
yles | -7.276 |
roth | -6.234 |
hap | -5.817 |
estate | -5.674 |
onyms | -5.628 |
Token | launched |
Token ID | 5611 |
Feature activation | +3.10e+00 |
Pos logit contributions | |
Attention | +5.644 |
anticipation | +5.094 |
Action | +4.410 |
haste | +4.330 |
directed | +4.220 |
Neg logit contributions | |
yles | -8.075 |
roth | -7.159 |
hap | -6.736 |
estate | -6.597 |
onyms | -6.379 |
Token | by |
Token ID | 416 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
yles | +2.983 |
roth | +2.613 |
hap | +2.442 |
estate | +2.374 |
hood | +2.312 |
Neg logit contributions | |
Attention | -2.608 |
anticipation | -2.342 |
haste | -2.096 |
hurry | -2.037 |
)", | -1.987 |
Token | Chancellor |
Token ID | 19477 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
Attention | +1.299 |
anticipation | +1.168 |
haste | +1.023 |
hurry | +0.991 |
Action | +0.990 |
Neg logit contributions | |
yles | -1.691 |
roth | -1.494 |
hap | -1.403 |
estate | -1.370 |
heid | -1.327 |
Token | Angela |
Token ID | 17799 |
Feature activation | +8.87e-01 |
Pos logit contributions | |
Attention | +1.347 |
anticipation | +1.177 |
haste | +0.979 |
Action | +0.943 |
hurry | +0.942 |
Neg logit contributions | |
yles | -2.543 |
roth | -2.289 |
hap | -2.179 |
estate | -2.140 |
heid | -2.081 |
Token | Merkel |
Token ID | 18263 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
yles | +0.706 |
roth | +0.605 |
hap | +0.553 |
estate | +0.534 |
heid | +0.514 |
Neg logit contributions | |
Attention | -0.897 |
anticipation | -0.826 |
haste | -0.752 |
hurry | -0.732 |
Action | -0.723 |
Token | in |
Token ID | 287 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
yles | +0.433 |
roth | +0.382 |
hap | +0.357 |
estate | +0.347 |
heid | +0.336 |
Neg logit contributions | |
Attention | -0.373 |
anticipation | -0.337 |
haste | -0.299 |
hurry | -0.289 |
Action | -0.286 |
Token | 2010 |
Token ID | 3050 |
Feature activation | +7.25e+00 |
Pos logit contributions | |
anticipation | +14.387 |
Attention | +13.900 |
haste | +12.257 |
response | +11.903 |
earnest | +11.524 |
Neg logit contributions | |
yles | -23.068 |
roth | -20.237 |
estate | -19.995 |
hap | -19.296 |
onyms | -18.674 |
Token | , |
Token ID | 11 |
Feature activation | -2.38e+00 |
Pos logit contributions | |
yles | +6.097 |
roth | +5.338 |
hap | +4.896 |
estate | +4.740 |
hood | +4.690 |
Neg logit contributions | |
Attention | -6.638 |
anticipation | -5.962 |
haste | -5.429 |
hurry | -5.306 |
)", | -5.259 |
Token | to |
Token ID | 284 |
Feature activation | -5.36e+00 |
Pos logit contributions | |
Attention | +1.838 |
anticipation | +1.654 |
haste | +1.442 |
Action | +1.400 |
hurry | +1.387 |
Neg logit contributions | |
yles | -2.480 |
roth | -2.195 |
hap | -2.067 |
estate | -2.012 |
heid | -1.953 |
Token | prepare |
Token ID | 8335 |
Feature activation | -8.09e+00 |
Pos logit contributions | |
Attention | +4.493 |
anticipation | +4.181 |
haste | +3.688 |
hurry | +3.664 |
Action | +3.592 |
Neg logit contributions | |
yles | -5.077 |
roth | -4.433 |
hap | -4.183 |
estate | -4.090 |
heid | -3.951 |
Token | for |
Token ID | 329 |
Feature activation | +8.10e+00 |
Pos logit contributions | |
Attention | +5.737 |
anticipation | +5.321 |
haste | +4.578 |
Action | +4.396 |
hurry | +4.390 |
Neg logit contributions | |
yles | -8.536 |
roth | -7.569 |
hap | -7.109 |
estate | -6.986 |
onyms | -6.756 |
Token | load |
Token ID | 3440 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
Attention | +9.772 |
anticipation | +9.336 |
haste | +8.278 |
hurry | +7.911 |
Action | +7.719 |
Neg logit contributions | |
yles | -11.836 |
roth | -10.330 |
onyms | -9.508 |
estate | -9.436 |
hap | -9.394 |
Token | < |
Token ID | 1279 |
Feature activation | -1.62e+01 |
Pos logit contributions | |
Attention | +9.084 |
anticipation | +7.768 |
haste | +6.773 |
Action | +6.629 |
Begin | +6.577 |
Neg logit contributions | |
yles | -13.789 |
roth | -12.278 |
hap | -11.268 |
onyms | -11.196 |
estate | -10.982 |
Token | ' |
Token ID | 705 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
Attention | +10.853 |
anticipation | +9.411 |
Action | +8.902 |
action | +8.037 |
haste | +7.897 |
Neg logit contributions | |
yles | -16.494 |
roth | -14.101 |
onyms | -13.166 |
hap | -13.145 |
heid | -13.013 |
Token | a |
Token ID | 64 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
Attention | +8.485 |
anticipation | +7.547 |
Action | +6.932 |
haste | +6.880 |
action | +6.606 |
Neg logit contributions | |
yles | -9.801 |
roth | -8.386 |
hap | -7.562 |
heid | -7.391 |
estate | -7.373 |
Token | > |
Token ID | 1875 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
Attention | +8.459 |
anticipation | +7.239 |
Action | +6.496 |
haste | +6.305 |
action | +5.904 |
Neg logit contributions | |
yles | -15.229 |
roth | -13.624 |
hap | -12.433 |
onyms | -12.380 |
heid | -12.014 |
Token | ( |
Token ID | 357 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
Attention | +9.274 |
anticipation | +8.110 |
haste | +6.937 |
Action | +6.928 |
hurry | +6.727 |
Neg logit contributions | |
yles | -14.843 |
roth | -13.105 |
estate | -12.156 |
onyms | -12.041 |
hap | -11.780 |
Token | & |
Token ID | 1222 |
Feature activation | -1.77e+01 |
Pos logit contributions | |
Attention | +16.064 |
anticipation | +15.187 |
action | +13.562 |
Action | +13.506 |
haste | +13.224 |
Neg logit contributions | |
yles | -18.228 |
roth | -15.343 |
onyms | -13.804 |
heid | -13.480 |
hap | -13.261 |
Token | self |
Token ID | 2116 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
Attention | +10.584 |
anticipation | +9.482 |
Action | +8.296 |
action | +8.008 |
haste | +7.561 |
Neg logit contributions | |
yles | -18.744 |
roth | -16.464 |
hap | -15.020 |
estate | -15.015 |
onyms | -15.010 |
Token | , |
Token ID | 837 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
Attention | +7.234 |
anticipation | +5.809 |
haste | +4.871 |
Action | +4.536 |
action | +4.194 |
Neg logit contributions | |
yles | -20.357 |
roth | -18.149 |
hap | -17.178 |
estate | -16.691 |
onyms | -16.497 |
Token | ord |
Token ID | 2760 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
Attention | +15.316 |
anticipation | +14.578 |
action | +12.985 |
Action | +12.931 |
haste | +12.816 |
Neg logit contributions | |
yles | -17.280 |
roth | -14.517 |
onyms | -13.163 |
hap | -12.769 |
heid | -12.577 |
Token | : |
Token ID | 1058 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
Attention | +9.523 |
anticipation | +8.319 |
haste | +7.281 |
Action | +7.218 |
hurry | +6.809 |
Neg logit contributions | |
yles | -12.768 |
roth | -10.941 |
hap | -10.430 |
onyms | -9.998 |
estate | -9.818 |
Token | her |
Token ID | 607 |
Feature activation | -3.67e+00 |
Pos logit contributions | |
Attention | +15.170 |
anticipation | +14.546 |
action | +13.221 |
Action | +12.760 |
haste | +11.920 |
Neg logit contributions | |
yles | -20.489 |
roth | -18.407 |
hap | -18.224 |
estate | -17.797 |
onyms | -17.739 |
Token | from |
Token ID | 422 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
Attention | +2.981 |
anticipation | +2.726 |
haste | +2.402 |
Action | +2.332 |
hurry | +2.325 |
Neg logit contributions | |
yles | -3.633 |
roth | -3.169 |
hap | -3.005 |
estate | -2.924 |
onyms | -2.819 |
Token | the |
Token ID | 262 |
Feature activation | -8.83e-01 |
Pos logit contributions | |
Attention | +10.995 |
anticipation | +10.447 |
haste | +9.263 |
Action | +8.968 |
hurry | +8.951 |
Neg logit contributions | |
yles | -11.779 |
roth | -10.214 |
hap | -9.556 |
estate | -9.310 |
onyms | -9.240 |
Token | crowded |
Token ID | 18012 |
Feature activation | +8.80e-01 |
Pos logit contributions | |
Attention | +0.774 |
anticipation | +0.704 |
haste | +0.629 |
hurry | +0.610 |
Action | +0.605 |
Neg logit contributions | |
yles | -0.827 |
roth | -0.722 |
hap | -0.675 |
estate | -0.657 |
heid | -0.634 |
Token | streets |
Token ID | 6483 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
yles | +0.845 |
roth | +0.743 |
hap | +0.693 |
estate | +0.675 |
heid | +0.654 |
Neg logit contributions | |
Attention | -0.747 |
anticipation | -0.675 |
haste | -0.601 |
hurry | -0.582 |
Action | -0.576 |
Token | of |
Token ID | 286 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
Attention | +1.033 |
anticipation | +0.932 |
haste | +0.823 |
hurry | +0.796 |
Action | +0.790 |
Neg logit contributions | |
yles | -1.293 |
roth | -1.141 |
hap | -1.074 |
estate | -1.046 |
heid | -1.009 |
Token | New |
Token ID | 968 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
Attention | +13.334 |
anticipation | +12.508 |
haste | +10.642 |
Action | +10.595 |
action | +10.411 |
Neg logit contributions | |
yles | -17.104 |
roth | -14.864 |
hap | -14.431 |
onyms | -13.963 |
estate | -13.873 |
Token | Orleans |
Token ID | 12255 |
Feature activation | -3.65e+00 |
Pos logit contributions | |
Attention | +6.257 |
anticipation | +4.677 |
Action | +3.770 |
Focus | +3.193 |
hurry | +3.041 |
Neg logit contributions | |
yles | -20.498 |
roth | -18.262 |
hap | -18.069 |
estate | -17.894 |
onyms | -17.800 |
Token | to |
Token ID | 284 |
Feature activation | +6.91e-01 |
Pos logit contributions | |
Attention | +3.073 |
anticipation | +2.804 |
haste | +2.480 |
Action | +2.422 |
hurry | +2.406 |
Neg logit contributions | |
yles | -3.483 |
roth | -3.042 |
hap | -2.857 |
estate | -2.771 |
onyms | -2.658 |
Token | v |
Token ID | 410 |
Feature activation | -3.42e-01 |
Pos logit contributions | |
yles | +0.692 |
roth | +0.611 |
hap | +0.572 |
estate | +0.557 |
heid | +0.541 |
Neg logit contributions | |
Attention | -0.559 |
anticipation | -0.501 |
haste | -0.443 |
hurry | -0.428 |
Action | -0.424 |
Token | oodoo |
Token ID | 36038 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
Attention | +0.340 |
anticipation | +0.313 |
haste | +0.284 |
hurry | +0.276 |
Action | +0.275 |
Neg logit contributions | |
yles | -0.279 |
roth | -0.238 |
hap | -0.220 |
estate | -0.213 |
heid | -0.203 |