Token | Th |
Token ID | 817 |
Feature activation | -2.48e+00 |
Pos logit contributions | |
hua | +2.242 |
uces | +2.165 |
rito | +2.075 |
itous | +2.067 |
hi | +1.968 |
Neg logit contributions | |
oyal | -2.769 |
stown | -2.583 |
charging | -2.528 |
atically | -2.516 |
agy | -2.463 |
Token | ING |
Token ID | 2751 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
oyal | +1.356 |
stown | +1.215 |
charging | +1.177 |
atically | +1.170 |
Wolfe | +1.141 |
Neg logit contributions | |
hua | -2.187 |
uces | -2.136 |
rito | -2.077 |
itous | -2.072 |
048 | -1.998 |
Token | Premiere |
Token ID | 44151 |
Feature activation | -6.45e-01 |
Pos logit contributions | |
hua | +0.771 |
uces | +0.748 |
rito | +0.718 |
itous | +0.716 |
048 | +0.683 |
Neg logit contributions | |
oyal | -0.857 |
stown | -0.790 |
charging | -0.774 |
atically | -0.770 |
agy | -0.755 |
Token |
|
Token ID | 198 |
Feature activation | +3.64e+00 |
Pos logit contributions | |
oyal | +0.452 |
stown | +0.416 |
charging | +0.406 |
atically | +0.404 |
Wolfe | +0.396 |
Neg logit contributions | |
hua | -0.468 |
uces | -0.455 |
rito | -0.439 |
itous | -0.438 |
048 | -0.419 |
Token |
|
Token ID | 198 |
Feature activation | +8.62e+00 |
Pos logit contributions | |
hua | +2.338 |
uces | +2.171 |
itous | +2.124 |
rito | +2.121 |
048 | +2.113 |
Neg logit contributions | |
oyal | -2.870 |
atically | -2.582 |
stown | -2.576 |
charging | -2.553 |
Gleaming | -2.550 |
Token | D |
Token ID | 35 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
hua | +4.077 |
uces | +3.944 |
rito | +3.730 |
itous | +3.675 |
048 | +3.655 |
Neg logit contributions | |
oyal | -7.906 |
stown | -7.366 |
atically | -7.284 |
Wolfe | -7.238 |
Gleaming | -7.128 |
Token | iameter |
Token ID | 13173 |
Feature activation | +3.55e+00 |
Pos logit contributions | |
hua | +2.618 |
uces | +2.117 |
iameter | +1.995 |
itous | +1.530 |
048 | +1.520 |
Neg logit contributions | |
oyal | -20.375 |
Wolfe | -19.712 |
Gleaming | -19.576 |
atically | -19.532 |
stown | -19.521 |
Token | : |
Token ID | 25 |
Feature activation | -2.52e+00 |
Pos logit contributions | |
hua | +1.820 |
uces | +1.715 |
itous | +1.626 |
rito | +1.623 |
048 | +1.593 |
Neg logit contributions | |
oyal | -3.259 |
stown | -2.970 |
charging | -2.941 |
atically | -2.936 |
Gleaming | -2.891 |
Token | 57 |
Token ID | 7632 |
Feature activation | -8.50e-01 |
Pos logit contributions | |
oyal | +1.827 |
stown | +1.694 |
charging | +1.653 |
atically | +1.645 |
Wolfe | +1.624 |
Neg logit contributions | |
hua | -1.757 |
uces | -1.708 |
rito | -1.651 |
itous | -1.648 |
048 | -1.560 |
Token | . |
Token ID | 13 |
Feature activation | -3.08e-01 |
Pos logit contributions | |
oyal | +0.665 |
stown | +0.618 |
charging | +0.605 |
atically | +0.599 |
Wolfe | +0.594 |
Neg logit contributions | |
hua | -0.547 |
uces | -0.528 |
rito | -0.509 |
itous | -0.508 |
048 | -0.480 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
oyal | +0.246 |
stown | +0.229 |
charging | +0.224 |
atically | +0.223 |
Wolfe | +0.220 |
Neg logit contributions | |
hua | -0.193 |
uces | -0.187 |
rito | -0.179 |
itous | -0.179 |
048 | -0.170 |
Token | 4 |
Token ID | 604 |
Feature activation | +5.94e+00 |
Pos logit contributions | |
hua | +1.846 |
uces | +1.795 |
rito | +1.735 |
itous | +1.731 |
048 | +1.666 |
Neg logit contributions | |
oyal | -1.743 |
stown | -1.605 |
charging | -1.565 |
atically | -1.561 |
Wolfe | -1.529 |
Token | 64 |
Token ID | 2414 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
hua | +3.266 |
uces | +3.167 |
rito | +3.036 |
itous | +3.020 |
048 | +2.893 |
Neg logit contributions | |
oyal | -5.030 |
stown | -4.758 |
charging | -4.640 |
atically | -4.604 |
Wolfe | -4.599 |
Token | 406 |
Token ID | 29703 |
Feature activation | +6.35e+00 |
Pos logit contributions | |
hua | +1.596 |
uces | +1.546 |
rito | +1.486 |
itous | +1.479 |
048 | +1.420 |
Neg logit contributions | |
oyal | -1.945 |
stown | -1.807 |
charging | -1.764 |
atically | -1.759 |
Wolfe | -1.736 |
Token | Mem |
Token ID | 4942 |
Feature activation | -4.95e+00 |
Pos logit contributions | |
hua | +4.248 |
uces | +4.143 |
rito | +3.984 |
itous | +3.961 |
048 | +3.826 |
Neg logit contributions | |
oyal | -4.591 |
stown | -4.302 |
charging | -4.154 |
atically | -4.146 |
agy | -4.100 |
Token | c |
Token ID | 66 |
Feature activation | -4.21e+00 |
Pos logit contributions | |
oyal | +3.136 |
stown | +2.877 |
charging | +2.823 |
atically | +2.801 |
agy | +2.698 |
Neg logit contributions | |
hua | -3.809 |
uces | -3.772 |
rito | -3.647 |
itous | -3.631 |
inguishable | -3.497 |
Token | py |
Token ID | 9078 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
oyal | +2.758 |
stown | +2.517 |
atically | +2.471 |
charging | +2.462 |
agy | +2.383 |
Neg logit contributions | |
hua | -3.202 |
uces | -3.168 |
itous | -3.037 |
rito | -3.017 |
inguishable | -2.905 |
Token | Reading |
Token ID | 36120 |
Feature activation | +9.57e-01 |
Pos logit contributions | |
hua | +6.978 |
048 | +6.642 |
>>>>>>>> | +6.640 |
rito | +6.422 |
uces | +6.397 |
Neg logit contributions | |
oyal | -13.818 |
stown | -13.173 |
Armstrong | -13.149 |
Gleaming | -13.111 |
Wolfe | -12.858 |
Token | 55 |
Token ID | 5996 |
Feature activation | +2.44e+00 |
Pos logit contributions | |
hua | +0.698 |
uces | +0.679 |
rito | +0.656 |
itous | +0.654 |
048 | +0.627 |
Neg logit contributions | |
oyal | -0.667 |
stown | -0.613 |
charging | -0.598 |
atically | -0.595 |
Wolfe | -0.585 |
Token | 80 |
Token ID | 1795 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
hua | +1.073 |
uces | +0.989 |
itous | +0.919 |
rito | +0.916 |
048 | +0.913 |
Neg logit contributions | |
oyal | -2.402 |
stown | -2.251 |
atically | -2.235 |
charging | -2.224 |
agy | -2.216 |
Token | 953 |
Token ID | 49649 |
Feature activation | +3.54e-01 |
Pos logit contributions | |
hua | +0.674 |
uces | +0.646 |
rito | +0.632 |
itous | +0.625 |
048 | +0.611 |
Neg logit contributions | |
oyal | -1.000 |
stown | -0.930 |
charging | -0.916 |
atically | -0.910 |
Gleaming | -0.902 |
Token | 16 |
Token ID | 1467 |
Feature activation | +3.17e+00 |
Pos logit contributions | |
hua | +0.242 |
uces | +0.234 |
rito | +0.225 |
itous | +0.225 |
048 | +0.214 |
Neg logit contributions | |
oyal | -0.265 |
stown | -0.245 |
charging | -0.239 |
atically | -0.238 |
Wolfe | -0.234 |
Token | � |
Token ID | 564 |
Feature activation | -9.82e-01 |
Pos logit contributions | |
hua | +3.045 |
uces | +2.883 |
rito | +2.798 |
itous | +2.738 |
hi | +2.713 |
Neg logit contributions | |
oyal | -3.265 |
stown | -2.951 |
charging | -2.900 |
atically | -2.896 |
agy | -2.807 |
Token | � |
Token ID | 250 |
Feature activation | +4.34e+00 |
Pos logit contributions | |
oyal | +0.760 |
stown | +0.694 |
charging | +0.684 |
atically | +0.684 |
Wolfe | +0.668 |
Neg logit contributions | |
hua | -0.644 |
uces | -0.620 |
itous | -0.604 |
rito | -0.595 |
liest | -0.567 |
Token | [ |
Token ID | 58 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
hua | +2.946 |
uces | +2.811 |
rito | +2.721 |
itous | +2.656 |
hi | +2.643 |
Neg logit contributions | |
oyal | -3.243 |
stown | -2.978 |
atically | -2.917 |
charging | -2.898 |
Gleaming | -2.861 |
Token | � |
Token ID | 447 |
Feature activation | +6.83e-01 |
Pos logit contributions | |
hua | +2.175 |
uces | +2.074 |
rito | +2.009 |
itous | +1.985 |
hi | +1.929 |
Neg logit contributions | |
oyal | -2.322 |
stown | -2.129 |
atically | -2.072 |
charging | -2.063 |
Wolfe | -2.056 |
Token | � |
Token ID | 250 |
Feature activation | +4.18e+00 |
Pos logit contributions | |
hua | +0.482 |
uces | +0.468 |
rito | +0.452 |
itous | +0.450 |
048 | +0.431 |
Neg logit contributions | |
oyal | -0.493 |
stown | -0.454 |
charging | -0.444 |
atically | -0.442 |
Wolfe | -0.433 |
Token | G |
Token ID | 38 |
Feature activation | +1.59e+01 |
Pos logit contributions | |
hua | +2.911 |
uces | +2.781 |
rito | +2.691 |
itous | +2.646 |
hi | +2.609 |
Neg logit contributions | |
oyal | -3.038 |
stown | -2.803 |
atically | -2.727 |
charging | -2.716 |
Wolfe | -2.697 |
Token | on |
Token ID | 261 |
Feature activation | +4.28e+00 |
Pos logit contributions | |
uces | +8.134 |
rito | +8.061 |
hua | +7.963 |
atos | +7.736 |
hi | +7.640 |
Neg logit contributions | |
Gleaming | -11.950 |
Wolfe | -11.702 |
oyal | -11.644 |
stown | -11.176 |
charging | -11.123 |
Token | � |
Token ID | 447 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
hua | +2.925 |
uces | +2.815 |
rito | +2.695 |
itous | +2.687 |
hi | +2.587 |
Neg logit contributions | |
oyal | -3.160 |
stown | -2.894 |
charging | -2.850 |
atically | -2.816 |
Gleaming | -2.803 |
Token | � |
Token ID | 251 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
hua | +1.129 |
uces | +1.096 |
rito | +1.057 |
itous | +1.052 |
048 | +1.006 |
Neg logit contributions | |
oyal | -1.184 |
stown | -1.093 |
charging | -1.068 |
atically | -1.063 |
Wolfe | -1.044 |
Token | ] |
Token ID | 60 |
Feature activation | +5.05e+00 |
Pos logit contributions | |
hua | +2.090 |
uces | +2.013 |
rito | +1.937 |
itous | +1.915 |
048 | +1.857 |
Neg logit contributions | |
oyal | -2.133 |
stown | -1.961 |
charging | -1.933 |
atically | -1.908 |
Gleaming | -1.880 |
Token | contains |
Token ID | 4909 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
hua | +3.660 |
uces | +3.502 |
rito | +3.386 |
itous | +3.330 |
hi | +3.251 |
Neg logit contributions | |
oyal | -3.541 |
stown | -3.248 |
charging | -3.154 |
atically | -3.132 |
Gleaming | -3.083 |
Token | Daytona |
Token ID | 47299 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
hua | +1.231 |
uces | +1.177 |
rito | +1.133 |
itous | +1.132 |
048 | +1.066 |
Neg logit contributions | |
oyal | -1.999 |
stown | -1.828 |
charging | -1.810 |
atically | -1.806 |
agy | -1.791 |
Token | Beach |
Token ID | 8511 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
oyal | +1.567 |
stown | +1.446 |
charging | +1.412 |
atically | +1.397 |
Wolfe | +1.379 |
Neg logit contributions | |
hua | -1.661 |
uces | -1.619 |
rito | -1.565 |
itous | -1.559 |
048 | -1.490 |
Token | where |
Token ID | 810 |
Feature activation | -8.71e-01 |
Pos logit contributions | |
hua | +0.730 |
uces | +0.701 |
rito | +0.676 |
itous | +0.675 |
048 | +0.644 |
Neg logit contributions | |
oyal | -0.881 |
stown | -0.808 |
charging | -0.793 |
atically | -0.792 |
agy | -0.779 |
Token | Whites |
Token ID | 29290 |
Feature activation | +5.36e+00 |
Pos logit contributions | |
oyal | +0.604 |
stown | +0.553 |
charging | +0.540 |
atically | +0.538 |
agy | +0.526 |
Neg logit contributions | |
hua | -0.640 |
uces | -0.621 |
rito | -0.601 |
itous | -0.599 |
048 | -0.573 |
Token | and |
Token ID | 290 |
Feature activation | +2.81e+00 |
Pos logit contributions | |
hua | +3.355 |
rito | +3.081 |
uces | +3.037 |
itous | +2.976 |
hi | +2.907 |
Neg logit contributions | |
oyal | -4.224 |
stown | -3.830 |
charging | -3.807 |
atically | -3.795 |
Gleaming | -3.782 |
Token | Blacks |
Token ID | 27875 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
hua | +2.304 |
uces | +2.248 |
rito | +2.177 |
itous | +2.168 |
048 | +2.102 |
Neg logit contributions | |
oyal | -1.661 |
stown | -1.500 |
charging | -1.474 |
atically | -1.466 |
agy | -1.446 |
Token | could |
Token ID | 714 |
Feature activation | +6.06e+00 |
Pos logit contributions | |
hua | +8.324 |
rito | +7.699 |
itous | +7.406 |
hi | +7.185 |
uces | +7.136 |
Neg logit contributions | |
oyal | -11.870 |
charging | -10.759 |
覚醒 | -10.648 |
agy | -10.590 |
Gleaming | -10.411 |
Token | sit |
Token ID | 1650 |
Feature activation | +7.80e+00 |
Pos logit contributions | |
hua | +4.105 |
rito | +3.900 |
uces | +3.889 |
itous | +3.883 |
048 | +3.638 |
Neg logit contributions | |
oyal | -4.378 |
charging | -3.987 |
stown | -3.911 |
agy | -3.846 |
Gleaming | -3.800 |
Token | in |
Token ID | 287 |
Feature activation | +5.45e+00 |
Pos logit contributions | |
hua | +4.724 |
uces | +4.514 |
itous | +4.427 |
rito | +4.269 |
liest | +4.208 |
Neg logit contributions | |
oyal | -6.170 |
charging | -5.581 |
stown | -5.509 |
Gleaming | -5.443 |
agy | -5.439 |
Token | the |
Token ID | 262 |
Feature activation | +5.93e+00 |
Pos logit contributions | |
hua | +3.563 |
uces | +3.406 |
itous | +3.345 |
rito | +3.293 |
048 | +3.181 |
Neg logit contributions | |
oyal | -4.087 |
stown | -3.760 |
charging | -3.707 |
agy | -3.662 |
atically | -3.645 |
Token | same |
Token ID | 976 |
Feature activation | +5.66e+00 |
Pos logit contributions | |
hua | +3.263 |
uces | +3.055 |
itous | +3.012 |
rito | +3.002 |
048 | +2.874 |
Neg logit contributions | |
oyal | -4.962 |
stown | -4.670 |
charging | -4.628 |
agy | -4.539 |
atically | -4.523 |
Token | . |
Token ID | 13 |
Feature activation | +2.87e+00 |
Pos logit contributions | |
hua | +1.508 |
uces | +1.448 |
rito | +1.395 |
itous | +1.390 |
048 | +1.313 |
Neg logit contributions | |
oyal | -2.076 |
stown | -1.942 |
charging | -1.903 |
atically | -1.890 |
Wolfe | -1.867 |
Token | � |
Token ID | 447 |
Feature activation | +2.15e+00 |
Pos logit contributions | |
hua | +2.173 |
uces | +2.096 |
rito | +2.028 |
itous | +2.007 |
048 | +1.976 |
Neg logit contributions | |
oyal | -1.897 |
stown | -1.734 |
charging | -1.706 |
atically | -1.703 |
agy | -1.661 |
Token | � |
Token ID | 251 |
Feature activation | +9.31e-01 |
Pos logit contributions | |
hua | +1.533 |
uces | +1.489 |
rito | +1.438 |
itous | +1.427 |
048 | +1.375 |
Neg logit contributions | |
oyal | -1.526 |
stown | -1.412 |
charging | -1.377 |
atically | -1.370 |
Wolfe | -1.346 |
Token |
|
Token ID | 198 |
Feature activation | +7.38e-01 |
Pos logit contributions | |
hua | +0.687 |
uces | +0.665 |
rito | +0.642 |
itous | +0.640 |
048 | +0.618 |
Neg logit contributions | |
oyal | -0.641 |
stown | -0.588 |
charging | -0.578 |
atically | -0.574 |
agy | -0.562 |
Token |
|
Token ID | 198 |
Feature activation | +5.32e-01 |
Pos logit contributions | |
hua | +0.515 |
uces | +0.490 |
itous | +0.476 |
rito | +0.475 |
048 | +0.465 |
Neg logit contributions | |
oyal | -0.544 |
stown | -0.494 |
atically | -0.487 |
charging | -0.486 |
Gleaming | -0.477 |
Token | D |
Token ID | 35 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
hua | +0.358 |
uces | +0.345 |
rito | +0.333 |
itous | +0.331 |
048 | +0.318 |
Neg logit contributions | |
oyal | -0.401 |
stown | -0.371 |
charging | -0.363 |
atically | -0.362 |
Wolfe | -0.356 |
Token | arth |
Token ID | 11999 |
Feature activation | +2.52e+00 |
Pos logit contributions | |
hua | +8.279 |
uces | +7.998 |
rito | +7.891 |
itous | +7.846 |
hi | +7.590 |
Neg logit contributions | |
Gleaming | -11.123 |
Wolfe | -11.034 |
charging | -10.994 |
stown | -10.958 |
oyal | -10.780 |
Token | Camel |
Token ID | 43281 |
Feature activation | -3.74e+00 |
Pos logit contributions | |
hua | +1.769 |
uces | +1.715 |
rito | +1.658 |
itous | +1.654 |
048 | +1.571 |
Neg logit contributions | |
oyal | -1.822 |
stown | -1.674 |
charging | -1.650 |
atically | -1.632 |
agy | -1.604 |
Token | though |
Token ID | 996 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
oyal | +2.660 |
stown | +2.466 |
charging | +2.392 |
atically | +2.392 |
Wolfe | +2.358 |
Neg logit contributions | |
hua | -2.657 |
uces | -2.582 |
rito | -2.490 |
itous | -2.474 |
048 | -2.367 |
Token | didn |
Token ID | 1422 |
Feature activation | -4.18e+00 |
Pos logit contributions | |
oyal | +0.849 |
stown | +0.785 |
charging | +0.768 |
atically | +0.764 |
Wolfe | +0.750 |
Neg logit contributions | |
hua | -0.774 |
uces | -0.751 |
rito | -0.724 |
itous | -0.721 |
048 | -0.688 |
Token | � |
Token ID | 447 |
Feature activation | -2.14e+00 |
Pos logit contributions | |
oyal | +2.986 |
stown | +2.770 |
charging | +2.683 |
atically | +2.680 |
agy | +2.623 |
Neg logit contributions | |
hua | -2.927 |
uces | -2.885 |
itous | -2.772 |
rito | -2.764 |
inguishable | -2.658 |
Token | . |
Token ID | 13 |
Feature activation | +4.11e+00 |
Pos logit contributions | |
oyal | +1.351 |
stown | +1.259 |
charging | +1.228 |
atically | +1.217 |
Wolfe | +1.202 |
Neg logit contributions | |
hua | -1.297 |
uces | -1.258 |
rito | -1.220 |
itous | -1.204 |
048 | -1.162 |
Token | ( |
Token ID | 357 |
Feature activation | +3.93e+00 |
Pos logit contributions | |
hua | +2.879 |
uces | +2.754 |
rito | +2.689 |
itous | +2.675 |
048 | +2.576 |
Neg logit contributions | |
oyal | -2.973 |
stown | -2.663 |
charging | -2.649 |
atically | -2.644 |
agy | -2.604 |
Token | Wa |
Token ID | 33484 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
hua | +2.579 |
uces | +2.460 |
rito | +2.388 |
itous | +2.354 |
hi | +2.288 |
Neg logit contributions | |
oyal | -3.002 |
stown | -2.776 |
atically | -2.722 |
charging | -2.717 |
Gleaming | -2.716 |
Token | ub |
Token ID | 549 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
hua | +0.954 |
uces | +0.909 |
rito | +0.871 |
itous | +0.862 |
hi | +0.803 |
Neg logit contributions | |
oyal | -1.700 |
stown | -1.615 |
charging | -1.596 |
atically | -1.591 |
Gleaming | -1.586 |
Token | ges |
Token ID | 3212 |
Feature activation | +4.29e+00 |
Pos logit contributions | |
hua | +1.826 |
uces | +1.756 |
rito | +1.654 |
itous | +1.647 |
048 | +1.580 |
Neg logit contributions | |
oyal | -2.738 |
stown | -2.545 |
charging | -2.516 |
Wolfe | -2.500 |
atically | -2.493 |
Token | hig |
Token ID | 25196 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
hua | +2.227 |
uces | +2.076 |
hi | +1.997 |
rito | +1.985 |
itous | +1.927 |
Neg logit contributions | |
oyal | -3.866 |
stown | -3.670 |
Gleaming | -3.578 |
charging | -3.577 |
Wolfe | -3.573 |
Token | Rice |
Token ID | 13823 |
Feature activation | +8.18e+00 |
Pos logit contributions | |
hua | +3.690 |
rito | +3.056 |
hi | +2.750 |
uces | +2.688 |
048 | +2.586 |
Neg logit contributions | |
oyal | -16.323 |
覚醒 | -15.457 |
charging | -15.425 |
atically | -15.342 |
oun | -15.170 |
Token | / |
Token ID | 14 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
hua | +3.509 |
048 | +3.028 |
uces | +2.970 |
hi | +2.926 |
rito | +2.847 |
Neg logit contributions | |
oyal | -7.935 |
atically | -7.379 |
Gleaming | -7.319 |
stown | -7.315 |
charging | -7.276 |
Token | CBC |
Token ID | 29208 |
Feature activation | +3.86e+00 |
Pos logit contributions | |
hua | +1.525 |
uces | +1.416 |
rito | +1.395 |
itous | +1.383 |
048 | +1.360 |
Neg logit contributions | |
oyal | -1.923 |
stown | -1.767 |
atically | -1.728 |
charging | -1.727 |
Gleaming | -1.725 |
Token | ) |
Token ID | 8 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
hua | +2.532 |
uces | +2.448 |
rito | +2.364 |
itous | +2.345 |
048 | +2.235 |
Neg logit contributions | |
oyal | -2.960 |
stown | -2.736 |
charging | -2.688 |
atically | -2.685 |
Gleaming | -2.637 |
Token |
|
Token ID | 198 |
Feature activation | -8.85e-01 |
Pos logit contributions | |
oyal | +0.991 |
stown | +0.912 |
charging | +0.889 |
atically | +0.884 |
Wolfe | +0.869 |
Neg logit contributions | |
hua | -1.056 |
uces | -1.027 |
rito | -0.992 |
itous | -0.989 |
048 | -0.947 |
Token | not |
Token ID | 407 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
hua | +1.220 |
uces | +1.164 |
rito | +1.134 |
itous | +1.118 |
048 | +1.082 |
Neg logit contributions | |
oyal | -1.872 |
stown | -1.745 |
charging | -1.723 |
atically | -1.708 |
Gleaming | -1.690 |
Token | deep |
Token ID | 2769 |
Feature activation | +6.88e-01 |
Pos logit contributions | |
hua | +0.633 |
uces | +0.605 |
rito | +0.577 |
itous | +0.574 |
hi | +0.541 |
Neg logit contributions | |
oyal | -1.178 |
stown | -1.101 |
charging | -1.085 |
atically | -1.076 |
Wolfe | -1.064 |
Token | fried |
Token ID | 23018 |
Feature activation | +3.57e+00 |
Pos logit contributions | |
hua | +0.467 |
uces | +0.453 |
rito | +0.439 |
itous | +0.436 |
048 | +0.419 |
Neg logit contributions | |
oyal | -0.518 |
stown | -0.473 |
charging | -0.465 |
atically | -0.461 |
Wolfe | -0.456 |
Token | . |
Token ID | 13 |
Feature activation | +4.53e+00 |
Pos logit contributions | |
hua | +1.972 |
uces | +1.839 |
rito | +1.806 |
itous | +1.782 |
hi | +1.742 |
Neg logit contributions | |
oyal | -3.107 |
stown | -2.862 |
charging | -2.848 |
atically | -2.828 |
Gleaming | -2.807 |
Token | 6 |
Token ID | 718 |
Feature activation | +6.20e+00 |
Pos logit contributions | |
hua | +2.955 |
uces | +2.848 |
rito | +2.752 |
itous | +2.730 |
048 | +2.596 |
Neg logit contributions | |
oyal | -3.511 |
stown | -3.246 |
atically | -3.182 |
charging | -3.178 |
Wolfe | -3.119 |
Token | . |
Token ID | 13 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
hua | +3.151 |
uces | +2.809 |
hi | +2.799 |
048 | +2.796 |
rito | +2.771 |
Neg logit contributions | |
oyal | -5.594 |
Gleaming | -5.146 |
charging | -5.128 |
atically | -5.118 |
stown | -5.063 |
Token | Drain |
Token ID | 36024 |
Feature activation | +6.67e+00 |
Pos logit contributions | |
uces | +4.188 |
hua | +4.173 |
rito | +3.901 |
hi | +3.834 |
048 | +3.805 |
Neg logit contributions | |
oyal | -15.105 |
charging | -14.239 |
opers | -14.176 |
atically | -14.128 |
iking | -14.095 |
Token | on |
Token ID | 319 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
hua | +3.453 |
uces | +3.267 |
itous | +3.165 |
rito | +3.111 |
hi | +3.101 |
Neg logit contributions | |
oyal | -5.829 |
atically | -5.374 |
Gleaming | -5.365 |
stown | -5.348 |
agy | -5.295 |
Token | a |
Token ID | 257 |
Feature activation | +6.11e+00 |
Pos logit contributions | |
hua | +1.800 |
uces | +1.721 |
rito | +1.660 |
itous | +1.653 |
048 | +1.599 |
Neg logit contributions | |
oyal | -2.161 |
stown | -1.986 |
atically | -1.958 |
charging | -1.952 |
agy | -1.933 |
Token | paper |
Token ID | 3348 |
Feature activation | +4.33e+00 |
Pos logit contributions | |
hua | +2.041 |
uces | +1.728 |
itous | +1.680 |
rito | +1.668 |
hi | +1.605 |
Neg logit contributions | |
oyal | -6.559 |
agy | -6.256 |
atically | -6.214 |
stown | -6.207 |
charging | -6.172 |
Token | towel |
Token ID | 24808 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
hua | +2.071 |
uces | +1.929 |
rito | +1.887 |
itous | +1.825 |
048 | +1.794 |
Neg logit contributions | |
oyal | -4.033 |
stown | -3.779 |
charging | -3.756 |
Gleaming | -3.748 |
agy | -3.714 |
Token | of |
Token ID | 286 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
hua | +0.394 |
uces | +0.378 |
rito | +0.367 |
itous | +0.364 |
048 | +0.349 |
Neg logit contributions | |
oyal | -0.480 |
stown | -0.442 |
charging | -0.437 |
atically | -0.434 |
Gleaming | -0.425 |
Token | Zo |
Token ID | 31645 |
Feature activation | -5.64e+00 |
Pos logit contributions | |
oyal | +0.536 |
stown | +0.475 |
charging | +0.461 |
atically | +0.457 |
agy | +0.443 |
Neg logit contributions | |
hua | -0.966 |
uces | -0.944 |
rito | -0.919 |
itous | -0.916 |
048 | -0.887 |
Token | ology |
Token ID | 1435 |
Feature activation | +8.41e-01 |
Pos logit contributions | |
oyal | +2.789 |
stown | +2.454 |
atically | +2.356 |
charging | +2.352 |
agy | +2.296 |
Neg logit contributions | |
hua | -5.237 |
uces | -5.129 |
rito | -4.990 |
itous | -4.955 |
inguishable | -4.808 |
Token | 62 |
Token ID | 8190 |
Feature activation | +8.43e+00 |
Pos logit contributions | |
hua | +0.543 |
uces | +0.522 |
rito | +0.506 |
itous | +0.498 |
048 | +0.482 |
Neg logit contributions | |
oyal | -0.658 |
stown | -0.610 |
charging | -0.599 |
atically | -0.596 |
Wolfe | -0.584 |
Token | ( |
Token ID | 357 |
Feature activation | +7.21e+00 |
Pos logit contributions | |
hua | +4.084 |
uces | +3.866 |
rito | +3.726 |
itous | +3.602 |
048 | +3.534 |
Neg logit contributions | |
oyal | -7.564 |
atically | -7.023 |
stown | -7.018 |
charging | -6.931 |
Wolfe | -6.898 |
Token | 5 |
Token ID | 20 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
hua | +4.005 |
uces | +3.784 |
rito | +3.705 |
048 | +3.628 |
itous | +3.600 |
Neg logit contributions | |
oyal | -5.999 |
stown | -5.660 |
atically | -5.542 |
Wolfe | -5.464 |
Gleaming | -5.450 |
Token | ) |
Token ID | 8 |
Feature activation | +3.90e+00 |
Pos logit contributions | |
hua | +7.159 |
uces | +6.703 |
048 | +6.696 |
itous | +6.632 |
hi | +6.445 |
Neg logit contributions | |
oyal | -12.013 |
stown | -11.596 |
atically | -11.555 |
charging | -10.977 |
Gleaming | -10.880 |
Token | 401 |
Token ID | 22219 |
Feature activation | +6.27e+00 |
Pos logit contributions | |
hua | +2.542 |
uces | +2.422 |
itous | +2.350 |
rito | +2.335 |
048 | +2.330 |
Neg logit contributions | |
oyal | -2.974 |
stown | -2.790 |
atically | -2.730 |
charging | -2.690 |
agy | -2.614 |
Token | - |
Token ID | 12 |
Feature activation | -3.05e+00 |
Pos logit contributions | |
hua | +3.826 |
uces | +3.568 |
048 | +3.509 |
rito | +3.487 |
itous | +3.464 |
Neg logit contributions | |
oyal | -5.004 |
stown | -4.705 |
atically | -4.570 |
charging | -4.534 |
Gleaming | -4.487 |
Token | 414 |
Token ID | 37309 |
Feature activation | +3.29e+00 |
Pos logit contributions | |
oyal | +2.269 |
stown | +2.125 |
charging | +2.067 |
atically | +2.037 |
agy | +2.028 |
Neg logit contributions | |
hua | -2.048 |
uces | -2.011 |
rito | -1.938 |
itous | -1.931 |
inguishable | -1.830 |
Token | ; |
Token ID | 26 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
hua | +2.041 |
uces | +1.919 |
rito | +1.880 |
itous | +1.865 |
048 | +1.794 |
Neg logit contributions | |
oyal | -2.646 |
stown | -2.468 |
atically | -2.416 |
charging | -2.415 |
Gleaming | -2.358 |
Token | inch |
Token ID | 11111 |
Feature activation | -2.84e+00 |
Pos logit contributions | |
oyal | +4.524 |
stown | +4.305 |
charging | +4.179 |
Wolfe | +4.126 |
Armstrong | +4.078 |
Neg logit contributions | |
hua | -4.237 |
uces | -4.174 |
itous | -3.973 |
rito | -3.955 |
liest | -3.856 |
Token | in |
Token ID | 287 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
oyal | +2.211 |
stown | +2.085 |
charging | +2.034 |
atically | +2.028 |
Wolfe | +2.003 |
Neg logit contributions | |
hua | -1.798 |
uces | -1.741 |
rito | -1.681 |
itous | -1.640 |
048 | -1.559 |
Token | diameter |
Token ID | 14753 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
hua | +0.955 |
uces | +0.913 |
rito | +0.860 |
itous | +0.856 |
048 | +0.802 |
Neg logit contributions | |
oyal | -2.044 |
stown | -1.926 |
charging | -1.891 |
atically | -1.885 |
Wolfe | -1.859 |
Token | average |
Token ID | 2811 |
Feature activation | +1.72e+00 |
Pos logit contributions | |
oyal | +1.716 |
stown | +1.597 |
atically | +1.558 |
charging | +1.557 |
Wolfe | +1.533 |
Neg logit contributions | |
hua | -1.617 |
uces | -1.561 |
rito | -1.519 |
itous | -1.509 |
048 | -1.435 |
Token | . |
Token ID | 13 |
Feature activation | +2.76e-01 |
Pos logit contributions | |
hua | +1.121 |
uces | +1.092 |
rito | +1.043 |
itous | +1.038 |
048 | +0.995 |
Neg logit contributions | |
oyal | -1.335 |
stown | -1.222 |
charging | -1.200 |
atically | -1.192 |
Gleaming | -1.166 |
Token | D |
Token ID | 35 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
hua | +0.205 |
uces | +0.199 |
rito | +0.191 |
itous | +0.190 |
048 | +0.185 |
Neg logit contributions | |
oyal | -0.190 |
stown | -0.173 |
charging | -0.170 |
atically | -0.170 |
agy | -0.165 |
Token | rying |
Token ID | 14992 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
hua | +9.556 |
uces | +9.411 |
rito | +9.116 |
atos | +8.953 |
itous | +8.935 |
Neg logit contributions | |
oyal | -9.384 |
Gleaming | -8.994 |
charging | -8.789 |
Wolfe | -8.725 |
stown | -8.719 |
Token | the |
Token ID | 262 |
Feature activation | -2.19e+00 |
Pos logit contributions | |
oyal | +0.893 |
stown | +0.825 |
charging | +0.806 |
atically | +0.803 |
Wolfe | +0.788 |
Neg logit contributions | |
hua | -0.849 |
uces | -0.824 |
rito | -0.796 |
itous | -0.793 |
048 | -0.757 |
Token | mushrooms |
Token ID | 23452 |
Feature activation | +8.02e-01 |
Pos logit contributions | |
oyal | +1.509 |
stown | +1.393 |
charging | +1.357 |
atically | +1.349 |
Wolfe | +1.334 |
Neg logit contributions | |
hua | -1.604 |
uces | -1.559 |
itous | -1.511 |
rito | -1.510 |
048 | -1.440 |
Token | as |
Token ID | 355 |
Feature activation | -3.05e-01 |
Pos logit contributions | |
hua | +0.544 |
uces | +0.533 |
rito | +0.508 |
itous | +0.506 |
048 | +0.485 |
Neg logit contributions | |
oyal | -0.604 |
stown | -0.554 |
charging | -0.542 |
atically | -0.534 |
agy | -0.528 |
Token | described |
Token ID | 3417 |
Feature activation | -6.80e-01 |
Pos logit contributions | |
oyal | +0.223 |
stown | +0.205 |
charging | +0.200 |
atically | +0.199 |
Wolfe | +0.196 |
Neg logit contributions | |
hua | -0.214 |
uces | -0.207 |
rito | -0.200 |
itous | -0.199 |
048 | -0.191 |
Token | were |
Token ID | 547 |
Feature activation | -1.10e-01 |
Pos logit contributions | |
hua | +0.663 |
uces | +0.634 |
rito | +0.621 |
itous | +0.616 |
048 | +0.588 |
Neg logit contributions | |
oyal | -0.689 |
stown | -0.631 |
charging | -0.620 |
atically | -0.610 |
Gleaming | -0.604 |
Token | men |
Token ID | 1450 |
Feature activation | +4.43e+00 |
Pos logit contributions | |
oyal | +0.079 |
stown | +0.073 |
charging | +0.071 |
atically | +0.070 |
agy | +0.069 |
Neg logit contributions | |
hua | -0.078 |
uces | -0.075 |
rito | -0.073 |
itous | -0.072 |
048 | -0.069 |
Token | and |
Token ID | 290 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
hua | +2.766 |
uces | +2.601 |
rito | +2.535 |
itous | +2.504 |
hi | +2.409 |
Neg logit contributions | |
oyal | -3.511 |
stown | -3.259 |
Gleaming | -3.205 |
charging | -3.177 |
agy | -3.141 |
Token | women |
Token ID | 1466 |
Feature activation | +3.48e+00 |
Pos logit contributions | |
hua | +1.669 |
uces | +1.608 |
rito | +1.564 |
itous | +1.542 |
048 | +1.474 |
Neg logit contributions | |
oyal | -1.915 |
stown | -1.756 |
charging | -1.719 |
atically | -1.711 |
agy | -1.689 |
Token | of |
Token ID | 286 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
hua | +2.181 |
uces | +2.061 |
rito | +2.010 |
itous | +1.984 |
hi | +1.905 |
Neg logit contributions | |
oyal | -2.780 |
stown | -2.572 |
charging | -2.514 |
Gleaming | -2.507 |
agy | -2.470 |
Token | all |
Token ID | 477 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
hua | +5.006 |
uces | +4.859 |
rito | +4.742 |
itous | +4.660 |
hi | +4.448 |
Neg logit contributions | |
oyal | -9.652 |
stown | -9.103 |
charging | -9.077 |
agy | -9.067 |
Gleaming | -8.908 |
Token | ethnic |
Token ID | 9450 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
uces | +6.327 |
hua | +6.278 |
rito | +6.002 |
itous | +5.955 |
hi | +5.769 |
Neg logit contributions | |
oyal | -12.110 |
Gleaming | -11.399 |
charging | -11.299 |
stown | -11.261 |
atically | -11.236 |
Token | ities |
Token ID | 871 |
Feature activation | +6.24e+00 |
Pos logit contributions | |
hua | +5.113 |
uces | +5.084 |
rito | +5.058 |
itous | +4.921 |
liest | +4.513 |
Neg logit contributions | |
oyal | -12.736 |
stown | -12.191 |
charging | -12.090 |
atically | -11.898 |
agy | -11.873 |
Token | . |
Token ID | 13 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
hua | +3.699 |
uces | +3.475 |
rito | +3.435 |
itous | +3.373 |
hi | +3.269 |
Neg logit contributions | |
oyal | -5.062 |
stown | -4.746 |
Gleaming | -4.624 |
charging | -4.575 |
agy | -4.538 |
Token | This |
Token ID | 770 |
Feature activation | +2.56e+00 |
Pos logit contributions | |
hua | +1.472 |
uces | +1.401 |
rito | +1.368 |
itous | +1.354 |
048 | +1.322 |
Neg logit contributions | |
oyal | -1.383 |
stown | -1.246 |
charging | -1.238 |
atically | -1.234 |
agy | -1.209 |
Token | seems |
Token ID | 2331 |
Feature activation | +3.67e+00 |
Pos logit contributions | |
hua | +1.715 |
uces | +1.641 |
rito | +1.591 |
itous | +1.590 |
hi | +1.511 |
Neg logit contributions | |
oyal | -1.941 |
stown | -1.776 |
charging | -1.756 |
atically | -1.726 |
agy | -1.722 |
Token | affect |
Token ID | 2689 |
Feature activation | -8.72e-01 |
Pos logit contributions | |
oyal | +1.136 |
stown | +1.046 |
charging | +1.020 |
atically | +1.019 |
Wolfe | +0.997 |
Neg logit contributions | |
hua | -1.173 |
uces | -1.140 |
rito | -1.099 |
itous | -1.095 |
048 | -1.048 |
Token | many |
Token ID | 867 |
Feature activation | -8.16e-01 |
Pos logit contributions | |
oyal | +0.627 |
stown | +0.577 |
charging | +0.564 |
atically | +0.561 |
Wolfe | +0.550 |
Neg logit contributions | |
hua | -0.618 |
uces | -0.600 |
rito | -0.579 |
itous | -0.578 |
048 | -0.552 |
Token | — |
Token ID | 851 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
oyal | +0.577 |
stown | +0.530 |
charging | +0.518 |
atically | +0.514 |
Wolfe | +0.505 |
Neg logit contributions | |
hua | -0.589 |
uces | -0.572 |
itous | -0.552 |
rito | -0.551 |
048 | -0.526 |
Token | for |
Token ID | 329 |
Feature activation | +7.79e-01 |
Pos logit contributions | |
oyal | +0.079 |
stown | +0.073 |
charging | +0.072 |
atically | +0.071 |
Wolfe | +0.070 |
Neg logit contributions | |
hua | -0.070 |
uces | -0.068 |
rito | -0.065 |
itous | -0.065 |
048 | -0.062 |
Token | good |
Token ID | 922 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
hua | +0.530 |
uces | +0.511 |
itous | +0.494 |
rito | +0.492 |
048 | +0.469 |
Neg logit contributions | |
oyal | -0.584 |
stown | -0.537 |
charging | -0.524 |
atically | -0.523 |
Gleaming | -0.513 |
Token | or |
Token ID | 393 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
hua | +2.210 |
uces | +2.111 |
rito | +2.053 |
itous | +2.051 |
048 | +1.946 |
Neg logit contributions | |
oyal | -2.552 |
stown | -2.358 |
charging | -2.306 |
Gleaming | -2.287 |
atically | -2.279 |
Token | evil |
Token ID | 6181 |
Feature activation | +6.75e+00 |
Pos logit contributions | |
hua | +6.376 |
itous | +5.779 |
uces | +5.587 |
hi | +5.409 |
rito | +5.291 |
Neg logit contributions | |
oyal | -12.738 |
stown | -12.457 |
agy | -11.676 |
Gleaming | -11.663 |
charging | -11.633 |
Token | — |
Token ID | 851 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
hua | +4.379 |
uces | +4.201 |
itous | +4.106 |
rito | +4.075 |
048 | +3.836 |
Neg logit contributions | |
oyal | -5.068 |
stown | -4.703 |
charging | -4.614 |
Gleaming | -4.584 |
atically | -4.488 |
Token | is |
Token ID | 318 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
oyal | +0.748 |
stown | +0.689 |
charging | +0.674 |
atically | +0.670 |
Wolfe | +0.657 |
Neg logit contributions | |
hua | -0.738 |
uces | -0.717 |
rito | -0.692 |
itous | -0.690 |
048 | -0.659 |
Token | now |
Token ID | 783 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
hua | +1.469 |
uces | +1.425 |
rito | +1.379 |
itous | +1.376 |
liest | +1.311 |
Neg logit contributions | |
oyal | -1.564 |
stown | -1.443 |
charging | -1.409 |
atically | -1.400 |
Gleaming | -1.378 |
Token | scaling |
Token ID | 20796 |
Feature activation | -4.80e+00 |
Pos logit contributions | |
oyal | +1.408 |
stown | +1.297 |
charging | +1.268 |
atically | +1.263 |
Wolfe | +1.240 |
Neg logit contributions | |
hua | -1.396 |
uces | -1.357 |
rito | -1.309 |
itous | -1.304 |
048 | -1.248 |
Token | venture |
Token ID | 13189 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
oyal | +3.206 |
stown | +2.946 |
charging | +2.862 |
atically | +2.792 |
Wolfe | +2.776 |
Neg logit contributions | |
hua | -3.298 |
uces | -3.236 |
itous | -3.121 |
rito | -3.117 |
048 | -2.975 |
Token | , |
Token ID | 11 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
oyal | +0.917 |
stown | +0.848 |
charging | +0.830 |
atically | +0.826 |
Wolfe | +0.811 |
Neg logit contributions | |
hua | -0.832 |
uces | -0.807 |
rito | -0.778 |
itous | -0.775 |
048 | -0.739 |
Token | S |
Token ID | 311 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
oyal | +0.933 |
stown | +0.860 |
charging | +0.841 |
atically | +0.837 |
Wolfe | +0.821 |
Neg logit contributions | |
hua | -0.898 |
uces | -0.872 |
rito | -0.841 |
itous | -0.838 |
048 | -0.801 |
Token | BI |
Token ID | 3483 |
Feature activation | +6.47e+00 |
Pos logit contributions | |
oyal | +1.731 |
stown | +1.489 |
charging | +1.432 |
atically | +1.403 |
agy | +1.384 |
Neg logit contributions | |
hua | -3.236 |
uces | -3.151 |
itous | -3.062 |
rito | -3.051 |
048 | -2.958 |
Token | Wire |
Token ID | 14712 |
Feature activation | +2.63e+00 |
Pos logit contributions | |
hua | +4.480 |
uces | +4.302 |
rito | +4.092 |
itous | +4.070 |
hi | +3.977 |
Neg logit contributions | |
oyal | -4.585 |
atically | -4.190 |
stown | -4.187 |
charging | -4.134 |
agy | -4.043 |
Token | x |
Token ID | 87 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
hua | +1.670 |
uces | +1.577 |
rito | +1.506 |
itous | +1.472 |
hi | +1.454 |
Neg logit contributions | |
oyal | -2.101 |
stown | -1.922 |
atically | -1.910 |
charging | -1.903 |
Gleaming | -1.884 |
Token | Asia |
Token ID | 7229 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
hua | +7.219 |
uces | +6.677 |
rito | +6.155 |
itous | +6.140 |
hi | +6.050 |
Neg logit contributions | |
oyal | -11.388 |
atically | -10.977 |
stown | -10.634 |
charging | -10.556 |
CLOSE | -10.416 |
Token | . |
Token ID | 13 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
hua | +0.906 |
uces | +0.875 |
rito | +0.841 |
itous | +0.836 |
048 | +0.798 |
Neg logit contributions | |
oyal | -1.091 |
stown | -1.013 |
charging | -0.993 |
atically | -0.992 |
Wolfe | -0.971 |
Token | The |
Token ID | 383 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
hua | +1.688 |
uces | +1.618 |
rito | +1.572 |
itous | +1.551 |
048 | +1.508 |
Neg logit contributions | |
oyal | -1.693 |
stown | -1.552 |
atically | -1.529 |
charging | -1.525 |
agy | -1.491 |
Token | collaboration |
Token ID | 12438 |
Feature activation | +8.07e-01 |
Pos logit contributions | |
hua | +1.022 |
uces | +0.982 |
rito | +0.948 |
itous | +0.944 |
048 | +0.906 |
Neg logit contributions | |
oyal | -1.145 |
stown | -1.055 |
charging | -1.043 |
atically | -1.039 |
agy | -1.022 |
Token | means |
Token ID | 1724 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
hua | +0.562 |
uces | +0.547 |
rito | +0.523 |
itous | +0.521 |
048 | +0.501 |
Neg logit contributions | |
oyal | -0.590 |
stown | -0.541 |
charging | -0.531 |
atically | -0.527 |
agy | -0.515 |
Token | open |
Token ID | 1280 |
Feature activation | +6.29e+00 |
Pos logit contributions | |
hua | +1.644 |
uces | +1.609 |
rito | +1.552 |
itous | +1.547 |
048 | +1.469 |
Neg logit contributions | |
oyal | -2.289 |
stown | -2.117 |
atically | -2.084 |
charging | -2.065 |
agy | -2.055 |
Token | internet |
Token ID | 5230 |
Feature activation | +4.57e+00 |
Pos logit contributions | |
hua | +3.245 |
uces | +3.124 |
itous | +2.980 |
rito | +2.943 |
hi | +2.814 |
Neg logit contributions | |
oyal | -5.612 |
stown | -5.166 |
Gleaming | -5.165 |
atically | -5.060 |
charging | -5.028 |
Token | for |
Token ID | 329 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
hua | +2.675 |
uces | +2.562 |
rito | +2.508 |
itous | +2.502 |
048 | +2.343 |
Neg logit contributions | |
oyal | -3.781 |
stown | -3.497 |
Gleaming | -3.413 |
charging | -3.404 |
atically | -3.391 |
Token | Americans |
Token ID | 3399 |
Feature activation | +4.60e-01 |
Pos logit contributions | |
hua | +0.965 |
uces | +0.939 |
rito | +0.910 |
itous | +0.903 |
048 | +0.867 |
Neg logit contributions | |
oyal | -1.044 |
stown | -0.958 |
atically | -0.932 |
charging | -0.929 |
agy | -0.918 |
Token | of |
Token ID | 286 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
hua | +0.306 |
uces | +0.296 |
rito | +0.286 |
itous | +0.285 |
048 | +0.271 |
Neg logit contributions | |
oyal | -0.350 |
stown | -0.325 |
charging | -0.317 |
atically | -0.315 |
Wolfe | -0.310 |
Token | all |
Token ID | 477 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
hua | +5.608 |
rito | +5.520 |
uces | +5.381 |
itous | +5.340 |
hi | +5.085 |
Neg logit contributions | |
oyal | -7.867 |
stown | -7.526 |
agy | -7.384 |
Gleaming | -7.248 |
charging | -7.219 |
Token | income |
Token ID | 3739 |
Feature activation | +7.73e+00 |
Pos logit contributions | |
hua | +6.411 |
uces | +6.408 |
rito | +6.199 |
itous | +6.160 |
liest | +5.962 |
Neg logit contributions | |
oyal | -11.748 |
Gleaming | -11.162 |
stown | -11.066 |
agy | -10.947 |
charging | -10.808 |
Token | classes |
Token ID | 6097 |
Feature activation | +3.95e+00 |
Pos logit contributions | |
hua | +3.889 |
uces | +3.778 |
rito | +3.723 |
itous | +3.531 |
liest | +3.522 |
Neg logit contributions | |
oyal | -6.644 |
stown | -6.213 |
Gleaming | -6.101 |
charging | -6.081 |
Wolfe | -6.007 |
Token | — |
Token ID | 960 |
Feature activation | -2.71e+00 |
Pos logit contributions | |
hua | +2.489 |
uces | +2.400 |
rito | +2.325 |
itous | +2.305 |
048 | +2.202 |
Neg logit contributions | |
oyal | -3.099 |
stown | -2.894 |
charging | -2.800 |
atically | -2.793 |
Gleaming | -2.774 |
Token | Federal |
Token ID | 24099 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
oyal | +2.127 |
stown | +1.981 |
charging | +1.952 |
atically | +1.927 |
Wolfe | +1.891 |
Neg logit contributions | |
hua | -1.722 |
uces | -1.684 |
itous | -1.604 |
rito | -1.600 |
048 | -1.522 |
Token | Communications |
Token ID | 14620 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
hua | +2.067 |
uces | +2.021 |
rito | +1.960 |
itous | +1.948 |
048 | +1.856 |
Neg logit contributions | |
oyal | -2.284 |
stown | -2.083 |
charging | -2.050 |
atically | -2.043 |
Gleaming | -2.020 |
Token | uper |
Token ID | 48568 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
hua | +0.375 |
uces | +0.367 |
rito | +0.354 |
itous | +0.354 |
048 | +0.338 |
Neg logit contributions | |
oyal | -0.326 |
stown | -0.299 |
charging | -0.291 |
atically | -0.290 |
Wolfe | -0.284 |
Token | ation |
Token ID | 341 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
oyal | +3.222 |
stown | +3.015 |
charging | +2.989 |
atically | +2.988 |
agy | +2.924 |
Neg logit contributions | |
hua | -1.577 |
uces | -1.463 |
rito | -1.367 |
itous | -1.334 |
048 | -1.318 |
Token | . |
Token ID | 13 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
hua | +0.923 |
uces | +0.898 |
rito | +0.863 |
itous | +0.860 |
048 | +0.819 |
Neg logit contributions | |
oyal | -1.172 |
stown | -1.082 |
charging | -1.060 |
atically | -1.042 |
Gleaming | -1.038 |
Token |
|
Token ID | 198 |
Feature activation | -3.22e+00 |
Pos logit contributions | |
oyal | +1.296 |
stown | +1.188 |
charging | +1.159 |
atically | +1.154 |
Wolfe | +1.134 |
Neg logit contributions | |
hua | -1.463 |
uces | -1.425 |
rito | -1.377 |
itous | -1.374 |
048 | -1.315 |
Token |
|
Token ID | 198 |
Feature activation | -2.47e+00 |
Pos logit contributions | |
oyal | +2.103 |
stown | +1.941 |
charging | +1.885 |
atically | +1.870 |
Wolfe | +1.835 |
Neg logit contributions | |
hua | -2.463 |
uces | -2.421 |
rito | -2.336 |
itous | -2.323 |
inguishable | -2.227 |
Token | D |
Token ID | 35 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
oyal | +1.849 |
stown | +1.710 |
charging | +1.679 |
atically | +1.667 |
Wolfe | +1.629 |
Neg logit contributions | |
hua | -1.661 |
uces | -1.620 |
itous | -1.555 |
rito | -1.552 |
048 | -1.468 |
Token | ani |
Token ID | 3216 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
hua | +6.923 |
uces | +6.731 |
rito | +6.715 |
hi | +6.618 |
itous | +6.552 |
Neg logit contributions | |
oyal | -11.412 |
Gleaming | -11.368 |
stown | -11.212 |
charging | -11.085 |
Wolfe | -10.952 |
Token | highlights |
Token ID | 11330 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
hua | +0.117 |
uces | +0.114 |
rito | +0.109 |
itous | +0.109 |
048 | +0.104 |
Neg logit contributions | |
oyal | -0.121 |
stown | -0.111 |
charging | -0.109 |
atically | -0.108 |
agy | -0.106 |
Token | the |
Token ID | 262 |
Feature activation | -6.46e-01 |
Pos logit contributions | |
oyal | +1.472 |
stown | +1.354 |
charging | +1.324 |
atically | +1.321 |
Wolfe | +1.298 |
Neg logit contributions | |
hua | -1.534 |
uces | -1.488 |
rito | -1.439 |
itous | -1.434 |
048 | -1.370 |
Token | importance |
Token ID | 6817 |
Feature activation | +2.44e+00 |
Pos logit contributions | |
oyal | +0.425 |
stown | +0.389 |
charging | +0.380 |
atically | +0.377 |
Wolfe | +0.369 |
Neg logit contributions | |
hua | -0.496 |
uces | -0.484 |
rito | -0.468 |
itous | -0.467 |
048 | -0.448 |
Token | of |
Token ID | 286 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
hua | +1.657 |
uces | +1.607 |
rito | +1.551 |
itous | +1.546 |
048 | +1.472 |
Neg logit contributions | |
oyal | -1.827 |
stown | -1.691 |
charging | -1.654 |
atically | -1.645 |
Wolfe | -1.615 |
Token | TV |
Token ID | 3195 |
Feature activation | -8.17e-01 |
Pos logit contributions | |
hua | +2.582 |
uces | +2.475 |
rito | +2.416 |
itous | +2.375 |
048 | +2.306 |
Neg logit contributions | |
oyal | -3.055 |
stown | -2.830 |
atically | -2.798 |
agy | -2.775 |
charging | -2.743 |
Token | provider |
Token ID | 10131 |
Feature activation | -2.19e+00 |
Pos logit contributions | |
oyal | +0.594 |
stown | +0.548 |
charging | +0.535 |
atically | +0.533 |
Wolfe | +0.523 |
Neg logit contributions | |
hua | -0.573 |
uces | -0.556 |
rito | -0.536 |
itous | -0.535 |
048 | -0.510 |
Token | . |
Token ID | 13 |
Feature activation | -8.80e-01 |
Pos logit contributions | |
oyal | +1.647 |
stown | +1.521 |
charging | +1.495 |
atically | +1.484 |
Wolfe | +1.459 |
Neg logit contributions | |
hua | -1.479 |
uces | -1.434 |
itous | -1.373 |
rito | -1.373 |
048 | -1.305 |
Token |
|
Token ID | 198 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
oyal | +0.587 |
stown | +0.538 |
charging | +0.524 |
atically | +0.522 |
Wolfe | +0.511 |
Neg logit contributions | |
hua | -0.669 |
uces | -0.651 |
rito | -0.630 |
itous | -0.628 |
048 | -0.602 |
Token |
|
Token ID | 198 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
hua | +1.018 |
uces | +0.964 |
itous | +0.937 |
rito | +0.936 |
048 | +0.919 |
Neg logit contributions | |
oyal | -1.115 |
stown | -1.009 |
atically | -1.000 |
charging | -0.996 |
Gleaming | -0.983 |
Token | D |
Token ID | 35 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
oyal | +0.179 |
stown | +0.166 |
charging | +0.162 |
atically | +0.162 |
Wolfe | +0.159 |
Neg logit contributions | |
hua | -0.150 |
uces | -0.146 |
rito | -0.140 |
itous | -0.140 |
048 | -0.132 |
Token | ish |
Token ID | 680 |
Feature activation | -5.95e-02 |
Pos logit contributions | |
hua | +5.939 |
itous | +5.782 |
hi | +5.704 |
uces | +5.680 |
rito | +5.646 |
Neg logit contributions | |
Wolfe | -12.675 |
Gleaming | -12.504 |
oyal | -12.192 |
charging | -12.062 |
atically | -12.024 |
Token | , |
Token ID | 11 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
oyal | +0.043 |
stown | +0.040 |
charging | +0.039 |
atically | +0.039 |
Wolfe | +0.038 |
Neg logit contributions | |
hua | -0.042 |
uces | -0.041 |
rito | -0.039 |
itous | -0.039 |
048 | -0.037 |
Token | however |
Token ID | 2158 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
hua | +1.307 |
uces | +1.268 |
rito | +1.227 |
itous | +1.217 |
048 | +1.168 |
Neg logit contributions | |
oyal | -1.551 |
stown | -1.433 |
charging | -1.393 |
atically | -1.391 |
agy | -1.360 |
Token | , |
Token ID | 11 |
Feature activation | -3.88e+00 |
Pos logit contributions | |
oyal | +2.636 |
stown | +2.415 |
charging | +2.380 |
atically | +2.363 |
Wolfe | +2.335 |
Neg logit contributions | |
hua | -2.629 |
uces | -2.552 |
itous | -2.467 |
rito | -2.467 |
048 | -2.348 |
Token | says |
Token ID | 1139 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
oyal | +2.642 |
stown | +2.443 |
atically | +2.394 |
charging | +2.387 |
Wolfe | +2.354 |
Neg logit contributions | |
hua | -2.859 |
uces | -2.775 |
rito | -2.676 |
itous | -2.672 |
048 | -2.550 |
Token | or |
Token ID | 393 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
hua | +3.238 |
uces | +3.125 |
itous | +3.009 |
rito | +3.001 |
048 | +2.919 |
Neg logit contributions | |
oyal | -3.975 |
stown | -3.708 |
charging | -3.564 |
Wolfe | -3.561 |
Gleaming | -3.532 |
Token | 9 |
Token ID | 860 |
Feature activation | +4.59e+00 |
Pos logit contributions | |
hua | +1.159 |
uces | +1.130 |
itous | +1.081 |
rito | +1.078 |
048 | +1.044 |
Neg logit contributions | |
oyal | -1.266 |
stown | -1.166 |
charging | -1.134 |
atically | -1.125 |
Wolfe | -1.114 |
Token | smaller |
Token ID | 4833 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
hua | +2.860 |
uces | +2.746 |
itous | +2.633 |
rito | +2.624 |
048 | +2.551 |
Neg logit contributions | |
oyal | -3.667 |
stown | -3.372 |
charging | -3.288 |
atically | -3.275 |
Wolfe | -3.269 |
Token | ones |
Token ID | 3392 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
hua | +0.914 |
uces | +0.892 |
itous | +0.858 |
rito | +0.857 |
048 | +0.824 |
Neg logit contributions | |
oyal | -0.852 |
stown | -0.778 |
charging | -0.760 |
atically | -0.757 |
Wolfe | -0.744 |
Token | . |
Token ID | 13 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
hua | +0.648 |
uces | +0.628 |
rito | +0.602 |
itous | +0.601 |
048 | +0.574 |
Neg logit contributions | |
oyal | -0.803 |
stown | -0.746 |
charging | -0.727 |
atically | -0.723 |
Wolfe | -0.717 |
Token | D |
Token ID | 35 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
hua | +1.237 |
uces | +1.195 |
rito | +1.153 |
itous | +1.148 |
048 | +1.120 |
Neg logit contributions | |
oyal | -1.267 |
stown | -1.161 |
atically | -1.132 |
charging | -1.131 |
agy | -1.111 |
Token | illon |
Token ID | 23027 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
hua | +5.808 |
uces | +5.151 |
itous | +4.987 |
rito | +4.976 |
hi | +4.938 |
Neg logit contributions | |
oyal | -12.840 |
Gleaming | -12.822 |
stown | -12.684 |
Wolfe | -12.609 |
atically | -12.272 |
Token | says |
Token ID | 1139 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
hua | +1.564 |
uces | +1.514 |
itous | +1.456 |
rito | +1.455 |
048 | +1.400 |
Neg logit contributions | |
oyal | -1.556 |
stown | -1.418 |
charging | -1.399 |
atically | -1.388 |
Gleaming | -1.361 |
Token | that |
Token ID | 326 |
Feature activation | -3.68e-01 |
Pos logit contributions | |
oyal | +0.842 |
stown | +0.777 |
charging | +0.760 |
atically | +0.756 |
Wolfe | +0.741 |
Neg logit contributions | |
hua | -0.812 |
uces | -0.788 |
rito | -0.761 |
itous | -0.758 |
048 | -0.724 |
Token | in |
Token ID | 287 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
oyal | +0.268 |
stown | +0.247 |
charging | +0.241 |
atically | +0.240 |
Wolfe | +0.236 |
Neg logit contributions | |
hua | -0.257 |
uces | -0.250 |
rito | -0.240 |
itous | -0.240 |
048 | -0.230 |
Token | terms |
Token ID | 2846 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
hua | +0.863 |
uces | +0.834 |
rito | +0.802 |
itous | +0.798 |
048 | +0.768 |
Neg logit contributions | |
oyal | -0.930 |
stown | -0.853 |
atically | -0.836 |
charging | -0.830 |
agy | -0.817 |
Token | OV |
Token ID | 8874 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
oyal | +2.175 |
stown | +1.989 |
charging | +1.939 |
atically | +1.918 |
Wolfe | +1.884 |
Neg logit contributions | |
hua | -2.391 |
uces | -2.320 |
itous | -2.238 |
rito | -2.236 |
inguishable | -2.127 |
Token | even |
Token ID | 772 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
oyal | +1.084 |
stown | +1.021 |
charging | +1.003 |
atically | +1.000 |
Wolfe | +0.986 |
Neg logit contributions | |
hua | -0.532 |
uces | -0.508 |
rito | -0.481 |
itous | -0.479 |
048 | -0.450 |
Token | double |
Token ID | 4274 |
Feature activation | +7.91e-01 |
Pos logit contributions | |
oyal | +2.729 |
stown | +2.574 |
charging | +2.510 |
atically | +2.500 |
Wolfe | +2.458 |
Neg logit contributions | |
hua | -2.022 |
uces | -1.960 |
rito | -1.877 |
itous | -1.872 |
inguishable | -1.765 |
Token | or |
Token ID | 393 |
Feature activation | +8.95e-01 |
Pos logit contributions | |
hua | +0.516 |
uces | +0.497 |
itous | +0.476 |
rito | +0.474 |
048 | +0.460 |
Neg logit contributions | |
oyal | -0.615 |
stown | -0.567 |
atically | -0.554 |
charging | -0.554 |
Gleaming | -0.545 |
Token | 4 |
Token ID | 604 |
Feature activation | +7.30e+00 |
Pos logit contributions | |
hua | +0.632 |
uces | +0.613 |
itous | +0.589 |
rito | +0.585 |
048 | +0.574 |
Neg logit contributions | |
oyal | -0.641 |
stown | -0.590 |
charging | -0.579 |
atically | -0.575 |
Wolfe | -0.566 |
Token | x |
Token ID | 87 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
hua | +4.147 |
uces | +3.723 |
hi | +3.645 |
048 | +3.642 |
itous | +3.526 |
Neg logit contributions | |
oyal | -6.174 |
stown | -5.612 |
Gleaming | -5.602 |
charging | -5.586 |
atically | -5.550 |
Token | 1080 |
Token ID | 17729 |
Feature activation | +4.27e+00 |
Pos logit contributions | |
hua | +3.183 |
1080 | +2.883 |
048 | +2.726 |
uces | +2.351 |
hi | +2.342 |
Neg logit contributions | |
oyal | -15.294 |
agy | -14.871 |
stown | -14.680 |
Gleaming | -14.654 |
atically | -14.640 |
Token | P |
Token ID | 47 |
Feature activation | +8.32e+00 |
Pos logit contributions | |
hua | +2.350 |
uces | +2.148 |
itous | +2.133 |
rito | +2.118 |
048 | +2.114 |
Neg logit contributions | |
oyal | -3.692 |
atically | -3.394 |
stown | -3.374 |
charging | -3.362 |
Gleaming | -3.352 |
Token | resolution |
Token ID | 6323 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
hua | +1.756 |
uces | +1.473 |
048 | +1.420 |
itous | +1.330 |
Resolution | +1.320 |
Neg logit contributions | |
oyal | -9.764 |
stown | -9.317 |
agy | -9.241 |
Gleaming | -9.215 |
charging | -9.168 |
Token | you |
Token ID | 345 |
Feature activation | +5.18e+00 |
Pos logit contributions | |
hua | +0.894 |
uces | +0.863 |
rito | +0.825 |
itous | +0.818 |
048 | +0.796 |
Neg logit contributions | |
oyal | -1.206 |
stown | -1.112 |
charging | -1.090 |
atically | -1.088 |
Gleaming | -1.076 |
Token | will |
Token ID | 481 |
Feature activation | -9.76e-02 |
Pos logit contributions | |
hua | +3.150 |
uces | +3.015 |
rito | +2.952 |
048 | +2.851 |
itous | +2.844 |
Neg logit contributions | |
oyal | -4.064 |
stown | -3.719 |
Gleaming | -3.715 |
charging | -3.663 |
atically | -3.626 |
Token | men |
Token ID | 1450 |
Feature activation | +4.43e+00 |
Pos logit contributions | |
oyal | +0.079 |
stown | +0.073 |
charging | +0.071 |
atically | +0.070 |
agy | +0.069 |
Neg logit contributions | |
hua | -0.078 |
uces | -0.075 |
rito | -0.073 |
itous | -0.072 |
048 | -0.069 |
Token | and |
Token ID | 290 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
hua | +2.766 |
uces | +2.601 |
rito | +2.535 |
itous | +2.504 |
hi | +2.409 |
Neg logit contributions | |
oyal | -3.511 |
stown | -3.259 |
Gleaming | -3.205 |
charging | -3.177 |
agy | -3.141 |
Token | women |
Token ID | 1466 |
Feature activation | +3.48e+00 |
Pos logit contributions | |
hua | +1.669 |
uces | +1.608 |
rito | +1.564 |
itous | +1.542 |
048 | +1.474 |
Neg logit contributions | |
oyal | -1.915 |
stown | -1.756 |
charging | -1.719 |
atically | -1.711 |
agy | -1.689 |
Token | of |
Token ID | 286 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
hua | +2.181 |
uces | +2.061 |
rito | +2.010 |
itous | +1.984 |
hi | +1.905 |
Neg logit contributions | |
oyal | -2.780 |
stown | -2.572 |
charging | -2.514 |
Gleaming | -2.507 |
agy | -2.470 |
Token | all |
Token ID | 477 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
hua | +5.006 |
uces | +4.859 |
rito | +4.742 |
itous | +4.660 |
hi | +4.448 |
Neg logit contributions | |
oyal | -9.652 |
stown | -9.103 |
charging | -9.077 |
agy | -9.067 |
Gleaming | -8.908 |
Token | ethnic |
Token ID | 9450 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
uces | +6.327 |
hua | +6.278 |
rito | +6.002 |
itous | +5.955 |
hi | +5.769 |
Neg logit contributions | |
oyal | -12.110 |
Gleaming | -11.399 |
charging | -11.299 |
stown | -11.261 |
atically | -11.236 |
Token | ities |
Token ID | 871 |
Feature activation | +6.24e+00 |
Pos logit contributions | |
hua | +5.113 |
uces | +5.084 |
rito | +5.058 |
itous | +4.921 |
liest | +4.513 |
Neg logit contributions | |
oyal | -12.736 |
stown | -12.191 |
charging | -12.090 |
atically | -11.898 |
agy | -11.873 |
Token | . |
Token ID | 13 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
hua | +3.699 |
uces | +3.475 |
rito | +3.435 |
itous | +3.373 |
hi | +3.269 |
Neg logit contributions | |
oyal | -5.062 |
stown | -4.746 |
Gleaming | -4.624 |
charging | -4.575 |
agy | -4.538 |
Token | This |
Token ID | 770 |
Feature activation | +2.56e+00 |
Pos logit contributions | |
hua | +1.472 |
uces | +1.401 |
rito | +1.368 |
itous | +1.354 |
048 | +1.322 |
Neg logit contributions | |
oyal | -1.383 |
stown | -1.246 |
charging | -1.238 |
atically | -1.234 |
agy | -1.209 |
Token | seems |
Token ID | 2331 |
Feature activation | +3.67e+00 |
Pos logit contributions | |
hua | +1.715 |
uces | +1.641 |
rito | +1.591 |
itous | +1.590 |
hi | +1.511 |
Neg logit contributions | |
oyal | -1.941 |
stown | -1.776 |
charging | -1.756 |
atically | -1.726 |
agy | -1.722 |
Token | clear |
Token ID | 1598 |
Feature activation | +2.73e+00 |
Pos logit contributions | |
hua | +2.281 |
uces | +2.209 |
rito | +2.114 |
itous | +2.100 |
hi | +1.998 |
Neg logit contributions | |
oyal | -2.899 |
stown | -2.719 |
charging | -2.657 |
atically | -2.619 |
Gleaming | -2.594 |
Token | � |
Token ID | 447 |
Feature activation | +5.75e-02 |
Pos logit contributions | |
hua | +3.078 |
uces | +2.951 |
rito | +2.879 |
itous | +2.843 |
hi | +2.717 |
Neg logit contributions | |
oyal | -3.681 |
stown | -3.412 |
charging | -3.377 |
atically | -3.330 |
agy | -3.305 |
Token | � |
Token ID | 247 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
hua | +0.041 |
uces | +0.040 |
rito | +0.039 |
itous | +0.039 |
048 | +0.037 |
Neg logit contributions | |
oyal | -0.041 |
stown | -0.038 |
charging | -0.037 |
atically | -0.036 |
Wolfe | -0.036 |
Token | s |
Token ID | 82 |
Feature activation | +9.96e-01 |
Pos logit contributions | |
hua | +1.304 |
uces | +1.265 |
rito | +1.223 |
itous | +1.220 |
048 | +1.165 |
Neg logit contributions | |
oyal | -1.270 |
stown | -1.171 |
charging | -1.147 |
atically | -1.137 |
Wolfe | -1.122 |
Token | anti |
Token ID | 3098 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
hua | +0.674 |
uces | +0.649 |
rito | +0.629 |
itous | +0.629 |
048 | +0.597 |
Neg logit contributions | |
oyal | -0.744 |
stown | -0.688 |
charging | -0.676 |
atically | -0.670 |
agy | -0.662 |
Token | - |
Token ID | 12 |
Feature activation | -7.17e-01 |
Pos logit contributions | |
oyal | +0.204 |
stown | +0.191 |
atically | +0.187 |
charging | +0.185 |
Gleaming | +0.184 |
Neg logit contributions | |
hua | -0.151 |
uces | -0.145 |
rito | -0.140 |
itous | -0.139 |
048 | -0.133 |
Token | Pet |
Token ID | 25803 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
oyal | +0.561 |
stown | +0.519 |
charging | +0.511 |
atically | +0.504 |
Wolfe | +0.494 |
Neg logit contributions | |
hua | -0.464 |
uces | -0.451 |
rito | -0.432 |
itous | -0.431 |
048 | -0.411 |
Token | ro |
Token ID | 305 |
Feature activation | -4.35e+00 |
Pos logit contributions | |
rito | +5.427 |
hua | +5.170 |
hi | +4.655 |
itous | +4.375 |
uces | +4.208 |
Neg logit contributions | |
oyal | -12.904 |
Gleaming | -12.667 |
atically | -12.536 |
=] | -12.491 |
agy | -12.412 |
Token | car |
Token ID | 7718 |
Feature activation | -3.75e+00 |
Pos logit contributions | |
oyal | +3.214 |
stown | +2.977 |
charging | +2.937 |
atically | +2.881 |
agy | +2.808 |
Neg logit contributions | |
hua | -2.949 |
uces | -2.900 |
itous | -2.782 |
rito | -2.763 |
048 | -2.647 |
Token | ibe |
Token ID | 32438 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
oyal | +2.813 |
stown | +2.599 |
charging | +2.547 |
atically | +2.531 |
Wolfe | +2.481 |
Neg logit contributions | |
hua | -2.526 |
uces | -2.458 |
rito | -2.361 |
itous | -2.350 |
048 | -2.254 |
Token | position |
Token ID | 2292 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
oyal | +1.480 |
stown | +1.360 |
charging | +1.329 |
atically | +1.321 |
Wolfe | +1.301 |
Neg logit contributions | |
hua | -1.467 |
uces | -1.433 |
rito | -1.379 |
itous | -1.373 |
048 | -1.312 |
Token | and |
Token ID | 290 |
Feature activation | -3.69e+00 |
Pos logit contributions | |
hua | +2.113 |
uces | +2.027 |
rito | +1.953 |
itous | +1.950 |
048 | +1.865 |
Neg logit contributions | |
oyal | -2.609 |
stown | -2.428 |
charging | -2.369 |
atically | -2.335 |
Gleaming | -2.335 |
Token | prior |
Token ID | 3161 |
Feature activation | -9.29e-01 |
Pos logit contributions | |
oyal | +1.392 |
stown | +1.273 |
charging | +1.239 |
atically | +1.230 |
Wolfe | +1.208 |
Neg logit contributions | |
hua | -1.739 |
uces | -1.697 |
rito | -1.643 |
itous | -1.639 |
048 | -1.573 |
Token | incident |
Token ID | 4519 |
Feature activation | +3.17e+00 |
Pos logit contributions | |
oyal | +0.631 |
stown | +0.578 |
charging | +0.564 |
atically | +0.561 |
Wolfe | +0.550 |
Neg logit contributions | |
hua | -0.695 |
uces | -0.677 |
rito | -0.654 |
itous | -0.652 |
048 | -0.625 |
Token | : |
Token ID | 25 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
hua | +1.862 |
uces | +1.767 |
rito | +1.704 |
itous | +1.693 |
048 | +1.625 |
Neg logit contributions | |
oyal | -2.670 |
stown | -2.461 |
charging | -2.419 |
Gleaming | -2.414 |
atically | -2.405 |
Token |
|
Token ID | 198 |
Feature activation | +7.94e-01 |
Pos logit contributions | |
hua | +1.181 |
uces | +1.146 |
rito | +1.106 |
itous | +1.103 |
048 | +1.058 |
Neg logit contributions | |
oyal | -1.152 |
stown | -1.059 |
charging | -1.034 |
atically | -1.031 |
Wolfe | -1.007 |
Token |
|
Token ID | 198 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
hua | +0.556 |
uces | +0.529 |
itous | +0.513 |
rito | +0.513 |
048 | +0.502 |
Neg logit contributions | |
oyal | -0.584 |
stown | -0.530 |
atically | -0.524 |
charging | -0.522 |
Gleaming | -0.512 |
Token | D |
Token ID | 35 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
hua | +0.427 |
uces | +0.413 |
rito | +0.398 |
itous | +0.396 |
048 | +0.378 |
Neg logit contributions | |
oyal | -0.510 |
stown | -0.473 |
charging | -0.463 |
atically | -0.462 |
Wolfe | -0.454 |
Token | ani |
Token ID | 3216 |
Feature activation | +7.45e+00 |
Pos logit contributions | |
hua | +6.141 |
uces | +6.133 |
itous | +5.866 |
rito | +5.728 |
hi | +5.696 |
Neg logit contributions | |
Gleaming | -12.039 |
Wolfe | -11.782 |
stown | -11.429 |
charging | -11.359 |
atically | -11.301 |
Token | els |
Token ID | 1424 |
Feature activation | +2.93e+00 |
Pos logit contributions | |
hua | +1.863 |
uces | +1.828 |
048 | +1.482 |
itous | +1.451 |
rito | +1.402 |
Neg logit contributions | |
oyal | -8.371 |
Gleaming | -8.132 |
stown | -8.019 |
atically | -7.949 |
charging | -7.931 |
Token | � |
Token ID | 447 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
hua | +2.049 |
uces | +2.000 |
itous | +1.914 |
rito | +1.911 |
048 | +1.848 |
Neg logit contributions | |
oyal | -2.120 |
stown | -1.919 |
charging | -1.893 |
atically | -1.889 |
agy | -1.865 |
Token | � |
Token ID | 247 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
hua | +2.585 |
uces | +2.499 |
rito | +2.402 |
itous | +2.367 |
048 | +2.276 |
Neg logit contributions | |
oyal | -3.389 |
stown | -3.173 |
charging | -3.087 |
atically | -3.072 |
Wolfe | -3.034 |
Token | mug |
Token ID | 25152 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
hua | +2.435 |
uces | +2.363 |
rito | +2.279 |
itous | +2.267 |
048 | +2.200 |
Neg logit contributions | |
oyal | -2.383 |
stown | -2.153 |
charging | -2.111 |
atically | -2.105 |
agy | -2.086 |
Token | mates |
Token ID | 27973 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
hua | +1.175 |
uces | +1.139 |
rito | +1.099 |
itous | +1.093 |
048 | +1.052 |
Neg logit contributions | |
oyal | -1.232 |
stown | -1.128 |
charging | -1.111 |
atically | -1.101 |
Wolfe | -1.080 |
Token | , |
Token ID | 11 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
oyal | +2.220 |
stown | +2.039 |
charging | +1.970 |
atically | +1.963 |
Wolfe | +1.941 |
Neg logit contributions | |
hua | -2.526 |
uces | -2.484 |
itous | -2.379 |
rito | -2.376 |
048 | -2.268 |
Token | V |
Token ID | 569 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
oyal | +1.595 |
stown | +1.479 |
charging | +1.444 |
atically | +1.433 |
Wolfe | +1.416 |
Neg logit contributions | |
hua | -1.557 |
uces | -1.521 |
itous | -1.465 |
rito | -1.460 |
048 | -1.386 |
Token | Ps |
Token ID | 12016 |
Feature activation | -4.08e+00 |
Pos logit contributions | |
oyal | +1.587 |
stown | +1.463 |
atically | +1.430 |
charging | +1.425 |
Wolfe | +1.399 |
Neg logit contributions | |
hua | -1.440 |
uces | -1.399 |
rito | -1.335 |
itous | -1.335 |
048 | -1.274 |
Token | See |
Token ID | 4091 |
Feature activation | -7.40e-01 |
Pos logit contributions | |
oyal | +2.832 |
stown | +2.594 |
charging | +2.528 |
atically | +2.518 |
agy | +2.473 |
Neg logit contributions | |
hua | -2.938 |
uces | -2.888 |
rito | -2.769 |
itous | -2.760 |
048 | -2.631 |
Token | Gallery |
Token ID | 12917 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
oyal | +0.610 |
stown | +0.562 |
charging | +0.560 |
agy | +0.550 |
atically | +0.547 |
Neg logit contributions | |
hua | -0.454 |
uces | -0.427 |
rito | -0.415 |
itous | -0.413 |
048 | -0.396 |
Token | Donald |
Token ID | 3759 |
Feature activation | +4.99e+00 |
Pos logit contributions | |
oyal | +8.289 |
stown | +7.913 |
Others | +7.872 |
Wolfe | +7.566 |
CLOSE | +7.532 |
Neg logit contributions | |
hua | -12.190 |
uces | -11.764 |
rito | -11.500 |
itous | -11.339 |
048 | -11.060 |
Token | Trump |
Token ID | 1301 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
hua | +2.940 |
uces | +2.744 |
rito | +2.667 |
itous | +2.645 |
048 | +2.620 |
Neg logit contributions | |
oyal | -4.173 |
Gleaming | -3.733 |
atically | -3.729 |
charging | -3.726 |
stown | -3.643 |
Token | passes |
Token ID | 8318 |
Feature activation | +7.23e-01 |
Pos logit contributions | |
oyal | +1.355 |
stown | +1.257 |
charging | +1.230 |
atically | +1.223 |
Wolfe | +1.202 |
Neg logit contributions | |
hua | -1.203 |
uces | -1.167 |
rito | -1.125 |
itous | -1.122 |
048 | -1.067 |
Token | on |
Token ID | 319 |
Feature activation | -8.14e-01 |
Pos logit contributions | |
hua | +0.494 |
uces | +0.479 |
rito | +0.461 |
itous | +0.460 |
048 | +0.438 |
Neg logit contributions | |
oyal | -0.538 |
stown | -0.497 |
charging | -0.486 |
atically | -0.484 |
Wolfe | -0.474 |
Token | ' |
Token ID | 705 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
oyal | +0.602 |
stown | +0.559 |
charging | +0.548 |
atically | +0.541 |
Wolfe | +0.534 |
Neg logit contributions | |
hua | -0.556 |
uces | -0.544 |
rito | -0.521 |
itous | -0.520 |
048 | -0.498 |
Token | and |
Token ID | 290 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
oyal | +4.315 |
stown | +4.015 |
charging | +3.859 |
atically | +3.791 |
Wolfe | +3.729 |
Neg logit contributions | |
hua | -5.084 |
uces | -4.994 |
rito | -4.817 |
itous | -4.708 |
048 | -4.658 |
Token | get |
Token ID | 651 |
Feature activation | +2.06e-02 |
Pos logit contributions | |
oyal | +0.744 |
stown | +0.685 |
charging | +0.669 |
atically | +0.666 |
Wolfe | +0.654 |
Neg logit contributions | |
hua | -0.739 |
uces | -0.718 |
rito | -0.693 |
itous | -0.691 |
048 | -0.660 |
Token | three |
Token ID | 1115 |
Feature activation | -5.10e+00 |
Pos logit contributions | |
hua | +0.016 |
uces | +0.016 |
itous | +0.016 |
rito | +0.015 |
hi | +0.015 |
Neg logit contributions | |
oyal | -0.013 |
stown | -0.012 |
atically | -0.011 |
charging | -0.011 |
agy | -0.011 |
Token | actions |
Token ID | 4028 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
oyal | +3.009 |
stown | +2.730 |
charging | +2.650 |
atically | +2.641 |
Wolfe | +2.561 |
Neg logit contributions | |
hua | -4.271 |
uces | -4.119 |
rito | -4.017 |
itous | -3.964 |
048 | -3.864 |
Token | in |
Token ID | 287 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
hua | +0.282 |
uces | +0.270 |
rito | +0.261 |
itous | +0.260 |
048 | +0.249 |
Neg logit contributions | |
oyal | -0.384 |
stown | -0.352 |
charging | -0.350 |
atically | -0.348 |
Gleaming | -0.343 |
Token | your |
Token ID | 534 |
Feature activation | -1.59e+01 |
Pos logit contributions | |
oyal | +0.926 |
stown | +0.859 |
charging | +0.842 |
atically | +0.839 |
Wolfe | +0.825 |
Neg logit contributions | |
hua | -0.727 |
uces | -0.703 |
rito | -0.675 |
itous | -0.673 |
048 | -0.640 |
Token | inbox |
Token ID | 13734 |
Feature activation | -4.76e+00 |
Pos logit contributions | |
stown | +3.963 |
oyal | +3.878 |
Armstrong | +3.191 |
charging | +3.189 |
atically | +3.078 |
Neg logit contributions | |
hua | -16.401 |
uces | -16.109 |
inguishable | -15.952 |
ADRA | -15.767 |
itous | -15.588 |
Token | every |
Token ID | 790 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
oyal | +3.249 |
stown | +3.020 |
charging | +2.922 |
atically | +2.903 |
Wolfe | +2.838 |
Neg logit contributions | |
hua | -3.505 |
uces | -3.442 |
rito | -3.275 |
itous | -3.273 |
048 | -3.139 |
Token | week |
Token ID | 1285 |
Feature activation | -5.46e+00 |
Pos logit contributions | |
oyal | +2.252 |
stown | +2.085 |
charging | +2.025 |
atically | +2.024 |
Wolfe | +1.972 |
Neg logit contributions | |
hua | -2.628 |
uces | -2.583 |
rito | -2.470 |
itous | -2.460 |
inguishable | -2.375 |
Token | . |
Token ID | 13 |
Feature activation | -7.25e-01 |
Pos logit contributions | |
oyal | +3.957 |
stown | +3.701 |
charging | +3.584 |
atically | +3.544 |
Wolfe | +3.505 |
Neg logit contributions | |
hua | -3.738 |
uces | -3.702 |
rito | -3.526 |
itous | -3.504 |
inguishable | -3.398 |
Token |
|
Token ID | 198 |
Feature activation | -2.13e+00 |
Pos logit contributions | |
oyal | +0.503 |
stown | +0.461 |
atically | +0.453 |
charging | +0.452 |
agy | +0.441 |
Neg logit contributions | |
hua | -0.531 |
uces | -0.515 |
rito | -0.498 |
itous | -0.496 |
048 | -0.478 |
Token | it |
Token ID | 340 |
Feature activation | -2.26e+00 |
Pos logit contributions | |
oyal | +0.026 |
stown | +0.024 |
charging | +0.023 |
atically | +0.023 |
agy | +0.022 |
Neg logit contributions | |
hua | -0.023 |
uces | -0.022 |
rito | -0.021 |
itous | -0.021 |
048 | -0.020 |
Token | is |
Token ID | 318 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
oyal | +1.609 |
stown | +1.487 |
charging | +1.451 |
atically | +1.451 |
Wolfe | +1.425 |
Neg logit contributions | |
hua | -1.593 |
uces | -1.550 |
rito | -1.501 |
itous | -1.492 |
048 | -1.425 |
Token | for |
Token ID | 329 |
Feature activation | +4.78e+00 |
Pos logit contributions | |
oyal | +0.268 |
stown | +0.248 |
charging | +0.243 |
atically | +0.242 |
Wolfe | +0.237 |
Neg logit contributions | |
hua | -0.243 |
uces | -0.236 |
rito | -0.227 |
itous | -0.227 |
048 | -0.216 |
Token | making |
Token ID | 1642 |
Feature activation | -5.67e-01 |
Pos logit contributions | |
hua | +3.006 |
uces | +2.869 |
itous | +2.801 |
rito | +2.762 |
048 | +2.664 |
Neg logit contributions | |
oyal | -3.674 |
stown | -3.454 |
atically | -3.367 |
charging | -3.339 |
agy | -3.330 |
Token | the |
Token ID | 262 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
oyal | +0.415 |
stown | +0.383 |
charging | +0.375 |
atically | +0.373 |
agy | +0.365 |
Neg logit contributions | |
hua | -0.394 |
uces | -0.382 |
itous | -0.368 |
rito | -0.368 |
048 | -0.351 |
Token | latter |
Token ID | 6846 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
oyal | +1.817 |
stown | +1.658 |
charging | +1.618 |
atically | +1.610 |
Wolfe | +1.586 |
Neg logit contributions | |
hua | -2.103 |
uces | -2.051 |
rito | -1.986 |
itous | -1.967 |
048 | -1.893 |
Token | argument |
Token ID | 4578 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
oyal | +8.379 |
Wolfe | +7.627 |
atically | +7.597 |
stown | +7.573 |
Armstrong | +7.425 |
Neg logit contributions | |
uces | -10.937 |
hua | -10.937 |
rito | -10.895 |
itous | -10.402 |
inguishable | -10.312 |
Token | — |
Token ID | 960 |
Feature activation | -4.00e+00 |
Pos logit contributions | |
oyal | +2.839 |
stown | +2.624 |
atically | +2.596 |
charging | +2.534 |
Wolfe | +2.523 |
Neg logit contributions | |
hua | -2.970 |
uces | -2.906 |
rito | -2.808 |
itous | -2.763 |
048 | -2.668 |
Token | that |
Token ID | 5562 |
Feature activation | -5.61e+00 |
Pos logit contributions | |
oyal | +2.756 |
stown | +2.532 |
charging | +2.521 |
atically | +2.468 |
Wolfe | +2.400 |
Neg logit contributions | |
hua | -2.915 |
uces | -2.863 |
rito | -2.739 |
itous | -2.729 |
048 | -2.614 |
Token | it |
Token ID | 340 |
Feature activation | -5.31e-01 |
Pos logit contributions | |
oyal | +3.926 |
stown | +3.591 |
charging | +3.519 |
atically | +3.507 |
Wolfe | +3.506 |
Neg logit contributions | |
hua | -3.957 |
uces | -3.846 |
rito | -3.817 |
itous | -3.678 |
inguishable | -3.547 |
Token | was |
Token ID | 373 |
Feature activation | -3.85e+00 |
Pos logit contributions | |
oyal | +0.394 |
stown | +0.364 |
charging | +0.356 |
atically | +0.355 |
Wolfe | +0.348 |
Neg logit contributions | |
hua | -0.364 |
uces | -0.353 |
rito | -0.340 |
itous | -0.339 |
048 | -0.324 |
Token | . |
Token ID | 13 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
oyal | +3.385 |
stown | +3.138 |
atically | +3.076 |
charging | +3.071 |
Wolfe | +2.991 |
Neg logit contributions | |
hua | -3.199 |
uces | -3.123 |
itous | -2.985 |
rito | -2.983 |
048 | -2.853 |
Token | Share |
Token ID | 8734 |
Feature activation | -6.36e+00 |
Pos logit contributions | |
oyal | +1.693 |
stown | +1.557 |
charging | +1.513 |
atically | +1.507 |
Wolfe | +1.483 |
Neg logit contributions | |
hua | -1.871 |
uces | -1.824 |
rito | -1.760 |
itous | -1.756 |
048 | -1.681 |
Token | a |
Token ID | 257 |
Feature activation | -5.53e+00 |
Pos logit contributions | |
oyal | +4.233 |
stown | +3.904 |
charging | +3.815 |
Wolfe | +3.767 |
atically | +3.767 |
Neg logit contributions | |
hua | -4.640 |
uces | -4.500 |
rito | -4.333 |
itous | -4.271 |
048 | -4.173 |
Token | picture |
Token ID | 4286 |
Feature activation | -9.28e+00 |
Pos logit contributions | |
oyal | +3.780 |
stown | +3.485 |
charging | +3.369 |
Wolfe | +3.368 |
atically | +3.364 |
Neg logit contributions | |
hua | -3.999 |
uces | -3.916 |
rito | -3.713 |
itous | -3.683 |
048 | -3.578 |
Token | on |
Token ID | 319 |
Feature activation | -6.16e+00 |
Pos logit contributions | |
oyal | +5.901 |
stown | +5.411 |
atically | +5.287 |
charging | +5.175 |
Wolfe | +5.134 |
Neg logit contributions | |
uces | -6.870 |
hua | -6.809 |
rito | -6.405 |
itous | -6.376 |
048 | -6.281 |
Token | Instagram |
Token ID | 10767 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
oyal | +4.138 |
stown | +3.818 |
charging | +3.676 |
Others | +3.660 |
atically | +3.656 |
Neg logit contributions | |
hua | -4.588 |
uces | -4.448 |
rito | -4.259 |
itous | -4.246 |
048 | -4.074 |
Token | . |
Token ID | 13 |
Feature activation | -3.54e+00 |
Pos logit contributions | |
oyal | +8.208 |
stown | +7.487 |
atically | +7.317 |
charging | +7.256 |
Others | +7.150 |
Neg logit contributions | |
uces | -10.954 |
hua | -10.938 |
itous | -10.366 |
rito | -10.234 |
liest | -10.033 |
Token | Text |
Token ID | 8255 |
Feature activation | -4.85e+00 |
Pos logit contributions | |
oyal | +2.372 |
stown | +2.192 |
charging | +2.115 |
atically | +2.111 |
Wolfe | +2.089 |
Neg logit contributions | |
hua | -2.658 |
uces | -2.605 |
rito | -2.505 |
itous | -2.503 |
048 | -2.394 |
Token | your |
Token ID | 534 |
Feature activation | -2.31e+00 |
Pos logit contributions | |
oyal | +3.396 |
stown | +3.152 |
charging | +3.061 |
atically | +3.050 |
Wolfe | +3.005 |
Neg logit contributions | |
hua | -3.463 |
uces | -3.383 |
itous | -3.247 |
rito | -3.246 |
048 | -3.109 |
Token | buds |
Token ID | 36402 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
oyal | +1.531 |
stown | +1.409 |
atically | +1.361 |
charging | +1.359 |
Wolfe | +1.338 |
Neg logit contributions | |
hua | -1.763 |
uces | -1.718 |
rito | -1.657 |
itous | -1.655 |
048 | -1.585 |
Token | . |
Token ID | 13 |
Feature activation | -4.51e-01 |
Pos logit contributions | |
oyal | +2.427 |
stown | +2.250 |
atically | +2.187 |
charging | +2.186 |
Wolfe | +2.151 |
Neg logit contributions | |
hua | -2.339 |
uces | -2.284 |
itous | -2.194 |
rito | -2.192 |
048 | -2.107 |
Token | posted |
Token ID | 4481 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
oyal | +1.376 |
stown | +1.282 |
atically | +1.245 |
charging | +1.244 |
Wolfe | +1.228 |
Neg logit contributions | |
hua | -1.297 |
uces | -1.260 |
rito | -1.217 |
itous | -1.210 |
048 | -1.154 |
Token | this |
Token ID | 428 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
hua | +1.155 |
uces | +1.114 |
rito | +1.072 |
itous | +1.072 |
048 | +1.024 |
Neg logit contributions | |
oyal | -1.314 |
stown | -1.212 |
charging | -1.190 |
atically | -1.184 |
agy | -1.158 |
Token | cryptic |
Token ID | 47774 |
Feature activation | -3.59e+00 |
Pos logit contributions | |
oyal | +0.747 |
stown | +0.673 |
charging | +0.652 |
atically | +0.650 |
Wolfe | +0.633 |
Neg logit contributions | |
hua | -1.147 |
uces | -1.121 |
rito | -1.088 |
itous | -1.085 |
048 | -1.047 |
Token | message |
Token ID | 3275 |
Feature activation | -7.48e-01 |
Pos logit contributions | |
oyal | +2.418 |
stown | +2.241 |
atically | +2.156 |
Wolfe | +2.154 |
charging | +2.143 |
Neg logit contributions | |
hua | -2.642 |
uces | -2.615 |
rito | -2.496 |
itous | -2.465 |
048 | -2.409 |
Token | on |
Token ID | 319 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
oyal | +0.545 |
stown | +0.505 |
charging | +0.492 |
atically | +0.490 |
Wolfe | +0.483 |
Neg logit contributions | |
hua | -0.520 |
uces | -0.508 |
rito | -0.489 |
itous | -0.485 |
048 | -0.465 |
Token | her |
Token ID | 607 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
oyal | +1.505 |
stown | +1.358 |
charging | +1.296 |
atically | +1.293 |
Wolfe | +1.279 |
Neg logit contributions | |
hua | -2.556 |
uces | -2.510 |
rito | -2.443 |
itous | -2.427 |
048 | -2.334 |
Token | Instagram |
Token ID | 10767 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
oyal | +6.141 |
stown | +5.500 |
Wolfe | +5.177 |
Armstrong | +5.112 |
atically | +4.968 |
Neg logit contributions | |
hua | -12.354 |
uces | -12.168 |
rito | -11.852 |
itous | -11.518 |
atos | -11.291 |
Token | following |
Token ID | 1708 |
Feature activation | -5.11e+00 |
Pos logit contributions | |
oyal | +8.105 |
stown | +7.575 |
charging | +7.471 |
atically | +7.395 |
Wolfe | +7.374 |
Neg logit contributions | |
uces | -8.154 |
hua | -8.007 |
rito | -7.820 |
itous | -7.514 |
inguishable | -7.496 |
Token | the |
Token ID | 262 |
Feature activation | -3.24e+00 |
Pos logit contributions | |
oyal | +3.276 |
stown | +3.067 |
charging | +2.944 |
Wolfe | +2.933 |
atically | +2.929 |
Neg logit contributions | |
hua | -3.898 |
uces | -3.823 |
rito | -3.696 |
itous | -3.678 |
inguishable | -3.551 |
Token | incident |
Token ID | 4519 |
Feature activation | -4.90e+00 |
Pos logit contributions | |
oyal | +1.954 |
stown | +1.784 |
charging | +1.733 |
atically | +1.720 |
Wolfe | +1.691 |
Neg logit contributions | |
hua | -2.648 |
uces | -2.593 |
rito | -2.517 |
itous | -2.498 |
048 | -2.394 |
Token |
|
Token ID | 198 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
oyal | +3.573 |
stown | +3.340 |
charging | +3.242 |
atically | +3.231 |
Wolfe | +3.223 |
Neg logit contributions | |
hua | -3.286 |
uces | -3.212 |
rito | -3.090 |
itous | -3.066 |
048 | -2.933 |
Token | requests |
Token ID | 7007 |
Feature activation | +6.03e+00 |
Pos logit contributions | |
hua | +1.555 |
uces | +1.498 |
rito | +1.451 |
itous | +1.442 |
048 | +1.387 |
Neg logit contributions | |
oyal | -1.553 |
stown | -1.422 |
atically | -1.392 |
charging | -1.389 |
agy | -1.363 |
Token | for |
Token ID | 329 |
Feature activation | +6.47e+00 |
Pos logit contributions | |
hua | +3.196 |
uces | +2.951 |
rito | +2.900 |
itous | +2.850 |
048 | +2.728 |
Neg logit contributions | |
oyal | -5.362 |
stown | -4.980 |
Gleaming | -4.932 |
atically | -4.891 |
charging | -4.856 |
Token | comment |
Token ID | 2912 |
Feature activation | +3.30e+00 |
Pos logit contributions | |
hua | +3.765 |
uces | +3.585 |
rito | +3.443 |
itous | +3.414 |
hi | +3.267 |
Neg logit contributions | |
oyal | -5.422 |
stown | -4.983 |
atically | -4.911 |
Gleaming | -4.905 |
charging | -4.849 |
Token | and |
Token ID | 290 |
Feature activation | -5.95e-01 |
Pos logit contributions | |
hua | +2.004 |
uces | +1.893 |
rito | +1.846 |
itous | +1.827 |
048 | +1.752 |
Neg logit contributions | |
oyal | -2.686 |
stown | -2.498 |
atically | -2.443 |
Gleaming | -2.441 |
charging | -2.433 |
Token | Boh |
Token ID | 44366 |
Feature activation | +1.00e-01 |
Pos logit contributions | |
oyal | +0.434 |
stown | +0.401 |
charging | +0.392 |
atically | +0.390 |
Wolfe | +0.384 |
Neg logit contributions | |
hua | -0.414 |
uces | -0.403 |
rito | -0.389 |
itous | -0.387 |
048 | -0.370 |
Token | oli |
Token ID | 11106 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
hua | +0.058 |
uces | +0.056 |
rito | +0.054 |
itous | +0.053 |
048 | +0.050 |
Neg logit contributions | |
oyal | -0.085 |
stown | -0.079 |
charging | -0.078 |
atically | -0.077 |
Wolfe | -0.076 |
Token | ub |
Token ID | 549 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
oyal | +9.631 |
stown | +8.667 |
agy | +8.287 |
atically | +8.182 |
charging | +8.107 |
Neg logit contributions | |
hua | -8.973 |
uces | -8.915 |
itous | -8.720 |
liest | -8.648 |
rito | -8.527 |
Token | ov |
Token ID | 709 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
oyal | +1.937 |
stown | +1.745 |
charging | +1.684 |
atically | +1.681 |
agy | +1.631 |
Neg logit contributions | |
hua | -2.961 |
uces | -2.895 |
rito | -2.811 |
itous | -2.806 |
048 | -2.702 |
Token | could |
Token ID | 714 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
oyal | +0.615 |
stown | +0.569 |
charging | +0.556 |
atically | +0.554 |
Wolfe | +0.544 |
Neg logit contributions | |
hua | -0.554 |
uces | -0.538 |
rito | -0.518 |
itous | -0.516 |
048 | -0.492 |
Token | not |
Token ID | 407 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
hua | +0.982 |
uces | +0.945 |
rito | +0.912 |
itous | +0.904 |
048 | +0.863 |
Neg logit contributions | |
oyal | -1.373 |
stown | -1.279 |
charging | -1.257 |
atically | -1.250 |
Wolfe | -1.230 |
Token | be |
Token ID | 307 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
hua | +1.291 |
uces | +1.247 |
rito | +1.217 |
itous | +1.200 |
048 | +1.158 |
Neg logit contributions | |
oyal | -1.379 |
stown | -1.262 |
charging | -1.245 |
atically | -1.227 |
Gleaming | -1.215 |
Token | transact |
Token ID | 48878 |
Feature activation | +4.37e+00 |
Pos logit contributions | |
oyal | +0.583 |
stown | +0.538 |
charging | +0.526 |
atically | +0.524 |
Wolfe | +0.513 |
Neg logit contributions | |
hua | -0.562 |
uces | -0.546 |
rito | -0.526 |
itous | -0.525 |
048 | -0.501 |
Token | ional |
Token ID | 1538 |
Feature activation | +2.41e+00 |
Pos logit contributions | |
hua | +0.933 |
uces | +0.835 |
rito | +0.735 |
itous | +0.714 |
hi | +0.606 |
Neg logit contributions | |
oyal | -5.188 |
stown | -4.985 |
Gleaming | -4.942 |
charging | -4.878 |
Wolfe | -4.857 |
Token | in |
Token ID | 287 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
hua | +1.541 |
uces | +1.481 |
itous | +1.438 |
rito | +1.426 |
048 | +1.360 |
Neg logit contributions | |
oyal | -1.870 |
stown | -1.731 |
charging | -1.703 |
atically | -1.684 |
agy | -1.676 |
Token | nature |
Token ID | 3450 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
oyal | +1.120 |
stown | +1.034 |
charging | +1.011 |
atically | +1.004 |
Wolfe | +0.987 |
Neg logit contributions | |
hua | -1.139 |
uces | -1.108 |
rito | -1.070 |
itous | -1.066 |
048 | -1.020 |
Token | to |
Token ID | 284 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
hua | +0.687 |
uces | +0.664 |
rito | +0.639 |
itous | +0.638 |
048 | +0.608 |
Neg logit contributions | |
oyal | -0.818 |
stown | -0.757 |
charging | -0.743 |
atically | -0.737 |
Wolfe | -0.726 |
Token | being |
Token ID | 852 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
oyal | +6.948 |
stown | +6.349 |
charging | +6.226 |
atically | +6.175 |
Armstrong | +5.935 |
Neg logit contributions | |
hua | -8.092 |
uces | -7.935 |
rito | -7.740 |
itous | -7.418 |
048 | -7.413 |
Token | more |
Token ID | 517 |
Feature activation | -9.78e+00 |
Pos logit contributions | |
oyal | +7.892 |
stown | +7.298 |
atically | +7.128 |
charging | +7.030 |
Armstrong | +6.934 |
Neg logit contributions | |
hua | -10.292 |
uces | -10.022 |
rito | -9.834 |
048 | -9.533 |
itous | -9.513 |
Token | of |
Token ID | 286 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
oyal | +6.368 |
stown | +5.848 |
atically | +5.717 |
charging | +5.695 |
Armstrong | +5.578 |
Neg logit contributions | |
hua | -7.068 |
uces | -6.945 |
rito | -6.650 |
itous | -6.523 |
048 | -6.478 |
Token | recognized |
Token ID | 8018 |
Feature activation | +8.62e-01 |
Pos logit contributions | |
oyal | +1.793 |
stown | +1.642 |
charging | +1.609 |
atically | +1.600 |
Wolfe | +1.563 |
Neg logit contributions | |
hua | -1.915 |
uces | -1.871 |
rito | -1.801 |
itous | -1.791 |
048 | -1.727 |
Token | partner |
Token ID | 5212 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
hua | +0.554 |
uces | +0.534 |
itous | +0.516 |
rito | +0.515 |
048 | +0.489 |
Neg logit contributions | |
oyal | -0.673 |
stown | -0.626 |
charging | -0.611 |
atically | -0.606 |
agy | -0.601 |
Token | for |
Token ID | 329 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
hua | +1.664 |
uces | +1.597 |
rito | +1.551 |
itous | +1.545 |
048 | +1.472 |
Neg logit contributions | |
oyal | -1.978 |
stown | -1.838 |
charging | -1.794 |
Gleaming | -1.792 |
atically | -1.787 |
Token | operations |
Token ID | 4560 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
oyal | +5.782 |
charging | +5.267 |
stown | +5.239 |
Armstrong | +5.156 |
atically | +5.143 |
Neg logit contributions | |
hua | -5.932 |
uces | -5.755 |
itous | -5.501 |
rito | -5.417 |
inguishable | -5.265 |
Token | . |
Token ID | 13 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
oyal | +1.714 |
stown | +1.583 |
charging | +1.557 |
atically | +1.552 |
Wolfe | +1.520 |
Neg logit contributions | |
hua | -1.544 |
uces | -1.504 |
rito | -1.442 |
itous | -1.438 |
048 | -1.366 |
Token | A |
Token ID | 317 |
Feature activation | -3.91e+00 |
Pos logit contributions | |
oyal | +1.297 |
stown | +1.189 |
charging | +1.159 |
atically | +1.153 |
Wolfe | +1.137 |
Neg logit contributions | |
hua | -1.479 |
uces | -1.442 |
rito | -1.395 |
itous | -1.392 |
048 | -1.331 |
Token | Soy |
Token ID | 30022 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
oyal | +2.792 |
stown | +2.607 |
charging | +2.540 |
atically | +2.531 |
Wolfe | +2.487 |
Neg logit contributions | |
hua | -2.708 |
uces | -2.640 |
rito | -2.539 |
itous | -2.527 |
048 | -2.421 |
Token | uz |
Token ID | 10277 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
oyal | +1.167 |
stown | +1.064 |
charging | +1.037 |
atically | +1.030 |
Wolfe | +1.009 |
Neg logit contributions | |
hua | -1.451 |
uces | -1.414 |
rito | -1.369 |
itous | -1.368 |
048 | -1.313 |
Token | carrying |
Token ID | 6872 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
oyal | +0.099 |
stown | +0.090 |
charging | +0.088 |
atically | +0.087 |
agy | +0.086 |
Neg logit contributions | |
hua | -0.118 |
uces | -0.116 |
rito | -0.112 |
itous | -0.111 |
048 | -0.107 |
Token | NASA |
Token ID | 8884 |
Feature activation | -7.47e+00 |
Pos logit contributions | |
oyal | +7.753 |
Armstrong | +7.631 |
stown | +7.421 |
atically | +7.240 |
charging | +7.207 |
Neg logit contributions | |
hua | -10.158 |
uces | -9.934 |
itous | -9.601 |
rito | -9.435 |
hyde | -9.129 |
Token | astronaut |
Token ID | 33779 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
oyal | +3.942 |
stown | +3.613 |
atically | +3.483 |
Armstrong | +3.449 |
charging | +3.394 |
Neg logit contributions | |
hua | -6.458 |
uces | -6.369 |
itous | -6.172 |
rito | -6.153 |
048 | -5.908 |
Token | Shane |
Token ID | 24379 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
oyal | +6.980 |
Armstrong | +6.683 |
atically | +6.477 |
stown | +6.477 |
charging | +6.436 |
Neg logit contributions | |
hua | -7.322 |
uces | -7.194 |
itous | -6.907 |
rito | -6.774 |
>>>>>>>> | -6.489 |
Token | Kim |
Token ID | 6502 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
oyal | +1.434 |
stown | +1.321 |
charging | +1.286 |
atically | +1.283 |
Wolfe | +1.272 |
Neg logit contributions | |
hua | -1.430 |
uces | -1.394 |
rito | -1.349 |
itous | -1.340 |
048 | -1.285 |
Token | b |
Token ID | 65 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
oyal | +2.613 |
stown | +2.406 |
charging | +2.345 |
atically | +2.329 |
Wolfe | +2.298 |
Neg logit contributions | |
hua | -2.602 |
uces | -2.561 |
itous | -2.459 |
rito | -2.451 |
048 | -2.353 |
Token | biological |
Token ID | 10685 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
oyal | +1.864 |
stown | +1.721 |
charging | +1.686 |
atically | +1.679 |
Wolfe | +1.648 |
Neg logit contributions | |
hua | -2.027 |
uces | -1.974 |
rito | -1.912 |
itous | -1.898 |
048 | -1.827 |
Token | angle |
Token ID | 9848 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
oyal | +0.992 |
stown | +0.909 |
charging | +0.886 |
atically | +0.882 |
Wolfe | +0.865 |
Neg logit contributions | |
hua | -1.143 |
uces | -1.112 |
rito | -1.077 |
itous | -1.072 |
048 | -1.029 |
Token | to |
Token ID | 284 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
hua | +0.917 |
uces | +0.887 |
rito | +0.852 |
itous | +0.850 |
048 | +0.806 |
Neg logit contributions | |
oyal | -1.108 |
stown | -1.027 |
charging | -1.003 |
atically | -0.993 |
Gleaming | -0.980 |
Token | argue |
Token ID | 7267 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
oyal | +1.380 |
stown | +1.256 |
charging | +1.223 |
atically | +1.216 |
Wolfe | +1.186 |
Neg logit contributions | |
hua | -1.721 |
uces | -1.675 |
rito | -1.625 |
itous | -1.620 |
048 | -1.556 |
Token | against |
Token ID | 1028 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
oyal | +1.361 |
stown | +1.258 |
atically | +1.230 |
charging | +1.229 |
Wolfe | +1.205 |
Neg logit contributions | |
hua | -1.393 |
uces | -1.346 |
rito | -1.308 |
itous | -1.299 |
048 | -1.245 |
Token | co |
Token ID | 763 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
oyal | +0.750 |
stown | +0.693 |
charging | +0.678 |
atically | +0.675 |
Wolfe | +0.663 |
Neg logit contributions | |
hua | -0.688 |
uces | -0.668 |
rito | -0.644 |
itous | -0.641 |
048 | -0.612 |
Token | - |
Token ID | 12 |
Feature activation | -9.04e+00 |
Pos logit contributions | |
oyal | +8.651 |
charging | +8.349 |
stown | +8.080 |
agy | +7.781 |
opers | +7.770 |
Neg logit contributions | |
hua | -8.833 |
rito | -8.587 |
uces | -8.569 |
itous | -8.385 |
inguishable | -8.260 |
Token | education |
Token ID | 40796 |
Feature activation | -5.33e-01 |
Pos logit contributions | |
oyal | +6.029 |
charging | +5.796 |
stown | +5.740 |
agy | +5.367 |
Wolfe | +5.332 |
Neg logit contributions | |
hua | -6.208 |
uces | -6.181 |
itous | -5.998 |
rito | -5.947 |
inguishable | -5.682 |
Token | when |
Token ID | 618 |
Feature activation | -3.65e+00 |
Pos logit contributions | |
oyal | +0.406 |
stown | +0.376 |
charging | +0.368 |
atically | +0.367 |
Wolfe | +0.360 |
Neg logit contributions | |
hua | -0.355 |
uces | -0.344 |
rito | -0.331 |
itous | -0.330 |
048 | -0.314 |
Token | he |
Token ID | 339 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
oyal | +2.507 |
stown | +2.312 |
charging | +2.268 |
atically | +2.245 |
Wolfe | +2.224 |
Neg logit contributions | |
hua | -2.663 |
uces | -2.610 |
rito | -2.517 |
itous | -2.501 |
048 | -2.401 |
Token | wrote |
Token ID | 2630 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
oyal | +0.778 |
stown | +0.702 |
charging | +0.685 |
atically | +0.677 |
agy | +0.662 |
Neg logit contributions | |
hua | -1.057 |
uces | -1.029 |
rito | -0.999 |
itous | -0.997 |
048 | -0.960 |
Token | Broad |
Token ID | 9765 |
Feature activation | +8.72e-01 |
Pos logit contributions | |
hua | +4.114 |
uces | +3.994 |
rito | +3.884 |
itous | +3.817 |
048 | +3.734 |
Neg logit contributions | |
oyal | -4.526 |
stown | -4.135 |
charging | -4.063 |
atically | -4.039 |
agy | -3.960 |
Token | City |
Token ID | 2254 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
hua | +0.526 |
uces | +0.507 |
rito | +0.485 |
itous | +0.482 |
048 | +0.457 |
Neg logit contributions | |
oyal | -0.722 |
stown | -0.666 |
charging | -0.657 |
atically | -0.654 |
agy | -0.643 |
Token | and |
Token ID | 290 |
Feature activation | -4.04e-01 |
Pos logit contributions | |
hua | +0.959 |
uces | +0.930 |
rito | +0.895 |
itous | +0.893 |
048 | +0.854 |
Neg logit contributions | |
oyal | -1.102 |
stown | -1.015 |
charging | -0.997 |
atically | -0.993 |
Wolfe | -0.971 |
Token | once |
Token ID | 1752 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
oyal | +0.297 |
stown | +0.275 |
charging | +0.269 |
atically | +0.267 |
Wolfe | +0.263 |
Neg logit contributions | |
hua | -0.279 |
uces | -0.271 |
rito | -0.261 |
itous | -0.260 |
048 | -0.248 |
Token | did |
Token ID | 750 |
Feature activation | +2.97e+00 |
Pos logit contributions | |
hua | +1.661 |
uces | +1.614 |
itous | +1.555 |
rito | +1.555 |
048 | +1.480 |
Neg logit contributions | |
oyal | -1.754 |
stown | -1.601 |
charging | -1.571 |
atically | -1.552 |
Gleaming | -1.533 |
Token | cart |
Token ID | 6383 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
hua | +2.054 |
uces | +2.001 |
rito | +1.941 |
itous | +1.931 |
048 | +1.842 |
Neg logit contributions | |
oyal | -2.137 |
stown | -1.982 |
charging | -1.927 |
atically | -1.923 |
Gleaming | -1.882 |
Token | whe |
Token ID | 12491 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
oyal | +8.215 |
agy | +7.330 |
charging | +7.305 |
atically | +7.212 |
stown | +7.175 |
Neg logit contributions | |
hua | -10.161 |
uces | -9.912 |
inguishable | -9.376 |
rito | -9.277 |
itous | -9.231 |
Token | els |
Token ID | 1424 |
Feature activation | -6.07e-01 |
Pos logit contributions | |
hua | +0.992 |
uces | +0.943 |
rito | +0.885 |
itous | +0.875 |
048 | +0.801 |
Neg logit contributions | |
oyal | -2.584 |
stown | -2.441 |
charging | -2.402 |
atically | -2.393 |
Wolfe | -2.365 |
Token | in |
Token ID | 287 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
oyal | +0.463 |
stown | +0.429 |
charging | +0.420 |
atically | +0.418 |
Wolfe | +0.411 |
Neg logit contributions | |
hua | -0.403 |
uces | -0.391 |
rito | -0.376 |
itous | -0.375 |
048 | -0.357 |
Token | a |
Token ID | 257 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
hua | +0.163 |
uces | +0.158 |
rito | +0.153 |
itous | +0.152 |
048 | +0.146 |
Neg logit contributions | |
oyal | -0.171 |
stown | -0.157 |
charging | -0.154 |
atically | -0.153 |
Wolfe | -0.150 |
Token | glitter |
Token ID | 31133 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
oyal | +1.401 |
stown | +1.298 |
charging | +1.271 |
atically | +1.263 |
Wolfe | +1.244 |
Neg logit contributions | |
hua | -1.309 |
uces | -1.273 |
rito | -1.223 |
itous | -1.219 |
048 | -1.163 |
Token | boy |
Token ID | 7081 |
Feature activation | +4.11e+00 |
Pos logit contributions | |
oyal | +1.581 |
stown | +1.424 |
atically | +1.363 |
charging | +1.341 |
Wolfe | +1.324 |
Neg logit contributions | |
hua | -2.779 |
uces | -2.735 |
itous | -2.646 |
rito | -2.643 |
inguishable | -2.548 |
Token | . |
Token ID | 13 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
hua | +2.595 |
uces | +2.505 |
rito | +2.398 |
itous | +2.395 |
liest | +2.288 |
Neg logit contributions | |
oyal | -3.229 |
charging | -2.942 |
stown | -2.939 |
atically | -2.923 |
agy | -2.842 |
Token |
|
Token ID | 198 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
hua | +1.681 |
uces | +1.631 |
rito | +1.575 |
itous | +1.567 |
048 | +1.498 |
Neg logit contributions | |
oyal | -1.701 |
stown | -1.565 |
charging | -1.529 |
atically | -1.522 |
Wolfe | -1.487 |
Token |
|
Token ID | 198 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
oyal | +1.228 |
stown | +1.127 |
charging | +1.100 |
atically | +1.095 |
Wolfe | +1.072 |
Neg logit contributions | |
hua | -1.331 |
uces | -1.294 |
rito | -1.251 |
itous | -1.247 |
048 | -1.195 |
Token | H |
Token ID | 39 |
Feature activation | -2.96e+00 |
Pos logit contributions | |
oyal | +1.095 |
stown | +1.017 |
charging | +0.997 |
atically | +0.992 |
Wolfe | +0.969 |
Neg logit contributions | |
hua | -0.928 |
uces | -0.905 |
rito | -0.868 |
itous | -0.868 |
048 | -0.821 |
Token | app |
Token ID | 1324 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
oyal | +2.127 |
stown | +1.946 |
atically | +1.911 |
charging | +1.901 |
agy | +1.867 |
Neg logit contributions | |
hua | -2.100 |
uces | -2.033 |
rito | -1.956 |
itous | -1.943 |
048 | -1.868 |
Token | conc |
Token ID | 1673 |
Feature activation | -8.06e+00 |
Pos logit contributions | |
oyal | +8.741 |
stown | +8.500 |
atically | +8.359 |
charging | +8.169 |
agy | +8.002 |
Neg logit contributions | |
hua | -8.740 |
uces | -8.358 |
rito | -8.346 |
itous | -8.122 |
hyde | -7.743 |
Token | urs |
Token ID | 1834 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
oyal | +5.753 |
stown | +5.345 |
charging | +5.203 |
atically | +5.149 |
agy | +5.052 |
Neg logit contributions | |
hua | -5.528 |
uces | -5.188 |
rito | -5.109 |
hyde | -4.980 |
itous | -4.963 |
Token | : |
Token ID | 25 |
Feature activation | -5.51e+00 |
Pos logit contributions | |
oyal | +3.529 |
stown | +3.268 |
atically | +3.239 |
Wolfe | +3.203 |
charging | +3.175 |
Neg logit contributions | |
hua | -3.469 |
uces | -3.374 |
rito | -3.259 |
itous | -3.254 |
048 | -3.084 |
Token | " |
Token ID | 366 |
Feature activation | -6.22e-01 |
Pos logit contributions | |
oyal | +3.953 |
stown | +3.691 |
atically | +3.625 |
Wolfe | +3.600 |
Others | +3.581 |
Neg logit contributions | |
hua | -3.765 |
uces | -3.648 |
rito | -3.533 |
itous | -3.498 |
048 | -3.359 |
Token | The |
Token ID | 464 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
oyal | +0.462 |
stown | +0.427 |
charging | +0.418 |
atically | +0.416 |
Wolfe | +0.408 |
Neg logit contributions | |
hua | -0.425 |
uces | -0.412 |
rito | -0.397 |
itous | -0.396 |
048 | -0.378 |
Token | a |
Token ID | 257 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
hua | +1.439 |
uces | +1.401 |
rito | +1.349 |
itous | +1.344 |
hi | +1.284 |
Neg logit contributions | |
oyal | -1.471 |
stown | -1.361 |
charging | -1.331 |
atically | -1.313 |
agy | -1.302 |
Token | player |
Token ID | 2137 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
oyal | +1.578 |
stown | +1.451 |
charging | +1.416 |
atically | +1.413 |
Wolfe | +1.388 |
Neg logit contributions | |
hua | -1.630 |
uces | -1.588 |
rito | -1.534 |
itous | -1.528 |
048 | -1.463 |
Token | on |
Token ID | 319 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
oyal | +2.963 |
stown | +2.757 |
atically | +2.664 |
charging | +2.657 |
Wolfe | +2.607 |
Neg logit contributions | |
hua | -2.871 |
uces | -2.838 |
rito | -2.703 |
itous | -2.697 |
048 | -2.576 |
Token | Twitter |
Token ID | 3009 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
oyal | +2.135 |
stown | +1.970 |
atically | +1.927 |
charging | +1.923 |
Wolfe | +1.896 |
Neg logit contributions | |
hua | -1.990 |
uces | -1.935 |
rito | -1.866 |
itous | -1.860 |
048 | -1.765 |
Token | or |
Token ID | 393 |
Feature activation | -6.18e+00 |
Pos logit contributions | |
oyal | +7.653 |
stown | +7.096 |
atically | +6.846 |
charging | +6.794 |
Wolfe | +6.584 |
Neg logit contributions | |
hua | -9.246 |
uces | -9.170 |
itous | -8.873 |
rito | -8.829 |
liest | -8.544 |
Token | Instagram |
Token ID | 10767 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
oyal | +3.737 |
stown | +3.422 |
atically | +3.338 |
charging | +3.284 |
Wolfe | +3.269 |
Neg logit contributions | |
hua | -4.897 |
uces | -4.814 |
rito | -4.648 |
itous | -4.643 |
048 | -4.485 |
Token | using |
Token ID | 1262 |
Feature activation | -6.28e+00 |
Pos logit contributions | |
oyal | +8.124 |
stown | +7.374 |
atically | +7.284 |
charging | +7.001 |
Armstrong | +6.906 |
Neg logit contributions | |
uces | -9.634 |
hua | -9.583 |
itous | -9.207 |
rito | -9.055 |
liest | -8.836 |
Token | the |
Token ID | 262 |
Feature activation | -5.79e+00 |
Pos logit contributions | |
oyal | +4.627 |
stown | +4.309 |
atically | +4.277 |
charging | +4.176 |
Wolfe | +4.170 |
Neg logit contributions | |
hua | -4.153 |
uces | -3.979 |
itous | -3.882 |
rito | -3.861 |
inguishable | -3.667 |
Token | hashtag |
Token ID | 23950 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
oyal | +4.292 |
stown | +3.963 |
atically | +3.914 |
charging | +3.843 |
Wolfe | +3.819 |
Neg logit contributions | |
hua | -3.863 |
uces | -3.769 |
rito | -3.622 |
itous | -3.588 |
048 | -3.408 |
Token | # |
Token ID | 1303 |
Feature activation | -5.02e+00 |
Pos logit contributions | |
oyal | +7.569 |
stown | +7.166 |
atically | +7.060 |
Armstrong | +6.950 |
Wolfe | +6.843 |
Neg logit contributions | |
hua | -6.866 |
uces | -6.656 |
itous | -6.457 |
rito | -6.390 |
inguishable | -6.076 |
Token | Ask |
Token ID | 25214 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
oyal | +4.075 |
stown | +3.776 |
charging | +3.721 |
atically | +3.690 |
agy | +3.638 |
Neg logit contributions | |
hua | -2.970 |
uces | -2.918 |
itous | -2.802 |
rito | -2.783 |
inguishable | -2.614 |
Token | 08 |
Token ID | 2919 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
oyal | +4.587 |
stown | +4.278 |
charging | +4.231 |
atically | +4.179 |
agy | +4.129 |
Neg logit contributions | |
hua | -2.763 |
uces | -2.643 |
rito | -2.572 |
itous | -2.558 |
inguishable | -2.379 |
Token | 45 |
Token ID | 2231 |
Feature activation | -4.23e+00 |
Pos logit contributions | |
hua | +1.490 |
uces | +1.409 |
rito | +1.346 |
itous | +1.327 |
048 | +1.316 |
Neg logit contributions | |
oyal | -2.638 |
stown | -2.466 |
atically | -2.456 |
charging | -2.439 |
Gleaming | -2.397 |
Token | 287 |
Token ID | 38721 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
oyal | +3.042 |
stown | +2.826 |
charging | +2.755 |
atically | +2.722 |
Wolfe | +2.717 |
Neg logit contributions | |
hua | -2.927 |
uces | -2.881 |
rito | -2.777 |
itous | -2.757 |
inguishable | -2.606 |
Token | 119 |
Token ID | 15136 |
Feature activation | -3.00e+00 |
Pos logit contributions | |
oyal | +1.807 |
stown | +1.679 |
charging | +1.638 |
atically | +1.623 |
Wolfe | +1.610 |
Neg logit contributions | |
hua | -1.673 |
uces | -1.638 |
rito | -1.574 |
itous | -1.569 |
inguishable | -1.481 |
Token | 8 |
Token ID | 23 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
oyal | +2.388 |
stown | +2.231 |
charging | +2.183 |
atically | +2.172 |
Wolfe | +2.153 |
Neg logit contributions | |
hua | -1.858 |
uces | -1.818 |
rito | -1.745 |
itous | -1.740 |
inguishable | -1.628 |
Token | ; |
Token ID | 26 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
oyal | +2.470 |
stown | +2.268 |
charging | +2.256 |
atically | +2.233 |
Wolfe | +2.217 |
Neg logit contributions | |
hua | -2.226 |
uces | -2.204 |
rito | -2.114 |
itous | -2.108 |
inguishable | -1.987 |
Token | adventure |
Token ID | 8855 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
oyal | +8.232 |
atically | +7.376 |
stown | +7.343 |
agy | +7.261 |
Armstrong | +7.147 |
Neg logit contributions | |
hua | -9.599 |
uces | -9.031 |
rito | -8.925 |
itous | -8.815 |
inguishable | -8.622 |
Token | company |
Token ID | 39722 |
Feature activation | -9.07e+00 |
Pos logit contributions | |
oyal | +7.999 |
stown | +7.450 |
charging | +7.388 |
atically | +6.986 |
opers | +6.802 |
Neg logit contributions | |
hua | -8.162 |
uces | -7.990 |
itous | -7.683 |
inguishable | -7.580 |
>>>>>>>> | -7.478 |
Token | . |
Token ID | 13 |
Feature activation | -6.94e+00 |
Pos logit contributions | |
oyal | +6.179 |
stown | +5.667 |
charging | +5.574 |
atically | +5.344 |
agy | +5.225 |
Neg logit contributions | |
hua | -6.293 |
uces | -6.113 |
itous | -6.050 |
rito | -5.806 |
inguishable | -5.740 |
Token | co |
Token ID | 1073 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
oyal | +4.117 |
stown | +3.679 |
charging | +3.636 |
atically | +3.495 |
agy | +3.360 |
Neg logit contributions | |
hua | -5.554 |
uces | -5.532 |
itous | -5.400 |
rito | -5.324 |
inguishable | -5.184 |
Token | . |
Token ID | 13 |
Feature activation | -7.18e+00 |
Pos logit contributions | |
oyal | +6.750 |
stown | +6.210 |
charging | +5.862 |
agy | +5.703 |
atically | +5.665 |
Neg logit contributions | |
uces | -7.309 |
hua | -7.236 |
rito | -6.936 |
inguishable | -6.903 |
itous | -6.889 |
Token | - |
Token ID | 12 |
Feature activation | +2.73e+00 |
Pos logit contributions | |
hua | +0.507 |
uces | +0.493 |
rito | +0.475 |
itous | +0.474 |
048 | +0.453 |
Neg logit contributions | |
oyal | -0.505 |
stown | -0.465 |
charging | -0.454 |
atically | -0.451 |
Wolfe | -0.443 |
Token | for |
Token ID | 1640 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
hua | +1.927 |
uces | +1.867 |
rito | +1.792 |
itous | +1.791 |
048 | +1.711 |
Neg logit contributions | |
oyal | -1.948 |
stown | -1.808 |
charging | -1.746 |
atically | -1.745 |
Wolfe | -1.727 |
Token | - |
Token ID | 12 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
hua | +1.937 |
uces | +1.873 |
rito | +1.790 |
itous | +1.786 |
liest | +1.691 |
Neg logit contributions | |
oyal | -2.612 |
stown | -2.441 |
charging | -2.374 |
atically | -2.364 |
Gleaming | -2.336 |
Token | something |
Token ID | 18927 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
hua | +1.543 |
uces | +1.493 |
rito | +1.450 |
itous | +1.437 |
048 | +1.378 |
Neg logit contributions | |
oyal | -1.445 |
stown | -1.333 |
atically | -1.297 |
Gleaming | -1.283 |
charging | -1.282 |
Token | was |
Token ID | 373 |
Feature activation | -3.47e+00 |
Pos logit contributions | |
oyal | +1.199 |
stown | +1.103 |
atically | +1.087 |
charging | +1.074 |
Wolfe | +1.063 |
Neg logit contributions | |
hua | -1.232 |
uces | -1.198 |
rito | -1.161 |
itous | -1.149 |
048 | -1.107 |
Token | co |
Token ID | 763 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
oyal | +2.434 |
stown | +2.250 |
atically | +2.207 |
charging | +2.187 |
Wolfe | +2.167 |
Neg logit contributions | |
hua | -2.494 |
uces | -2.437 |
rito | -2.342 |
itous | -2.331 |
048 | -2.234 |
Token | - |
Token ID | 12 |
Feature activation | -9.47e+00 |
Pos logit contributions | |
oyal | +9.484 |
atically | +8.691 |
charging | +8.627 |
stown | +8.606 |
agy | +8.523 |
Neg logit contributions | |
hua | -8.068 |
uces | -7.771 |
rito | -7.411 |
itous | -7.337 |
048 | -7.193 |
Token | opted |
Token ID | 45256 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
oyal | +5.632 |
stown | +5.216 |
charging | +5.156 |
atically | +5.111 |
agy | +4.885 |
Neg logit contributions | |
hua | -7.271 |
uces | -7.213 |
rito | -6.825 |
itous | -6.814 |
048 | -6.631 |
Token | into |
Token ID | 656 |
Feature activation | -2.19e+00 |
Pos logit contributions | |
hua | +2.120 |
uces | +2.023 |
itous | +1.958 |
rito | +1.942 |
048 | +1.828 |
Neg logit contributions | |
oyal | -3.151 |
stown | -2.927 |
charging | -2.873 |
Gleaming | -2.825 |
atically | -2.790 |
Token | the |
Token ID | 262 |
Feature activation | -6.70e-01 |
Pos logit contributions | |
oyal | +1.538 |
stown | +1.416 |
charging | +1.382 |
atically | +1.379 |
Wolfe | +1.362 |
Neg logit contributions | |
hua | -1.586 |
uces | -1.540 |
rito | -1.489 |
itous | -1.483 |
048 | -1.425 |
Token | belief |
Token ID | 4901 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
oyal | +0.490 |
stown | +0.452 |
charging | +0.442 |
atically | +0.440 |
Wolfe | +0.431 |
Neg logit contributions | |
hua | -0.467 |
uces | -0.453 |
rito | -0.437 |
itous | -0.436 |
048 | -0.416 |
Token | to |
Token ID | 284 |
Feature activation | -4.69e+00 |
Pos logit contributions | |
stown | +3.917 |
oyal | +3.849 |
charging | +3.601 |
Wolfe | +3.587 |
Armstrong | +3.584 |
Neg logit contributions | |
hua | -5.150 |
uces | -4.978 |
rito | -4.797 |
itous | -4.723 |
inguishable | -4.643 |
Token | be |
Token ID | 307 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
oyal | +3.671 |
stown | +3.451 |
atically | +3.380 |
charging | +3.357 |
Wolfe | +3.351 |
Neg logit contributions | |
hua | -2.915 |
uces | -2.781 |
rito | -2.729 |
itous | -2.701 |
048 | -2.559 |
Token | informed |
Token ID | 7981 |
Feature activation | -7.57e+00 |
Pos logit contributions | |
oyal | +1.027 |
stown | +0.936 |
atically | +0.908 |
charging | +0.899 |
Wolfe | +0.879 |
Neg logit contributions | |
hua | -1.761 |
uces | -1.729 |
rito | -1.682 |
itous | -1.673 |
048 | -1.629 |
Token | of |
Token ID | 286 |
Feature activation | -4.10e+00 |
Pos logit contributions | |
oyal | +4.353 |
stown | +4.201 |
Wolfe | +4.029 |
Armstrong | +3.990 |
atically | +3.941 |
Neg logit contributions | |
hua | -6.015 |
uces | -5.948 |
itous | -5.845 |
rito | -5.764 |
liest | -5.505 |
Token | important |
Token ID | 1593 |
Feature activation | -3.85e+00 |
Pos logit contributions | |
oyal | +2.769 |
stown | +2.555 |
charging | +2.522 |
atically | +2.464 |
Wolfe | +2.445 |
Neg logit contributions | |
hua | -3.060 |
uces | -3.004 |
rito | -2.908 |
itous | -2.857 |
048 | -2.750 |
Token | news |
Token ID | 1705 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
oyal | +2.805 |
stown | +2.629 |
charging | +2.559 |
Wolfe | +2.531 |
atically | +2.506 |
Neg logit contributions | |
hua | -2.631 |
uces | -2.580 |
rito | -2.481 |
itous | -2.453 |
048 | -2.341 |
Token | as |
Token ID | 355 |
Feature activation | -6.01e+00 |
Pos logit contributions | |
oyal | +8.139 |
stown | +7.566 |
atically | +7.444 |
Armstrong | +7.400 |
charging | +7.232 |
Neg logit contributions | |
hua | -9.245 |
uces | -9.002 |
rito | -8.775 |
itous | -8.746 |
inguishable | -8.621 |
Token | it |
Token ID | 340 |
Feature activation | -5.04e+00 |
Pos logit contributions | |
oyal | +3.889 |
stown | +3.580 |
charging | +3.525 |
Armstrong | +3.524 |
atically | +3.463 |
Neg logit contributions | |
hua | -4.507 |
uces | -4.453 |
itous | -4.223 |
rito | -4.197 |
048 | -4.132 |
Token | happens |
Token ID | 4325 |
Feature activation | -6.41e+00 |
Pos logit contributions | |
oyal | +2.340 |
stown | +2.175 |
atically | +2.133 |
Wolfe | +2.046 |
Armstrong | +2.036 |
Neg logit contributions | |
hua | -4.565 |
uces | -4.467 |
rito | -4.421 |
itous | -4.391 |
048 | -4.320 |
Token | in |
Token ID | 287 |
Feature activation | -5.60e+00 |
Pos logit contributions | |
oyal | +4.486 |
stown | +4.175 |
Wolfe | +4.031 |
Others | +4.020 |
charging | +4.004 |
Neg logit contributions | |
hua | -4.432 |
uces | -4.331 |
itous | -4.231 |
rito | -4.189 |
inguishable | -4.035 |
Token | Greater |
Token ID | 18169 |
Feature activation | -6.30e+00 |
Pos logit contributions | |
oyal | +3.053 |
stown | +2.748 |
Wolfe | +2.730 |
Armstrong | +2.684 |
charging | +2.663 |
Neg logit contributions | |
hua | -4.884 |
uces | -4.804 |
rito | -4.610 |
itous | -4.552 |
048 | -4.390 |
Token | can |
Token ID | 460 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
hua | +2.224 |
uces | +2.124 |
rito | +2.065 |
itous | +2.060 |
hi | +1.983 |
Neg logit contributions | |
oyal | -2.316 |
stown | -2.114 |
charging | -2.097 |
atically | -2.053 |
agy | -2.035 |
Token | tolerate |
Token ID | 21923 |
Feature activation | +2.07e+00 |
Pos logit contributions | |
hua | +1.317 |
uces | +1.267 |
rito | +1.239 |
itous | +1.231 |
048 | +1.179 |
Neg logit contributions | |
oyal | -1.385 |
stown | -1.276 |
charging | -1.252 |
atically | -1.236 |
Wolfe | -1.224 |
Token | . |
Token ID | 13 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
hua | +1.266 |
uces | +1.223 |
rito | +1.173 |
itous | +1.172 |
048 | +1.111 |
Neg logit contributions | |
oyal | -1.688 |
stown | -1.559 |
charging | -1.535 |
atically | -1.513 |
Gleaming | -1.496 |
Token | After |
Token ID | 2293 |
Feature activation | +6.00e+00 |
Pos logit contributions | |
oyal | +0.088 |
stown | +0.081 |
charging | +0.079 |
atically | +0.079 |
Wolfe | +0.077 |
Neg logit contributions | |
hua | -0.093 |
uces | -0.090 |
rito | -0.087 |
itous | -0.087 |
048 | -0.083 |
Token | the |
Token ID | 262 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
hua | +4.110 |
uces | +3.902 |
rito | +3.751 |
itous | +3.725 |
hi | +3.622 |
Neg logit contributions | |
oyal | -4.411 |
stown | -3.955 |
charging | -3.868 |
atically | -3.868 |
Gleaming | -3.819 |
Token | A |
Token ID | 317 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
hua | +0.215 |
uces | +0.207 |
rito | +0.201 |
itous | +0.200 |
048 | +0.193 |
Neg logit contributions | |
oyal | -0.194 |
stown | -0.177 |
charging | -0.174 |
atically | -0.172 |
agy | -0.168 |
Token | OG |
Token ID | 7730 |
Feature activation | +2.34e+00 |
Pos logit contributions | |
oyal | +6.944 |
stown | +6.109 |
agy | +5.820 |
atically | +5.801 |
Wolfe | +5.739 |
Neg logit contributions | |
hua | -10.333 |
uces | -10.100 |
itous | -9.950 |
048 | -9.565 |
liest | -9.563 |
Token | S |
Token ID | 50 |
Feature activation | +7.23e-01 |
Pos logit contributions | |
hua | +1.614 |
uces | +1.546 |
rito | +1.500 |
itous | +1.487 |
048 | +1.444 |
Neg logit contributions | |
oyal | -1.739 |
stown | -1.580 |
charging | -1.569 |
atically | -1.539 |
agy | -1.520 |
Token | - |
Token ID | 12 |
Feature activation | +4.24e+00 |
Pos logit contributions | |
hua | +0.512 |
uces | +0.495 |
rito | +0.478 |
itous | +0.476 |
048 | +0.457 |
Neg logit contributions | |
oyal | -0.523 |
stown | -0.479 |
charging | -0.472 |
atically | -0.467 |
agy | -0.458 |
Token | AG |
Token ID | 4760 |
Feature activation | +3.49e+00 |
Pos logit contributions | |
hua | +3.196 |
uces | +3.024 |
rito | +2.955 |
itous | +2.933 |
048 | +2.865 |
Neg logit contributions | |
oyal | -2.854 |
stown | -2.598 |
charging | -2.526 |
atically | -2.510 |
Wolfe | -2.485 |
Token | U |
Token ID | 52 |
Feature activation | +3.05e+00 |
Pos logit contributions | |
hua | +2.261 |
uces | +2.179 |
rito | +2.090 |
itous | +2.064 |
048 | +1.997 |
Neg logit contributions | |
oyal | -2.691 |
stown | -2.498 |
charging | -2.461 |
atically | -2.452 |
agy | -2.402 |
Token | GDP |
Token ID | 12396 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
oyal | +3.495 |
stown | +3.254 |
charging | +3.174 |
Wolfe | +3.155 |
atically | +3.152 |
Neg logit contributions | |
hua | -3.353 |
uces | -3.293 |
itous | -3.172 |
rito | -3.166 |
048 | -3.015 |
Token | for |
Token ID | 329 |
Feature activation | +1.92e-01 |
Pos logit contributions | |
oyal | +1.506 |
stown | +1.387 |
charging | +1.361 |
atically | +1.354 |
Wolfe | +1.328 |
Neg logit contributions | |
hua | -1.454 |
uces | -1.418 |
itous | -1.364 |
rito | -1.360 |
048 | -1.297 |
Token | the |
Token ID | 262 |
Feature activation | +6.95e-01 |
Pos logit contributions | |
hua | +0.132 |
uces | +0.128 |
rito | +0.124 |
itous | +0.123 |
048 | +0.117 |
Neg logit contributions | |
oyal | -0.142 |
stown | -0.131 |
charging | -0.128 |
atically | -0.128 |
Wolfe | -0.125 |
Token | state |
Token ID | 1181 |
Feature activation | +3.74e+00 |
Pos logit contributions | |
hua | +0.465 |
uces | +0.449 |
rito | +0.436 |
itous | +0.432 |
048 | +0.414 |
Neg logit contributions | |
oyal | -0.526 |
stown | -0.484 |
charging | -0.476 |
atically | -0.474 |
agy | -0.465 |
Token | of |
Token ID | 286 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
hua | +2.406 |
uces | +2.308 |
rito | +2.254 |
itous | +2.219 |
048 | +2.125 |
Neg logit contributions | |
oyal | -2.899 |
stown | -2.682 |
charging | -2.634 |
atically | -2.624 |
Gleaming | -2.621 |
Token | Co |
Token ID | 1766 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
hua | +0.694 |
uces | +0.671 |
rito | +0.648 |
itous | +0.645 |
048 | +0.619 |
Neg logit contributions | |
oyal | -0.780 |
stown | -0.717 |
charging | -0.703 |
atically | -0.701 |
agy | -0.688 |
Token | ahu |
Token ID | 12196 |
Feature activation | -2.78e+00 |
Pos logit contributions | |
oyal | +9.560 |
stown | +9.066 |
opers | +8.804 |
agy | +8.611 |
Others | +8.445 |
Neg logit contributions | |
hua | -7.503 |
uces | -7.448 |
048 | -7.188 |
itous | -7.083 |
rito | -6.976 |
Token | ila |
Token ID | 10102 |
Feature activation | -4.73e+00 |
Pos logit contributions | |
oyal | +2.213 |
stown | +2.055 |
charging | +2.022 |
atically | +1.999 |
Wolfe | +1.974 |
Neg logit contributions | |
hua | -1.732 |
uces | -1.701 |
itous | -1.623 |
rito | -1.623 |
048 | -1.550 |
Token | . |
Token ID | 13 |
Feature activation | -7.70e-01 |
Pos logit contributions | |
oyal | +3.378 |
stown | +3.150 |
charging | +3.055 |
atically | +3.012 |
Wolfe | +2.971 |
Neg logit contributions | |
hua | -3.243 |
uces | -3.206 |
itous | -3.093 |
rito | -3.027 |
048 | -2.918 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -9.40e-01 |
Pos logit contributions | |
oyal | +0.534 |
stown | +0.491 |
charging | +0.479 |
atically | +0.477 |
Wolfe | +0.468 |
Neg logit contributions | |
hua | -0.563 |
uces | -0.549 |
rito | -0.530 |
itous | -0.529 |
048 | -0.505 |
Token | If |
Token ID | 1532 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
oyal | +0.722 |
stown | +0.668 |
charging | +0.656 |
atically | +0.651 |
Wolfe | +0.637 |
Neg logit contributions | |
hua | -0.618 |
uces | -0.601 |
rito | -0.577 |
itous | -0.576 |
048 | -0.546 |
Token | ' |
Token ID | 6 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
hua | +1.248 |
uces | +1.169 |
itous | +1.117 |
rito | +1.108 |
048 | +1.094 |
Neg logit contributions | |
oyal | -2.155 |
stown | -1.998 |
charging | -1.972 |
atically | -1.969 |
agy | -1.946 |
Token | s |
Token ID | 82 |
Feature activation | -2.83e+00 |
Pos logit contributions | |
oyal | +1.650 |
stown | +1.519 |
charging | +1.477 |
atically | +1.470 |
Wolfe | +1.433 |
Neg logit contributions | |
hua | -1.908 |
uces | -1.863 |
rito | -1.801 |
itous | -1.795 |
048 | -1.715 |
Token | frame |
Token ID | 5739 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
oyal | +1.759 |
stown | +1.613 |
charging | +1.561 |
atically | +1.559 |
Wolfe | +1.524 |
Neg logit contributions | |
hua | -2.272 |
uces | -2.221 |
rito | -2.148 |
itous | -2.139 |
048 | -2.053 |
Token | | |
Token ID | 930 |
Feature activation | -4.17e+00 |
Pos logit contributions | |
hua | +0.709 |
uces | +0.676 |
rito | +0.652 |
itous | +0.646 |
048 | +0.639 |
Neg logit contributions | |
oyal | -0.871 |
stown | -0.795 |
charging | -0.782 |
atically | -0.779 |
agy | -0.773 |
Token | void |
Token ID | 7951 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
oyal | +2.319 |
stown | +2.125 |
charging | +2.028 |
atically | +2.021 |
Wolfe | +1.971 |
Neg logit contributions | |
hua | -3.603 |
uces | -3.505 |
rito | -3.409 |
itous | -3.405 |
liest | -3.252 |
Token | * |
Token ID | 1635 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
oyal | +1.215 |
stown | +1.111 |
charging | +1.083 |
atically | +1.076 |
agy | +1.059 |
Neg logit contributions | |
hua | -1.386 |
uces | -1.348 |
rito | -1.305 |
itous | -1.301 |
048 | -1.256 |
Token | arg |
Token ID | 853 |
Feature activation | -4.10e-01 |
Pos logit contributions | |
oyal | +3.824 |
charging | +3.380 |
stown | +3.092 |
atically | +2.964 |
abo | +2.880 |
Neg logit contributions | |
hua | -13.834 |
uces | -13.438 |
itous | -13.251 |
rito | -12.961 |
liest | -12.872 |
Token | | |
Token ID | 930 |
Feature activation | -4.26e+00 |
Pos logit contributions | |
oyal | +0.315 |
stown | +0.289 |
charging | +0.284 |
atically | +0.284 |
agy | +0.279 |
Neg logit contributions | |
hua | -0.271 |
uces | -0.262 |
rito | -0.252 |
itous | -0.251 |
048 | -0.244 |
Token | + |
Token ID | 1343 |
Feature activation | -3.67e+00 |
Pos logit contributions | |
oyal | +2.497 |
stown | +2.244 |
charging | +2.209 |
atically | +2.164 |
Wolfe | +2.120 |
Neg logit contributions | |
hua | -3.531 |
uces | -3.423 |
rito | -3.350 |
itous | -3.335 |
048 | -3.194 |
Token | -------------------- |
Token ID | 19351 |
Feature activation | -4.67e+00 |
Pos logit contributions | |
oyal | +1.973 |
stown | +1.769 |
charging | +1.711 |
atically | +1.690 |
Wolfe | +1.639 |
Neg logit contributions | |
hua | -3.250 |
uces | -3.188 |
rito | -3.098 |
itous | -3.083 |
048 | -2.964 |
Token | --+ |
Token ID | 44785 |
Feature activation | -4.76e+00 |
Pos logit contributions | |
oyal | +3.517 |
stown | +3.236 |
charging | +3.191 |
atically | +3.190 |
agy | +3.083 |
Neg logit contributions | |
hua | -3.115 |
uces | -3.011 |
rito | -2.920 |
itous | -2.885 |
inguishable | -2.742 |
Token | the |
Token ID | 262 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
oyal | +0.046 |
stown | +0.043 |
charging | +0.042 |
atically | +0.041 |
Wolfe | +0.040 |
Neg logit contributions | |
hua | -0.047 |
uces | -0.046 |
rito | -0.044 |
itous | -0.044 |
048 | -0.042 |
Token | players |
Token ID | 1938 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
hua | +1.502 |
uces | +1.464 |
itous | +1.406 |
rito | +1.405 |
048 | +1.347 |
Neg logit contributions | |
oyal | -1.539 |
stown | -1.418 |
charging | -1.390 |
atically | -1.382 |
agy | -1.365 |
Token | when |
Token ID | 618 |
Feature activation | -7.19e+00 |
Pos logit contributions | |
oyal | +1.168 |
stown | +1.078 |
charging | +1.053 |
atically | +1.053 |
Wolfe | +1.037 |
Neg logit contributions | |
hua | -1.126 |
uces | -1.093 |
rito | -1.058 |
itous | -1.050 |
048 | -1.003 |
Token | over |
Token ID | 625 |
Feature activation | -3.50e+00 |
Pos logit contributions | |
oyal | +4.470 |
stown | +4.183 |
charging | +4.114 |
Wolfe | +4.108 |
Armstrong | +4.072 |
Neg logit contributions | |
hua | -5.605 |
uces | -5.437 |
rito | -5.343 |
itous | -5.184 |
inguishable | -5.019 |
Token | the |
Token ID | 262 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
oyal | +2.451 |
stown | +2.290 |
charging | +2.261 |
atically | +2.182 |
Wolfe | +2.153 |
Neg logit contributions | |
hua | -2.523 |
uces | -2.452 |
itous | -2.381 |
rito | -2.380 |
inguishable | -2.249 |
Token | cap |
Token ID | 1451 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
oyal | +2.799 |
stown | +2.560 |
charging | +2.504 |
atically | +2.470 |
Wolfe | +2.439 |
Neg logit contributions | |
hua | -3.597 |
uces | -3.505 |
rito | -3.422 |
itous | -3.394 |
liest | -3.235 |
Token | , |
Token ID | 11 |
Feature activation | -7.08e+00 |
Pos logit contributions | |
oyal | +7.795 |
atically | +7.290 |
charging | +7.288 |
stown | +7.260 |
Wolfe | +7.180 |
Neg logit contributions | |
hua | -9.399 |
uces | -8.759 |
rito | -8.746 |
itous | -8.567 |
048 | -8.098 |
Token | functionally |
Token ID | 48410 |
Feature activation | -2.05e+00 |
Pos logit contributions | |
oyal | +4.915 |
stown | +4.460 |
atically | +4.422 |
charging | +4.397 |
Wolfe | +4.357 |
Neg logit contributions | |
hua | -5.126 |
uces | -4.901 |
itous | -4.749 |
rito | -4.724 |
048 | -4.463 |
Token | useless |
Token ID | 13894 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
oyal | +1.471 |
stown | +1.355 |
charging | +1.324 |
atically | +1.319 |
Wolfe | +1.293 |
Neg logit contributions | |
hua | -1.456 |
uces | -1.414 |
rito | -1.365 |
itous | -1.361 |
048 | -1.301 |
Token | . |
Token ID | 13 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
hua | +1.113 |
uces | +1.082 |
itous | +1.040 |
rito | +1.038 |
048 | +0.986 |
Neg logit contributions | |
oyal | -1.437 |
stown | -1.332 |
charging | -1.305 |
atically | -1.298 |
Gleaming | -1.281 |
Token |
|
Token ID | 198 |
Feature activation | -1.96e-01 |
Pos logit contributions | |
hua | +0.122 |
uces | +0.118 |
rito | +0.115 |
itous | +0.114 |
048 | +0.110 |
Neg logit contributions | |
oyal | -0.116 |
stown | -0.106 |
charging | -0.104 |
atically | -0.104 |
agy | -0.101 |
Token | for |
Token ID | 329 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
hua | +0.662 |
uces | +0.641 |
itous | +0.615 |
rito | +0.614 |
048 | +0.586 |
Neg logit contributions | |
oyal | -0.726 |
stown | -0.662 |
charging | -0.654 |
atically | -0.643 |
Gleaming | -0.640 |
Token | Mary |
Token ID | 5335 |
Feature activation | -2.82e+00 |
Pos logit contributions | |
hua | +2.768 |
uces | +2.676 |
itous | +2.567 |
rito | +2.555 |
048 | +2.455 |
Neg logit contributions | |
oyal | -3.005 |
stown | -2.734 |
charging | -2.705 |
atically | -2.655 |
agy | -2.641 |
Token | to |
Token ID | 284 |
Feature activation | -2.56e+00 |
Pos logit contributions | |
oyal | +2.066 |
stown | +1.912 |
atically | +1.861 |
charging | +1.853 |
Wolfe | +1.835 |
Neg logit contributions | |
hua | -1.933 |
uces | -1.888 |
rito | -1.813 |
itous | -1.807 |
048 | -1.726 |
Token | be |
Token ID | 307 |
Feature activation | -3.09e+00 |
Pos logit contributions | |
oyal | +1.746 |
stown | +1.610 |
atically | +1.562 |
charging | +1.551 |
Wolfe | +1.531 |
Neg logit contributions | |
hua | -1.896 |
uces | -1.857 |
rito | -1.789 |
itous | -1.775 |
048 | -1.702 |
Token | named |
Token ID | 3706 |
Feature activation | -5.95e-01 |
Pos logit contributions | |
oyal | +2.093 |
stown | +1.934 |
atically | +1.881 |
charging | +1.866 |
Wolfe | +1.845 |
Neg logit contributions | |
hua | -2.290 |
uces | -2.243 |
rito | -2.167 |
itous | -2.159 |
048 | -2.064 |
Token | Co |
Token ID | 1766 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
oyal | +0.439 |
stown | +0.406 |
charging | +0.397 |
atically | +0.395 |
Wolfe | +0.388 |
Neg logit contributions | |
hua | -0.409 |
uces | -0.397 |
rito | -0.383 |
itous | -0.382 |
048 | -0.364 |
Token | - |
Token ID | 12 |
Feature activation | -7.56e+00 |
Pos logit contributions | |
oyal | +9.104 |
stown | +8.644 |
opers | +8.102 |
agy | +8.042 |
atically | +7.983 |
Neg logit contributions | |
hua | -7.789 |
uces | -7.602 |
048 | -7.552 |
itous | -7.367 |
rito | -7.307 |
Token | Red |
Token ID | 7738 |
Feature activation | +4.59e+00 |
Pos logit contributions | |
oyal | +6.013 |
stown | +5.766 |
charging | +5.555 |
atically | +5.428 |
Wolfe | +5.347 |
Neg logit contributions | |
uces | -4.443 |
hua | -4.397 |
itous | -4.204 |
rito | -4.099 |
048 | -3.921 |
Token | empt |
Token ID | 1791 |
Feature activation | +4.23e+00 |
Pos logit contributions | |
hua | +2.929 |
uces | +2.879 |
rito | +2.699 |
itous | +2.678 |
hi | +2.568 |
Neg logit contributions | |
oyal | -3.544 |
stown | -3.323 |
charging | -3.274 |
Gleaming | -3.255 |
agy | -3.244 |
Token | rix |
Token ID | 8609 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
hua | +2.730 |
uces | +2.651 |
rito | +2.595 |
itous | +2.559 |
hi | +2.440 |
Neg logit contributions | |
oyal | -3.210 |
stown | -3.043 |
atically | -3.007 |
charging | -2.942 |
Gleaming | -2.927 |
Token | , |
Token ID | 11 |
Feature activation | -4.44e+00 |
Pos logit contributions | |
hua | +1.127 |
uces | +1.093 |
rito | +1.047 |
itous | +1.046 |
048 | +0.996 |
Neg logit contributions | |
oyal | -1.344 |
stown | -1.242 |
charging | -1.227 |
atically | -1.214 |
agy | -1.197 |
Token | . |
Token ID | 13 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
oyal | +1.811 |
stown | +1.686 |
charging | +1.646 |
atically | +1.639 |
Wolfe | +1.612 |
Neg logit contributions | |
hua | -1.503 |
uces | -1.465 |
rito | -1.405 |
itous | -1.399 |
048 | -1.323 |
Token | x |
Token ID | 87 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
oyal | +1.128 |
stown | +1.042 |
charging | +1.019 |
atically | +1.014 |
Wolfe | +0.995 |
Neg logit contributions | |
hua | -1.065 |
uces | -1.035 |
rito | -0.997 |
itous | -0.994 |
048 | -0.948 |
Token | . |
Token ID | 13 |
Feature activation | -3.97e-01 |
Pos logit contributions | |
hua | +0.643 |
uces | +0.606 |
itous | +0.586 |
rito | +0.584 |
048 | +0.567 |
Neg logit contributions | |
oyal | -0.911 |
stown | -0.841 |
charging | -0.831 |
atically | -0.828 |
Gleaming | -0.819 |
Token | x |
Token ID | 87 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
oyal | +0.299 |
stown | +0.276 |
charging | +0.270 |
atically | +0.269 |
Wolfe | +0.265 |
Neg logit contributions | |
hua | -0.269 |
uces | -0.258 |
rito | -0.249 |
itous | -0.249 |
048 | -0.238 |
Token | . |
Token ID | 13 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
hua | +1.749 |
uces | +1.605 |
itous | +1.563 |
rito | +1.549 |
048 | +1.544 |
Neg logit contributions | |
oyal | -2.735 |
stown | -2.529 |
atically | -2.508 |
charging | -2.495 |
Gleaming | -2.493 |
Token | 174 |
Token ID | 22985 |
Feature activation | +9.88e+00 |
Pos logit contributions | |
oyal | +0.178 |
stown | +0.169 |
atically | +0.164 |
charging | +0.163 |
Wolfe | +0.163 |
Neg logit contributions | |
hua | -0.099 |
uces | -0.094 |
itous | -0.089 |
rito | -0.089 |
048 | -0.085 |
Token | 107 |
Token ID | 16226 |
Feature activation | +6.03e+00 |
Pos logit contributions | |
hua | +4.680 |
uces | +4.186 |
hi | +4.069 |
048 | +4.060 |
liest | +3.989 |
Neg logit contributions | |
oyal | -9.036 |
charging | -8.145 |
stown | -8.085 |
atically | -8.043 |
agy | -8.014 |
Token | 20 |
Token ID | 1238 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
hua | +2.777 |
uces | +2.536 |
048 | +2.525 |
rito | +2.405 |
itous | +2.371 |
Neg logit contributions | |
oyal | -5.741 |
atically | -5.317 |
charging | -5.303 |
stown | -5.289 |
agy | -5.218 |
Token | 40 |
Token ID | 1821 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
oyal | +1.402 |
stown | +1.314 |
charging | +1.287 |
atically | +1.278 |
Wolfe | +1.262 |
Neg logit contributions | |
hua | -0.915 |
uces | -0.889 |
itous | -0.848 |
rito | -0.847 |
inguishable | -0.788 |
Token | x |
Token ID | 2124 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
oyal | +0.761 |
stown | +0.698 |
charging | +0.684 |
atically | +0.681 |
agy | +0.666 |
Neg logit contributions | |
hua | -0.746 |
uces | -0.723 |
rito | -0.697 |
itous | -0.695 |
048 | -0.667 |
Token | . |
Token ID | 13 |
Feature activation | -7.84e-01 |
Pos logit contributions | |
oyal | +1.497 |
stown | +1.392 |
charging | +1.362 |
atically | +1.356 |
Wolfe | +1.333 |
Neg logit contributions | |
hua | -1.220 |
uces | -1.184 |
rito | -1.137 |
itous | -1.133 |
048 | -1.074 |
Token | male |
Token ID | 4257 |
Feature activation | +6.70e+00 |
Pos logit contributions | |
hua | +1.406 |
uces | +1.367 |
itous | +1.318 |
rito | +1.312 |
048 | +1.250 |
Neg logit contributions | |
oyal | -1.794 |
stown | -1.641 |
charging | -1.617 |
atically | -1.606 |
agy | -1.576 |
Token | pedoph |
Token ID | 27706 |
Feature activation | +6.31e+00 |
Pos logit contributions | |
hua | +4.100 |
uces | +4.036 |
itous | +3.898 |
rito | +3.853 |
liest | +3.724 |
Neg logit contributions | |
oyal | -5.290 |
stown | -4.701 |
charging | -4.694 |
atically | -4.650 |
Gleaming | -4.603 |
Token | ile |
Token ID | 576 |
Feature activation | +5.20e+00 |
Pos logit contributions | |
uces | +1.545 |
hua | +1.503 |
rito | +1.402 |
itous | +1.371 |
hi | +1.124 |
Neg logit contributions | |
oyal | -7.275 |
stown | -6.968 |
charging | -6.819 |
Gleaming | -6.797 |
atically | -6.734 |
Token | is |
Token ID | 318 |
Feature activation | +5.24e+00 |
Pos logit contributions | |
hua | +3.227 |
uces | +3.175 |
itous | +3.063 |
rito | +3.043 |
liest | +2.964 |
Neg logit contributions | |
oyal | -4.154 |
stown | -3.711 |
charging | -3.668 |
Gleaming | -3.597 |
atically | -3.578 |
Token | not |
Token ID | 407 |
Feature activation | +5.11e+00 |
Pos logit contributions | |
hua | +3.424 |
uces | +3.323 |
rito | +3.195 |
itous | +3.157 |
048 | +3.101 |
Neg logit contributions | |
oyal | -4.000 |
stown | -3.580 |
charging | -3.484 |
Gleaming | -3.465 |
atically | -3.436 |
Token | gay |
Token ID | 5650 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
hua | +3.310 |
uces | +3.177 |
rito | +3.055 |
itous | +3.049 |
liest | +2.943 |
Neg logit contributions | |
oyal | -3.950 |
stown | -3.579 |
charging | -3.477 |
agy | -3.452 |
atically | -3.420 |
Token | . |
Token ID | 13 |
Feature activation | +2.90e+00 |
Pos logit contributions | |
hua | +5.571 |
uces | +5.190 |
itous | +5.141 |
rito | +5.065 |
liest | +5.010 |
Neg logit contributions | |
oyal | -8.456 |
Gleaming | -7.690 |
charging | -7.645 |
stown | -7.621 |
CLOSE | -7.466 |
Token | In |
Token ID | 554 |
Feature activation | +2.92e-01 |
Pos logit contributions | |
hua | +2.048 |
uces | +1.956 |
itous | +1.895 |
rito | +1.889 |
048 | +1.837 |
Neg logit contributions | |
oyal | -2.096 |
stown | -1.903 |
charging | -1.882 |
atically | -1.862 |
agy | -1.815 |
Token | this |
Token ID | 428 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
hua | +0.206 |
uces | +0.199 |
rito | +0.192 |
itous | +0.192 |
048 | +0.183 |
Neg logit contributions | |
oyal | -0.212 |
stown | -0.195 |
charging | -0.190 |
atically | -0.189 |
Wolfe | -0.185 |
Token | context |
Token ID | 4732 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
oyal | +0.746 |
stown | +0.681 |
charging | +0.662 |
atically | +0.659 |
Wolfe | +0.646 |
Neg logit contributions | |
hua | -0.938 |
uces | -0.915 |
rito | -0.886 |
itous | -0.883 |
048 | -0.849 |
Token | , |
Token ID | 11 |
Feature activation | +3.36e+00 |
Pos logit contributions | |
oyal | +0.093 |
stown | +0.086 |
charging | +0.085 |
atically | +0.084 |
Wolfe | +0.083 |
Neg logit contributions | |
hua | -0.085 |
uces | -0.083 |
rito | -0.080 |
itous | -0.079 |
048 | -0.076 |
Token | / |
Token ID | 14 |
Feature activation | -4.55e-01 |
Pos logit contributions | |
hua | +2.132 |
uces | +1.900 |
hi | +1.837 |
rito | +1.833 |
itous | +1.827 |
Neg logit contributions | |
oyal | -4.318 |
atically | -3.961 |
stown | -3.954 |
Gleaming | -3.927 |
charging | -3.927 |
Token | 226 |
Token ID | 24909 |
Feature activation | -3.70e+00 |
Pos logit contributions | |
oyal | +0.354 |
stown | +0.329 |
charging | +0.322 |
atically | +0.320 |
Wolfe | +0.315 |
Neg logit contributions | |
hua | -0.295 |
uces | -0.286 |
rito | -0.275 |
itous | -0.274 |
048 | -0.261 |
Token | 4 |
Token ID | 604 |
Feature activation | -8.20e-01 |
Pos logit contributions | |
oyal | +2.396 |
stown | +2.214 |
charging | +2.156 |
atically | +2.123 |
Wolfe | +2.100 |
Neg logit contributions | |
hua | -2.865 |
uces | -2.789 |
rito | -2.690 |
itous | -2.681 |
048 | -2.565 |
Token | * |
Token ID | 9 |
Feature activation | -4.70e+00 |
Pos logit contributions | |
oyal | +0.591 |
stown | +0.543 |
charging | +0.531 |
atically | +0.528 |
Wolfe | +0.519 |
Neg logit contributions | |
hua | -0.581 |
uces | -0.560 |
rito | -0.543 |
itous | -0.541 |
048 | -0.523 |
Token | 0 |
Token ID | 657 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
oyal | +2.712 |
charging | +2.362 |
atically | +2.349 |
stown | +2.345 |
Wolfe | +2.283 |
Neg logit contributions | |
hua | -3.939 |
uces | -3.816 |
rito | -3.722 |
itous | -3.702 |
liest | -3.589 |
Token | . |
Token ID | 13 |
Feature activation | +9.94e+00 |
Pos logit contributions | |
oyal | +1.084 |
stown | +1.005 |
charging | +0.986 |
atically | +0.983 |
Wolfe | +0.965 |
Neg logit contributions | |
hua | -0.843 |
uces | -0.811 |
rito | -0.781 |
itous | -0.779 |
048 | -0.742 |
Token | 9 |
Token ID | 24 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
hua | +4.442 |
048 | +4.001 |
uces | +3.940 |
rito | +3.837 |
itous | +3.726 |
Neg logit contributions | |
oyal | -9.084 |
Gleaming | -8.652 |
charging | -8.606 |
stown | -8.514 |
Wolfe | -8.488 |
Token | 242 |
Token ID | 27877 |
Feature activation | -4.91e+00 |
Pos logit contributions | |
oyal | +0.086 |
stown | +0.079 |
charging | +0.078 |
atically | +0.077 |
Wolfe | +0.076 |
Neg logit contributions | |
hua | -0.075 |
uces | -0.072 |
rito | -0.070 |
itous | -0.070 |
048 | -0.066 |
Token | 4 |
Token ID | 604 |
Feature activation | +6.50e-02 |
Pos logit contributions | |
oyal | +2.950 |
stown | +2.639 |
charging | +2.595 |
agy | +2.558 |
atically | +2.558 |
Neg logit contributions | |
hua | -4.080 |
uces | -3.904 |
rito | -3.779 |
itous | -3.742 |
048 | -3.649 |
Token | * |
Token ID | 9 |
Feature activation | -3.52e+00 |
Pos logit contributions | |
hua | +0.045 |
uces | +0.043 |
rito | +0.042 |
itous | +0.042 |
048 | +0.041 |
Neg logit contributions | |
oyal | -0.048 |
stown | -0.044 |
charging | -0.043 |
atically | -0.043 |
Wolfe | -0.042 |
Token | 4 |
Token ID | 604 |
Feature activation | +6.59e-01 |
Pos logit contributions | |
oyal | +2.288 |
stown | +2.109 |
charging | +2.048 |
atically | +2.034 |
Wolfe | +2.004 |
Neg logit contributions | |
hua | -2.713 |
uces | -2.648 |
rito | -2.570 |
itous | -2.552 |
048 | -2.425 |
Token | you |
Token ID | 345 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
hua | +1.999 |
uces | +1.921 |
rito | +1.859 |
itous | +1.846 |
hi | +1.775 |
Neg logit contributions | |
oyal | -2.467 |
stown | -2.253 |
charging | -2.201 |
atically | -2.188 |
agy | -2.163 |
Token | think |
Token ID | 892 |
Feature activation | -5.19e+00 |
Pos logit contributions | |
hua | +1.316 |
uces | +1.261 |
rito | +1.241 |
itous | +1.230 |
048 | +1.186 |
Neg logit contributions | |
oyal | -1.249 |
stown | -1.142 |
charging | -1.119 |
atically | -1.083 |
agy | -1.072 |
Token | of |
Token ID | 286 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
oyal | +3.335 |
stown | +3.129 |
atically | +3.064 |
Wolfe | +3.010 |
charging | +2.996 |
Neg logit contributions | |
hua | -3.930 |
uces | -3.823 |
itous | -3.697 |
rito | -3.679 |
048 | -3.547 |
Token | characters |
Token ID | 3435 |
Feature activation | +4.99e-01 |
Pos logit contributions | |
oyal | +1.008 |
stown | +0.936 |
charging | +0.916 |
atically | +0.913 |
Wolfe | +0.899 |
Neg logit contributions | |
hua | -0.968 |
uces | -0.940 |
rito | -0.905 |
itous | -0.905 |
048 | -0.862 |
Token | for |
Token ID | 329 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
hua | +0.329 |
uces | +0.318 |
rito | +0.306 |
itous | +0.305 |
048 | +0.291 |
Neg logit contributions | |
oyal | -0.383 |
stown | -0.355 |
charging | -0.347 |
atically | -0.345 |
Wolfe | -0.339 |
Token | Dick |
Token ID | 11740 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
hua | +1.844 |
uces | +1.790 |
rito | +1.731 |
itous | +1.716 |
048 | +1.645 |
Neg logit contributions | |
oyal | -2.000 |
stown | -1.843 |
charging | -1.799 |
atically | -1.795 |
agy | -1.766 |
Token | Grayson |
Token ID | 42657 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
hua | +4.024 |
uces | +3.786 |
rito | +3.597 |
liest | +3.576 |
itous | +3.505 |
Neg logit contributions | |
oyal | -9.835 |
charging | -9.009 |
stown | -8.984 |
agy | -8.894 |
Gleaming | -8.881 |
Token | to |
Token ID | 284 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
hua | +2.528 |
uces | +2.427 |
rito | +2.336 |
itous | +2.335 |
048 | +2.235 |
Neg logit contributions | |
oyal | -3.214 |
stown | -2.968 |
charging | -2.904 |
atically | -2.883 |
agy | -2.856 |
Token | fight |
Token ID | 1907 |
Feature activation | +4.37e+00 |
Pos logit contributions | |
hua | +0.894 |
uces | +0.865 |
rito | +0.840 |
itous | +0.835 |
048 | +0.805 |
Neg logit contributions | |
oyal | -0.866 |
stown | -0.795 |
charging | -0.779 |
atically | -0.762 |
Gleaming | -0.756 |
Token | , |
Token ID | 11 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
hua | +2.697 |
uces | +2.582 |
itous | +2.476 |
rito | +2.472 |
hi | +2.377 |
Neg logit contributions | |
oyal | -3.522 |
stown | -3.219 |
charging | -3.157 |
agy | -3.103 |
Gleaming | -3.098 |
Token | Mid |
Token ID | 7215 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
oyal | +1.544 |
stown | +1.429 |
charging | +1.401 |
atically | +1.395 |
Wolfe | +1.377 |
Neg logit contributions | |
hua | -1.512 |
uces | -1.471 |
rito | -1.415 |
itous | -1.413 |
048 | -1.349 |
Token | the |
Token ID | 262 |
Feature activation | -7.96e-01 |
Pos logit contributions | |
hua | +2.312 |
uces | +2.255 |
rito | +2.158 |
itous | +2.156 |
liest | +2.081 |
Neg logit contributions | |
oyal | -2.546 |
stown | -2.308 |
atically | -2.274 |
charging | -2.269 |
agy | -2.237 |
Token | producers |
Token ID | 11408 |
Feature activation | +2.52e+00 |
Pos logit contributions | |
oyal | +0.562 |
stown | +0.517 |
charging | +0.505 |
atically | +0.503 |
Wolfe | +0.492 |
Neg logit contributions | |
hua | -0.574 |
uces | -0.558 |
rito | -0.539 |
itous | -0.537 |
048 | -0.514 |
Token | of |
Token ID | 286 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
hua | +1.746 |
uces | +1.703 |
rito | +1.674 |
itous | +1.642 |
hi | +1.584 |
Neg logit contributions | |
oyal | -1.816 |
stown | -1.665 |
charging | -1.611 |
atically | -1.599 |
agy | -1.593 |
Token | what |
Token ID | 644 |
Feature activation | -9.58e-01 |
Pos logit contributions | |
oyal | +1.460 |
stown | +1.355 |
charging | +1.325 |
atically | +1.318 |
Wolfe | +1.300 |
Neg logit contributions | |
hua | -1.322 |
uces | -1.278 |
itous | -1.233 |
rito | -1.230 |
048 | -1.174 |
Token | that |
Token ID | 326 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
oyal | +0.659 |
stown | +0.605 |
charging | +0.591 |
atically | +0.588 |
Wolfe | +0.576 |
Neg logit contributions | |
hua | -0.707 |
uces | -0.688 |
rito | -0.665 |
itous | -0.663 |
048 | -0.635 |
Token | beef |
Token ID | 12023 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
oyal | +0.836 |
stown | +0.779 |
charging | +0.762 |
atically | +0.759 |
Wolfe | +0.748 |
Neg logit contributions | |
hua | -0.677 |
uces | -0.654 |
rito | -0.630 |
itous | -0.628 |
048 | -0.597 |
Token | are |
Token ID | 389 |
Feature activation | +3.19e+00 |
Pos logit contributions | |
hua | +6.069 |
uces | +6.067 |
rito | +5.859 |
hi | +5.571 |
liest | +5.501 |
Neg logit contributions | |
oyal | -8.003 |
Gleaming | -7.185 |
stown | -7.155 |
charging | -7.122 |
atically | -7.088 |
Token | being |
Token ID | 852 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
hua | +2.129 |
uces | +2.064 |
rito | +1.994 |
itous | +1.972 |
liest | +1.901 |
Neg logit contributions | |
oyal | -2.394 |
stown | -2.191 |
Gleaming | -2.103 |
atically | -2.102 |
agy | -2.093 |
Token | paid |
Token ID | 3432 |
Feature activation | +6.01e+00 |
Pos logit contributions | |
hua | +0.886 |
uces | +0.861 |
rito | +0.827 |
itous | +0.825 |
048 | +0.788 |
Neg logit contributions | |
oyal | -1.002 |
stown | -0.920 |
charging | -0.897 |
atically | -0.897 |
Gleaming | -0.882 |
Token | and |
Token ID | 290 |
Feature activation | -2.97e+00 |
Pos logit contributions | |
hua | +3.290 |
uces | +3.222 |
rito | +3.056 |
itous | +3.052 |
liest | +2.967 |
Neg logit contributions | |
oyal | -5.066 |
stown | -4.634 |
Gleaming | -4.587 |
agy | -4.545 |
atically | -4.511 |
Token | what |
Token ID | 644 |
Feature activation | -2.91e+00 |
Pos logit contributions | |
oyal | +2.082 |
stown | +1.923 |
charging | +1.889 |
atically | +1.874 |
Wolfe | +1.842 |
Neg logit contributions | |
hua | -2.140 |
uces | -2.081 |
rito | -2.008 |
itous | -2.002 |
048 | -1.911 |
Token | mathematical |
Token ID | 18069 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
hua | +1.757 |
uces | +1.700 |
rito | +1.650 |
itous | +1.630 |
hi | +1.573 |
Neg logit contributions | |
oyal | -1.783 |
stown | -1.631 |
charging | -1.584 |
agy | -1.558 |
atically | -1.550 |
Token | reasoning |
Token ID | 14607 |
Feature activation | -8.17e-01 |
Pos logit contributions | |
oyal | +0.395 |
stown | +0.361 |
charging | +0.353 |
atically | +0.349 |
agy | +0.343 |
Neg logit contributions | |
hua | -0.427 |
uces | -0.416 |
itous | -0.401 |
rito | -0.401 |
048 | -0.384 |
Token | and |
Token ID | 290 |
Feature activation | +5.20e-01 |
Pos logit contributions | |
oyal | +0.628 |
stown | +0.582 |
charging | +0.570 |
atically | +0.566 |
Wolfe | +0.557 |
Neg logit contributions | |
hua | -0.539 |
uces | -0.522 |
rito | -0.502 |
itous | -0.501 |
048 | -0.477 |
Token | logic |
Token ID | 9156 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
hua | +0.370 |
uces | +0.359 |
rito | +0.347 |
itous | +0.346 |
048 | +0.331 |
Neg logit contributions | |
oyal | -0.372 |
stown | -0.343 |
charging | -0.335 |
atically | -0.330 |
agy | -0.327 |
Token | to |
Token ID | 284 |
Feature activation | +8.53e-01 |
Pos logit contributions | |
hua | +0.825 |
uces | +0.797 |
itous | +0.765 |
rito | +0.762 |
048 | +0.725 |
Neg logit contributions | |
oyal | -1.018 |
stown | -0.947 |
charging | -0.925 |
atically | -0.908 |
Gleaming | -0.906 |
Token | a |
Token ID | 257 |
Feature activation | +3.22e+00 |
Pos logit contributions | |
hua | +0.609 |
uces | +0.590 |
rito | +0.571 |
itous | +0.567 |
048 | +0.544 |
Neg logit contributions | |
oyal | -0.609 |
stown | -0.560 |
charging | -0.548 |
atically | -0.541 |
agy | -0.533 |
Token | greater |
Token ID | 3744 |
Feature activation | +3.30e+00 |
Pos logit contributions | |
hua | +2.103 |
uces | +1.993 |
itous | +1.966 |
rito | +1.948 |
hi | +1.862 |
Neg logit contributions | |
oyal | -2.497 |
stown | -2.280 |
atically | -2.225 |
charging | -2.224 |
agy | -2.180 |
Token | degree |
Token ID | 4922 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
hua | +2.064 |
uces | +1.937 |
itous | +1.909 |
rito | +1.906 |
hi | +1.797 |
Neg logit contributions | |
oyal | -2.661 |
stown | -2.454 |
charging | -2.403 |
atically | -2.394 |
Gleaming | -2.354 |
Token | than |
Token ID | 621 |
Feature activation | +8.92e-01 |
Pos logit contributions | |
hua | +1.990 |
uces | +1.899 |
rito | +1.846 |
itous | +1.832 |
048 | +1.730 |
Neg logit contributions | |
oyal | -2.647 |
stown | -2.460 |
charging | -2.405 |
Gleaming | -2.369 |
atically | -2.365 |
Token | human |
Token ID | 1692 |
Feature activation | +3.36e+00 |
Pos logit contributions | |
hua | +0.625 |
uces | +0.606 |
rito | +0.583 |
itous | +0.580 |
048 | +0.557 |
Neg logit contributions | |
oyal | -0.653 |
stown | -0.598 |
charging | -0.585 |
atically | -0.581 |
agy | -0.570 |
Token | toddlers |
Token ID | 50142 |
Feature activation | +4.44e+00 |
Pos logit contributions | |
hua | +2.253 |
uces | +2.202 |
itous | +2.110 |
rito | +2.083 |
liest | +2.026 |
Neg logit contributions | |
oyal | -2.531 |
stown | -2.295 |
charging | -2.284 |
Gleaming | -2.249 |
atically | -2.221 |
Token | assessments |
Token ID | 21837 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
hua | +0.675 |
uces | +0.655 |
itous | +0.635 |
rito | +0.632 |
048 | +0.603 |
Neg logit contributions | |
oyal | -0.683 |
stown | -0.624 |
charging | -0.612 |
atically | -0.610 |
Wolfe | -0.600 |
Token | of |
Token ID | 286 |
Feature activation | +7.61e-01 |
Pos logit contributions | |
hua | +1.107 |
uces | +1.060 |
itous | +1.030 |
rito | +1.028 |
048 | +0.974 |
Neg logit contributions | |
oyal | -1.288 |
stown | -1.193 |
charging | -1.162 |
atically | -1.158 |
Gleaming | -1.145 |
Token | foreign |
Token ID | 3215 |
Feature activation | +3.95e+00 |
Pos logit contributions | |
hua | +0.525 |
uces | +0.509 |
itous | +0.491 |
rito | +0.491 |
048 | +0.468 |
Neg logit contributions | |
oyal | -0.561 |
stown | -0.517 |
charging | -0.505 |
atically | -0.503 |
agy | -0.494 |
Token | officials |
Token ID | 2828 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
hua | +2.461 |
uces | +2.341 |
itous | +2.261 |
rito | +2.241 |
liest | +2.167 |
Neg logit contributions | |
oyal | -3.110 |
stown | -2.895 |
charging | -2.844 |
atically | -2.832 |
Gleaming | -2.827 |
Token | or |
Token ID | 393 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
hua | +1.398 |
uces | +1.342 |
itous | +1.303 |
rito | +1.296 |
048 | +1.236 |
Neg logit contributions | |
oyal | -1.636 |
stown | -1.511 |
charging | -1.473 |
atically | -1.471 |
Gleaming | -1.454 |
Token | the |
Token ID | 262 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
hua | +1.194 |
uces | +1.154 |
itous | +1.114 |
rito | +1.109 |
048 | +1.057 |
Neg logit contributions | |
oyal | -1.275 |
stown | -1.177 |
charging | -1.147 |
atically | -1.142 |
agy | -1.126 |
Token | exposure |
Token ID | 7111 |
Feature activation | +4.51e+00 |
Pos logit contributions | |
hua | +0.926 |
uces | +0.895 |
itous | +0.871 |
rito | +0.865 |
048 | +0.826 |
Neg logit contributions | |
oyal | -0.960 |
stown | -0.885 |
charging | -0.861 |
atically | -0.860 |
agy | -0.843 |
Token | of |
Token ID | 286 |
Feature activation | +3.62e+00 |
Pos logit contributions | |
hua | +2.962 |
uces | +2.860 |
itous | +2.772 |
rito | +2.761 |
048 | +2.624 |
Neg logit contributions | |
oyal | -3.463 |
stown | -3.202 |
charging | -3.121 |
atically | -3.104 |
Gleaming | -3.066 |
Token | pressure |
Token ID | 3833 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
hua | +2.320 |
uces | +2.234 |
itous | +2.169 |
rito | +2.158 |
liest | +2.058 |
Neg logit contributions | |
oyal | -2.807 |
stown | -2.570 |
atically | -2.524 |
charging | -2.519 |
agy | -2.498 |
Token | tactics |
Token ID | 10815 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
hua | +1.165 |
uces | +1.124 |
rito | +1.087 |
itous | +1.082 |
048 | +1.039 |
Neg logit contributions | |
oyal | -1.258 |
stown | -1.161 |
atically | -1.127 |
charging | -1.125 |
Gleaming | -1.111 |
Token | used |
Token ID | 973 |
Feature activation | +4.15e+00 |
Pos logit contributions | |
oyal | +0.746 |
stown | +0.692 |
charging | +0.678 |
atically | +0.677 |
Wolfe | +0.666 |
Neg logit contributions | |
hua | -0.685 |
uces | -0.666 |
rito | -0.641 |
itous | -0.637 |
048 | -0.609 |
Token | � |
Token ID | 447 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
hua | +1.934 |
uces | +1.864 |
rito | +1.806 |
itous | +1.791 |
048 | +1.756 |
Neg logit contributions | |
oyal | -1.805 |
stown | -1.643 |
charging | -1.628 |
atically | -1.618 |
agy | -1.581 |
Token | � |
Token ID | 251 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
hua | +1.052 |
uces | +1.022 |
rito | +0.988 |
itous | +0.983 |
048 | +0.946 |
Neg logit contributions | |
oyal | -0.971 |
stown | -0.895 |
charging | -0.872 |
atically | -0.867 |
Wolfe | -0.851 |
Token |
|
Token ID | 198 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
oyal | +0.093 |
stown | +0.085 |
charging | +0.083 |
atically | +0.082 |
agy | +0.081 |
Neg logit contributions | |
hua | -0.100 |
uces | -0.098 |
rito | -0.094 |
itous | -0.094 |
048 | -0.090 |
Token |
|
Token ID | 198 |
Feature activation | +1.92e+00 |
Pos logit contributions | |
oyal | +0.704 |
stown | +0.644 |
charging | +0.631 |
atically | +0.629 |
Wolfe | +0.615 |
Neg logit contributions | |
hua | -0.737 |
uces | -0.713 |
rito | -0.689 |
itous | -0.688 |
048 | -0.663 |
Token | In |
Token ID | 818 |
Feature activation | +2.69e+00 |
Pos logit contributions | |
hua | +1.273 |
uces | +1.221 |
rito | +1.180 |
itous | +1.173 |
048 | +1.128 |
Neg logit contributions | |
oyal | -1.471 |
stown | -1.365 |
charging | -1.335 |
atically | -1.333 |
Wolfe | -1.316 |
Token | the |
Token ID | 262 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
hua | +1.841 |
uces | +1.757 |
rito | +1.697 |
itous | +1.688 |
hi | +1.615 |
Neg logit contributions | |
oyal | -2.024 |
stown | -1.864 |
atically | -1.812 |
charging | -1.804 |
agy | -1.771 |
Token | case |
Token ID | 1339 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
hua | +1.511 |
uces | +1.460 |
itous | +1.415 |
rito | +1.409 |
048 | +1.354 |
Neg logit contributions | |
oyal | -1.454 |
stown | -1.323 |
charging | -1.297 |
atically | -1.295 |
agy | -1.276 |
Token | of |
Token ID | 286 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
hua | +1.274 |
uces | +1.239 |
rito | +1.191 |
itous | +1.188 |
048 | +1.135 |
Neg logit contributions | |
oyal | -1.359 |
stown | -1.255 |
charging | -1.229 |
atically | -1.223 |
Wolfe | -1.202 |
Token | the |
Token ID | 262 |
Feature activation | +2.54e+00 |
Pos logit contributions | |
hua | +1.480 |
uces | +1.423 |
rito | +1.377 |
itous | +1.375 |
liest | +1.306 |
Neg logit contributions | |
oyal | -1.704 |
stown | -1.572 |
charging | -1.540 |
atically | -1.537 |
agy | -1.512 |
Token | recent |
Token ID | 2274 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
hua | +1.673 |
uces | +1.606 |
itous | +1.562 |
rito | +1.556 |
liest | +1.481 |
Neg logit contributions | |
oyal | -1.948 |
stown | -1.794 |
charging | -1.759 |
atically | -1.756 |
agy | -1.734 |
Token | US |
Token ID | 1294 |
Feature activation | +2.65e+00 |
Pos logit contributions | |
hua | +1.018 |
uces | +0.983 |
itous | +0.948 |
rito | +0.945 |
048 | +0.899 |
Neg logit contributions | |
oyal | -1.232 |
stown | -1.136 |
charging | -1.117 |
atically | -1.114 |
agy | -1.094 |
Token |
|
Token ID | 198 |
Feature activation | +4.70e-01 |
Pos logit contributions | |
oyal | +0.353 |
stown | +0.321 |
charging | +0.315 |
atically | +0.315 |
Wolfe | +0.308 |
Neg logit contributions | |
hua | -0.355 |
uces | -0.341 |
itous | -0.331 |
rito | -0.331 |
048 | -0.319 |
Token | " |
Token ID | 1 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
hua | +0.310 |
uces | +0.299 |
rito | +0.289 |
itous | +0.287 |
048 | +0.275 |
Neg logit contributions | |
oyal | -0.361 |
stown | -0.334 |
charging | -0.328 |
atically | -0.327 |
Wolfe | -0.322 |
Token | As |
Token ID | 1722 |
Feature activation | -4.10e+00 |
Pos logit contributions | |
oyal | +1.885 |
stown | +1.733 |
charging | +1.693 |
atically | +1.684 |
Wolfe | +1.651 |
Neg logit contributions | |
hua | -1.926 |
uces | -1.882 |
rito | -1.811 |
itous | -1.806 |
048 | -1.719 |
Token | you |
Token ID | 345 |
Feature activation | -9.92e-01 |
Pos logit contributions | |
oyal | +2.817 |
stown | +2.591 |
charging | +2.531 |
atically | +2.514 |
Wolfe | +2.493 |
Neg logit contributions | |
hua | -3.017 |
uces | -2.936 |
rito | -2.822 |
itous | -2.813 |
048 | -2.694 |
Token | may |
Token ID | 743 |
Feature activation | +4.02e+00 |
Pos logit contributions | |
oyal | +0.774 |
stown | +0.718 |
charging | +0.704 |
atically | +0.699 |
Wolfe | +0.687 |
Neg logit contributions | |
hua | -0.641 |
uces | -0.620 |
rito | -0.597 |
itous | -0.595 |
048 | -0.566 |
Token | have |
Token ID | 423 |
Feature activation | +2.25e+00 |
Pos logit contributions | |
hua | +2.411 |
uces | +2.297 |
rito | +2.256 |
itous | +2.247 |
hi | +2.144 |
Neg logit contributions | |
oyal | -3.245 |
stown | -3.015 |
charging | -3.008 |
Wolfe | -2.926 |
atically | -2.921 |
Token | heard |
Token ID | 2982 |
Feature activation | -3.86e+00 |
Pos logit contributions | |
hua | +1.297 |
uces | +1.236 |
itous | +1.191 |
rito | +1.189 |
hi | +1.125 |
Neg logit contributions | |
oyal | -1.911 |
stown | -1.781 |
charging | -1.758 |
atically | -1.724 |
Gleaming | -1.699 |
Token | , |
Token ID | 11 |
Feature activation | -3.61e+00 |
Pos logit contributions | |
oyal | +2.812 |
stown | +2.591 |
atically | +2.553 |
charging | +2.516 |
Wolfe | +2.504 |
Neg logit contributions | |
hua | -2.673 |
uces | -2.601 |
rito | -2.497 |
itous | -2.488 |
048 | -2.380 |
Token | Winter |
Token ID | 10633 |
Feature activation | -3.34e+00 |
Pos logit contributions | |
oyal | +2.411 |
stown | +2.208 |
atically | +2.151 |
charging | +2.150 |
Wolfe | +2.137 |
Neg logit contributions | |
hua | -2.727 |
uces | -2.649 |
rito | -2.554 |
itous | -2.541 |
048 | -2.436 |
Token | ke |
Token ID | 365 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
oyal | +1.934 |
stown | +1.744 |
charging | +1.696 |
atically | +1.683 |
Wolfe | +1.642 |
Neg logit contributions | |
hua | -2.839 |
uces | -2.767 |
rito | -2.688 |
itous | -2.681 |
048 | -2.585 |
Token | wl |
Token ID | 40989 |
Feature activation | -8.66e-01 |
Pos logit contributions | |
hua | +1.114 |
uces | +1.050 |
rito | +1.007 |
itous | +0.990 |
048 | +0.960 |
Neg logit contributions | |
oyal | -1.432 |
stown | -1.326 |
charging | -1.304 |
atically | -1.291 |
Gleaming | -1.284 |
Token | a |
Token ID | 257 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
oyal | +1.577 |
stown | +1.455 |
charging | +1.422 |
atically | +1.416 |
Wolfe | +1.396 |
Neg logit contributions | |
hua | -1.550 |
uces | -1.504 |
rito | -1.453 |
itous | -1.448 |
048 | -1.384 |
Token | vibrant |
Token ID | 21266 |
Feature activation | -3.87e+00 |
Pos logit contributions | |
oyal | +1.456 |
stown | +1.345 |
charging | +1.315 |
atically | +1.310 |
Wolfe | +1.287 |
Neg logit contributions | |
hua | -1.379 |
uces | -1.339 |
rito | -1.291 |
itous | -1.287 |
048 | -1.229 |
Token | left |
Token ID | 1364 |
Feature activation | +4.38e-01 |
Pos logit contributions | |
oyal | +2.715 |
stown | +2.515 |
atically | +2.441 |
charging | +2.437 |
Wolfe | +2.399 |
Neg logit contributions | |
hua | -2.792 |
uces | -2.704 |
rito | -2.617 |
itous | -2.617 |
048 | -2.508 |
Token | can |
Token ID | 460 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
hua | +0.297 |
uces | +0.288 |
rito | +0.277 |
itous | +0.276 |
048 | +0.263 |
Neg logit contributions | |
oyal | -0.328 |
stown | -0.303 |
charging | -0.297 |
atically | -0.295 |
Wolfe | -0.290 |
Token | only |
Token ID | 691 |
Feature activation | -4.03e-01 |
Pos logit contributions | |
hua | +0.915 |
uces | +0.891 |
rito | +0.861 |
itous | +0.858 |
048 | +0.820 |
Neg logit contributions | |
oyal | -0.886 |
stown | -0.814 |
charging | -0.799 |
atically | -0.788 |
Wolfe | -0.777 |
Token | be |
Token ID | 307 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
oyal | +0.266 |
stown | +0.243 |
charging | +0.237 |
atically | +0.236 |
Wolfe | +0.231 |
Neg logit contributions | |
hua | -0.310 |
uces | -0.301 |
rito | -0.292 |
itous | -0.291 |
048 | -0.279 |
Token | grounded |
Token ID | 22804 |
Feature activation | +6.12e+00 |
Pos logit contributions | |
hua | +1.432 |
uces | +1.398 |
rito | +1.338 |
itous | +1.335 |
048 | +1.265 |
Neg logit contributions | |
oyal | -1.490 |
stown | -1.364 |
charging | -1.340 |
atically | -1.328 |
Gleaming | -1.307 |
Token | in |
Token ID | 287 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
hua | +3.451 |
uces | +3.329 |
itous | +3.192 |
rito | +3.155 |
048 | +2.969 |
Neg logit contributions | |
oyal | -5.174 |
stown | -4.763 |
charging | -4.731 |
Gleaming | -4.670 |
Wolfe | -4.576 |
Token | a |
Token ID | 257 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
oyal | +1.505 |
stown | +1.388 |
charging | +1.357 |
atically | +1.350 |
Wolfe | +1.327 |
Neg logit contributions | |
hua | -1.521 |
uces | -1.477 |
rito | -1.428 |
itous | -1.424 |
048 | -1.362 |
Token | rebuilt |
Token ID | 30080 |
Feature activation | +5.40e-01 |
Pos logit contributions | |
hua | +0.685 |
uces | +0.661 |
rito | +0.636 |
itous | +0.635 |
048 | +0.604 |
Neg logit contributions | |
oyal | -0.768 |
stown | -0.707 |
charging | -0.694 |
atically | -0.688 |
agy | -0.678 |
Token | labor |
Token ID | 4827 |
Feature activation | +3.82e+00 |
Pos logit contributions | |
hua | +0.362 |
uces | +0.353 |
rito | +0.339 |
itous | +0.337 |
048 | +0.320 |
Neg logit contributions | |
oyal | -0.407 |
stown | -0.373 |
charging | -0.368 |
atically | -0.365 |
agy | -0.359 |
Token | , |
Token ID | 11 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
hua | +0.888 |
uces | +0.851 |
rito | +0.822 |
itous | +0.820 |
048 | +0.781 |
Neg logit contributions | |
oyal | -1.113 |
stown | -1.027 |
charging | -1.008 |
atically | -0.994 |
Gleaming | -0.992 |
Token | noting |
Token ID | 10820 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
oyal | +0.871 |
stown | +0.796 |
charging | +0.775 |
atically | +0.772 |
Wolfe | +0.754 |
Neg logit contributions | |
hua | -0.988 |
uces | -0.961 |
rito | -0.930 |
itous | -0.928 |
048 | -0.890 |
Token | that |
Token ID | 326 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
oyal | +1.393 |
stown | +1.285 |
charging | +1.256 |
atically | +1.255 |
Wolfe | +1.234 |
Neg logit contributions | |
hua | -1.414 |
uces | -1.374 |
rito | -1.329 |
itous | -1.324 |
048 | -1.264 |
Token | Apple |
Token ID | 4196 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
hua | +0.229 |
uces | +0.222 |
rito | +0.213 |
itous | +0.213 |
048 | +0.204 |
Neg logit contributions | |
oyal | -0.246 |
stown | -0.226 |
charging | -0.221 |
atically | -0.220 |
agy | -0.216 |
Token | PR |
Token ID | 4810 |
Feature activation | -2.69e+00 |
Pos logit contributions | |
oyal | +0.789 |
stown | +0.729 |
charging | +0.713 |
atically | +0.710 |
Wolfe | +0.696 |
Neg logit contributions | |
hua | -0.729 |
uces | -0.708 |
rito | -0.682 |
itous | -0.680 |
048 | -0.649 |
Token | didn |
Token ID | 1422 |
Feature activation | -3.38e+00 |
Pos logit contributions | |
oyal | +1.941 |
stown | +1.786 |
atically | +1.750 |
charging | +1.740 |
Wolfe | +1.710 |
Neg logit contributions | |
hua | -1.887 |
uces | -1.839 |
itous | -1.767 |
rito | -1.763 |
048 | -1.675 |
Token | 't |
Token ID | 470 |
Feature activation | -4.53e-01 |
Pos logit contributions | |
oyal | +2.521 |
stown | +2.347 |
charging | +2.280 |
atically | +2.276 |
Wolfe | +2.230 |
Neg logit contributions | |
hua | -2.271 |
uces | -2.224 |
rito | -2.134 |
itous | -2.128 |
inguishable | -2.029 |
Token | warn |
Token ID | 9828 |
Feature activation | +7.23e-01 |
Pos logit contributions | |
oyal | +0.316 |
stown | +0.290 |
charging | +0.284 |
atically | +0.281 |
Wolfe | +0.276 |
Neg logit contributions | |
hua | -0.330 |
uces | -0.320 |
rito | -0.311 |
itous | -0.310 |
048 | -0.297 |
Token | her |
Token ID | 607 |
Feature activation | -4.78e-01 |
Pos logit contributions | |
hua | +0.514 |
uces | +0.499 |
rito | +0.482 |
itous | +0.481 |
048 | +0.462 |
Neg logit contributions | |
oyal | -0.517 |
stown | -0.474 |
charging | -0.464 |
atically | -0.461 |
agy | -0.453 |
Token | beforehand |
Token ID | 27091 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
oyal | +0.348 |
stown | +0.320 |
charging | +0.313 |
atically | +0.311 |
agy | +0.305 |
Neg logit contributions | |
hua | -0.335 |
uces | -0.323 |
rito | -0.313 |
itous | -0.312 |
048 | -0.298 |
Token | -- |
Token ID | 1377 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
hua | +2.273 |
uces | +2.145 |
itous | +2.092 |
rito | +2.090 |
048 | +2.005 |
Neg logit contributions | |
oyal | -2.740 |
stown | -2.532 |
charging | -2.477 |
atically | -2.457 |
Gleaming | -2.436 |
Token | noting |
Token ID | 10820 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
oyal | +1.960 |
stown | +1.807 |
charging | +1.768 |
atically | +1.756 |
Wolfe | +1.729 |
Neg logit contributions | |
hua | -2.075 |
uces | -2.022 |
rito | -1.950 |
itous | -1.942 |
048 | -1.856 |
Token | that |
Token ID | 326 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
oyal | +1.716 |
stown | +1.587 |
atically | +1.548 |
charging | +1.540 |
Wolfe | +1.519 |
Neg logit contributions | |
hua | -1.837 |
uces | -1.777 |
rito | -1.725 |
itous | -1.710 |
048 | -1.638 |
Token | she |
Token ID | 673 |
Feature activation | -8.56e-01 |
Pos logit contributions | |
hua | +0.250 |
uces | +0.243 |
rito | +0.234 |
itous | +0.234 |
048 | +0.224 |
Neg logit contributions | |
oyal | -0.261 |
stown | -0.240 |
charging | -0.235 |
atically | -0.233 |
agy | -0.229 |
Token | would |
Token ID | 561 |
Feature activation | -2.66e+00 |
Pos logit contributions | |
oyal | +0.641 |
stown | +0.592 |
charging | +0.580 |
atically | +0.576 |
Wolfe | +0.566 |
Neg logit contributions | |
hua | -0.580 |
uces | -0.562 |
rito | -0.542 |
itous | -0.540 |
048 | -0.516 |
Token | not |
Token ID | 407 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
oyal | +1.909 |
stown | +1.766 |
atically | +1.724 |
charging | +1.718 |
Wolfe | +1.685 |
Neg logit contributions | |
hua | -1.887 |
uces | -1.833 |
rito | -1.757 |
itous | -1.754 |
048 | -1.668 |
Token | have |
Token ID | 423 |
Feature activation | -3.14e+00 |
Pos logit contributions | |
hua | +0.870 |
uces | +0.846 |
rito | +0.824 |
itous | +0.824 |
048 | +0.790 |
Neg logit contributions | |
oyal | -0.844 |
stown | -0.771 |
charging | -0.762 |
atically | -0.744 |
Gleaming | -0.742 |
Token | qualified |
Token ID | 10617 |
Feature activation | +3.84e+00 |
Pos logit contributions | |
oyal | +1.988 |
stown | +1.823 |
atically | +1.776 |
charging | +1.769 |
Wolfe | +1.739 |
Neg logit contributions | |
hua | -2.476 |
uces | -2.420 |
rito | -2.334 |
itous | -2.328 |
048 | -2.235 |
Token | for |
Token ID | 329 |
Feature activation | +3.07e+00 |
Pos logit contributions | |
hua | +2.262 |
uces | +2.154 |
itous | +2.072 |
rito | +2.069 |
048 | +1.976 |
Neg logit contributions | |
oyal | -3.200 |
stown | -2.944 |
charging | -2.910 |
Gleaming | -2.891 |
atically | -2.857 |
Token | the |
Token ID | 262 |
Feature activation | +2.44e+00 |
Pos logit contributions | |
hua | +2.035 |
uces | +1.960 |
itous | +1.897 |
rito | +1.891 |
048 | +1.812 |
Neg logit contributions | |
oyal | -2.318 |
stown | -2.129 |
charging | -2.109 |
atically | -2.091 |
agy | -2.075 |
Token | scholarship |
Token ID | 18652 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
hua | +1.677 |
uces | +1.618 |
rito | +1.565 |
itous | +1.562 |
048 | +1.505 |
Neg logit contributions | |
oyal | -1.788 |
charging | -1.640 |
stown | -1.636 |
atically | -1.618 |
agy | -1.602 |
Token | under |
Token ID | 739 |
Feature activation | -4.82e+00 |
Pos logit contributions | |
oyal | +1.738 |
stown | +1.610 |
charging | +1.571 |
atically | +1.566 |
Wolfe | +1.539 |
Neg logit contributions | |
hua | -1.608 |
uces | -1.561 |
rito | -1.505 |
itous | -1.500 |
048 | -1.429 |
Token | of |
Token ID | 286 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
oyal | +2.322 |
stown | +2.147 |
charging | +2.099 |
Wolfe | +2.095 |
atically | +2.083 |
Neg logit contributions | |
hua | -2.253 |
uces | -2.193 |
itous | -2.106 |
rito | -2.094 |
048 | -1.991 |
Token | the |
Token ID | 262 |
Feature activation | -3.18e+00 |
Pos logit contributions | |
oyal | +0.091 |
stown | +0.084 |
charging | +0.082 |
atically | +0.081 |
Wolfe | +0.080 |
Neg logit contributions | |
hua | -0.093 |
uces | -0.090 |
rito | -0.087 |
itous | -0.087 |
048 | -0.083 |
Token | raid |
Token ID | 9513 |
Feature activation | -7.86e-01 |
Pos logit contributions | |
oyal | +1.663 |
stown | +1.501 |
charging | +1.447 |
Wolfe | +1.437 |
atically | +1.435 |
Neg logit contributions | |
hua | -2.858 |
uces | -2.793 |
itous | -2.698 |
rito | -2.692 |
048 | -2.603 |
Token | : |
Token ID | 25 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
oyal | +0.612 |
stown | +0.569 |
charging | +0.557 |
atically | +0.555 |
Wolfe | +0.545 |
Neg logit contributions | |
hua | -0.508 |
uces | -0.493 |
rito | -0.473 |
itous | -0.472 |
048 | -0.448 |
Token |
|
Token ID | 198 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
oyal | +1.108 |
stown | +1.013 |
charging | +0.994 |
atically | +0.984 |
Wolfe | +0.978 |
Neg logit contributions | |
hua | -1.278 |
uces | -1.243 |
rito | -1.206 |
itous | -1.199 |
048 | -1.149 |
Token |
|
Token ID | 198 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
oyal | +1.136 |
stown | +1.042 |
charging | +1.017 |
atically | +1.012 |
Wolfe | +0.992 |
Neg logit contributions | |
hua | -1.237 |
uces | -1.204 |
rito | -1.163 |
itous | -1.160 |
048 | -1.111 |
Token | Male |
Token ID | 25486 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
oyal | +1.246 |
stown | +1.153 |
charging | +1.132 |
atically | +1.122 |
Wolfe | +1.101 |
Neg logit contributions | |
hua | -1.108 |
uces | -1.079 |
rito | -1.034 |
itous | -1.034 |
048 | -0.979 |
Token | Officer |
Token ID | 10391 |
Feature activation | +2.52e+00 |
Pos logit contributions | |
hua | +2.418 |
uces | +2.351 |
rito | +2.271 |
itous | +2.239 |
048 | +2.166 |
Neg logit contributions | |
oyal | -2.629 |
stown | -2.405 |
atically | -2.372 |
charging | -2.362 |
agy | -2.321 |
Token | : |
Token ID | 25 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
hua | +1.551 |
uces | +1.513 |
rito | +1.460 |
itous | +1.445 |
048 | +1.387 |
Neg logit contributions | |
oyal | -2.034 |
stown | -1.872 |
charging | -1.834 |
atically | -1.822 |
agy | -1.798 |
Token | � |
Token ID | 564 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
hua | +0.965 |
uces | +0.937 |
rito | +0.908 |
itous | +0.901 |
048 | +0.867 |
Neg logit contributions | |
oyal | -0.965 |
stown | -0.887 |
charging | -0.866 |
atically | -0.864 |
agy | -0.846 |
Token | � |
Token ID | 250 |
Feature activation | +3.78e+00 |
Pos logit contributions | |
oyal | +0.867 |
stown | +0.792 |
atically | +0.779 |
charging | +0.779 |
Wolfe | +0.758 |
Neg logit contributions | |
hua | -0.751 |
uces | -0.719 |
itous | -0.701 |
rito | -0.690 |
liest | -0.661 |
Token | Lenin |
Token ID | 22899 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
oyal | +0.993 |
stown | +0.912 |
charging | +0.890 |
atically | +0.886 |
Wolfe | +0.868 |
Neg logit contributions | |
hua | -1.071 |
uces | -1.042 |
rito | -1.007 |
itous | -1.003 |
048 | -0.961 |
Token | ist |
Token ID | 396 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
oyal | +1.577 |
stown | +1.462 |
atically | +1.421 |
charging | +1.420 |
Wolfe | +1.394 |
Neg logit contributions | |
hua | -1.438 |
uces | -1.397 |
rito | -1.347 |
itous | -1.338 |
048 | -1.281 |
Token | ideology |
Token ID | 12959 |
Feature activation | +3.04e+00 |
Pos logit contributions | |
hua | +1.089 |
uces | +1.058 |
itous | +1.019 |
rito | +1.019 |
048 | +0.977 |
Neg logit contributions | |
oyal | -1.047 |
stown | -0.960 |
charging | -0.948 |
atically | -0.933 |
agy | -0.915 |
Token | that |
Token ID | 326 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
hua | +2.013 |
uces | +1.946 |
rito | +1.884 |
itous | +1.872 |
048 | +1.784 |
Neg logit contributions | |
oyal | -2.304 |
stown | -2.131 |
charging | -2.104 |
agy | -2.038 |
atically | -2.035 |
Token | flowed |
Token ID | 35456 |
Feature activation | +6.90e-01 |
Pos logit contributions | |
hua | +0.217 |
uces | +0.211 |
rito | +0.203 |
itous | +0.202 |
048 | +0.193 |
Neg logit contributions | |
oyal | -0.223 |
stown | -0.206 |
charging | -0.202 |
atically | -0.200 |
agy | -0.196 |
Token | from |
Token ID | 422 |
Feature activation | -2.57e+00 |
Pos logit contributions | |
hua | +0.465 |
uces | +0.451 |
itous | +0.434 |
rito | +0.433 |
048 | +0.412 |
Neg logit contributions | |
oyal | -0.521 |
stown | -0.481 |
charging | -0.471 |
atically | -0.463 |
agy | -0.458 |
Token | that |
Token ID | 326 |
Feature activation | -4.19e+00 |
Pos logit contributions | |
oyal | +1.828 |
stown | +1.687 |
atically | +1.645 |
charging | +1.641 |
Wolfe | +1.617 |
Neg logit contributions | |
hua | -1.829 |
uces | -1.776 |
rito | -1.718 |
itous | -1.705 |
048 | -1.630 |
Token | defeat |
Token ID | 7433 |
Feature activation | -3.55e+00 |
Pos logit contributions | |
oyal | +2.702 |
stown | +2.438 |
atically | +2.394 |
charging | +2.360 |
Wolfe | +2.357 |
Neg logit contributions | |
hua | -3.251 |
uces | -3.158 |
rito | -3.080 |
itous | -3.031 |
048 | -2.948 |
Token | , |
Token ID | 11 |
Feature activation | +5.07e-01 |
Pos logit contributions | |
oyal | +2.540 |
stown | +2.350 |
atically | +2.322 |
charging | +2.284 |
Wolfe | +2.243 |
Neg logit contributions | |
hua | -2.464 |
uces | -2.406 |
rito | -2.325 |
itous | -2.296 |
048 | -2.207 |
Token | led |
Token ID | 2957 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
hua | +0.353 |
uces | +0.342 |
rito | +0.330 |
itous | +0.330 |
048 | +0.315 |
Neg logit contributions | |
oyal | -0.370 |
stown | -0.342 |
charging | -0.335 |
atically | -0.331 |
Wolfe | -0.325 |
Token | the |
Token ID | 262 |
Feature activation | -3.24e+00 |
Pos logit contributions | |
oyal | +1.615 |
stown | +1.484 |
atically | +1.458 |
charging | +1.447 |
Wolfe | +1.434 |
Neg logit contributions | |
hua | -1.629 |
uces | -1.583 |
rito | -1.535 |
itous | -1.522 |
048 | -1.462 |
Token | that |
Token ID | 326 |
Feature activation | +4.04e+00 |
Pos logit contributions | |
hua | +3.702 |
uces | +3.504 |
itous | +3.444 |
rito | +3.419 |
048 | +3.261 |
Neg logit contributions | |
oyal | -5.287 |
stown | -4.901 |
Gleaming | -4.801 |
charging | -4.783 |
atically | -4.761 |
Token | they |
Token ID | 484 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
hua | +2.707 |
uces | +2.611 |
rito | +2.523 |
itous | +2.493 |
048 | +2.429 |
Neg logit contributions | |
oyal | -3.010 |
stown | -2.734 |
atically | -2.704 |
charging | -2.702 |
Gleaming | -2.655 |
Token | rec |
Token ID | 664 |
Feature activation | -4.31e+00 |
Pos logit contributions | |
hua | +0.477 |
uces | +0.459 |
rito | +0.448 |
itous | +0.447 |
048 | +0.430 |
Neg logit contributions | |
oyal | -0.487 |
stown | -0.446 |
charging | -0.439 |
atically | -0.433 |
Gleaming | -0.426 |
Token | use |
Token ID | 1904 |
Feature activation | -4.82e+00 |
Pos logit contributions | |
oyal | +3.044 |
stown | +2.846 |
charging | +2.769 |
atically | +2.727 |
agy | +2.689 |
Neg logit contributions | |
hua | -3.067 |
uces | -2.977 |
itous | -2.865 |
rito | -2.845 |
048 | -2.760 |
Token | themselves |
Token ID | 2405 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
oyal | +1.797 |
stown | +1.589 |
charging | +1.494 |
atically | +1.488 |
Wolfe | +1.454 |
Neg logit contributions | |
hua | -5.014 |
uces | -4.877 |
itous | -4.762 |
rito | -4.762 |
048 | -4.609 |
Token | , |
Token ID | 11 |
Feature activation | -4.06e+00 |
Pos logit contributions | |
hua | +1.555 |
uces | +1.497 |
rito | +1.443 |
itous | +1.439 |
048 | +1.374 |
Neg logit contributions | |
oyal | -1.873 |
stown | -1.726 |
charging | -1.694 |
atically | -1.678 |
Gleaming | -1.678 |
Token | giving |
Token ID | 3501 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
oyal | +2.672 |
stown | +2.463 |
charging | +2.431 |
atically | +2.401 |
Wolfe | +2.376 |
Neg logit contributions | |
hua | -3.081 |
uces | -3.008 |
rito | -2.907 |
itous | -2.887 |
048 | -2.748 |
Token | rise |
Token ID | 4485 |
Feature activation | -1.59e-02 |
Pos logit contributions | |
oyal | +0.955 |
stown | +0.879 |
charging | +0.859 |
atically | +0.854 |
Wolfe | +0.839 |
Neg logit contributions | |
hua | -0.976 |
uces | -0.947 |
rito | -0.916 |
itous | -0.912 |
048 | -0.872 |
Token | to |
Token ID | 284 |
Feature activation | +4.36e-01 |
Pos logit contributions | |
oyal | +0.013 |
stown | +0.012 |
charging | +0.011 |
atically | +0.011 |
Gleaming | +0.011 |
Neg logit contributions | |
hua | -0.010 |
uces | -0.010 |
rito | -0.009 |
itous | -0.009 |
048 | -0.009 |
Token | an |
Token ID | 281 |
Feature activation | +3.10e+00 |
Pos logit contributions | |
hua | +0.306 |
uces | +0.297 |
rito | +0.287 |
itous | +0.286 |
048 | +0.273 |
Neg logit contributions | |
oyal | -0.316 |
stown | -0.291 |
charging | -0.284 |
atically | -0.284 |
Wolfe | -0.278 |
Token | appeal |
Token ID | 5198 |
Feature activation | +3.54e+00 |
Pos logit contributions | |
hua | +2.128 |
uces | +2.080 |
itous | +2.021 |
rito | +1.996 |
048 | +1.903 |
Neg logit contributions | |
oyal | -2.250 |
stown | -2.090 |
charging | -2.033 |
atically | -2.031 |
agy | -1.981 |
Token | wanted |
Token ID | 2227 |
Feature activation | -2.52e+00 |
Pos logit contributions | |
oyal | +0.859 |
stown | +0.795 |
charging | +0.778 |
atically | +0.775 |
Wolfe | +0.761 |
Neg logit contributions | |
hua | -0.766 |
uces | -0.743 |
rito | -0.715 |
itous | -0.713 |
048 | -0.680 |
Token | to |
Token ID | 284 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
oyal | +1.769 |
stown | +1.645 |
charging | +1.612 |
atically | +1.609 |
Wolfe | +1.588 |
Neg logit contributions | |
hua | -1.795 |
uces | -1.733 |
rito | -1.684 |
itous | -1.665 |
048 | -1.611 |
Token | go |
Token ID | 467 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
oyal | +1.809 |
stown | +1.671 |
atically | +1.631 |
charging | +1.627 |
Wolfe | +1.595 |
Neg logit contributions | |
hua | -1.890 |
uces | -1.837 |
rito | -1.767 |
itous | -1.764 |
048 | -1.687 |
Token | counter |
Token ID | 3753 |
Feature activation | -7.53e+00 |
Pos logit contributions | |
oyal | +2.321 |
stown | +2.164 |
atically | +2.118 |
charging | +2.110 |
Wolfe | +2.081 |
Neg logit contributions | |
hua | -2.293 |
uces | -2.225 |
rito | -2.155 |
itous | -2.126 |
048 | -2.048 |
Token | - |
Token ID | 12 |
Feature activation | -6.51e+00 |
Pos logit contributions | |
oyal | +5.024 |
stown | +4.742 |
charging | +4.724 |
atically | +4.612 |
Wolfe | +4.522 |
Neg logit contributions | |
hua | -5.308 |
uces | -5.242 |
rito | -5.050 |
itous | -4.923 |
inguishable | -4.823 |
Token | clock |
Token ID | 15750 |
Feature activation | -7.75e+00 |
Pos logit contributions | |
oyal | +3.125 |
charging | +2.876 |
stown | +2.864 |
atically | +2.800 |
agy | +2.597 |
Neg logit contributions | |
hua | -5.873 |
uces | -5.836 |
rito | -5.678 |
itous | -5.585 |
048 | -5.457 |
Token | wise |
Token ID | 3083 |
Feature activation | -5.02e+00 |
Pos logit contributions | |
oyal | +3.837 |
stown | +3.559 |
atically | +3.371 |
charging | +3.347 |
Wolfe | +3.169 |
Neg logit contributions | |
hua | -6.993 |
uces | -6.912 |
rito | -6.749 |
itous | -6.503 |
048 | -6.420 |
Token | and |
Token ID | 290 |
Feature activation | -2.79e+00 |
Pos logit contributions | |
oyal | +3.560 |
stown | +3.352 |
atically | +3.291 |
charging | +3.264 |
Wolfe | +3.208 |
Neg logit contributions | |
hua | -3.481 |
uces | -3.402 |
rito | -3.299 |
itous | -3.226 |
inguishable | -3.122 |
Token | we |
Token ID | 356 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
oyal | +2.004 |
stown | +1.865 |
atically | +1.823 |
charging | +1.814 |
Wolfe | +1.792 |
Neg logit contributions | |
hua | -1.957 |
uces | -1.904 |
rito | -1.830 |
itous | -1.822 |
048 | -1.742 |
Token | were |
Token ID | 547 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
oyal | +1.012 |
stown | +0.937 |
charging | +0.916 |
atically | +0.913 |
Wolfe | +0.896 |
Neg logit contributions | |
hua | -0.918 |
uces | -0.891 |
rito | -0.857 |
itous | -0.855 |
048 | -0.815 |
Token | still |
Token ID | 991 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
hua | +1.093 |
uces | +1.054 |
rito | +1.024 |
itous | +1.018 |
hi | +0.972 |
Neg logit contributions | |
oyal | -1.277 |
stown | -1.165 |
charging | -1.141 |
agy | -1.131 |
atically | -1.122 |
Token | out |
Token ID | 503 |
Feature activation | +9.78e-01 |
Pos logit contributions | |
hua | +1.993 |
uces | +1.922 |
itous | +1.855 |
rito | +1.839 |
hi | +1.770 |
Neg logit contributions | |
oyal | -2.286 |
stown | -2.085 |
charging | -2.043 |
atically | -2.012 |
agy | -1.985 |
Token | to |
Token ID | 284 |
Feature activation | +7.87e-01 |
Pos logit contributions | |
hua | +0.642 |
uces | +0.622 |
rito | +0.599 |
itous | +0.597 |
048 | +0.568 |
Neg logit contributions | |
oyal | -0.754 |
stown | -0.698 |
charging | -0.683 |
atically | -0.679 |
Wolfe | -0.667 |
Token | do |
Token ID | 466 |
Feature activation | -2.41e+00 |
Pos logit contributions | |
hua | +0.556 |
uces | +0.539 |
rito | +0.524 |
itous | +0.523 |
048 | +0.501 |
Neg logit contributions | |
oyal | -0.566 |
stown | -0.517 |
charging | -0.509 |
atically | -0.501 |
agy | -0.494 |
Token | , |
Token ID | 11 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
oyal | +1.808 |
stown | +1.672 |
atically | +1.649 |
charging | +1.640 |
Wolfe | +1.610 |
Neg logit contributions | |
hua | -1.624 |
uces | -1.584 |
rito | -1.516 |
itous | -1.512 |
048 | -1.443 |
Token | but |
Token ID | 475 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
oyal | +2.949 |
stown | +2.717 |
charging | +2.681 |
atically | +2.676 |
Wolfe | +2.636 |
Neg logit contributions | |
hua | -2.810 |
uces | -2.733 |
rito | -2.614 |
itous | -2.610 |
048 | -2.477 |
Token | lack |
Token ID | 3092 |
Feature activation | -8.19e+00 |
Pos logit contributions | |
oyal | +0.860 |
stown | +0.794 |
charging | +0.776 |
atically | +0.773 |
Wolfe | +0.758 |
Neg logit contributions | |
hua | -0.811 |
uces | -0.788 |
rito | -0.759 |
itous | -0.757 |
048 | -0.723 |
Token | of |
Token ID | 286 |
Feature activation | -5.99e+00 |
Pos logit contributions | |
oyal | +5.352 |
stown | +4.878 |
charging | +4.764 |
atically | +4.712 |
Wolfe | +4.687 |
Neg logit contributions | |
hua | -5.994 |
uces | -5.899 |
rito | -5.670 |
itous | -5.621 |
048 | -5.525 |
Token | experience |
Token ID | 1998 |
Feature activation | -4.48e+00 |
Pos logit contributions | |
oyal | +4.335 |
stown | +4.022 |
charging | +3.950 |
Wolfe | +3.886 |
atically | +3.866 |
Neg logit contributions | |
hua | -4.094 |
uces | -4.013 |
rito | -3.899 |
itous | -3.798 |
048 | -3.657 |
Token | in |
Token ID | 287 |
Feature activation | -4.61e+00 |
Pos logit contributions | |
oyal | +3.111 |
stown | +2.896 |
atically | +2.843 |
charging | +2.842 |
Wolfe | +2.795 |
Neg logit contributions | |
hua | -3.217 |
uces | -3.124 |
rito | -3.025 |
itous | -2.991 |
inguishable | -2.860 |
Token | planning |
Token ID | 5410 |
Feature activation | -5.93e+00 |
Pos logit contributions | |
oyal | +3.203 |
stown | +2.967 |
charging | +2.895 |
atically | +2.877 |
Wolfe | +2.847 |
Neg logit contributions | |
hua | -3.359 |
uces | -3.253 |
rito | -3.119 |
itous | -3.108 |
inguishable | -2.982 |
Token | and |
Token ID | 290 |
Feature activation | -5.71e+00 |
Pos logit contributions | |
oyal | +4.012 |
stown | +3.767 |
atically | +3.700 |
Wolfe | +3.665 |
charging | +3.661 |
Neg logit contributions | |
hua | -4.285 |
uces | -4.138 |
rito | -4.049 |
itous | -3.968 |
048 | -3.813 |
Token | the |
Token ID | 262 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
oyal | +0.300 |
stown | +0.278 |
charging | +0.272 |
atically | +0.270 |
Wolfe | +0.265 |
Neg logit contributions | |
hua | -0.267 |
uces | -0.259 |
rito | -0.249 |
itous | -0.248 |
048 | -0.237 |
Token | capacity |
Token ID | 5339 |
Feature activation | -3.94e+00 |
Pos logit contributions | |
hua | +1.127 |
uces | +1.092 |
rito | +1.053 |
itous | +1.047 |
048 | +1.003 |
Neg logit contributions | |
oyal | -1.246 |
stown | -1.150 |
charging | -1.123 |
atically | -1.121 |
agy | -1.096 |
Token | from |
Token ID | 422 |
Feature activation | -6.28e+00 |
Pos logit contributions | |
oyal | +2.805 |
stown | +2.622 |
charging | +2.575 |
atically | +2.566 |
Wolfe | +2.547 |
Neg logit contributions | |
hua | -2.733 |
uces | -2.656 |
rito | -2.562 |
itous | -2.558 |
048 | -2.433 |
Token | 1 |
Token ID | 352 |
Feature activation | -7.58e+00 |
Pos logit contributions | |
oyal | +4.238 |
stown | +3.934 |
charging | +3.876 |
atically | +3.846 |
Wolfe | +3.825 |
Neg logit contributions | |
hua | -4.542 |
uces | -4.430 |
itous | -4.306 |
rito | -4.293 |
inguishable | -4.069 |
Token | , |
Token ID | 11 |
Feature activation | -6.15e+00 |
Pos logit contributions | |
oyal | +5.030 |
stown | +4.603 |
charging | +4.520 |
Wolfe | +4.484 |
atically | +4.443 |
Neg logit contributions | |
uces | -5.471 |
hua | -5.394 |
itous | -5.325 |
rito | -5.147 |
liest | -4.995 |
Token | 700 |
Token ID | 9879 |
Feature activation | -7.90e+00 |
Pos logit contributions | |
oyal | +4.629 |
stown | +4.331 |
charging | +4.232 |
atically | +4.205 |
Wolfe | +4.167 |
Neg logit contributions | |
hua | -3.884 |
uces | -3.834 |
rito | -3.709 |
itous | -3.707 |
inguishable | -3.473 |
Token | seats |
Token ID | 8632 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
oyal | +5.116 |
charging | +4.718 |
stown | +4.689 |
Wolfe | +4.597 |
atically | +4.541 |
Neg logit contributions | |
uces | -5.696 |
hua | -5.680 |
itous | -5.467 |
rito | -5.403 |
inguishable | -5.186 |
Token | to |
Token ID | 284 |
Feature activation | -6.81e+00 |
Pos logit contributions | |
oyal | +2.430 |
stown | +2.236 |
charging | +2.194 |
atically | +2.189 |
Wolfe | +2.145 |
Neg logit contributions | |
hua | -2.383 |
uces | -2.335 |
rito | -2.253 |
itous | -2.243 |
inguishable | -2.130 |
Token | 2 |
Token ID | 362 |
Feature activation | +5.92e-01 |
Pos logit contributions | |
oyal | +4.383 |
stown | +4.023 |
charging | +3.994 |
atically | +3.939 |
Wolfe | +3.895 |
Neg logit contributions | |
hua | -5.081 |
uces | -4.984 |
itous | -4.850 |
rito | -4.846 |
inguishable | -4.598 |
Token | , |
Token ID | 11 |
Feature activation | -3.50e+00 |
Pos logit contributions | |
hua | +0.371 |
uces | +0.352 |
rito | +0.340 |
itous | +0.336 |
048 | +0.328 |
Neg logit contributions | |
oyal | -0.475 |
stown | -0.440 |
atically | -0.433 |
charging | -0.432 |
agy | -0.426 |
Token | 000 |
Token ID | 830 |
Feature activation | -6.38e+00 |
Pos logit contributions | |
oyal | +2.707 |
stown | +2.509 |
charging | +2.475 |
atically | +2.445 |
Wolfe | +2.415 |
Neg logit contributions | |
hua | -2.243 |
uces | -2.193 |
itous | -2.116 |
rito | -2.112 |
liest | -1.968 |
Token | and |
Token ID | 290 |
Feature activation | -2.91e+00 |
Pos logit contributions | |
oyal | +2.476 |
stown | +2.268 |
charging | +2.216 |
atically | +2.178 |
Wolfe | +2.162 |
Neg logit contributions | |
hua | -2.910 |
uces | -2.827 |
rito | -2.771 |
itous | -2.690 |
048 | -2.619 |
Token | anx |
Token ID | 7296 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
oyal | +1.828 |
stown | +1.658 |
charging | +1.610 |
atically | +1.606 |
Wolfe | +1.576 |
Neg logit contributions | |
hua | -2.322 |
uces | -2.258 |
rito | -2.199 |
itous | -2.176 |
048 | -2.100 |
Token | io |
Token ID | 952 |
Feature activation | -6.97e+00 |
Pos logit contributions | |
oyal | +3.296 |
stown | +3.070 |
atically | +2.985 |
charging | +2.964 |
agy | +2.900 |
Neg logit contributions | |
hua | -3.008 |
uces | -2.917 |
rito | -2.767 |
itous | -2.755 |
048 | -2.655 |
Token | ly |
Token ID | 306 |
Feature activation | -8.64e+00 |
Pos logit contributions | |
oyal | +4.916 |
stown | +4.512 |
charging | +4.446 |
atically | +4.426 |
agy | +4.237 |
Neg logit contributions | |
hua | -4.929 |
uces | -4.753 |
rito | -4.609 |
itous | -4.528 |
inguishable | -4.426 |
Token | tic |
Token ID | 13370 |
Feature activation | -8.37e+00 |
Pos logit contributions | |
oyal | +3.724 |
stown | +3.374 |
atically | +3.365 |
charging | +3.144 |
tics | +2.991 |
Neg logit contributions | |
hua | -8.284 |
uces | -8.234 |
rito | -7.909 |
itous | -7.789 |
048 | -7.747 |
Token | - |
Token ID | 12 |
Feature activation | -7.87e+00 |
Pos logit contributions | |
oyal | +4.718 |
stown | +4.314 |
charging | +4.138 |
atically | +4.112 |
Armstrong | +4.082 |
Neg logit contributions | |
hua | -6.903 |
uces | -6.678 |
rito | -6.649 |
inguishable | -6.284 |
048 | -6.273 |
Token | like |
Token ID | 2339 |
Feature activation | -6.21e+00 |
Pos logit contributions | |
oyal | +4.267 |
charging | +3.844 |
stown | +3.806 |
atically | +3.786 |
iking | +3.586 |
Neg logit contributions | |
hua | -6.706 |
uces | -6.537 |
rito | -6.427 |
itous | -6.217 |
048 | -6.181 |
Token | effects |
Token ID | 3048 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
oyal | +3.257 |
stown | +2.952 |
charging | +2.828 |
atically | +2.779 |
Wolfe | +2.773 |
Neg logit contributions | |
hua | -5.472 |
uces | -5.330 |
rito | -5.290 |
itous | -5.066 |
048 | -5.019 |
Token | in |
Token ID | 287 |
Feature activation | -3.37e+00 |
Pos logit contributions | |
oyal | +1.964 |
stown | +1.790 |
atically | +1.786 |
charging | +1.768 |
Wolfe | +1.738 |
Neg logit contributions | |
hua | -1.849 |
uces | -1.792 |
rito | -1.741 |
itous | -1.712 |
048 | -1.645 |
Token | rodent |
Token ID | 50074 |
Feature activation | -3.24e+00 |
Pos logit contributions | |
oyal | +2.198 |
stown | +2.018 |
charging | +1.968 |
atically | +1.965 |
Wolfe | +1.938 |
Neg logit contributions | |
hua | -2.597 |
uces | -2.504 |
rito | -2.443 |
itous | -2.428 |
048 | -2.332 |
Token | models |
Token ID | 4981 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
oyal | +2.512 |
stown | +2.318 |
atically | +2.275 |
charging | +2.271 |
Wolfe | +2.231 |
Neg logit contributions | |
hua | -2.120 |
uces | -2.040 |
rito | -1.983 |
itous | -1.963 |
048 | -1.871 |
Token | th |
Token ID | 400 |
Feature activation | +5.26e+00 |
Pos logit contributions | |
hua | +2.412 |
uces | +2.330 |
rito | +2.247 |
itous | +2.224 |
048 | +2.119 |
Neg logit contributions | |
oyal | -3.073 |
stown | -2.822 |
atically | -2.807 |
charging | -2.799 |
agy | -2.750 |
Token | grade |
Token ID | 9559 |
Feature activation | -9.63e-01 |
Pos logit contributions | |
hua | +2.853 |
uces | +2.739 |
itous | +2.629 |
rito | +2.598 |
048 | +2.502 |
Neg logit contributions | |
oyal | -4.586 |
charging | -4.230 |
atically | -4.167 |
stown | -4.132 |
agy | -4.126 |
Token | ... |
Token ID | 986 |
Feature activation | +6.54e-01 |
Pos logit contributions | |
oyal | +0.727 |
stown | +0.673 |
charging | +0.658 |
atically | +0.655 |
Wolfe | +0.644 |
Neg logit contributions | |
hua | -0.647 |
uces | -0.627 |
rito | -0.604 |
itous | -0.602 |
048 | -0.574 |
Token | On |
Token ID | 2202 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
hua | +0.453 |
uces | +0.438 |
rito | +0.423 |
itous | +0.422 |
048 | +0.403 |
Neg logit contributions | |
oyal | -0.481 |
stown | -0.443 |
charging | -0.433 |
atically | -0.432 |
Wolfe | -0.423 |
Token | the |
Token ID | 262 |
Feature activation | -9.28e+00 |
Pos logit contributions | |
oyal | +2.874 |
stown | +2.635 |
Wolfe | +2.544 |
charging | +2.541 |
Armstrong | +2.531 |
Neg logit contributions | |
hua | -3.488 |
uces | -3.407 |
itous | -3.285 |
rito | -3.279 |
048 | -3.138 |
Token | right |
Token ID | 826 |
Feature activation | -7.78e+00 |
Pos logit contributions | |
oyal | +5.104 |
stown | +4.537 |
charging | +4.393 |
Wolfe | +4.365 |
Armstrong | +4.306 |
Neg logit contributions | |
hua | -7.700 |
uces | -7.483 |
rito | -7.182 |
itous | -7.060 |
hyde | -6.959 |
Token | : |
Token ID | 25 |
Feature activation | -4.47e+00 |
Pos logit contributions | |
oyal | +5.415 |
stown | +5.130 |
charging | +4.890 |
atically | +4.877 |
Armstrong | +4.872 |
Neg logit contributions | |
hua | -5.295 |
uces | -5.024 |
rito | -4.932 |
itous | -4.848 |
048 | -4.711 |
Token | Me |
Token ID | 2185 |
Feature activation | -6.06e+00 |
Pos logit contributions | |
oyal | +3.189 |
stown | +2.997 |
charging | +2.904 |
Wolfe | +2.895 |
atically | +2.880 |
Neg logit contributions | |
hua | -3.128 |
uces | -3.025 |
rito | -2.932 |
itous | -2.926 |
048 | -2.767 |
Token | in |
Token ID | 287 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
oyal | +4.308 |
stown | +3.946 |
atically | +3.907 |
charging | +3.904 |
agy | +3.851 |
Neg logit contributions | |
hua | -4.115 |
uces | -4.045 |
itous | -3.918 |
rito | -3.892 |
048 | -3.761 |
Token | 11 |
Token ID | 1367 |
Feature activation | +5.69e+00 |
Pos logit contributions | |
hua | +1.021 |
uces | +0.982 |
rito | +0.951 |
itous | +0.945 |
048 | +0.908 |
Neg logit contributions | |
oyal | -1.211 |
stown | -1.109 |
charging | -1.091 |
atically | -1.090 |
agy | -1.071 |
Token | th |
Token ID | 400 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
hua | +2.411 |
uces | +2.213 |
rito | +2.145 |
itous | +2.132 |
hi | +1.990 |
Neg logit contributions | |
oyal | -5.680 |
stown | -5.283 |
atically | -5.268 |
charging | -5.224 |
Gleaming | -5.176 |