Token | seconds |
Token ID | 4201 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
ATH | +1.806 |
ares | +1.579 |
aring | +1.579 |
aldi | +1.552 |
anamo | +1.552 |
Neg logit contributions | |
Zoro | -1.613 |
ibilities | -1.474 |
ells | -1.446 |
chapter | -1.327 |
ible | -1.297 |
Token | later |
Token ID | 1568 |
Feature activation | +2.88e-03 |
Pos logit contributions | |
ATH | +1.223 |
ares | +1.095 |
aring | +1.090 |
ARE | +1.073 |
anamo | +1.071 |
Neg logit contributions | |
Zoro | -0.782 |
ibilities | -0.688 |
ells | -0.685 |
chapter | -0.608 |
vitamins | -0.596 |
Token | by |
Token ID | 416 |
Feature activation | +6.84e-01 |
Pos logit contributions | |
ATH | +0.026 |
ares | +0.023 |
aring | +0.023 |
anamo | +0.023 |
ARE | +0.023 |
Neg logit contributions | |
Zoro | -0.022 |
ibilities | -0.020 |
ells | -0.019 |
chapter | -0.018 |
vitamins | -0.017 |
Token | a |
Token ID | 257 |
Feature activation | +4.60e-01 |
Pos logit contributions | |
ATH | +5.448 |
ares | +4.756 |
aring | +4.632 |
Mehran | +4.609 |
Stacy | +4.606 |
Neg logit contributions | |
Zoro | -5.384 |
ibilities | -5.241 |
ells | -5.053 |
ible | -4.553 |
chapter | -4.510 |
Token | deaf |
Token ID | 21815 |
Feature activation | +8.67e-01 |
Pos logit contributions | |
ATH | +3.815 |
aring | +3.278 |
ares | +3.263 |
ARE | +3.166 |
Stacy | +3.163 |
Neg logit contributions | |
Zoro | -3.687 |
ibilities | -3.547 |
ells | -3.403 |
vitamins | -3.115 |
ible | -3.044 |
Token | ening |
Token ID | 3101 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
ATH | +5.260 |
aring | +4.452 |
ares | +4.256 |
aldi | +4.180 |
ARE | +4.146 |
Neg logit contributions | |
Zoro | -8.585 |
ibilities | -8.096 |
ells | -7.916 |
vitamins | -7.433 |
Directions | -7.306 |
Token | th |
Token ID | 294 |
Feature activation | +7.59e-01 |
Pos logit contributions | |
ATH | +11.378 |
aring | +9.650 |
ares | +9.473 |
fare | +9.386 |
aldi | +9.204 |
Neg logit contributions | |
ibilities | -12.531 |
Zoro | -12.146 |
ells | -11.842 |
okers | -10.650 |
Directions | -10.568 |
Token | ud |
Token ID | 463 |
Feature activation | +7.42e-01 |
Pos logit contributions | |
ATH | +4.406 |
ares | +3.920 |
aring | +3.862 |
aldi | +3.648 |
ARE | +3.548 |
Neg logit contributions | |
Zoro | -7.885 |
ibilities | -7.357 |
ells | -7.057 |
Directions | -6.862 |
vitamins | -6.762 |
Token | from |
Token ID | 422 |
Feature activation | +3.98e-01 |
Pos logit contributions | |
ATH | +5.751 |
ares | +5.017 |
aring | +4.995 |
aria | +4.814 |
ARE | +4.797 |
Neg logit contributions | |
Zoro | -6.230 |
ibilities | -5.773 |
ells | -5.749 |
vitamins | -5.141 |
chapter | -5.131 |
Token | the |
Token ID | 262 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
ATH | +3.394 |
ares | +2.942 |
aring | +2.921 |
anamo | +2.912 |
Stacy | +2.899 |
Neg logit contributions | |
Zoro | -3.120 |
ibilities | -2.923 |
ells | -2.848 |
vitamins | -2.568 |
chapter | -2.568 |
Token | collapsing |
Token ID | 30792 |
Feature activation | +7.37e-01 |
Pos logit contributions | |
ATH | +4.446 |
aring | +3.862 |
ares | +3.862 |
aldi | +3.783 |
Stacy | +3.732 |
Neg logit contributions | |
Zoro | -4.441 |
ibilities | -4.202 |
ells | -4.077 |
vitamins | -3.644 |
ibly | -3.637 |
Token | to |
Token ID | 284 |
Feature activation | -7.73e-02 |
Pos logit contributions | |
ATH | +1.566 |
ares | +1.380 |
anamo | +1.379 |
aring | +1.369 |
ARE | +1.361 |
Neg logit contributions | |
Zoro | -1.344 |
ibilities | -1.202 |
ells | -1.185 |
chapter | -1.107 |
vitamins | -1.075 |
Token | stand |
Token ID | 1302 |
Feature activation | -3.37e-02 |
Pos logit contributions | |
Zoro | +0.625 |
ibilities | +0.563 |
ells | +0.556 |
chapter | +0.510 |
ible | +0.498 |
Neg logit contributions | |
ATH | -0.669 |
ares | -0.586 |
aring | -0.583 |
ARE | -0.574 |
Stacy | -0.571 |
Token | toe |
Token ID | 21189 |
Feature activation | +4.39e-01 |
Pos logit contributions | |
Zoro | +0.289 |
ibilities | +0.263 |
ells | +0.260 |
chapter | +0.242 |
vitamins | +0.236 |
Neg logit contributions | |
ATH | -0.273 |
ares | -0.237 |
aring | -0.235 |
anamo | -0.233 |
ARE | -0.232 |
Token | - |
Token ID | 12 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
ATH | +3.780 |
aring | +3.279 |
ares | +3.269 |
anamo | +3.218 |
ARE | +3.210 |
Neg logit contributions | |
Zoro | -3.527 |
ibilities | -3.151 |
ells | -3.112 |
chapter | -2.882 |
vitamins | -2.835 |
Token | to |
Token ID | 1462 |
Feature activation | +6.23e-01 |
Pos logit contributions | |
ATH | +3.280 |
ares | +2.863 |
aring | +2.851 |
anamo | +2.816 |
ARE | +2.777 |
Neg logit contributions | |
Zoro | -3.189 |
ibilities | -2.846 |
ells | -2.774 |
chapter | -2.621 |
vitamins | -2.563 |
Token | - |
Token ID | 12 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
ATH | +4.637 |
aring | +4.078 |
ares | +4.052 |
kind | +3.891 |
aria | +3.866 |
Neg logit contributions | |
Zoro | -5.502 |
ibilities | -5.003 |
ells | -4.830 |
vitamins | -4.662 |
Directions | -4.596 |
Token | toe |
Token ID | 44579 |
Feature activation | +7.40e-01 |
Pos logit contributions | |
ATH | +2.384 |
ares | +1.648 |
aria | +1.534 |
toes | +1.501 |
kind | +1.483 |
Neg logit contributions | |
Zoro | -21.330 |
ibilities | -19.991 |
vitamins | -19.410 |
Directions | -19.356 |
chapter | -19.273 |
Token | with |
Token ID | 351 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
ATH | +4.867 |
Stacy | +4.117 |
ares | +4.111 |
aring | +4.088 |
Mehran | +4.023 |
Neg logit contributions | |
Zoro | -6.933 |
ibilities | -6.643 |
ells | -6.526 |
chapter | -5.977 |
vitamins | -5.936 |
Token | the |
Token ID | 262 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
ATH | +1.338 |
ares | +1.151 |
Stacy | +1.147 |
aring | +1.143 |
anamo | +1.132 |
Neg logit contributions | |
Zoro | -1.422 |
ibilities | -1.314 |
ells | -1.290 |
chapter | -1.189 |
ible | -1.172 |
Token | world |
Token ID | 995 |
Feature activation | -4.56e-01 |
Pos logit contributions | |
ATH | +1.921 |
ares | +1.656 |
Stacy | +1.653 |
aring | +1.649 |
aldi | +1.626 |
Neg logit contributions | |
Zoro | -1.928 |
ibilities | -1.775 |
ells | -1.740 |
chapter | -1.586 |
ible | -1.572 |
Token | � |
Token ID | 447 |
Feature activation | +3.15e-02 |
Pos logit contributions | |
Zoro | +3.437 |
ibilities | +2.994 |
ells | +2.971 |
chapter | +2.825 |
vitamins | +2.704 |
Neg logit contributions | |
ATH | -4.144 |
anamo | -3.722 |
ares | -3.676 |
aring | -3.626 |
ARE | -3.622 |
Token | 26 |
Token ID | 2608 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
ATH | +0.999 |
ares | +0.880 |
aring | +0.874 |
aldi | +0.863 |
ARE | +0.861 |
Neg logit contributions | |
Zoro | -0.901 |
ibilities | -0.828 |
ells | -0.812 |
chapter | -0.734 |
vitamins | -0.727 |
Token | and |
Token ID | 290 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
ATH | +1.483 |
ares | +1.298 |
aring | +1.294 |
anamo | +1.280 |
ARE | +1.276 |
Neg logit contributions | |
Zoro | -1.340 |
ibilities | -1.203 |
ells | -1.187 |
chapter | -1.098 |
vitamins | -1.077 |
Token | includes |
Token ID | 3407 |
Feature activation | +4.01e-01 |
Pos logit contributions | |
ATH | +0.801 |
ares | +0.695 |
aring | +0.691 |
ARE | +0.681 |
anamo | +0.681 |
Neg logit contributions | |
Zoro | -0.869 |
ibilities | -0.799 |
ells | -0.788 |
chapter | -0.729 |
ible | -0.714 |
Token | " |
Token ID | 366 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
ATH | +3.384 |
ares | +3.007 |
aring | +2.975 |
Stacy | +2.974 |
aldi | +2.941 |
Neg logit contributions | |
Zoro | -3.174 |
ibilities | -2.923 |
ells | -2.862 |
ible | -2.592 |
chapter | -2.588 |
Token | A |
Token ID | 32 |
Feature activation | -5.21e-02 |
Pos logit contributions | |
ATH | +0.875 |
ares | +0.748 |
aring | +0.742 |
ARE | +0.739 |
anamo | +0.736 |
Neg logit contributions | |
Zoro | -1.007 |
ibilities | -0.919 |
ells | -0.903 |
chapter | -0.848 |
vitamins | -0.830 |
Token | Christmas |
Token ID | 6786 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
Zoro | +0.383 |
ibilities | +0.342 |
ells | +0.336 |
chapter | +0.310 |
vitamins | +0.301 |
Neg logit contributions | |
ATH | -0.489 |
ares | -0.432 |
aring | -0.430 |
anamo | -0.430 |
ARE | -0.425 |
Token | Story |
Token ID | 8362 |
Feature activation | +2.93e-01 |
Pos logit contributions | |
ATH | +8.031 |
Stacy | +7.828 |
aring | +7.219 |
ares | +7.190 |
kind | +7.124 |
Neg logit contributions | |
ibilities | -13.761 |
Zoro | -13.501 |
ells | -13.273 |
ibly | -11.676 |
vitamins | -11.518 |
Token | " |
Token ID | 1 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
ATH | +2.466 |
ares | +2.174 |
aring | +2.152 |
ARE | +2.121 |
Stacy | +2.111 |
Neg logit contributions | |
Zoro | -2.392 |
ibilities | -2.199 |
ells | -2.150 |
chapter | -1.955 |
vitamins | -1.943 |
Token | and |
Token ID | 290 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
ATH | +1.459 |
ares | +1.278 |
aring | +1.272 |
anamo | +1.261 |
ARE | +1.254 |
Neg logit contributions | |
Zoro | -1.353 |
ibilities | -1.226 |
ells | -1.207 |
chapter | -1.102 |
ible | -1.090 |
Token | " |
Token ID | 366 |
Feature activation | +3.60e-03 |
Pos logit contributions | |
ATH | +2.219 |
ares | +1.965 |
aring | +1.952 |
anamo | +1.949 |
ARE | +1.933 |
Neg logit contributions | |
Zoro | -1.750 |
ibilities | -1.558 |
ells | -1.536 |
chapter | -1.413 |
ible | -1.372 |
Token | Mir |
Token ID | 27453 |
Feature activation | -6.52e-01 |
Pos logit contributions | |
ATH | +0.028 |
ares | +0.024 |
aring | +0.024 |
anamo | +0.024 |
ARE | +0.024 |
Neg logit contributions | |
Zoro | -0.032 |
ibilities | -0.029 |
ells | -0.029 |
chapter | -0.027 |
vitamins | -0.027 |
Token | George |
Token ID | 4502 |
Feature activation | +7.42e-01 |
Pos logit contributions | |
ATH | +2.424 |
ares | +2.114 |
Stacy | +2.107 |
anamo | +2.099 |
aring | +2.093 |
Neg logit contributions | |
Zoro | -2.463 |
ibilities | -2.289 |
ells | -2.238 |
chapter | -2.029 |
vitamins | -2.011 |
Token | Soros |
Token ID | 27900 |
Feature activation | -5.95e-02 |
Pos logit contributions | |
ATH | +3.879 |
Stacy | +3.322 |
aring | +3.133 |
ares | +3.100 |
ARE | +3.075 |
Neg logit contributions | |
Zoro | -8.093 |
ibilities | -7.580 |
ells | -7.510 |
chapter | -7.046 |
vitamins | -6.961 |
Token | 's |
Token ID | 338 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
Zoro | +0.461 |
ibilities | +0.412 |
ells | +0.407 |
chapter | +0.377 |
vitamins | +0.366 |
Neg logit contributions | |
ATH | -0.535 |
ares | -0.470 |
anamo | -0.468 |
aring | -0.467 |
ARE | -0.463 |
Token | pre |
Token ID | 662 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
ATH | +1.738 |
ares | +1.536 |
aring | +1.521 |
anamo | +1.514 |
Stacy | +1.507 |
Neg logit contributions | |
Zoro | -1.598 |
ibilities | -1.451 |
ells | -1.421 |
chapter | -1.292 |
vitamins | -1.273 |
Token | - |
Token ID | 12 |
Feature activation | +9.21e-01 |
Pos logit contributions | |
ATH | +3.277 |
aring | +2.890 |
ares | +2.878 |
anamo | +2.831 |
aryl | +2.817 |
Neg logit contributions | |
Zoro | -3.202 |
ibilities | -2.861 |
ells | -2.814 |
chapter | -2.629 |
vitamins | -2.561 |
Token | tax |
Token ID | 19290 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
ATH | +6.651 |
Bern | +5.612 |
ares | +5.573 |
aring | +5.559 |
anamo | +5.555 |
Neg logit contributions | |
Zoro | -8.361 |
ibilities | -7.720 |
ells | -7.329 |
chapter | -6.952 |
vitamins | -6.853 |
Token | dollars |
Token ID | 5054 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
ATH | +11.150 |
ares | +10.124 |
aring | +9.885 |
ARE | +9.765 |
foundation | +9.577 |
Neg logit contributions | |
Zoro | -11.283 |
ibilities | -10.464 |
ells | -10.288 |
vitamins | -8.797 |
chapter | -8.556 |
Token | . |
Token ID | 13 |
Feature activation | +5.45e-02 |
Pos logit contributions | |
ATH | +1.004 |
ares | +0.878 |
aring | +0.873 |
ARE | +0.867 |
anamo | +0.867 |
Neg logit contributions | |
Zoro | -0.917 |
ibilities | -0.824 |
ells | -0.814 |
chapter | -0.746 |
vitamins | -0.736 |
Token | See |
Token ID | 4091 |
Feature activation | -3.03e-02 |
Pos logit contributions | |
ATH | +0.470 |
ares | +0.410 |
aring | +0.407 |
anamo | +0.407 |
ARE | +0.405 |
Neg logit contributions | |
Zoro | -0.439 |
ibilities | -0.400 |
ells | -0.393 |
chapter | -0.362 |
vitamins | -0.356 |
Token | earlier |
Token ID | 2961 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
Zoro | +0.242 |
ibilities | +0.217 |
ells | +0.215 |
chapter | +0.198 |
vitamins | +0.194 |
Neg logit contributions | |
ATH | -0.265 |
ares | -0.233 |
aring | -0.232 |
anamo | -0.231 |
ARE | -0.230 |
Token | Mark |
Token ID | 2940 |
Feature activation | +4.07e-01 |
Pos logit contributions | |
ATH | +1.393 |
ares | +1.223 |
aring | +1.212 |
anamo | +1.207 |
ARE | +1.204 |
Neg logit contributions | |
Zoro | -1.306 |
ibilities | -1.185 |
ells | -1.173 |
vitamins | -1.059 |
chapter | -1.056 |
Token | organic |
Token ID | 10469 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
Zoro | +0.210 |
ibilities | +0.190 |
ells | +0.188 |
chapter | +0.175 |
ible | +0.170 |
Neg logit contributions | |
ATH | -0.198 |
ares | -0.173 |
aring | -0.171 |
ARE | -0.170 |
anamo | -0.170 |
Token | consumer |
Token ID | 7172 |
Feature activation | -2.89e-01 |
Pos logit contributions | |
ATH | +3.589 |
ares | +3.140 |
aring | +3.122 |
aryl | +3.102 |
ARE | +3.084 |
Neg logit contributions | |
Zoro | -3.592 |
ells | -3.236 |
ibilities | -3.218 |
chapter | -2.883 |
| -2.780 |
Token | demand |
Token ID | 3512 |
Feature activation | -6.10e-01 |
Pos logit contributions | |
Zoro | +2.191 |
ibilities | +1.937 |
ells | +1.902 |
chapter | +1.806 |
vitamins | +1.760 |
Neg logit contributions | |
ATH | -2.630 |
anamo | -2.354 |
ares | -2.322 |
aring | -2.315 |
ARE | -2.285 |
Token | . |
Token ID | 13 |
Feature activation | +5.32e-01 |
Pos logit contributions | |
Zoro | +4.424 |
ibilities | +3.900 |
ells | +3.779 |
chapter | +3.633 |
vitamins | +3.538 |
Neg logit contributions | |
ATH | -5.670 |
anamo | -5.152 |
ares | -4.988 |
aring | -4.956 |
Mehran | -4.951 |
Token | It |
Token ID | 632 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
ATH | +4.272 |
ares | +3.752 |
Stacy | +3.746 |
ARE | +3.725 |
aring | +3.723 |
Neg logit contributions | |
Zoro | -4.339 |
ibilities | -4.171 |
ells | -4.008 |
ibly | -3.641 |
chapter | -3.639 |
Token | has |
Token ID | 468 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
ATH | +6.892 |
aring | +6.268 |
ares | +6.218 |
Mehran | +5.917 |
aria | +5.909 |
Neg logit contributions | |
Zoro | -8.935 |
ibilities | -8.376 |
ells | -7.865 |
Directions | -7.328 |
vitamins | -7.287 |
Token | been |
Token ID | 587 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
ATH | +9.119 |
aring | +8.027 |
aria | +7.765 |
ares | +7.681 |
Stacy | +7.611 |
Neg logit contributions | |
Zoro | -12.799 |
ibilities | -12.128 |
ells | -11.918 |
Directions | -10.792 |
vitamins | -10.660 |
Token | attained |
Token ID | 28681 |
Feature activation | +3.09e-01 |
Pos logit contributions | |
ATH | +9.299 |
aring | +8.137 |
ares | +8.061 |
Stacy | +7.985 |
aria | +7.908 |
Neg logit contributions | |
Zoro | -9.384 |
ibilities | -8.844 |
ells | -8.660 |
vitamins | -7.500 |
Directions | -7.438 |
Token | by |
Token ID | 416 |
Feature activation | +6.17e-01 |
Pos logit contributions | |
ATH | +2.636 |
ares | +2.297 |
aring | +2.290 |
anamo | +2.255 |
aryl | +2.248 |
Neg logit contributions | |
Zoro | -2.499 |
ibilities | -2.264 |
ells | -2.238 |
chapter | -2.057 |
vitamins | -2.011 |
Token | gaming |
Token ID | 7776 |
Feature activation | +8.98e-02 |
Pos logit contributions | |
ATH | +4.875 |
aring | +4.257 |
ares | +4.247 |
aryl | +4.187 |
Stacy | +4.155 |
Neg logit contributions | |
Zoro | -5.116 |
ibilities | -4.765 |
ells | -4.632 |
ible | -4.164 |
chapter | -4.136 |
Token | the |
Token ID | 262 |
Feature activation | +4.39e-01 |
Pos logit contributions | |
ATH | +0.778 |
ares | +0.682 |
aring | +0.676 |
ARE | +0.673 |
aryl | +0.667 |
Neg logit contributions | |
Zoro | -0.723 |
ibilities | -0.648 |
ells | -0.643 |
chapter | -0.595 |
vitamins | -0.575 |
Token | got |
Token ID | 1392 |
Feature activation | -3.65e-01 |
Pos logit contributions | |
ATH | +0.205 |
ares | +0.179 |
aring | +0.178 |
ARE | +0.175 |
anamo | +0.175 |
Neg logit contributions | |
Zoro | -0.204 |
ibilities | -0.184 |
ells | -0.182 |
chapter | -0.169 |
ible | -0.164 |
Token | it |
Token ID | 340 |
Feature activation | -7.08e-01 |
Pos logit contributions | |
Zoro | +2.767 |
ibilities | +2.412 |
ells | +2.387 |
chapter | +2.271 |
vitamins | +2.197 |
Neg logit contributions | |
ATH | -3.356 |
anamo | -2.980 |
ares | -2.944 |
aring | -2.926 |
aryl | -2.911 |
Token | . |
Token ID | 13 |
Feature activation | +9.87e-02 |
Pos logit contributions | |
Zoro | +5.089 |
ells | +4.331 |
ibilities | +4.319 |
chapter | +4.158 |
ible | +3.995 |
Neg logit contributions | |
ATH | -6.640 |
anamo | -6.025 |
ares | -5.842 |
ARE | -5.801 |
aryl | -5.771 |
Token | If |
Token ID | 1002 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
ATH | +0.848 |
ares | +0.738 |
aring | +0.733 |
ARE | +0.730 |
Stacy | +0.729 |
Neg logit contributions | |
Zoro | -0.790 |
ibilities | -0.735 |
ells | -0.719 |
chapter | -0.653 |
vitamins | -0.651 |
Token | a |
Token ID | 257 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
ATH | +0.964 |
ares | +0.850 |
aring | +0.846 |
anamo | +0.844 |
ARE | +0.837 |
Neg logit contributions | |
Zoro | -0.782 |
ibilities | -0.699 |
ells | -0.692 |
chapter | -0.634 |
ible | -0.616 |
Token | fairy |
Token ID | 25607 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
ATH | +1.358 |
aring | +1.187 |
ares | +1.186 |
ARE | +1.171 |
anamo | +1.167 |
Neg logit contributions | |
Zoro | -1.159 |
ibilities | -1.066 |
ells | -1.053 |
chapter | -0.937 |
ible | -0.929 |
Token | had |
Token ID | 550 |
Feature activation | +2.56e-01 |
Pos logit contributions | |
ATH | +11.314 |
aring | +10.279 |
kind | +10.184 |
Stacy | +10.049 |
ares | +10.044 |
Neg logit contributions | |
ibilities | -9.962 |
Zoro | -9.956 |
ells | -9.440 |
ible | -8.362 |
ibly | -8.162 |
Token | come |
Token ID | 1282 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
ATH | +2.181 |
ares | +1.913 |
aring | +1.908 |
Stacy | +1.880 |
ARE | +1.868 |
Neg logit contributions | |
Zoro | -2.027 |
ibilities | -1.883 |
ells | -1.857 |
chapter | -1.657 |
ible | -1.651 |
Token | and |
Token ID | 290 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
ATH | +1.881 |
aring | +1.669 |
ares | +1.653 |
Stacy | +1.609 |
ARE | +1.600 |
Neg logit contributions | |
Zoro | -1.960 |
ibilities | -1.827 |
ells | -1.798 |
chapter | -1.626 |
ible | -1.613 |
Token | offered |
Token ID | 4438 |
Feature activation | +6.63e-02 |
Pos logit contributions | |
ATH | +3.004 |
aring | +2.671 |
ares | +2.656 |
Stacy | +2.620 |
ARE | +2.582 |
Neg logit contributions | |
Zoro | -2.719 |
ibilities | -2.585 |
ells | -2.518 |
ible | -2.253 |
chapter | -2.210 |
Token | to |
Token ID | 284 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
ATH | +0.622 |
ares | +0.550 |
aring | +0.547 |
anamo | +0.544 |
ARE | +0.541 |
Neg logit contributions | |
Zoro | -0.483 |
ibilities | -0.433 |
ells | -0.428 |
chapter | -0.390 |
ible | -0.379 |
Token | discern |
Token ID | 22024 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
Zoro | +3.492 |
ibilities | +3.150 |
ells | +3.111 |
chapter | +2.924 |
vitamins | +2.836 |
Neg logit contributions | |
ATH | -3.392 |
anamo | -2.945 |
ares | -2.944 |
aring | -2.922 |
ARE | -2.898 |
Token | the |
Token ID | 262 |
Feature activation | -9.18e-01 |
Pos logit contributions | |
Zoro | +2.087 |
ibilities | +1.866 |
ells | +1.845 |
chapter | +1.693 |
vitamins | +1.650 |
Neg logit contributions | |
ATH | -2.466 |
ares | -2.169 |
aring | -2.158 |
ARE | -2.137 |
anamo | -2.130 |
Token | size |
Token ID | 2546 |
Feature activation | +6.18e-01 |
Pos logit contributions | |
Zoro | +4.268 |
ibilities | +3.558 |
ells | +3.454 |
chapter | +3.406 |
ible | +3.178 |
Neg logit contributions | |
ATH | -10.605 |
anamo | -10.062 |
aldi | -9.647 |
aryl | -9.628 |
merce | -9.581 |
Token | of |
Token ID | 286 |
Feature activation | +3.71e-01 |
Pos logit contributions | |
ATH | +4.073 |
ares | +3.416 |
aring | +3.385 |
ARE | +3.356 |
Mehran | +3.336 |
Neg logit contributions | |
Zoro | -5.781 |
ibilities | -5.594 |
ells | -5.484 |
vitamins | -5.034 |
utor | -4.952 |
Token | individual |
Token ID | 1981 |
Feature activation | -4.54e-01 |
Pos logit contributions | |
ATH | +2.773 |
ares | +2.388 |
aring | +2.385 |
aryl | +2.344 |
ARE | +2.340 |
Neg logit contributions | |
Zoro | -3.354 |
ibilities | -3.084 |
ells | -2.964 |
vitamins | -2.721 |
chapter | -2.681 |
Token | pixels |
Token ID | 17848 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
Zoro | +3.308 |
ibilities | +2.931 |
ells | +2.897 |
chapter | +2.678 |
vitamins | +2.592 |
Neg logit contributions | |
ATH | -4.285 |
ares | -3.786 |
anamo | -3.779 |
aring | -3.765 |
ARE | -3.738 |
Token | due |
Token ID | 2233 |
Feature activation | +4.06e-01 |
Pos logit contributions | |
ATH | +6.671 |
aring | +5.463 |
ares | +5.147 |
aldi | +5.037 |
Mehran | +4.959 |
Neg logit contributions | |
Zoro | -15.432 |
ibilities | -14.500 |
ells | -14.438 |
ible | -13.456 |
ibly | -13.343 |
Token | to |
Token ID | 284 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
ATH | +3.004 |
aring | +2.561 |
ares | +2.544 |
aria | +2.525 |
Stacy | +2.496 |
Neg logit contributions | |
Zoro | -3.640 |
ibilities | -3.430 |
ells | -3.326 |
vitamins | -3.031 |
ible | -2.957 |
Token | the |
Token ID | 262 |
Feature activation | +5.17e-01 |
Pos logit contributions | |
ATH | +1.162 |
ares | +1.007 |
aring | +0.999 |
ARE | +0.987 |
Stacy | +0.977 |
Neg logit contributions | |
Zoro | -1.146 |
ibilities | -1.052 |
ells | -1.030 |
vitamins | -0.924 |
chapter | -0.921 |
Token | amount |
Token ID | 2033 |
Feature activation | +9.05e-02 |
Pos logit contributions | |
ATH | +3.078 |
aring | +2.612 |
ares | +2.596 |
kind | +2.476 |
ARE | +2.464 |
Neg logit contributions | |
Zoro | -5.482 |
ibilities | -4.965 |
ells | -4.937 |
vitamins | -4.533 |
utor | -4.526 |
Token | they |
Token ID | 484 |
Feature activation | -2.88e-02 |
Pos logit contributions | |
ATH | +0.772 |
ares | +0.683 |
aring | +0.672 |
ARE | +0.666 |
Mehran | +0.659 |
Neg logit contributions | |
Zoro | -0.731 |
ibilities | -0.656 |
ells | -0.649 |
chapter | -0.594 |
ible | -0.580 |
Token | site |
Token ID | 2524 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
ATH | +0.305 |
ares | +0.270 |
aring | +0.269 |
anamo | +0.268 |
ARE | +0.266 |
Neg logit contributions | |
Zoro | -0.237 |
ibilities | -0.210 |
ells | -0.207 |
chapter | -0.191 |
vitamins | -0.185 |
Token | C |
Token ID | 327 |
Feature activation | +4.75e-01 |
Pos logit contributions | |
Zoro | +2.943 |
ibilities | +2.630 |
ells | +2.609 |
chapter | +2.474 |
vitamins | +2.376 |
Neg logit contributions | |
ATH | -3.019 |
anamo | -2.654 |
ares | -2.629 |
aryl | -2.593 |
aring | -2.592 |
Token | NET |
Token ID | 12884 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
ATH | +3.948 |
aring | +3.515 |
ares | +3.479 |
aryl | +3.366 |
ARE | +3.362 |
Neg logit contributions | |
Zoro | -4.135 |
ells | -3.510 |
ibilities | -3.508 |
chapter | -3.327 |
vitamins | -3.217 |
Token | 's |
Token ID | 338 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
ATH | +3.123 |
aring | +2.712 |
ares | +2.703 |
ARE | +2.695 |
anamo | +2.663 |
Neg logit contributions | |
Zoro | -3.100 |
ibilities | -2.810 |
ells | -2.729 |
chapter | -2.518 |
ibly | -2.504 |
Token | in |
Token ID | 287 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
ATH | +9.182 |
Stacy | +8.405 |
aring | +8.231 |
ARE | +8.189 |
ares | +8.165 |
Neg logit contributions | |
Zoro | -10.063 |
ells | -9.207 |
ibilities | -9.188 |
ibly | -8.406 |
vitamins | -8.164 |
Token | - |
Token ID | 12 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
ATH | +4.227 |
aring | +3.743 |
ares | +3.684 |
ARE | +3.622 |
Stacy | +3.583 |
Neg logit contributions | |
Zoro | -4.084 |
ibilities | -3.644 |
ells | -3.588 |
vitamins | -3.302 |
chapter | -3.288 |
Token | depth |
Token ID | 18053 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
ATH | +4.725 |
kind | +4.164 |
aring | +3.566 |
ARE | +3.389 |
ares | +3.310 |
Neg logit contributions | |
Zoro | -17.789 |
ibilities | -16.322 |
ells | -15.706 |
vitamins | -15.562 |
ibly | -15.411 |
Token | coverage |
Token ID | 5197 |
Feature activation | +4.76e-01 |
Pos logit contributions | |
ATH | +8.840 |
Stacy | +7.690 |
ARE | +7.538 |
aring | +7.528 |
aldi | +7.426 |
Neg logit contributions | |
Zoro | -10.761 |
ibilities | -9.979 |
ells | -9.865 |
ibly | -9.218 |
utor | -8.831 |
Token | . |
Token ID | 13 |
Feature activation | -7.81e-02 |
Pos logit contributions | |
ATH | +3.788 |
aring | +3.307 |
ares | +3.263 |
ARE | +3.237 |
Stacy | +3.212 |
Neg logit contributions | |
Zoro | -4.068 |
ibilities | -3.673 |
ells | -3.653 |
vitamins | -3.324 |
ibly | -3.300 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +6.74e-01 |
Pos logit contributions | |
Zoro | +0.616 |
ibilities | +0.551 |
ells | +0.544 |
chapter | +0.509 |
ible | +0.493 |
Neg logit contributions | |
ATH | -0.690 |
ares | -0.606 |
anamo | -0.605 |
aring | -0.601 |
ARE | -0.595 |
Token | After |
Token ID | 3260 |
Feature activation | +4.65e-02 |
Pos logit contributions | |
ATH | +5.332 |
ARE | +4.503 |
ares | +4.385 |
aring | +4.373 |
Bern | +4.330 |
Neg logit contributions | |
Zoro | -5.966 |
ibilities | -5.401 |
ells | -5.288 |
chapter | -4.975 |
vitamins | -4.924 |
Token | picking |
Token ID | 10868 |
Feature activation | +2.21e-01 |
Pos logit contributions | |
ATH | +1.828 |
aring | +1.604 |
ares | +1.579 |
aldi | +1.557 |
Stacy | +1.549 |
Neg logit contributions | |
Zoro | -1.875 |
ibilities | -1.762 |
ells | -1.709 |
chapter | -1.545 |
ible | -1.541 |
Token | up |
Token ID | 510 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
ATH | +1.704 |
aring | +1.456 |
ares | +1.455 |
aldi | +1.428 |
ARE | +1.427 |
Neg logit contributions | |
Zoro | -1.973 |
ibilities | -1.802 |
ells | -1.778 |
chapter | -1.656 |
ible | -1.625 |
Token | on |
Token ID | 319 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
ATH | +2.146 |
ares | +1.842 |
aring | +1.840 |
aldi | +1.810 |
ARE | +1.803 |
Neg logit contributions | |
Zoro | -2.545 |
ibilities | -2.340 |
ells | -2.308 |
chapter | -2.141 |
ible | -2.103 |
Token | Zen |
Token ID | 14760 |
Feature activation | +8.66e-02 |
Pos logit contributions | |
ATH | +1.947 |
ares | +1.708 |
aring | +1.703 |
anamo | +1.681 |
aldi | +1.679 |
Neg logit contributions | |
Zoro | -1.768 |
ibilities | -1.599 |
ells | -1.577 |
chapter | -1.452 |
ible | -1.415 |
Token | and |
Token ID | 290 |
Feature activation | +2.92e-01 |
Pos logit contributions | |
ATH | +0.819 |
ares | +0.726 |
aring | +0.722 |
anamo | +0.720 |
ARE | +0.715 |
Neg logit contributions | |
Zoro | -0.626 |
ibilities | -0.559 |
ells | -0.550 |
chapter | -0.506 |
vitamins | -0.490 |
Token | so |
Token ID | 523 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
ATH | +2.462 |
aring | +2.158 |
ares | +2.149 |
aldi | +2.115 |
Stacy | +2.114 |
Neg logit contributions | |
Zoro | -2.327 |
ibilities | -2.159 |
ells | -2.123 |
chapter | -1.932 |
ible | -1.903 |
Token | on |
Token ID | 319 |
Feature activation | +8.89e-01 |
Pos logit contributions | |
ATH | +8.385 |
aring | +7.473 |
ares | +7.079 |
aldi | +6.928 |
aryl | +6.927 |
Neg logit contributions | |
Zoro | -13.817 |
ibilities | -12.823 |
ells | -12.294 |
chapter | -11.666 |
ible | -11.596 |
Token | . |
Token ID | 13 |
Feature activation | +2.55e-01 |
Pos logit contributions | |
ATH | +6.836 |
aring | +5.989 |
ares | +5.881 |
aldi | +5.813 |
aryl | +5.795 |
Neg logit contributions | |
Zoro | -7.364 |
ibilities | -6.733 |
ells | -6.561 |
chapter | -5.990 |
vitamins | -5.946 |
Token |
|
Token ID | 198 |
Feature activation | +3.90e-01 |
Pos logit contributions | |
ATH | +2.167 |
ares | +1.881 |
aring | +1.880 |
Stacy | +1.868 |
ARE | +1.859 |
Neg logit contributions | |
Zoro | -2.032 |
ibilities | -1.916 |
ells | -1.849 |
chapter | -1.700 |
vitamins | -1.685 |
Token |
|
Token ID | 198 |
Feature activation | +3.57e-02 |
Pos logit contributions | |
ATH | +3.156 |
ares | +2.705 |
aring | +2.679 |
ARE | +2.675 |
kind | +2.666 |
Neg logit contributions | |
Zoro | -3.282 |
ibilities | -3.072 |
ells | -2.928 |
vitamins | -2.727 |
ibly | -2.637 |
Token | Q |
Token ID | 48 |
Feature activation | +7.28e-02 |
Pos logit contributions | |
ATH | +0.282 |
ares | +0.240 |
ARE | +0.239 |
aring | +0.239 |
anamo | +0.236 |
Neg logit contributions | |
Zoro | -0.319 |
ibilities | -0.290 |
ells | -0.285 |
chapter | -0.268 |
vitamins | -0.262 |
Token | . |
Token ID | 13 |
Feature activation | +2.57e-02 |
Pos logit contributions | |
Zoro | +2.376 |
ibilities | +2.060 |
ells | +2.049 |
chapter | +1.946 |
ible | +1.862 |
Neg logit contributions | |
ATH | -2.990 |
anamo | -2.660 |
ares | -2.625 |
aldi | -2.595 |
ARE | -2.586 |
Token |
|
Token ID | 198 |
Feature activation | +5.37e-01 |
Pos logit contributions | |
ATH | +0.246 |
ares | +0.217 |
anamo | +0.217 |
aring | +0.215 |
ARE | +0.215 |
Neg logit contributions | |
Zoro | -0.186 |
ibilities | -0.163 |
ells | -0.162 |
chapter | -0.149 |
vitamins | -0.144 |
Token |
|
Token ID | 198 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
ATH | +4.175 |
aring | +3.543 |
ares | +3.541 |
ARE | +3.520 |
kind | +3.506 |
Neg logit contributions | |
Zoro | -4.581 |
ibilities | -4.314 |
ells | -4.137 |
vitamins | -3.872 |
ibly | -3.757 |
Token | ( |
Token ID | 7 |
Feature activation | +2.57e-01 |
Pos logit contributions | |
ATH | +1.127 |
ares | +0.960 |
aring | +0.955 |
ARE | +0.955 |
anamo | +0.934 |
Neg logit contributions | |
Zoro | -1.285 |
ibilities | -1.172 |
ells | -1.151 |
chapter | -1.083 |
vitamins | -1.057 |
Token | Reporting |
Token ID | 42159 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
ATH | +1.656 |
aring | +1.362 |
ares | +1.359 |
ARE | +1.351 |
anamo | +1.330 |
Neg logit contributions | |
Zoro | -2.658 |
ibilities | -2.431 |
ells | -2.411 |
chapter | -2.298 |
vitamins | -2.249 |
Token | by |
Token ID | 416 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
ATH | +2.922 |
ares | +2.582 |
Stacy | +2.560 |
aring | +2.553 |
ARE | +2.540 |
Neg logit contributions | |
Zoro | -2.518 |
ibilities | -2.274 |
ells | -2.254 |
chapter | -2.040 |
ible | -2.012 |
Token | Z |
Token ID | 1168 |
Feature activation | +2.15e-01 |
Pos logit contributions | |
ATH | +10.333 |
Stacy | +9.480 |
Mehran | +9.401 |
ares | +8.885 |
aring | +8.834 |
Neg logit contributions | |
ibilities | -10.564 |
Zoro | -10.443 |
ells | -10.316 |
ible | -9.341 |
ibly | -9.327 |
Token | ey |
Token ID | 2959 |
Feature activation | -6.71e-02 |
Pos logit contributions | |
ATH | +1.746 |
ares | +1.539 |
aring | +1.524 |
aryl | +1.503 |
aldi | +1.501 |
Neg logit contributions | |
Zoro | -1.838 |
ibilities | -1.652 |
ells | -1.622 |
chapter | -1.532 |
vitamins | -1.495 |
Token | ad |
Token ID | 324 |
Feature activation | +5.37e-01 |
Pos logit contributions | |
Zoro | +0.626 |
ibilities | +0.570 |
ells | +0.564 |
chapter | +0.532 |
vitamins | +0.520 |
Neg logit contributions | |
ATH | -0.496 |
ares | -0.425 |
anamo | -0.422 |
aring | -0.422 |
ARE | -0.416 |
Token | Mas |
Token ID | 11066 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
ATH | +4.346 |
ares | +3.862 |
aring | +3.810 |
Mehran | +3.754 |
aria | +3.752 |
Neg logit contributions | |
Zoro | -4.364 |
ibilities | -4.054 |
ells | -3.952 |
chapter | -3.711 |
vitamins | -3.688 |
Token | ro |
Token ID | 305 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
ATH | +2.522 |
ares | +2.231 |
aring | +2.201 |
anamo | +2.167 |
aldi | +2.163 |
Neg logit contributions | |
Zoro | -2.971 |
ibilities | -2.677 |
ells | -2.638 |
chapter | -2.494 |
vitamins | -2.450 |
Token | � |
Token ID | 447 |
Feature activation | +4.22e-02 |
Pos logit contributions | |
ATH | +2.783 |
ares | +2.422 |
aring | +2.408 |
anamo | +2.345 |
ARE | +2.344 |
Neg logit contributions | |
Zoro | -2.794 |
ibilities | -2.536 |
ells | -2.436 |
chapter | -2.282 |
ible | -2.243 |
Token | � |
Token ID | 247 |
Feature activation | -2.52e-01 |
Pos logit contributions | |
ATH | +0.242 |
ares | +0.196 |
aring | +0.192 |
aldi | +0.188 |
ARE | +0.188 |
Neg logit contributions | |
Zoro | -0.470 |
ibilities | -0.435 |
ells | -0.429 |
chapter | -0.406 |
vitamins | -0.401 |
Token | s |
Token ID | 82 |
Feature activation | +5.66e-01 |
Pos logit contributions | |
Zoro | +2.298 |
ibilities | +2.088 |
ells | +2.064 |
chapter | +1.943 |
vitamins | +1.894 |
Neg logit contributions | |
ATH | -1.919 |
ares | -1.647 |
aring | -1.634 |
anamo | -1.633 |
ARE | -1.615 |
Token | after |
Token ID | 706 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
ATH | +4.439 |
ares | +3.852 |
aring | +3.822 |
ARE | +3.764 |
aryl | +3.696 |
Neg logit contributions | |
Zoro | -4.835 |
ibilities | -4.489 |
ells | -4.421 |
vitamins | -3.961 |
ible | -3.929 |
Token | - |
Token ID | 12 |
Feature activation | +9.79e-01 |
Pos logit contributions | |
ATH | +4.367 |
ares | +3.815 |
aring | +3.743 |
ARE | +3.639 |
aryl | +3.627 |
Neg logit contributions | |
Zoro | -5.231 |
ibilities | -4.657 |
ells | -4.643 |
ible | -4.241 |
chapter | -4.237 |
Token | tax |
Token ID | 19290 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
ATH | +4.774 |
ares | +3.778 |
aring | +3.531 |
kind | +3.488 |
ARE | +3.442 |
Neg logit contributions | |
Zoro | -11.288 |
ibilities | -10.320 |
ells | -10.208 |
chapter | -9.704 |
vitamins | -9.638 |
Token | income |
Token ID | 3739 |
Feature activation | +1.75e-03 |
Pos logit contributions | |
ATH | +9.811 |
ares | +8.307 |
aring | +8.226 |
ARE | +8.072 |
lodging | +8.055 |
Neg logit contributions | |
Zoro | -11.802 |
ells | -11.211 |
ibilities | -10.743 |
vitamins | -9.819 |
utor | -9.518 |
Token | would |
Token ID | 561 |
Feature activation | +2.44e-01 |
Pos logit contributions | |
ATH | +0.015 |
ares | +0.013 |
aring | +0.013 |
anamo | +0.013 |
ARE | +0.013 |
Neg logit contributions | |
Zoro | -0.014 |
ibilities | -0.013 |
ells | -0.013 |
chapter | -0.012 |
vitamins | -0.011 |
Token | total |
Token ID | 2472 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
ATH | +2.070 |
aring | +1.822 |
ares | +1.793 |
aryl | +1.762 |
ARE | +1.752 |
Neg logit contributions | |
Zoro | -2.014 |
ibilities | -1.785 |
ells | -1.774 |
chapter | -1.613 |
vitamins | -1.604 |
Token | $ |
Token ID | 720 |
Feature activation | +4.63e-03 |
Pos logit contributions | |
ATH | +1.306 |
ares | +1.137 |
aring | +1.127 |
ARE | +1.105 |
anamo | +1.101 |
Neg logit contributions | |
Zoro | -1.461 |
ibilities | -1.336 |
ells | -1.320 |
chapter | -1.214 |
vitamins | -1.194 |
Token | 150 |
Token ID | 8628 |
Feature activation | +5.54e-01 |
Pos logit contributions | |
ATH | +0.034 |
ares | +0.029 |
aring | +0.028 |
ARE | +0.028 |
anamo | +0.028 |
Neg logit contributions | |
Zoro | -0.044 |
ibilities | -0.040 |
ells | -0.040 |
chapter | -0.037 |
vitamins | -0.037 |
Token | than |
Token ID | 621 |
Feature activation | +4.17e-01 |
Pos logit contributions | |
ATH | +3.138 |
ares | +2.815 |
aring | +2.804 |
ARE | +2.753 |
anamo | +2.727 |
Neg logit contributions | |
Zoro | -2.594 |
ells | -2.327 |
ibilities | -2.287 |
ible | -2.045 |
chapter | -2.033 |
Token | , |
Token ID | 11 |
Feature activation | +3.10e-02 |
Pos logit contributions | |
ATH | +2.839 |
ares | +2.430 |
aring | +2.409 |
ARE | +2.399 |
Stacy | +2.383 |
Neg logit contributions | |
Zoro | -3.982 |
ibilities | -3.704 |
ells | -3.667 |
ible | -3.355 |
chapter | -3.326 |
Token | probably |
Token ID | 2192 |
Feature activation | +4.02e-01 |
Pos logit contributions | |
ATH | +0.259 |
ares | +0.226 |
aring | +0.224 |
ARE | +0.223 |
anamo | +0.222 |
Neg logit contributions | |
Zoro | -0.259 |
ibilities | -0.234 |
ells | -0.232 |
chapter | -0.213 |
vitamins | -0.209 |
Token | , |
Token ID | 11 |
Feature activation | +4.79e-01 |
Pos logit contributions | |
ATH | +3.346 |
ares | +2.944 |
aring | +2.918 |
ARE | +2.870 |
Stacy | +2.869 |
Neg logit contributions | |
Zoro | -3.287 |
ibilities | -3.006 |
ells | -2.985 |
chapter | -2.657 |
ible | -2.650 |
Token | a |
Token ID | 257 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
ATH | +3.230 |
ares | +2.736 |
aring | +2.700 |
Stacy | +2.680 |
ARE | +2.678 |
Neg logit contributions | |
Zoro | -4.627 |
ibilities | -4.304 |
ells | -4.268 |
ible | -3.888 |
vitamins | -3.862 |
Token | mid |
Token ID | 3095 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
ATH | +2.477 |
aring | +2.169 |
ares | +2.169 |
ARE | +2.147 |
Stacy | +2.143 |
Neg logit contributions | |
Zoro | -2.333 |
ibilities | -2.119 |
ells | -2.116 |
vitamins | -1.876 |
ible | -1.872 |
Token | - |
Token ID | 12 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
ATH | +9.918 |
aring | +8.912 |
ares | +8.665 |
ARE | +8.629 |
aria | +8.356 |
Neg logit contributions | |
Zoro | -11.809 |
ells | -10.660 |
ibilities | -10.651 |
vitamins | -9.705 |
ible | -9.528 |
Token | April |
Token ID | 16784 |
Feature activation | +4.71e-01 |
Pos logit contributions | |
ATH | +5.870 |
ARE | +4.700 |
aring | +4.633 |
ares | +4.588 |
Bern | +4.329 |
Neg logit contributions | |
Zoro | -14.136 |
ibilities | -12.955 |
ells | -12.749 |
vitamins | -12.088 |
ible | -11.762 |
Token | launch |
Token ID | 4219 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
ATH | +4.004 |
aring | +3.525 |
ares | +3.483 |
ARE | +3.439 |
Stacy | +3.433 |
Neg logit contributions | |
Zoro | -3.738 |
ells | -3.415 |
ibilities | -3.348 |
vitamins | -3.004 |
chapter | -3.001 |
Token | . |
Token ID | 13 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
Zoro | +1.144 |
ibilities | +1.019 |
ells | +1.007 |
chapter | +0.934 |
vitamins | +0.904 |
Neg logit contributions | |
ATH | -1.378 |
ares | -1.214 |
anamo | -1.208 |
aring | -1.207 |
ARE | -1.196 |
Token | � |
Token ID | 447 |
Feature activation | -4.33e-02 |
Pos logit contributions | |
Zoro | +0.118 |
ibilities | +0.106 |
ells | +0.105 |
chapter | +0.097 |
vitamins | +0.094 |
Neg logit contributions | |
ATH | -0.136 |
ares | -0.119 |
aring | -0.118 |
anamo | -0.118 |
ARE | -0.117 |
Token | the |
Token ID | 262 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
ATH | +3.566 |
ares | +3.114 |
aring | +3.078 |
Stacy | +3.067 |
ARE | +3.064 |
Neg logit contributions | |
Zoro | -3.193 |
ibilities | -2.945 |
ells | -2.888 |
chapter | -2.619 |
ible | -2.602 |
Token | 50 |
Token ID | 2026 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
ATH | +1.017 |
ares | +0.878 |
aring | +0.872 |
Stacy | +0.865 |
ARE | +0.863 |
Neg logit contributions | |
Zoro | -1.071 |
ibilities | -0.987 |
ells | -0.974 |
chapter | -0.889 |
ible | -0.880 |
Token | th |
Token ID | 400 |
Feature activation | -1.98e-02 |
Pos logit contributions | |
ATH | +0.729 |
ares | +0.609 |
aring | +0.605 |
Stacy | +0.588 |
ARE | +0.588 |
Neg logit contributions | |
Zoro | -1.133 |
ibilities | -1.056 |
ells | -1.037 |
chapter | -0.968 |
vitamins | -0.960 |
Token | anniversary |
Token ID | 11162 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
Zoro | +0.203 |
ibilities | +0.185 |
ells | +0.184 |
chapter | +0.175 |
ible | +0.170 |
Neg logit contributions | |
ATH | -0.130 |
anamo | -0.109 |
ares | -0.108 |
aring | -0.107 |
ARE | -0.106 |
Token | of |
Token ID | 286 |
Feature activation | -2.80e-02 |
Pos logit contributions | |
ATH | +2.934 |
ares | +2.545 |
aring | +2.537 |
anamo | +2.520 |
ARE | +2.503 |
Neg logit contributions | |
Zoro | -2.944 |
ibilities | -2.668 |
ells | -2.647 |
chapter | -2.449 |
vitamins | -2.397 |
Token | Sultan |
Token ID | 37399 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
Zoro | +0.210 |
ibilities | +0.187 |
ells | +0.185 |
chapter | +0.171 |
vitamins | +0.166 |
Neg logit contributions | |
ATH | -0.259 |
ares | -0.228 |
anamo | -0.227 |
aring | -0.227 |
ARE | -0.225 |
Token | Hassan |
Token ID | 24485 |
Feature activation | +6.55e-01 |
Pos logit contributions | |
ATH | +8.928 |
Mehran | +8.381 |
aring | +8.004 |
ares | +7.905 |
Stacy | +7.866 |
Neg logit contributions | |
Zoro | -11.559 |
ibilities | -11.183 |
ells | -11.031 |
vitamins | -10.375 |
chapter | -10.018 |
Token | al |
Token ID | 435 |
Feature activation | +3.83e-01 |
Pos logit contributions | |
ATH | +3.297 |
ares | +2.758 |
aring | +2.756 |
aldi | +2.676 |
aria | +2.642 |
Neg logit contributions | |
Zoro | -7.313 |
ibilities | -6.976 |
ells | -6.666 |
vitamins | -6.425 |
Directions | -6.338 |
Token | - |
Token ID | 12 |
Feature activation | +3.66e-01 |
Pos logit contributions | |
ATH | +3.245 |
ares | +2.874 |
aring | +2.828 |
anamo | +2.815 |
aria | +2.798 |
Neg logit contributions | |
Zoro | -3.005 |
ibilities | -2.830 |
ells | -2.753 |
chapter | -2.567 |
vitamins | -2.504 |
Token | B |
Token ID | 33 |
Feature activation | -4.33e-02 |
Pos logit contributions | |
ATH | +2.730 |
ares | +2.291 |
ARE | +2.289 |
aring | +2.276 |
Mehran | +2.208 |
Neg logit contributions | |
Zoro | -3.302 |
ibilities | -3.170 |
ells | -3.102 |
vitamins | -2.880 |
chapter | -2.872 |
Token | olk |
Token ID | 13597 |
Feature activation | -4.57e-02 |
Pos logit contributions | |
Zoro | +0.387 |
ibilities | +0.348 |
ells | +0.340 |
chapter | +0.327 |
vitamins | +0.322 |
Neg logit contributions | |
ATH | -0.339 |
ares | -0.296 |
aring | -0.295 |
aldi | -0.291 |
aryl | -0.290 |
Token | community |
Token ID | 2055 |
Feature activation | -6.14e-02 |
Pos logit contributions | |
ATH | +0.872 |
ares | +0.760 |
aring | +0.756 |
anamo | +0.748 |
ARE | +0.747 |
Neg logit contributions | |
Zoro | -0.866 |
ibilities | -0.787 |
ells | -0.776 |
chapter | -0.719 |
vitamins | -0.701 |
Token | , |
Token ID | 11 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
Zoro | +0.487 |
ibilities | +0.434 |
ells | +0.430 |
chapter | +0.402 |
vitamins | +0.390 |
Neg logit contributions | |
ATH | -0.541 |
anamo | -0.474 |
ares | -0.474 |
aring | -0.469 |
ARE | -0.467 |
Token | in |
Token ID | 287 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
ATH | +1.317 |
aring | +1.149 |
ares | +1.147 |
ARE | +1.134 |
anamo | +1.126 |
Neg logit contributions | |
Zoro | -1.300 |
ibilities | -1.195 |
ells | -1.177 |
chapter | -1.071 |
ible | -1.056 |
Token | media |
Token ID | 2056 |
Feature activation | -1.98e-01 |
Pos logit contributions | |
ATH | +2.296 |
aring | +2.001 |
ares | +1.998 |
anamo | +1.964 |
ARE | +1.960 |
Neg logit contributions | |
Zoro | -2.273 |
ibilities | -2.060 |
ells | -2.031 |
chapter | -1.853 |
ible | -1.825 |
Token | and |
Token ID | 290 |
Feature activation | +8.56e-01 |
Pos logit contributions | |
Zoro | +1.516 |
ibilities | +1.350 |
ells | +1.334 |
chapter | +1.251 |
vitamins | +1.208 |
Neg logit contributions | |
ATH | -1.794 |
anamo | -1.581 |
ares | -1.568 |
aring | -1.551 |
aldi | -1.547 |
Token | so |
Token ID | 523 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ATH | +6.361 |
aring | +5.600 |
ares | +5.493 |
ARE | +5.456 |
aldi | +5.441 |
Neg logit contributions | |
Zoro | -7.160 |
ibilities | -6.723 |
ells | -6.563 |
ible | -5.718 |
ibly | -5.718 |
Token | on |
Token ID | 319 |
Feature activation | +5.59e-01 |
Pos logit contributions | |
ATH | +8.457 |
aring | +7.510 |
ares | +7.203 |
aryl | +7.082 |
aldi | +7.034 |
Neg logit contributions | |
Zoro | -13.158 |
ibilities | -11.973 |
ells | -11.599 |
chapter | -10.980 |
ible | -10.805 |
Token | , |
Token ID | 11 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
ATH | +4.595 |
aring | +4.092 |
ares | +4.066 |
ARE | +3.968 |
Stacy | +3.944 |
Neg logit contributions | |
Zoro | -4.563 |
ibilities | -4.117 |
ells | -4.029 |
chapter | -3.724 |
vitamins | -3.650 |
Token | has |
Token ID | 468 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
ATH | +1.227 |
aring | +1.075 |
ares | +1.072 |
ARE | +1.055 |
anamo | +1.048 |
Neg logit contributions | |
Zoro | -1.214 |
ibilities | -1.110 |
ells | -1.093 |
chapter | -1.003 |
ible | -0.982 |
Token | got |
Token ID | 1392 |
Feature activation | -7.33e-02 |
Pos logit contributions | |
ATH | +1.657 |
aring | +1.445 |
ares | +1.439 |
ARE | +1.415 |
aldi | +1.414 |
Neg logit contributions | |
Zoro | -1.624 |
ibilities | -1.478 |
ells | -1.465 |
chapter | -1.334 |
ible | -1.307 |
Token | to |
Token ID | 284 |
Feature activation | +4.10e-01 |
Pos logit contributions | |
Zoro | +0.580 |
ibilities | +0.519 |
ells | +0.512 |
chapter | +0.478 |
vitamins | +0.464 |
Neg logit contributions | |
ATH | -0.647 |
ares | -0.568 |
anamo | -0.565 |
aring | -0.563 |
ARE | -0.559 |
Token | and |
Token ID | 290 |
Feature activation | +5.29e-01 |
Pos logit contributions | |
ATH | +4.181 |
Stacy | +3.658 |
ares | +3.649 |
aring | +3.639 |
aryl | +3.568 |
Neg logit contributions | |
Zoro | -4.214 |
ibilities | -3.949 |
ells | -3.887 |
chapter | -3.497 |
ible | -3.444 |
Token | you |
Token ID | 345 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
ATH | +4.330 |
aring | +3.818 |
Stacy | +3.737 |
ares | +3.711 |
aldi | +3.666 |
Neg logit contributions | |
Zoro | -4.270 |
ibilities | -3.991 |
ells | -3.954 |
chapter | -3.540 |
ible | -3.487 |
Token | will |
Token ID | 481 |
Feature activation | +3.97e-01 |
Pos logit contributions | |
ATH | +2.436 |
aring | +2.140 |
ares | +2.136 |
aldi | +2.057 |
ARE | +2.056 |
Neg logit contributions | |
Zoro | -2.552 |
ibilities | -2.335 |
ells | -2.276 |
chapter | -2.098 |
ible | -2.085 |
Token | smell |
Token ID | 8508 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
ATH | +3.472 |
aring | +3.064 |
ares | +3.025 |
Stacy | +2.986 |
aryl | +2.969 |
Neg logit contributions | |
Zoro | -3.070 |
ibilities | -2.765 |
ells | -2.738 |
chapter | -2.449 |
ible | -2.416 |
Token | the |
Token ID | 262 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
ATH | +8.909 |
Stacy | +7.853 |
aring | +7.778 |
ares | +7.551 |
aryl | +7.439 |
Neg logit contributions | |
Zoro | -9.379 |
ells | -8.833 |
ibilities | -8.733 |
utor | -7.860 |
chapter | -7.669 |
Token | scent |
Token ID | 21212 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ATH | +8.317 |
Stacy | +7.351 |
aring | +7.175 |
ares | +7.131 |
aldi | +7.112 |
Neg logit contributions | |
Zoro | -8.143 |
ibilities | -7.409 |
ells | -7.250 |
ible | -6.459 |
ibly | -6.425 |
Token | of |
Token ID | 286 |
Feature activation | +9.56e-01 |
Pos logit contributions | |
ATH | +8.668 |
aring | +7.762 |
Stacy | +7.532 |
ares | +7.466 |
aryl | +7.411 |
Neg logit contributions | |
Zoro | -11.790 |
ibilities | -10.843 |
ells | -10.649 |
utor | -9.667 |
chapter | -9.602 |
Token | burning |
Token ID | 9482 |
Feature activation | +3.78e-01 |
Pos logit contributions | |
ATH | +7.855 |
Stacy | +6.977 |
aring | +6.835 |
aldi | +6.660 |
aryl | +6.657 |
Neg logit contributions | |
Zoro | -7.100 |
ibilities | -6.719 |
ells | -6.601 |
ibly | -5.803 |
ible | -5.780 |
Token | flesh |
Token ID | 11222 |
Feature activation | +7.54e-01 |
Pos logit contributions | |
ATH | +2.784 |
aring | +2.384 |
ares | +2.374 |
Stacy | +2.368 |
aryl | +2.357 |
Neg logit contributions | |
Zoro | -3.423 |
ibilities | -3.121 |
ells | -3.089 |
chapter | -2.876 |
ible | -2.798 |
Token | . |
Token ID | 13 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
ATH | +5.855 |
aring | +5.139 |
ares | +5.096 |
aryl | +5.074 |
aldi | +5.028 |
Neg logit contributions | |
Zoro | -6.269 |
ibilities | -5.712 |
ells | -5.562 |
chapter | -5.145 |
vitamins | -5.020 |
Token | � |
Token ID | 447 |
Feature activation | +3.49e-02 |
Pos logit contributions | |
ATH | +1.202 |
ares | +1.036 |
aring | +1.028 |
ARE | +1.027 |
Stacy | +1.022 |
Neg logit contributions | |
Zoro | -1.164 |
ibilities | -1.073 |
ells | -1.044 |
chapter | -0.964 |
vitamins | -0.945 |
Token | / |
Token ID | 1220 |
Feature activation | +9.59e-01 |
Pos logit contributions | |
ATH | +6.972 |
ares | +5.984 |
aring | +5.940 |
ARE | +5.901 |
aldi | +5.666 |
Neg logit contributions | |
Zoro | -7.942 |
ibilities | -7.223 |
ells | -7.009 |
ibly | -6.525 |
vitamins | -6.486 |
Token | Me |
Token ID | 2185 |
Feature activation | +4.06e-01 |
Pos logit contributions | |
ATH | +7.173 |
ARE | +6.093 |
ares | +6.044 |
aring | +5.953 |
aldi | +5.851 |
Neg logit contributions | |
Zoro | -8.280 |
ibilities | -7.609 |
ells | -7.463 |
ibly | -6.656 |
vitamins | -6.653 |
Token | / |
Token ID | 1220 |
Feature activation | +5.66e-01 |
Pos logit contributions | |
ATH | +3.535 |
ares | +3.119 |
ARE | +3.050 |
aring | +3.013 |
aria | +2.952 |
Neg logit contributions | |
Zoro | -3.257 |
ibilities | -2.921 |
ells | -2.812 |
chapter | -2.617 |
vitamins | -2.606 |
Token | 2000 |
Token ID | 4751 |
Feature activation | +9.24e-01 |
Pos logit contributions | |
ATH | +4.412 |
ares | +3.845 |
ARE | +3.802 |
aring | +3.799 |
aldi | +3.739 |
Neg logit contributions | |
Zoro | -4.782 |
ibilities | -4.447 |
ells | -4.349 |
chapter | -3.953 |
vitamins | -3.913 |
Token | / |
Token ID | 1220 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
ATH | +6.684 |
ares | +5.667 |
ARE | +5.632 |
aring | +5.605 |
aldi | +5.517 |
Neg logit contributions | |
Zoro | -8.166 |
ibilities | -7.575 |
ells | -7.330 |
chapter | -6.743 |
ibly | -6.707 |
Token | XP |
Token ID | 11961 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ATH | +2.830 |
ares | +2.422 |
ARE | +2.399 |
aring | +2.391 |
aldi | +2.354 |
Neg logit contributions | |
Zoro | -3.357 |
ibilities | -3.130 |
ells | -3.059 |
chapter | -2.822 |
vitamins | -2.767 |
Token | I |
Token ID | 314 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
ATH | +9.735 |
ARE | +8.085 |
ares | +8.017 |
aring | +7.940 |
aldi | +7.905 |
Neg logit contributions | |
Zoro | -11.805 |
ibilities | -11.006 |
ells | -10.710 |
ibly | -9.750 |
chapter | -9.560 |
Token |
|
Token ID | 198 |
Feature activation | +3.06e-01 |
Pos logit contributions | |
ATH | +2.770 |
ares | +2.412 |
ARE | +2.376 |
aring | +2.371 |
aldi | +2.311 |
Neg logit contributions | |
Zoro | -3.093 |
ibilities | -2.752 |
ells | -2.718 |
chapter | -2.548 |
vitamins | -2.484 |
Token |
|
Token ID | 198 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
ATH | +2.544 |
ares | +2.203 |
aring | +2.190 |
ARE | +2.178 |
aria | +2.141 |
Neg logit contributions | |
Zoro | -2.527 |
ibilities | -2.350 |
ells | -2.261 |
vitamins | -2.084 |
chapter | -2.031 |
Token | Develop |
Token ID | 19246 |
Feature activation | -3.74e-01 |
Pos logit contributions | |
ATH | +2.168 |
ARE | +1.830 |
ares | +1.828 |
aring | +1.817 |
aria | +1.753 |
Neg logit contributions | |
Zoro | -2.653 |
ibilities | -2.415 |
ells | -2.383 |
chapter | -2.238 |
vitamins | -2.192 |
Token | ed |
Token ID | 276 |
Feature activation | -3.54e-03 |
Pos logit contributions | |
Zoro | +2.837 |
ibilities | +2.521 |
ells | +2.504 |
chapter | +2.331 |
ible | +2.287 |
Neg logit contributions | |
ATH | -3.395 |
anamo | -3.012 |
ares | -2.984 |
ARE | -2.961 |
aring | -2.948 |
Token | usted |
Token ID | 8459 |
Feature activation | +7.74e-02 |
Pos logit contributions | |
Zoro | +3.483 |
ibilities | +3.180 |
ells | +3.147 |
chapter | +2.978 |
ible | +2.899 |
Neg logit contributions | |
ATH | -2.644 |
ares | -2.243 |
anamo | -2.236 |
aring | -2.225 |
ARE | -2.211 |
Token | her |
Token ID | 607 |
Feature activation | +6.49e-01 |
Pos logit contributions | |
ATH | +0.709 |
ares | +0.625 |
aring | +0.621 |
anamo | +0.620 |
ARE | +0.615 |
Neg logit contributions | |
Zoro | -0.586 |
ibilities | -0.523 |
ells | -0.516 |
chapter | -0.477 |
vitamins | -0.463 |
Token | 55 |
Token ID | 5996 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ATH | +5.134 |
ares | +4.393 |
Stacy | +4.388 |
aring | +4.365 |
aryl | +4.324 |
Neg logit contributions | |
Zoro | -5.334 |
ibilities | -5.143 |
ells | -4.937 |
ible | -4.418 |
vitamins | -4.361 |
Token | percent |
Token ID | 1411 |
Feature activation | +5.81e-01 |
Pos logit contributions | |
ATH | +6.504 |
aring | +5.333 |
ares | +5.261 |
ARE | +5.112 |
Stacy | +5.074 |
Neg logit contributions | |
Zoro | -13.124 |
ibilities | -12.299 |
ells | -12.016 |
chapter | -11.323 |
ible | -11.163 |
Token | to |
Token ID | 284 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
ATH | +4.868 |
ares | +4.216 |
aring | +4.207 |
anamo | +4.180 |
ARE | +4.144 |
Neg logit contributions | |
Zoro | -4.775 |
ibilities | -4.291 |
ells | -4.242 |
chapter | -3.939 |
vitamins | -3.855 |
Token | 39 |
Token ID | 5014 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ATH | +1.455 |
ares | +1.260 |
Stacy | +1.256 |
aring | +1.255 |
ARE | +1.233 |
Neg logit contributions | |
Zoro | -1.509 |
ibilities | -1.436 |
ells | -1.392 |
ible | -1.253 |
vitamins | -1.247 |
Token | percent |
Token ID | 1411 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
ATH | +4.472 |
ares | +3.593 |
Stacy | +3.428 |
aring | +3.367 |
ARE | +3.088 |
Neg logit contributions | |
Zoro | -16.063 |
ibilities | -15.758 |
ells | -15.415 |
ibly | -14.072 |
utor | -13.915 |
Token | . |
Token ID | 13 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
ATH | +2.103 |
ares | +1.843 |
aring | +1.834 |
anamo | +1.827 |
ARE | +1.816 |
Neg logit contributions | |
Zoro | -1.880 |
ibilities | -1.690 |
ells | -1.666 |
chapter | -1.538 |
vitamins | -1.497 |
Token | Keystone |
Token ID | 29055 |
Feature activation | -4.58e-01 |
Pos logit contributions | |
ATH | +1.938 |
ares | +1.697 |
Stacy | +1.679 |
aring | +1.679 |
ARE | +1.674 |
Neg logit contributions | |
Zoro | -1.854 |
ibilities | -1.719 |
ells | -1.672 |
chapter | -1.529 |
ible | -1.506 |
Token | is |
Token ID | 318 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
Zoro | +3.170 |
ibilities | +2.757 |
ells | +2.747 |
chapter | +2.595 |
vitamins | +2.462 |
Neg logit contributions | |
ATH | -4.413 |
anamo | -3.954 |
ares | -3.930 |
aldi | -3.897 |
ARE | -3.890 |
Token | far |
Token ID | 1290 |
Feature activation | +4.64e-01 |
Pos logit contributions | |
ATH | +1.938 |
ares | +1.694 |
aring | +1.692 |
anamo | +1.657 |
aryl | +1.649 |
Neg logit contributions | |
Zoro | -1.954 |
ibilities | -1.788 |
ells | -1.751 |
chapter | -1.594 |
ible | -1.581 |
Token | National |
Token ID | 16186 |
Feature activation | +3.13e-01 |
Pos logit contributions | |
Zoro | +0.636 |
ibilities | +0.578 |
ells | +0.571 |
chapter | +0.537 |
vitamins | +0.526 |
Neg logit contributions | |
ATH | -0.526 |
ares | -0.448 |
aring | -0.444 |
ARE | -0.444 |
anamo | -0.441 |
Token | Rifle |
Token ID | 19685 |
Feature activation | +3.64e-02 |
Pos logit contributions | |
ATH | +2.264 |
ares | +1.939 |
aring | +1.924 |
anamo | +1.918 |
Stacy | +1.888 |
Neg logit contributions | |
Zoro | -2.880 |
ibilities | -2.694 |
ells | -2.640 |
chapter | -2.441 |
ible | -2.427 |
Token | Association |
Token ID | 5396 |
Feature activation | +2.28e-02 |
Pos logit contributions | |
ATH | +0.384 |
ares | +0.346 |
aring | +0.345 |
Stacy | +0.342 |
ARE | +0.341 |
Neg logit contributions | |
Zoro | -0.221 |
ibilities | -0.195 |
ells | -0.193 |
chapter | -0.166 |
ible | -0.165 |
Token | Ham |
Token ID | 4345 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
ATH | +0.190 |
ares | +0.166 |
aring | +0.164 |
ARE | +0.164 |
anamo | +0.163 |
Neg logit contributions | |
Zoro | -0.190 |
ibilities | -0.173 |
ells | -0.170 |
chapter | -0.156 |
ible | -0.154 |
Token | mers |
Token ID | 11056 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
ATH | +1.240 |
ares | +1.050 |
aring | +1.033 |
anamo | +1.026 |
aldi | +1.013 |
Neg logit contributions | |
Zoro | -1.904 |
ibilities | -1.753 |
ells | -1.728 |
chapter | -1.629 |
vitamins | -1.607 |
Token | Obama |
Token ID | 2486 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ATH | +2.292 |
ares | +1.992 |
aring | +1.972 |
anamo | +1.960 |
ARE | +1.943 |
Neg logit contributions | |
Zoro | -2.532 |
ibilities | -2.292 |
ells | -2.269 |
chapter | -2.104 |
vitamins | -2.083 |
Token |
|
Token ID | 198 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
ATH | +9.463 |
ares | +8.221 |
aring | +7.992 |
aria | +7.729 |
anamo | +7.705 |
Neg logit contributions | |
Zoro | -11.366 |
ibilities | -10.513 |
ells | -10.222 |
vitamins | -9.664 |
ibly | -9.385 |
Token |
|
Token ID | 198 |
Feature activation | +9.78e-02 |
Pos logit contributions | |
ATH | +1.292 |
ares | +1.127 |
aring | +1.119 |
ARE | +1.110 |
aria | +1.093 |
Neg logit contributions | |
Zoro | -1.202 |
ibilities | -1.111 |
ells | -1.068 |
vitamins | -0.987 |
chapter | -0.967 |
Token | During |
Token ID | 7191 |
Feature activation | -4.27e-01 |
Pos logit contributions | |
ATH | +0.735 |
ARE | +0.617 |
ares | +0.615 |
aring | +0.611 |
anamo | +0.598 |
Neg logit contributions | |
Zoro | -0.923 |
ibilities | -0.842 |
ells | -0.828 |
chapter | -0.775 |
vitamins | -0.768 |
Token | the |
Token ID | 262 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
Zoro | +3.162 |
ibilities | +2.794 |
ells | +2.751 |
chapter | +2.654 |
vitamins | +2.502 |
Neg logit contributions | |
ATH | -3.918 |
anamo | -3.468 |
ares | -3.447 |
ARE | -3.417 |
aring | -3.411 |
Token | 2008 |
Token ID | 3648 |
Feature activation | +5.66e-01 |
Pos logit contributions | |
ATH | +2.052 |
ares | +1.797 |
aring | +1.786 |
ARE | +1.754 |
aryl | +1.747 |
Neg logit contributions | |
Zoro | -2.108 |
ibilities | -1.932 |
ells | -1.911 |
ible | -1.717 |
chapter | -1.712 |
Token | former |
Token ID | 1966 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
Zoro | +2.003 |
ibilities | +1.790 |
ells | +1.773 |
chapter | +1.675 |
vitamins | +1.611 |
Neg logit contributions | |
ATH | -2.104 |
anamo | -1.840 |
ares | -1.838 |
aring | -1.823 |
ARE | -1.808 |
Token | chief |
Token ID | 4039 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
Zoro | +1.522 |
ibilities | +1.367 |
ells | +1.352 |
chapter | +1.271 |
vitamins | +1.229 |
Neg logit contributions | |
ATH | -1.542 |
ares | -1.344 |
anamo | -1.340 |
aring | -1.335 |
ARE | -1.322 |
Token | executive |
Token ID | 4640 |
Feature activation | -2.18e-01 |
Pos logit contributions | |
ATH | +3.740 |
Stacy | +3.177 |
aring | +3.170 |
aryl | +3.120 |
ARE | +3.115 |
Neg logit contributions | |
Zoro | -4.476 |
ells | -4.118 |
ibilities | -4.108 |
vitamins | -3.670 |
ibly | -3.668 |
Token | of |
Token ID | 286 |
Feature activation | +2.93e-01 |
Pos logit contributions | |
Zoro | +1.754 |
ibilities | +1.569 |
ells | +1.545 |
chapter | +1.458 |
vitamins | +1.409 |
Neg logit contributions | |
ATH | -1.901 |
ares | -1.667 |
anamo | -1.667 |
aring | -1.647 |
ARE | -1.637 |
Token | Hy |
Token ID | 6707 |
Feature activation | +7.12e-02 |
Pos logit contributions | |
ATH | +2.434 |
ares | +2.107 |
aring | +2.093 |
anamo | +2.076 |
Stacy | +2.076 |
Neg logit contributions | |
Zoro | -2.430 |
ibilities | -2.220 |
ells | -2.178 |
chapter | -2.013 |
vitamins | -1.970 |
Token | att |
Token ID | 1078 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
ATH | +0.513 |
ares | +0.437 |
aring | +0.436 |
anamo | +0.432 |
aldi | +0.428 |
Neg logit contributions | |
Zoro | -0.681 |
ibilities | -0.618 |
ells | -0.609 |
chapter | -0.578 |
vitamins | -0.565 |
Token | Hot |
Token ID | 6964 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
ATH | +9.636 |
lodging | +8.597 |
Bern | +8.549 |
aria | +8.430 |
Stacy | +8.421 |
Neg logit contributions | |
Zoro | -10.609 |
ibilities | -10.274 |
ells | -9.725 |
ibly | -9.101 |
utor | -8.978 |
Token | els |
Token ID | 1424 |
Feature activation | +3.49e-01 |
Pos logit contributions | |
ATH | +1.390 |
ares | +1.222 |
aring | +1.221 |
aldi | +1.190 |
ARE | +1.190 |
Neg logit contributions | |
Zoro | -1.404 |
ibilities | -1.296 |
ells | -1.234 |
chapter | -1.171 |
ible | -1.154 |
Token | Corp |
Token ID | 11421 |
Feature activation | -4.20e-02 |
Pos logit contributions | |
ATH | +2.949 |
ares | +2.604 |
aring | +2.581 |
ARE | +2.550 |
anamo | +2.536 |
Neg logit contributions | |
Zoro | -2.810 |
ibilities | -2.560 |
ells | -2.492 |
chapter | -2.277 |
vitamins | -2.263 |
Token | . |
Token ID | 13 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
Zoro | +0.322 |
ibilities | +0.288 |
ells | +0.286 |
chapter | +0.266 |
ible | +0.258 |
Neg logit contributions | |
ATH | -0.380 |
anamo | -0.334 |
ares | -0.332 |
aring | -0.330 |
aldi | -0.328 |
Token |
|
Token ID | 198 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
ATH | +1.208 |
ares | +1.058 |
aring | +1.053 |
anamo | +1.051 |
ARE | +1.043 |
Neg logit contributions | |
Zoro | -1.068 |
ibilities | -0.961 |
ells | -0.946 |
chapter | -0.870 |
vitamins | -0.855 |
Token | being |
Token ID | 852 |
Feature activation | +5.61e-02 |
Pos logit contributions | |
ATH | +2.354 |
aring | +2.060 |
ares | +2.053 |
aryl | +2.000 |
anamo | +1.999 |
Neg logit contributions | |
Zoro | -2.157 |
ibilities | -2.006 |
ells | -1.944 |
chapter | -1.790 |
vitamins | -1.761 |
Token | eaten |
Token ID | 17065 |
Feature activation | +4.18e-01 |
Pos logit contributions | |
ATH | +0.503 |
ares | +0.439 |
aring | +0.436 |
anamo | +0.432 |
ARE | +0.430 |
Neg logit contributions | |
Zoro | -0.436 |
ibilities | -0.397 |
ells | -0.390 |
chapter | -0.358 |
ible | -0.349 |
Token | alive |
Token ID | 6776 |
Feature activation | +4.08e-02 |
Pos logit contributions | |
ATH | +3.480 |
aring | +3.032 |
ares | +3.030 |
aryl | +2.976 |
ARE | +2.938 |
Neg logit contributions | |
Zoro | -3.405 |
ibilities | -3.152 |
ells | -3.071 |
chapter | -2.825 |
vitamins | -2.776 |
Token | by |
Token ID | 416 |
Feature activation | +5.49e-01 |
Pos logit contributions | |
ATH | +0.354 |
ares | +0.309 |
aring | +0.308 |
anamo | +0.305 |
ARE | +0.304 |
Neg logit contributions | |
Zoro | -0.329 |
ibilities | -0.298 |
ells | -0.293 |
chapter | -0.272 |
vitamins | -0.265 |
Token | As |
Token ID | 1081 |
Feature activation | -4.36e-01 |
Pos logit contributions | |
ATH | +4.464 |
aring | +3.859 |
ares | +3.848 |
Stacy | +3.739 |
ARE | +3.737 |
Neg logit contributions | |
Zoro | -4.428 |
ibilities | -4.218 |
ells | -4.056 |
ibly | -3.690 |
chapter | -3.674 |
Token | mode |
Token ID | 14171 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
Zoro | +3.746 |
ibilities | +3.407 |
ells | +3.365 |
chapter | +3.156 |
ible | +3.092 |
Neg logit contributions | |
ATH | -3.517 |
anamo | -3.013 |
ARE | -2.992 |
ares | -2.990 |
aring | -2.983 |
Token | us |
Token ID | 385 |
Feature activation | +5.14e-01 |
Pos logit contributions | |
ATH | +7.756 |
aring | +6.500 |
ares | +6.460 |
aryl | +5.828 |
reth | +5.812 |
Neg logit contributions | |
Zoro | -13.235 |
ibilities | -12.317 |
chapter | -11.599 |
ells | -11.567 |
Directions | -11.298 |
Token | . |
Token ID | 13 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
ATH | +4.224 |
ares | +3.662 |
aring | +3.656 |
Stacy | +3.591 |
aldi | +3.584 |
Neg logit contributions | |
Zoro | -4.110 |
ibilities | -3.909 |
ells | -3.801 |
chapter | -3.434 |
vitamins | -3.430 |
Token | The |
Token ID | 383 |
Feature activation | +5.88e-02 |
Pos logit contributions | |
ATH | +3.486 |
ares | +3.021 |
aring | +2.988 |
ARE | +2.980 |
Stacy | +2.945 |
Neg logit contributions | |
Zoro | -3.482 |
ibilities | -3.289 |
ells | -3.165 |
vitamins | -2.906 |
ibly | -2.884 |
Token | player |
Token ID | 2137 |
Feature activation | +5.41e-02 |
Pos logit contributions | |
ATH | +0.526 |
ares | +0.462 |
aring | +0.458 |
ARE | +0.454 |
aldi | +0.454 |
Neg logit contributions | |
Zoro | -0.455 |
ibilities | -0.412 |
ells | -0.406 |
chapter | -0.367 |
vitamins | -0.362 |
Token | must |
Token ID | 1276 |
Feature activation | +5.82e-01 |
Pos logit contributions | |
ATH | +0.463 |
ares | +0.402 |
aring | +0.400 |
aldi | +0.393 |
ARE | +0.392 |
Neg logit contributions | |
Zoro | -0.442 |
ibilities | -0.405 |
ells | -0.394 |
chapter | -0.364 |
ible | -0.358 |
Token | States |
Token ID | 1829 |
Feature activation | -5.37e-01 |
Pos logit contributions | |
Zoro | +3.840 |
ibilities | +3.416 |
ells | +3.400 |
chapter | +3.225 |
vitamins | +3.105 |
Neg logit contributions | |
ATH | -3.598 |
anamo | -3.135 |
ares | -3.078 |
aring | -3.060 |
aryl | -3.057 |
Token | Constitution |
Token ID | 7965 |
Feature activation | -6.40e-01 |
Pos logit contributions | |
Zoro | +3.764 |
ells | +3.290 |
ibilities | +3.240 |
chapter | +3.153 |
ible | +2.938 |
Neg logit contributions | |
ATH | -5.130 |
anamo | -4.593 |
aryl | -4.541 |
aldi | -4.527 |
aring | -4.518 |
Token | . |
Token ID | 13 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
Zoro | +4.531 |
ells | +3.947 |
ibilities | +3.935 |
chapter | +3.890 |
ible | +3.559 |
Neg logit contributions | |
ATH | -5.977 |
anamo | -5.333 |
ares | -5.224 |
ARE | -5.210 |
aldi | -5.209 |
Token | Article |
Token ID | 10172 |
Feature activation | -4.03e-01 |
Pos logit contributions | |
Zoro | +1.185 |
ibilities | +1.063 |
ells | +1.049 |
chapter | +0.971 |
vitamins | +0.946 |
Neg logit contributions | |
ATH | -1.363 |
ares | -1.197 |
aring | -1.189 |
anamo | -1.188 |
ARE | -1.180 |
Token | IV |
Token ID | 8363 |
Feature activation | -8.54e-01 |
Pos logit contributions | |
Zoro | +2.804 |
ibilities | +2.449 |
ells | +2.398 |
chapter | +2.291 |
vitamins | +2.159 |
Neg logit contributions | |
ATH | -3.913 |
anamo | -3.508 |
ares | -3.472 |
aring | -3.457 |
ARE | -3.454 |
Token | , |
Token ID | 11 |
Feature activation | -1.77e+00 |
Pos logit contributions | |
Zoro | +5.774 |
ibilities | +5.061 |
chapter | +4.982 |
ells | +4.966 |
ible | +4.490 |
Neg logit contributions | |
ATH | -7.947 |
anamo | -7.132 |
Mehran | -7.131 |
aldi | -7.095 |
ARE | -7.069 |
Token | Section |
Token ID | 7275 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
Zoro | +8.984 |
chapter | +8.943 |
ibilities | +7.562 |
ells | +7.457 |
verse | +7.318 |
Neg logit contributions | |
ATH | -16.186 |
anamo | -15.651 |
Mehran | -15.206 |
aldi | -15.180 |
merce | -14.965 |
Token | 1 |
Token ID | 352 |
Feature activation | -9.43e-01 |
Pos logit contributions | |
Zoro | +6.278 |
chapter | +5.235 |
ibilities | +5.214 |
ells | +5.179 |
ible | +4.604 |
Neg logit contributions | |
ATH | -11.253 |
anamo | -10.320 |
aryl | -10.101 |
aldi | -10.098 |
Mehran | -10.000 |
Token | reads |
Token ID | 9743 |
Feature activation | +2.19e-01 |
Pos logit contributions | |
Zoro | +6.420 |
ells | +5.762 |
ibilities | +5.752 |
chapter | +5.480 |
ible | +5.025 |
Neg logit contributions | |
ATH | -8.664 |
anamo | -7.768 |
aldi | -7.741 |
Mehran | -7.659 |
ARE | -7.573 |
Token | , |
Token ID | 11 |
Feature activation | -2.17e-01 |
Pos logit contributions | |
ATH | +1.907 |
ares | +1.671 |
aring | +1.660 |
anamo | +1.656 |
ARE | +1.646 |
Neg logit contributions | |
Zoro | -1.754 |
ibilities | -1.573 |
ells | -1.556 |
chapter | -1.440 |
vitamins | -1.407 |
Token | in |
Token ID | 287 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
Zoro | +1.499 |
ibilities | +1.312 |
ells | +1.288 |
chapter | +1.231 |
vitamins | +1.151 |
Neg logit contributions | |
ATH | -2.114 |
ares | -1.876 |
anamo | -1.871 |
aldi | -1.864 |
aring | -1.860 |
Token | be |
Token ID | 307 |
Feature activation | +5.61e-02 |
Pos logit contributions | |
ATH | +1.212 |
aring | +1.060 |
ares | +1.047 |
ARE | +1.034 |
aldi | +1.032 |
Neg logit contributions | |
Zoro | -1.204 |
ells | -1.068 |
ibilities | -1.067 |
chapter | -0.976 |
vitamins | -0.970 |
Token | replaced |
Token ID | 6928 |
Feature activation | +7.09e-02 |
Pos logit contributions | |
ATH | +0.508 |
ares | +0.450 |
aring | +0.448 |
aldi | +0.444 |
ARE | +0.441 |
Neg logit contributions | |
Zoro | -0.428 |
ibilities | -0.380 |
ells | -0.379 |
chapter | -0.339 |
vitamins | -0.337 |
Token | , |
Token ID | 11 |
Feature activation | -4.74e-01 |
Pos logit contributions | |
ATH | +0.606 |
ares | +0.529 |
aring | +0.526 |
anamo | +0.521 |
ARE | +0.519 |
Neg logit contributions | |
Zoro | -0.578 |
ibilities | -0.521 |
ells | -0.518 |
chapter | -0.475 |
vitamins | -0.465 |
Token | renegoti |
Token ID | 48312 |
Feature activation | -6.28e-01 |
Pos logit contributions | |
Zoro | +3.778 |
ibilities | +3.368 |
ells | +3.304 |
chapter | +3.176 |
vitamins | +3.065 |
Neg logit contributions | |
ATH | -4.106 |
anamo | -3.610 |
ares | -3.607 |
aring | -3.550 |
ARE | -3.537 |
Token | ated |
Token ID | 515 |
Feature activation | -3.90e-01 |
Pos logit contributions | |
Zoro | +6.235 |
ibilities | +5.813 |
ells | +5.772 |
ible | +5.486 |
chapter | +5.486 |
Neg logit contributions | |
ATH | -4.073 |
ARE | -3.290 |
anamo | -3.290 |
Stacy | -3.237 |
ares | -3.235 |
Token | or |
Token ID | 393 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
Zoro | +2.900 |
ibilities | +2.581 |
ells | +2.527 |
chapter | +2.407 |
ible | +2.317 |
Neg logit contributions | |
ATH | -3.587 |
anamo | -3.212 |
ares | -3.150 |
aring | -3.127 |
ARE | -3.118 |
Token | rem |
Token ID | 816 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
Zoro | +10.300 |
ibilities | +9.046 |
chapter | +9.001 |
ells | +8.522 |
| +8.418 |
Neg logit contributions | |
ATH | -13.557 |
anamo | -12.973 |
ARE | -12.092 |
ares | -11.983 |
adish | -11.911 |
Token | ade |
Token ID | 671 |
Feature activation | +2.14e-01 |
Pos logit contributions | |
ATH | +1.465 |
aring | +1.270 |
ares | +1.269 |
aria | +1.230 |
aldi | +1.230 |
Neg logit contributions | |
Zoro | -2.372 |
ibilities | -2.161 |
ells | -2.116 |
chapter | -2.043 |
vitamins | -2.006 |
Token | . |
Token ID | 13 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
ATH | +1.791 |
ares | +1.565 |
aring | +1.557 |
ARE | +1.534 |
aldi | +1.531 |
Neg logit contributions | |
Zoro | -1.767 |
ibilities | -1.602 |
ells | -1.598 |
chapter | -1.440 |
vitamins | -1.422 |
Token | How |
Token ID | 1374 |
Feature activation | -2.20e-01 |
Pos logit contributions | |
ATH | +0.142 |
ares | +0.125 |
aring | +0.124 |
anamo | +0.123 |
ARE | +0.123 |
Neg logit contributions | |
Zoro | -0.126 |
ibilities | -0.114 |
ells | -0.112 |
chapter | -0.104 |
vitamins | -0.102 |
Token | this |
Token ID | 428 |
Feature activation | +1.79e-01 |
Pos logit contributions | |
Zoro | +1.778 |
ibilities | +1.595 |
ells | +1.578 |
chapter | +1.472 |
vitamins | +1.428 |
Neg logit contributions | |
ATH | -1.901 |
ares | -1.662 |
anamo | -1.655 |
aring | -1.650 |
ARE | -1.636 |
Token |
|
Token ID | 198 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
Zoro | +1.221 |
ibilities | +1.094 |
ells | +1.071 |
chapter | +0.981 |
vitamins | +0.964 |
Neg logit contributions | |
ATH | -1.543 |
ares | -1.361 |
aring | -1.354 |
ARE | -1.344 |
anamo | -1.328 |
Token | http |
Token ID | 4023 |
Feature activation | -4.93e-01 |
Pos logit contributions | |
Zoro | +1.154 |
ibilities | +1.054 |
ells | +1.046 |
chapter | +0.986 |
ible | +0.961 |
Neg logit contributions | |
ATH | -0.894 |
ares | -0.764 |
anamo | -0.763 |
aring | -0.757 |
ARE | -0.746 |
Token | :// |
Token ID | 1378 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
Zoro | +4.164 |
ells | +3.745 |
ibilities | +3.742 |
chapter | +3.537 |
ible | +3.419 |
Neg logit contributions | |
ATH | -3.953 |
anamo | -3.560 |
ares | -3.434 |
merce | -3.425 |
aryl | -3.415 |
Token | www |
Token ID | 2503 |
Feature activation | -8.73e-01 |
Pos logit contributions | |
Zoro | +1.849 |
ibilities | +1.685 |
ells | +1.674 |
chapter | +1.547 |
ible | +1.522 |
Neg logit contributions | |
ATH | -1.910 |
anamo | -1.668 |
ares | -1.656 |
Stacy | -1.649 |
aring | -1.646 |
Token | . |
Token ID | 13 |
Feature activation | -7.70e-01 |
Pos logit contributions | |
Zoro | +5.486 |
ells | +4.776 |
ibilities | +4.648 |
chapter | +4.503 |
| +4.367 |
Neg logit contributions | |
ATH | -8.528 |
anamo | -8.171 |
merce | -8.028 |
aryl | -7.713 |
aldi | -7.710 |
Token | board |
Token ID | 3526 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
Zoro | +6.655 |
ells | +6.252 |
ibilities | +6.238 |
ible | +5.855 |
chapter | +5.719 |
Neg logit contributions | |
ATH | -5.550 |
Stacy | -4.897 |
Mehran | -4.862 |
anamo | -4.797 |
ARE | -4.726 |
Token | game |
Token ID | 6057 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
Zoro | +10.141 |
ells | +9.562 |
ibilities | +9.303 |
chapter | +9.154 |
ible | +8.965 |
Neg logit contributions | |
ATH | -12.777 |
Mehran | -11.649 |
Stacy | -11.627 |
anamo | -11.389 |
aryl | -11.097 |
Token | ge |
Token ID | 469 |
Feature activation | -5.48e-01 |
Pos logit contributions | |
Zoro | +0.093 |
ibilities | +0.084 |
ells | +0.084 |
chapter | +0.079 |
ible | +0.077 |
Neg logit contributions | |
ATH | -0.076 |
ares | -0.065 |
anamo | -0.065 |
aring | -0.065 |
ARE | -0.064 |
Token | ek |
Token ID | 988 |
Feature activation | -2.77e-01 |
Pos logit contributions | |
Zoro | +3.993 |
ells | +3.637 |
ibilities | +3.628 |
chapter | +3.378 |
ible | +3.306 |
Neg logit contributions | |
ATH | -4.982 |
anamo | -4.432 |
ARE | -4.359 |
Stacy | -4.317 |
ares | -4.307 |
Token | . |
Token ID | 13 |
Feature activation | -3.44e-01 |
Pos logit contributions | |
Zoro | +2.125 |
ibilities | +1.895 |
ells | +1.872 |
chapter | +1.739 |
vitamins | +1.684 |
Neg logit contributions | |
ATH | -2.507 |
ares | -2.206 |
anamo | -2.195 |
aring | -2.192 |
ARE | -2.174 |
Token | com |
Token ID | 785 |
Feature activation | +2.74e-01 |
Pos logit contributions | |
Zoro | +3.236 |
ibilities | +2.941 |
ells | +2.925 |
chapter | +2.768 |
ible | +2.696 |
Neg logit contributions | |
ATH | -2.503 |
anamo | -2.152 |
ares | -2.120 |
aring | -2.104 |
ARE | -2.091 |
Token | side |
Token ID | 1735 |
Feature activation | -6.16e-01 |
Pos logit contributions | |
Zoro | +6.327 |
chapter | +5.189 |
ibilities | +5.089 |
ells | +4.998 |
ible | +4.839 |
Neg logit contributions | |
ATH | -11.156 |
anamo | -10.803 |
aryl | -10.103 |
merce | -9.963 |
ARE | -9.955 |
Token | for |
Token ID | 329 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Zoro | +4.420 |
ibilities | +3.836 |
ells | +3.802 |
chapter | +3.590 |
ible | +3.455 |
Neg logit contributions | |
ATH | -5.795 |
anamo | -5.226 |
ares | -5.104 |
Mehran | -5.062 |
ARE | -5.058 |
Token | about |
Token ID | 546 |
Feature activation | -9.47e-01 |
Pos logit contributions | |
Zoro | +7.825 |
chapter | +6.545 |
ells | +6.506 |
ibilities | +6.301 |
vitamins | +6.133 |
Neg logit contributions | |
ATH | -10.850 |
anamo | -10.166 |
aryl | -9.696 |
merce | -9.646 |
aring | -9.534 |
Token | 2 |
Token ID | 362 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
Zoro | +6.756 |
ells | +5.758 |
chapter | +5.671 |
ibilities | +5.658 |
vitamins | +5.248 |
Neg logit contributions | |
ATH | -8.742 |
anamo | -8.011 |
aryl | -7.721 |
ARE | -7.632 |
aring | -7.622 |
Token | / |
Token ID | 14 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
Zoro | +7.047 |
ells | +5.991 |
ibilities | +5.956 |
chapter | +5.700 |
| +5.372 |
Neg logit contributions | |
ATH | -14.196 |
anamo | -13.628 |
Mehran | -12.954 |
aryl | -12.859 |
aldi | -12.793 |
Token | 3 |
Token ID | 18 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
Zoro | +3.494 |
ibilities | +3.186 |
ells | +3.152 |
chapter | +2.964 |
ible | +2.888 |
Neg logit contributions | |
ATH | -3.235 |
anamo | -2.878 |
Mehran | -2.779 |
ares | -2.777 |
aring | -2.764 |
Token | minutes |
Token ID | 2431 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
Zoro | +9.601 |
chapter | +8.290 |
ibilities | +7.997 |
ells | +7.825 |
ible | +7.746 |
Neg logit contributions | |
anamo | -13.060 |
ATH | -13.035 |
ARE | -12.012 |
Mehran | -11.852 |
aryl | -11.800 |
Token | until |
Token ID | 1566 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
Zoro | +1.083 |
ibilities | +0.968 |
ells | +0.957 |
chapter | +0.889 |
vitamins | +0.862 |
Neg logit contributions | |
ATH | -1.240 |
ares | -1.089 |
anamo | -1.083 |
aring | -1.082 |
ARE | -1.073 |
Token | golden |
Token ID | 10861 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
Zoro | +7.029 |
ells | +5.967 |
ibilities | +5.883 |
chapter | +5.730 |
vitamins | +5.585 |
Neg logit contributions | |
ATH | -9.230 |
anamo | -8.564 |
ares | -8.194 |
aryl | -8.191 |
ARE | -8.098 |
Token | brown |
Token ID | 7586 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
ATH | +1.442 |
aring | +1.277 |
ares | +1.274 |
aryl | +1.250 |
ARE | +1.250 |
Neg logit contributions | |
Zoro | -1.217 |
ibilities | -1.089 |
ells | -1.067 |
chapter | -0.987 |
vitamins | -0.963 |
Token | . |
Token ID | 13 |
Feature activation | -9.97e-01 |
Pos logit contributions | |
Zoro | +1.997 |
ibilities | +1.768 |
ells | +1.765 |
chapter | +1.633 |
ible | +1.597 |
Neg logit contributions | |
ATH | -2.509 |
anamo | -2.243 |
ares | -2.222 |
ARE | -2.200 |
aring | -2.194 |
Token | : |
Token ID | 25 |
Feature activation | -6.02e-01 |
Pos logit contributions | |
ATH | +0.027 |
ares | +0.023 |
aring | +0.023 |
ARE | +0.023 |
Stacy | +0.022 |
Neg logit contributions | |
Zoro | -0.027 |
ibilities | -0.025 |
ells | -0.024 |
chapter | -0.022 |
vitamins | -0.022 |
Token | 47 |
Token ID | 2857 |
Feature activation | +4.57e-01 |
Pos logit contributions | |
Zoro | +4.274 |
ells | +3.740 |
ibilities | +3.725 |
chapter | +3.484 |
ible | +3.341 |
Neg logit contributions | |
ATH | -5.702 |
anamo | -5.153 |
ares | -5.069 |
aring | -5.041 |
aldi | -5.012 |
Token | ] |
Token ID | 60 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
ATH | +2.298 |
ares | +1.819 |
aring | +1.781 |
ARE | +1.722 |
aria | +1.698 |
Neg logit contributions | |
Zoro | -5.249 |
ibilities | -5.038 |
ells | -4.865 |
vitamins | -4.649 |
chapter | -4.522 |
Token | < |
Token ID | 1279 |
Feature activation | +6.19e-02 |
Pos logit contributions | |
Zoro | +2.757 |
ibilities | +2.260 |
ells | +2.220 |
chapter | +2.053 |
| +1.961 |
Neg logit contributions | |
ATH | -6.265 |
aldi | -5.802 |
ares | -5.782 |
anamo | -5.766 |
aryl | -5.746 |
Token | ok |
Token ID | 482 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
ATH | +0.458 |
ares | +0.391 |
aring | +0.388 |
anamo | +0.388 |
ARE | +0.383 |
Neg logit contributions | |
Zoro | -0.578 |
ibilities | -0.527 |
ells | -0.521 |
chapter | -0.492 |
vitamins | -0.480 |
Token | clock |
Token ID | 15750 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
Zoro | +2.612 |
ells | +2.332 |
ibilities | +2.331 |
chapter | +2.156 |
ible | +2.103 |
Neg logit contributions | |
ATH | -3.149 |
aring | -2.761 |
anamo | -2.759 |
ARE | -2.759 |
ares | -2.758 |
Token | zy |
Token ID | 7357 |
Feature activation | -6.61e-01 |
Pos logit contributions | |
Zoro | +6.713 |
ibilities | +5.418 |
ells | +5.192 |
chapter | +5.025 |
ible | +4.863 |
Neg logit contributions | |
ATH | -16.763 |
Mehran | -15.178 |
anamo | -15.162 |
Stacy | -14.951 |
ARE | -14.847 |
Token | > |
Token ID | 29 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
Zoro | +4.253 |
ells | +3.743 |
ibilities | +3.686 |
chapter | +3.432 |
ible | +3.296 |
Neg logit contributions | |
ATH | -6.614 |
anamo | -6.101 |
aryl | -5.902 |
aring | -5.891 |
merce | -5.880 |
Token | lol |
Token ID | 19462 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
Zoro | +2.326 |
ibilities | +2.055 |
ells | +2.039 |
chapter | +1.918 |
vitamins | +1.852 |
Neg logit contributions | |
ATH | -2.534 |
anamo | -2.220 |
ares | -2.215 |
aring | -2.198 |
aryl | -2.179 |
Token | m |
Token ID | 285 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
ATH | +0.155 |
ares | +0.135 |
aring | +0.135 |
anamo | +0.134 |
ARE | +0.133 |
Neg logit contributions | |
Zoro | -0.152 |
ibilities | -0.137 |
ells | -0.136 |
chapter | -0.126 |
vitamins | -0.123 |
Token | 2 |
Token ID | 17 |
Feature activation | +4.91e-02 |
Pos logit contributions | |
Zoro | +1.006 |
ibilities | +0.912 |
ells | +0.899 |
chapter | +0.845 |
ible | +0.828 |
Neg logit contributions | |
ATH | -1.047 |
anamo | -0.925 |
aring | -0.901 |
Mehran | -0.900 |
aldi | -0.894 |
Token | there |
Token ID | 612 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
Zoro | +0.590 |
ibilities | +0.528 |
ells | +0.522 |
chapter | +0.487 |
vitamins | +0.471 |
Neg logit contributions | |
ATH | -0.648 |
ares | -0.568 |
anamo | -0.566 |
aring | -0.563 |
ARE | -0.560 |
Token | than |
Token ID | 621 |
Feature activation | +9.61e-02 |
Pos logit contributions | |
Zoro | +2.130 |
ibilities | +1.881 |
ells | +1.864 |
chapter | +1.744 |
ible | +1.677 |
Neg logit contributions | |
ATH | -2.627 |
anamo | -2.318 |
ares | -2.317 |
aring | -2.295 |
ARE | -2.287 |
Token | most |
Token ID | 749 |
Feature activation | +3.38e-02 |
Pos logit contributions | |
ATH | +0.843 |
ares | +0.744 |
aring | +0.739 |
anamo | +0.730 |
Stacy | +0.729 |
Neg logit contributions | |
Zoro | -0.758 |
ibilities | -0.689 |
ells | -0.677 |
chapter | -0.619 |
ible | -0.607 |
Token | . |
Token ID | 13 |
Feature activation | -4.77e-01 |
Pos logit contributions | |
ATH | +0.292 |
ares | +0.256 |
aring | +0.254 |
anamo | +0.252 |
ARE | +0.251 |
Neg logit contributions | |
Zoro | -0.274 |
ibilities | -0.247 |
ells | -0.244 |
chapter | -0.226 |
ible | -0.220 |
Token | - |
Token ID | 532 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
Zoro | +3.700 |
ells | +3.222 |
ibilities | +3.215 |
chapter | +3.049 |
ible | +2.897 |
Neg logit contributions | |
ATH | -4.226 |
anamo | -3.774 |
ares | -3.729 |
aring | -3.716 |
aryl | -3.674 |
Token | July |
Token ID | 2901 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
Zoro | +1.509 |
ibilities | +1.395 |
ells | +1.382 |
chapter | +1.307 |
vitamins | +1.287 |
Neg logit contributions | |
ATH | -0.854 |
ares | -0.694 |
aring | -0.689 |
anamo | -0.685 |
ARE | -0.678 |
Token | 6 |
Token ID | 718 |
Feature activation | -7.34e-05 |
Pos logit contributions | |
Zoro | +5.972 |
ells | +3.967 |
chapter | +3.869 |
| +3.600 |
ible | +3.423 |
Neg logit contributions | |
ATH | -17.945 |
merce | -17.647 |
anamo | -17.231 |
aryl | -16.970 |
ares | -16.507 |
Token | , |
Token ID | 11 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
Zoro | +0.001 |
ibilities | +0.001 |
ells | +0.001 |
chapter | +0.000 |
vitamins | +0.000 |
Neg logit contributions | |
ATH | -0.001 |
ares | -0.001 |
aring | -0.001 |
ARE | -0.001 |
Stacy | -0.001 |
Token | 2010 |
Token ID | 3050 |
Feature activation | +5.74e-01 |
Pos logit contributions | |
Zoro | +2.117 |
ibilities | +1.923 |
ells | +1.905 |
chapter | +1.796 |
ible | +1.748 |
Neg logit contributions | |
ATH | -1.762 |
ares | -1.511 |
anamo | -1.508 |
aring | -1.498 |
ARE | -1.482 |
Token | R |
Token ID | 49 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
ATH | +3.648 |
ARE | +3.051 |
aring | +2.880 |
ares | +2.874 |
Bern | +2.770 |
Neg logit contributions | |
Zoro | -5.896 |
ibilities | -5.638 |
ells | -5.324 |
vitamins | -5.134 |
chapter | -5.103 |
Token | iff |
Token ID | 733 |
Feature activation | +3.57e-01 |
Pos logit contributions | |
Zoro | +1.030 |
ibilities | +0.930 |
ells | +0.910 |
chapter | +0.865 |
vitamins | +0.848 |
Neg logit contributions | |
ATH | -0.874 |
aring | -0.755 |
ares | -0.751 |
ARE | -0.734 |
anamo | -0.734 |
Token | but |
Token ID | 475 |
Feature activation | -1.53e-02 |
Pos logit contributions | |
ATH | +0.955 |
ares | +0.835 |
aring | +0.834 |
anamo | +0.826 |
ARE | +0.821 |
Neg logit contributions | |
Zoro | -0.882 |
ibilities | -0.793 |
ells | -0.779 |
chapter | -0.716 |
ible | -0.704 |
Token | who |
Token ID | 508 |
Feature activation | -3.82e-01 |
Pos logit contributions | |
Zoro | +0.122 |
ibilities | +0.110 |
ells | +0.108 |
chapter | +0.100 |
ible | +0.098 |
Neg logit contributions | |
ATH | -0.133 |
ares | -0.117 |
aring | -0.117 |
anamo | -0.116 |
ARE | -0.115 |
Token | will |
Token ID | 481 |
Feature activation | -6.51e-01 |
Pos logit contributions | |
Zoro | +3.083 |
ibilities | +2.762 |
ells | +2.754 |
chapter | +2.563 |
vitamins | +2.481 |
Neg logit contributions | |
ATH | -3.290 |
anamo | -2.867 |
ares | -2.856 |
aring | -2.843 |
ARE | -2.823 |
Token | get |
Token ID | 651 |
Feature activation | -6.69e-01 |
Pos logit contributions | |
Zoro | +5.171 |
ibilities | +4.620 |
ells | +4.604 |
chapter | +4.382 |
ible | +4.193 |
Neg logit contributions | |
ATH | -5.579 |
anamo | -4.967 |
ares | -4.864 |
aldi | -4.818 |
aring | -4.818 |
Token | the |
Token ID | 262 |
Feature activation | -3.05e-01 |
Pos logit contributions | |
Zoro | +4.848 |
ibilities | +4.267 |
ells | +4.231 |
chapter | +4.058 |
vitamins | +3.866 |
Neg logit contributions | |
ATH | -6.170 |
anamo | -5.496 |
ares | -5.413 |
aring | -5.358 |
aryl | -5.351 |
Token | blame |
Token ID | 8138 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
Zoro | +2.437 |
ibilities | +2.176 |
ells | +2.155 |
chapter | +2.023 |
vitamins | +1.960 |
Neg logit contributions | |
ATH | -2.664 |
anamo | -2.333 |
ares | -2.330 |
aring | -2.316 |
ARE | -2.299 |
Token | ? |
Token ID | 30 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
Zoro | +8.708 |
ells | +7.729 |
ibilities | +7.675 |
chapter | +7.468 |
| +7.256 |
Neg logit contributions | |
ATH | -13.217 |
anamo | -11.973 |
ARE | -11.943 |
ares | -11.751 |
aldi | -11.694 |
Token | | |
Token ID | 930 |
Feature activation | +5.33e-02 |
Pos logit contributions | |
Zoro | +1.522 |
ibilities | +1.346 |
ells | +1.345 |
chapter | +1.251 |
ible | +1.197 |
Neg logit contributions | |
ATH | -1.878 |
ares | -1.656 |
anamo | -1.651 |
aring | -1.642 |
ARE | -1.636 |
Token | Ad |
Token ID | 1215 |
Feature activation | +5.27e-01 |
Pos logit contributions | |
ATH | +0.388 |
ares | +0.330 |
anamo | +0.327 |
aring | +0.327 |
ARE | +0.324 |
Neg logit contributions | |
Zoro | -0.504 |
ibilities | -0.461 |
ells | -0.456 |
chapter | -0.429 |
vitamins | -0.420 |
Token | ity |
Token ID | 414 |
Feature activation | +4.99e-01 |
Pos logit contributions | |
ATH | +3.701 |
ares | +3.302 |
aring | +3.203 |
aryl | +3.195 |
Stacy | +3.179 |
Neg logit contributions | |
Zoro | -4.929 |
ibilities | -4.402 |
ells | -4.377 |
chapter | -4.088 |
vitamins | -4.029 |
Token | a |
Token ID | 64 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
ATH | +3.268 |
aring | +2.772 |
ares | +2.744 |
anamo | +2.724 |
aldi | +2.672 |
Neg logit contributions | |
Zoro | -5.004 |
ibilities | -4.640 |
ells | -4.535 |
chapter | -4.322 |
vitamins | -4.247 |
Token | е |
Token ID | 16843 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
Zoro | +3.119 |
ibilities | +2.833 |
ells | +2.819 |
chapter | +2.643 |
ible | +2.578 |
Neg logit contributions | |
ATH | -2.820 |
anamo | -2.456 |
ares | -2.429 |
aring | -2.404 |
ARE | -2.388 |
Token | к |
Token ID | 31583 |
Feature activation | -5.94e-01 |
Pos logit contributions | |
Zoro | +0.951 |
ibilities | +0.833 |
ells | +0.823 |
chapter | +0.758 |
vitamins | +0.729 |
Neg logit contributions | |
ATH | -1.381 |
ares | -1.230 |
anamo | -1.228 |
aring | -1.224 |
ARE | -1.213 |
Token | о |
Token ID | 15166 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
Zoro | +4.491 |
ells | +3.972 |
ibilities | +3.957 |
chapter | +3.738 |
vitamins | +3.576 |
Neg logit contributions | |
ATH | -5.249 |
anamo | -4.689 |
ares | -4.636 |
aring | -4.619 |
aryl | -4.554 |
Token | т |
Token ID | 20375 |
Feature activation | -7.28e-01 |
Pos logit contributions | |
ATH | +2.007 |
ares | +1.700 |
aring | +1.689 |
anamo | +1.683 |
ARE | +1.678 |
Neg logit contributions | |
Zoro | -2.588 |
ibilities | -2.360 |
ells | -2.328 |
chapter | -2.189 |
vitamins | -2.142 |
Token | о |
Token ID | 15166 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
Zoro | +4.538 |
ells | +3.969 |
ibilities | +3.939 |
chapter | +3.705 |
| +3.550 |
Neg logit contributions | |
ATH | -7.105 |
anamo | -6.425 |
ares | -6.417 |
Stacy | -6.378 |
aring | -6.352 |
Token | р |
Token ID | 21169 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
ATH | +0.124 |
ares | +0.110 |
anamo | +0.109 |
aring | +0.109 |
ARE | +0.108 |
Neg logit contributions | |
Zoro | -0.093 |
ibilities | -0.082 |
ells | -0.082 |
chapter | -0.076 |
vitamins | -0.073 |
Token | ы |
Token ID | 45035 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
Zoro | +6.478 |
ibilities | +5.502 |
ells | +5.249 |
chapter | +5.222 |
ible | +4.937 |
Neg logit contributions | |
ATH | -14.913 |
anamo | -13.759 |
ares | -13.682 |
aring | -13.486 |
Stacy | -13.443 |
Token | е |
Token ID | 16843 |
Feature activation | -3.13e-02 |
Pos logit contributions | |
Zoro | +0.779 |
ells | +0.679 |
ibilities | +0.678 |
chapter | +0.626 |
vitamins | +0.605 |
Neg logit contributions | |
ATH | -1.153 |
ares | -1.033 |
aring | -1.026 |
anamo | -1.026 |
ARE | -1.013 |
Token | � |
Token ID | 12466 |
Feature activation | -3.67e-01 |
Pos logit contributions | |
Zoro | +0.204 |
ibilities | +0.179 |
ells | +0.175 |
chapter | +0.160 |
ible | +0.154 |
Neg logit contributions | |
ATH | -0.319 |
ares | -0.285 |
aring | -0.284 |
anamo | -0.283 |
ARE | -0.282 |
Token | � |
Token ID | 116 |
Feature activation | -2.55e-01 |
Pos logit contributions | |
Zoro | +2.967 |
ibilities | +2.683 |
ells | +2.661 |
chapter | +2.484 |
ible | +2.418 |
Neg logit contributions | |
ATH | -3.106 |
anamo | -2.728 |
ares | -2.701 |
aring | -2.685 |
ARE | -2.683 |
Token | м |
Token ID | 43108 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
Zoro | +1.817 |
ibilities | +1.595 |
ells | +1.583 |
chapter | +1.471 |
vitamins | +1.417 |
Neg logit contributions | |
ATH | -2.450 |
anamo | -2.171 |
ares | -2.170 |
aring | -2.155 |
ARE | -2.133 |
Token | ts |
Token ID | 912 |
Feature activation | -7.89e-01 |
Pos logit contributions | |
Zoro | +0.248 |
ibilities | +0.210 |
ells | +0.206 |
chapter | +0.192 |
vitamins | +0.185 |
Neg logit contributions | |
ATH | -0.365 |
ares | -0.334 |
aring | -0.330 |
aldi | -0.323 |
anamo | -0.321 |
Token | into |
Token ID | 656 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
Zoro | +5.460 |
ibilities | +4.804 |
ells | +4.745 |
chapter | +4.574 |
ible | +4.380 |
Neg logit contributions | |
ATH | -7.626 |
anamo | -6.828 |
aldi | -6.622 |
ARE | -6.560 |
aryl | -6.555 |
Token | small |
Token ID | 1402 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
Zoro | +4.237 |
ibilities | +3.673 |
ells | +3.666 |
chapter | +3.440 |
ible | +3.295 |
Neg logit contributions | |
ATH | -6.098 |
anamo | -5.480 |
ares | -5.353 |
aldi | -5.341 |
aring | -5.333 |
Token | pieces |
Token ID | 5207 |
Feature activation | +4.35e-02 |
Pos logit contributions | |
ATH | +0.843 |
ares | +0.712 |
aring | +0.678 |
Stacy | +0.669 |
ARE | +0.661 |
Neg logit contributions | |
Zoro | -1.493 |
ibilities | -1.382 |
ells | -1.353 |
chapter | -1.275 |
ibly | -1.266 |
Token | with |
Token ID | 351 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
ATH | +0.291 |
ares | +0.251 |
aring | +0.249 |
Stacy | +0.240 |
ARE | +0.239 |
Neg logit contributions | |
Zoro | -0.428 |
ibilities | -0.397 |
ells | -0.394 |
chapter | -0.363 |
vitamins | -0.361 |
Token | a |
Token ID | 257 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
Zoro | +1.317 |
ibilities | +1.200 |
ells | +1.180 |
chapter | +1.088 |
vitamins | +1.066 |
Neg logit contributions | |
ATH | -1.278 |
ares | -1.115 |
aring | -1.110 |
ARE | -1.092 |
Stacy | -1.080 |
Token | knife |
Token ID | 9845 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
Zoro | +5.260 |
chapter | +3.915 |
ells | +3.603 |
ibilities | +3.544 |
ible | +3.461 |
Neg logit contributions | |
ATH | -17.336 |
anamo | -16.648 |
merce | -16.227 |
aryl | -15.918 |
ares | -15.837 |
Token | . |
Token ID | 13 |
Feature activation | -7.97e-01 |
Pos logit contributions | |
Zoro | +1.053 |
ibilities | +0.957 |
ells | +0.936 |
chapter | +0.861 |
vitamins | +0.845 |
Neg logit contributions | |
ATH | -1.134 |
ares | -0.996 |
aring | -0.991 |
ARE | -0.979 |
aldi | -0.968 |
Token | 3 |
Token ID | 513 |
Feature activation | +8.84e-02 |
Pos logit contributions | |
Zoro | +5.451 |
ibilities | +4.857 |
ells | +4.594 |
chapter | +4.372 |
| +4.255 |
Neg logit contributions | |
ATH | -7.402 |
ares | -6.738 |
anamo | -6.673 |
aring | -6.586 |
Mehran | -6.579 |
Token | . |
Token ID | 13 |
Feature activation | -5.00e-01 |
Pos logit contributions | |
ATH | +0.734 |
ares | +0.641 |
aring | +0.635 |
ARE | +0.631 |
Stacy | +0.618 |
Neg logit contributions | |
Zoro | -0.742 |
ibilities | -0.682 |
ells | -0.662 |
chapter | -0.608 |
vitamins | -0.607 |
Token | In |
Token ID | 554 |
Feature activation | -7.14e-01 |
Pos logit contributions | |
Zoro | +3.476 |
ibilities | +2.957 |
ells | +2.926 |
chapter | +2.736 |
ible | +2.651 |
Neg logit contributions | |
ATH | -4.877 |
anamo | -4.366 |
ares | -4.323 |
aring | -4.284 |
aryl | -4.283 |
Token | happen |
Token ID | 1645 |
Feature activation | -5.12e-01 |
Pos logit contributions | |
Zoro | +0.404 |
ibilities | +0.363 |
ells | +0.357 |
chapter | +0.327 |
vitamins | +0.318 |
Neg logit contributions | |
ATH | -0.492 |
ares | -0.433 |
aring | -0.431 |
anamo | -0.427 |
ARE | -0.427 |
Token | , |
Token ID | 11 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
Zoro | +3.698 |
ibilities | +3.242 |
ells | +3.195 |
chapter | +3.049 |
ible | +2.916 |
Neg logit contributions | |
ATH | -4.721 |
anamo | -4.258 |
ares | -4.194 |
aldi | -4.170 |
ARE | -4.151 |
Token | and |
Token ID | 290 |
Feature activation | -5.02e-01 |
Pos logit contributions | |
Zoro | +2.090 |
ibilities | +1.862 |
ells | +1.844 |
chapter | +1.734 |
vitamins | +1.682 |
Neg logit contributions | |
ATH | -2.214 |
ares | -1.936 |
anamo | -1.930 |
aring | -1.917 |
ARE | -1.906 |
Token | it |
Token ID | 340 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
Zoro | +3.831 |
ells | +3.342 |
ibilities | +3.334 |
chapter | +3.163 |
vitamins | +3.049 |
Neg logit contributions | |
ATH | -4.516 |
anamo | -4.006 |
ares | -3.960 |
ARE | -3.916 |
aring | -3.905 |
Token | comes |
Token ID | 2058 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
Zoro | +2.794 |
ibilities | +2.479 |
ells | +2.475 |
chapter | +2.305 |
vitamins | +2.234 |
Neg logit contributions | |
ATH | -3.186 |
anamo | -2.803 |
ares | -2.783 |
ARE | -2.775 |
aring | -2.758 |
Token | fully |
Token ID | 3938 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
Zoro | +8.580 |
ells | +7.149 |
ibilities | +7.125 |
chapter | +7.056 |
vitamins | +6.838 |
Neg logit contributions | |
ATH | -9.835 |
anamo | -8.927 |
merce | -8.562 |
aryl | -8.557 |
aldi | -8.531 |
Token | loaded |
Token ID | 9639 |
Feature activation | -7.17e-01 |
Pos logit contributions | |
Zoro | +9.496 |
chapter | +7.761 |
ibilities | +7.690 |
ells | +7.496 |
| +7.344 |
Neg logit contributions | |
ATH | -12.591 |
ares | -11.375 |
anamo | -11.265 |
aldi | -11.145 |
merce | -11.093 |
Token | with |
Token ID | 351 |
Feature activation | -6.82e-01 |
Pos logit contributions | |
Zoro | +5.742 |
ibilities | +5.094 |
ells | +4.958 |
chapter | +4.828 |
ible | +4.716 |
Neg logit contributions | |
ATH | -5.960 |
anamo | -5.351 |
ares | -5.231 |
aldi | -5.224 |
ARE | -5.181 |
Token | 18 |
Token ID | 1248 |
Feature activation | -6.59e-01 |
Pos logit contributions | |
Zoro | +5.466 |
ibilities | +4.798 |
ells | +4.740 |
chapter | +4.607 |
vitamins | +4.524 |
Neg logit contributions | |
ATH | -5.824 |
anamo | -5.168 |
ares | -5.057 |
ARE | -5.009 |
aring | -5.009 |
Token | distinct |
Token ID | 7310 |
Feature activation | -7.84e-01 |
Pos logit contributions | |
Zoro | +5.271 |
ibilities | +4.711 |
ells | +4.625 |
chapter | +4.473 |
vitamins | +4.339 |
Neg logit contributions | |
ATH | -5.575 |
anamo | -4.945 |
ares | -4.801 |
ARE | -4.788 |
aring | -4.783 |
Token | types |
Token ID | 3858 |
Feature activation | -6.07e-01 |
Pos logit contributions | |
Zoro | +5.998 |
ibilities | +5.350 |
ells | +5.254 |
chapter | +5.064 |
vitamins | +4.897 |
Neg logit contributions | |
ATH | -6.842 |
anamo | -6.126 |
ares | -5.937 |
ARE | -5.899 |
aring | -5.897 |
Token | , |
Token ID | 11 |
Feature activation | +6.64e-02 |
Pos logit contributions | |
ATH | +2.739 |
aring | +2.418 |
ares | +2.400 |
ARE | +2.369 |
Stacy | +2.356 |
Neg logit contributions | |
Zoro | -2.515 |
ibilities | -2.260 |
ells | -2.246 |
chapter | -2.038 |
ible | -2.007 |
Token | � |
Token ID | 564 |
Feature activation | -5.71e-02 |
Pos logit contributions | |
ATH | +0.600 |
ares | +0.528 |
aring | +0.527 |
ARE | +0.522 |
anamo | +0.521 |
Neg logit contributions | |
Zoro | -0.509 |
ibilities | -0.457 |
ells | -0.450 |
chapter | -0.415 |
ible | -0.405 |
Token | � |
Token ID | 250 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
Zoro | +0.503 |
ibilities | +0.456 |
ells | +0.451 |
chapter | +0.424 |
vitamins | +0.412 |
Neg logit contributions | |
ATH | -0.452 |
ares | -0.390 |
anamo | -0.388 |
aring | -0.387 |
ARE | -0.384 |
Token | What |
Token ID | 2061 |
Feature activation | -3.91e-01 |
Pos logit contributions | |
Zoro | +2.415 |
ibilities | +2.187 |
ells | +2.175 |
chapter | +2.037 |
vitamins | +1.983 |
Neg logit contributions | |
ATH | -2.157 |
anamo | -1.866 |
ares | -1.863 |
aring | -1.847 |
ARE | -1.825 |
Token | the |
Token ID | 262 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
Zoro | +3.029 |
ibilities | +2.699 |
ells | +2.686 |
chapter | +2.508 |
vitamins | +2.424 |
Neg logit contributions | |
ATH | -3.491 |
anamo | -3.084 |
ares | -3.053 |
aring | -3.040 |
aryl | -3.018 |
Token | hell |
Token ID | 5968 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
Zoro | +0.103 |
ibilities | +0.093 |
ells | +0.092 |
chapter | +0.085 |
vitamins | +0.083 |
Neg logit contributions | |
ATH | -0.105 |
ares | -0.092 |
aring | -0.091 |
anamo | -0.090 |
ARE | -0.090 |
Token | . |
Token ID | 13 |
Feature activation | -4.57e-04 |
Pos logit contributions | |
Zoro | +9.101 |
ells | +8.135 |
ibilities | +8.073 |
chapter | +7.721 |
| +7.351 |
Neg logit contributions | |
ATH | -12.136 |
anamo | -11.405 |
aryl | -10.928 |
aldi | -10.905 |
merce | -10.838 |
Token | Maybe |
Token ID | 6674 |
Feature activation | -3.91e-01 |
Pos logit contributions | |
Zoro | +0.004 |
ibilities | +0.003 |
ells | +0.003 |
chapter | +0.003 |
ible | +0.003 |
Neg logit contributions | |
ATH | -0.004 |
ares | -0.003 |
ARE | -0.003 |
aring | -0.003 |
Stacy | -0.003 |
Token | I |
Token ID | 314 |
Feature activation | -3.20e-01 |
Pos logit contributions | |
Zoro | +2.915 |
ibilities | +2.572 |
ells | +2.552 |
chapter | +2.409 |
vitamins | +2.320 |
Neg logit contributions | |
ATH | -3.621 |
anamo | -3.200 |
ares | -3.188 |
aring | -3.153 |
ARE | -3.141 |
Token | should |
Token ID | 815 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
Zoro | +2.602 |
ibilities | +2.336 |
ells | +2.320 |
chapter | +2.176 |
vitamins | +2.107 |
Neg logit contributions | |
ATH | -2.728 |
anamo | -2.398 |
ares | -2.375 |
aring | -2.353 |
ARE | -2.345 |
Token | give |
Token ID | 1577 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
Zoro | +1.166 |
ibilities | +1.047 |
ells | +1.031 |
chapter | +0.949 |
ible | +0.928 |
Neg logit contributions | |
ATH | -1.278 |
ares | -1.117 |
aring | -1.117 |
ARE | -1.101 |
anamo | -1.095 |
Token | on |
Token ID | 319 |
Feature activation | -8.88e-01 |
Pos logit contributions | |
Zoro | +6.613 |
ells | +5.714 |
ibilities | +5.672 |
chapter | +5.479 |
vitamins | +5.179 |
Neg logit contributions | |
ATH | -8.594 |
anamo | -7.818 |
Mehran | -7.533 |
aryl | -7.479 |
ares | -7.458 |
Token | each |
Token ID | 1123 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
Zoro | +6.351 |
ells | +5.574 |
ibilities | +5.424 |
chapter | +5.196 |
ible | +5.084 |
Neg logit contributions | |
ATH | -8.043 |
anamo | -7.478 |
aryl | -7.276 |
Mehran | -7.050 |
aring | -7.025 |
Token | side |
Token ID | 1735 |
Feature activation | -6.16e-01 |
Pos logit contributions | |
Zoro | +6.327 |
chapter | +5.189 |
ibilities | +5.089 |
ells | +4.998 |
ible | +4.839 |
Neg logit contributions | |
ATH | -11.156 |
anamo | -10.803 |
aryl | -10.103 |
merce | -9.963 |
ARE | -9.955 |
Token | for |
Token ID | 329 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Zoro | +4.420 |
ibilities | +3.836 |
ells | +3.802 |
chapter | +3.590 |
ible | +3.455 |
Neg logit contributions | |
ATH | -5.795 |
anamo | -5.226 |
ares | -5.104 |
Mehran | -5.062 |
ARE | -5.058 |
Token | about |
Token ID | 546 |
Feature activation | -9.47e-01 |
Pos logit contributions | |
Zoro | +7.825 |
chapter | +6.545 |
ells | +6.506 |
ibilities | +6.301 |
vitamins | +6.133 |
Neg logit contributions | |
ATH | -10.850 |
anamo | -10.166 |
aryl | -9.696 |
merce | -9.646 |
aring | -9.534 |
Token | 2 |
Token ID | 362 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
Zoro | +6.756 |
ells | +5.758 |
chapter | +5.671 |
ibilities | +5.658 |
vitamins | +5.248 |
Neg logit contributions | |
ATH | -8.742 |
anamo | -8.011 |
aryl | -7.721 |
ARE | -7.632 |
aring | -7.622 |
Token | / |
Token ID | 14 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
Zoro | +7.047 |
ells | +5.991 |
ibilities | +5.956 |
chapter | +5.700 |
| +5.372 |
Neg logit contributions | |
ATH | -14.196 |
anamo | -13.628 |
Mehran | -12.954 |
aryl | -12.859 |
aldi | -12.793 |
Token | 3 |
Token ID | 18 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
Zoro | +3.494 |
ibilities | +3.186 |
ells | +3.152 |
chapter | +2.964 |
ible | +2.888 |
Neg logit contributions | |
ATH | -3.235 |
anamo | -2.878 |
Mehran | -2.779 |
ares | -2.777 |
aring | -2.764 |
Token | minutes |
Token ID | 2431 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
Zoro | +9.601 |
chapter | +8.290 |
ibilities | +7.997 |
ells | +7.825 |
ible | +7.746 |
Neg logit contributions | |
anamo | -13.060 |
ATH | -13.035 |
ARE | -12.012 |
Mehran | -11.852 |
aryl | -11.800 |
Token | until |
Token ID | 1566 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
Zoro | +1.083 |
ibilities | +0.968 |
ells | +0.957 |
chapter | +0.889 |
vitamins | +0.862 |
Neg logit contributions | |
ATH | -1.240 |
ares | -1.089 |
anamo | -1.083 |
aring | -1.082 |
ARE | -1.073 |
Token | golden |
Token ID | 10861 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
Zoro | +7.029 |
ells | +5.967 |
ibilities | +5.883 |
chapter | +5.730 |
vitamins | +5.585 |
Neg logit contributions | |
ATH | -9.230 |
anamo | -8.564 |
ares | -8.194 |
aryl | -8.191 |
ARE | -8.098 |
Token | B |
Token ID | 33 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
Zoro | +3.343 |
ells | +3.001 |
ibilities | +2.995 |
chapter | +2.833 |
ible | +2.698 |
Neg logit contributions | |
ATH | -3.656 |
anamo | -3.314 |
ares | -3.263 |
aring | -3.210 |
aldi | -3.204 |
Token | , |
Token ID | 11 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
Zoro | +1.588 |
ibilities | +1.410 |
ells | +1.394 |
chapter | +1.307 |
vitamins | +1.257 |
Neg logit contributions | |
ATH | -1.907 |
anamo | -1.684 |
ares | -1.680 |
aring | -1.670 |
ARE | -1.657 |
Token | � |
Token ID | 447 |
Feature activation | +5.01e-02 |
Pos logit contributions | |
ATH | +1.917 |
ares | +1.660 |
aring | +1.654 |
ARE | +1.638 |
anamo | +1.636 |
Neg logit contributions | |
Zoro | -1.922 |
ibilities | -1.769 |
ells | -1.735 |
chapter | -1.576 |
ible | -1.564 |
Token | � |
Token ID | 251 |
Feature activation | +8.52e-02 |
Pos logit contributions | |
ATH | +0.362 |
ares | +0.308 |
aring | +0.305 |
anamo | +0.303 |
ARE | +0.302 |
Neg logit contributions | |
Zoro | -0.478 |
ibilities | -0.437 |
ells | -0.432 |
chapter | -0.406 |
vitamins | -0.398 |
Token | said |
Token ID | 531 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
ATH | +0.726 |
ares | +0.633 |
aring | +0.630 |
anamo | +0.624 |
ARE | +0.622 |
Neg logit contributions | |
Zoro | -0.702 |
ibilities | -0.637 |
ells | -0.626 |
chapter | -0.579 |
ible | -0.566 |
Token | board |
Token ID | 3096 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
Zoro | +2.040 |
ibilities | +1.840 |
ells | +1.827 |
chapter | +1.728 |
vitamins | +1.673 |
Neg logit contributions | |
ATH | -1.804 |
anamo | -1.555 |
ares | -1.553 |
aring | -1.540 |
ARE | -1.526 |
Token | chair |
Token ID | 5118 |
Feature activation | -4.09e-01 |
Pos logit contributions | |
Zoro | +9.225 |
chapter | +8.135 |
ells | +8.022 |
ibilities | +7.997 |
| +7.533 |
Neg logit contributions | |
ATH | -11.939 |
anamo | -11.267 |
ares | -10.593 |
adish | -10.442 |
aryl | -10.405 |
Token | Mari |
Token ID | 29423 |
Feature activation | -3.60e-01 |
Pos logit contributions | |
Zoro | +3.824 |
ibilities | +3.469 |
ells | +3.453 |
chapter | +3.270 |
ible | +3.186 |
Neg logit contributions | |
ATH | -2.990 |
anamo | -2.568 |
ares | -2.515 |
ARE | -2.482 |
aring | -2.472 |
Token | Rut |
Token ID | 21214 |
Feature activation | -5.01e-02 |
Pos logit contributions | |
Zoro | +3.198 |
ibilities | +2.883 |
ells | +2.861 |
chapter | +2.692 |
ible | +2.625 |
Neg logit contributions | |
ATH | -2.809 |
anamo | -2.425 |
ares | -2.389 |
aring | -2.379 |
ARE | -2.366 |
Token | ka |
Token ID | 4914 |
Feature activation | -7.59e-01 |
Pos logit contributions | |
Zoro | +0.407 |
ibilities | +0.364 |
ells | +0.360 |
chapter | +0.336 |
vitamins | +0.327 |
Neg logit contributions | |
ATH | -0.432 |
ares | -0.379 |
anamo | -0.377 |
aring | -0.376 |
ARE | -0.372 |
Token | in |
Token ID | 287 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
Zoro | +5.185 |
ells | +4.509 |
ibilities | +4.451 |
chapter | +4.243 |
ible | +4.066 |
Neg logit contributions | |
ATH | -7.105 |
anamo | -6.470 |
aldi | -6.219 |
ares | -6.210 |
ARE | -6.179 |
Token | Ground |
Token ID | 13706 |
Feature activation | -4.17e-01 |
Pos logit contributions | |
ATH | +2.331 |
aring | +2.045 |
ares | +2.039 |
Stacy | +2.036 |
ARE | +2.014 |
Neg logit contributions | |
Zoro | -2.171 |
ibilities | -1.992 |
ells | -1.950 |
ible | -1.748 |
chapter | -1.746 |
Token | Zero |
Token ID | 12169 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
Zoro | +3.750 |
ells | +3.402 |
ibilities | +3.396 |
chapter | +3.217 |
ible | +3.124 |
Neg logit contributions | |
ATH | -3.182 |
anamo | -2.693 |
merce | -2.678 |
ares | -2.668 |
Mehran | -2.660 |
Token | for |
Token ID | 329 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
ATH | +0.916 |
ares | +0.804 |
aring | +0.803 |
ARE | +0.791 |
anamo | +0.790 |
Neg logit contributions | |
Zoro | -0.835 |
ibilities | -0.753 |
ells | -0.744 |
chapter | -0.678 |
ible | -0.669 |
Token | social |
Token ID | 1919 |
Feature activation | +6.96e-02 |
Pos logit contributions | |
ATH | +0.856 |
ares | +0.750 |
aring | +0.745 |
anamo | +0.738 |
ARE | +0.736 |
Neg logit contributions | |
Zoro | -0.821 |
ibilities | -0.745 |
ells | -0.734 |
chapter | -0.674 |
ible | -0.662 |
Token | justice |
Token ID | 5316 |
Feature activation | -8.65e-03 |
Pos logit contributions | |
ATH | +0.592 |
ares | +0.516 |
anamo | +0.515 |
aring | +0.512 |
ARE | +0.508 |
Neg logit contributions | |
Zoro | -0.573 |
ibilities | -0.515 |
ells | -0.509 |
chapter | -0.477 |
vitamins | -0.462 |
Token | brain |
Token ID | 3632 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
Zoro | +0.070 |
ibilities | +0.064 |
ells | +0.063 |
chapter | +0.058 |
ible | +0.056 |
Neg logit contributions | |
ATH | -0.074 |
ares | -0.065 |
aring | -0.065 |
ARE | -0.064 |
anamo | -0.064 |
Token | washing |
Token ID | 38524 |
Feature activation | -2.26e-01 |
Pos logit contributions | |
Zoro | +9.190 |
ells | +8.253 |
ibilities | +8.140 |
chapter | +8.018 |
vitamins | +8.009 |
Neg logit contributions | |
ATH | -11.576 |
Mehran | -10.492 |
anamo | -10.325 |
aryl | -10.145 |
merce | -10.139 |
Token | , |
Token ID | 11 |
Feature activation | +1.41e-02 |
Pos logit contributions | |
Zoro | +1.823 |
ibilities | +1.634 |
ells | +1.614 |
chapter | +1.513 |
vitamins | +1.467 |
Neg logit contributions | |
ATH | -1.959 |
anamo | -1.714 |
ares | -1.712 |
aring | -1.700 |
ARE | -1.687 |
Token | the |
Token ID | 262 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
ATH | +0.124 |
ares | +0.108 |
aring | +0.108 |
anamo | +0.107 |
ARE | +0.107 |
Neg logit contributions | |
Zoro | -0.112 |
ibilities | -0.101 |
ells | -0.100 |
chapter | -0.092 |
ible | -0.089 |
Token | Social |
Token ID | 5483 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
ATH | +0.913 |
ares | +0.800 |
aring | +0.796 |
anamo | +0.788 |
Stacy | +0.785 |
Neg logit contributions | |
Zoro | -0.859 |
ibilities | -0.776 |
ells | -0.766 |
chapter | -0.700 |
ible | -0.689 |
Token | Justice |
Token ID | 4796 |
Feature activation | -2.24e-01 |
Pos logit contributions | |
Zoro | +1.274 |
ibilities | +1.136 |
ells | +1.133 |
chapter | +1.067 |
ible | +1.025 |
Neg logit contributions | |
ATH | -1.364 |
anamo | -1.198 |
ares | -1.184 |
aldi | -1.172 |
aring | -1.171 |
Token | the |
Token ID | 262 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
ATH | +1.637 |
ares | +1.433 |
aring | +1.419 |
ARE | +1.414 |
anamo | +1.402 |
Neg logit contributions | |
Zoro | -1.424 |
ibilities | -1.293 |
ells | -1.267 |
chapter | -1.172 |
ible | -1.140 |
Token | more |
Token ID | 517 |
Feature activation | -8.02e-01 |
Pos logit contributions | |
Zoro | +2.098 |
ibilities | +1.873 |
ells | +1.853 |
chapter | +1.726 |
vitamins | +1.674 |
Neg logit contributions | |
ATH | -2.364 |
ares | -2.073 |
anamo | -2.067 |
aring | -2.060 |
ARE | -2.043 |
Token | compact |
Token ID | 16001 |
Feature activation | -5.81e-01 |
Pos logit contributions | |
Zoro | +5.993 |
ells | +5.151 |
ibilities | +5.122 |
chapter | +4.929 |
vitamins | +4.733 |
Neg logit contributions | |
ATH | -7.212 |
anamo | -6.613 |
ARE | -6.343 |
ares | -6.339 |
aring | -6.287 |
Token | yo |
Token ID | 27406 |
Feature activation | -9.39e-01 |
Pos logit contributions | |
Zoro | +3.907 |
ibilities | +3.357 |
ells | +3.351 |
chapter | +3.067 |
ible | +2.993 |
Neg logit contributions | |
ATH | -5.803 |
anamo | -5.226 |
ares | -5.127 |
ARE | -5.103 |
aring | -5.098 |
Token | - |
Token ID | 12 |
Feature activation | -8.00e-01 |
Pos logit contributions | |
Zoro | +6.134 |
ells | +5.320 |
ibilities | +5.233 |
chapter | +4.853 |
ible | +4.641 |
Neg logit contributions | |
ATH | -9.122 |
anamo | -8.435 |
merce | -8.158 |
aldi | -8.131 |
ARE | -8.119 |
Token | y |
Token ID | 88 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
Zoro | +6.109 |
ells | +5.759 |
ibilities | +5.621 |
ible | +5.022 |
vitamins | +5.004 |
Neg logit contributions | |
ATH | -6.698 |
Stacy | -5.850 |
ARE | -5.832 |
aldi | -5.801 |
anamo | -5.796 |
Token | os |
Token ID | 418 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
Zoro | +10.351 |
ells | +9.937 |
ibilities | +9.490 |
ible | +8.532 |
chapter | +8.474 |
Neg logit contributions | |
ATH | -10.906 |
ARE | -9.597 |
Stacy | -9.553 |
anamo | -9.376 |
aryl | -9.297 |
Token | in |
Token ID | 287 |
Feature activation | -4.60e-02 |
Pos logit contributions | |
Zoro | +0.888 |
ibilities | +0.797 |
ells | +0.787 |
chapter | +0.732 |
vitamins | +0.711 |
Neg logit contributions | |
ATH | -0.982 |
ares | -0.861 |
aring | -0.856 |
anamo | -0.855 |
ARE | -0.847 |
Token | this |
Token ID | 428 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
Zoro | +0.356 |
ibilities | +0.318 |
ells | +0.315 |
chapter | +0.292 |
vitamins | +0.283 |
Neg logit contributions | |
ATH | -0.413 |
ares | -0.363 |
anamo | -0.363 |
aring | -0.361 |
ARE | -0.358 |
Token | shootout |
Token ID | 34995 |
Feature activation | -6.85e-02 |
Pos logit contributions | |
ATH | +2.194 |
ares | +1.828 |
aring | +1.802 |
ARE | +1.775 |
anamo | +1.773 |
Neg logit contributions | |
Zoro | -3.530 |
ibilities | -3.314 |
ells | -3.241 |
ible | -3.032 |
chapter | -3.028 |
Token | , |
Token ID | 11 |
Feature activation | -3.49e-02 |
Pos logit contributions | |
Zoro | +0.535 |
ibilities | +0.480 |
ells | +0.473 |
chapter | +0.439 |
vitamins | +0.427 |
Neg logit contributions | |
ATH | -0.611 |
ares | -0.537 |
aring | -0.534 |
anamo | -0.532 |
ARE | -0.528 |
Token | are |
Token ID | 389 |
Feature activation | -7.23e-01 |
Pos logit contributions | |
Zoro | +2.245 |
ibilities | +2.005 |
ells | +1.980 |
chapter | +1.863 |
vitamins | +1.798 |
Neg logit contributions | |
ATH | -2.415 |
anamo | -2.122 |
ares | -2.105 |
aring | -2.088 |
aryl | -2.077 |
Token | moving |
Token ID | 3867 |
Feature activation | -3.68e-01 |
Pos logit contributions | |
Zoro | +5.690 |
ells | +5.012 |
ibilities | +4.980 |
chapter | +4.805 |
vitamins | +4.512 |
Neg logit contributions | |
ATH | -6.228 |
anamo | -5.597 |
ares | -5.429 |
ARE | -5.401 |
aryl | -5.382 |
Token | along |
Token ID | 1863 |
Feature activation | -2.89e-01 |
Pos logit contributions | |
Zoro | +2.978 |
ibilities | +2.634 |
ells | +2.623 |
chapter | +2.479 |
ible | +2.377 |
Neg logit contributions | |
ATH | -3.176 |
anamo | -2.804 |
ares | -2.782 |
aring | -2.756 |
ARE | -2.733 |
Token | . |
Token ID | 13 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
Zoro | +2.239 |
ibilities | +1.983 |
ells | +1.958 |
chapter | +1.840 |
ible | +1.770 |
Neg logit contributions | |
ATH | -2.602 |
anamo | -2.305 |
ares | -2.292 |
aring | -2.273 |
ARE | -2.258 |
Token | Good |
Token ID | 4599 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
Zoro | +3.763 |
ibilities | +3.335 |
ells | +3.315 |
chapter | +3.149 |
ible | +3.020 |
Neg logit contributions | |
ATH | -3.918 |
anamo | -3.490 |
ares | -3.425 |
aring | -3.408 |
aryl | -3.390 |
Token | ? |
Token ID | 30 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
Zoro | +1.454 |
ells | +1.309 |
ibilities | +1.304 |
chapter | +1.212 |
vitamins | +1.171 |
Neg logit contributions | |
ATH | -1.708 |
anamo | -1.520 |
ares | -1.494 |
aring | -1.483 |
ARE | -1.480 |
Token | Why |
Token ID | 4162 |
Feature activation | -1.76e-01 |
Pos logit contributions | |
Zoro | +8.060 |
ells | +6.549 |
ibilities | +6.350 |
chapter | +6.178 |
| +5.985 |
Neg logit contributions | |
ATH | -13.437 |
anamo | -12.368 |
merce | -12.216 |
aryl | -12.159 |
aldi | -12.020 |
Token | good |
Token ID | 922 |
Feature activation | -2.28e-01 |
Pos logit contributions | |
Zoro | +1.421 |
ibilities | +1.278 |
ells | +1.259 |
chapter | +1.161 |
vitamins | +1.133 |
Neg logit contributions | |
ATH | -1.522 |
ares | -1.336 |
aring | -1.330 |
ARE | -1.318 |
anamo | -1.309 |
Token | ? |
Token ID | 30 |
Feature activation | -9.76e-01 |
Pos logit contributions | |
Zoro | +1.798 |
ibilities | +1.610 |
ells | +1.588 |
chapter | +1.477 |
vitamins | +1.433 |
Neg logit contributions | |
ATH | -2.020 |
ares | -1.772 |
aring | -1.760 |
anamo | -1.756 |
ARE | -1.745 |
Token | We |
Token ID | 775 |
Feature activation | -6.46e-01 |
Pos logit contributions | |
Zoro | +5.644 |
ells | +4.481 |
ibilities | +4.392 |
chapter | +4.305 |
| +4.123 |
Neg logit contributions | |
ATH | -10.173 |
anamo | -9.858 |
merce | -9.815 |
aryl | -9.564 |
aldi | -9.462 |
Token | need |
Token ID | 761 |
Feature activation | +3.04e-01 |
Pos logit contributions | |
Zoro | +3.699 |
ibilities | +3.158 |
ells | +3.077 |
chapter | +2.922 |
ible | +2.765 |
Neg logit contributions | |
ATH | -6.974 |
anamo | -6.454 |
Mehran | -6.259 |
aldi | -6.250 |
aryl | -6.243 |
Token | s |
Token ID | 82 |
Feature activation | -7.27e-02 |
Pos logit contributions | |
Zoro | +1.084 |
ibilities | +0.972 |
ells | +0.962 |
chapter | +0.898 |
vitamins | +0.870 |
Neg logit contributions | |
ATH | -1.161 |
ares | -1.015 |
anamo | -1.012 |
aring | -1.008 |
ARE | -1.000 |
Token | forthcoming |
Token ID | 21220 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
Zoro | +0.600 |
ibilities | +0.541 |
ells | +0.535 |
chapter | +0.495 |
vitamins | +0.483 |
Neg logit contributions | |
ATH | -0.617 |
ares | -0.539 |
aring | -0.535 |
anamo | -0.531 |
ARE | -0.528 |
Token | Netflix |
Token ID | 12074 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
Zoro | +1.425 |
ibilities | +1.288 |
ells | +1.275 |
chapter | +1.188 |
vitamins | +1.158 |
Neg logit contributions | |
ATH | -1.379 |
ares | -1.198 |
aring | -1.190 |
anamo | -1.186 |
ARE | -1.176 |
Token | series |
Token ID | 2168 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
Zoro | +2.489 |
ibilities | +2.243 |
ells | +2.219 |
chapter | +2.088 |
vitamins | +2.025 |
Neg logit contributions | |
ATH | -2.403 |
ares | -2.085 |
anamo | -2.081 |
aring | -2.068 |
ARE | -2.051 |
Token | , |
Token ID | 11 |
Feature activation | -4.67e-01 |
Pos logit contributions | |
Zoro | +1.098 |
ibilities | +0.982 |
ells | +0.972 |
chapter | +0.907 |
vitamins | +0.879 |
Neg logit contributions | |
ATH | -1.189 |
ares | -1.039 |
anamo | -1.036 |
aring | -1.032 |
ARE | -1.024 |
Token | Mind |
Token ID | 10175 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
Zoro | +3.820 |
ibilities | +3.367 |
ells | +3.357 |
chapter | +3.198 |
vitamins | +3.072 |
Neg logit contributions | |
ATH | -3.928 |
anamo | -3.431 |
ares | -3.424 |
aring | -3.386 |
ARE | -3.381 |
Token | hunter |
Token ID | 37488 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
Zoro | +10.101 |
ells | +9.151 |
chapter | +8.567 |
ibilities | +8.419 |
| +8.363 |
Neg logit contributions | |
ATH | -11.265 |
merce | -10.259 |
Mehran | -10.185 |
ares | -9.642 |
ARE | -9.481 |
Token | . |
Token ID | 13 |
Feature activation | +4.72e-02 |
Pos logit contributions | |
ATH | +1.551 |
ares | +1.359 |
aring | +1.352 |
anamo | +1.346 |
ARE | +1.337 |
Neg logit contributions | |
Zoro | -1.362 |
ibilities | -1.228 |
ells | -1.210 |
chapter | -1.114 |
ible | -1.088 |
Token | � |
Token ID | 564 |
Feature activation | +9.08e-02 |
Pos logit contributions | |
ATH | +0.410 |
ares | +0.360 |
aring | +0.357 |
ARE | +0.354 |
anamo | +0.353 |
Neg logit contributions | |
Zoro | -0.380 |
ibilities | -0.345 |
ells | -0.337 |
chapter | -0.313 |
vitamins | -0.307 |
Token | � |
Token ID | 250 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
ATH | +0.638 |
ares | +0.538 |
aring | +0.534 |
anamo | +0.531 |
ARE | +0.526 |
Neg logit contributions | |
Zoro | -0.886 |
ibilities | -0.812 |
ells | -0.802 |
chapter | -0.757 |
vitamins | -0.741 |
Token | No |
Token ID | 2949 |
Feature activation | -4.18e-01 |
Pos logit contributions | |
Zoro | +2.198 |
ibilities | +1.981 |
ells | +1.965 |
chapter | +1.836 |
ible | +1.784 |
Neg logit contributions | |
ATH | -2.179 |
ares | -1.897 |
anamo | -1.896 |
aring | -1.883 |
ARE | -1.861 |
Token | this |
Token ID | 428 |
Feature activation | -8.24e-02 |
Pos logit contributions | |
Zoro | +0.670 |
ibilities | +0.605 |
ells | +0.597 |
chapter | +0.550 |
ible | +0.538 |
Neg logit contributions | |
ATH | -0.737 |
ares | -0.647 |
aring | -0.642 |
anamo | -0.641 |
ARE | -0.636 |
Token | week |
Token ID | 1285 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
Zoro | +0.619 |
ibilities | +0.554 |
ells | +0.546 |
chapter | +0.502 |
vitamins | +0.489 |
Neg logit contributions | |
ATH | -0.759 |
ares | -0.670 |
aring | -0.665 |
anamo | -0.663 |
ARE | -0.659 |
Token | , |
Token ID | 11 |
Feature activation | -6.98e-02 |
Pos logit contributions | |
Zoro | +1.225 |
ibilities | +1.087 |
ells | +1.076 |
chapter | +1.004 |
vitamins | +0.969 |
Neg logit contributions | |
ATH | -1.440 |
ares | -1.268 |
anamo | -1.265 |
aring | -1.261 |
ARE | -1.251 |
Token | the |
Token ID | 262 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
Zoro | +0.556 |
ibilities | +0.501 |
ells | +0.495 |
chapter | +0.458 |
ible | +0.446 |
Neg logit contributions | |
ATH | -0.611 |
ares | -0.535 |
anamo | -0.532 |
aring | -0.531 |
ARE | -0.527 |
Token | reliably |
Token ID | 26995 |
Feature activation | -5.88e-01 |
Pos logit contributions | |
Zoro | +2.911 |
ibilities | +2.594 |
ells | +2.562 |
chapter | +2.417 |
vitamins | +2.331 |
Neg logit contributions | |
ATH | -3.158 |
ares | -2.764 |
anamo | -2.763 |
aring | -2.748 |
ARE | -2.724 |
Token | offensive |
Token ID | 5859 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
Zoro | +4.545 |
ibilities | +3.963 |
ells | +3.942 |
chapter | +3.772 |
vitamins | +3.603 |
Neg logit contributions | |
ATH | -5.213 |
anamo | -4.670 |
ares | -4.600 |
aldi | -4.539 |
ARE | -4.535 |
Token | Fox |
Token ID | 5426 |
Feature activation | -3.73e-01 |
Pos logit contributions | |
Zoro | +10.562 |
chapter | +9.140 |
ibilities | +8.935 |
ells | +8.832 |
| +8.547 |
Neg logit contributions | |
ATH | -10.693 |
anamo | -9.711 |
aring | -9.206 |
merce | -9.196 |
ARE | -9.152 |
Token | News |
Token ID | 3000 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
Zoro | +2.969 |
ells | +2.619 |
ibilities | +2.617 |
chapter | +2.482 |
vitamins | +2.374 |
Neg logit contributions | |
ATH | -3.247 |
anamo | -2.855 |
ares | -2.853 |
aring | -2.829 |
ARE | -2.813 |
Token | show |
Token ID | 905 |
Feature activation | -5.87e-01 |
Pos logit contributions | |
Zoro | +2.260 |
ibilities | +2.006 |
ells | +1.984 |
chapter | +1.876 |
vitamins | +1.807 |
Neg logit contributions | |
ATH | -2.525 |
ares | -2.213 |
anamo | -2.211 |
aring | -2.202 |
ARE | -2.185 |
Token | managed |
Token ID | 5257 |
Feature activation | +4.48e-02 |
Pos logit contributions | |
Zoro | +4.502 |
ibilities | +3.905 |
ells | +3.889 |
chapter | +3.717 |
vitamins | +3.541 |
Neg logit contributions | |
ATH | -5.248 |
anamo | -4.608 |
ares | -4.566 |
ARE | -4.564 |
aring | -4.556 |
Token | to |
Token ID | 284 |
Feature activation | +1.79e-01 |
Pos logit contributions | |
ATH | +0.407 |
anamo | +0.361 |
ares | +0.358 |
aring | +0.357 |
ARE | +0.354 |
Neg logit contributions | |
Zoro | -0.340 |
ibilities | -0.303 |
ells | -0.301 |
chapter | -0.281 |
vitamins | -0.270 |
Token | of |
Token ID | 286 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
ATH | +0.325 |
aring | +0.282 |
ares | +0.281 |
anamo | +0.279 |
ARE | +0.277 |
Neg logit contributions | |
Zoro | -0.323 |
ibilities | -0.291 |
ells | -0.289 |
chapter | -0.267 |
vitamins | -0.260 |
Token | the |
Token ID | 262 |
Feature activation | -2.94e-01 |
Pos logit contributions | |
Zoro | +0.893 |
ibilities | +0.809 |
ells | +0.801 |
chapter | +0.741 |
ible | +0.724 |
Neg logit contributions | |
ATH | -0.887 |
ares | -0.771 |
aring | -0.766 |
anamo | -0.762 |
ARE | -0.757 |
Token | theory |
Token ID | 4583 |
Feature activation | -5.58e-02 |
Pos logit contributions | |
Zoro | +2.489 |
ibilities | +2.228 |
ells | +2.201 |
chapter | +2.092 |
vitamins | +2.022 |
Neg logit contributions | |
ATH | -2.440 |
anamo | -2.127 |
ares | -2.121 |
aring | -2.105 |
ARE | -2.089 |
Token | is |
Token ID | 318 |
Feature activation | -7.44e-01 |
Pos logit contributions | |
Zoro | +0.450 |
ibilities | +0.405 |
ells | +0.400 |
chapter | +0.372 |
vitamins | +0.362 |
Neg logit contributions | |
ATH | -0.483 |
ares | -0.423 |
aring | -0.421 |
anamo | -0.420 |
ARE | -0.416 |
Token | its |
Token ID | 663 |
Feature activation | -5.05e-01 |
Pos logit contributions | |
Zoro | +5.061 |
ibilities | +4.311 |
ells | +4.182 |
chapter | +4.114 |
vitamins | +3.858 |
Neg logit contributions | |
ATH | -7.163 |
anamo | -6.436 |
ares | -6.356 |
ARE | -6.346 |
aldi | -6.332 |
Token | alleged |
Token ID | 4260 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
Zoro | +3.888 |
ibilities | +3.405 |
ells | +3.352 |
chapter | +3.237 |
vitamins | +3.068 |
Neg logit contributions | |
ATH | -4.583 |
anamo | -4.084 |
ares | -4.014 |
ARE | -3.968 |
aring | -3.966 |
Token | ability |
Token ID | 2694 |
Feature activation | -4.81e-01 |
Pos logit contributions | |
Zoro | +9.951 |
ibilities | +8.595 |
chapter | +8.561 |
ells | +8.120 |
vitamins | +7.977 |
Neg logit contributions | |
ATH | -11.399 |
anamo | -10.705 |
aldi | -9.954 |
merce | -9.931 |
ARE | -9.889 |
Token | to |
Token ID | 284 |
Feature activation | -9.93e-02 |
Pos logit contributions | |
Zoro | +3.201 |
ibilities | +2.850 |
ells | +2.725 |
chapter | +2.610 |
ible | +2.507 |
Neg logit contributions | |
ATH | -4.696 |
anamo | -4.244 |
ares | -4.214 |
aldi | -4.186 |
ARE | -4.182 |
Token | combine |
Token ID | 12082 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
Zoro | +0.814 |
ibilities | +0.731 |
ells | +0.729 |
chapter | +0.668 |
vitamins | +0.654 |
Neg logit contributions | |
ATH | -0.843 |
ares | -0.735 |
aring | -0.734 |
ARE | -0.721 |
aryl | -0.718 |
Token | an |
Token ID | 281 |
Feature activation | -9.24e-02 |
Pos logit contributions | |
ATH | +2.493 |
ares | +2.211 |
aring | +2.198 |
Stacy | +2.168 |
ARE | +2.166 |
Neg logit contributions | |
Zoro | -2.241 |
ells | -2.053 |
ibilities | -2.052 |
chapter | -1.820 |
ible | -1.787 |
Token | acceptance |
Token ID | 13427 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
Zoro | +0.762 |
ibilities | +0.685 |
ells | +0.677 |
chapter | +0.633 |
vitamins | +0.614 |
Neg logit contributions | |
ATH | -0.785 |
ares | -0.685 |
anamo | -0.681 |
aring | -0.680 |
ARE | -0.674 |
Token | about |
Token ID | 546 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
ATH | +1.255 |
ares | +1.101 |
aring | +1.098 |
ARE | +1.088 |
Stacy | +1.080 |
Neg logit contributions | |
Zoro | -1.158 |
ibilities | -1.048 |
ells | -1.027 |
chapter | -0.947 |
vitamins | -0.937 |
Token | this |
Token ID | 428 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
Zoro | +1.250 |
ibilities | +1.113 |
ells | +1.102 |
chapter | +1.039 |
vitamins | +1.000 |
Neg logit contributions | |
ATH | -1.385 |
anamo | -1.213 |
ares | -1.210 |
aring | -1.201 |
ARE | -1.196 |
Token | article |
Token ID | 2708 |
Feature activation | +6.01e-01 |
Pos logit contributions | |
ATH | +4.651 |
aring | +4.043 |
ares | +4.024 |
Stacy | +3.989 |
ARE | +3.968 |
Neg logit contributions | |
Zoro | -4.872 |
ibilities | -4.468 |
ells | -4.408 |
ibly | -3.973 |
ible | -3.962 |
Token | Santos |
Token ID | 28458 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
ATH | +4.899 |
aring | +4.297 |
ARE | +4.293 |
ares | +4.252 |
Stacy | +4.164 |
Neg logit contributions | |
Zoro | -4.977 |
ibilities | -4.569 |
ells | -4.389 |
vitamins | -4.059 |
chapter | -4.016 |
Token | Tour |
Token ID | 9852 |
Feature activation | -4.34e-01 |
Pos logit contributions | |
Zoro | +0.931 |
ibilities | +0.839 |
ells | +0.829 |
chapter | +0.773 |
vitamins | +0.753 |
Neg logit contributions | |
ATH | -0.944 |
ares | -0.823 |
anamo | -0.818 |
aring | -0.817 |
ARE | -0.809 |
Token | Down |
Token ID | 5588 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
Zoro | +3.451 |
ibilities | +3.068 |
ells | +3.059 |
chapter | +2.878 |
vitamins | +2.769 |
Neg logit contributions | |
ATH | -3.772 |
anamo | -3.322 |
ares | -3.286 |
ARE | -3.272 |
aring | -3.268 |
Token | Under |
Token ID | 4698 |
Feature activation | +3.28e-02 |
Pos logit contributions | |
Zoro | +7.182 |
ells | +6.417 |
ibilities | +6.308 |
chapter | +5.642 |
ible | +5.562 |
Neg logit contributions | |
ATH | -13.532 |
anamo | -12.388 |
merce | -12.152 |
ARE | -11.961 |
aldi | -11.939 |
Token | Stage |
Token ID | 15371 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
ATH | +0.287 |
ares | +0.252 |
aring | +0.250 |
ARE | +0.248 |
anamo | +0.247 |
Neg logit contributions | |
Zoro | -0.262 |
ibilities | -0.236 |
ells | -0.233 |
chapter | -0.214 |
ible | -0.210 |
Token | 2 |
Token ID | 362 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
ATH | +1.526 |
ares | +1.349 |
aring | +1.342 |
ARE | +1.328 |
aldi | +1.321 |
Neg logit contributions | |
Zoro | -1.318 |
ibilities | -1.195 |
ells | -1.189 |
chapter | -1.066 |
ible | -1.049 |
Token | Results |
Token ID | 15691 |
Feature activation | +9.04e-02 |
Pos logit contributions | |
Zoro | +1.237 |
ibilities | +1.109 |
ells | +1.097 |
chapter | +1.024 |
vitamins | +0.993 |
Neg logit contributions | |
ATH | -1.318 |
ares | -1.152 |
anamo | -1.147 |
aring | -1.144 |
ARE | -1.134 |
Token | : |
Token ID | 25 |
Feature activation | -7.90e-02 |
Pos logit contributions | |
ATH | +0.789 |
ares | +0.697 |
aring | +0.690 |
ARE | +0.684 |
anamo | +0.678 |
Neg logit contributions | |
Zoro | -0.716 |
ibilities | -0.651 |
ells | -0.643 |
chapter | -0.588 |
vitamins | -0.578 |
Token | find |
Token ID | 1064 |
Feature activation | +9.13e-02 |
Pos logit contributions | |
ATH | +2.653 |
aring | +2.330 |
ares | +2.301 |
Stacy | +2.250 |
aldi | +2.236 |
Neg logit contributions | |
Zoro | -2.850 |
ells | -2.592 |
ibilities | -2.564 |
ible | -2.316 |
chapter | -2.316 |
Token | much |
Token ID | 881 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
ATH | +0.787 |
ares | +0.690 |
aring | +0.687 |
anamo | +0.679 |
ARE | +0.677 |
Neg logit contributions | |
Zoro | -0.735 |
ibilities | -0.660 |
ells | -0.657 |
chapter | -0.603 |
ible | -0.589 |
Token | to |
Token ID | 284 |
Feature activation | +5.61e-01 |
Pos logit contributions | |
ATH | +1.377 |
ares | +1.198 |
aring | +1.191 |
ARE | +1.176 |
Stacy | +1.168 |
Neg logit contributions | |
Zoro | -1.336 |
ells | -1.214 |
ibilities | -1.208 |
chapter | -1.098 |
ible | -1.078 |
Token | like |
Token ID | 588 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
ATH | +4.636 |
aring | +4.003 |
ares | +3.984 |
ARE | +3.931 |
Stacy | +3.917 |
Neg logit contributions | |
Zoro | -4.534 |
ells | -4.126 |
ibilities | -4.077 |
vitamins | -3.634 |
chapter | -3.626 |
Token | about |
Token ID | 546 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
ATH | +2.444 |
aring | +2.110 |
ares | +2.105 |
Stacy | +2.094 |
anamo | +2.088 |
Neg logit contributions | |
Zoro | -2.298 |
ells | -2.093 |
ibilities | -2.090 |
chapter | -1.889 |
vitamins | -1.863 |
Token | Fedora |
Token ID | 32245 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
Zoro | +0.929 |
ibilities | +0.833 |
ells | +0.823 |
chapter | +0.770 |
vitamins | +0.747 |
Neg logit contributions | |
ATH | -0.989 |
ares | -0.865 |
anamo | -0.862 |
aring | -0.858 |
ARE | -0.852 |
Token | 24 |
Token ID | 1987 |
Feature activation | +7.43e-01 |
Pos logit contributions | |
ATH | +9.552 |
aldi | +7.965 |
Stacy | +7.878 |
aring | +7.878 |
aria | +7.874 |
Neg logit contributions | |
Zoro | -9.707 |
ibilities | -9.015 |
ells | -8.724 |
vitamins | -8.070 |
ibly | -7.902 |
Token | . |
Token ID | 13 |
Feature activation | +5.86e-01 |
Pos logit contributions | |
ATH | +6.060 |
aring | +5.265 |
aldi | +5.220 |
ares | +5.171 |
Stacy | +5.102 |
Neg logit contributions | |
Zoro | -6.036 |
ibilities | -5.427 |
ells | -5.382 |
chapter | -4.920 |
vitamins | -4.906 |
Token | Also |
Token ID | 4418 |
Feature activation | +9.66e-02 |
Pos logit contributions | |
ATH | +4.719 |
Stacy | +4.104 |
ares | +4.083 |
aring | +4.075 |
ARE | +4.031 |
Neg logit contributions | |
Zoro | -4.786 |
ibilities | -4.468 |
ells | -4.384 |
vitamins | -4.060 |
ibly | -4.014 |
Token | , |
Token ID | 11 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
ATH | +0.858 |
ares | +0.755 |
aring | +0.754 |
anamo | +0.748 |
ARE | +0.742 |
Neg logit contributions | |
Zoro | -0.754 |
ibilities | -0.675 |
ells | -0.667 |
chapter | -0.617 |
vitamins | -0.600 |
Token | anyone |
Token ID | 2687 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
ATH | +2.025 |
aring | +1.796 |
ares | +1.787 |
aldi | +1.758 |
Stacy | +1.756 |
Neg logit contributions | |
Zoro | -1.901 |
ibilities | -1.735 |
ells | -1.728 |
chapter | -1.550 |
ible | -1.534 |
Token | at |
Token ID | 379 |
Feature activation | -5.04e-02 |
Pos logit contributions | |
ATH | +2.809 |
aring | +2.438 |
ARE | +2.430 |
ares | +2.428 |
aldi | +2.414 |
Neg logit contributions | |
Zoro | -2.501 |
ibilities | -2.310 |
ells | -2.230 |
chapter | -2.013 |
ibly | -2.004 |
Token | 5 |
Token ID | 642 |
Feature activation | +4.04e-01 |
Pos logit contributions | |
Zoro | +0.380 |
ibilities | +0.341 |
ells | +0.333 |
ible | +0.303 |
chapter | +0.302 |
Neg logit contributions | |
ATH | -0.459 |
ares | -0.405 |
aring | -0.403 |
anamo | -0.403 |
ARE | -0.402 |
Token | p |
Token ID | 279 |
Feature activation | +4.30e-01 |
Pos logit contributions | |
ATH | +3.167 |
aring | +2.700 |
ares | +2.699 |
ARE | +2.674 |
anamo | +2.664 |
Neg logit contributions | |
Zoro | -3.592 |
ibilities | -3.251 |
ells | -3.197 |
chapter | -2.991 |
ible | -2.936 |
Token | . |
Token ID | 13 |
Feature activation | +6.30e-01 |
Pos logit contributions | |
ATH | +3.303 |
ares | +2.885 |
aring | +2.849 |
ARE | +2.776 |
aria | +2.738 |
Neg logit contributions | |
Zoro | -3.836 |
ibilities | -3.517 |
ells | -3.368 |
vitamins | -3.211 |
chapter | -3.117 |
Token | m |
Token ID | 76 |
Feature activation | +8.87e-01 |
Pos logit contributions | |
ATH | +2.978 |
ares | +2.430 |
aring | +2.372 |
kind | +2.219 |
aria | +2.198 |
Neg logit contributions | |
Zoro | -7.351 |
ibilities | -6.953 |
ells | -6.605 |
vitamins | -6.546 |
chapter | -6.329 |
Token | . |
Token ID | 13 |
Feature activation | +9.03e-01 |
Pos logit contributions | |
ATH | +7.296 |
ares | +6.246 |
aring | +6.227 |
aryl | +6.221 |
ARE | +6.205 |
Neg logit contributions | |
Zoro | -7.319 |
ibilities | -6.529 |
ells | -6.392 |
chapter | -5.925 |
vitamins | -5.886 |
Token | on |
Token ID | 319 |
Feature activation | +6.14e-01 |
Pos logit contributions | |
ATH | +5.870 |
aryl | +4.810 |
ARE | +4.810 |
ares | +4.802 |
Stacy | +4.777 |
Neg logit contributions | |
Zoro | -8.857 |
ibilities | -8.183 |
ells | -8.043 |
ible | -7.567 |
ibly | -7.548 |
Token | Dec |
Token ID | 4280 |
Feature activation | +4.44e-01 |
Pos logit contributions | |
ATH | +4.098 |
Stacy | +3.524 |
ares | +3.491 |
ARE | +3.485 |
aring | +3.454 |
Neg logit contributions | |
Zoro | -5.817 |
ibilities | -5.426 |
ells | -5.321 |
ible | -4.953 |
ibly | -4.889 |
Token | . |
Token ID | 13 |
Feature activation | +4.16e-01 |
Pos logit contributions | |
ATH | +3.477 |
ares | +3.090 |
aring | +3.076 |
ARE | +2.973 |
aria | +2.952 |
Neg logit contributions | |
Zoro | -3.887 |
ibilities | -3.477 |
ells | -3.361 |
vitamins | -3.199 |
chapter | -3.163 |
Token | 27 |
Token ID | 2681 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
ATH | +3.437 |
Stacy | +2.999 |
ares | +2.981 |
aring | +2.939 |
ARE | +2.934 |
Neg logit contributions | |
Zoro | -3.332 |
ibilities | -3.204 |
ells | -3.091 |
vitamins | -2.810 |
ibly | -2.759 |
Token | , |
Token ID | 11 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
ATH | +1.823 |
anamo | +1.623 |
ares | +1.620 |
aring | +1.602 |
ARE | +1.590 |
Neg logit contributions | |
Zoro | -1.440 |
ibilities | -1.283 |
ells | -1.260 |
chapter | -1.178 |
vitamins | -1.127 |
Token | */ |
Token ID | 9466 |
Feature activation | -2.15e-01 |
Pos logit contributions | |
ATH | +2.169 |
ares | +1.935 |
aring | +1.913 |
ARE | +1.911 |
aryl | +1.878 |
Neg logit contributions | |
Zoro | -1.764 |
ibilities | -1.568 |
ells | -1.528 |
chapter | -1.405 |
vitamins | -1.392 |
Token | There |
Token ID | 1318 |
Feature activation | -9.84e-03 |
Pos logit contributions | |
Zoro | +1.643 |
ibilities | +1.458 |
ells | +1.445 |
chapter | +1.346 |
vitamins | +1.299 |
Neg logit contributions | |
ATH | -1.960 |
ares | -1.722 |
anamo | -1.722 |
aring | -1.711 |
ARE | -1.699 |
Token | can |
Token ID | 460 |
Feature activation | +2.62e-01 |
Pos logit contributions | |
Zoro | +0.079 |
ibilities | +0.071 |
ells | +0.070 |
chapter | +0.065 |
vitamins | +0.063 |
Neg logit contributions | |
ATH | -0.086 |
ares | -0.075 |
aring | -0.075 |
anamo | -0.074 |
ARE | -0.074 |
Token | be |
Token ID | 307 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
ATH | +2.202 |
ares | +1.907 |
aring | +1.903 |
ARE | +1.888 |
anamo | +1.884 |
Neg logit contributions | |
Zoro | -2.179 |
ibilities | -1.957 |
ells | -1.934 |
chapter | -1.806 |
vitamins | -1.763 |
Token | no |
Token ID | 645 |
Feature activation | -4.38e-02 |
Pos logit contributions | |
ATH | +1.361 |
ares | +1.189 |
aring | +1.175 |
ARE | +1.169 |
aldi | +1.163 |
Neg logit contributions | |
Zoro | -1.424 |
ibilities | -1.295 |
ells | -1.282 |
chapter | -1.175 |
ible | -1.157 |
Token | bl |
Token ID | 698 |
Feature activation | +8.81e-01 |
Pos logit contributions | |
Zoro | +0.359 |
ibilities | +0.323 |
ells | +0.320 |
chapter | +0.293 |
vitamins | +0.288 |
Neg logit contributions | |
ATH | -0.372 |
ares | -0.326 |
aring | -0.325 |
ARE | -0.322 |
anamo | -0.321 |
Token | anks |
Token ID | 2283 |
Feature activation | +9.02e-02 |
Pos logit contributions | |
ATH | +6.576 |
ares | +6.005 |
aring | +5.976 |
anamo | +5.512 |
aryl | +5.478 |
Neg logit contributions | |
Zoro | -7.814 |
ibilities | -6.748 |
ells | -6.519 |
vitamins | -6.388 |
chapter | -6.241 |
Token | between |
Token ID | 1022 |
Feature activation | +1.28e-01 |
Pos logit contributions | |
ATH | +0.767 |
ares | +0.669 |
aring | +0.666 |
ARE | +0.654 |
anamo | +0.652 |
Neg logit contributions | |
Zoro | -0.743 |
ibilities | -0.667 |
ells | -0.657 |
chapter | -0.607 |
vitamins | -0.600 |
Token | " |
Token ID | 366 |
Feature activation | +2.29e-01 |
Pos logit contributions | |
ATH | +1.117 |
ares | +0.990 |
aring | +0.983 |
ARE | +0.976 |
aryl | +0.962 |
Neg logit contributions | |
Zoro | -1.016 |
ibilities | -0.909 |
ells | -0.886 |
chapter | -0.808 |
ible | -0.801 |
Token | vim |
Token ID | 31124 |
Feature activation | +5.00e-01 |
Pos logit contributions | |
ATH | +1.828 |
ares | +1.605 |
ARE | +1.581 |
aring | +1.580 |
anamo | +1.550 |
Neg logit contributions | |
Zoro | -2.002 |
ibilities | -1.792 |
ells | -1.757 |
chapter | -1.646 |
vitamins | -1.617 |
Token | " |
Token ID | 1 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
ATH | +4.017 |
ares | +3.480 |
ARE | +3.474 |
aring | +3.461 |
anamo | +3.417 |
Neg logit contributions | |
Zoro | -4.239 |
ibilities | -3.805 |
ells | -3.755 |
chapter | -3.447 |
vitamins | -3.410 |
Token |
|
Token ID | 198 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
Zoro | +0.080 |
ibilities | +0.072 |
ells | +0.071 |
chapter | +0.065 |
vitamins | +0.063 |
Neg logit contributions | |
ATH | -0.099 |
ares | -0.087 |
aring | -0.087 |
anamo | -0.087 |
ARE | -0.086 |
Token |
|
Token ID | 198 |
Feature activation | -5.87e-02 |
Pos logit contributions | |
ATH | +1.382 |
ares | +1.203 |
aring | +1.200 |
ARE | +1.190 |
aria | +1.166 |
Neg logit contributions | |
Zoro | -1.261 |
ibilities | -1.164 |
ells | -1.123 |
vitamins | -1.033 |
chapter | -1.017 |
Token | � |
Token ID | 447 |
Feature activation | -2.99e-01 |
Pos logit contributions | |
Zoro | +0.500 |
ibilities | +0.451 |
ells | +0.445 |
chapter | +0.417 |
vitamins | +0.406 |
Neg logit contributions | |
ATH | -0.486 |
ares | -0.421 |
aring | -0.418 |
anamo | -0.416 |
ARE | -0.415 |
Token | � |
Token ID | 250 |
Feature activation | +3.07e-01 |
Pos logit contributions | |
Zoro | +2.673 |
ibilities | +2.423 |
ells | +2.398 |
chapter | +2.268 |
vitamins | +2.197 |
Neg logit contributions | |
ATH | -2.284 |
anamo | -1.979 |
ares | -1.970 |
aring | -1.955 |
aryl | -1.950 |
Token | Ke |
Token ID | 8896 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
ATH | +2.444 |
ares | +2.098 |
aring | +2.091 |
ARE | +2.073 |
aldi | +2.021 |
Neg logit contributions | |
Zoro | -2.695 |
ibilities | -2.445 |
ells | -2.395 |
chapter | -2.257 |
vitamins | -2.212 |
Token | pler |
Token ID | 20053 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
ATH | +0.928 |
ares | +0.792 |
aring | +0.789 |
aldi | +0.768 |
ARE | +0.766 |
Neg logit contributions | |
Zoro | -1.180 |
ibilities | -1.076 |
ells | -1.052 |
chapter | -0.989 |
vitamins | -0.982 |
Token | - |
Token ID | 12 |
Feature activation | +5.89e-01 |
Pos logit contributions | |
ATH | +7.747 |
aring | +6.732 |
ares | +6.690 |
aldi | +6.518 |
aria | +6.517 |
Neg logit contributions | |
Zoro | -8.329 |
ibilities | -7.627 |
ells | -7.383 |
ibly | -6.809 |
ible | -6.764 |
Token | 10 |
Token ID | 940 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
ATH | +3.492 |
ares | +2.873 |
aring | +2.860 |
ARE | +2.784 |
aldi | +2.750 |
Neg logit contributions | |
Zoro | -6.354 |
ibilities | -5.781 |
ells | -5.759 |
chapter | -5.450 |
vitamins | -5.399 |
Token | c |
Token ID | 66 |
Feature activation | +3.24e-01 |
Pos logit contributions | |
ATH | +0.094 |
ares | +0.080 |
anamo | +0.080 |
aring | +0.079 |
ARE | +0.079 |
Neg logit contributions | |
Zoro | -0.119 |
ibilities | -0.109 |
ells | -0.108 |
chapter | -0.102 |
vitamins | -0.099 |
Token | didn |
Token ID | 1422 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
ATH | +2.648 |
ares | +2.311 |
aring | +2.308 |
aldi | +2.261 |
Stacy | +2.247 |
Neg logit contributions | |
Zoro | -2.706 |
ibilities | -2.476 |
ells | -2.392 |
chapter | -2.211 |
ible | -2.178 |
Token | � |
Token ID | 447 |
Feature activation | -2.53e-01 |
Pos logit contributions | |
ATH | +0.139 |
ares | +0.121 |
aring | +0.120 |
ARE | +0.119 |
aria | +0.118 |
Neg logit contributions | |
Zoro | -0.123 |
ibilities | -0.111 |
ells | -0.108 |
chapter | -0.099 |
vitamins | -0.099 |
Token | in |
Token ID | 287 |
Feature activation | +4.48e-01 |
Pos logit contributions | |
ATH | +3.029 |
ares | +2.627 |
aring | +2.625 |
anamo | +2.614 |
ARE | +2.607 |
Neg logit contributions | |
Zoro | -2.980 |
ibilities | -2.672 |
ells | -2.648 |
chapter | -2.459 |
vitamins | -2.390 |
Token | Wisconsin |
Token ID | 9279 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
ATH | +3.061 |
ares | +2.567 |
aring | +2.565 |
ARE | +2.537 |
Stacy | +2.520 |
Neg logit contributions | |
Zoro | -4.355 |
ibilities | -3.989 |
ells | -3.964 |
chapter | -3.682 |
vitamins | -3.614 |
Token | would |
Token ID | 561 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
ATH | +3.013 |
ares | +2.690 |
aring | +2.651 |
ARE | +2.614 |
Stacy | +2.555 |
Neg logit contributions | |
Zoro | -2.934 |
ibilities | -2.676 |
ells | -2.610 |
chapter | -2.352 |
vitamins | -2.337 |
Token | vote |
Token ID | 3015 |
Feature activation | +4.83e-02 |
Pos logit contributions | |
ATH | +1.649 |
aring | +1.391 |
ares | +1.383 |
ARE | +1.354 |
aryl | +1.343 |
Neg logit contributions | |
Zoro | -2.238 |
ells | -2.042 |
ibilities | -2.028 |
chapter | -1.853 |
vitamins | -1.848 |
Token | for |
Token ID | 329 |
Feature activation | +4.96e-01 |
Pos logit contributions | |
ATH | +0.447 |
ares | +0.396 |
aring | +0.394 |
ARE | +0.391 |
anamo | +0.389 |
Neg logit contributions | |
Zoro | -0.359 |
ibilities | -0.321 |
ells | -0.317 |
chapter | -0.291 |
vitamins | -0.284 |
Token | Romney |
Token ID | 8431 |
Feature activation | +8.13e-01 |
Pos logit contributions | |
ATH | +2.726 |
aring | +2.233 |
ares | +2.224 |
Stacy | +2.177 |
ARE | +2.173 |
Neg logit contributions | |
Zoro | -5.324 |
ibilities | -5.081 |
ells | -5.038 |
chapter | -4.667 |
vitamins | -4.615 |
Token | . |
Token ID | 13 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
ATH | +6.403 |
aring | +5.441 |
ares | +5.425 |
aryl | +5.355 |
Stacy | +5.314 |
Neg logit contributions | |
Zoro | -6.866 |
ibilities | -6.364 |
ells | -6.253 |
chapter | -5.672 |
vitamins | -5.568 |
Token |
|
Token ID | 198 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
ATH | +1.065 |
ares | +0.930 |
aring | +0.921 |
Stacy | +0.919 |
ARE | +0.918 |
Neg logit contributions | |
Zoro | -0.980 |
ibilities | -0.912 |
ells | -0.894 |
chapter | -0.818 |
vitamins | -0.805 |
Token |
|
Token ID | 198 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
ATH | +1.651 |
ares | +1.435 |
aring | +1.429 |
ARE | +1.416 |
aria | +1.396 |
Neg logit contributions | |
Zoro | -1.565 |
ibilities | -1.438 |
ells | -1.389 |
vitamins | -1.281 |
chapter | -1.258 |
Token | In |
Token ID | 818 |
Feature activation | +2.19e-01 |
Pos logit contributions | |
ATH | +2.130 |
ARE | +1.812 |
ares | +1.784 |
aring | +1.768 |
Bern | +1.738 |
Neg logit contributions | |
Zoro | -2.536 |
ibilities | -2.303 |
ells | -2.263 |
chapter | -2.131 |
vitamins | -2.085 |
Token | Ohio |
Token ID | 6835 |
Feature activation | -2.66e-02 |
Pos logit contributions | |
ATH | +1.578 |
ares | +1.346 |
aring | +1.342 |
ARE | +1.316 |
Stacy | +1.312 |
Neg logit contributions | |
Zoro | -2.051 |
ibilities | -1.898 |
ells | -1.879 |
chapter | -1.721 |
ible | -1.696 |
Token | profit |
Token ID | 7630 |
Feature activation | +1.71e-01 |
Pos logit contributions | |
ATH | +7.861 |
aring | +6.785 |
Mehran | +6.686 |
ares | +6.606 |
ARE | +6.587 |
Neg logit contributions | |
Zoro | -8.638 |
ibilities | -8.193 |
ells | -7.904 |
ibly | -7.221 |
vitamins | -7.167 |
Token | margin |
Token ID | 10330 |
Feature activation | +4.36e-01 |
Pos logit contributions | |
ATH | +1.442 |
aring | +1.252 |
ares | +1.245 |
ARE | +1.227 |
Stacy | +1.219 |
Neg logit contributions | |
Zoro | -1.415 |
ibilities | -1.302 |
ells | -1.275 |
chapter | -1.162 |
vitamins | -1.153 |
Token | on |
Token ID | 319 |
Feature activation | +4.28e-01 |
Pos logit contributions | |
ATH | +3.520 |
aring | +3.099 |
ares | +3.092 |
Stacy | +3.025 |
ARE | +2.989 |
Neg logit contributions | |
Zoro | -3.597 |
ibilities | -3.361 |
ells | -3.289 |
chapter | -2.956 |
vitamins | -2.937 |
Token | $ |
Token ID | 720 |
Feature activation | +8.22e-02 |
Pos logit contributions | |
ATH | +3.439 |
ares | +3.018 |
aring | +2.991 |
Stacy | +2.955 |
ARE | +2.945 |
Neg logit contributions | |
Zoro | -3.576 |
ibilities | -3.317 |
ells | -3.264 |
chapter | -2.922 |
ible | -2.895 |
Token | 700 |
Token ID | 9879 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
ATH | +0.612 |
ares | +0.522 |
aring | +0.516 |
anamo | +0.511 |
ARE | +0.510 |
Neg logit contributions | |
Zoro | -0.763 |
ibilities | -0.698 |
ells | -0.691 |
chapter | -0.648 |
vitamins | -0.637 |
Token | million |
Token ID | 1510 |
Feature activation | +3.07e-01 |
Pos logit contributions | |
ATH | +1.539 |
ares | +1.312 |
anamo | +1.309 |
aring | +1.300 |
ARE | +1.289 |
Neg logit contributions | |
Zoro | -1.916 |
ibilities | -1.743 |
ells | -1.727 |
chapter | -1.631 |
vitamins | -1.588 |
Token | in |
Token ID | 287 |
Feature activation | +6.44e-01 |
Pos logit contributions | |
ATH | +2.547 |
ares | +2.247 |
aring | +2.234 |
ARE | +2.186 |
Stacy | +2.170 |
Neg logit contributions | |
Zoro | -2.542 |
ibilities | -2.340 |
ells | -2.270 |
chapter | -2.075 |
vitamins | -2.068 |
Token | revenue |
Token ID | 6426 |
Feature activation | +1.37e-02 |
Pos logit contributions | |
ATH | +4.532 |
ares | +4.039 |
aring | +3.913 |
Stacy | +3.859 |
ARE | +3.853 |
Neg logit contributions | |
Zoro | -5.840 |
ibilities | -5.442 |
ells | -5.362 |
vitamins | -4.831 |
ibly | -4.825 |
Token | delivers |
Token ID | 16316 |
Feature activation | +9.55e-02 |
Pos logit contributions | |
ATH | +0.118 |
ares | +0.104 |
aring | +0.103 |
ARE | +0.102 |
anamo | +0.101 |
Neg logit contributions | |
Zoro | -0.110 |
ibilities | -0.100 |
ells | -0.098 |
chapter | -0.091 |
vitamins | -0.089 |
Token | operating |
Token ID | 5361 |
Feature activation | -2.18e-01 |
Pos logit contributions | |
ATH | +0.810 |
ares | +0.709 |
aring | +0.705 |
ARE | +0.697 |
anamo | +0.694 |
Neg logit contributions | |
Zoro | -0.782 |
ibilities | -0.710 |
ells | -0.700 |
chapter | -0.646 |
vitamins | -0.629 |
Token | profits |
Token ID | 10177 |
Feature activation | -4.73e-01 |
Pos logit contributions | |
Zoro | +1.800 |
ibilities | +1.617 |
ells | +1.598 |
chapter | +1.501 |
vitamins | +1.455 |
Neg logit contributions | |
ATH | -1.841 |
anamo | -1.605 |
ares | -1.603 |
aring | -1.592 |
ARE | -1.580 |
Token | jury |
Token ID | 9002 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
ATH | +5.504 |
aring | +4.620 |
Stacy | +4.602 |
aryl | +4.583 |
ARE | +4.549 |
Neg logit contributions | |
Zoro | -8.374 |
ibilities | -7.827 |
ells | -7.765 |
ibly | -7.105 |
vitamins | -7.083 |
Token | , |
Token ID | 11 |
Feature activation | +4.11e-01 |
Pos logit contributions | |
ATH | +1.652 |
ares | +1.456 |
anamo | +1.450 |
aring | +1.446 |
ARE | +1.434 |
Neg logit contributions | |
Zoro | -1.369 |
ibilities | -1.218 |
ells | -1.204 |
chapter | -1.118 |
vitamins | -1.082 |
Token | execution |
Token ID | 9706 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
ATH | +3.429 |
aring | +2.992 |
ares | +2.976 |
ARE | +2.958 |
anamo | +2.957 |
Neg logit contributions | |
Zoro | -3.385 |
ibilities | -3.064 |
ells | -3.037 |
chapter | -2.736 |
vitamins | -2.718 |
Token | or |
Token ID | 273 |
Feature activation | +3.46e-01 |
Pos logit contributions | |
ATH | +1.774 |
aring | +1.564 |
ares | +1.562 |
anamo | +1.544 |
ARE | +1.543 |
Neg logit contributions | |
Zoro | -1.543 |
ibilities | -1.390 |
ells | -1.368 |
chapter | -1.265 |
vitamins | -1.233 |
Token | , |
Token ID | 11 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
ATH | +3.033 |
ares | +2.657 |
aring | +2.650 |
anamo | +2.633 |
ARE | +2.619 |
Neg logit contributions | |
Zoro | -2.727 |
ibilities | -2.438 |
ells | -2.418 |
chapter | -2.218 |
vitamins | -2.174 |
Token | isn |
Token ID | 2125 |
Feature activation | +4.27e-02 |
Pos logit contributions | |
ATH | +2.256 |
ares | +1.962 |
aring | +1.960 |
ARE | +1.941 |
aryl | +1.935 |
Neg logit contributions | |
Zoro | -2.195 |
ibilities | -1.980 |
ells | -1.970 |
chapter | -1.786 |
vitamins | -1.756 |
Token | 't |
Token ID | 470 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
ATH | +0.384 |
ares | +0.340 |
aring | +0.338 |
anamo | +0.333 |
aryl | +0.333 |
Neg logit contributions | |
Zoro | -0.332 |
ibilities | -0.295 |
ells | -0.292 |
chapter | -0.267 |
vitamins | -0.264 |
Token | it |
Token ID | 340 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
Zoro | +1.120 |
ibilities | +0.999 |
ells | +0.985 |
chapter | +0.925 |
ible | +0.893 |
Neg logit contributions | |
ATH | -1.305 |
ares | -1.147 |
anamo | -1.143 |
aring | -1.136 |
ARE | -1.132 |
Token | way |
Token ID | 835 |
Feature activation | -2.08e-01 |
Pos logit contributions | |
Zoro | +2.772 |
ibilities | +2.455 |
ells | +2.439 |
chapter | +2.320 |
ible | +2.213 |
Neg logit contributions | |
ATH | -3.210 |
anamo | -2.843 |
ares | -2.806 |
aring | -2.776 |
ARE | -2.774 |
Token | too |
Token ID | 1165 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
Zoro | +1.804 |
ibilities | +1.633 |
ells | +1.615 |
chapter | +1.524 |
ible | +1.475 |
Neg logit contributions | |
ATH | -1.671 |
ares | -1.441 |
anamo | -1.437 |
aring | -1.426 |
ARE | -1.418 |
Token | late |
Token ID | 2739 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
Zoro | +2.610 |
ibilities | +2.327 |
ells | +2.295 |
chapter | +2.180 |
ible | +2.070 |
Neg logit contributions | |
ATH | -3.100 |
anamo | -2.726 |
ares | -2.701 |
ARE | -2.671 |
aring | -2.664 |
Token | been |
Token ID | 587 |
Feature activation | +2.38e-02 |
Pos logit contributions | |
ATH | +2.192 |
aring | +1.919 |
ares | +1.899 |
Stacy | +1.896 |
aldi | +1.889 |
Neg logit contributions | |
Zoro | -2.034 |
ibilities | -1.869 |
ells | -1.837 |
chapter | -1.642 |
ible | -1.632 |
Token | hospitalized |
Token ID | 31736 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
ATH | +0.199 |
ares | +0.172 |
aring | +0.172 |
anamo | +0.171 |
ARE | +0.170 |
Neg logit contributions | |
Zoro | -0.199 |
ibilities | -0.182 |
ells | -0.178 |
chapter | -0.166 |
vitamins | -0.162 |
Token | and |
Token ID | 290 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
ATH | +2.048 |
aring | +1.777 |
ares | +1.773 |
Stacy | +1.745 |
ARE | +1.739 |
Neg logit contributions | |
Zoro | -2.082 |
ibilities | -1.905 |
ells | -1.887 |
chapter | -1.713 |
ible | -1.691 |
Token | could |
Token ID | 714 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
Zoro | +1.048 |
ibilities | +0.937 |
ells | +0.927 |
chapter | +0.867 |
vitamins | +0.841 |
Neg logit contributions | |
ATH | -1.137 |
ares | -0.996 |
anamo | -0.992 |
aring | -0.988 |
ARE | -0.980 |
Token | not |
Token ID | 407 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
ATH | +2.134 |
aring | +1.880 |
ares | +1.871 |
aria | +1.831 |
aryl | +1.829 |
Neg logit contributions | |
Zoro | -2.065 |
ells | -1.845 |
ibilities | -1.817 |
chapter | -1.660 |
vitamins | -1.651 |
Token | be |
Token ID | 307 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
ATH | +1.587 |
aring | +1.393 |
ares | +1.380 |
aryl | +1.358 |
ARE | +1.353 |
Neg logit contributions | |
Zoro | -1.610 |
ells | -1.457 |
ibilities | -1.434 |
chapter | -1.308 |
vitamins | -1.296 |
Token | reached |
Token ID | 4251 |
Feature activation | -2.12e-01 |
Pos logit contributions | |
ATH | +1.377 |
aring | +1.192 |
ares | +1.185 |
ARE | +1.166 |
Stacy | +1.162 |
Neg logit contributions | |
Zoro | -1.628 |
ibilities | -1.499 |
ells | -1.495 |
chapter | -1.366 |
vitamins | -1.349 |
Token | for |
Token ID | 329 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
Zoro | +1.510 |
ibilities | +1.333 |
ells | +1.316 |
chapter | +1.220 |
ible | +1.177 |
Neg logit contributions | |
ATH | -2.039 |
ares | -1.807 |
anamo | -1.806 |
aring | -1.794 |
ARE | -1.785 |
Token | comment |
Token ID | 2912 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
Zoro | +0.858 |
ibilities | +0.738 |
ells | +0.731 |
chapter | +0.673 |
ible | +0.641 |
Neg logit contributions | |
ATH | -1.493 |
anamo | -1.346 |
ares | -1.342 |
aring | -1.327 |
aldi | -1.326 |
Token | . |
Token ID | 13 |
Feature activation | -5.40e-02 |
Pos logit contributions | |
ATH | +1.217 |
ares | +1.069 |
aring | +1.064 |
anamo | +1.054 |
ARE | +1.047 |
Neg logit contributions | |
Zoro | -1.129 |
ibilities | -1.014 |
ells | -1.004 |
chapter | -0.925 |
vitamins | -0.910 |
Token |
|
Token ID | 198 |
Feature activation | -6.73e-02 |
Pos logit contributions | |
Zoro | +0.392 |
ibilities | +0.345 |
ells | +0.342 |
chapter | +0.316 |
ible | +0.305 |
Neg logit contributions | |
ATH | -0.511 |
ares | -0.453 |
anamo | -0.452 |
aring | -0.450 |
ARE | -0.446 |
Token | neighbor |
Token ID | 4780 |
Feature activation | -4.97e-01 |
Pos logit contributions | |
ATH | +2.078 |
ares | +1.828 |
aring | +1.824 |
ARE | +1.781 |
aria | +1.766 |
Neg logit contributions | |
Zoro | -2.024 |
ibilities | -1.849 |
ells | -1.823 |
chapter | -1.624 |
ibly | -1.617 |
Token | , |
Token ID | 11 |
Feature activation | +6.53e-02 |
Pos logit contributions | |
Zoro | +3.582 |
ells | +3.082 |
ibilities | +3.053 |
chapter | +2.941 |
vitamins | +2.790 |
Neg logit contributions | |
ATH | -4.653 |
anamo | -4.205 |
ares | -4.134 |
ARE | -4.102 |
aryl | -4.099 |
Token | the |
Token ID | 262 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
ATH | +0.567 |
ares | +0.494 |
aring | +0.493 |
anamo | +0.487 |
ARE | +0.485 |
Neg logit contributions | |
Zoro | -0.523 |
ibilities | -0.477 |
ells | -0.469 |
chapter | -0.430 |
ible | -0.421 |
Token | Andromeda |
Token ID | 34542 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
ATH | +1.932 |
ares | +1.700 |
aring | +1.686 |
ARE | +1.654 |
aldi | +1.652 |
Neg logit contributions | |
Zoro | -1.830 |
ibilities | -1.673 |
ells | -1.642 |
chapter | -1.488 |
ible | -1.463 |
Token | Galaxy |
Token ID | 9252 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
ATH | +3.915 |
ares | +3.329 |
aring | +3.308 |
aria | +3.277 |
aldi | +3.223 |
Neg logit contributions | |
Zoro | -4.760 |
ibilities | -4.360 |
ells | -4.345 |
vitamins | -3.914 |
ibly | -3.891 |
Token | . |
Token ID | 13 |
Feature activation | +3.37e-01 |
Pos logit contributions | |
Zoro | +1.114 |
ibilities | +0.986 |
ells | +0.979 |
chapter | +0.914 |
vitamins | +0.879 |
Neg logit contributions | |
ATH | -1.384 |
anamo | -1.225 |
ares | -1.221 |
aring | -1.212 |
ARE | -1.204 |
Token | The |
Token ID | 383 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
ATH | +2.754 |
ares | +2.414 |
Stacy | +2.413 |
aring | +2.403 |
ARE | +2.362 |
Neg logit contributions | |
Zoro | -2.739 |
ibilities | -2.644 |
ells | -2.528 |
ibly | -2.324 |
vitamins | -2.305 |
Token | two |
Token ID | 734 |
Feature activation | +9.02e-02 |
Pos logit contributions | |
ATH | +2.418 |
ares | +2.107 |
aring | +2.100 |
aldi | +2.080 |
Stacy | +2.061 |
Neg logit contributions | |
Zoro | -2.360 |
ibilities | -2.153 |
ells | -2.116 |
ibly | -1.909 |
chapter | -1.908 |
Token | are |
Token ID | 389 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
ATH | +0.812 |
ares | +0.719 |
aring | +0.715 |
ARE | +0.706 |
anamo | +0.703 |
Neg logit contributions | |
Zoro | -0.691 |
ibilities | -0.620 |
ells | -0.613 |
chapter | -0.562 |
ible | -0.548 |
Token | rushing |
Token ID | 15795 |
Feature activation | +3.93e-01 |
Pos logit contributions | |
Zoro | +0.912 |
ibilities | +0.820 |
ells | +0.810 |
chapter | +0.749 |
vitamins | +0.728 |
Neg logit contributions | |
ATH | -1.011 |
ares | -0.885 |
aring | -0.880 |
anamo | -0.878 |
ARE | -0.871 |
Token | toward |
Token ID | 3812 |
Feature activation | +5.46e-01 |
Pos logit contributions | |
ATH | +3.125 |
ares | +2.668 |
aring | +2.623 |
Stacy | +2.621 |
ARE | +2.597 |
Neg logit contributions | |
Zoro | -3.339 |
ibilities | -3.138 |
ells | -3.093 |
chapter | -2.761 |
ible | -2.738 |
Token | see |
Token ID | 766 |
Feature activation | -4.71e-02 |
Pos logit contributions | |
ATH | +1.677 |
aring | +1.507 |
ares | +1.493 |
ARE | +1.461 |
Stacy | +1.442 |
Neg logit contributions | |
Zoro | -1.540 |
ibilities | -1.395 |
ells | -1.388 |
chapter | -1.243 |
vitamins | -1.239 |
Token | if |
Token ID | 611 |
Feature activation | +7.75e-02 |
Pos logit contributions | |
Zoro | +0.375 |
ibilities | +0.336 |
ells | +0.334 |
chapter | +0.306 |
vitamins | +0.299 |
Neg logit contributions | |
ATH | -0.410 |
ares | -0.362 |
aring | -0.362 |
ARE | -0.357 |
aldi | -0.352 |
Token | it |
Token ID | 340 |
Feature activation | +4.03e-01 |
Pos logit contributions | |
ATH | +0.683 |
ares | +0.604 |
aring | +0.602 |
ARE | +0.595 |
aldi | +0.590 |
Neg logit contributions | |
Zoro | -0.604 |
ibilities | -0.540 |
ells | -0.538 |
chapter | -0.490 |
ible | -0.481 |
Token | � |
Token ID | 447 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
ATH | +3.534 |
ares | +3.205 |
aring | +3.144 |
aryl | +3.079 |
aldi | +3.076 |
Neg logit contributions | |
Zoro | -3.058 |
ibilities | -2.717 |
ells | -2.653 |
chapter | -2.457 |
ible | -2.411 |
Token | � |
Token ID | 247 |
Feature activation | +2.29e-01 |
Pos logit contributions | |
ATH | +1.256 |
ares | +1.018 |
aring | +0.975 |
ARE | +0.966 |
aldi | +0.962 |
Neg logit contributions | |
Zoro | -2.690 |
ibilities | -2.477 |
ells | -2.404 |
chapter | -2.299 |
vitamins | -2.282 |
Token | s |
Token ID | 82 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
ATH | +1.588 |
ares | +1.373 |
aring | +1.335 |
anamo | +1.308 |
aldi | +1.298 |
Neg logit contributions | |
Zoro | -2.276 |
ibilities | -2.017 |
ells | -1.957 |
chapter | -1.901 |
vitamins | -1.869 |
Token | � |
Token ID | 564 |
Feature activation | -7.97e-03 |
Pos logit contributions | |
ATH | +2.454 |
ares | +2.179 |
aring | +2.171 |
ARE | +2.112 |
Stacy | +2.108 |
Neg logit contributions | |
Zoro | -2.411 |
ibilities | -2.216 |
ells | -2.172 |
chapter | -1.962 |
vitamins | -1.962 |
Token | � |
Token ID | 250 |
Feature activation | +8.26e-02 |
Pos logit contributions | |
Zoro | +0.080 |
ibilities | +0.074 |
ells | +0.073 |
chapter | +0.068 |
vitamins | +0.067 |
Neg logit contributions | |
ATH | -0.054 |
ares | -0.045 |
aring | -0.045 |
aldi | -0.044 |
ARE | -0.044 |
Token | on |
Token ID | 261 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
ATH | +0.668 |
ares | +0.578 |
aring | +0.577 |
ARE | +0.569 |
anamo | +0.567 |
Neg logit contributions | |
Zoro | -0.716 |
ibilities | -0.646 |
ells | -0.638 |
chapter | -0.602 |
vitamins | -0.588 |
Token | . |
Token ID | 13 |
Feature activation | -9.21e-02 |
Pos logit contributions | |
ATH | +0.224 |
ares | +0.196 |
aring | +0.196 |
ARE | +0.193 |
anamo | +0.192 |
Neg logit contributions | |
Zoro | -0.209 |
ibilities | -0.187 |
ells | -0.186 |
chapter | -0.171 |
vitamins | -0.168 |
Token | � |
Token ID | 447 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
Zoro | +0.714 |
ibilities | +0.640 |
ells | +0.631 |
chapter | +0.586 |
vitamins | +0.569 |
Neg logit contributions | |
ATH | -0.827 |
ares | -0.729 |
aring | -0.725 |
anamo | -0.720 |
ARE | -0.717 |
Token | It |
Token ID | 632 |
Feature activation | -6.70e-03 |
Pos logit contributions | |
Zoro | +1.308 |
ibilities | +1.173 |
ells | +1.159 |
chapter | +1.078 |
vitamins | +1.046 |
Neg logit contributions | |
ATH | -1.454 |
ares | -1.275 |
anamo | -1.267 |
aring | -1.266 |
ARE | -1.256 |
Token | won |
Token ID | 1839 |
Feature activation | -6.64e-02 |
Pos logit contributions | |
Zoro | +0.055 |
ibilities | +0.049 |
ells | +0.049 |
chapter | +0.045 |
vitamins | +0.044 |
Neg logit contributions | |
ATH | -0.057 |
ares | -0.050 |
aring | -0.050 |
anamo | -0.050 |
ARE | -0.049 |
Token | 't |
Token ID | 470 |
Feature activation | -7.72e-01 |
Pos logit contributions | |
Zoro | +0.511 |
ibilities | +0.459 |
ells | +0.451 |
chapter | +0.413 |
vitamins | +0.404 |
Neg logit contributions | |
ATH | -0.607 |
ares | -0.532 |
aring | -0.529 |
ARE | -0.521 |
Stacy | -0.518 |
Token | be |
Token ID | 307 |
Feature activation | -3.74e-01 |
Pos logit contributions | |
Zoro | +5.168 |
ibilities | +4.629 |
ells | +4.400 |
chapter | +4.294 |
ible | +4.172 |
Neg logit contributions | |
ATH | -7.398 |
anamo | -7.011 |
ares | -6.592 |
ARE | -6.558 |
aldi | -6.484 |
Token | easy |
Token ID | 2562 |
Feature activation | -3.82e-01 |
Pos logit contributions | |
Zoro | +2.740 |
ibilities | +2.410 |
ells | +2.370 |
chapter | +2.236 |
ible | +2.157 |
Neg logit contributions | |
ATH | -3.514 |
anamo | -3.134 |
ares | -3.082 |
ARE | -3.063 |
aring | -3.062 |
Token | , |
Token ID | 11 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
Zoro | +2.864 |
ibilities | +2.512 |
ells | +2.482 |
chapter | +2.349 |
ible | +2.262 |
Neg logit contributions | |
ATH | -3.496 |
anamo | -3.142 |
ares | -3.099 |
ARE | -3.064 |
aldi | -3.045 |
Token | but |
Token ID | 475 |
Feature activation | +6.15e-02 |
Pos logit contributions | |
Zoro | +1.328 |
ibilities | +1.188 |
ells | +1.174 |
chapter | +1.101 |
vitamins | +1.068 |
Neg logit contributions | |
ATH | -1.416 |
ares | -1.240 |
anamo | -1.238 |
aring | -1.229 |
ARE | -1.221 |
Token | we |
Token ID | 356 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
ATH | +0.536 |
ares | +0.471 |
aring | +0.470 |
Stacy | +0.465 |
ARE | +0.463 |
Neg logit contributions | |
Zoro | -0.489 |
ibilities | -0.443 |
ells | -0.439 |
chapter | -0.400 |
vitamins | -0.391 |
Token | expect |
Token ID | 1607 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
ATH | +1.026 |
aring | +0.916 |
ares | +0.910 |
ARE | +0.891 |
Stacy | +0.889 |
Neg logit contributions | |
Zoro | -0.844 |
ibilities | -0.744 |
ells | -0.741 |
chapter | -0.675 |
vitamins | -0.658 |
Token | Ro |
Token ID | 5564 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
Zoro | +1.366 |
ibilities | +1.222 |
ells | +1.206 |
chapter | +1.128 |
vitamins | +1.093 |
Neg logit contributions | |
ATH | -1.502 |
ares | -1.315 |
anamo | -1.315 |
aring | -1.306 |
ARE | -1.296 |
Token | eth |
Token ID | 2788 |
Feature activation | +2.84e-01 |
Pos logit contributions | |
ATH | +1.170 |
aring | +0.975 |
ares | +0.967 |
aryl | +0.954 |
aldi | +0.947 |
Neg logit contributions | |
Zoro | -1.638 |
ibilities | -1.485 |
ells | -1.453 |
chapter | -1.381 |
vitamins | -1.358 |
Token | of |
Token ID | 286 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
ATH | +4.789 |
aring | +4.150 |
ares | +4.107 |
ARE | +4.037 |
aldi | +4.017 |
Neg logit contributions | |
Zoro | -4.861 |
ells | -4.351 |
ibilities | -4.302 |
vitamins | -3.888 |
ibly | -3.858 |
Token | the |
Token ID | 262 |
Feature activation | +3.03e-03 |
Pos logit contributions | |
ATH | +0.938 |
ares | +0.828 |
aring | +0.822 |
anamo | +0.815 |
ARE | +0.812 |
Neg logit contributions | |
Zoro | -0.812 |
ibilities | -0.729 |
ells | -0.717 |
chapter | -0.659 |
vitamins | -0.647 |
Token | setting |
Token ID | 4634 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
ATH | +0.026 |
ares | +0.023 |
aring | +0.023 |
anamo | +0.023 |
ARE | +0.023 |
Neg logit contributions | |
Zoro | -0.024 |
ibilities | -0.022 |
ells | -0.022 |
chapter | -0.020 |
vitamins | -0.019 |
Token | . |
Token ID | 13 |
Feature activation | -3.26e-01 |
Pos logit contributions | |
ATH | +4.303 |
aring | +3.688 |
ares | +3.672 |
aryl | +3.625 |
ARE | +3.624 |
Neg logit contributions | |
Zoro | -4.290 |
ibilities | -3.918 |
ells | -3.801 |
ible | -3.485 |
vitamins | -3.467 |
Token |
|
Token ID | 198 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
Zoro | +2.576 |
ibilities | +2.289 |
ells | +2.266 |
chapter | +2.123 |
ible | +2.045 |
Neg logit contributions | |
ATH | -2.875 |
anamo | -2.530 |
ares | -2.525 |
aring | -2.507 |
ARE | -2.484 |
Token |
|
Token ID | 198 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
ATH | +1.351 |
ares | +1.177 |
aring | +1.167 |
ARE | +1.166 |
aria | +1.140 |
Neg logit contributions | |
Zoro | -1.234 |
ibilities | -1.135 |
ells | -1.097 |
vitamins | -1.009 |
chapter | -0.992 |
Token | For |
Token ID | 1890 |
Feature activation | -5.92e-02 |
Pos logit contributions | |
Zoro | +1.183 |
ibilities | +1.069 |
ells | +1.058 |
chapter | +0.992 |
vitamins | +0.968 |
Neg logit contributions | |
ATH | -1.082 |
ares | -0.933 |
aring | -0.926 |
anamo | -0.922 |
ARE | -0.920 |
Token | more |
Token ID | 517 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
Zoro | +0.484 |
ibilities | +0.435 |
ells | +0.430 |
chapter | +0.398 |
vitamins | +0.389 |
Neg logit contributions | |
ATH | -0.508 |
ares | -0.444 |
aring | -0.441 |
anamo | -0.438 |
ARE | -0.436 |
Token | advanced |
Token ID | 6190 |
Feature activation | -4.69e-02 |
Pos logit contributions | |
ATH | +1.143 |
ares | +1.004 |
aring | +1.000 |
ARE | +0.982 |
anamo | +0.980 |
Neg logit contributions | |
Zoro | -1.069 |
ibilities | -0.961 |
ells | -0.952 |
chapter | -0.870 |
vitamins | -0.856 |
Token | dungeon |
Token ID | 18974 |
Feature activation | +2.17e-01 |
Pos logit contributions | |
Zoro | +0.409 |
ibilities | +0.370 |
ells | +0.367 |
chapter | +0.343 |
vitamins | +0.335 |
Neg logit contributions | |
ATH | -0.375 |
ares | -0.324 |
aring | -0.322 |
anamo | -0.321 |
ARE | -0.318 |
Token | masters |
Token ID | 18159 |
Feature activation | -3.87e-02 |
Pos logit contributions | |
ATH | +1.662 |
ares | +1.413 |
aring | +1.411 |
ARE | +1.395 |
aryl | +1.369 |
Neg logit contributions | |
Zoro | -1.972 |
ibilities | -1.798 |
ells | -1.773 |
chapter | -1.644 |
vitamins | -1.627 |
Token | once |
Token ID | 1752 |
Feature activation | +3.84e-01 |
Pos logit contributions | |
Zoro | +1.067 |
ibilities | +0.956 |
ells | +0.945 |
chapter | +0.882 |
vitamins | +0.855 |
Neg logit contributions | |
ATH | -1.165 |
ares | -1.021 |
anamo | -1.016 |
aring | -1.013 |
ARE | -1.005 |
Token | for |
Token ID | 329 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
ATH | +3.198 |
aring | +2.788 |
ares | +2.760 |
Stacy | +2.743 |
aldi | +2.729 |
Neg logit contributions | |
Zoro | -3.098 |
ibilities | -2.902 |
ells | -2.825 |
chapter | -2.570 |
ible | -2.564 |
Token | their |
Token ID | 511 |
Feature activation | -7.73e-02 |
Pos logit contributions | |
ATH | +1.465 |
ares | +1.283 |
aring | +1.281 |
anamo | +1.272 |
Stacy | +1.265 |
Neg logit contributions | |
Zoro | -1.290 |
ibilities | -1.184 |
ells | -1.156 |
chapter | -1.055 |
ible | -1.040 |
Token | most |
Token ID | 749 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
Zoro | +0.625 |
ibilities | +0.562 |
ells | +0.556 |
chapter | +0.515 |
ible | +0.501 |
Neg logit contributions | |
ATH | -0.668 |
ares | -0.584 |
aring | -0.581 |
anamo | -0.580 |
ARE | -0.575 |
Token | recent |
Token ID | 2274 |
Feature activation | -2.26e-01 |
Pos logit contributions | |
ATH | +0.912 |
ares | +0.794 |
aring | +0.788 |
ARE | +0.778 |
anamo | +0.773 |
Neg logit contributions | |
Zoro | -0.929 |
ibilities | -0.851 |
ells | -0.840 |
chapter | -0.768 |
ible | -0.755 |
Token | video |
Token ID | 2008 |
Feature activation | -9.64e-02 |
Pos logit contributions | |
Zoro | +1.847 |
ibilities | +1.652 |
ells | +1.634 |
chapter | +1.538 |
vitamins | +1.489 |
Neg logit contributions | |
ATH | -1.941 |
ares | -1.695 |
anamo | -1.694 |
aring | -1.683 |
ARE | -1.669 |
Token | , |
Token ID | 11 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
Zoro | +0.786 |
ibilities | +0.708 |
ells | +0.700 |
chapter | +0.649 |
vitamins | +0.632 |
Neg logit contributions | |
ATH | -0.827 |
ares | -0.723 |
aring | -0.718 |
anamo | -0.716 |
ARE | -0.712 |
Token | � |
Token ID | 564 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
Zoro | +1.456 |
ibilities | +1.297 |
ells | +1.283 |
chapter | +1.202 |
vitamins | +1.164 |
Neg logit contributions | |
ATH | -1.612 |
ares | -1.414 |
anamo | -1.407 |
aring | -1.403 |
ARE | -1.390 |
Token | � |
Token ID | 250 |
Feature activation | -4.92e-01 |
Pos logit contributions | |
ATH | +1.967 |
ares | +1.717 |
aring | +1.701 |
anamo | +1.681 |
ARE | +1.673 |
Neg logit contributions | |
Zoro | -1.897 |
ibilities | -1.708 |
ells | -1.696 |
chapter | -1.569 |
vitamins | -1.540 |
Token | Mir |
Token ID | 27453 |
Feature activation | -4.59e-01 |
Pos logit contributions | |
Zoro | +4.293 |
ells | +3.880 |
ibilities | +3.879 |
chapter | +3.635 |
ible | +3.527 |
Neg logit contributions | |
ATH | -3.825 |
ares | -3.324 |
anamo | -3.316 |
aring | -3.287 |
ARE | -3.243 |
Token | acles |
Token ID | 9928 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
Zoro | +3.775 |
ibilities | +3.378 |
ells | +3.365 |
chapter | +3.145 |
ible | +3.067 |
Neg logit contributions | |
ATH | -3.845 |
anamo | -3.320 |
ARE | -3.310 |
ares | -3.308 |
aring | -3.296 |
Token | the |
Token ID | 262 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
Zoro | +1.319 |
ibilities | +1.178 |
ells | +1.165 |
chapter | +1.090 |
vitamins | +1.050 |
Neg logit contributions | |
ATH | -1.519 |
anamo | -1.335 |
ares | -1.331 |
aring | -1.324 |
ARE | -1.318 |
Token | Guard |
Token ID | 4932 |
Feature activation | -4.47e-02 |
Pos logit contributions | |
Zoro | +0.860 |
ibilities | +0.774 |
ells | +0.771 |
chapter | +0.705 |
vitamins | +0.691 |
Neg logit contributions | |
ATH | -0.911 |
ares | -0.796 |
aring | -0.789 |
anamo | -0.787 |
ARE | -0.780 |
Token | to |
Token ID | 284 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
Zoro | +0.359 |
ibilities | +0.322 |
ells | +0.318 |
chapter | +0.293 |
vitamins | +0.287 |
Neg logit contributions | |
ATH | -0.390 |
ares | -0.340 |
aring | -0.337 |
anamo | -0.336 |
ARE | -0.334 |
Token | use |
Token ID | 779 |
Feature activation | -2.69e-01 |
Pos logit contributions | |
ATH | +2.523 |
aring | +2.213 |
ares | +2.193 |
aldi | +2.152 |
ARE | +2.137 |
Neg logit contributions | |
Zoro | -2.261 |
ibilities | -2.059 |
ells | -2.038 |
vitamins | -1.839 |
chapter | -1.821 |
Token | , |
Token ID | 11 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
Zoro | +2.085 |
ibilities | +1.859 |
ells | +1.836 |
chapter | +1.719 |
ible | +1.659 |
Neg logit contributions | |
ATH | -2.407 |
anamo | -2.116 |
ares | -2.110 |
aring | -2.098 |
ARE | -2.083 |
Token | Cross |
Token ID | 6372 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
ATH | +1.029 |
ares | +0.913 |
aring | +0.907 |
ARE | +0.898 |
aryl | +0.886 |
Neg logit contributions | |
Zoro | -0.899 |
ibilities | -0.814 |
ells | -0.799 |
chapter | -0.721 |
vitamins | -0.716 |
Token | beam |
Token ID | 40045 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
Zoro | +1.063 |
ibilities | +0.962 |
ells | +0.953 |
chapter | +0.895 |
vitamins | +0.870 |
Neg logit contributions | |
ATH | -0.963 |
ares | -0.831 |
anamo | -0.827 |
aring | -0.825 |
ARE | -0.817 |
Token | provides |
Token ID | 3769 |
Feature activation | -8.85e-02 |
Pos logit contributions | |
ATH | +1.265 |
ares | +1.108 |
aring | +1.095 |
ARE | +1.091 |
anamo | +1.076 |
Neg logit contributions | |
Zoro | -1.191 |
ibilities | -1.077 |
ells | -1.058 |
chapter | -0.973 |
vitamins | -0.955 |
Token | a |
Token ID | 257 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
Zoro | +0.716 |
ibilities | +0.644 |
ells | +0.637 |
chapter | +0.591 |
vitamins | +0.576 |
Neg logit contributions | |
ATH | -0.764 |
ares | -0.669 |
aring | -0.664 |
anamo | -0.662 |
ARE | -0.658 |
Token | set |
Token ID | 900 |
Feature activation | +4.21e-01 |
Pos logit contributions | |
Zoro | +1.209 |
ibilities | +1.090 |
ells | +1.077 |
chapter | +0.996 |
vitamins | +0.975 |
Neg logit contributions | |
ATH | -1.288 |
ares | -1.128 |
aring | -1.121 |
anamo | -1.115 |
ARE | -1.110 |
Token | of |
Token ID | 286 |
Feature activation | -2.46e-01 |
Pos logit contributions | |
ATH | +3.506 |
ares | +3.050 |
aring | +3.036 |
anamo | +3.019 |
ARE | +3.005 |
Neg logit contributions | |
Zoro | -3.525 |
ibilities | -3.170 |
ells | -3.139 |
chapter | -2.922 |
vitamins | -2.851 |
Token | and |
Token ID | 290 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
Zoro | +1.919 |
ibilities | +1.702 |
ells | +1.693 |
chapter | +1.597 |
ible | +1.525 |
Neg logit contributions | |
ATH | -2.249 |
anamo | -1.993 |
ares | -1.969 |
aldi | -1.952 |
aring | -1.949 |
Token | rushing |
Token ID | 15795 |
Feature activation | -4.11e-02 |
Pos logit contributions | |
ATH | +2.350 |
aring | +1.978 |
ares | +1.963 |
Stacy | +1.957 |
ARE | +1.935 |
Neg logit contributions | |
Zoro | -3.165 |
ibilities | -2.960 |
ells | -2.930 |
ible | -2.671 |
chapter | -2.654 |
Token | touchdowns |
Token ID | 17692 |
Feature activation | +7.15e-02 |
Pos logit contributions | |
Zoro | +0.334 |
ibilities | +0.301 |
ells | +0.297 |
chapter | +0.276 |
vitamins | +0.269 |
Neg logit contributions | |
ATH | -0.354 |
ares | -0.309 |
aring | -0.307 |
anamo | -0.306 |
ARE | -0.305 |
Token | records |
Token ID | 4406 |
Feature activation | -2.25e-02 |
Pos logit contributions | |
ATH | +0.622 |
ares | +0.546 |
aring | +0.542 |
ARE | +0.537 |
anamo | +0.534 |
Neg logit contributions | |
Zoro | -0.575 |
ibilities | -0.517 |
ells | -0.508 |
chapter | -0.469 |
vitamins | -0.461 |
Token | during |
Token ID | 1141 |
Feature activation | -5.27e-01 |
Pos logit contributions | |
Zoro | +0.181 |
ibilities | +0.163 |
ells | +0.161 |
chapter | +0.149 |
vitamins | +0.145 |
Neg logit contributions | |
ATH | -0.195 |
ares | -0.171 |
aring | -0.170 |
anamo | -0.168 |
ARE | -0.168 |
Token | the |
Token ID | 262 |
Feature activation | -6.75e-02 |
Pos logit contributions | |
Zoro | +3.928 |
ibilities | +3.451 |
ells | +3.421 |
chapter | +3.255 |
vitamins | +3.126 |
Neg logit contributions | |
ATH | -4.797 |
anamo | -4.340 |
ares | -4.241 |
aring | -4.213 |
ARE | -4.199 |
Token | game |
Token ID | 983 |
Feature activation | -8.99e-03 |
Pos logit contributions | |
Zoro | +0.540 |
ibilities | +0.489 |
ells | +0.483 |
chapter | +0.442 |
ible | +0.433 |
Neg logit contributions | |
ATH | -0.587 |
ares | -0.514 |
aring | -0.511 |
anamo | -0.507 |
ARE | -0.505 |
Token | , |
Token ID | 11 |
Feature activation | +3.66e-01 |
Pos logit contributions | |
Zoro | +0.069 |
ibilities | +0.062 |
ells | +0.061 |
chapter | +0.057 |
vitamins | +0.055 |
Neg logit contributions | |
ATH | -0.081 |
ares | -0.071 |
aring | -0.071 |
anamo | -0.071 |
ARE | -0.070 |
Token | ending |
Token ID | 7464 |
Feature activation | +7.07e-02 |
Pos logit contributions | |
ATH | +2.968 |
aring | +2.550 |
ares | +2.522 |
Stacy | +2.500 |
ARE | +2.462 |
Neg logit contributions | |
Zoro | -3.095 |
ibilities | -2.907 |
ells | -2.816 |
ible | -2.559 |
chapter | -2.554 |
Token | it |
Token ID | 340 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
ATH | +0.600 |
ares | +0.523 |
aring | +0.519 |
anamo | +0.516 |
ARE | +0.514 |
Neg logit contributions | |
Zoro | -0.583 |
ibilities | -0.526 |
ells | -0.519 |
chapter | -0.483 |
vitamins | -0.470 |
Token | with |
Token ID | 351 |
Feature activation | -3.26e-01 |
Pos logit contributions | |
Zoro | +2.631 |
ells | +2.348 |
ibilities | +2.347 |
chapter | +2.225 |
vitamins | +2.135 |
Neg logit contributions | |
ATH | -2.536 |
anamo | -2.223 |
ares | -2.214 |
aring | -2.191 |
ARE | -2.187 |
Token | , |
Token ID | 11 |
Feature activation | +1.46e-01 |
Pos logit contributions | |
ATH | +1.811 |
ares | +1.591 |
aring | +1.574 |
anamo | +1.571 |
ARE | +1.561 |
Neg logit contributions | |
Zoro | -1.607 |
ibilities | -1.457 |
ells | -1.428 |
chapter | -1.320 |
ible | -1.293 |
Token | the |
Token ID | 262 |
Feature activation | +2.66e-02 |
Pos logit contributions | |
ATH | +1.248 |
ares | +1.092 |
aring | +1.080 |
anamo | +1.079 |
ARE | +1.071 |
Neg logit contributions | |
Zoro | -1.185 |
ibilities | -1.078 |
ells | -1.058 |
chapter | -0.977 |
ible | -0.960 |
Token | bulk |
Token ID | 11963 |
Feature activation | +2.00e-01 |
Pos logit contributions | |
ATH | +0.224 |
ares | +0.195 |
aring | +0.193 |
anamo | +0.192 |
ARE | +0.192 |
Neg logit contributions | |
Zoro | -0.220 |
ibilities | -0.200 |
ells | -0.197 |
chapter | -0.182 |
ible | -0.179 |
Token | of |
Token ID | 286 |
Feature activation | +2.11e-01 |
Pos logit contributions | |
ATH | +1.700 |
ares | +1.482 |
anamo | +1.474 |
aring | +1.471 |
ARE | +1.458 |
Neg logit contributions | |
Zoro | -1.652 |
ibilities | -1.486 |
ells | -1.469 |
chapter | -1.373 |
vitamins | -1.333 |
Token | the |
Token ID | 262 |
Feature activation | -9.77e-02 |
Pos logit contributions | |
ATH | +1.838 |
ares | +1.618 |
aring | +1.592 |
ARE | +1.588 |
anamo | +1.583 |
Neg logit contributions | |
Zoro | -1.660 |
ibilities | -1.516 |
ells | -1.482 |
chapter | -1.352 |
ible | -1.342 |
Token | 1 |
Token ID | 352 |
Feature activation | -9.21e-01 |
Pos logit contributions | |
Zoro | +0.775 |
ibilities | +0.697 |
ells | +0.687 |
chapter | +0.637 |
ible | +0.620 |
Neg logit contributions | |
ATH | -0.859 |
ares | -0.753 |
aring | -0.747 |
anamo | -0.747 |
ARE | -0.741 |
Token | st |
Token ID | 301 |
Feature activation | -3.06e-01 |
Pos logit contributions | |
Zoro | +6.877 |
chapter | +5.941 |
ells | +5.920 |
ibilities | +5.861 |
vitamins | +5.401 |
Neg logit contributions | |
ATH | -7.732 |
anamo | -7.217 |
aldi | -6.885 |
ares | -6.841 |
merce | -6.836 |
Token | Italian |
Token ID | 8200 |
Feature activation | -4.06e-01 |
Pos logit contributions | |
Zoro | +2.520 |
ibilities | +2.246 |
ells | +2.236 |
chapter | +2.115 |
vitamins | +2.025 |
Neg logit contributions | |
ATH | -2.593 |
anamo | -2.275 |
ares | -2.251 |
aring | -2.241 |
ARE | -2.222 |
Token | volunteers |
Token ID | 11661 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
Zoro | +3.221 |
ibilities | +2.843 |
ells | +2.839 |
chapter | +2.699 |
vitamins | +2.559 |
Neg logit contributions | |
ATH | -3.544 |
anamo | -3.126 |
ares | -3.088 |
aring | -3.080 |
ARE | -3.066 |
Token | Storm |
Token ID | 8865 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
Zoro | +1.617 |
ibilities | +1.441 |
ells | +1.424 |
chapter | +1.328 |
vitamins | +1.285 |
Neg logit contributions | |
ATH | -1.873 |
ares | -1.646 |
anamo | -1.640 |
aring | -1.635 |
ARE | -1.623 |
Token | Brigade |
Token ID | 26012 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
Zoro | +3.284 |
ells | +2.991 |
ibilities | +2.965 |
chapter | +2.833 |
ible | +2.749 |
Neg logit contributions | |
ATH | -2.510 |
anamo | -2.123 |
aring | -2.100 |
ARE | -2.097 |
ares | -2.093 |
Token | but |
Token ID | 475 |
Feature activation | -6.86e-02 |
Pos logit contributions | |
ATH | +1.667 |
ares | +1.451 |
aring | +1.446 |
anamo | +1.430 |
ARE | +1.425 |
Neg logit contributions | |
Zoro | -1.550 |
ibilities | -1.398 |
ells | -1.378 |
chapter | -1.271 |
vitamins | -1.248 |
Token | decided |
Token ID | 3066 |
Feature activation | +3.02e-01 |
Pos logit contributions | |
Zoro | +0.539 |
ibilities | +0.485 |
ells | +0.479 |
chapter | +0.443 |
ible | +0.430 |
Neg logit contributions | |
ATH | -0.608 |
ares | -0.534 |
aring | -0.530 |
anamo | -0.528 |
ARE | -0.525 |
Token | that |
Token ID | 326 |
Feature activation | +6.22e-03 |
Pos logit contributions | |
ATH | +2.443 |
ares | +2.127 |
aring | +2.105 |
ARE | +2.083 |
anamo | +2.063 |
Neg logit contributions | |
Zoro | -2.550 |
ibilities | -2.336 |
ells | -2.321 |
chapter | -2.117 |
vitamins | -2.079 |
Token | what |
Token ID | 644 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
ATH | +0.055 |
ares | +0.049 |
aring | +0.048 |
anamo | +0.048 |
ARE | +0.048 |
Neg logit contributions | |
Zoro | -0.049 |
ibilities | -0.044 |
ells | -0.043 |
chapter | -0.040 |
vitamins | -0.039 |
Token | the |
Token ID | 262 |
Feature activation | -5.93e-02 |
Pos logit contributions | |
Zoro | +1.073 |
ibilities | +0.954 |
ells | +0.942 |
chapter | +0.873 |
vitamins | +0.845 |
Neg logit contributions | |
ATH | -1.325 |
ares | -1.169 |
anamo | -1.164 |
aring | -1.162 |
ARE | -1.153 |
Token | hell |
Token ID | 5968 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
Zoro | +0.484 |
ibilities | +0.435 |
ells | +0.431 |
chapter | +0.401 |
vitamins | +0.390 |
Neg logit contributions | |
ATH | -0.508 |
ares | -0.444 |
aring | -0.440 |
anamo | -0.440 |
ARE | -0.436 |
Token | I |
Token ID | 314 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
Zoro | +8.271 |
ibilities | +7.272 |
ells | +7.094 |
chapter | +6.889 |
ible | +6.715 |
Neg logit contributions | |
ATH | -10.594 |
anamo | -10.028 |
aldi | -9.527 |
aryl | -9.519 |
ares | -9.476 |
Token | 'll |
Token ID | 1183 |
Feature activation | -5.56e-01 |
Pos logit contributions | |
Zoro | +1.480 |
ibilities | +1.332 |
ells | +1.316 |
chapter | +1.228 |
vitamins | +1.193 |
Neg logit contributions | |
ATH | -1.522 |
ares | -1.329 |
aring | -1.320 |
anamo | -1.314 |
ARE | -1.307 |
Token | just |
Token ID | 655 |
Feature activation | -3.57e-01 |
Pos logit contributions | |
Zoro | +4.042 |
ibilities | +3.561 |
ells | +3.513 |
chapter | +3.329 |
ible | +3.182 |
Neg logit contributions | |
ATH | -5.217 |
anamo | -4.692 |
ares | -4.623 |
aring | -4.575 |
ARE | -4.563 |
Token | put |
Token ID | 1234 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
Zoro | +2.763 |
ibilities | +2.456 |
ells | +2.427 |
chapter | +2.279 |
vitamins | +2.192 |
Neg logit contributions | |
ATH | -3.219 |
anamo | -2.835 |
ares | -2.827 |
aring | -2.808 |
ARE | -2.791 |
Token | it |
Token ID | 340 |
Feature activation | +1.90e-01 |
Pos logit contributions | |
Zoro | +1.390 |
ibilities | +1.236 |
ells | +1.224 |
chapter | +1.148 |
vitamins | +1.110 |
Neg logit contributions | |
ATH | -1.538 |
ares | -1.347 |
anamo | -1.345 |
aring | -1.339 |
ARE | -1.330 |
Token | watching |
Token ID | 4964 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
Zoro | +1.111 |
ibilities | +0.994 |
ells | +0.982 |
chapter | +0.913 |
vitamins | +0.885 |
Neg logit contributions | |
ATH | -1.260 |
ares | -1.106 |
anamo | -1.100 |
aring | -1.099 |
ARE | -1.089 |
Token | somebody |
Token ID | 8276 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
Zoro | +1.491 |
ibilities | +1.336 |
ells | +1.321 |
chapter | +1.235 |
vitamins | +1.198 |
Neg logit contributions | |
ATH | -1.596 |
ares | -1.395 |
anamo | -1.389 |
aring | -1.386 |
ARE | -1.375 |
Token | who |
Token ID | 508 |
Feature activation | -7.64e-02 |
Pos logit contributions | |
Zoro | +1.155 |
ibilities | +1.028 |
ells | +1.015 |
chapter | +0.940 |
vitamins | +0.909 |
Neg logit contributions | |
ATH | -1.427 |
ares | -1.259 |
anamo | -1.252 |
aring | -1.251 |
ARE | -1.241 |
Token | is |
Token ID | 318 |
Feature activation | +3.13e-01 |
Pos logit contributions | |
Zoro | +0.612 |
ibilities | +0.550 |
ells | +0.542 |
chapter | +0.504 |
vitamins | +0.490 |
Neg logit contributions | |
ATH | -0.667 |
ares | -0.585 |
aring | -0.581 |
anamo | -0.579 |
ARE | -0.574 |
Token | being |
Token ID | 852 |
Feature activation | +5.30e-02 |
Pos logit contributions | |
ATH | +2.646 |
aring | +2.296 |
ares | +2.291 |
Stacy | +2.238 |
anamo | +2.238 |
Neg logit contributions | |
Zoro | -2.543 |
ibilities | -2.363 |
ells | -2.313 |
chapter | -2.099 |
ible | -2.063 |
Token | brain |
Token ID | 3632 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
ATH | +0.460 |
ares | +0.402 |
aring | +0.399 |
anamo | +0.396 |
ARE | +0.394 |
Neg logit contributions | |
Zoro | -0.425 |
ibilities | -0.386 |
ells | -0.381 |
chapter | -0.350 |
vitamins | -0.341 |
Token | washed |
Token ID | 45462 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
Zoro | +7.651 |
ells | +6.224 |
ibilities | +6.218 |
chapter | +6.009 |
vitamins | +5.966 |
Neg logit contributions | |
ATH | -12.825 |
ares | -11.572 |
Mehran | -11.561 |
anamo | -11.533 |
aryl | -11.436 |
Token | , |
Token ID | 11 |
Feature activation | -9.61e-02 |
Pos logit contributions | |
Zoro | +2.019 |
ibilities | +1.795 |
ells | +1.772 |
chapter | +1.654 |
ible | +1.606 |
Neg logit contributions | |
ATH | -2.406 |
anamo | -2.121 |
ares | -2.111 |
aring | -2.098 |
ARE | -2.091 |
Token | or |
Token ID | 393 |
Feature activation | -4.38e-01 |
Pos logit contributions | |
Zoro | +0.741 |
ibilities | +0.666 |
ells | +0.656 |
chapter | +0.606 |
vitamins | +0.587 |
Neg logit contributions | |
ATH | -0.868 |
ares | -0.763 |
aring | -0.760 |
anamo | -0.758 |
ARE | -0.751 |
Token | has |
Token ID | 468 |
Feature activation | -3.93e-01 |
Pos logit contributions | |
Zoro | +3.356 |
ells | +2.935 |
ibilities | +2.930 |
chapter | +2.754 |
vitamins | +2.660 |
Neg logit contributions | |
ATH | -3.921 |
anamo | -3.460 |
ares | -3.440 |
ARE | -3.409 |
aring | -3.405 |
Token | been |
Token ID | 587 |
Feature activation | -2.96e-01 |
Pos logit contributions | |
Zoro | +3.184 |
ibilities | +2.845 |
ells | +2.807 |
chapter | +2.655 |
vitamins | +2.589 |
Neg logit contributions | |
ATH | -3.334 |
ares | -2.926 |
anamo | -2.914 |
aring | -2.900 |
ARE | -2.896 |
Token | � |
Token ID | 250 |
Feature activation | +3.49e-01 |
Pos logit contributions | |
Zoro | +3.402 |
ibilities | +3.071 |
ells | +3.050 |
chapter | +2.885 |
vitamins | +2.807 |
Neg logit contributions | |
ATH | -2.897 |
anamo | -2.518 |
ares | -2.503 |
aring | -2.481 |
aryl | -2.479 |
Token | They |
Token ID | 2990 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
ATH | +2.812 |
ARE | +2.422 |
aring | +2.397 |
ares | +2.397 |
Bern | +2.345 |
Neg logit contributions | |
Zoro | -3.058 |
ibilities | -2.786 |
ells | -2.721 |
chapter | -2.548 |
vitamins | -2.490 |
Token | are |
Token ID | 389 |
Feature activation | -2.47e-01 |
Pos logit contributions | |
ATH | +1.608 |
aring | +1.415 |
ares | +1.415 |
ARE | +1.388 |
aldi | +1.369 |
Neg logit contributions | |
Zoro | -1.536 |
ibilities | -1.374 |
ells | -1.360 |
chapter | -1.253 |
vitamins | -1.220 |
Token | basically |
Token ID | 6209 |
Feature activation | -3.40e-01 |
Pos logit contributions | |
Zoro | +2.041 |
ibilities | +1.831 |
ells | +1.815 |
chapter | +1.699 |
vitamins | +1.648 |
Neg logit contributions | |
ATH | -2.094 |
ares | -1.823 |
anamo | -1.820 |
aring | -1.810 |
ARE | -1.796 |
Token | continuing |
Token ID | 8282 |
Feature activation | -4.82e-01 |
Pos logit contributions | |
Zoro | +2.916 |
ibilities | +2.611 |
ells | +2.592 |
chapter | +2.455 |
vitamins | +2.370 |
Neg logit contributions | |
ATH | -2.767 |
anamo | -2.409 |
ares | -2.384 |
aring | -2.373 |
ARE | -2.348 |
Token | to |
Token ID | 284 |
Feature activation | -9.71e-01 |
Pos logit contributions | |
Zoro | +3.632 |
ibilities | +3.185 |
ells | +3.173 |
chapter | +2.989 |
ible | +2.862 |
Neg logit contributions | |
ATH | -4.400 |
anamo | -3.930 |
ares | -3.887 |
aring | -3.865 |
aldi | -3.834 |
Token | be |
Token ID | 307 |
Feature activation | -4.04e-01 |
Pos logit contributions | |
Zoro | +6.470 |
ells | +5.474 |
ibilities | +5.461 |
chapter | +5.316 |
ible | +5.076 |
Neg logit contributions | |
ATH | -9.277 |
anamo | -8.608 |
aldi | -8.340 |
ares | -8.260 |
merce | -8.252 |
Token | equally |
Token ID | 8603 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
Zoro | +4.130 |
ibilities | +3.770 |
ells | +3.751 |
chapter | +3.585 |
ible | +3.497 |
Neg logit contributions | |
ATH | -2.589 |
anamo | -2.173 |
aring | -2.128 |
ares | -2.106 |
ARE | -2.089 |
Token | as |
Token ID | 355 |
Feature activation | -4.16e-02 |
Pos logit contributions | |
Zoro | +4.525 |
ibilities | +3.986 |
ells | +3.923 |
chapter | +3.784 |
ible | +3.645 |
Neg logit contributions | |
ATH | -5.060 |
anamo | -4.495 |
aldi | -4.380 |
ares | -4.372 |
aring | -4.348 |
Token | tight |
Token ID | 5381 |
Feature activation | -7.55e-01 |
Pos logit contributions | |
Zoro | +0.278 |
ibilities | +0.244 |
ells | +0.242 |
chapter | +0.216 |
vitamins | +0.213 |
Neg logit contributions | |
ATH | -0.418 |
ares | -0.373 |
aring | -0.372 |
anamo | -0.369 |
aryl | -0.368 |
Token | - |
Token ID | 12 |
Feature activation | -3.62e-01 |
Pos logit contributions | |
Zoro | +4.898 |
ibilities | +4.124 |
ells | +4.091 |
chapter | +4.014 |
vitamins | +3.717 |
Neg logit contributions | |
ATH | -7.425 |
anamo | -6.722 |
ares | -6.680 |
aldi | -6.674 |
ARE | -6.630 |
Token | tasting |
Token ID | 26973 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
Zoro | +1.532 |
ibilities | +1.374 |
ells | +1.355 |
chapter | +1.254 |
ible | +1.218 |
Neg logit contributions | |
ATH | -1.752 |
ares | -1.541 |
aring | -1.533 |
anamo | -1.526 |
ARE | -1.515 |
Token | . |
Token ID | 13 |
Feature activation | -8.38e-01 |
Pos logit contributions | |
ATH | +1.150 |
ares | +1.016 |
aring | +1.015 |
ARE | +1.000 |
aldi | +0.993 |
Neg logit contributions | |
Zoro | -1.048 |
ibilities | -0.942 |
ells | -0.936 |
chapter | -0.853 |
ible | -0.829 |
Token |
|
Token ID | 198 |
Feature activation | -6.81e-01 |
Pos logit contributions | |
Zoro | +6.218 |
ibilities | +5.280 |
ells | +5.279 |
chapter | +5.048 |
vitamins | +4.837 |
Neg logit contributions | |
ATH | -7.632 |
anamo | -6.921 |
ares | -6.715 |
aryl | -6.707 |
merce | -6.646 |
Token |
|
Token ID | 198 |
Feature activation | -6.38e-01 |
Pos logit contributions | |
Zoro | +4.345 |
ells | +3.721 |
ibilities | +3.692 |
chapter | +3.477 |
ible | +3.308 |
Neg logit contributions | |
ATH | -6.893 |
anamo | -6.388 |
merce | -6.200 |
ares | -6.165 |
aryl | -6.155 |
Token | 7 |
Token ID | 22 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
Zoro | +4.741 |
ibilities | +4.285 |
ells | +4.205 |
chapter | +3.952 |
ible | +3.886 |
Neg logit contributions | |
ATH | -5.563 |
anamo | -5.167 |
ares | -4.998 |
Stacy | -4.978 |
Mehran | -4.955 |
Token | . |
Token ID | 13 |
Feature activation | -9.94e-01 |
Pos logit contributions | |
Zoro | +1.294 |
ibilities | +1.176 |
ells | +1.149 |
chapter | +1.060 |
vitamins | +1.042 |
Neg logit contributions | |
ATH | -1.422 |
ares | -1.246 |
aring | -1.239 |
ARE | -1.228 |
aldi | -1.212 |
Token | While |
Token ID | 2893 |
Feature activation | -5.29e-01 |
Pos logit contributions | |
Zoro | +7.670 |
ells | +6.450 |
ibilities | +6.395 |
chapter | +6.256 |
Spoon | +6.003 |
Neg logit contributions | |
ATH | -8.621 |
anamo | -7.897 |
aryl | -7.623 |
merce | -7.553 |
ares | -7.484 |
Token | we |
Token ID | 356 |
Feature activation | -6.61e-01 |
Pos logit contributions | |
Zoro | +3.699 |
ibilities | +3.206 |
ells | +3.137 |
chapter | +2.962 |
vitamins | +2.893 |
Neg logit contributions | |
ATH | -5.112 |
anamo | -4.631 |
ares | -4.544 |
aryl | -4.511 |
aring | -4.463 |
Token | are |
Token ID | 389 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
Zoro | +4.715 |
ibilities | +4.157 |
ells | +4.093 |
chapter | +3.886 |
vitamins | +3.781 |
Neg logit contributions | |
ATH | -6.131 |
anamo | -5.534 |
aryl | -5.459 |
Mehran | -5.351 |
ares | -5.350 |
Token | waiting |
Token ID | 4953 |
Feature activation | -3.80e-01 |
Pos logit contributions | |
Zoro | +0.942 |
ibilities | +0.842 |
ells | +0.831 |
chapter | +0.769 |
vitamins | +0.745 |
Neg logit contributions | |
ATH | -1.119 |
ares | -0.984 |
aring | -0.980 |
anamo | -0.977 |
ARE | -0.970 |
Token | for |
Token ID | 329 |
Feature activation | -6.15e-01 |
Pos logit contributions | |
Zoro | +2.754 |
ibilities | +2.419 |
ells | +2.388 |
chapter | +2.242 |
vitamins | +2.151 |
Neg logit contributions | |
ATH | -3.605 |
anamo | -3.197 |
ares | -3.176 |
aring | -3.142 |
ARE | -3.137 |