Token | first |
Token ID | 717 |
Feature activation | +3.30e+00 |
Pos logit contributions | |
azines | +3.356 |
culosis | +3.291 |
excluding | +3.183 |
formance | +3.181 |
Conclusion | +3.035 |
Neg logit contributions | |
IFF | -3.261 |
usefulness | -3.114 |
Unch | -3.081 |
OR | -3.064 |
ellig | -3.045 |
Token | Rapt |
Token ID | 21301 |
Feature activation | -6.29e-01 |
Pos logit contributions | |
azines | +2.493 |
culosis | +2.460 |
excluding | +2.361 |
formance | +2.357 |
Conclusion | +2.251 |
Neg logit contributions | |
IFF | -2.328 |
usefulness | -2.240 |
Unch | -2.238 |
OR | -2.210 |
ellig | -2.155 |
Token | or |
Token ID | 273 |
Feature activation | +6.81e+00 |
Pos logit contributions | |
IFF | +0.156 |
Unch | +0.150 |
usefulness | +0.147 |
ellig | +0.120 |
OR | +0.119 |
Neg logit contributions | |
azines | -0.775 |
culosis | -0.764 |
excluding | -0.745 |
formance | -0.736 |
Conclusion | -0.724 |
Token | , |
Token ID | 11 |
Feature activation | +7.90e+00 |
Pos logit contributions | |
azines | +4.570 |
culosis | +4.444 |
formance | +4.354 |
excluding | +4.316 |
excluding | +4.176 |
Neg logit contributions | |
IFF | -5.116 |
usefulness | -4.865 |
Unch | -4.797 |
OR | -4.725 |
humans | -4.658 |
Token | we |
Token ID | 356 |
Feature activation | +9.09e+00 |
Pos logit contributions | |
azines | +5.050 |
culosis | +4.885 |
excluding | +4.847 |
formance | +4.831 |
excluding | +4.677 |
Neg logit contributions | |
IFF | -6.155 |
Unch | -5.858 |
usefulness | -5.825 |
ellig | -5.748 |
OR | -5.738 |
Token | set |
Token ID | 900 |
Feature activation | +2.56e+01 |
Pos logit contributions | |
culosis | +6.150 |
azines | +6.022 |
excluding | +5.898 |
excluding | +5.746 |
cluding | +5.624 |
Neg logit contributions | |
IFF | -6.582 |
usefulness | -6.437 |
Unch | -6.264 |
OR | -6.233 |
ibrary | -6.003 |
Token | out |
Token ID | 503 |
Feature activation | +9.29e+00 |
Pos logit contributions | |
excluding | +12.396 |
azines | +11.838 |
excluding | +11.536 |
formance | +11.515 |
excludes | +11.367 |
Neg logit contributions | |
IFF | -16.753 |
ibrary | -16.711 |
ellig | -16.284 |
Unch | -15.997 |
blance | -15.812 |
Token | to |
Token ID | 284 |
Feature activation | +6.38e+00 |
Pos logit contributions | |
culosis | +6.282 |
azines | +6.246 |
excluding | +6.014 |
formance | +5.984 |
excluding | +5.773 |
Neg logit contributions | |
Unch | -6.678 |
IFF | -6.674 |
usefulness | -6.583 |
OR | -6.494 |
ellig | -6.224 |
Token | prove |
Token ID | 5879 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
culosis | +4.105 |
azines | +4.104 |
excluding | +3.916 |
formance | +3.885 |
Conclusion | +3.767 |
Neg logit contributions | |
IFF | -4.942 |
Unch | -4.761 |
usefulness | -4.721 |
OR | -4.686 |
ibrary | -4.636 |
Token | vehicle |
Token ID | 4038 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
IFF | +0.694 |
Unch | +0.686 |
usefulness | +0.684 |
OR | +0.674 |
ellig | +0.648 |
Neg logit contributions | |
azines | -0.783 |
culosis | -0.777 |
excluding | -0.738 |
formance | -0.732 |
Conclusion | -0.702 |
Token | performance |
Token ID | 2854 |
Feature activation | +5.09e+00 |
Pos logit contributions | |
azines | +1.895 |
culosis | +1.877 |
formance | +1.809 |
excluding | +1.777 |
cluding | +1.698 |
Neg logit contributions | |
IFF | -1.745 |
Unch | -1.702 |
OR | -1.656 |
usefulness | -1.635 |
ellig | -1.611 |
Token | . |
Token ID | 13 |
Feature activation | -9.38e-01 |
Pos logit contributions | |
culosis | +4.817 |
azines | +4.753 |
excluding | +4.554 |
formance | +4.551 |
Conclusion | +4.496 |
Neg logit contributions | |
IFF | -4.889 |
Unch | -4.854 |
usefulness | -4.814 |
OR | -4.796 |
humans | -4.671 |
Token | If |
Token ID | 1002 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
IFF | +0.679 |
usefulness | +0.676 |
Unch | +0.672 |
OR | +0.663 |
lif | +0.640 |
Neg logit contributions | |
azines | -0.698 |
culosis | -0.693 |
excluding | -0.657 |
formance | -0.647 |
Conclusion | -0.625 |
Token | he |
Token ID | 339 |
Feature activation | +4.22e-03 |
Pos logit contributions | |
azines | +0.284 |
culosis | +0.281 |
excluding | +0.268 |
formance | +0.263 |
Conclusion | +0.254 |
Neg logit contributions | |
IFF | -0.272 |
Unch | -0.270 |
usefulness | -0.269 |
OR | -0.265 |
lif | -0.255 |
Token | did |
Token ID | 750 |
Feature activation | -5.38e-01 |
Pos logit contributions | |
azines | +0.003 |
culosis | +0.003 |
excluding | +0.003 |
formance | +0.003 |
Conclusion | +0.003 |
Neg logit contributions | |
IFF | -0.003 |
usefulness | -0.003 |
Unch | -0.003 |
OR | -0.003 |
ellig | -0.003 |
Token | not |
Token ID | 407 |
Feature activation | +3.62e+00 |
Pos logit contributions | |
IFF | +0.387 |
usefulness | +0.384 |
Unch | +0.383 |
OR | +0.378 |
lif | +0.363 |
Neg logit contributions | |
azines | -0.403 |
culosis | -0.400 |
excluding | -0.379 |
formance | -0.374 |
Conclusion | -0.360 |
Token | set |
Token ID | 900 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
azines | +2.652 |
culosis | +2.614 |
excluding | +2.514 |
formance | +2.437 |
Conclusion | +2.412 |
Neg logit contributions | |
IFF | -2.599 |
usefulness | -2.553 |
Unch | -2.530 |
OR | -2.511 |
humans | -2.447 |
Token | it |
Token ID | 340 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
azines | +12.355 |
excluding | +11.879 |
excluding | +11.754 |
cluding | +11.722 |
culminating | +11.638 |
Neg logit contributions | |
IFF | -14.322 |
OR | -14.170 |
ibrary | -14.039 |
Unch | -13.989 |
ellig | -13.966 |
Token | in |
Token ID | 287 |
Feature activation | +5.14e+00 |
Pos logit contributions | |
azines | +7.263 |
culosis | +7.244 |
culminating | +7.168 |
excluding | +7.107 |
cluding | +7.037 |
Neg logit contributions | |
usefulness | -9.433 |
IFF | -9.370 |
OR | -9.126 |
humans | -9.124 |
Unch | -9.052 |
Token | motion |
Token ID | 6268 |
Feature activation | +6.20e-01 |
Pos logit contributions | |
azines | +5.440 |
culosis | +5.397 |
formance | +5.290 |
excluding | +5.244 |
cluding | +5.206 |
Neg logit contributions | |
IFF | -1.922 |
usefulness | -1.841 |
OR | -1.833 |
Unch | -1.823 |
humans | -1.690 |
Token | , |
Token ID | 11 |
Feature activation | -3.90e+00 |
Pos logit contributions | |
culosis | +0.457 |
azines | +0.456 |
excluding | +0.433 |
formance | +0.425 |
Conclusion | +0.413 |
Neg logit contributions | |
IFF | -0.447 |
usefulness | -0.447 |
Unch | -0.443 |
OR | -0.437 |
humans | -0.420 |
Token | he |
Token ID | 339 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
IFF | +2.626 |
usefulness | +2.625 |
Unch | +2.612 |
OR | +2.575 |
lif | +2.486 |
Neg logit contributions | |
culosis | -3.078 |
azines | -3.075 |
excluding | -2.884 |
formance | -2.869 |
cluding | -2.721 |
Token | release |
Token ID | 2650 |
Feature activation | -7.07e-02 |
Pos logit contributions | |
usefulness | +3.943 |
IFF | +3.869 |
Unch | +3.849 |
OR | +3.781 |
lif | +3.728 |
Neg logit contributions | |
azines | -4.380 |
culosis | -4.369 |
excluding | -4.122 |
formance | -4.066 |
Conclusion | -3.900 |
Token | , |
Token ID | 11 |
Feature activation | +5.65e+00 |
Pos logit contributions | |
IFF | +0.050 |
usefulness | +0.050 |
Unch | +0.050 |
OR | +0.049 |
lif | +0.047 |
Neg logit contributions | |
azines | -0.054 |
culosis | -0.053 |
excluding | -0.051 |
formance | -0.050 |
Conclusion | -0.048 |
Token | Ken |
Token ID | 7148 |
Feature activation | +5.53e+00 |
Pos logit contributions | |
azines | +3.783 |
culosis | +3.704 |
excluding | +3.564 |
formance | +3.458 |
Conclusion | +3.387 |
Neg logit contributions | |
IFF | -4.371 |
usefulness | -4.270 |
Unch | -4.253 |
OR | -4.231 |
ellig | -4.093 |
Token | y |
Token ID | 88 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
azines | +3.405 |
culosis | +3.211 |
excluding | +3.081 |
formance | +3.014 |
cluding | +2.980 |
Neg logit contributions | |
usefulness | -4.681 |
Unch | -4.672 |
IFF | -4.610 |
OR | -4.480 |
lif | -4.402 |
Token | atta |
Token ID | 25014 |
Feature activation | +7.76e+00 |
Pos logit contributions | |
azines | +6.226 |
culosis | +5.818 |
excluding | +5.735 |
formance | +5.633 |
cluding | +5.275 |
Neg logit contributions | |
usefulness | -8.142 |
Unch | -7.996 |
IFF | -7.911 |
lif | -7.866 |
OR | -7.642 |
Token | set |
Token ID | 900 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
azines | +5.142 |
culosis | +5.033 |
excluding | +4.733 |
formance | +4.672 |
culminating | +4.640 |
Neg logit contributions | |
IFF | -5.839 |
usefulness | -5.710 |
Unch | -5.607 |
OR | -5.589 |
humans | -5.555 |
Token | about |
Token ID | 546 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
azines | +11.319 |
excluding | +10.581 |
culminating | +10.320 |
excluding | +10.104 |
formance | +10.070 |
Neg logit contributions | |
IFF | -15.940 |
ibrary | -15.609 |
Unch | -15.606 |
blance | -15.469 |
OR | -15.388 |
Token | trying |
Token ID | 2111 |
Feature activation | +4.26e+00 |
Pos logit contributions | |
azines | +7.345 |
excluding | +7.246 |
culosis | +7.245 |
culminating | +7.194 |
excluding | +7.185 |
Neg logit contributions | |
IFF | -8.271 |
OR | -7.921 |
Unch | -7.848 |
usefulness | -7.804 |
humans | -7.770 |
Token | to |
Token ID | 284 |
Feature activation | +5.82e+00 |
Pos logit contributions | |
azines | +3.472 |
culosis | +3.454 |
excluding | +3.270 |
formance | +3.238 |
Conclusion | +3.124 |
Neg logit contributions | |
IFF | -2.772 |
Unch | -2.733 |
usefulness | -2.722 |
OR | -2.683 |
humans | -2.553 |
Token | ensure |
Token ID | 4155 |
Feature activation | +8.33e+00 |
Pos logit contributions | |
azines | +4.049 |
culosis | +4.031 |
excluding | +3.762 |
Conclusion | +3.722 |
formance | +3.687 |
Neg logit contributions | |
IFF | -4.287 |
usefulness | -4.153 |
Unch | -4.151 |
OR | -4.132 |
humans | -4.051 |
Token | that |
Token ID | 326 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
azines | +5.668 |
culosis | +5.573 |
excluding | +5.369 |
formance | +5.338 |
Conclusion | +5.193 |
Neg logit contributions | |
IFF | -6.043 |
OR | -5.908 |
Unch | -5.889 |
usefulness | -5.736 |
ellig | -5.720 |
Token |
|
Token ID | 198 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
azines | +0.958 |
culosis | +0.953 |
excluding | +0.908 |
formance | +0.886 |
Conclusion | +0.874 |
Neg logit contributions | |
usefulness | -0.838 |
IFF | -0.834 |
Unch | -0.816 |
OR | -0.804 |
ellig | -0.784 |
Token |
|
Token ID | 198 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
azines | +1.348 |
excluding | +1.309 |
culosis | +1.300 |
formance | +1.263 |
Conclusion | +1.231 |
Neg logit contributions | |
usefulness | -1.345 |
Unch | -1.335 |
IFF | -1.312 |
OR | -1.259 |
ellig | -1.248 |
Token | � |
Token ID | 447 |
Feature activation | +7.18e-01 |
Pos logit contributions | |
azines | +1.100 |
culosis | +1.092 |
excluding | +1.035 |
formance | +1.020 |
Conclusion | +0.982 |
Neg logit contributions | |
IFF | -1.045 |
usefulness | -1.040 |
Unch | -1.039 |
OR | -1.019 |
lif | -0.983 |
Token | � |
Token ID | 246 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
azines | +0.582 |
culosis | +0.578 |
excluding | +0.549 |
formance | +0.543 |
Conclusion | +0.524 |
Neg logit contributions | |
IFF | -0.473 |
usefulness | -0.470 |
Unch | -0.469 |
OR | -0.460 |
lif | -0.442 |
Token | I |
Token ID | 40 |
Feature activation | +4.56e+00 |
Pos logit contributions | |
azines | +1.332 |
culosis | +1.306 |
excluding | +1.275 |
formance | +1.226 |
cluding | +1.199 |
Neg logit contributions | |
usefulness | -1.144 |
Unch | -1.131 |
IFF | -1.117 |
OR | -1.069 |
ellig | -1.068 |
Token | set |
Token ID | 900 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
culosis | +3.029 |
azines | +3.019 |
excluding | +2.808 |
formance | +2.692 |
cluding | +2.689 |
Neg logit contributions | |
IFF | -3.552 |
usefulness | -3.536 |
Unch | -3.523 |
OR | -3.441 |
ellig | -3.374 |
Token | off |
Token ID | 572 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
azines | +12.049 |
excluding | +11.634 |
culminating | +11.300 |
excluding | +11.243 |
cluding | +11.239 |
Neg logit contributions | |
IFF | -14.896 |
ellig | -14.685 |
ibrary | -14.681 |
OR | -14.579 |
Unch | -14.576 |
Token | on |
Token ID | 319 |
Feature activation | +4.55e+00 |
Pos logit contributions | |
azines | +0.868 |
culosis | +0.856 |
excluding | +0.815 |
formance | +0.795 |
cluding | +0.771 |
Neg logit contributions | |
IFF | -0.871 |
usefulness | -0.859 |
Unch | -0.854 |
OR | -0.847 |
ellig | -0.821 |
Token | the |
Token ID | 262 |
Feature activation | +5.63e+00 |
Pos logit contributions | |
azines | +3.105 |
culosis | +3.086 |
excluding | +2.925 |
formance | +2.845 |
cluding | +2.819 |
Neg logit contributions | |
IFF | -3.461 |
Unch | -3.348 |
usefulness | -3.327 |
ellig | -3.298 |
OR | -3.296 |
Token | path |
Token ID | 3108 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
azines | +4.282 |
culosis | +4.121 |
excluding | +4.041 |
formance | +3.942 |
Conclusion | +3.938 |
Neg logit contributions | |
IFF | -3.863 |
Unch | -3.637 |
usefulness | -3.628 |
OR | -3.626 |
ellig | -3.608 |
Token | of |
Token ID | 286 |
Feature activation | +8.88e-01 |
Pos logit contributions | |
azines | +1.070 |
culosis | +1.066 |
excluding | +1.014 |
formance | +0.989 |
Conclusion | +0.964 |
Neg logit contributions | |
IFF | -0.983 |
usefulness | -0.974 |
Unch | -0.966 |
OR | -0.951 |
ellig | -0.915 |
Token | your |
Token ID | 534 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
IFF | +1.862 |
usefulness | +1.850 |
Unch | +1.847 |
OR | +1.819 |
lif | +1.750 |
Neg logit contributions | |
azines | -2.003 |
culosis | -1.989 |
excluding | -1.883 |
formance | -1.858 |
Conclusion | -1.787 |
Token | garden |
Token ID | 11376 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
azines | +2.534 |
culosis | +2.460 |
excluding | +2.399 |
formance | +2.329 |
Conclusion | +2.276 |
Neg logit contributions | |
IFF | -2.416 |
Unch | -2.371 |
OR | -2.320 |
usefulness | -2.312 |
ellig | -2.267 |
Token | , |
Token ID | 11 |
Feature activation | +2.94e+00 |
Pos logit contributions | |
azines | +2.364 |
culosis | +2.339 |
excluding | +2.234 |
formance | +2.150 |
Conclusion | +2.132 |
Neg logit contributions | |
IFF | -2.735 |
Unch | -2.706 |
usefulness | -2.668 |
OR | -2.645 |
ellig | -2.592 |
Token | is |
Token ID | 318 |
Feature activation | -5.10e-01 |
Pos logit contributions | |
azines | +2.209 |
culosis | +2.170 |
excluding | +2.097 |
formance | +2.000 |
Conclusion | +1.982 |
Neg logit contributions | |
IFF | -2.100 |
Unch | -2.055 |
usefulness | -2.039 |
OR | -2.014 |
ellig | -1.965 |
Token | to |
Token ID | 284 |
Feature activation | +8.34e+00 |
Pos logit contributions | |
IFF | +0.330 |
usefulness | +0.327 |
Unch | +0.327 |
OR | +0.322 |
lif | +0.308 |
Neg logit contributions | |
azines | -0.419 |
culosis | -0.417 |
excluding | -0.396 |
formance | -0.391 |
Conclusion | -0.378 |
Token | set |
Token ID | 900 |
Feature activation | +2.30e+01 |
Pos logit contributions | |
azines | +5.442 |
culosis | +5.373 |
excluding | +5.111 |
disregard | +5.021 |
Conclusion | +4.999 |
Neg logit contributions | |
IFF | -6.220 |
usefulness | -6.054 |
Unch | -6.024 |
humans | -5.908 |
OR | -5.854 |
Token | aside |
Token ID | 7263 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
excluding | +12.401 |
azines | +12.326 |
excluding | +11.966 |
culosis | +11.817 |
excludes | +11.794 |
Neg logit contributions | |
IFF | -13.696 |
blance | -13.631 |
Unch | -13.600 |
ellig | -13.490 |
ibrary | -13.427 |
Token | an |
Token ID | 281 |
Feature activation | +4.47e+00 |
Pos logit contributions | |
azines | +1.242 |
culosis | +1.220 |
excluding | +1.174 |
formance | +1.148 |
Conclusion | +1.115 |
Neg logit contributions | |
IFF | -1.140 |
usefulness | -1.123 |
Unch | -1.118 |
OR | -1.104 |
ellig | -1.073 |
Token | area |
Token ID | 1989 |
Feature activation | -9.25e-01 |
Pos logit contributions | |
azines | +3.210 |
culosis | +3.149 |
excluding | +3.097 |
formance | +2.995 |
cluding | +2.877 |
Neg logit contributions | |
IFF | -3.250 |
usefulness | -3.197 |
Unch | -3.157 |
OR | -3.079 |
humans | -3.078 |
Token | as |
Token ID | 355 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
IFF | +0.639 |
Unch | +0.633 |
usefulness | +0.632 |
OR | +0.621 |
ellig | +0.597 |
Neg logit contributions | |
azines | -0.719 |
culosis | -0.714 |
excluding | -0.681 |
formance | -0.669 |
Conclusion | -0.646 |
Token | a |
Token ID | 257 |
Feature activation | +5.70e+00 |
Pos logit contributions | |
IFF | +0.789 |
usefulness | +0.783 |
Unch | +0.783 |
OR | +0.771 |
ellig | +0.738 |
Neg logit contributions | |
azines | -0.916 |
culosis | -0.908 |
excluding | -0.865 |
formance | -0.850 |
Conclusion | -0.823 |
Token | his |
Token ID | 465 |
Feature activation | -3.97e+00 |
Pos logit contributions | |
IFF | +0.863 |
usefulness | +0.856 |
Unch | +0.856 |
OR | +0.842 |
lif | +0.809 |
Neg logit contributions | |
azines | -0.962 |
culosis | -0.955 |
excluding | -0.905 |
formance | -0.894 |
Conclusion | -0.861 |
Token | 15 |
Token ID | 1315 |
Feature activation | -3.63e+00 |
Pos logit contributions | |
usefulness | +2.797 |
IFF | +2.763 |
Unch | +2.759 |
OR | +2.715 |
lif | +2.657 |
Neg logit contributions | |
azines | -3.046 |
culosis | -3.031 |
excluding | -2.857 |
formance | -2.827 |
cluding | -2.705 |
Token | year |
Token ID | 614 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
IFF | +2.238 |
Unch | +2.208 |
usefulness | +2.205 |
OR | +2.192 |
lif | +2.118 |
Neg logit contributions | |
azines | -3.080 |
culosis | -3.076 |
excluding | -2.903 |
formance | -2.898 |
Conclusion | -2.781 |
Token | strategy |
Token ID | 4811 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
usefulness | +6.892 |
lif | +6.683 |
OR | +6.589 |
IFF | +6.542 |
Unch | +6.492 |
Neg logit contributions | |
azines | -7.550 |
culosis | -7.467 |
excluding | -7.065 |
formance | -6.963 |
cluding | -6.681 |
Token | to |
Token ID | 284 |
Feature activation | +6.66e+00 |
Pos logit contributions | |
azines | +0.823 |
culosis | +0.814 |
excluding | +0.784 |
formance | +0.770 |
cluding | +0.744 |
Neg logit contributions | |
IFF | -0.734 |
Unch | -0.722 |
usefulness | -0.719 |
OR | -0.713 |
humans | -0.687 |
Token | set |
Token ID | 900 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
culosis | +4.757 |
azines | +4.739 |
excluding | +4.473 |
formance | +4.354 |
Conclusion | +4.333 |
Neg logit contributions | |
IFF | -4.760 |
Unch | -4.583 |
usefulness | -4.555 |
OR | -4.535 |
humans | -4.473 |
Token | right |
Token ID | 826 |
Feature activation | +5.05e+00 |
Pos logit contributions | |
azines | +12.259 |
culminating | +11.699 |
excluding | +11.618 |
excluding | +11.519 |
culosis | +11.480 |
Neg logit contributions | |
IFF | -14.295 |
Unch | -14.245 |
ibrary | -14.113 |
blance | -13.867 |
OR | -13.728 |
Token | what |
Token ID | 644 |
Feature activation | +2.77e+00 |
Pos logit contributions | |
azines | +3.665 |
culosis | +3.648 |
excluding | +3.452 |
formance | +3.439 |
Conclusion | +3.306 |
Neg logit contributions | |
Unch | -3.598 |
IFF | -3.591 |
usefulness | -3.562 |
OR | -3.473 |
ellig | -3.390 |
Token | went |
Token ID | 1816 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
azines | +1.895 |
culosis | +1.877 |
excluding | +1.772 |
formance | +1.736 |
Conclusion | +1.690 |
Neg logit contributions | |
IFF | -2.136 |
Unch | -2.121 |
usefulness | -2.108 |
OR | -2.078 |
ellig | -2.014 |
Token | wrong |
Token ID | 2642 |
Feature activation | +3.03e+00 |
Pos logit contributions | |
IFF | +3.015 |
Unch | +2.996 |
usefulness | +2.991 |
OR | +2.962 |
lif | +2.883 |
Neg logit contributions | |
azines | -2.007 |
culosis | -1.987 |
excluding | -1.836 |
formance | -1.819 |
Conclusion | -1.718 |
Token | when |
Token ID | 618 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
culosis | +2.086 |
azines | +2.079 |
excluding | +1.997 |
formance | +1.941 |
Conclusion | +1.901 |
Neg logit contributions | |
IFF | -2.293 |
usefulness | -2.266 |
Unch | -2.235 |
OR | -2.211 |
ellig | -2.157 |
Token | if |
Token ID | 611 |
Feature activation | +5.66e+00 |
Pos logit contributions | |
azines | +4.011 |
culosis | +3.981 |
excluding | +3.927 |
excluding | +3.776 |
cluding | +3.724 |
Neg logit contributions | |
IFF | -3.685 |
usefulness | -3.613 |
Unch | -3.583 |
OR | -3.568 |
ellig | -3.467 |
Token | it |
Token ID | 340 |
Feature activation | +6.46e+00 |
Pos logit contributions | |
azines | +4.306 |
culosis | +4.215 |
excluding | +4.114 |
excluding | +3.936 |
formance | +3.936 |
Neg logit contributions | |
IFF | -3.832 |
Unch | -3.726 |
OR | -3.711 |
usefulness | -3.684 |
humans | -3.587 |
Token | succeeds |
Token ID | 31137 |
Feature activation | -5.00e-01 |
Pos logit contributions | |
azines | +4.438 |
culosis | +4.421 |
excluding | +4.220 |
excludes | +4.045 |
formance | +4.029 |
Neg logit contributions | |
IFF | -4.741 |
usefulness | -4.717 |
Unch | -4.708 |
OR | -4.659 |
humans | -4.484 |
Token | , |
Token ID | 11 |
Feature activation | +4.44e+00 |
Pos logit contributions | |
IFF | +0.355 |
usefulness | +0.352 |
Unch | +0.351 |
OR | +0.345 |
lif | +0.332 |
Neg logit contributions | |
azines | -0.378 |
culosis | -0.376 |
excluding | -0.357 |
formance | -0.351 |
Conclusion | -0.340 |
Token | is |
Token ID | 318 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
azines | +3.033 |
culosis | +3.031 |
excluding | +2.894 |
formance | +2.768 |
Conclusion | +2.750 |
Neg logit contributions | |
IFF | -3.388 |
Unch | -3.316 |
usefulness | -3.314 |
OR | -3.291 |
ellig | -3.179 |
Token | setting |
Token ID | 4634 |
Feature activation | +2.26e+01 |
Pos logit contributions | |
azines | +2.319 |
culosis | +2.303 |
excluding | +2.217 |
formance | +2.155 |
Conclusion | +2.084 |
Neg logit contributions | |
IFF | -2.395 |
Unch | -2.352 |
usefulness | -2.351 |
OR | -2.316 |
ellig | -2.249 |
Token | up |
Token ID | 510 |
Feature activation | +4.14e+00 |
Pos logit contributions | |
azines | +12.606 |
excluding | +12.394 |
culminating | +12.268 |
excluding | +12.041 |
cluding | +11.919 |
Neg logit contributions | |
IFF | -13.768 |
OR | -12.940 |
ellig | -12.893 |
blance | -12.847 |
Unch | -12.836 |
Token | the |
Token ID | 262 |
Feature activation | +2.36e+00 |
Pos logit contributions | |
azines | +2.991 |
culosis | +2.940 |
excluding | +2.804 |
formance | +2.759 |
Conclusion | +2.700 |
Neg logit contributions | |
IFF | -3.016 |
usefulness | -2.946 |
Unch | -2.939 |
OR | -2.927 |
ellig | -2.804 |
Token | case |
Token ID | 1339 |
Feature activation | -4.70e+00 |
Pos logit contributions | |
azines | +1.893 |
culosis | +1.867 |
excluding | +1.789 |
formance | +1.754 |
Conclusion | +1.726 |
Neg logit contributions | |
IFF | -1.562 |
Unch | -1.526 |
usefulness | -1.520 |
OR | -1.506 |
humans | -1.450 |
Token | for |
Token ID | 329 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
IFF | +2.635 |
Unch | +2.618 |
usefulness | +2.614 |
OR | +2.564 |
lif | +2.448 |
Neg logit contributions | |
azines | -4.225 |
culosis | -4.204 |
excluding | -3.998 |
formance | -3.974 |
Conclusion | -3.835 |
Token | an |
Token ID | 281 |
Feature activation | +4.25e+00 |
Pos logit contributions | |
azines | +0.925 |
culosis | +0.919 |
excluding | +0.879 |
formance | +0.863 |
Conclusion | +0.841 |
Neg logit contributions | |
IFF | -0.880 |
usefulness | -0.862 |
Unch | -0.862 |
OR | -0.854 |
ellig | -0.821 |
Token | reon |
Token ID | 21833 |
Feature activation | +7.71e+00 |
Pos logit contributions | |
azines | +4.588 |
excluding | +4.273 |
culosis | +4.249 |
formance | +4.187 |
cluding | +3.952 |
Neg logit contributions | |
Unch | -6.650 |
usefulness | -6.597 |
IFF | -6.522 |
lif | -6.231 |
standoff | -6.155 |
Token | in |
Token ID | 287 |
Feature activation | +4.59e+00 |
Pos logit contributions | |
culosis | +5.325 |
azines | +5.295 |
excluding | +5.118 |
formance | +5.059 |
Conclusion | +5.048 |
Neg logit contributions | |
IFF | -5.301 |
usefulness | -5.234 |
OR | -5.048 |
humans | -5.039 |
ellig | -5.020 |
Token | 2011 |
Token ID | 2813 |
Feature activation | +6.82e-01 |
Pos logit contributions | |
azines | +2.869 |
culosis | +2.779 |
formance | +2.711 |
excluding | +2.710 |
Conclusion | +2.673 |
Neg logit contributions | |
IFF | -3.720 |
Unch | -3.616 |
usefulness | -3.613 |
OR | -3.560 |
ellig | -3.508 |
Token | , |
Token ID | 11 |
Feature activation | +6.11e+00 |
Pos logit contributions | |
azines | +0.507 |
culosis | +0.503 |
excluding | +0.481 |
formance | +0.472 |
Conclusion | +0.457 |
Neg logit contributions | |
IFF | -0.491 |
usefulness | -0.489 |
Unch | -0.484 |
OR | -0.475 |
ellig | -0.460 |
Token | bas |
Token ID | 1615 |
Feature activation | +8.08e+00 |
Pos logit contributions | |
azines | +4.192 |
excluding | +4.081 |
culosis | +4.016 |
formance | +3.896 |
culminating | +3.882 |
Neg logit contributions | |
IFF | -4.560 |
Unch | -4.441 |
usefulness | -4.398 |
ellig | -4.306 |
OR | -4.295 |
Token | ing |
Token ID | 278 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
azines | +7.168 |
culosis | +7.094 |
cluding | +6.886 |
formance | +6.865 |
excluding | +6.823 |
Neg logit contributions | |
IFF | -4.407 |
usefulness | -4.172 |
Unch | -4.148 |
OR | -4.033 |
humans | -3.893 |
Token | it |
Token ID | 340 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
excluding | +12.076 |
culosis | +11.866 |
azines | +11.845 |
formance | +11.689 |
Conclusion | +11.688 |
Neg logit contributions | |
IFF | -13.585 |
ellig | -13.067 |
humans | -12.407 |
Unch | -12.293 |
OR | -12.091 |
Token | off |
Token ID | 572 |
Feature activation | +4.30e-01 |
Pos logit contributions | |
excluding | +7.393 |
azines | +7.317 |
formance | +7.311 |
culosis | +7.220 |
Conclusion | +6.989 |
Neg logit contributions | |
IFF | -11.824 |
Unch | -11.345 |
humans | -11.272 |
usefulness | -11.261 |
ellig | -11.040 |
Token | three |
Token ID | 1115 |
Feature activation | -9.98e-01 |
Pos logit contributions | |
azines | +0.343 |
culosis | +0.340 |
excluding | +0.323 |
formance | +0.320 |
Conclusion | +0.308 |
Neg logit contributions | |
IFF | -0.289 |
usefulness | -0.286 |
Unch | -0.286 |
OR | -0.282 |
lif | -0.270 |
Token | existing |
Token ID | 4683 |
Feature activation | -4.82e+00 |
Pos logit contributions | |
IFF | +0.683 |
usefulness | +0.676 |
Unch | +0.676 |
OR | +0.664 |
ellig | +0.639 |
Neg logit contributions | |
azines | -0.783 |
culosis | -0.773 |
excluding | -0.738 |
formance | -0.727 |
Conclusion | -0.703 |
Token | root |
Token ID | 6808 |
Feature activation | -5.86e+00 |
Pos logit contributions | |
usefulness | +3.444 |
Unch | +3.433 |
IFF | +3.416 |
OR | +3.384 |
lif | +3.302 |
Neg logit contributions | |
culosis | -3.622 |
azines | -3.603 |
excluding | -3.392 |
formance | -3.356 |
cluding | -3.202 |
Token | is |
Token ID | 318 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
azines | +4.401 |
culosis | +4.304 |
excluding | +4.141 |
formance | +3.952 |
excludes | +3.874 |
Neg logit contributions | |
IFF | -5.173 |
usefulness | -5.055 |
Unch | -5.046 |
OR | -4.965 |
ellig | -4.891 |
Token | quickly |
Token ID | 2952 |
Feature activation | +4.40e+00 |
Pos logit contributions | |
azines | +1.147 |
culosis | +1.135 |
excluding | +1.083 |
formance | +1.057 |
Conclusion | +1.030 |
Neg logit contributions | |
IFF | -1.122 |
Unch | -1.098 |
usefulness | -1.095 |
OR | -1.079 |
ellig | -1.053 |
Token | becoming |
Token ID | 5033 |
Feature activation | +6.25e+00 |
Pos logit contributions | |
azines | +2.896 |
culosis | +2.891 |
excluding | +2.797 |
cluding | +2.651 |
excluding | +2.632 |
Neg logit contributions | |
IFF | -3.414 |
Unch | -3.348 |
usefulness | -3.293 |
OR | -3.266 |
ellig | -3.202 |
Token | one |
Token ID | 530 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
culosis | +4.215 |
azines | +4.204 |
excluding | +3.991 |
formance | +3.847 |
Conclusion | +3.831 |
Neg logit contributions | |
IFF | -4.631 |
usefulness | -4.512 |
Unch | -4.486 |
OR | -4.459 |
ellig | -4.413 |
Token | of |
Token ID | 286 |
Feature activation | +8.16e+00 |
Pos logit contributions | |
azines | +7.596 |
culosis | +7.451 |
formance | +7.240 |
excluding | +7.154 |
Conclusion | +7.060 |
Neg logit contributions | |
IFF | -8.805 |
Unch | -8.670 |
usefulness | -8.598 |
OR | -8.521 |
ellig | -8.413 |
Token | my |
Token ID | 616 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
azines | +5.469 |
culosis | +5.302 |
excluding | +5.142 |
formance | +4.949 |
cluding | +4.947 |
Neg logit contributions | |
IFF | -6.118 |
Unch | -5.949 |
ellig | -5.872 |
usefulness | -5.868 |
OR | -5.809 |
Token | favorite |
Token ID | 4004 |
Feature activation | +8.92e+00 |
Pos logit contributions | |
azines | +12.333 |
excluding | +11.560 |
foremost | +11.341 |
Conclusion | +11.312 |
cluding | +11.275 |
Neg logit contributions | |
IFF | -14.413 |
ellig | -13.470 |
Unch | -13.352 |
humans | -13.206 |
usefulness | -13.049 |
Token | fl |
Token ID | 781 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
azines | +6.097 |
excluding | +5.658 |
culosis | +5.597 |
formance | +5.484 |
Conclusion | +5.482 |
Neg logit contributions | |
IFF | -6.673 |
Unch | -6.450 |
OR | -6.301 |
ellig | -6.271 |
usefulness | -6.203 |
Token | ours |
Token ID | 4662 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
IFF | +0.546 |
Unch | +0.543 |
usefulness | +0.530 |
OR | +0.470 |
lif | +0.456 |
Neg logit contributions | |
azines | -2.257 |
culosis | -2.220 |
excluding | -2.162 |
formance | -2.154 |
cluding | -2.102 |
Token | to |
Token ID | 284 |
Feature activation | +5.38e+00 |
Pos logit contributions | |
azines | +2.522 |
culosis | +2.456 |
excluding | +2.384 |
formance | +2.322 |
Conclusion | +2.262 |
Neg logit contributions | |
IFF | -2.430 |
Unch | -2.375 |
usefulness | -2.367 |
OR | -2.333 |
ellig | -2.268 |
Token | work |
Token ID | 670 |
Feature activation | +6.47e+00 |
Pos logit contributions | |
azines | +3.198 |
culosis | +3.111 |
excluding | +2.927 |
formance | +2.846 |
Conclusion | +2.767 |
Neg logit contributions | |
IFF | -4.640 |
Unch | -4.514 |
OR | -4.450 |
usefulness | -4.425 |
humans | -4.333 |
Token | — |
Token ID | 960 |
Feature activation | -3.99e+00 |
Pos logit contributions | |
culosis | +3.420 |
azines | +3.401 |
excluding | +3.271 |
formance | +3.147 |
Conclusion | +3.089 |
Neg logit contributions | |
usefulness | -3.728 |
IFF | -3.700 |
Unch | -3.657 |
OR | -3.602 |
humans | -3.518 |
Token | one |
Token ID | 505 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
IFF | +2.607 |
usefulness | +2.561 |
OR | +2.559 |
Unch | +2.553 |
humans | +2.433 |
Neg logit contributions | |
azines | -3.253 |
culosis | -3.231 |
formance | -3.028 |
excluding | -3.026 |
Conclusion | -2.920 |
Token | that |
Token ID | 326 |
Feature activation | +4.31e+00 |
Pos logit contributions | |
culminating | +7.090 |
azines | +7.086 |
culosis | +7.006 |
excluding | +6.994 |
excluding | +6.870 |
Neg logit contributions | |
Unch | -8.845 |
IFF | -8.840 |
OR | -8.628 |
usefulness | -8.572 |
humans | -8.559 |
Token | would |
Token ID | 561 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
azines | +3.012 |
culosis | +3.012 |
excluding | +2.882 |
formance | +2.781 |
Conclusion | +2.780 |
Neg logit contributions | |
IFF | -3.145 |
usefulness | -3.084 |
Unch | -3.080 |
OR | -3.060 |
humans | -2.958 |
Token | have |
Token ID | 423 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
azines | +1.889 |
culosis | +1.881 |
excluding | +1.791 |
formance | +1.741 |
Conclusion | +1.709 |
Neg logit contributions | |
IFF | -1.958 |
Unch | -1.948 |
usefulness | -1.936 |
OR | -1.907 |
humans | -1.853 |
Token | set |
Token ID | 900 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
azines | +2.699 |
culosis | +2.646 |
excluding | +2.603 |
formance | +2.474 |
excluding | +2.474 |
Neg logit contributions | |
IFF | -2.596 |
Unch | -2.571 |
OR | -2.512 |
usefulness | -2.505 |
humans | -2.441 |
Token | preced |
Token ID | 8555 |
Feature activation | -6.27e+00 |
Pos logit contributions | |
azines | +11.983 |
culminating | +11.557 |
excluding | +11.396 |
cluding | +11.247 |
excluding | +11.176 |
Neg logit contributions | |
IFF | -13.002 |
Unch | -12.987 |
ibrary | -12.874 |
OR | -12.760 |
blance | -12.734 |
Token | ents |
Token ID | 658 |
Feature activation | -2.14e+00 |
Pos logit contributions | |
IFF | +2.818 |
usefulness | +2.756 |
Unch | +2.733 |
OR | +2.720 |
humans | +2.614 |
Neg logit contributions | |
culosis | -6.247 |
azines | -6.239 |
excluding | -6.025 |
formance | -5.891 |
Conclusion | -5.771 |
Token | , |
Token ID | 11 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
IFF | +1.346 |
usefulness | +1.335 |
Unch | +1.332 |
OR | +1.311 |
lif | +1.251 |
Neg logit contributions | |
azines | -1.801 |
culosis | -1.791 |
excluding | -1.706 |
formance | -1.686 |
Conclusion | -1.630 |
Token | raised |
Token ID | 4376 |
Feature activation | +5.61e+00 |
Pos logit contributions | |
IFF | +1.013 |
Unch | +1.004 |
usefulness | +1.002 |
OR | +0.989 |
ellig | +0.947 |
Neg logit contributions | |
azines | -1.103 |
culosis | -1.094 |
excluding | -1.037 |
formance | -1.023 |
Conclusion | -0.987 |
Token | expectations |
Token ID | 9027 |
Feature activation | +4.99e+00 |
Pos logit contributions | |
azines | +4.094 |
culosis | +4.037 |
excluding | +3.828 |
formance | +3.798 |
Conclusion | +3.797 |
Neg logit contributions | |
Unch | -3.889 |
IFF | -3.866 |
OR | -3.829 |
usefulness | -3.785 |
humans | -3.677 |
Token | 10 |
Token ID | 838 |
Feature activation | +5.68e+00 |
Pos logit contributions | |
azines | +1.885 |
culosis | +1.850 |
excluding | +1.809 |
formance | +1.753 |
Conclusion | +1.736 |
Neg logit contributions | |
IFF | -1.229 |
Unch | -1.200 |
usefulness | -1.200 |
ellig | -1.175 |
OR | -1.154 |
Token | years |
Token ID | 812 |
Feature activation | +4.80e+00 |
Pos logit contributions | |
azines | +4.543 |
culosis | +4.416 |
excluding | +4.305 |
formance | +4.181 |
cluding | +4.056 |
Neg logit contributions | |
IFF | -3.723 |
usefulness | -3.717 |
Unch | -3.636 |
OR | -3.515 |
ellig | -3.504 |
Token | and |
Token ID | 290 |
Feature activation | +6.05e+00 |
Pos logit contributions | |
azines | +3.258 |
culosis | +3.154 |
excluding | +3.050 |
formance | +2.943 |
Conclusion | +2.904 |
Neg logit contributions | |
IFF | -3.730 |
usefulness | -3.654 |
Unch | -3.645 |
ellig | -3.551 |
OR | -3.549 |
Token | older |
Token ID | 4697 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
azines | +3.145 |
culosis | +2.945 |
excluding | +2.870 |
excluding | +2.775 |
formance | +2.739 |
Neg logit contributions | |
IFF | -5.628 |
Unch | -5.437 |
usefulness | -5.423 |
ellig | -5.423 |
OR | -5.357 |
Token | , |
Token ID | 11 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
azines | +9.514 |
excluding | +9.398 |
excluding | +9.316 |
culosis | +8.949 |
culminating | +8.809 |
Neg logit contributions | |
IFF | -11.030 |
usefulness | -10.802 |
ellig | -10.707 |
blance | -10.557 |
humans | -10.554 |
Token | by |
Token ID | 416 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
azines | +7.158 |
excluding | +7.082 |
excluding | +6.883 |
culosis | +6.859 |
Conclusion | +6.684 |
Neg logit contributions | |
IFF | -8.891 |
ellig | -8.601 |
Unch | -8.295 |
usefulness | -8.279 |
humans | -8.267 |
Token | sex |
Token ID | 1714 |
Feature activation | +6.84e+00 |
Pos logit contributions | |
excluding | +12.236 |
culosis | +11.874 |
azines | +11.837 |
excluding | +11.795 |
cessation | +11.628 |
Neg logit contributions | |
IFF | -13.227 |
humans | -13.008 |
Unch | -12.901 |
ellig | -12.851 |
oS | -12.587 |
Token | , |
Token ID | 11 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
azines | +4.834 |
culosis | +4.713 |
excluding | +4.639 |
formance | +4.495 |
cluding | +4.350 |
Neg logit contributions | |
IFF | -5.092 |
usefulness | -4.932 |
Unch | -4.911 |
humans | -4.864 |
OR | -4.771 |
Token | United |
Token ID | 1578 |
Feature activation | +9.60e+00 |
Pos logit contributions | |
azines | +8.527 |
excluding | +8.383 |
excluding | +8.327 |
culosis | +8.251 |
culminating | +8.103 |
Neg logit contributions | |
IFF | -9.543 |
ellig | -9.286 |
humans | -9.197 |
Unch | -9.161 |
oS | -8.922 |
Token | States |
Token ID | 1829 |
Feature activation | +8.58e+00 |
Pos logit contributions | |
azines | +4.777 |
culosis | +4.672 |
excluding | +4.496 |
Conclusion | +4.447 |
Franch | +4.215 |
Neg logit contributions | |
IFF | -8.731 |
usefulness | -8.549 |
blance | -8.424 |
ellig | -8.280 |
imeo | -8.087 |
Token | , |
Token ID | 11 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
azines | +6.034 |
culosis | +5.926 |
excluding | +5.798 |
formance | +5.522 |
excluding | +5.519 |
Neg logit contributions | |
IFF | -6.286 |
usefulness | -6.057 |
Unch | -5.893 |
humans | -5.881 |
ellig | -5.816 |
Token | Beat |
Token ID | 12568 |
Feature activation | +8.52e+00 |
Pos logit contributions | |
azines | +3.475 |
culosis | +3.433 |
excluding | +3.210 |
formance | +3.120 |
Conclusion | +3.057 |
Neg logit contributions | |
IFF | -3.536 |
usefulness | -3.453 |
Unch | -3.434 |
OR | -3.357 |
humans | -3.350 |
Token | rice |
Token ID | 20970 |
Feature activation | +7.08e+00 |
Pos logit contributions | |
azines | +4.193 |
culosis | +4.108 |
excluding | +3.649 |
formance | +3.525 |
cluding | +3.445 |
Neg logit contributions | |
IFF | -8.058 |
Unch | -7.938 |
usefulness | -7.887 |
OR | -7.757 |
humans | -7.537 |
Token | Joyce |
Token ID | 25936 |
Feature activation | +3.04e+00 |
Pos logit contributions | |
azines | +4.981 |
culosis | +4.899 |
excluding | +4.595 |
Conclusion | +4.475 |
formance | +4.454 |
Neg logit contributions | |
IFF | -5.178 |
usefulness | -5.074 |
Unch | -4.930 |
OR | -4.922 |
humans | -4.860 |
Token | Ke |
Token ID | 3873 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
azines | +2.179 |
culosis | +2.159 |
excluding | +2.033 |
formance | +1.975 |
Conclusion | +1.938 |
Neg logit contributions | |
IFF | -2.274 |
usefulness | -2.254 |
Unch | -2.218 |
OR | -2.188 |
humans | -2.133 |
Token | an |
Token ID | 272 |
Feature activation | -3.31e-01 |
Pos logit contributions | |
azines | +1.492 |
culosis | +1.474 |
excluding | +1.389 |
formance | +1.388 |
cluding | +1.337 |
Neg logit contributions | |
IFF | -1.227 |
usefulness | -1.223 |
Unch | -1.222 |
OR | -1.194 |
lif | -1.147 |
Token | set |
Token ID | 900 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
IFF | +0.244 |
usefulness | +0.242 |
Unch | +0.242 |
OR | +0.237 |
lif | +0.229 |
Neg logit contributions | |
azines | -0.243 |
culosis | -0.242 |
excluding | -0.228 |
formance | -0.224 |
Conclusion | -0.216 |
Token | up |
Token ID | 510 |
Feature activation | +3.81e+00 |
Pos logit contributions | |
azines | +11.810 |
culosis | +11.001 |
excluding | +10.833 |
excluding | +10.725 |
culminating | +10.605 |
Neg logit contributions | |
IFF | -13.682 |
ellig | -13.075 |
Unch | -13.051 |
OR | -12.905 |
ibrary | -12.686 |
Token | the |
Token ID | 262 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
azines | +2.875 |
culosis | +2.860 |
excluding | +2.680 |
formance | +2.603 |
cluding | +2.566 |
Neg logit contributions | |
IFF | -2.670 |
usefulness | -2.626 |
Unch | -2.597 |
OR | -2.594 |
ellig | -2.535 |
Token | Joyce |
Token ID | 25936 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
azines | +0.901 |
culosis | +0.896 |
excluding | +0.846 |
formance | +0.830 |
Conclusion | +0.806 |
Neg logit contributions | |
IFF | -0.840 |
usefulness | -0.828 |
Unch | -0.826 |
OR | -0.818 |
ellig | -0.789 |
Token | Foundation |
Token ID | 5693 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
azines | +1.001 |
culosis | +0.997 |
excluding | +0.935 |
formance | +0.920 |
Conclusion | +0.889 |
Neg logit contributions | |
IFF | -1.022 |
usefulness | -1.018 |
Unch | -1.010 |
OR | -0.997 |
ellig | -0.959 |
Token | in |
Token ID | 287 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
IFF | +0.970 |
usefulness | +0.961 |
Unch | +0.959 |
OR | +0.943 |
lif | +0.908 |
Neg logit contributions | |
azines | -1.027 |
culosis | -1.020 |
excluding | -0.965 |
formance | -0.951 |
Conclusion | -0.916 |
Token | . |
Token ID | 13 |
Feature activation | +5.82e+00 |
Pos logit contributions | |
azines | +2.067 |
culosis | +2.065 |
excluding | +1.948 |
formance | +1.943 |
Conclusion | +1.892 |
Neg logit contributions | |
IFF | -2.059 |
usefulness | -2.048 |
Unch | -2.012 |
OR | -1.989 |
ellig | -1.942 |
Token | Such |
Token ID | 8013 |
Feature activation | +8.51e+00 |
Pos logit contributions | |
azines | +4.194 |
culosis | +4.162 |
Conclusion | +4.013 |
excluding | +3.987 |
formance | +3.855 |
Neg logit contributions | |
usefulness | -4.158 |
IFF | -4.083 |
Unch | -3.900 |
ellig | -3.856 |
OR | -3.847 |
Token | an |
Token ID | 281 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
azines | +5.955 |
culosis | +5.751 |
formance | +5.411 |
excluding | +5.408 |
Conclusion | +5.363 |
Neg logit contributions | |
IFF | -6.054 |
Unch | -5.967 |
OR | -5.830 |
usefulness | -5.814 |
ellig | -5.700 |
Token | event |
Token ID | 1785 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
IFF | +0.092 |
usefulness | +0.091 |
Unch | +0.091 |
OR | +0.090 |
lif | +0.086 |
Neg logit contributions | |
azines | -0.105 |
culosis | -0.104 |
excluding | -0.099 |
formance | -0.098 |
Conclusion | -0.094 |
Token | might |
Token ID | 1244 |
Feature activation | +5.42e-01 |
Pos logit contributions | |
azines | +1.743 |
culosis | +1.738 |
excluding | +1.652 |
formance | +1.603 |
Conclusion | +1.568 |
Neg logit contributions | |
IFF | -1.876 |
Unch | -1.861 |
usefulness | -1.859 |
OR | -1.813 |
ellig | -1.763 |
Token | set |
Token ID | 900 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
azines | +0.402 |
culosis | +0.401 |
excluding | +0.380 |
formance | +0.373 |
Conclusion | +0.362 |
Neg logit contributions | |
IFF | -0.389 |
Unch | -0.387 |
usefulness | -0.387 |
OR | -0.378 |
humans | -0.365 |
Token | the |
Token ID | 262 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
azines | +11.488 |
culosis | +10.783 |
cluding | +10.484 |
Conclusion | +10.389 |
excluding | +10.384 |
Neg logit contributions | |
IFF | -13.264 |
usefulness | -12.900 |
ellig | -12.734 |
Unch | -12.667 |
abilities | -12.481 |
Token | stage |
Token ID | 3800 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
azines | +8.708 |
culosis | +8.202 |
Conclusion | +8.007 |
excluding | +7.897 |
culminating | +7.887 |
Neg logit contributions | |
IFF | -10.108 |
Unch | -9.724 |
humans | -9.658 |
ellig | -9.650 |
OR | -9.536 |
Token | for |
Token ID | 329 |
Feature activation | +3.91e+00 |
Pos logit contributions | |
IFF | +1.833 |
Unch | +1.820 |
usefulness | +1.810 |
OR | +1.776 |
lif | +1.704 |
Neg logit contributions | |
azines | -3.258 |
culosis | -3.245 |
excluding | -3.109 |
formance | -3.061 |
Conclusion | -2.964 |
Token | a |
Token ID | 257 |
Feature activation | +4.64e+00 |
Pos logit contributions | |
azines | +2.863 |
culosis | +2.840 |
excluding | +2.676 |
formance | +2.648 |
Conclusion | +2.636 |
Neg logit contributions | |
IFF | -2.811 |
usefulness | -2.727 |
Unch | -2.724 |
OR | -2.697 |
ellig | -2.636 |
Token | tragedy |
Token ID | 13574 |
Feature activation | +2.86e+00 |
Pos logit contributions | |
azines | +3.482 |
culosis | +3.457 |
Conclusion | +3.234 |
excluding | +3.234 |
formance | +3.231 |
Neg logit contributions | |
IFF | -3.218 |
Unch | -3.134 |
usefulness | -3.133 |
OR | -3.088 |
ellig | -3.012 |
Token | and |
Token ID | 290 |
Feature activation | +2.72e+00 |
Pos logit contributions | |
IFF | +1.190 |
usefulness | +1.181 |
Unch | +1.179 |
OR | +1.161 |
lif | +1.116 |
Neg logit contributions | |
azines | -1.259 |
culosis | -1.251 |
excluding | -1.185 |
formance | -1.168 |
Conclusion | -1.125 |
Token | Spl |
Token ID | 13341 |
Feature activation | +3.84e+00 |
Pos logit contributions | |
azines | +2.086 |
culosis | +2.079 |
excluding | +2.008 |
formance | +1.962 |
Conclusion | +1.934 |
Neg logit contributions | |
IFF | -1.856 |
usefulness | -1.793 |
Unch | -1.780 |
OR | -1.766 |
ellig | -1.704 |
Token | inter |
Token ID | 3849 |
Feature activation | +5.85e+00 |
Pos logit contributions | |
azines | +3.320 |
culosis | +3.205 |
excluding | +3.178 |
formance | +3.175 |
cluding | +3.068 |
Neg logit contributions | |
Unch | -2.364 |
usefulness | -2.333 |
IFF | -2.164 |
OR | -2.107 |
lif | -2.099 |
Token | began |
Token ID | 2540 |
Feature activation | +5.76e+00 |
Pos logit contributions | |
azines | +3.894 |
culosis | +3.884 |
excluding | +3.705 |
Conclusion | +3.597 |
formance | +3.595 |
Neg logit contributions | |
IFF | -4.471 |
usefulness | -4.366 |
Unch | -4.282 |
OR | -4.210 |
humans | -4.124 |
Token | to |
Token ID | 284 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
azines | +4.107 |
culosis | +4.047 |
excluding | +3.953 |
formance | +3.860 |
cluding | +3.799 |
Neg logit contributions | |
IFF | -4.132 |
Unch | -3.950 |
usefulness | -3.932 |
OR | -3.913 |
ellig | -3.807 |
Token | set |
Token ID | 900 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
azines | +1.226 |
culosis | +1.223 |
excluding | +1.159 |
formance | +1.147 |
Conclusion | +1.125 |
Neg logit contributions | |
IFF | -1.188 |
Unch | -1.163 |
usefulness | -1.157 |
OR | -1.147 |
humans | -1.102 |
Token | his |
Token ID | 465 |
Feature activation | +9.71e+00 |
Pos logit contributions | |
azines | +11.256 |
formance | +11.013 |
excluding | +10.924 |
Conclusion | +10.904 |
culminating | +10.721 |
Neg logit contributions | |
IFF | -13.396 |
ibrary | -13.124 |
OR | -12.497 |
Unch | -12.432 |
usefulness | -12.202 |
Token | own |
Token ID | 898 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
azines | +6.139 |
culosis | +5.975 |
Conclusion | +5.844 |
excluding | +5.838 |
formance | +5.628 |
Neg logit contributions | |
IFF | -7.419 |
Unch | -7.156 |
OR | -7.069 |
ellig | -6.973 |
ibrary | -6.807 |
Token | plan |
Token ID | 1410 |
Feature activation | +3.95e+00 |
Pos logit contributions | |
azines | +7.383 |
culosis | +7.275 |
Conclusion | +7.150 |
excluding | +7.097 |
formance | +6.929 |
Neg logit contributions | |
IFF | -6.803 |
Unch | -6.498 |
OR | -6.453 |
ellig | -6.323 |
usefulness | -6.215 |
Token | for |
Token ID | 329 |
Feature activation | +2.21e+00 |
Pos logit contributions | |
azines | +2.925 |
culosis | +2.849 |
excluding | +2.797 |
formance | +2.761 |
Conclusion | +2.696 |
Neg logit contributions | |
IFF | -2.759 |
usefulness | -2.751 |
Unch | -2.695 |
OR | -2.663 |
ellig | -2.551 |
Token | vengeance |
Token ID | 30657 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
culosis | +1.672 |
azines | +1.668 |
excluding | +1.617 |
formance | +1.585 |
Conclusion | +1.550 |
Neg logit contributions | |
IFF | -1.548 |
Unch | -1.487 |
usefulness | -1.482 |
OR | -1.482 |
ellig | -1.435 |
Token | said |
Token ID | 531 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
culosis | +6.083 |
azines | +5.953 |
excluding | +5.757 |
excludes | +5.728 |
formance | +5.617 |
Neg logit contributions | |
IFF | -7.192 |
Unch | -6.866 |
usefulness | -6.853 |
OR | -6.804 |
ellig | -6.775 |
Token | : |
Token ID | 25 |
Feature activation | -6.24e+00 |
Pos logit contributions | |
azines | +3.817 |
culosis | +3.781 |
excluding | +3.661 |
formance | +3.594 |
Conclusion | +3.508 |
Neg logit contributions | |
IFF | -4.025 |
usefulness | -3.892 |
Unch | -3.890 |
OR | -3.857 |
ellig | -3.769 |
Token | " |
Token ID | 366 |
Feature activation | +5.59e+00 |
Pos logit contributions | |
Unch | +3.253 |
OR | +3.245 |
IFF | +3.240 |
usefulness | +3.193 |
humans | +3.057 |
Neg logit contributions | |
azines | -5.773 |
culosis | -5.718 |
excluding | -5.414 |
formance | -5.385 |
cluding | -5.157 |
Token | We |
Token ID | 1135 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
azines | +3.925 |
excluding | +3.875 |
culosis | +3.820 |
formance | +3.745 |
Conclusion | +3.576 |
Neg logit contributions | |
usefulness | -4.116 |
Unch | -4.063 |
IFF | -3.945 |
lif | -3.874 |
ellig | -3.848 |
Token | have |
Token ID | 423 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
culosis | +6.939 |
azines | +6.627 |
disregard | +6.613 |
excluding | +6.511 |
formance | +6.329 |
Neg logit contributions | |
IFF | -8.579 |
usefulness | -8.494 |
Unch | -8.404 |
ibrary | -8.362 |
humans | -8.299 |
Token | made |
Token ID | 925 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
excluding | +8.871 |
azines | +8.817 |
excluding | +8.752 |
culminating | +8.674 |
culosis | +8.521 |
Neg logit contributions | |
IFF | -10.777 |
Unch | -10.547 |
blance | -10.493 |
ellig | -10.401 |
ibrary | -10.310 |
Token | it |
Token ID | 340 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
excluding | +11.296 |
cluding | +11.044 |
culminating | +11.041 |
cessation | +11.039 |
formance | +10.932 |
Neg logit contributions | |
blance | -12.717 |
ivas | -12.551 |
humans | -12.428 |
IFF | -12.407 |
OR | -12.333 |
Token | clear |
Token ID | 1598 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
culosis | +8.525 |
excluding | +7.905 |
excluding | +7.892 |
culminating | +7.782 |
formance | +7.581 |
Neg logit contributions | |
blance | -13.702 |
Unch | -13.625 |
usefulness | -13.483 |
humans | -13.400 |
OR | -13.374 |
Token | that |
Token ID | 326 |
Feature activation | +7.90e+00 |
Pos logit contributions | |
azines | +6.733 |
culosis | +6.567 |
excluding | +6.451 |
formance | +6.444 |
excluding | +6.166 |
Neg logit contributions | |
IFF | -8.028 |
usefulness | -7.904 |
Unch | -7.894 |
OR | -7.773 |
humans | -7.725 |
Token | Rolls |
Token ID | 40074 |
Feature activation | +7.95e+00 |
Pos logit contributions | |
azines | +5.145 |
culosis | +5.090 |
excluding | +5.047 |
formance | +4.930 |
excluding | +4.844 |
Neg logit contributions | |
IFF | -5.886 |
usefulness | -5.660 |
OR | -5.604 |
Unch | -5.593 |
humans | -5.574 |
Token | - |
Token ID | 12 |
Feature activation | +9.13e+00 |
Pos logit contributions | |
azines | +5.744 |
culosis | +5.665 |
formance | +5.407 |
excluding | +5.364 |
Conclusion | +5.133 |
Neg logit contributions | |
IFF | -5.698 |
Unch | -5.620 |
usefulness | -5.562 |
OR | -5.447 |
humans | -5.367 |
Token | this |
Token ID | 428 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
azines | +8.602 |
excluding | +8.037 |
culosis | +7.974 |
excluding | +7.844 |
formance | +7.715 |
Neg logit contributions | |
IFF | -9.691 |
ellig | -9.211 |
usefulness | -9.179 |
Unch | -9.174 |
OR | -9.079 |
Token | from |
Token ID | 422 |
Feature activation | +8.14e+00 |
Pos logit contributions | |
azines | +7.847 |
culosis | +7.489 |
excluding | +7.443 |
excluding | +7.401 |
excludes | +7.382 |
Neg logit contributions | |
IFF | -9.442 |
humans | -9.164 |
Unch | -9.106 |
OR | -8.988 |
ivas | -8.962 |
Token | a |
Token ID | 257 |
Feature activation | +7.20e+00 |
Pos logit contributions | |
azines | +5.319 |
culosis | +5.182 |
excluding | +4.956 |
Conclusion | +4.910 |
formance | +4.904 |
Neg logit contributions | |
IFF | -6.288 |
usefulness | -5.990 |
Unch | -5.953 |
ellig | -5.872 |
OR | -5.866 |
Token | store |
Token ID | 3650 |
Feature activation | +6.52e+00 |
Pos logit contributions | |
azines | +4.552 |
culosis | +4.439 |
excluding | +4.213 |
formance | +4.205 |
Conclusion | +4.144 |
Neg logit contributions | |
IFF | -5.623 |
Unch | -5.520 |
usefulness | -5.454 |
OR | -5.379 |
ellig | -5.374 |
Token | , |
Token ID | 11 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
azines | +4.545 |
culosis | +4.479 |
excluding | +4.298 |
formance | +4.224 |
Conclusion | +4.092 |
Neg logit contributions | |
IFF | -4.772 |
Unch | -4.758 |
usefulness | -4.657 |
OR | -4.511 |
humans | -4.466 |
Token | make |
Token ID | 787 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
azines | +9.097 |
culosis | +8.661 |
excluding | +8.585 |
excluding | +8.447 |
disregard | +8.404 |
Neg logit contributions | |
IFF | -10.004 |
Unch | -9.672 |
usefulness | -9.515 |
ellig | -9.431 |
humans | -9.176 |
Token | sure |
Token ID | 1654 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
azines | +7.699 |
excluding | +7.388 |
excluding | +7.314 |
culosis | +7.259 |
cluding | +7.222 |
Neg logit contributions | |
IFF | -16.373 |
Unch | -16.197 |
usefulness | -16.189 |
ellig | -16.149 |
humans | -15.901 |
Token | to |
Token ID | 284 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
azines | +10.527 |
excluding | +10.159 |
culosis | +10.142 |
excluding | +9.970 |
formance | +9.635 |
Neg logit contributions | |
IFF | -12.961 |
Unch | -12.783 |
usefulness | -12.642 |
blance | -12.305 |
humans | -12.230 |
Token | check |
Token ID | 2198 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
disregard | +10.526 |
azines | +10.119 |
excluding | +9.906 |
excludes | +9.738 |
excluding | +9.658 |
Neg logit contributions | |
usefulness | -12.973 |
IFF | -12.858 |
humans | -12.828 |
Unch | -12.554 |
ibrary | -12.333 |
Token | the |
Token ID | 262 |
Feature activation | +6.86e+00 |
Pos logit contributions | |
azines | +7.726 |
culosis | +7.344 |
excluding | +7.251 |
excluding | +7.106 |
formance | +7.070 |
Neg logit contributions | |
IFF | -9.257 |
Unch | -9.026 |
humans | -8.782 |
ellig | -8.723 |
usefulness | -8.704 |
Token | ingredients |
Token ID | 9391 |
Feature activation | +3.95e+00 |
Pos logit contributions | |
azines | +3.790 |
culosis | +3.562 |
excluding | +3.455 |
formance | +3.396 |
Conclusion | +3.325 |
Neg logit contributions | |
IFF | -6.093 |
Unch | -5.996 |
humans | -5.835 |
OR | -5.824 |
ellig | -5.790 |
Token | in |
Token ID | 287 |
Feature activation | +5.95e+00 |
Pos logit contributions | |
azines | +1.744 |
culosis | +1.689 |
excluding | +1.686 |
excluding | +1.609 |
formance | +1.607 |
Neg logit contributions | |
IFF | -1.951 |
Unch | -1.930 |
OR | -1.904 |
usefulness | -1.903 |
ellig | -1.879 |
Token | March |
Token ID | 2805 |
Feature activation | -3.86e+00 |
Pos logit contributions | |
azines | +3.598 |
excluding | +3.503 |
cluding | +3.457 |
Conclusion | +3.443 |
culosis | +3.412 |
Neg logit contributions | |
IFF | -4.768 |
Unch | -4.670 |
ellig | -4.662 |
OR | -4.637 |
orm | -4.494 |
Token | 2016 |
Token ID | 1584 |
Feature activation | +8.54e-01 |
Pos logit contributions | |
IFF | +2.671 |
usefulness | +2.655 |
Unch | +2.651 |
OR | +2.612 |
lif | +2.513 |
Neg logit contributions | |
azines | -2.992 |
culosis | -2.977 |
excluding | -2.810 |
formance | -2.775 |
Conclusion | -2.671 |
Token | , |
Token ID | 11 |
Feature activation | +5.88e-02 |
Pos logit contributions | |
azines | +0.655 |
culosis | +0.650 |
excluding | +0.619 |
formance | +0.609 |
cluding | +0.589 |
Neg logit contributions | |
IFF | -0.598 |
usefulness | -0.593 |
Unch | -0.590 |
OR | -0.582 |
ellig | -0.558 |
Token | it |
Token ID | 340 |
Feature activation | +2.80e+00 |
Pos logit contributions | |
azines | +0.048 |
culosis | +0.047 |
excluding | +0.045 |
formance | +0.045 |
Conclusion | +0.043 |
Neg logit contributions | |
IFF | -0.039 |
Unch | -0.038 |
usefulness | -0.038 |
OR | -0.038 |
ellig | -0.036 |
Token | set |
Token ID | 900 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
azines | +1.792 |
culosis | +1.782 |
excluding | +1.703 |
formance | +1.647 |
cluding | +1.614 |
Neg logit contributions | |
IFF | -2.266 |
Unch | -2.225 |
usefulness | -2.214 |
OR | -2.200 |
humans | -2.129 |
Token | Os |
Token ID | 8834 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
azines | +10.550 |
excluding | +10.527 |
formance | +10.236 |
culminating | +10.217 |
cluding | +10.118 |
Neg logit contributions | |
IFF | -13.952 |
ellig | -13.373 |
Unch | -13.275 |
ibrary | -13.267 |
humans | -12.992 |
Token | we |
Token ID | 732 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
IFF | +1.972 |
usefulness | +1.958 |
Unch | +1.932 |
OR | +1.918 |
ellig | +1.800 |
Neg logit contributions | |
azines | -4.411 |
culosis | -4.389 |
excluding | -4.201 |
formance | -4.152 |
Conclusion | -4.056 |
Token | iler |
Token ID | 5329 |
Feature activation | +5.72e+00 |
Pos logit contributions | |
azines | +1.030 |
culosis | +1.030 |
formance | +0.974 |
excluding | +0.950 |
cluding | +0.901 |
Neg logit contributions | |
Unch | -1.595 |
usefulness | -1.577 |
IFF | -1.566 |
OR | -1.546 |
lif | -1.493 |
Token | up |
Token ID | 510 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
azines | +3.870 |
culosis | +3.790 |
excluding | +3.580 |
formance | +3.572 |
cluding | +3.449 |
Neg logit contributions | |
IFF | -4.355 |
usefulness | -4.291 |
Unch | -4.257 |
OR | -4.192 |
ellig | -4.128 |
Token | as |
Token ID | 355 |
Feature activation | +3.28e+00 |
Pos logit contributions | |
IFF | +1.189 |
Unch | +1.184 |
usefulness | +1.181 |
OR | +1.160 |
lif | +1.110 |
Neg logit contributions | |
azines | -1.856 |
culosis | -1.847 |
excluding | -1.758 |
formance | -1.735 |
Conclusion | -1.685 |
Token | the |
Token ID | 262 |
Feature activation | +9.46e-01 |
Pos logit contributions | |
azines | +2.140 |
culosis | +2.112 |
excluding | +2.021 |
formance | +1.980 |
cluding | +1.913 |
Neg logit contributions | |
IFF | -1.916 |
Unch | -1.863 |
usefulness | -1.862 |
OR | -1.842 |
ellig | -1.800 |
Token | firms |
Token ID | 9611 |
Feature activation | +3.99e-01 |
Pos logit contributions | |
azines | +0.677 |
culosis | +0.673 |
excluding | +0.639 |
formance | +0.629 |
cluding | +0.603 |
Neg logit contributions | |
IFF | -0.710 |
Unch | -0.695 |
usefulness | -0.689 |
OR | -0.688 |
ellig | -0.673 |
Token | coll |
Token ID | 2927 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
azines | +0.288 |
culosis | +0.287 |
excluding | +0.272 |
formance | +0.266 |
Conclusion | +0.257 |
Neg logit contributions | |
IFF | -0.297 |
usefulness | -0.293 |
Unch | -0.293 |
OR | -0.289 |
humans | -0.279 |
Token | uded |
Token ID | 19289 |
Feature activation | -4.22e+00 |
Pos logit contributions | |
IFF | +1.320 |
usefulness | +1.313 |
Unch | +1.311 |
OR | +1.289 |
lif | +1.233 |
Neg logit contributions | |
azines | -1.589 |
culosis | -1.581 |
excluding | -1.506 |
formance | -1.480 |
cluding | -1.427 |
Token | to |
Token ID | 284 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
IFF | +2.680 |
usefulness | +2.666 |
Unch | +2.661 |
OR | +2.615 |
lif | +2.528 |
Neg logit contributions | |
azines | -3.517 |
culosis | -3.493 |
excluding | -3.307 |
formance | -3.289 |
Conclusion | -3.163 |
Token | set |
Token ID | 900 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
azines | +0.859 |
culosis | +0.857 |
excluding | +0.801 |
formance | +0.785 |
Conclusion | +0.764 |
Neg logit contributions | |
IFF | -0.896 |
Unch | -0.887 |
usefulness | -0.885 |
OR | -0.874 |
humans | -0.846 |
Token | each |
Token ID | 1123 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
azines | +10.828 |
excluding | +10.379 |
formance | +10.347 |
culosis | +10.253 |
excluding | +10.165 |
Neg logit contributions | |
IFF | -13.682 |
ellig | -13.485 |
Unch | -13.153 |
OR | -13.153 |
ibrary | -13.099 |
Token | others |
Token ID | 1854 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
azines | +6.477 |
culosis | +6.239 |
excluding | +6.014 |
formance | +6.007 |
cluding | +5.682 |
Neg logit contributions | |
IFF | -8.614 |
Unch | -8.531 |
usefulness | -8.415 |
OR | -8.319 |
humans | -8.243 |
Token | ' |
Token ID | 6 |
Feature activation | +9.21e+00 |
Pos logit contributions | |
azines | +8.057 |
culosis | +7.693 |
formance | +7.462 |
excluding | +7.424 |
excluding | +7.120 |
Neg logit contributions | |
IFF | -9.113 |
Unch | -8.889 |
humans | -8.823 |
ellig | -8.796 |
usefulness | -8.675 |
Token | market |
Token ID | 1910 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
azines | +6.063 |
culosis | +5.958 |
excluding | +5.762 |
formance | +5.702 |
excluding | +5.504 |
Neg logit contributions | |
IFF | -6.921 |
Unch | -6.795 |
ellig | -6.679 |
OR | -6.628 |
humans | -6.552 |
Token | shares |
Token ID | 7303 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
IFF | +1.104 |
Unch | +1.096 |
usefulness | +1.092 |
OR | +1.080 |
ellig | +1.041 |
Neg logit contributions | |
azines | -0.896 |
culosis | -0.889 |
excluding | -0.836 |
formance | -0.823 |
Conclusion | -0.786 |
Token | That |
Token ID | 2504 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
usefulness | +0.063 |
Unch | +0.063 |
IFF | +0.063 |
OR | +0.061 |
lif | +0.060 |
Neg logit contributions | |
azines | -0.063 |
culosis | -0.063 |
excluding | -0.060 |
formance | -0.059 |
cluding | -0.056 |
Token | made |
Token ID | 925 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
culosis | +2.423 |
azines | +2.421 |
excluding | +2.335 |
formance | +2.226 |
cluding | +2.212 |
Neg logit contributions | |
IFF | -2.457 |
Unch | -2.435 |
OR | -2.391 |
usefulness | -2.388 |
ellig | -2.346 |
Token | the |
Token ID | 262 |
Feature activation | -4.21e+00 |
Pos logit contributions | |
azines | +1.040 |
culosis | +1.030 |
excluding | +0.987 |
formance | +0.962 |
cluding | +0.937 |
Neg logit contributions | |
IFF | -1.030 |
Unch | -1.019 |
usefulness | -1.017 |
OR | -1.006 |
ellig | -0.968 |
Token | task |
Token ID | 4876 |
Feature activation | -8.96e+00 |
Pos logit contributions | |
usefulness | +3.215 |
IFF | +3.202 |
Unch | +3.200 |
OR | +3.148 |
lif | +3.055 |
Neg logit contributions | |
azines | -2.966 |
culosis | -2.949 |
excluding | -2.751 |
formance | -2.748 |
cluding | -2.585 |
Token | of |
Token ID | 286 |
Feature activation | +7.19e+00 |
Pos logit contributions | |
IFF | +5.331 |
Unch | +5.271 |
usefulness | +5.256 |
OR | +5.236 |
lif | +5.144 |
Neg logit contributions | |
azines | -7.643 |
culosis | -7.423 |
formance | -7.033 |
excluding | -7.006 |
cluding | -6.794 |
Token | setting |
Token ID | 4634 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
culosis | +4.807 |
azines | +4.735 |
excluding | +4.676 |
excluding | +4.563 |
Conclusion | +4.498 |
Neg logit contributions | |
IFF | -5.272 |
Unch | -5.148 |
OR | -5.130 |
humans | -5.082 |
usefulness | -5.039 |
Token | appropriate |
Token ID | 5035 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
excluding | +11.390 |
cluding | +11.233 |
azines | +11.145 |
excluding | +11.100 |
culminating | +10.959 |
Neg logit contributions | |
blance | -12.416 |
humans | -12.212 |
ellig | -12.206 |
Unch | -12.133 |
OR | -12.127 |
Token | levels |
Token ID | 2974 |
Feature activation | +2.15e+00 |
Pos logit contributions | |
azines | +8.003 |
excluding | +7.865 |
culosis | +7.794 |
Conclusion | +7.686 |
excluding | +7.660 |
Neg logit contributions | |
blance | -10.606 |
humans | -10.511 |
Unch | -10.488 |
ellig | -10.367 |
IFF | -10.292 |
Token | of |
Token ID | 286 |
Feature activation | +4.88e+00 |
Pos logit contributions | |
azines | +1.637 |
culosis | +1.624 |
excluding | +1.552 |
formance | +1.522 |
Conclusion | +1.479 |
Neg logit contributions | |
usefulness | -1.486 |
IFF | -1.485 |
Unch | -1.478 |
OR | -1.457 |
humans | -1.403 |
Token | tax |
Token ID | 1687 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
azines | +3.080 |
culosis | +3.065 |
excluding | +2.964 |
formance | +2.865 |
cluding | +2.803 |
Neg logit contributions | |
IFF | -3.856 |
Unch | -3.842 |
OR | -3.808 |
usefulness | -3.740 |
humans | -3.738 |
Token | cuts |
Token ID | 6630 |
Feature activation | -4.51e+00 |
Pos logit contributions | |
culosis | +2.263 |
azines | +2.239 |
excluding | +2.175 |
formance | +2.146 |
Conclusion | +2.053 |
Neg logit contributions | |
IFF | -2.531 |
Unch | -2.497 |
usefulness | -2.493 |
OR | -2.447 |
ellig | -2.400 |
Token | conservative |
Token ID | 5940 |
Feature activation | +6.44e-01 |
Pos logit contributions | |
IFF | +1.394 |
usefulness | +1.384 |
Unch | +1.382 |
OR | +1.361 |
lif | +1.306 |
Neg logit contributions | |
azines | -1.588 |
culosis | -1.578 |
excluding | -1.496 |
formance | -1.477 |
Conclusion | -1.423 |
Token | group |
Token ID | 1448 |
Feature activation | -2.33e-01 |
Pos logit contributions | |
azines | +0.490 |
culosis | +0.483 |
excluding | +0.460 |
formance | +0.454 |
Conclusion | +0.442 |
Neg logit contributions | |
IFF | -0.454 |
Unch | -0.449 |
usefulness | -0.448 |
OR | -0.442 |
humans | -0.427 |
Token | in |
Token ID | 287 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
IFF | +0.165 |
usefulness | +0.164 |
Unch | +0.163 |
OR | +0.161 |
ellig | +0.155 |
Neg logit contributions | |
azines | -0.176 |
culosis | -0.175 |
excluding | -0.166 |
formance | -0.163 |
Conclusion | -0.157 |
Token | Madrid |
Token ID | 14708 |
Feature activation | +4.38e-01 |
Pos logit contributions | |
IFF | +1.863 |
usefulness | +1.857 |
Unch | +1.854 |
OR | +1.827 |
lif | +1.764 |
Neg logit contributions | |
azines | -1.732 |
culosis | -1.730 |
excluding | -1.623 |
formance | -1.598 |
Conclusion | -1.530 |
Token | has |
Token ID | 468 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
azines | +0.327 |
culosis | +0.325 |
excluding | +0.309 |
formance | +0.302 |
Conclusion | +0.291 |
Neg logit contributions | |
IFF | -0.315 |
usefulness | -0.313 |
Unch | -0.311 |
OR | -0.307 |
ellig | -0.295 |
Token | set |
Token ID | 900 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
azines | +0.823 |
culosis | +0.810 |
excluding | +0.778 |
formance | +0.759 |
cluding | +0.733 |
Neg logit contributions | |
IFF | -0.750 |
usefulness | -0.735 |
Unch | -0.734 |
OR | -0.725 |
ellig | -0.699 |
Token | up |
Token ID | 510 |
Feature activation | +3.11e+00 |
Pos logit contributions | |
azines | +10.216 |
excluding | +9.293 |
excluding | +9.263 |
culosis | +9.150 |
formance | +8.997 |
Neg logit contributions | |
IFF | -14.692 |
Unch | -14.434 |
usefulness | -14.363 |
OR | -14.361 |
ibrary | -14.257 |
Token | a |
Token ID | 257 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
azines | +2.178 |
culosis | +2.124 |
excluding | +2.007 |
formance | +1.972 |
cluding | +1.902 |
Neg logit contributions | |
IFF | -2.347 |
usefulness | -2.325 |
Unch | -2.306 |
OR | -2.276 |
humans | -2.218 |
Token | large |
Token ID | 1588 |
Feature activation | +6.22e-01 |
Pos logit contributions | |
azines | +0.119 |
culosis | +0.119 |
excluding | +0.112 |
formance | +0.111 |
Conclusion | +0.107 |
Neg logit contributions | |
IFF | -0.108 |
usefulness | -0.107 |
Unch | -0.107 |
OR | -0.105 |
humans | -0.101 |
Token | , |
Token ID | 11 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
azines | +0.490 |
culosis | +0.486 |
excluding | +0.460 |
formance | +0.454 |
cluding | +0.438 |
Neg logit contributions | |
IFF | -0.423 |
Unch | -0.419 |
usefulness | -0.417 |
OR | -0.411 |
humans | -0.397 |
Token | mock |
Token ID | 15290 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
IFF | +0.875 |
usefulness | +0.867 |
Unch | +0.866 |
OR | +0.853 |
lif | +0.815 |
Neg logit contributions | |
azines | -1.041 |
culosis | -1.034 |
excluding | -0.982 |
formance | -0.970 |
Conclusion | -0.935 |
Token | wrote |
Token ID | 2630 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
IFF | +3.611 |
OR | +3.585 |
Unch | +3.519 |
usefulness | +3.413 |
lif | +3.385 |
Neg logit contributions | |
azines | -6.285 |
culosis | -6.230 |
excluding | -5.928 |
formance | -5.920 |
cluding | -5.715 |
Token | : |
Token ID | 25 |
Feature activation | -8.98e+00 |
Pos logit contributions | |
OR | +4.378 |
IFF | +4.366 |
Unch | +4.157 |
humans | +3.936 |
lif | +3.905 |
Neg logit contributions | |
culosis | -12.293 |
azines | -12.205 |
formance | -11.592 |
excluding | -11.398 |
ォ | -11.054 |
Token |
|
Token ID | 198 |
Feature activation | -9.30e+00 |
Pos logit contributions | |
IFF | +4.718 |
OR | +4.714 |
Unch | +4.575 |
usefulness | +4.487 |
lif | +4.350 |
Neg logit contributions | |
culosis | -8.315 |
azines | -8.237 |
formance | -7.711 |
excluding | -7.647 |
cluding | -7.358 |
Token |
|
Token ID | 198 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
OR | +4.708 |
IFF | +4.694 |
Unch | +4.498 |
usefulness | +4.395 |
humans | +4.289 |
Neg logit contributions | |
culosis | -8.905 |
azines | -8.703 |
formance | -8.073 |
excluding | -8.039 |
ォ | -7.810 |
Token | Happy |
Token ID | 25082 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
OR | +6.774 |
IFF | +6.754 |
humans | +6.373 |
usefulness | +6.328 |
Unch | +6.065 |
Neg logit contributions | |
culosis | -9.282 |
azines | -9.067 |
excluding | -8.279 |
Franch | -8.257 |
ォ | -8.224 |
Token | it |
Token ID | 340 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
lif | +6.673 |
usefulness | +6.402 |
Unch | +6.373 |
IFF | +6.345 |
OR | +6.187 |
Neg logit contributions | |
culosis | -13.409 |
azines | -13.282 |
excluding | -12.488 |
formance | -12.443 |
ォ | -12.254 |
Token | worked |
Token ID | 3111 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
usefulness | +6.272 |
Unch | +6.134 |
lif | +6.120 |
orm | +6.110 |
powerful | +5.685 |
Neg logit contributions | |
azines | -24.594 |
culosis | -24.085 |
ォ | -23.807 |
excluding | -23.392 |
formance | -22.869 |
Token | out |
Token ID | 503 |
Feature activation | -3.02e+00 |
Pos logit contributions | |
usefulness | +7.528 |
Unch | +7.436 |
OR | +7.357 |
IFF | +7.276 |
lif | +7.195 |
Neg logit contributions | |
azines | -8.590 |
culosis | -8.587 |
formance | -7.890 |
excluding | -7.858 |
ォ | -7.751 |
Token | . |
Token ID | 13 |
Feature activation | +3.84e+00 |
Pos logit contributions | |
IFF | +2.090 |
Unch | +2.070 |
usefulness | +2.070 |
OR | +2.047 |
lif | +1.966 |
Neg logit contributions | |
azines | -2.351 |
culosis | -2.344 |
excluding | -2.208 |
formance | -2.183 |
Conclusion | -2.096 |
Token |
|
Token ID | 198 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
azines | +2.882 |
culosis | +2.867 |
excluding | +2.713 |
formance | +2.672 |
Conclusion | +2.596 |
Neg logit contributions | |
IFF | -2.731 |
usefulness | -2.709 |
Unch | -2.683 |
OR | -2.637 |
ellig | -2.541 |
Token |
|
Token ID | 198 |
Feature activation | -6.34e-01 |
Pos logit contributions | |
IFF | +1.716 |
Unch | +1.695 |
usefulness | +1.695 |
OR | +1.676 |
lif | +1.597 |
Neg logit contributions | |
azines | -2.321 |
culosis | -2.315 |
excluding | -2.187 |
formance | -2.168 |
Conclusion | -2.088 |
Token | basically |
Token ID | 6209 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
IFF | +1.953 |
usefulness | +1.940 |
Unch | +1.939 |
OR | +1.912 |
lif | +1.843 |
Neg logit contributions | |
azines | -1.905 |
culosis | -1.893 |
excluding | -1.780 |
formance | -1.760 |
Conclusion | -1.689 |
Token | continuing |
Token ID | 8282 |
Feature activation | -1.47e+01 |
Pos logit contributions | |
azines | +0.696 |
culosis | +0.686 |
excluding | +0.659 |
formance | +0.643 |
cluding | +0.618 |
Neg logit contributions | |
IFF | -0.974 |
usefulness | -0.956 |
Unch | -0.952 |
OR | -0.942 |
ellig | -0.914 |
Token | to |
Token ID | 284 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
OR | +6.224 |
Unch | +6.161 |
lif | +6.090 |
IFF | +6.086 |
usefulness | +6.068 |
Neg logit contributions | |
culosis | -14.004 |
azines | -13.896 |
formance | -12.912 |
excluding | -12.685 |
ォ | -12.520 |
Token | be |
Token ID | 307 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
OR | +7.093 |
usefulness | +7.047 |
lif | +6.960 |
Unch | +6.882 |
IFF | +6.833 |
Neg logit contributions | |
culosis | -15.643 |
azines | -15.464 |
excluding | -14.748 |
formance | -14.600 |
cluding | -14.434 |
Token | equally |
Token ID | 8603 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
Unch | +5.472 |
OR | +5.096 |
usefulness | +5.057 |
IFF | +4.814 |
ellig | +4.808 |
Neg logit contributions | |
azines | -11.983 |
culosis | -11.968 |
formance | -11.163 |
excluding | -11.102 |
Conclusion | -10.882 |
Token | as |
Token ID | 355 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
lif | +8.465 |
usefulness | +8.323 |
powerful | +8.151 |
Unch | +8.020 |
standoff | +7.914 |
Neg logit contributions | |
culosis | -20.013 |
azines | -19.105 |
excluding | -18.167 |
formance | -18.015 |
Conclusion | -17.801 |
Token | tight |
Token ID | 5381 |
Feature activation | -3.49e+00 |
Pos logit contributions | |
standoff | +7.167 |
lif | +6.992 |
IFF | +6.558 |
powerful | +6.537 |
usefulness | +6.299 |
Neg logit contributions | |
culosis | -23.904 |
azines | -23.081 |
excluding | -22.108 |
formance | -21.856 |
BuyableInstoreAndOnline | -21.392 |
Token | - |
Token ID | 12 |
Feature activation | -6.77e+00 |
Pos logit contributions | |
IFF | +2.222 |
usefulness | +2.193 |
Unch | +2.186 |
OR | +2.157 |
lif | +2.103 |
Neg logit contributions | |
culosis | -2.893 |
azines | -2.893 |
excluding | -2.735 |
formance | -2.716 |
Conclusion | -2.614 |
Token | f |
Token ID | 69 |
Feature activation | -8.57e+00 |
Pos logit contributions | |
IFF | +4.328 |
OR | +4.189 |
usefulness | +4.158 |
Unch | +4.114 |
humans | +4.068 |
Neg logit contributions | |
culosis | -5.542 |
azines | -5.525 |
formance | -5.146 |
excluding | -5.129 |
Conclusion | -4.991 |
Token | isted |
Token ID | 6347 |
Feature activation | -8.81e+00 |
Pos logit contributions | |
IFF | +4.905 |
usefulness | +4.710 |
Unch | +4.697 |
OR | +4.683 |
ellig | +4.667 |
Neg logit contributions | |
azines | -7.467 |
culosis | -7.459 |
excluding | -7.073 |
formance | -7.045 |
Conclusion | -6.869 |
Token | as |
Token ID | 355 |
Feature activation | -1.52e+01 |
Pos logit contributions | |
Unch | +4.404 |
IFF | +4.361 |
OR | +4.341 |
usefulness | +4.243 |
lif | +4.192 |
Neg logit contributions | |
culosis | -8.157 |
azines | -8.065 |
excluding | -7.730 |
formance | -7.689 |
cluding | -7.420 |
Token | was |
Token ID | 373 |
Feature activation | +5.19e+00 |
Pos logit contributions | |
azines | +2.456 |
culosis | +2.438 |
excluding | +2.296 |
formance | +2.234 |
Conclusion | +2.211 |
Neg logit contributions | |
IFF | -2.704 |
Unch | -2.662 |
usefulness | -2.655 |
OR | -2.628 |
ellig | -2.541 |
Token | made |
Token ID | 925 |
Feature activation | +5.30e+00 |
Pos logit contributions | |
culosis | +3.598 |
azines | +3.588 |
excluding | +3.437 |
formance | +3.291 |
excluding | +3.269 |
Neg logit contributions | |
IFF | -3.826 |
Unch | -3.756 |
usefulness | -3.732 |
OR | -3.684 |
ellig | -3.656 |
Token | in |
Token ID | 287 |
Feature activation | +6.38e+00 |
Pos logit contributions | |
azines | +3.689 |
culosis | +3.669 |
excluding | +3.486 |
Conclusion | +3.366 |
formance | +3.344 |
Neg logit contributions | |
IFF | -3.882 |
usefulness | -3.872 |
OR | -3.800 |
Unch | -3.766 |
ellig | -3.706 |
Token | . |
Token ID | 13 |
Feature activation | +2.64e+00 |
Pos logit contributions | |
azines | +4.426 |
culosis | +4.365 |
excluding | +4.168 |
formance | +4.129 |
cluding | +4.043 |
Neg logit contributions | |
IFF | -4.741 |
Unch | -4.556 |
usefulness | -4.534 |
OR | -4.455 |
ellig | -4.435 |
Token | - |
Token ID | 532 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
azines | +2.068 |
culosis | +2.056 |
excluding | +1.944 |
formance | +1.913 |
Conclusion | +1.894 |
Neg logit contributions | |
IFF | -1.792 |
usefulness | -1.767 |
Unch | -1.749 |
OR | -1.724 |
ellig | -1.679 |
Token | December |
Token ID | 3426 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
azines | +0.943 |
culosis | +0.934 |
excluding | +0.870 |
Conclusion | +0.849 |
formance | +0.839 |
Neg logit contributions | |
IFF | -1.727 |
usefulness | -1.717 |
Unch | -1.711 |
OR | -1.674 |
lif | -1.652 |
Token | 13 |
Token ID | 1511 |
Feature activation | -6.80e+00 |
Pos logit contributions | |
OR | +2.770 |
Unch | +2.604 |
IFF | +2.039 |
ellig | +1.678 |
usefulness | +1.624 |
Neg logit contributions | |
culosis | -27.938 |
azines | -26.899 |
formance | -25.630 |
BuyableInstoreAndOnline | -25.566 |
ォ | -25.522 |
Token | , |
Token ID | 11 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
IFF | +4.106 |
OR | +4.039 |
Unch | +3.910 |
usefulness | +3.887 |
humans | +3.782 |
Neg logit contributions | |
culosis | -5.926 |
azines | -5.845 |
formance | -5.452 |
excluding | -5.389 |
Conclusion | -5.251 |
Token | 2010 |
Token ID | 3050 |
Feature activation | -6.11e+00 |
Pos logit contributions | |
azines | +1.202 |
culosis | +1.183 |
excluding | +1.127 |
formance | +1.112 |
Conclusion | +1.073 |
Neg logit contributions | |
IFF | -1.602 |
Unch | -1.595 |
usefulness | -1.589 |
OR | -1.567 |
ellig | -1.524 |
Token | boys |
Token ID | 13202 |
Feature activation | +2.75e+00 |
Pos logit contributions | |
IFF | +4.758 |
OR | +4.736 |
usefulness | +4.636 |
humans | +4.617 |
Unch | +4.543 |
Neg logit contributions | |
culosis | -4.094 |
azines | -4.074 |
formance | -3.828 |
excluding | -3.745 |
Conclusion | -3.732 |
Token | beware |
Token ID | 40600 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
azines | +0.682 |
culosis | +0.668 |
excluding | +0.588 |
formance | +0.557 |
Conclusion | +0.483 |
Neg logit contributions | |
IFF | -3.322 |
Unch | -3.290 |
usefulness | -3.274 |
OR | -3.240 |
humans | -3.200 |
Token | know |
Token ID | 760 |
Feature activation | +9.35e+00 |
Pos logit contributions | |
azines | +3.814 |
culosis | +3.651 |
excluding | +3.548 |
Conclusion | +3.461 |
excluding | +3.459 |
Neg logit contributions | |
IFF | -5.472 |
Unch | -5.402 |
OR | -5.395 |
usefulness | -5.386 |
humans | -5.276 |
Token | exactly |
Token ID | 3446 |
Feature activation | +5.91e+00 |
Pos logit contributions | |
azines | +6.515 |
excluding | +6.209 |
culosis | +6.168 |
excluding | +6.146 |
Conclusion | +6.071 |
Neg logit contributions | |
IFF | -6.234 |
Unch | -6.085 |
OR | -6.062 |
ellig | -6.047 |
usefulness | -6.011 |
Token | how |
Token ID | 703 |
Feature activation | -4.08e+00 |
Pos logit contributions | |
azines | +4.662 |
culosis | +4.462 |
excluding | +4.405 |
excluding | +4.324 |
Conclusion | +4.293 |
Neg logit contributions | |
IFF | -3.745 |
ellig | -3.619 |
Unch | -3.617 |
OR | -3.593 |
usefulness | -3.552 |
Token | long |
Token ID | 890 |
Feature activation | -7.78e+00 |
Pos logit contributions | |
IFF | +2.349 |
usefulness | +2.343 |
Unch | +2.333 |
OR | +2.289 |
lif | +2.203 |
Neg logit contributions | |
azines | -3.646 |
culosis | -3.642 |
excluding | -3.460 |
formance | -3.432 |
Conclusion | -3.300 |
Token | he |
Token ID | 339 |
Feature activation | -2.04e+01 |
Pos logit contributions | |
usefulness | +5.036 |
OR | +4.986 |
Unch | +4.981 |
IFF | +4.916 |
lif | +4.805 |
Neg logit contributions | |
culosis | -6.289 |
azines | -6.173 |
formance | -5.831 |
excluding | -5.765 |
Conclusion | -5.540 |
Token | 'll |
Token ID | 1183 |
Feature activation | -2.29e+01 |
Pos logit contributions | |
lif | +8.467 |
usefulness | +8.001 |
OR | +7.933 |
IFF | +7.724 |
orm | +7.563 |
Neg logit contributions | |
culosis | -17.860 |
azines | -17.571 |
formance | -17.275 |
excluding | -16.981 |
Conclusion | -16.510 |
Token | be |
Token ID | 307 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
lif | +10.996 |
OR | +10.475 |
orm | +10.408 |
usefulness | +10.383 |
IFF | +10.355 |
Neg logit contributions | |
culosis | -17.697 |
azines | -17.372 |
excluding | -16.655 |
formance | -16.573 |
黒 | -16.490 |
Token | out |
Token ID | 503 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
usefulness | +10.137 |
OR | +9.980 |
Unch | +9.818 |
lif | +9.752 |
standoff | +9.425 |
Neg logit contributions | |
culosis | -12.928 |
azines | -12.868 |
formance | -11.680 |
黒 | -11.253 |
excluding | -11.151 |
Token | . |
Token ID | 13 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
OR | +7.492 |
Unch | +7.483 |
usefulness | +7.409 |
lif | +7.313 |
IFF | +7.255 |
Neg logit contributions | |
culosis | -11.797 |
azines | -11.383 |
formance | -10.595 |
excluding | -10.356 |
ォ | -10.024 |
Token |
|
Token ID | 198 |
Feature activation | +4.64e+00 |
Pos logit contributions | |
azines | +0.417 |
culosis | +0.414 |
excluding | +0.395 |
formance | +0.388 |
Conclusion | +0.379 |
Neg logit contributions | |
IFF | -0.367 |
usefulness | -0.366 |
Unch | -0.360 |
OR | -0.355 |
lif | -0.344 |
Token |
|
Token ID | 198 |
Feature activation | +3.92e+00 |
Pos logit contributions | |
azines | +3.113 |
excluding | +3.066 |
culosis | +2.927 |
formance | +2.902 |
Conclusion | +2.860 |
Neg logit contributions | |
usefulness | -3.605 |
Unch | -3.564 |
IFF | -3.480 |
blance | -3.386 |
ellig | -3.332 |
Token | are |
Token ID | 389 |
Feature activation | -2.63e+00 |
Pos logit contributions | |
IFF | +4.388 |
Unch | +4.359 |
usefulness | +4.324 |
OR | +4.318 |
lif | +4.181 |
Neg logit contributions | |
azines | -4.979 |
culosis | -4.922 |
formance | -4.640 |
excluding | -4.620 |
Conclusion | -4.423 |
Token | basically |
Token ID | 6209 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
IFF | +1.953 |
usefulness | +1.940 |
Unch | +1.939 |
OR | +1.912 |
lif | +1.843 |
Neg logit contributions | |
azines | -1.905 |
culosis | -1.893 |
excluding | -1.780 |
formance | -1.760 |
Conclusion | -1.689 |
Token | continuing |
Token ID | 8282 |
Feature activation | -1.47e+01 |
Pos logit contributions | |
azines | +0.696 |
culosis | +0.686 |
excluding | +0.659 |
formance | +0.643 |
cluding | +0.618 |
Neg logit contributions | |
IFF | -0.974 |
usefulness | -0.956 |
Unch | -0.952 |
OR | -0.942 |
ellig | -0.914 |
Token | to |
Token ID | 284 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
OR | +6.224 |
Unch | +6.161 |
lif | +6.090 |
IFF | +6.086 |
usefulness | +6.068 |
Neg logit contributions | |
culosis | -14.004 |
azines | -13.896 |
formance | -12.912 |
excluding | -12.685 |
ォ | -12.520 |
Token | be |
Token ID | 307 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
OR | +7.093 |
usefulness | +7.047 |
lif | +6.960 |
Unch | +6.882 |
IFF | +6.833 |
Neg logit contributions | |
culosis | -15.643 |
azines | -15.464 |
excluding | -14.748 |
formance | -14.600 |
cluding | -14.434 |
Token | equally |
Token ID | 8603 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
Unch | +5.472 |
OR | +5.096 |
usefulness | +5.057 |
IFF | +4.814 |
ellig | +4.808 |
Neg logit contributions | |
azines | -11.983 |
culosis | -11.968 |
formance | -11.163 |
excluding | -11.102 |
Conclusion | -10.882 |
Token | as |
Token ID | 355 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
lif | +8.465 |
usefulness | +8.323 |
powerful | +8.151 |
Unch | +8.020 |
standoff | +7.914 |
Neg logit contributions | |
culosis | -20.013 |
azines | -19.105 |
excluding | -18.167 |
formance | -18.015 |
Conclusion | -17.801 |
Token | tight |
Token ID | 5381 |
Feature activation | -3.49e+00 |
Pos logit contributions | |
standoff | +7.167 |
lif | +6.992 |
IFF | +6.558 |
powerful | +6.537 |
usefulness | +6.299 |
Neg logit contributions | |
culosis | -23.904 |
azines | -23.081 |
excluding | -22.108 |
formance | -21.856 |
BuyableInstoreAndOnline | -21.392 |
Token | - |
Token ID | 12 |
Feature activation | -6.77e+00 |
Pos logit contributions | |
IFF | +2.222 |
usefulness | +2.193 |
Unch | +2.186 |
OR | +2.157 |
lif | +2.103 |
Neg logit contributions | |
culosis | -2.893 |
azines | -2.893 |
excluding | -2.735 |
formance | -2.716 |
Conclusion | -2.614 |
Token | f |
Token ID | 69 |
Feature activation | -8.57e+00 |
Pos logit contributions | |
IFF | +4.328 |
OR | +4.189 |
usefulness | +4.158 |
Unch | +4.114 |
humans | +4.068 |
Neg logit contributions | |
culosis | -5.542 |
azines | -5.525 |
formance | -5.146 |
excluding | -5.129 |
Conclusion | -4.991 |
Token | isted |
Token ID | 6347 |
Feature activation | -8.81e+00 |
Pos logit contributions | |
IFF | +4.905 |
usefulness | +4.710 |
Unch | +4.697 |
OR | +4.683 |
ellig | +4.667 |
Neg logit contributions | |
azines | -7.467 |
culosis | -7.459 |
excluding | -7.073 |
formance | -7.045 |
Conclusion | -6.869 |
Token | run |
Token ID | 1057 |
Feature activation | +8.48e+00 |
Pos logit contributions | |
azines | +3.556 |
culosis | +3.520 |
excluding | +3.400 |
formance | +3.299 |
Conclusion | +3.268 |
Neg logit contributions | |
IFF | -3.922 |
usefulness | -3.835 |
Unch | -3.790 |
OR | -3.752 |
humans | -3.683 |
Token | out |
Token ID | 503 |
Feature activation | +3.65e+00 |
Pos logit contributions | |
azines | +3.776 |
culosis | +3.706 |
excluding | +3.537 |
cluding | +3.407 |
formance | +3.406 |
Neg logit contributions | |
IFF | -8.092 |
Unch | -8.075 |
usefulness | -7.911 |
OR | -7.776 |
ellig | -7.674 |
Token | of |
Token ID | 286 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
azines | +2.854 |
culosis | +2.835 |
excluding | +2.702 |
formance | +2.651 |
cluding | +2.562 |
Neg logit contributions | |
IFF | -2.485 |
Unch | -2.461 |
usefulness | -2.448 |
OR | -2.416 |
ellig | -2.326 |
Token | borrowed |
Token ID | 22546 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
IFF | +1.319 |
usefulness | +1.314 |
Unch | +1.310 |
OR | +1.290 |
lif | +1.245 |
Neg logit contributions | |
azines | -1.344 |
culosis | -1.336 |
excluding | -1.259 |
formance | -1.246 |
Conclusion | -1.196 |
Token | money |
Token ID | 1637 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
usefulness | +1.285 |
IFF | +1.277 |
Unch | +1.264 |
OR | +1.248 |
lif | +1.210 |
Neg logit contributions | |
azines | -1.678 |
culosis | -1.677 |
excluding | -1.582 |
formance | -1.579 |
Conclusion | -1.521 |
Token | remains |
Token ID | 3793 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
IFF | +0.959 |
Unch | +0.948 |
usefulness | +0.947 |
OR | +0.934 |
ellig | +0.902 |
Neg logit contributions | |
azines | -1.025 |
culosis | -1.016 |
excluding | -0.967 |
formance | -0.946 |
Conclusion | -0.913 |
Token | Oct |
Token ID | 2556 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
lif | +12.348 |
Unch | +12.330 |
standoff | +12.121 |
usefulness | +11.742 |
OR | +11.635 |
Neg logit contributions | |
culosis | -15.465 |
azines | -15.067 |
formance | -13.881 |
ォ | -13.734 |
excluding | -13.485 |
Token | . |
Token ID | 13 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
OR | +7.377 |
IFF | +7.177 |
Unch | +6.923 |
usefulness | +6.722 |
ellig | +6.687 |
Neg logit contributions | |
culosis | -12.553 |
azines | -12.135 |
excluding | -11.120 |
formance | -11.078 |
BuyableInstoreAndOnline | -10.950 |
Token | 17 |
Token ID | 1596 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
Unch | +4.222 |
OR | +4.132 |
lif | +4.067 |
IFF | +3.995 |
usefulness | +3.729 |
Neg logit contributions | |
azines | -17.030 |
culosis | -16.990 |
ォ | -15.672 |
formance | -15.655 |
excluding | -15.618 |
Token | , |
Token ID | 11 |
Feature activation | -5.26e+00 |
Pos logit contributions | |
IFF | +7.308 |
Unch | +7.274 |
lif | +7.257 |
OR | +7.219 |
usefulness | +7.065 |
Neg logit contributions | |
culosis | -10.575 |
azines | -10.544 |
formance | -9.859 |
excluding | -9.593 |
ォ | -9.548 |
Token | Lew |
Token ID | 8260 |
Feature activation | -3.17e+00 |
Pos logit contributions | |
IFF | +3.626 |
usefulness | +3.618 |
Unch | +3.601 |
OR | +3.576 |
lif | +3.464 |
Neg logit contributions | |
azines | -4.065 |
culosis | -4.063 |
formance | -3.769 |
excluding | -3.748 |
Conclusion | -3.592 |
Token | in |
Token ID | 287 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
Unch | +6.533 |
OR | +6.496 |
usefulness | +6.257 |
IFF | +6.217 |
ellig | +6.180 |
Neg logit contributions | |
culosis | -10.389 |
azines | -10.353 |
excluding | -9.862 |
formance | -9.756 |
Conclusion | -9.542 |
Token | the |
Token ID | 262 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
Unch | +8.320 |
usefulness | +8.145 |
IFF | +7.805 |
lif | +7.754 |
OR | +7.727 |
Neg logit contributions | |
culosis | -13.531 |
azines | -13.290 |
excluding | -13.061 |
ォ | -12.724 |
formance | -12.716 |
Token | peer |
Token ID | 12720 |
Feature activation | -6.35e+00 |
Pos logit contributions | |
Unch | +8.142 |
usefulness | +7.994 |
OR | +7.974 |
lif | +7.753 |
IFF | +7.699 |
Neg logit contributions | |
culosis | -10.218 |
azines | -9.944 |
excluding | -9.743 |
formance | -9.603 |
ォ | -9.480 |
Token | - |
Token ID | 12 |
Feature activation | -8.26e+00 |
Pos logit contributions | |
Unch | +3.565 |
IFF | +3.561 |
usefulness | +3.554 |
OR | +3.480 |
lif | +3.355 |
Neg logit contributions | |
culosis | -5.570 |
azines | -5.531 |
excluding | -5.283 |
formance | -5.183 |
Conclusion | -5.022 |
Token | reviewed |
Token ID | 32974 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
IFF | +6.380 |
OR | +6.304 |
Unch | +6.266 |
usefulness | +6.249 |
ellig | +6.152 |
Neg logit contributions | |
culosis | -5.521 |
azines | -5.516 |
excluding | -5.039 |
formance | -5.003 |
Conclusion | -4.890 |
Token | journal |
Token ID | 3989 |
Feature activation | -2.08e+01 |
Pos logit contributions | |
Unch | +7.070 |
usefulness | +6.965 |
OR | +6.911 |
IFF | +6.766 |
lif | +6.711 |
Neg logit contributions | |
azines | -8.639 |
culosis | -8.627 |
excluding | -8.355 |
formance | -8.259 |
ォ | -8.057 |
Token | Clim |
Token ID | 28573 |
Feature activation | -3.08e+00 |
Pos logit contributions | |
Unch | +11.541 |
usefulness | +10.729 |
lif | +10.650 |
Nature | +10.585 |
OR | +10.434 |
Neg logit contributions | |
culosis | -14.972 |
azines | -14.853 |
excluding | -14.525 |
ォ | -14.480 |
formance | -14.289 |
Token | atic |
Token ID | 1512 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
IFF | +2.793 |
usefulness | +2.777 |
Unch | +2.775 |
OR | +2.742 |
lif | +2.659 |
Neg logit contributions | |
azines | -1.739 |
culosis | -1.723 |
excluding | -1.598 |
formance | -1.570 |
Conclusion | -1.487 |
Token | Change |
Token ID | 9794 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
azines | +0.446 |
culosis | +0.443 |
excluding | +0.421 |
formance | +0.420 |
Conclusion | +0.407 |
Neg logit contributions | |
IFF | -0.400 |
usefulness | -0.395 |
Unch | -0.388 |
OR | -0.382 |
ellig | -0.372 |
Token | , |
Token ID | 11 |
Feature activation | +2.80e-01 |
Pos logit contributions | |
Unch | +1.442 |
IFF | +1.436 |
usefulness | +1.427 |
OR | +1.414 |
lif | +1.358 |
Neg logit contributions | |
azines | -1.832 |
culosis | -1.813 |
excluding | -1.726 |
formance | -1.695 |
Conclusion | -1.640 |
Token | provides |
Token ID | 3769 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
azines | +0.206 |
culosis | +0.204 |
excluding | +0.194 |
formance | +0.190 |
Conclusion | +0.184 |
Neg logit contributions | |
IFF | -0.205 |
Unch | -0.203 |
usefulness | -0.203 |
OR | -0.200 |
ellig | -0.192 |
Token | her |
Token ID | 607 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
Unch | +6.080 |
OR | +6.011 |
usefulness | +5.998 |
IFF | +5.996 |
lif | +5.815 |
Neg logit contributions | |
culosis | -7.242 |
azines | -7.237 |
formance | -6.843 |
excluding | -6.811 |
Conclusion | -6.430 |
Token | mother |
Token ID | 2802 |
Feature activation | -6.39e+00 |
Pos logit contributions | |
usefulness | +7.667 |
Unch | +7.474 |
OR | +7.455 |
lif | +7.345 |
IFF | +7.308 |
Neg logit contributions | |
culosis | -8.858 |
azines | -8.704 |
excluding | -8.232 |
formance | -8.126 |
cluding | -7.677 |
Token | � |
Token ID | 447 |
Feature activation | -3.82e+00 |
Pos logit contributions | |
IFF | +4.088 |
Unch | +4.085 |
OR | +4.074 |
usefulness | +4.063 |
lif | +3.891 |
Neg logit contributions | |
azines | -5.174 |
culosis | -5.107 |
excluding | -4.862 |
formance | -4.795 |
Conclusion | -4.609 |
Token | � |
Token ID | 247 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
IFF | +3.286 |
usefulness | +3.263 |
Unch | +3.262 |
OR | +3.226 |
lif | +3.122 |
Neg logit contributions | |
azines | -2.318 |
culosis | -2.302 |
excluding | -2.143 |
formance | -2.109 |
Conclusion | -2.005 |
Token | s |
Token ID | 82 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
IFF | +1.374 |
usefulness | +1.361 |
Unch | +1.358 |
OR | +1.330 |
lif | +1.258 |
Neg logit contributions | |
azines | -2.556 |
culosis | -2.543 |
excluding | -2.435 |
formance | -2.410 |
Conclusion | -2.338 |
Token | continued |
Token ID | 3767 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
usefulness | +8.626 |
Unch | +8.293 |
lif | +8.201 |
OR | +8.135 |
IFF | +8.095 |
Neg logit contributions | |
culosis | -9.519 |
azines | -9.493 |
excluding | -8.872 |
formance | -8.687 |
cluding | -8.340 |
Token | creative |
Token ID | 7325 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
usefulness | +13.857 |
lif | +12.849 |
Unch | +12.177 |
standoff | +12.036 |
ordeal | +12.026 |
Neg logit contributions | |
azines | -14.041 |
culosis | -14.024 |
excluding | -12.856 |
formance | -12.508 |
ォ | -12.407 |
Token | growth |
Token ID | 3349 |
Feature activation | -9.40e+00 |
Pos logit contributions | |
usefulness | +9.057 |
lif | +8.654 |
Unch | +8.337 |
OR | +8.296 |
standoff | +8.139 |
Neg logit contributions | |
culosis | -10.779 |
azines | -10.608 |
excluding | -10.014 |
formance | -9.687 |
Conclusion | -9.538 |
Token | . |
Token ID | 13 |
Feature activation | -3.78e+00 |
Pos logit contributions | |
usefulness | +5.955 |
Unch | +5.940 |
IFF | +5.938 |
OR | +5.933 |
lif | +5.746 |
Neg logit contributions | |
azines | -7.512 |
culosis | -7.449 |
excluding | -6.976 |
formance | -6.892 |
Conclusion | -6.655 |
Token | � |
Token ID | 564 |
Feature activation | +5.03e-01 |
Pos logit contributions | |
IFF | +2.387 |
Unch | +2.387 |
usefulness | +2.347 |
OR | +2.342 |
lif | +2.221 |
Neg logit contributions | |
azines | -3.159 |
culosis | -3.138 |
excluding | -2.967 |
formance | -2.955 |
cluding | -2.824 |
Token | � |
Token ID | 250 |
Feature activation | -4.95e+00 |
Pos logit contributions | |
azines | +0.296 |
culosis | +0.291 |
excluding | +0.277 |
formance | +0.269 |
Conclusion | +0.263 |
Neg logit contributions | |
usefulness | -0.440 |
IFF | -0.436 |
Unch | -0.436 |
OR | -0.425 |
lif | -0.418 |
Token | to |
Token ID | 284 |
Feature activation | +6.60e+00 |
Pos logit contributions | |
azines | +4.097 |
culosis | +4.012 |
excluding | +3.937 |
formance | +3.843 |
excluding | +3.773 |
Neg logit contributions | |
IFF | -4.133 |
usefulness | -4.012 |
Unch | -4.006 |
OR | -3.962 |
ellig | -3.887 |
Token | know |
Token ID | 760 |
Feature activation | +9.35e+00 |
Pos logit contributions | |
azines | +3.814 |
culosis | +3.651 |
excluding | +3.548 |
Conclusion | +3.461 |
excluding | +3.459 |
Neg logit contributions | |
IFF | -5.472 |
Unch | -5.402 |
OR | -5.395 |
usefulness | -5.386 |
humans | -5.276 |
Token | exactly |
Token ID | 3446 |
Feature activation | +5.91e+00 |
Pos logit contributions | |
azines | +6.515 |
excluding | +6.209 |
culosis | +6.168 |
excluding | +6.146 |
Conclusion | +6.071 |
Neg logit contributions | |
IFF | -6.234 |
Unch | -6.085 |
OR | -6.062 |
ellig | -6.047 |
usefulness | -6.011 |
Token | how |
Token ID | 703 |
Feature activation | -4.08e+00 |
Pos logit contributions | |
azines | +4.662 |
culosis | +4.462 |
excluding | +4.405 |
excluding | +4.324 |
Conclusion | +4.293 |
Neg logit contributions | |
IFF | -3.745 |
ellig | -3.619 |
Unch | -3.617 |
OR | -3.593 |
usefulness | -3.552 |
Token | long |
Token ID | 890 |
Feature activation | -7.78e+00 |
Pos logit contributions | |
IFF | +2.349 |
usefulness | +2.343 |
Unch | +2.333 |
OR | +2.289 |
lif | +2.203 |
Neg logit contributions | |
azines | -3.646 |
culosis | -3.642 |
excluding | -3.460 |
formance | -3.432 |
Conclusion | -3.300 |
Token | he |
Token ID | 339 |
Feature activation | -2.04e+01 |
Pos logit contributions | |
usefulness | +5.036 |
OR | +4.986 |
Unch | +4.981 |
IFF | +4.916 |
lif | +4.805 |
Neg logit contributions | |
culosis | -6.289 |
azines | -6.173 |
formance | -5.831 |
excluding | -5.765 |
Conclusion | -5.540 |
Token | 'll |
Token ID | 1183 |
Feature activation | -2.29e+01 |
Pos logit contributions | |
lif | +8.467 |
usefulness | +8.001 |
OR | +7.933 |
IFF | +7.724 |
orm | +7.563 |
Neg logit contributions | |
culosis | -17.860 |
azines | -17.571 |
formance | -17.275 |
excluding | -16.981 |
Conclusion | -16.510 |
Token | be |
Token ID | 307 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
lif | +10.996 |
OR | +10.475 |
orm | +10.408 |
usefulness | +10.383 |
IFF | +10.355 |
Neg logit contributions | |
culosis | -17.697 |
azines | -17.372 |
excluding | -16.655 |
formance | -16.573 |
黒 | -16.490 |
Token | out |
Token ID | 503 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
usefulness | +10.137 |
OR | +9.980 |
Unch | +9.818 |
lif | +9.752 |
standoff | +9.425 |
Neg logit contributions | |
culosis | -12.928 |
azines | -12.868 |
formance | -11.680 |
黒 | -11.253 |
excluding | -11.151 |
Token | . |
Token ID | 13 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
OR | +7.492 |
Unch | +7.483 |
usefulness | +7.409 |
lif | +7.313 |
IFF | +7.255 |
Neg logit contributions | |
culosis | -11.797 |
azines | -11.383 |
formance | -10.595 |
excluding | -10.356 |
ォ | -10.024 |
Token |
|
Token ID | 198 |
Feature activation | +4.64e+00 |
Pos logit contributions | |
azines | +0.417 |
culosis | +0.414 |
excluding | +0.395 |
formance | +0.388 |
Conclusion | +0.379 |
Neg logit contributions | |
IFF | -0.367 |
usefulness | -0.366 |
Unch | -0.360 |
OR | -0.355 |
lif | -0.344 |
Token | in |
Token ID | 287 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
azines | +3.267 |
culosis | +3.209 |
excluding | +3.045 |
formance | +2.919 |
Conclusion | +2.878 |
Neg logit contributions | |
IFF | -3.732 |
usefulness | -3.655 |
Unch | -3.650 |
OR | -3.584 |
ellig | -3.559 |
Token | the |
Token ID | 262 |
Feature activation | +4.38e+00 |
Pos logit contributions | |
azines | +1.284 |
culosis | +1.274 |
excluding | +1.211 |
formance | +1.196 |
Conclusion | +1.154 |
Neg logit contributions | |
IFF | -1.045 |
usefulness | -1.036 |
Unch | -1.035 |
OR | -1.018 |
lif | -0.974 |
Token | atmosphere |
Token ID | 8137 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
azines | +2.874 |
culosis | +2.775 |
excluding | +2.660 |
formance | +2.576 |
cluding | +2.523 |
Neg logit contributions | |
IFF | -3.522 |
Unch | -3.468 |
usefulness | -3.440 |
OR | -3.394 |
ellig | -3.328 |
Token | is |
Token ID | 318 |
Feature activation | -8.87e+00 |
Pos logit contributions | |
azines | +1.108 |
culosis | +1.099 |
excluding | +1.042 |
formance | +1.014 |
Conclusion | +0.988 |
Neg logit contributions | |
IFF | -1.292 |
usefulness | -1.269 |
Unch | -1.266 |
OR | -1.251 |
ellig | -1.218 |
Token | less |
Token ID | 1342 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
Unch | +6.325 |
usefulness | +6.301 |
OR | +6.217 |
IFF | +6.151 |
lif | +6.146 |
Neg logit contributions | |
culosis | -6.623 |
azines | -6.534 |
formance | -6.059 |
excluding | -5.983 |
cluding | -5.668 |
Token | than |
Token ID | 621 |
Feature activation | -2.03e+01 |
Pos logit contributions | |
OR | +7.257 |
usefulness | +7.243 |
lif | +7.191 |
IFF | +7.177 |
Unch | +7.004 |
Neg logit contributions | |
culosis | -12.739 |
azines | -12.568 |
formance | -11.945 |
excluding | -11.828 |
cluding | -11.167 |
Token | 10 |
Token ID | 838 |
Feature activation | -8.53e+00 |
Pos logit contributions | |
usefulness | +11.045 |
lif | +10.981 |
Unch | +10.798 |
OR | +10.744 |
IFF | +10.227 |
Neg logit contributions | |
culosis | -16.152 |
azines | -15.085 |
formance | -14.387 |
excluding | -13.893 |
ォ | -13.757 |
Token | years |
Token ID | 812 |
Feature activation | -4.70e+00 |
Pos logit contributions | |
IFF | +4.693 |
Unch | +4.683 |
OR | +4.651 |
usefulness | +4.641 |
lif | +4.638 |
Neg logit contributions | |
culosis | -7.549 |
azines | -7.509 |
formance | -7.063 |
excluding | -6.985 |
cluding | -6.706 |
Token | built |
Token ID | 3170 |
Feature activation | +7.77e+00 |
Pos logit contributions | |
usefulness | +3.260 |
Unch | +3.223 |
IFF | +3.223 |
OR | +3.170 |
lif | +3.109 |
Neg logit contributions | |
azines | -3.620 |
culosis | -3.615 |
excluding | -3.388 |
formance | -3.383 |
cluding | -3.204 |
Token | upon |
Token ID | 2402 |
Feature activation | +2.73e+00 |
Pos logit contributions | |
azines | +5.252 |
culosis | +5.012 |
excluding | +4.888 |
formance | +4.705 |
Conclusion | +4.607 |
Neg logit contributions | |
IFF | -5.727 |
Unch | -5.698 |
usefulness | -5.540 |
OR | -5.510 |
ellig | -5.425 |
Token | the |
Token ID | 262 |
Feature activation | +5.52e-01 |
Pos logit contributions | |
azines | +1.978 |
culosis | +1.943 |
excluding | +1.872 |
formance | +1.829 |
Conclusion | +1.812 |
Neg logit contributions | |
IFF | -1.977 |
Unch | -1.944 |
usefulness | -1.928 |
OR | -1.912 |
ellig | -1.879 |
Token | the |
Token ID | 262 |
Feature activation | -6.88e+00 |
Pos logit contributions | |
IFF | +4.998 |
OR | +4.950 |
Unch | +4.928 |
usefulness | +4.865 |
lif | +4.745 |
Neg logit contributions | |
culosis | -8.377 |
azines | -8.319 |
formance | -7.759 |
excluding | -7.687 |
Conclusion | -7.430 |
Token | place |
Token ID | 1295 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
usefulness | +6.237 |
OR | +6.175 |
Unch | +6.146 |
IFF | +6.134 |
lif | +6.036 |
Neg logit contributions | |
azines | -3.823 |
culosis | -3.814 |
excluding | -3.439 |
formance | -3.424 |
Conclusion | -3.186 |
Token | can |
Token ID | 460 |
Feature activation | -1.00e+01 |
Pos logit contributions | |
lif | +6.294 |
usefulness | +6.273 |
OR | +6.268 |
Unch | +6.114 |
IFF | +6.109 |
Neg logit contributions | |
azines | -13.976 |
culosis | -13.925 |
excluding | -13.143 |
formance | -13.114 |
Conclusion | -12.747 |
Token | be |
Token ID | 307 |
Feature activation | -5.64e+00 |
Pos logit contributions | |
IFF | +5.114 |
OR | +5.107 |
usefulness | +5.013 |
lif | +4.970 |
Unch | +4.963 |
Neg logit contributions | |
culosis | -9.248 |
azines | -9.131 |
excluding | -8.711 |
formance | -8.642 |
cluding | -8.434 |
Token | explored |
Token ID | 18782 |
Feature activation | -6.70e+00 |
Pos logit contributions | |
usefulness | +2.507 |
IFF | +2.505 |
Unch | +2.488 |
OR | +2.458 |
ellig | +2.301 |
Neg logit contributions | |
azines | -5.737 |
culosis | -5.714 |
formance | -5.441 |
excluding | -5.419 |
Conclusion | -5.235 |
Token | in |
Token ID | 287 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
IFF | +4.285 |
OR | +4.220 |
Unch | +4.193 |
usefulness | +4.193 |
lif | +4.063 |
Neg logit contributions | |
culosis | -5.512 |
azines | -5.490 |
formance | -5.111 |
excluding | -5.034 |
Conclusion | -4.853 |
Token | 3 |
Token ID | 513 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
IFF | +8.819 |
OR | +8.741 |
usefulness | +8.578 |
Unch | +8.491 |
lif | +8.351 |
Neg logit contributions | |
culosis | -16.424 |
azines | -15.865 |
excluding | -14.674 |
formance | -14.532 |
ォ | -14.168 |
Token | D |
Token ID | 35 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
usefulness | +1.024 |
Unch | +1.019 |
IFF | +1.014 |
OR | +0.989 |
lif | +0.963 |
Neg logit contributions | |
azines | -1.005 |
culosis | -0.991 |
excluding | -0.953 |
formance | -0.933 |
Conclusion | -0.900 |
Token | with |
Token ID | 351 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
IFF | +5.670 |
OR | +5.550 |
usefulness | +5.517 |
Unch | +5.492 |
lif | +5.471 |
Neg logit contributions | |
culosis | -9.380 |
azines | -9.319 |
formance | -8.503 |
excluding | -8.452 |
ォ | -8.278 |
Token | Google |
Token ID | 3012 |
Feature activation | -3.83e+00 |
Pos logit contributions | |
IFF | +1.153 |
usefulness | +1.144 |
Unch | +1.143 |
OR | +1.126 |
lif | +1.082 |
Neg logit contributions | |
azines | -1.325 |
culosis | -1.316 |
excluding | -1.247 |
formance | -1.232 |
Conclusion | -1.186 |
Token | Maps |
Token ID | 20347 |
Feature activation | +9.96e-01 |
Pos logit contributions | |
IFF | +2.561 |
Unch | +2.546 |
usefulness | +2.543 |
OR | +2.506 |
lif | +2.402 |
Neg logit contributions | |
azines | -3.050 |
culosis | -3.032 |
excluding | -2.884 |
formance | -2.848 |
cluding | -2.739 |
Token | . |
Token ID | 13 |
Feature activation | -2.66e+00 |
Pos logit contributions | |
azines | +0.149 |
culosis | +0.147 |
excluding | +0.140 |
formance | +0.138 |
cluding | +0.133 |
Neg logit contributions | |
usefulness | -0.154 |
Unch | -0.154 |
IFF | -0.152 |
OR | -0.148 |
lif | -0.145 |
Token | N |
Token ID | 45 |
Feature activation | -6.98e+00 |
Pos logit contributions | |
OR | +1.510 |
IFF | +1.508 |
usefulness | +1.495 |
Unch | +1.488 |
lif | +1.413 |
Neg logit contributions | |
culosis | -2.382 |
azines | -2.359 |
excluding | -2.251 |
formance | -2.219 |
cluding | -2.152 |
Token | . |
Token ID | 13 |
Feature activation | -7.36e+00 |
Pos logit contributions | |
IFF | +4.189 |
OR | +4.188 |
Unch | +4.069 |
usefulness | +3.988 |
lif | +3.919 |
Neg logit contributions | |
culosis | -5.805 |
azines | -5.737 |
excluding | -5.632 |
formance | -5.458 |
Conclusion | -5.201 |
Token | ST |
Token ID | 3563 |
Feature activation | -6.12e+00 |
Pos logit contributions | |
Unch | +5.173 |
OR | +5.160 |
IFF | +5.158 |
usefulness | +5.154 |
lif | +4.996 |
Neg logit contributions | |
azines | -5.362 |
culosis | -5.321 |
excluding | -5.108 |
formance | -5.085 |
cluding | -4.776 |
Token | ILL |
Token ID | 8267 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
IFF | +3.667 |
OR | +3.591 |
usefulness | +3.382 |
Unch | +3.373 |
ellig | +3.208 |
Neg logit contributions | |
azines | -5.500 |
culosis | -5.460 |
formance | -5.111 |
excluding | -5.098 |
cluding | -4.934 |
Token | SUPPORT |
Token ID | 43333 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
OR | +7.945 |
IFF | +7.900 |
Unch | +7.582 |
usefulness | +7.476 |
humans | +7.125 |
Neg logit contributions | |
azines | -7.974 |
culosis | -7.965 |
formance | -7.405 |
excluding | -7.203 |
cluding | -6.919 |
Token | ING |
Token ID | 2751 |
Feature activation | -9.07e+00 |
Pos logit contributions | |
OR | +12.240 |
IFF | +11.811 |
Unch | +11.253 |
HOU | +10.292 |
EFF | +10.248 |
Neg logit contributions | |
azines | -15.006 |
culosis | -14.494 |
formance | -14.183 |
excluding | -13.526 |
culminating | -13.108 |
Token | UN |
Token ID | 4725 |
Feature activation | -2.83e+00 |
Pos logit contributions | |
IFF | +5.920 |
OR | +5.893 |
Unch | +5.883 |
usefulness | +5.598 |
lif | +5.363 |
Neg logit contributions | |
azines | -7.358 |
culosis | -7.205 |
formance | -6.813 |
excluding | -6.764 |
cluding | -6.412 |
Token | ITS |
Token ID | 29722 |
Feature activation | -9.37e-01 |
Pos logit contributions | |
IFF | +1.677 |
Unch | +1.647 |
usefulness | +1.642 |
OR | +1.633 |
lif | +1.540 |
Neg logit contributions | |
azines | -2.504 |
culosis | -2.484 |
excluding | -2.363 |
formance | -2.343 |
cluding | -2.260 |
Token |
|
Token ID | 198 |
Feature activation | -8.76e-01 |
Pos logit contributions | |
IFF | +0.620 |
usefulness | +0.618 |
Unch | +0.614 |
OR | +0.603 |
lif | +0.581 |
Neg logit contributions | |
azines | -0.753 |
culosis | -0.749 |
excluding | -0.713 |
formance | -0.702 |
Conclusion | -0.682 |
Token |
|
Token ID | 198 |
Feature activation | -3.14e+00 |
Pos logit contributions | |
usefulness | +0.583 |
IFF | +0.580 |
Unch | +0.580 |
OR | +0.562 |
lif | +0.545 |
Neg logit contributions | |
azines | -0.702 |
culosis | -0.694 |
excluding | -0.669 |
formance | -0.656 |
Conclusion | -0.636 |
Token | as |
Token ID | 355 |
Feature activation | -7.80e+00 |
Pos logit contributions | |
azines | +1.584 |
culosis | +1.575 |
excluding | +1.500 |
formance | +1.482 |
Conclusion | +1.432 |
Neg logit contributions | |
IFF | -1.170 |
usefulness | -1.162 |
Unch | -1.160 |
OR | -1.140 |
lif | -1.091 |
Token | sc |
Token ID | 629 |
Feature activation | -6.64e+00 |
Pos logit contributions | |
Unch | +5.308 |
usefulness | +5.259 |
OR | +5.213 |
IFF | +5.210 |
lif | +5.099 |
Neg logit contributions | |
azines | -5.942 |
culosis | -5.913 |
formance | -5.605 |
excluding | -5.561 |
cluding | -5.241 |
Token | a |
Token ID | 64 |
Feature activation | -3.60e+00 |
Pos logit contributions | |
OR | +3.562 |
IFF | +3.559 |
Unch | +3.460 |
usefulness | +3.403 |
orm | +3.328 |
Neg logit contributions | |
culosis | -6.075 |
azines | -5.998 |
excluding | -5.700 |
formance | -5.694 |
Conclusion | -5.526 |
Token | . |
Token ID | 13 |
Feature activation | -7.99e-01 |
Pos logit contributions | |
IFF | +2.353 |
usefulness | +2.338 |
Unch | +2.335 |
OR | +2.291 |
lif | +2.197 |
Neg logit contributions | |
azines | -2.935 |
culosis | -2.916 |
excluding | -2.771 |
formance | -2.741 |
Conclusion | -2.643 |
Token | If |
Token ID | 1002 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
IFF | +0.548 |
usefulness | +0.543 |
Unch | +0.542 |
OR | +0.530 |
lif | +0.510 |
Neg logit contributions | |
azines | -0.629 |
culosis | -0.624 |
excluding | -0.593 |
formance | -0.585 |
Conclusion | -0.565 |
Token | it |
Token ID | 340 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
lif | +6.477 |
OR | +6.372 |
usefulness | +6.284 |
Unch | +6.217 |
orm | +6.035 |
Neg logit contributions | |
culosis | -12.417 |
azines | -12.245 |
excluding | -11.453 |
formance | -11.438 |
ォ | -11.285 |
Token | worked |
Token ID | 3111 |
Feature activation | -8.48e+00 |
Pos logit contributions | |
usefulness | +5.971 |
lif | +5.906 |
orm | +5.667 |
IFF | +5.619 |
Unch | +5.497 |
Neg logit contributions | |
azines | -20.347 |
culosis | -19.821 |
ォ | -19.141 |
excluding | -19.025 |
formance | -18.895 |
Token | out |
Token ID | 503 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
usefulness | +6.214 |
Unch | +6.123 |
OR | +6.075 |
IFF | +6.061 |
lif | +5.991 |
Neg logit contributions | |
azines | -6.153 |
culosis | -6.113 |
excluding | -5.639 |
formance | -5.636 |
ォ | -5.386 |
Token | , |
Token ID | 11 |
Feature activation | -7.07e+00 |
Pos logit contributions | |
IFF | +1.836 |
usefulness | +1.820 |
Unch | +1.819 |
OR | +1.793 |
lif | +1.721 |
Neg logit contributions | |
azines | -2.131 |
culosis | -2.120 |
excluding | -2.005 |
formance | -1.983 |
Conclusion | -1.910 |
Token | dragon |
Token ID | 10441 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
usefulness | +3.780 |
OR | +3.729 |
Unch | +3.727 |
IFF | +3.698 |
lif | +3.625 |
Neg logit contributions | |
azines | -6.556 |
culosis | -6.507 |
formance | -6.147 |
excluding | -6.143 |
Conclusion | -5.966 |
Token | would |
Token ID | 561 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
OR | +5.754 |
lif | +5.697 |
IFF | +5.656 |
usefulness | +5.535 |
Unch | +5.508 |
Neg logit contributions | |
culosis | -9.243 |
azines | -9.117 |
formance | -8.613 |
excluding | -8.542 |
ォ | -8.530 |
Token | if |
Token ID | 611 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
IFF | +3.319 |
usefulness | +3.318 |
Unch | +3.313 |
OR | +3.265 |
lif | +3.158 |
Neg logit contributions | |
azines | -3.686 |
culosis | -3.679 |
excluding | -3.456 |
formance | -3.417 |
cluding | -3.275 |
Token | so |
Token ID | 523 |
Feature activation | +1.78e+00 |
Pos logit contributions | |
IFF | +1.108 |
usefulness | +1.100 |
Unch | +1.099 |
OR | +1.083 |
lif | +1.041 |
Neg logit contributions | |
azines | -1.163 |
culosis | -1.155 |
excluding | -1.092 |
formance | -1.077 |
Conclusion | -1.036 |
Token | , |
Token ID | 11 |
Feature activation | +3.07e-01 |
Pos logit contributions | |
azines | +1.403 |
culosis | +1.394 |
excluding | +1.322 |
formance | +1.305 |
Conclusion | +1.258 |
Neg logit contributions | |
IFF | -1.216 |
usefulness | -1.207 |
Unch | -1.205 |
OR | -1.187 |
lif | -1.139 |
Token | it |
Token ID | 340 |
Feature activation | -3.61e+00 |
Pos logit contributions | |
azines | +0.237 |
culosis | +0.233 |
excluding | +0.223 |
formance | +0.220 |
Conclusion | +0.212 |
Neg logit contributions | |
IFF | -0.216 |
Unch | -0.213 |
usefulness | -0.212 |
OR | -0.208 |
ellig | -0.201 |
Token | has |
Token ID | 468 |
Feature activation | -5.28e+00 |
Pos logit contributions | |
IFF | +2.573 |
Unch | +2.557 |
usefulness | +2.553 |
OR | +2.525 |
lif | +2.440 |
Neg logit contributions | |
azines | -2.717 |
culosis | -2.709 |
excluding | -2.552 |
formance | -2.528 |
Conclusion | -2.423 |
Token | another |
Token ID | 1194 |
Feature activation | -1.97e+01 |
Pos logit contributions | |
usefulness | +3.429 |
Unch | +3.408 |
IFF | +3.403 |
OR | +3.353 |
lif | +3.252 |
Neg logit contributions | |
culosis | -4.297 |
azines | -4.265 |
excluding | -4.025 |
formance | -3.992 |
Conclusion | -3.864 |
Token | 180 |
Token ID | 11546 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
lif | +11.618 |
usefulness | +11.521 |
OR | +11.122 |
standoff | +10.973 |
Unch | +10.854 |
Neg logit contributions | |
culosis | -14.351 |
azines | -14.161 |
excluding | -13.083 |
formance | -13.039 |
黒 | -12.911 |
Token | days |
Token ID | 1528 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
usefulness | +6.303 |
OR | +6.284 |
IFF | +6.264 |
lif | +6.125 |
Unch | +6.089 |
Neg logit contributions | |
culosis | -12.199 |
azines | -11.718 |
formance | -11.489 |
Conclusion | -11.212 |
excluding | -11.179 |
Token | to |
Token ID | 284 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
OR | +9.456 |
usefulness | +9.217 |
Unch | +9.128 |
lif | +9.040 |
IFF | +8.896 |
Neg logit contributions | |
culosis | -13.513 |
azines | -12.914 |
formance | -12.568 |
excluding | -12.008 |
Conclusion | -11.870 |
Token | issue |
Token ID | 2071 |
Feature activation | +7.42e+00 |
Pos logit contributions | |
IFF | +0.966 |
usefulness | +0.956 |
Unch | +0.956 |
OR | +0.939 |
humans | +0.907 |
Neg logit contributions | |
azines | -0.954 |
culosis | -0.944 |
excluding | -0.895 |
formance | -0.885 |
Conclusion | -0.852 |
Token | preliminary |
Token ID | 15223 |
Feature activation | +2.41e+00 |
Pos logit contributions | |
azines | +4.756 |
formance | +4.542 |
culosis | +4.489 |
excluding | +4.466 |
Conclusion | +4.349 |
Neg logit contributions | |
IFF | -5.704 |
Unch | -5.686 |
usefulness | -5.612 |
humans | -5.483 |
ellig | -5.463 |
Token | pixel |
Token ID | 17465 |
Feature activation | -3.18e+00 |
Pos logit contributions | |
usefulness | +2.768 |
IFF | +2.761 |
Unch | +2.730 |
OR | +2.700 |
lif | +2.614 |
Neg logit contributions | |
azines | -3.237 |
culosis | -3.236 |
excluding | -3.033 |
formance | -3.002 |
cluding | -2.869 |
Token | size |
Token ID | 2546 |
Feature activation | -3.55e+00 |
Pos logit contributions | |
IFF | +2.241 |
usefulness | +2.235 |
Unch | +2.218 |
OR | +2.197 |
lif | +2.118 |
Neg logit contributions | |
azines | -2.432 |
culosis | -2.427 |
excluding | -2.282 |
formance | -2.248 |
cluding | -2.164 |
Token | wouldn |
Token ID | 3636 |
Feature activation | +4.46e+00 |
Pos logit contributions | |
IFF | +2.483 |
usefulness | +2.477 |
Unch | +2.464 |
OR | +2.426 |
lif | +2.346 |
Neg logit contributions | |
culosis | -2.731 |
azines | -2.729 |
excluding | -2.564 |
formance | -2.541 |
cluding | -2.427 |
Token | 't |
Token ID | 470 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
azines | +2.195 |
excluding | +2.118 |
culosis | +2.065 |
formance | +1.999 |
Conclusion | +1.923 |
Neg logit contributions | |
usefulness | -4.267 |
Unch | -4.237 |
IFF | -4.121 |
lif | -3.986 |
ellig | -3.982 |
Token | look |
Token ID | 804 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
Unch | +6.462 |
usefulness | +6.445 |
IFF | +6.427 |
lif | +6.331 |
OR | +6.307 |
Neg logit contributions | |
culosis | -9.557 |
azines | -9.494 |
formance | -9.010 |
excluding | -8.932 |
黒 | -8.492 |
Token | as |
Token ID | 355 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
Unch | +8.695 |
OR | +8.493 |
lif | +8.465 |
usefulness | +8.414 |
IFF | +8.322 |
Neg logit contributions | |
culosis | -12.531 |
azines | -12.268 |
formance | -11.580 |
excluding | -11.285 |
cluding | -10.875 |
Token | bad |
Token ID | 2089 |
Feature activation | -4.77e+00 |
Pos logit contributions | |
lif | +10.897 |
IFF | +10.862 |
usefulness | +10.601 |
Unch | +10.483 |
OR | +10.243 |
Neg logit contributions | |
culosis | -15.651 |
azines | -14.971 |
formance | -13.828 |
excluding | -13.672 |
cluding | -13.035 |
Token | as |
Token ID | 355 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
IFF | +3.022 |
usefulness | +2.995 |
Unch | +2.993 |
OR | +2.958 |
lif | +2.846 |
Neg logit contributions | |
culosis | -3.957 |
azines | -3.957 |
excluding | -3.729 |
formance | -3.706 |
cluding | -3.552 |
Token | it |
Token ID | 340 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
usefulness | +8.092 |
Unch | +7.944 |
IFF | +7.942 |
lif | +7.892 |
OR | +7.817 |
Neg logit contributions | |
culosis | -11.469 |
azines | -11.161 |
formance | -10.593 |
excluding | -10.358 |
ォ | -9.853 |
Token | does |
Token ID | 857 |
Feature activation | -7.88e+00 |
Pos logit contributions | |
usefulness | +7.100 |
IFF | +6.896 |
Unch | +6.889 |
OR | +6.863 |
lif | +6.794 |
Neg logit contributions | |
culosis | -10.987 |
azines | -10.920 |
excluding | -10.126 |
formance | -10.078 |
cluding | -9.577 |
Token | there |
Token ID | 612 |
Feature activation | -1.93e+00 |
Pos logit contributions | |
usefulness | +5.185 |
Unch | +5.162 |
IFF | +5.156 |
OR | +5.054 |
lif | +4.943 |
Neg logit contributions | |
culosis | -6.211 |
azines | -6.186 |
excluding | -5.791 |
formance | -5.766 |
cluding | -5.506 |
Token | research |
Token ID | 2267 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
usefulness | +5.462 |
IFF | +5.261 |
OR | +5.254 |
Unch | +5.250 |
lif | +5.069 |
Neg logit contributions | |
culosis | -6.911 |
azines | -6.857 |
excluding | -6.407 |
formance | -6.388 |
cluding | -6.015 |
Token | was |
Token ID | 373 |
Feature activation | -7.26e-01 |
Pos logit contributions | |
IFF | +1.529 |
usefulness | +1.526 |
Unch | +1.517 |
OR | +1.498 |
lif | +1.448 |
Neg logit contributions | |
azines | -1.440 |
culosis | -1.433 |
excluding | -1.347 |
formance | -1.331 |
Conclusion | -1.271 |
Token | published |
Token ID | 3199 |
Feature activation | -3.13e+00 |
Pos logit contributions | |
IFF | +0.547 |
Unch | +0.544 |
usefulness | +0.542 |
OR | +0.534 |
ellig | +0.516 |
Neg logit contributions | |
azines | -0.517 |
culosis | -0.509 |
excluding | -0.486 |
formance | -0.478 |
Conclusion | -0.461 |
Token | last |
Token ID | 938 |
Feature activation | -3.99e+00 |
Pos logit contributions | |
IFF | +2.291 |
Unch | +2.277 |
usefulness | +2.272 |
OR | +2.240 |
lif | +2.158 |
Neg logit contributions | |
azines | -2.303 |
culosis | -2.291 |
excluding | -2.163 |
formance | -2.134 |
Conclusion | -2.044 |
Token | month |
Token ID | 1227 |
Feature activation | -9.80e+00 |
Pos logit contributions | |
IFF | +3.710 |
Unch | +3.703 |
usefulness | +3.696 |
OR | +3.662 |
lif | +3.572 |
Neg logit contributions | |
azines | -2.123 |
culosis | -2.108 |
excluding | -1.946 |
formance | -1.924 |
cluding | -1.791 |
Token | in |
Token ID | 287 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
Unch | +5.886 |
OR | +5.865 |
IFF | +5.814 |
usefulness | +5.723 |
lif | +5.532 |
Neg logit contributions | |
culosis | -8.034 |
azines | -7.953 |
excluding | -7.547 |
formance | -7.478 |
cluding | -7.240 |
Token | the |
Token ID | 262 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
Unch | +9.843 |
usefulness | +9.696 |
IFF | +9.513 |
OR | +9.421 |
lif | +9.406 |
Neg logit contributions | |
culosis | -15.453 |
azines | -14.933 |
黒 | -14.792 |
ォ | -14.642 |
excluding | -14.547 |
Token | Proceedings |
Token ID | 30641 |
Feature activation | -7.70e+00 |
Pos logit contributions | |
Unch | +8.058 |
usefulness | +7.959 |
OR | +7.912 |
lif | +7.757 |
IFF | +7.738 |
Neg logit contributions | |
culosis | -10.153 |
azines | -9.714 |
excluding | -9.468 |
formance | -9.365 |
ォ | -9.312 |
Token | of |
Token ID | 286 |
Feature activation | -8.50e+00 |
Pos logit contributions | |
Unch | +4.532 |
IFF | +4.497 |
usefulness | +4.470 |
OR | +4.456 |
lif | +4.230 |
Neg logit contributions | |
culosis | -6.791 |
azines | -6.676 |
excluding | -6.301 |
formance | -6.182 |
cluding | -5.995 |
Token | the |
Token ID | 262 |
Feature activation | -3.20e+00 |
Pos logit contributions | |
Unch | +5.023 |
IFF | +4.976 |
usefulness | +4.957 |
OR | +4.889 |
lif | +4.653 |
Neg logit contributions | |
azines | -7.399 |
culosis | -7.394 |
excluding | -6.999 |
formance | -6.898 |
cluding | -6.618 |
Token | National |
Token ID | 2351 |
Feature activation | -4.91e-01 |
Pos logit contributions | |
IFF | +2.043 |
Unch | +2.028 |
usefulness | +2.027 |
OR | +1.991 |
lif | +1.906 |
Neg logit contributions | |
azines | -2.664 |
culosis | -2.651 |
excluding | -2.520 |
formance | -2.490 |
cluding | -2.397 |
Token | didn |
Token ID | 1422 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
Unch | +7.885 |
IFF | +7.763 |
lif | +7.716 |
OR | +7.647 |
usefulness | +7.534 |
Neg logit contributions | |
azines | -10.018 |
culosis | -9.724 |
formance | -9.532 |
excluding | -9.172 |
Conclusion | -8.811 |
Token | � |
Token ID | 447 |
Feature activation | -9.31e+00 |
Pos logit contributions | |
azines | +0.220 |
culosis | +0.213 |
excluding | +0.207 |
formance | +0.201 |
Conclusion | +0.192 |
Neg logit contributions | |
usefulness | -0.338 |
Unch | -0.336 |
IFF | -0.334 |
OR | -0.325 |
lif | -0.320 |
Token | � |
Token ID | 247 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
Unch | +6.965 |
OR | +6.950 |
IFF | +6.909 |
usefulness | +6.756 |
lif | +6.543 |
Neg logit contributions | |
azines | -6.505 |
culosis | -6.348 |
excluding | -5.948 |
formance | -5.781 |
cluding | -5.639 |
Token | t |
Token ID | 83 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
IFF | +2.247 |
Unch | +2.229 |
usefulness | +2.214 |
OR | +2.208 |
lif | +2.116 |
Neg logit contributions | |
azines | -2.608 |
culosis | -2.573 |
excluding | -2.449 |
formance | -2.413 |
Conclusion | -2.329 |
Token | waive |
Token ID | 40307 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
Unch | +8.772 |
IFF | +8.751 |
lif | +8.709 |
OR | +8.566 |
usefulness | +8.358 |
Neg logit contributions | |
culosis | -10.435 |
azines | -10.334 |
formance | -9.755 |
excluding | -9.542 |
黒 | -9.188 |
Token | another |
Token ID | 1194 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
usefulness | +7.321 |
IFF | +7.263 |
Unch | +7.194 |
OR | +7.171 |
lif | +7.097 |
Neg logit contributions | |
culosis | -10.970 |
azines | -10.933 |
formance | -10.170 |
excluding | -9.990 |
ォ | -9.639 |
Token | part |
Token ID | 636 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
lif | +12.250 |
usefulness | +12.050 |
IFF | +11.819 |
OR | +11.528 |
standoff | +11.451 |
Neg logit contributions | |
azines | -13.815 |
culosis | -13.461 |
excluding | -12.538 |
formance | -12.473 |
ォ | -12.329 |
Token | of |
Token ID | 286 |
Feature activation | -1.59e+01 |
Pos logit contributions | |
OR | +6.491 |
IFF | +6.380 |
Unch | +6.248 |
lif | +6.020 |
usefulness | +5.911 |
Neg logit contributions | |
azines | -12.385 |
culosis | -12.358 |
excluding | -11.311 |
formance | -11.237 |
Conclusion | -10.672 |
Token | the |
Token ID | 262 |
Feature activation | -1.69e+01 |
Pos logit contributions | |
Unch | +8.045 |
IFF | +8.022 |
usefulness | +7.956 |
lif | +7.856 |
OR | +7.807 |
Neg logit contributions | |
culosis | -13.639 |
azines | -13.534 |
excluding | -12.529 |
formance | -12.515 |
ォ | -12.116 |
Token | decision |
Token ID | 2551 |
Feature activation | -1.80e+01 |
Pos logit contributions | |
usefulness | +10.945 |
IFF | +10.745 |
Unch | +10.658 |
lif | +10.490 |
OR | +10.465 |
Neg logit contributions | |
culosis | -11.967 |
azines | -11.940 |
formance | -11.353 |
excluding | -11.065 |
ォ | -10.658 |
Token | that |
Token ID | 326 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
OR | +10.453 |
lif | +10.369 |
Unch | +10.210 |
IFF | +10.202 |
usefulness | +9.892 |
Neg logit contributions | |
culosis | -13.773 |
azines | -13.708 |
formance | -12.686 |
excluding | -12.075 |
ォ | -12.009 |
Token | , |
Token ID | 11 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
IFF | +2.048 |
Unch | +2.024 |
usefulness | +2.023 |
OR | +2.002 |
lif | +1.915 |
Neg logit contributions | |
azines | -2.421 |
culosis | -2.410 |
excluding | -2.273 |
formance | -2.252 |
Conclusion | -2.170 |
Token | 2012 |
Token ID | 2321 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
azines | +0.736 |
culosis | +0.723 |
excluding | +0.690 |
formance | +0.661 |
Conclusion | +0.644 |
Neg logit contributions | |
IFF | -1.017 |
usefulness | -1.017 |
Unch | -1.014 |
OR | -0.980 |
ellig | -0.966 |
Token | ) |
Token ID | 8 |
Feature activation | -6.34e+00 |
Pos logit contributions | |
usefulness | +1.141 |
IFF | +1.134 |
Unch | +1.133 |
OR | +1.101 |
lif | +1.075 |
Neg logit contributions | |
azines | -1.064 |
culosis | -1.050 |
excluding | -1.006 |
formance | -0.984 |
Conclusion | -0.949 |
Token |
|
Token ID | 198 |
Feature activation | -7.65e+00 |
Pos logit contributions | |
IFF | +3.658 |
OR | +3.657 |
Unch | +3.583 |
usefulness | +3.450 |
ellig | +3.307 |
Neg logit contributions | |
culosis | -5.672 |
azines | -5.636 |
excluding | -5.265 |
formance | -5.259 |
cluding | -5.074 |
Token |
|
Token ID | 198 |
Feature activation | -9.93e+00 |
Pos logit contributions | |
OR | +4.112 |
IFF | +4.085 |
Unch | +3.921 |
usefulness | +3.829 |
humans | +3.714 |
Neg logit contributions | |
culosis | -7.179 |
azines | -7.063 |
formance | -6.619 |
excluding | -6.545 |
cluding | -6.336 |
Token | A |
Token ID | 32 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
OR | +6.080 |
IFF | +5.954 |
humans | +5.407 |
ELL | +5.327 |
usefulness | +5.300 |
Neg logit contributions | |
culosis | -8.513 |
azines | -8.475 |
formance | -7.877 |
excluding | -7.781 |
Conclusion | -7.726 |
Token | 24 |
Token ID | 1987 |
Feature activation | -8.87e+00 |
Pos logit contributions | |
lif | +9.072 |
Unch | +8.774 |
OR | +8.690 |
IFF | +8.619 |
ils | +8.528 |
Neg logit contributions | |
azines | -16.537 |
culosis | -16.026 |
formance | -15.421 |
excluding | -15.362 |
Conclusion | -14.564 |
Token | - |
Token ID | 12 |
Feature activation | -4.94e+00 |
Pos logit contributions | |
IFF | +5.034 |
OR | +4.963 |
Unch | +4.913 |
usefulness | +4.824 |
lif | +4.756 |
Neg logit contributions | |
azines | -7.768 |
culosis | -7.763 |
excluding | -7.329 |
formance | -7.246 |
Conclusion | -7.005 |
Token | year |
Token ID | 1941 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
IFF | +5.029 |
Unch | +4.988 |
OR | +4.979 |
usefulness | +4.963 |
lif | +4.838 |
Neg logit contributions | |
azines | -2.205 |
culosis | -2.171 |
excluding | -1.947 |
formance | -1.911 |
Conclusion | -1.792 |
Token | - |
Token ID | 12 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
usefulness | +5.716 |
OR | +5.640 |
IFF | +5.617 |
lif | +5.612 |
Unch | +5.604 |
Neg logit contributions | |
culosis | -9.587 |
azines | -9.555 |
excluding | -9.064 |
formance | -9.049 |
Conclusion | -8.576 |
Token | old |
Token ID | 727 |
Feature activation | -8.69e+00 |
Pos logit contributions | |
OR | +5.836 |
IFF | +5.684 |
humans | +5.342 |
orm | +5.332 |
Unch | +5.244 |
Neg logit contributions | |
culosis | -9.369 |
azines | -9.321 |
formance | -8.718 |
excluding | -8.602 |
Conclusion | -8.515 |
Token | aren |
Token ID | 3588 |
Feature activation | +5.05e+00 |
Pos logit contributions | |
Unch | +4.751 |
usefulness | +4.739 |
IFF | +4.706 |
OR | +4.657 |
lif | +4.570 |
Neg logit contributions | |
azines | -5.733 |
culosis | -5.660 |
excluding | -5.366 |
formance | -5.356 |
cluding | -5.098 |
Token | � |
Token ID | 447 |
Feature activation | -7.00e+00 |
Pos logit contributions | |
azines | +2.427 |
excluding | +2.391 |
culosis | +2.271 |
formance | +2.189 |
Conclusion | +2.178 |
Neg logit contributions | |
usefulness | -4.894 |
Unch | -4.793 |
IFF | -4.632 |
ellig | -4.549 |
lif | -4.546 |
Token | � |
Token ID | 247 |
Feature activation | -3.71e+00 |
Pos logit contributions | |
IFF | +5.214 |
OR | +5.179 |
Unch | +5.143 |
usefulness | +5.129 |
lif | +4.909 |
Neg logit contributions | |
azines | -4.999 |
culosis | -4.971 |
excluding | -4.617 |
formance | -4.586 |
cluding | -4.417 |
Token | t |
Token ID | 83 |
Feature activation | -7.89e+00 |
Pos logit contributions | |
IFF | +2.509 |
usefulness | +2.483 |
Unch | +2.480 |
OR | +2.458 |
lif | +2.356 |
Neg logit contributions | |
azines | -2.926 |
culosis | -2.902 |
excluding | -2.749 |
formance | -2.718 |
Conclusion | -2.626 |
Token | nearly |
Token ID | 3016 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
usefulness | +5.502 |
IFF | +5.469 |
Unch | +5.457 |
OR | +5.388 |
lif | +5.307 |
Neg logit contributions | |
culosis | -5.941 |
azines | -5.916 |
formance | -5.505 |
excluding | -5.406 |
Conclusion | -5.262 |
Token | as |
Token ID | 355 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
Unch | +5.764 |
usefulness | +5.700 |
IFF | +5.686 |
OR | +5.577 |
lif | +5.552 |
Neg logit contributions | |
azines | -9.116 |
culosis | -9.097 |
formance | -8.594 |
excluding | -8.504 |
Conclusion | -8.264 |
Token | entertained |
Token ID | 34988 |
Feature activation | -5.01e+00 |
Pos logit contributions | |
lif | +11.385 |
usefulness | +11.253 |
IFF | +10.845 |
powerful | +10.841 |
standoff | +10.645 |
Neg logit contributions | |
culosis | -14.721 |
azines | -14.146 |
formance | -13.416 |
excluding | -13.199 |
ォ | -12.628 |
Token | by |
Token ID | 416 |
Feature activation | -9.57e+00 |
Pos logit contributions | |
IFF | +3.176 |
Unch | +3.164 |
usefulness | +3.129 |
OR | +3.096 |
lif | +2.981 |
Neg logit contributions | |
azines | -4.171 |
culosis | -4.117 |
excluding | -3.920 |
formance | -3.893 |
cluding | -3.729 |
Token | it |
Token ID | 340 |
Feature activation | -6.39e-01 |
Pos logit contributions | |
usefulness | +6.252 |
Unch | +6.095 |
IFF | +6.020 |
lif | +5.964 |
OR | +5.932 |
Neg logit contributions | |
culosis | -7.573 |
azines | -7.572 |
formance | -7.108 |
excluding | -7.008 |
Conclusion | -6.689 |
Token | — |
Token ID | 851 |
Feature activation | -9.49e+00 |
Pos logit contributions | |
IFF | +0.418 |
usefulness | +0.415 |
Unch | +0.413 |
OR | +0.406 |
ellig | +0.389 |
Neg logit contributions | |
azines | -0.521 |
culosis | -0.518 |
excluding | -0.492 |
formance | -0.486 |
Conclusion | -0.471 |
Token | in |
Token ID | 287 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
IFF | +6.271 |
usefulness | +6.260 |
OR | +6.257 |
Unch | +6.251 |
lif | +6.027 |
Neg logit contributions | |
azines | -7.291 |
culosis | -7.233 |
formance | -6.775 |
excluding | -6.619 |
cluding | -6.357 |
Token | the |
Token ID | 262 |
Feature activation | +9.00e-01 |
Pos logit contributions | |
azines | +5.535 |
culosis | +5.284 |
excluding | +5.219 |
formance | +5.150 |
Conclusion | +5.031 |
Neg logit contributions | |
IFF | -5.642 |
usefulness | -5.485 |
ellig | -5.441 |
Unch | -5.377 |
OR | -5.288 |
Token | lines |
Token ID | 3951 |
Feature activation | -4.57e+00 |
Pos logit contributions | |
azines | +0.652 |
culosis | +0.634 |
excluding | +0.609 |
formance | +0.604 |
Conclusion | +0.586 |
Neg logit contributions | |
IFF | -0.668 |
Unch | -0.654 |
usefulness | -0.651 |
OR | -0.646 |
ellig | -0.632 |
Token | will |
Token ID | 481 |
Feature activation | -5.93e+00 |
Pos logit contributions | |
usefulness | +3.190 |
Unch | +3.189 |
IFF | +3.188 |
OR | +3.129 |
lif | +3.044 |
Neg logit contributions | |
azines | -3.481 |
culosis | -3.466 |
excluding | -3.279 |
formance | -3.241 |
Conclusion | -3.110 |
Token | be |
Token ID | 307 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
Unch | +4.015 |
usefulness | +3.974 |
IFF | +3.972 |
OR | +3.934 |
lif | +3.843 |
Neg logit contributions | |
azines | -4.657 |
culosis | -4.625 |
excluding | -4.376 |
formance | -4.305 |
cluding | -4.111 |
Token | just |
Token ID | 655 |
Feature activation | -5.89e+00 |
Pos logit contributions | |
Unch | +7.535 |
lif | +7.384 |
OR | +7.325 |
usefulness | +7.307 |
IFF | +7.189 |
Neg logit contributions | |
culosis | -10.171 |
azines | -10.145 |
excluding | -9.343 |
formance | -9.220 |
ォ | -8.938 |
Token | as |
Token ID | 355 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
IFF | +3.618 |
Unch | +3.617 |
usefulness | +3.570 |
OR | +3.543 |
lif | +3.413 |
Neg logit contributions | |
azines | -4.978 |
culosis | -4.974 |
excluding | -4.724 |
formance | -4.671 |
Conclusion | -4.510 |
Token | long |
Token ID | 890 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
lif | +9.892 |
Unch | +9.469 |
IFF | +9.279 |
usefulness | +9.201 |
OR | +9.060 |
Neg logit contributions | |
culosis | -16.497 |
azines | -15.786 |
excluding | -14.991 |
ォ | -14.393 |
formance | -14.194 |
Token | . |
Token ID | 13 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
Unch | +7.096 |
IFF | +7.076 |
OR | +7.040 |
usefulness | +6.968 |
lif | +6.908 |
Neg logit contributions | |
culosis | -9.780 |
azines | -9.646 |
formance | -8.997 |
excluding | -8.963 |
Conclusion | -8.541 |
Token | Knowing |
Token ID | 29154 |
Feature activation | +8.14e+00 |
Pos logit contributions | |
IFF | +1.393 |
usefulness | +1.382 |
Unch | +1.380 |
OR | +1.358 |
lif | +1.303 |
Neg logit contributions | |
azines | -1.635 |
culosis | -1.624 |
excluding | -1.541 |
formance | -1.522 |
Conclusion | -1.467 |
Token | what |
Token ID | 644 |
Feature activation | +3.55e+00 |
Pos logit contributions | |
azines | +5.967 |
culosis | +5.707 |
excluding | +5.497 |
formance | +5.471 |
Conclusion | +5.361 |
Neg logit contributions | |
IFF | -5.452 |
Unch | -5.326 |
ellig | -5.315 |
usefulness | -5.289 |
OR | -5.177 |
Token | you |
Token ID | 345 |
Feature activation | -4.56e+00 |
Pos logit contributions | |
azines | +2.642 |
culosis | +2.491 |
excluding | +2.420 |
formance | +2.419 |
Conclusion | +2.327 |
Neg logit contributions | |
IFF | -2.542 |
Unch | -2.503 |
usefulness | -2.467 |
OR | -2.446 |
ellig | -2.429 |
Token |
|
Token ID | 198 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
azines | +2.820 |
excluding | +2.764 |
culosis | +2.676 |
formance | +2.647 |
Conclusion | +2.589 |
Neg logit contributions | |
usefulness | -3.214 |
Unch | -3.196 |
IFF | -3.125 |
blance | -3.015 |
ellig | -2.999 |
Token | Put |
Token ID | 11588 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
azines | +2.132 |
culosis | +2.088 |
excluding | +2.034 |
formance | +1.986 |
cluding | +1.907 |
Neg logit contributions | |
Unch | -2.026 |
usefulness | -1.992 |
IFF | -1.975 |
ellig | -1.883 |
OR | -1.882 |
Token | the |
Token ID | 262 |
Feature activation | +8.04e+00 |
Pos logit contributions | |
azines | +8.369 |
culosis | +8.114 |
excluding | +7.807 |
cluding | +7.720 |
formance | +7.504 |
Neg logit contributions | |
IFF | -9.588 |
Unch | -9.336 |
usefulness | -9.314 |
ellig | -8.897 |
OR | -8.868 |
Token | branches |
Token ID | 13737 |
Feature activation | -3.23e-01 |
Pos logit contributions | |
azines | +5.226 |
culosis | +4.982 |
excluding | +4.879 |
culminating | +4.654 |
formance | +4.615 |
Neg logit contributions | |
IFF | -6.245 |
Unch | -6.047 |
OR | -6.038 |
ellig | -6.031 |
usefulness | -5.956 |
Token | in |
Token ID | 287 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
IFF | +0.238 |
usefulness | +0.236 |
Unch | +0.236 |
OR | +0.232 |
ellig | +0.223 |
Neg logit contributions | |
azines | -0.236 |
culosis | -0.234 |
excluding | -0.222 |
formance | -0.218 |
Conclusion | -0.210 |
Token | the |
Token ID | 262 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
azines | +6.228 |
culosis | +5.673 |
formance | +5.659 |
excluding | +5.577 |
Conclusion | +5.563 |
Neg logit contributions | |
IFF | -7.987 |
usefulness | -7.707 |
Unch | -7.659 |
humans | -7.562 |
OR | -7.532 |
Token | water |
Token ID | 1660 |
Feature activation | -4.34e+00 |
Pos logit contributions | |
azines | +8.001 |
excluding | +7.220 |
culosis | +7.216 |
culminating | +7.178 |
Conclusion | +7.078 |
Neg logit contributions | |
IFF | -11.541 |
humans | -11.185 |
ellig | -11.022 |
Unch | -10.980 |
blance | -10.867 |
Token | , |
Token ID | 11 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
IFF | +2.845 |
usefulness | +2.829 |
Unch | +2.824 |
OR | +2.805 |
lif | +2.707 |
Neg logit contributions | |
culosis | -3.479 |
azines | -3.462 |
excluding | -3.282 |
formance | -3.242 |
Conclusion | -3.136 |
Token | then |
Token ID | 788 |
Feature activation | +6.55e+00 |
Pos logit contributions | |
azines | +1.960 |
culosis | +1.905 |
excluding | +1.827 |
formance | +1.771 |
cluding | +1.748 |
Neg logit contributions | |
IFF | -2.137 |
Unch | -2.096 |
usefulness | -2.084 |
OR | -2.025 |
ellig | -2.003 |
Token | boil |
Token ID | 20667 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
azines | +4.522 |
culosis | +4.445 |
excluding | +4.165 |
formance | +4.057 |
cluding | +4.055 |
Neg logit contributions | |
IFF | -4.829 |
Unch | -4.763 |
usefulness | -4.715 |
humans | -4.632 |
OR | -4.573 |
Token | them |
Token ID | 606 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
IFF | +1.207 |
usefulness | +1.195 |
Unch | +1.193 |
OR | +1.174 |
lif | +1.124 |
Neg logit contributions | |
azines | -1.461 |
culosis | -1.448 |
excluding | -1.378 |
formance | -1.359 |
Conclusion | -1.313 |
Token | 03 |
Token ID | 7643 |
Feature activation | +4.06e+00 |
Pos logit contributions | |
azines | +1.729 |
culosis | +1.673 |
excluding | +1.634 |
formance | +1.615 |
cluding | +1.593 |
Neg logit contributions | |
IFF | -1.018 |
usefulness | -0.989 |
Unch | -0.959 |
ellig | -0.936 |
OR | -0.917 |
Token | 30 |
Token ID | 1270 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
azines | +2.949 |
excluding | +2.913 |
culosis | +2.867 |
Conclusion | +2.777 |
formance | +2.776 |
Neg logit contributions | |
IFF | -2.939 |
usefulness | -2.866 |
Unch | -2.854 |
ellig | -2.770 |
OR | -2.717 |
Token | 333 |
Token ID | 23460 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
IFF | +0.071 |
Unch | +0.070 |
usefulness | +0.070 |
OR | +0.068 |
lif | +0.065 |
Neg logit contributions | |
azines | -0.118 |
culosis | -0.117 |
excluding | -0.112 |
formance | -0.111 |
Conclusion | -0.108 |
Token | 68 |
Token ID | 8257 |
Feature activation | +7.80e+00 |
Pos logit contributions | |
IFF | +1.135 |
usefulness | +1.118 |
Unch | +1.116 |
OR | +1.086 |
lif | +1.019 |
Neg logit contributions | |
azines | -2.685 |
culosis | -2.671 |
excluding | -2.573 |
formance | -2.546 |
cluding | -2.476 |
Token | 46 |
Token ID | 3510 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
azines | +4.539 |
excluding | +4.515 |
culosis | +4.324 |
formance | +4.296 |
excluding | +4.130 |
Neg logit contributions | |
Unch | -6.534 |
ivas | -6.366 |
OR | -6.339 |
IFF | -6.328 |
ellig | -6.327 |
Token | . |
Token ID | 13 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
excluding | +6.969 |
azines | +6.744 |
excluding | +6.540 |
culosis | +6.123 |
formance | +6.039 |
Neg logit contributions | |
ivas | -10.959 |
usefulness | -10.379 |
IFF | -10.370 |
Unch | -10.368 |
ellig | -10.320 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
excluding | +8.978 |
azines | +8.871 |
excluding | +8.421 |
Conclusion | +8.316 |
Franch | +8.068 |
Neg logit contributions | |
ivas | -9.003 |
orm | -8.997 |
IFF | -8.792 |
usefulness | -8.691 |
oried | -8.621 |
Token | ( |
Token ID | 7 |
Feature activation | -6.48e+00 |
Pos logit contributions | |
IFF | +1.081 |
usefulness | +1.074 |
Unch | +1.073 |
OR | +1.056 |
lif | +1.016 |
Neg logit contributions | |
azines | -1.134 |
culosis | -1.126 |
excluding | -1.066 |
formance | -1.052 |
Conclusion | -1.011 |
Token | FIL |
Token ID | 46700 |
Feature activation | -5.21e+00 |
Pos logit contributions | |
IFF | +4.467 |
OR | +4.450 |
Unch | +4.350 |
usefulness | +4.320 |
humans | +4.185 |
Neg logit contributions | |
azines | -4.999 |
culosis | -4.986 |
formance | -4.635 |
excluding | -4.597 |
cluding | -4.436 |
Token | ES |
Token ID | 1546 |
Feature activation | -7.28e-01 |
Pos logit contributions | |
IFF | +3.027 |
OR | +2.956 |
usefulness | +2.934 |
Unch | +2.927 |
lif | +2.748 |
Neg logit contributions | |
azines | -4.647 |
culosis | -4.619 |
formance | -4.378 |
excluding | -4.376 |
Conclusion | -4.184 |
Token | ) |
Token ID | 8 |
Feature activation | -5.27e+00 |
Pos logit contributions | |
usefulness | +0.495 |
IFF | +0.495 |
Unch | +0.492 |
OR | +0.480 |
ellig | +0.467 |
Neg logit contributions | |
azines | -0.569 |
culosis | -0.567 |
excluding | -0.540 |
formance | -0.530 |
cluding | -0.514 |
Token | NS |
Token ID | 8035 |
Feature activation | +6.38e+00 |
Pos logit contributions | |
azines | +1.249 |
culosis | +1.239 |
excluding | +1.181 |
formance | +1.157 |
cluding | +1.127 |
Neg logit contributions | |
Unch | -0.992 |
usefulness | -0.992 |
IFF | -0.983 |
OR | -0.941 |
lif | -0.933 |
Token | ) |
Token ID | 8 |
Feature activation | +7.46e+00 |
Pos logit contributions | |
culosis | +4.340 |
azines | +4.337 |
excluding | +4.132 |
formance | +3.952 |
cluding | +3.879 |
Neg logit contributions | |
IFF | -4.775 |
usefulness | -4.763 |
Unch | -4.695 |
ellig | -4.589 |
humans | -4.570 |
Token | for |
Token ID | 329 |
Feature activation | +5.89e+00 |
Pos logit contributions | |
azines | +5.270 |
culosis | +5.063 |
excluding | +5.002 |
excluding | +4.814 |
formance | +4.741 |
Neg logit contributions | |
IFF | -5.375 |
ellig | -5.224 |
usefulness | -5.198 |
Unch | -5.138 |
humans | -5.067 |
Token | 12 |
Token ID | 1105 |
Feature activation | +5.99e+00 |
Pos logit contributions | |
azines | +4.691 |
culosis | +4.638 |
excluding | +4.525 |
formance | +4.335 |
excluding | +4.332 |
Neg logit contributions | |
IFF | -3.729 |
Unch | -3.663 |
ellig | -3.595 |
OR | -3.571 |
usefulness | -3.561 |
Token | weeks |
Token ID | 2745 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
azines | +4.451 |
culosis | +4.280 |
excluding | +4.192 |
formance | +4.028 |
cluding | +4.004 |
Neg logit contributions | |
IFF | -4.226 |
usefulness | -4.175 |
Unch | -4.148 |
OR | -4.024 |
humans | -4.008 |
Token | . |
Token ID | 13 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
azines | +6.101 |
excluding | +5.979 |
excluding | +5.911 |
culminating | +5.872 |
culosis | +5.872 |
Neg logit contributions | |
IFF | -8.015 |
usefulness | -7.901 |
Unch | -7.759 |
humans | -7.710 |
ellig | -7.641 |
Token | In |
Token ID | 554 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
Conclusion | +9.750 |
azines | +9.279 |
excluding | +8.952 |
Month | +8.883 |
culosis | +8.798 |
Neg logit contributions | |
usefulness | -11.450 |
ellig | -11.231 |
IFF | -11.183 |
blance | -10.811 |
imeo | -10.721 |
Token | the |
Token ID | 262 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
azines | +8.794 |
cluding | +8.740 |
culosis | +8.456 |
Conclusion | +8.358 |
formance | +8.323 |
Neg logit contributions | |
IFF | -8.907 |
usefulness | -8.532 |
Unch | -8.469 |
ellig | -8.325 |
OR | -8.119 |
Token | second |
Token ID | 1218 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
azines | +9.264 |
Conclusion | +9.082 |
cluding | +8.756 |
excluding | +8.750 |
excluding | +8.730 |
Neg logit contributions | |
IFF | -10.936 |
ellig | -10.465 |
Unch | -10.161 |
humans | -9.964 |
imeo | -9.822 |
Token | cohort |
Token ID | 20812 |
Feature activation | +4.33e+00 |
Pos logit contributions | |
azines | +5.939 |
culosis | +5.800 |
excluding | +5.596 |
cluding | +5.443 |
excluding | +5.429 |
Neg logit contributions | |
IFF | -8.476 |
Unch | -8.106 |
humans | -7.962 |
ellig | -7.939 |
usefulness | -7.923 |
Token | ( |
Token ID | 357 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
azines | +3.232 |
culosis | +3.195 |
excluding | +3.068 |
formance | +2.968 |
cluding | +2.905 |
Neg logit contributions | |
IFF | -3.081 |
Unch | -3.039 |
usefulness | -3.025 |
OR | -2.964 |
ellig | -2.898 |
Token | , |
Token ID | 11 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
IFF | +0.320 |
usefulness | +0.318 |
Unch | +0.315 |
OR | +0.311 |
ellig | +0.300 |
Neg logit contributions | |
azines | -0.346 |
culosis | -0.344 |
excluding | -0.328 |
formance | -0.322 |
Conclusion | -0.311 |
Token | nor |
Token ID | 4249 |
Feature activation | +5.88e+00 |
Pos logit contributions | |
IFF | +0.129 |
usefulness | +0.127 |
Unch | +0.127 |
OR | +0.125 |
ellig | +0.120 |
Neg logit contributions | |
azines | -0.144 |
culosis | -0.143 |
excluding | -0.136 |
formance | -0.133 |
Conclusion | -0.129 |
Token | will |
Token ID | 481 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
azines | +3.931 |
culosis | +3.919 |
excluding | +3.704 |
formance | +3.616 |
Conclusion | +3.557 |
Neg logit contributions | |
IFF | -4.546 |
usefulness | -4.459 |
OR | -4.396 |
Unch | -4.384 |
ellig | -4.305 |
Token | it |
Token ID | 340 |
Feature activation | +7.85e+00 |
Pos logit contributions | |
azines | +1.071 |
culosis | +1.064 |
excluding | +1.010 |
formance | +0.996 |
Conclusion | +0.960 |
Neg logit contributions | |
IFF | -0.969 |
usefulness | -0.959 |
Unch | -0.954 |
OR | -0.943 |
lif | -0.905 |
Token | be |
Token ID | 307 |
Feature activation | +8.26e+00 |
Pos logit contributions | |
azines | +5.437 |
culosis | +5.398 |
excluding | +5.189 |
formance | +4.994 |
Conclusion | +4.920 |
Neg logit contributions | |
IFF | -5.673 |
usefulness | -5.582 |
Unch | -5.497 |
OR | -5.455 |
humans | -5.393 |
Token | the |
Token ID | 262 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
azines | +5.589 |
culosis | +5.433 |
excluding | +5.381 |
formance | +5.298 |
cluding | +5.154 |
Neg logit contributions | |
IFF | -6.024 |
usefulness | -5.925 |
Unch | -5.822 |
OR | -5.808 |
ellig | -5.801 |
Token | last |
Token ID | 938 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
culminating | +8.647 |
azines | +8.641 |
cluding | +8.279 |
foremost | +8.240 |
excluding | +8.182 |
Neg logit contributions | |
humans | -15.431 |
ellig | -15.395 |
blance | -15.294 |
IFF | -15.225 |
OR | -14.797 |
Token | . |
Token ID | 13 |
Feature activation | -6.18e+00 |
Pos logit contributions | |
Unch | +2.425 |
IFF | +2.424 |
usefulness | +2.412 |
OR | +2.375 |
lif | +2.289 |
Neg logit contributions | |
azines | -2.977 |
culosis | -2.957 |
excluding | -2.785 |
formance | -2.761 |
Conclusion | -2.645 |
Token | The |
Token ID | 383 |
Feature activation | -3.76e+00 |
Pos logit contributions | |
Unch | +4.289 |
IFF | +4.145 |
OR | +4.125 |
usefulness | +4.056 |
ellig | +3.880 |
Neg logit contributions | |
azines | -4.817 |
culosis | -4.807 |
excluding | -4.496 |
formance | -4.475 |
cluding | -4.219 |
Token | Last |
Token ID | 4586 |
Feature activation | -3.24e+00 |
Pos logit contributions | |
usefulness | +2.735 |
IFF | +2.731 |
Unch | +2.724 |
OR | +2.680 |
lif | +2.586 |
Neg logit contributions | |
azines | -2.767 |
culosis | -2.762 |
excluding | -2.603 |
formance | -2.569 |
Conclusion | -2.443 |
Token | T |
Token ID | 309 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
IFF | +2.409 |
Unch | +2.397 |
usefulness | +2.396 |
OR | +2.368 |
lif | +2.274 |
Neg logit contributions | |
azines | -2.355 |
culosis | -2.326 |
excluding | -2.199 |
formance | -2.166 |
cluding | -2.075 |
Token | from |
Token ID | 422 |
Feature activation | +5.07e+00 |
Pos logit contributions | |
IFF | +0.396 |
usefulness | +0.391 |
Unch | +0.391 |
OR | +0.385 |
ellig | +0.370 |
Neg logit contributions | |
azines | -0.435 |
culosis | -0.433 |
excluding | -0.410 |
formance | -0.404 |
cluding | -0.390 |
Token | the |
Token ID | 262 |
Feature activation | +9.26e+00 |
Pos logit contributions | |
azines | +3.642 |
culosis | +3.628 |
excluding | +3.431 |
cluding | +3.366 |
formance | +3.345 |
Neg logit contributions | |
IFF | -3.694 |
usefulness | -3.608 |
Unch | -3.587 |
ellig | -3.495 |
OR | -3.472 |
Token | 1980 |
Token ID | 7169 |
Feature activation | -3.63e+00 |
Pos logit contributions | |
culosis | +5.584 |
azines | +5.535 |
excluding | +5.135 |
cluding | +5.099 |
Conclusion | +5.081 |
Neg logit contributions | |
IFF | -7.391 |
usefulness | -7.083 |
Unch | -7.075 |
ellig | -7.043 |
blance | -7.029 |
Token | s |
Token ID | 82 |
Feature activation | +2.84e+00 |
Pos logit contributions | |
OR | +1.270 |
IFF | +1.263 |
usefulness | +1.240 |
Unch | +1.227 |
lif | +1.157 |
Neg logit contributions | |
azines | -3.985 |
culosis | -3.964 |
excluding | -3.872 |
formance | -3.830 |
Conclusion | -3.712 |
Token | to |
Token ID | 284 |
Feature activation | +6.27e+00 |
Pos logit contributions | |
azines | +2.073 |
culosis | +2.058 |
excluding | +1.952 |
formance | +1.910 |
cluding | +1.853 |
Neg logit contributions | |
IFF | -2.081 |
usefulness | -2.050 |
Unch | -2.043 |
OR | -1.995 |
ellig | -1.932 |
Token | the |
Token ID | 262 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
azines | +4.091 |
culosis | +4.007 |
excluding | +3.806 |
formance | +3.760 |
cluding | +3.722 |
Neg logit contributions | |
IFF | -4.863 |
Unch | -4.799 |
usefulness | -4.797 |
ellig | -4.657 |
OR | -4.619 |
Token | 1990 |
Token ID | 6303 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
azines | +7.326 |
culosis | +6.900 |
cluding | +6.756 |
Conclusion | +6.702 |
culminating | +6.653 |
Neg logit contributions | |
IFF | -11.259 |
Unch | -11.103 |
ellig | -11.034 |
usefulness | -10.916 |
blance | -10.825 |
Token | s |
Token ID | 82 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
Unch | +0.498 |
IFF | +0.497 |
usefulness | +0.495 |
OR | +0.473 |
ellig | +0.448 |
Neg logit contributions | |
azines | -1.145 |
culosis | -1.137 |
excluding | -1.095 |
formance | -1.081 |
Conclusion | -1.054 |
Token | , |
Token ID | 11 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
azines | +1.379 |
culosis | +1.369 |
excluding | +1.300 |
formance | +1.274 |
cluding | +1.236 |
Neg logit contributions | |
IFF | -1.275 |
Unch | -1.255 |
usefulness | -1.255 |
OR | -1.228 |
ellig | -1.183 |
Token | his |
Token ID | 465 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
azines | +0.982 |
culosis | +0.972 |
excluding | +0.923 |
formance | +0.907 |
cluding | +0.879 |
Neg logit contributions | |
IFF | -0.903 |
usefulness | -0.886 |
Unch | -0.885 |
OR | -0.872 |
ellig | -0.838 |
Token | family |
Token ID | 1641 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
azines | +2.610 |
culosis | +2.579 |
excluding | +2.468 |
formance | +2.412 |
Conclusion | +2.376 |
Neg logit contributions | |
IFF | -1.979 |
Unch | -1.906 |
usefulness | -1.870 |
OR | -1.854 |
ellig | -1.807 |
Token | that |
Token ID | 326 |
Feature activation | +2.75e+00 |
Pos logit contributions | |
IFF | +1.280 |
usefulness | +1.270 |
Unch | +1.268 |
OR | +1.249 |
lif | +1.199 |
Neg logit contributions | |
azines | -1.444 |
culosis | -1.436 |
excluding | -1.361 |
formance | -1.342 |
Conclusion | -1.295 |
Token | � |
Token ID | 447 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
culosis | +1.974 |
azines | +1.962 |
excluding | +1.880 |
formance | +1.822 |
Conclusion | +1.792 |
Neg logit contributions | |
IFF | -1.989 |
Unch | -1.978 |
usefulness | -1.976 |
OR | -1.945 |
ellig | -1.923 |
Token | � |
Token ID | 247 |
Feature activation | -6.50e-01 |
Pos logit contributions | |
IFF | +1.664 |
usefulness | +1.656 |
Unch | +1.656 |
OR | +1.627 |
lif | +1.582 |
Neg logit contributions | |
azines | -1.080 |
culosis | -1.067 |
excluding | -1.000 |
formance | -0.979 |
Conclusion | -0.933 |
Token | s |
Token ID | 82 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
IFF | +0.377 |
Unch | +0.373 |
usefulness | +0.372 |
OR | +0.365 |
ellig | +0.348 |
Neg logit contributions | |
azines | -0.578 |
culosis | -0.576 |
excluding | -0.551 |
formance | -0.543 |
Conclusion | -0.527 |
Token | industry |
Token ID | 2831 |
Feature activation | +3.64e+00 |
Pos logit contributions | |
azines | +0.880 |
culosis | +0.877 |
excluding | +0.840 |
formance | +0.819 |
Conclusion | +0.798 |
Neg logit contributions | |
IFF | -0.855 |
Unch | -0.845 |
usefulness | -0.839 |
OR | -0.830 |
ellig | -0.811 |
Token | standard |
Token ID | 3210 |
Feature activation | +4.43e+00 |
Pos logit contributions | |
culosis | +2.620 |
azines | +2.614 |
excluding | +2.508 |
formance | +2.435 |
Conclusion | +2.403 |
Neg logit contributions | |
IFF | -2.607 |
Unch | -2.570 |
usefulness | -2.543 |
OR | -2.525 |
ellig | -2.495 |
Token | and |
Token ID | 290 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
culosis | +3.110 |
azines | +3.077 |
excluding | +2.970 |
formance | +2.894 |
Conclusion | +2.831 |
Neg logit contributions | |
IFF | -3.206 |
Unch | -3.180 |
usefulness | -3.156 |
OR | -3.147 |
ellig | -3.108 |
Token | is |
Token ID | 318 |
Feature activation | +4.52e-01 |
Pos logit contributions | |
azines | +0.154 |
culosis | +0.153 |
excluding | +0.146 |
formance | +0.143 |
Conclusion | +0.139 |
Neg logit contributions | |
IFF | -0.151 |
Unch | -0.149 |
usefulness | -0.148 |
OR | -0.147 |
ellig | -0.142 |
Token | what |
Token ID | 644 |
Feature activation | +4.95e+00 |
Pos logit contributions | |
azines | +0.335 |
culosis | +0.333 |
excluding | +0.318 |
formance | +0.313 |
Conclusion | +0.300 |
Neg logit contributions | |
IFF | -0.325 |
Unch | -0.322 |
usefulness | -0.322 |
OR | -0.317 |
ellig | -0.307 |
Token | investors |
Token ID | 7713 |
Feature activation | +4.77e+00 |
Pos logit contributions | |
azines | +3.548 |
culosis | +3.485 |
excluding | +3.380 |
formance | +3.210 |
Conclusion | +3.188 |
Neg logit contributions | |
Unch | -3.499 |
IFF | -3.494 |
usefulness | -3.478 |
OR | -3.399 |
humans | -3.349 |
Token | will |
Token ID | 481 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
azines | +3.649 |
culosis | +3.643 |
excluding | +3.496 |
formance | +3.386 |
Conclusion | +3.367 |
Neg logit contributions | |
IFF | -3.185 |
Unch | -3.163 |
usefulness | -3.107 |
OR | -3.083 |
humans | -3.028 |
Token | since |
Token ID | 1201 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
IFF | +0.476 |
Unch | +0.470 |
usefulness | +0.469 |
OR | +0.461 |
ellig | +0.444 |
Neg logit contributions | |
azines | -0.554 |
culosis | -0.547 |
excluding | -0.524 |
formance | -0.515 |
Conclusion | -0.502 |
Token | my |
Token ID | 616 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
IFF | +1.984 |
usefulness | +1.976 |
Unch | +1.970 |
OR | +1.940 |
lif | +1.865 |
Neg logit contributions | |
azines | -2.256 |
culosis | -2.249 |
excluding | -2.123 |
formance | -2.100 |
cluding | -2.014 |
Token | hardware |
Token ID | 6890 |
Feature activation | +4.46e+00 |
Pos logit contributions | |
azines | +1.031 |
culosis | +1.010 |
excluding | +0.971 |
formance | +0.955 |
Conclusion | +0.938 |
Neg logit contributions | |
IFF | -0.946 |
Unch | -0.934 |
usefulness | -0.920 |
OR | -0.914 |
ellig | -0.887 |
Token | is |
Token ID | 318 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
azines | +3.091 |
culosis | +2.994 |
excluding | +2.892 |
formance | +2.865 |
Conclusion | +2.846 |
Neg logit contributions | |
IFF | -3.333 |
Unch | -3.287 |
OR | -3.220 |
usefulness | -3.197 |
humans | -3.159 |
Token | almost |
Token ID | 2048 |
Feature activation | +2.54e+00 |
Pos logit contributions | |
IFF | +0.422 |
Unch | +0.416 |
usefulness | +0.415 |
OR | +0.409 |
ellig | +0.393 |
Neg logit contributions | |
azines | -0.460 |
culosis | -0.455 |
excluding | -0.436 |
formance | -0.430 |
Conclusion | -0.416 |
Token | 4 |
Token ID | 604 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
azines | +1.558 |
culosis | +1.541 |
excluding | +1.493 |
formance | +1.463 |
Conclusion | +1.398 |
Neg logit contributions | |
IFF | -2.131 |
usefulness | -2.084 |
Unch | -2.072 |
OR | -2.051 |
ellig | -2.003 |
Token | years |
Token ID | 812 |
Feature activation | -6.08e-02 |
Pos logit contributions | |
azines | +0.917 |
culosis | +0.908 |
excluding | +0.863 |
formance | +0.844 |
Conclusion | +0.821 |
Neg logit contributions | |
usefulness | -0.925 |
IFF | -0.920 |
Unch | -0.918 |
OR | -0.901 |
ellig | -0.873 |
Token | old |
Token ID | 1468 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
IFF | +0.045 |
usefulness | +0.045 |
Unch | +0.045 |
OR | +0.044 |
humans | +0.043 |
Neg logit contributions | |
azines | -0.044 |
culosis | -0.043 |
excluding | -0.041 |
formance | -0.041 |
Conclusion | -0.039 |
Token | and |
Token ID | 290 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
azines | +3.000 |
culosis | +2.940 |
excluding | +2.836 |
formance | +2.795 |
Conclusion | +2.742 |
Neg logit contributions | |
IFF | -3.102 |
Unch | -3.048 |
usefulness | -3.044 |
OR | -3.016 |
ellig | -2.900 |
Token | once |
Token ID | 1752 |
Feature activation | +8.67e+00 |
Pos logit contributions | |
azines | +1.111 |
culosis | +1.087 |
excluding | +1.054 |
formance | +1.031 |
Conclusion | +1.012 |
Neg logit contributions | |
IFF | -1.058 |
Unch | -1.036 |
OR | -1.029 |
usefulness | -1.027 |
ellig | -1.001 |
Token | I |
Token ID | 314 |
Feature activation | +7.84e+00 |
Pos logit contributions | |
azines | +5.878 |
culosis | +5.659 |
excluding | +5.546 |
Conclusion | +5.443 |
formance | +5.427 |
Neg logit contributions | |
IFF | -6.126 |
Unch | -6.036 |
ellig | -5.977 |
usefulness | -5.952 |
OR | -5.946 |
Token | income |
Token ID | 3739 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
IFF | +0.141 |
Unch | +0.140 |
usefulness | +0.139 |
OR | +0.137 |
ellig | +0.133 |
Neg logit contributions | |
azines | -0.126 |
culosis | -0.125 |
excluding | -0.119 |
formance | -0.116 |
Conclusion | -0.112 |
Token | from |
Token ID | 422 |
Feature activation | +5.18e+00 |
Pos logit contributions | |
azines | +2.634 |
culosis | +2.572 |
excluding | +2.519 |
formance | +2.434 |
excluding | +2.358 |
Neg logit contributions | |
IFF | -3.220 |
Unch | -3.167 |
usefulness | -3.157 |
OR | -3.112 |
ellig | -3.059 |
Token | the |
Token ID | 262 |
Feature activation | +2.47e+00 |
Pos logit contributions | |
azines | +3.538 |
culosis | +3.482 |
excluding | +3.380 |
formance | +3.327 |
cluding | +3.210 |
Neg logit contributions | |
IFF | -3.943 |
Unch | -3.783 |
usefulness | -3.741 |
OR | -3.727 |
ellig | -3.726 |
Token | property |
Token ID | 3119 |
Feature activation | +3.97e+00 |
Pos logit contributions | |
azines | +1.607 |
culosis | +1.581 |
excluding | +1.517 |
formance | +1.488 |
Conclusion | +1.429 |
Neg logit contributions | |
IFF | -2.009 |
Unch | -1.963 |
usefulness | -1.943 |
OR | -1.932 |
ellig | -1.897 |
Token | can |
Token ID | 460 |
Feature activation | +6.86e+00 |
Pos logit contributions | |
azines | +2.347 |
culosis | +2.320 |
excluding | +2.240 |
formance | +2.166 |
Conclusion | +2.067 |
Neg logit contributions | |
IFF | -3.381 |
Unch | -3.349 |
usefulness | -3.313 |
OR | -3.265 |
humans | -3.236 |
Token | be |
Token ID | 307 |
Feature activation | +2.89e+00 |
Pos logit contributions | |
azines | +4.652 |
culosis | +4.610 |
excluding | +4.449 |
formance | +4.269 |
cluding | +4.143 |
Neg logit contributions | |
usefulness | -5.110 |
Unch | -5.094 |
IFF | -5.040 |
OR | -4.922 |
humans | -4.841 |
Token | distributed |
Token ID | 9387 |
Feature activation | -2.36e+00 |
Pos logit contributions | |
azines | +1.932 |
culosis | +1.892 |
excluding | +1.863 |
formance | +1.790 |
excluding | +1.753 |
Neg logit contributions | |
IFF | -2.224 |
Unch | -2.196 |
usefulness | -2.189 |
OR | -2.154 |
ellig | -2.097 |
Token | to |
Token ID | 284 |
Feature activation | +4.55e+00 |
Pos logit contributions | |
IFF | +1.608 |
Unch | +1.598 |
usefulness | +1.596 |
OR | +1.572 |
lif | +1.511 |
Neg logit contributions | |
azines | -1.864 |
culosis | -1.854 |
excluding | -1.749 |
formance | -1.733 |
cluding | -1.665 |
Token | members |
Token ID | 1866 |
Feature activation | +3.90e+00 |
Pos logit contributions | |
azines | +3.218 |
culosis | +3.182 |
excluding | +3.032 |
formance | +2.996 |
Conclusion | +2.900 |
Neg logit contributions | |
IFF | -3.398 |
Unch | -3.252 |
usefulness | -3.243 |
OR | -3.182 |
ellig | -3.169 |
Token | , |
Token ID | 11 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
azines | +2.900 |
culosis | +2.851 |
excluding | +2.763 |
formance | +2.687 |
Conclusion | +2.610 |
Neg logit contributions | |
IFF | -2.779 |
usefulness | -2.765 |
Unch | -2.723 |
OR | -2.674 |
ellig | -2.603 |
Token | directors |
Token ID | 13445 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
azines | +1.506 |
culosis | +1.479 |
excluding | +1.431 |
formance | +1.380 |
Conclusion | +1.348 |
Neg logit contributions | |
IFF | -1.487 |
usefulness | -1.441 |
Unch | -1.441 |
OR | -1.420 |
ellig | -1.382 |
Token | further |
Token ID | 2252 |
Feature activation | -6.43e+00 |
Pos logit contributions | |
IFF | +0.770 |
Unch | +0.761 |
usefulness | +0.761 |
OR | +0.751 |
ellig | +0.720 |
Neg logit contributions | |
azines | -0.872 |
culosis | -0.866 |
excluding | -0.823 |
formance | -0.811 |
Conclusion | -0.784 |
Token | bombings |
Token ID | 26579 |
Feature activation | -1.69e-02 |
Pos logit contributions | |
usefulness | +4.294 |
Unch | +4.240 |
IFF | +4.210 |
lif | +4.127 |
OR | +4.060 |
Neg logit contributions | |
azines | -5.113 |
culosis | -5.043 |
excluding | -4.798 |
formance | -4.772 |
cluding | -4.559 |
Token | , |
Token ID | 11 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
IFF | +0.012 |
usefulness | +0.012 |
Unch | +0.012 |
OR | +0.012 |
ellig | +0.011 |
Neg logit contributions | |
azines | -0.013 |
culosis | -0.013 |
excluding | -0.012 |
formance | -0.012 |
cluding | -0.011 |
Token | the |
Token ID | 262 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
azines | +1.283 |
culosis | +1.270 |
excluding | +1.199 |
formance | +1.179 |
cluding | +1.143 |
Neg logit contributions | |
IFF | -1.209 |
Unch | -1.192 |
usefulness | -1.188 |
OR | -1.180 |
ellig | -1.129 |
Token | 2003 |
Token ID | 5816 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
azines | +0.126 |
culosis | +0.125 |
excluding | +0.118 |
formance | +0.116 |
Conclusion | +0.112 |
Neg logit contributions | |
IFF | -0.125 |
Unch | -0.123 |
usefulness | -0.123 |
OR | -0.121 |
ellig | -0.117 |
Token | invasion |
Token ID | 11796 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
usefulness | +1.413 |
IFF | +1.411 |
Unch | +1.408 |
OR | +1.380 |
lif | +1.326 |
Neg logit contributions | |
azines | -2.005 |
culosis | -1.997 |
excluding | -1.906 |
formance | -1.884 |
cluding | -1.808 |
Token | , |
Token ID | 11 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
azines | +2.784 |
culosis | +2.768 |
excluding | +2.623 |
formance | +2.573 |
Conclusion | +2.501 |
Neg logit contributions | |
IFF | -2.737 |
Unch | -2.702 |
usefulness | -2.693 |
OR | -2.658 |
ellig | -2.557 |
Token | and |
Token ID | 290 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
azines | +2.204 |
culosis | +2.178 |
excluding | +2.067 |
formance | +2.032 |
Conclusion | +1.980 |
Neg logit contributions | |
IFF | -2.139 |
Unch | -2.100 |
usefulness | -2.096 |
OR | -2.075 |
ellig | -1.999 |
Token | nine |
Token ID | 5193 |
Feature activation | +4.92e+00 |
Pos logit contributions | |
azines | +1.108 |
culosis | +1.098 |
excluding | +1.041 |
formance | +1.025 |
Conclusion | +0.997 |
Neg logit contributions | |
IFF | -1.009 |
Unch | -0.992 |
usefulness | -0.990 |
OR | -0.980 |
ellig | -0.939 |
Token | years |
Token ID | 812 |
Feature activation | -5.10e+00 |
Pos logit contributions | |
azines | +3.848 |
culosis | +3.729 |
excluding | +3.524 |
formance | +3.478 |
cluding | +3.451 |
Neg logit contributions | |
IFF | -3.371 |
Unch | -3.322 |
usefulness | -3.266 |
OR | -3.263 |
ellig | -3.113 |
Token | of |
Token ID | 286 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
IFF | +3.093 |
usefulness | +3.091 |
Unch | +3.074 |
OR | +3.047 |
lif | +2.977 |
Neg logit contributions | |
azines | -4.310 |
culosis | -4.279 |
excluding | -4.078 |
formance | -4.056 |
cluding | -3.849 |
Token |
|
Token ID | 198 |
Feature activation | +6.88e-01 |
Pos logit contributions | |
azines | +1.700 |
excluding | +1.654 |
culosis | +1.640 |
formance | +1.586 |
Conclusion | +1.562 |
Neg logit contributions | |
usefulness | -1.724 |
Unch | -1.706 |
IFF | -1.673 |
OR | -1.602 |
ellig | -1.594 |
Token | This |
Token ID | 1212 |
Feature activation | +8.83e+00 |
Pos logit contributions | |
azines | +0.509 |
culosis | +0.500 |
excluding | +0.488 |
formance | +0.473 |
Conclusion | +0.455 |
Neg logit contributions | |
Unch | -0.503 |
usefulness | -0.501 |
IFF | -0.492 |
lif | -0.475 |
OR | -0.473 |
Token | kind |
Token ID | 1611 |
Feature activation | +5.18e+00 |
Pos logit contributions | |
azines | +5.651 |
excluding | +5.376 |
culosis | +5.371 |
Conclusion | +5.340 |
excludes | +5.163 |
Neg logit contributions | |
IFF | -6.702 |
OR | -6.405 |
Unch | -6.404 |
usefulness | -6.346 |
ellig | -6.318 |
Token | of |
Token ID | 286 |
Feature activation | +2.81e+00 |
Pos logit contributions | |
azines | +3.452 |
culosis | +3.317 |
excluding | +3.311 |
formance | +3.209 |
Conclusion | +3.204 |
Neg logit contributions | |
Unch | -3.925 |
IFF | -3.893 |
usefulness | -3.890 |
OR | -3.786 |
ellig | -3.696 |
Token | programming |
Token ID | 8300 |
Feature activation | +4.98e+00 |
Pos logit contributions | |
azines | +2.139 |
culosis | +2.091 |
excluding | +2.031 |
formance | +2.002 |
Conclusion | +1.955 |
Neg logit contributions | |
IFF | -1.972 |
Unch | -1.924 |
OR | -1.891 |
usefulness | -1.874 |
ellig | -1.830 |
Token | is |
Token ID | 318 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
azines | +3.463 |
culosis | +3.431 |
excluding | +3.303 |
formance | +3.176 |
excludes | +3.148 |
Neg logit contributions | |
IFF | -3.723 |
Unch | -3.602 |
OR | -3.577 |
usefulness | -3.529 |
ellig | -3.457 |
Token | a |
Token ID | 257 |
Feature activation | +5.23e+00 |
Pos logit contributions | |
azines | +0.809 |
culosis | +0.796 |
excluding | +0.770 |
formance | +0.753 |
Conclusion | +0.730 |
Neg logit contributions | |
IFF | -0.736 |
Unch | -0.722 |
usefulness | -0.719 |
OR | -0.706 |
ellig | -0.686 |
Token | breath |
Token ID | 8033 |
Feature activation | -5.05e+00 |
Pos logit contributions | |
azines | +4.017 |
culosis | +3.985 |
excluding | +3.832 |
formance | +3.809 |
Conclusion | +3.728 |
Neg logit contributions | |
IFF | -3.435 |
Unch | -3.426 |
usefulness | -3.340 |
OR | -3.294 |
ellig | -3.210 |
Token | of |
Token ID | 286 |
Feature activation | +9.63e-01 |
Pos logit contributions | |
OR | +2.978 |
IFF | +2.964 |
Unch | +2.942 |
usefulness | +2.924 |
lif | +2.830 |
Neg logit contributions | |
azines | -4.409 |
culosis | -4.359 |
excluding | -4.130 |
formance | -4.099 |
Conclusion | -3.939 |
Token | fresh |
Token ID | 4713 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
azines | +0.538 |
culosis | +0.528 |
excluding | +0.498 |
formance | +0.486 |
cluding | +0.467 |
Neg logit contributions | |
IFF | -0.870 |
Unch | -0.862 |
usefulness | -0.856 |
OR | -0.851 |
humans | -0.828 |
Token | air |
Token ID | 1633 |
Feature activation | +2.69e-01 |
Pos logit contributions | |
azines | +2.134 |
culosis | +2.115 |
excluding | +1.997 |
formance | +1.947 |
cluding | +1.905 |
Neg logit contributions | |
IFF | -2.100 |
Unch | -2.091 |
usefulness | -2.047 |
OR | -2.025 |
humans | -1.978 |
Token | need |
Token ID | 761 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
IFF | +4.747 |
Unch | +4.721 |
usefulness | +4.697 |
OR | +4.680 |
lif | +4.506 |
Neg logit contributions | |
azines | -4.577 |
culosis | -4.461 |
formance | -4.211 |
excluding | -4.208 |
Conclusion | -3.984 |
Token | not |
Token ID | 407 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
azines | +1.536 |
culosis | +1.515 |
excluding | +1.431 |
formance | +1.399 |
Conclusion | +1.349 |
Neg logit contributions | |
IFF | -1.969 |
Unch | -1.950 |
usefulness | -1.935 |
OR | -1.914 |
ellig | -1.852 |
Token | supply |
Token ID | 5127 |
Feature activation | +2.90e+00 |
Pos logit contributions | |
azines | +1.195 |
culosis | +1.180 |
excluding | +1.123 |
formance | +1.098 |
Conclusion | +1.081 |
Neg logit contributions | |
IFF | -1.238 |
Unch | -1.226 |
usefulness | -1.222 |
OR | -1.206 |
humans | -1.162 |
Token | that |
Token ID | 326 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
azines | +2.159 |
culosis | +2.107 |
excluding | +2.030 |
formance | +1.975 |
cluding | +1.937 |
Neg logit contributions | |
IFF | -2.073 |
Unch | -2.036 |
OR | -2.010 |
usefulness | -2.008 |
ellig | -1.940 |
Token | blank |
Token ID | 9178 |
Feature activation | -9.00e-01 |
Pos logit contributions | |
azines | +0.843 |
culosis | +0.841 |
excluding | +0.796 |
formance | +0.787 |
Conclusion | +0.763 |
Neg logit contributions | |
IFF | -0.817 |
Unch | -0.809 |
usefulness | -0.797 |
OR | -0.796 |
humans | -0.768 |
Token | ! |
Token ID | 0 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
IFF | +0.617 |
Unch | +0.614 |
usefulness | +0.611 |
OR | +0.603 |
lif | +0.577 |
Neg logit contributions | |
azines | -0.701 |
culosis | -0.700 |
excluding | -0.664 |
formance | -0.655 |
Conclusion | -0.633 |
Token | � |
Token ID | 447 |
Feature activation | +4.71e+00 |
Pos logit contributions | |
IFF | +0.692 |
usefulness | +0.687 |
Unch | +0.687 |
OR | +0.676 |
lif | +0.649 |
Neg logit contributions | |
azines | -0.784 |
culosis | -0.779 |
excluding | -0.738 |
formance | -0.729 |
Conclusion | -0.702 |
Token | � |
Token ID | 251 |
Feature activation | +3.88e+00 |
Pos logit contributions | |
azines | +2.440 |
culosis | +2.402 |
excluding | +2.250 |
formance | +2.231 |
Conclusion | +2.211 |
Neg logit contributions | |
IFF | -4.281 |
usefulness | -4.266 |
Unch | -4.258 |
OR | -4.150 |
ellig | -4.113 |
Token |
|
Token ID | 198 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
azines | +3.133 |
culosis | +3.117 |
excluding | +2.966 |
formance | +2.928 |
Conclusion | +2.844 |
Neg logit contributions | |
IFF | -2.531 |
usefulness | -2.524 |
Unch | -2.507 |
OR | -2.460 |
lif | -2.364 |
Token |
|
Token ID | 198 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
azines | +0.091 |
culosis | +0.089 |
excluding | +0.088 |
formance | +0.085 |
Conclusion | +0.083 |
Neg logit contributions | |
usefulness | -0.081 |
Unch | -0.081 |
IFF | -0.080 |
OR | -0.078 |
ellig | -0.076 |
Token | E |
Token ID | 36 |
Feature activation | -3.81e+00 |
Pos logit contributions | |
IFF | +0.881 |
usefulness | +0.876 |
Unch | +0.875 |
OR | +0.858 |
lif | +0.827 |
Neg logit contributions | |
azines | -1.009 |
culosis | -1.002 |
excluding | -0.952 |
formance | -0.939 |
Conclusion | -0.905 |
Token | made |
Token ID | 925 |
Feature activation | +9.06e-01 |
Pos logit contributions | |
culosis | +1.211 |
azines | +1.206 |
excluding | +1.143 |
formance | +1.113 |
Conclusion | +1.091 |
Neg logit contributions | |
IFF | -1.289 |
usefulness | -1.279 |
Unch | -1.262 |
OR | -1.246 |
humans | -1.216 |
Token | his |
Token ID | 465 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
azines | +0.675 |
culosis | +0.671 |
excluding | +0.635 |
formance | +0.628 |
Conclusion | +0.611 |
Neg logit contributions | |
IFF | -0.648 |
usefulness | -0.638 |
Unch | -0.636 |
OR | -0.631 |
ellig | -0.608 |
Token | bid |
Token ID | 8406 |
Feature activation | -5.30e+00 |
Pos logit contributions | |
IFF | +0.728 |
Unch | +0.719 |
usefulness | +0.718 |
OR | +0.710 |
ellig | +0.683 |
Neg logit contributions | |
azines | -0.800 |
culosis | -0.795 |
excluding | -0.754 |
formance | -0.743 |
Conclusion | -0.722 |
Token | for |
Token ID | 329 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
IFF | +2.969 |
Unch | +2.967 |
usefulness | +2.928 |
OR | +2.892 |
lif | +2.763 |
Neg logit contributions | |
azines | -4.791 |
culosis | -4.748 |
excluding | -4.521 |
formance | -4.475 |
Conclusion | -4.326 |
Token | the |
Token ID | 262 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
usefulness | +2.293 |
IFF | +2.279 |
Unch | +2.279 |
OR | +2.244 |
lif | +2.168 |
Neg logit contributions | |
azines | -2.759 |
culosis | -2.737 |
excluding | -2.597 |
formance | -2.573 |
Conclusion | -2.459 |
Token | throne |
Token ID | 19262 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
azines | +0.917 |
culosis | +0.908 |
excluding | +0.861 |
formance | +0.850 |
Conclusion | +0.823 |
Neg logit contributions | |
IFF | -0.899 |
Unch | -0.875 |
usefulness | -0.875 |
OR | -0.867 |
ellig | -0.839 |
Token | in |
Token ID | 287 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
IFF | +1.142 |
usefulness | +1.136 |
Unch | +1.130 |
OR | +1.113 |
lif | +1.070 |
Neg logit contributions | |
azines | -1.230 |
culosis | -1.224 |
excluding | -1.160 |
formance | -1.145 |
Conclusion | -1.104 |
Token | conjunction |
Token ID | 17856 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
usefulness | +2.898 |
IFF | +2.886 |
Unch | +2.883 |
OR | +2.849 |
lif | +2.748 |
Neg logit contributions | |
azines | -3.164 |
culosis | -3.142 |
excluding | -2.960 |
formance | -2.902 |
cluding | -2.782 |
Token | with |
Token ID | 351 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
IFF | +2.011 |
usefulness | +1.996 |
Unch | +1.995 |
OR | +1.965 |
lif | +1.889 |
Neg logit contributions | |
azines | -2.237 |
culosis | -2.222 |
excluding | -2.101 |
formance | -2.075 |
Conclusion | -1.997 |
Token | Edwin |
Token ID | 37016 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
IFF | +1.649 |
usefulness | +1.643 |
Unch | +1.642 |
OR | +1.618 |
lif | +1.557 |
Neg logit contributions | |
azines | -1.784 |
culosis | -1.770 |
excluding | -1.674 |
formance | -1.658 |
Conclusion | -1.585 |
Token | Earl |
Token ID | 21647 |
Feature activation | +4.99e-01 |
Pos logit contributions | |
IFF | +1.599 |
Unch | +1.587 |
usefulness | +1.586 |
OR | +1.563 |
lif | +1.496 |
Neg logit contributions | |
azines | -1.976 |
culosis | -1.960 |
excluding | -1.865 |
formance | -1.841 |
Conclusion | -1.771 |
Token | replacing |
Token ID | 13586 |
Feature activation | -5.42e+00 |
Pos logit contributions | |
IFF | +0.853 |
usefulness | +0.846 |
Unch | +0.845 |
OR | +0.833 |
ellig | +0.801 |
Neg logit contributions | |
azines | -0.851 |
culosis | -0.847 |
excluding | -0.801 |
formance | -0.789 |
Conclusion | -0.760 |
Token | Confederate |
Token ID | 21900 |
Feature activation | +7.02e+00 |
Pos logit contributions | |
usefulness | +3.621 |
Unch | +3.618 |
IFF | +3.611 |
OR | +3.546 |
lif | +3.453 |
Neg logit contributions | |
azines | -4.270 |
culosis | -4.253 |
excluding | -4.004 |
formance | -3.986 |
Conclusion | -3.791 |
Token | General |
Token ID | 3611 |
Feature activation | +7.91e+00 |
Pos logit contributions | |
azines | +5.250 |
culosis | +5.237 |
excluding | +4.937 |
Conclusion | +4.882 |
formance | +4.804 |
Neg logit contributions | |
IFF | -4.722 |
Unch | -4.589 |
OR | -4.579 |
usefulness | -4.544 |
humans | -4.428 |
Token | Edmund |
Token ID | 35646 |
Feature activation | +4.30e+00 |
Pos logit contributions | |
azines | +5.405 |
culosis | +5.380 |
Conclusion | +5.045 |
formance | +5.018 |
excluding | +5.017 |
Neg logit contributions | |
IFF | -5.857 |
usefulness | -5.728 |
OR | -5.693 |
Unch | -5.659 |
humans | -5.508 |
Token | Kirby |
Token ID | 23965 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
culosis | +2.966 |
azines | +2.957 |
excluding | +2.775 |
formance | +2.720 |
Conclusion | +2.693 |
Neg logit contributions | |
IFF | -3.310 |
usefulness | -3.286 |
Unch | -3.263 |
OR | -3.221 |
lif | -3.129 |
Token | Smith |
Token ID | 4176 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
azines | +1.106 |
culosis | +1.096 |
excluding | +1.040 |
formance | +1.032 |
Conclusion | +0.998 |
Neg logit contributions | |
IFF | -1.029 |
usefulness | -1.022 |
Unch | -1.008 |
OR | -0.999 |
humans | -0.961 |
Token | .[ |
Token ID | 3693 |
Feature activation | +1.78e+00 |
Pos logit contributions | |
IFF | +1.407 |
Unch | +1.401 |
usefulness | +1.393 |
OR | +1.377 |
lif | +1.318 |
Neg logit contributions | |
azines | -1.664 |
culosis | -1.652 |
excluding | -1.569 |
formance | -1.544 |
cluding | -1.488 |
Token | 7 |
Token ID | 22 |
Feature activation | -3.22e+00 |
Pos logit contributions | |
azines | +1.629 |
culosis | +1.617 |
excluding | +1.556 |
formance | +1.532 |
cluding | +1.486 |
Neg logit contributions | |
IFF | -0.983 |
Unch | -0.981 |
usefulness | -0.980 |
OR | -0.947 |
lif | -0.913 |
Token | ] |
Token ID | 60 |
Feature activation | +4.20e+00 |
Pos logit contributions | |
IFF | +1.539 |
OR | +1.517 |
Unch | +1.490 |
usefulness | +1.472 |
ellig | +1.400 |
Neg logit contributions | |
azines | -3.183 |
culosis | -3.173 |
excluding | -3.001 |
formance | -2.987 |
Conclusion | -2.894 |
Token |
|
Token ID | 198 |
Feature activation | -9.17e-01 |
Pos logit contributions | |
azines | +3.048 |
culosis | +3.011 |
excluding | +2.883 |
formance | +2.811 |
Conclusion | +2.806 |
Neg logit contributions | |
usefulness | -3.073 |
IFF | -3.024 |
Unch | -2.944 |
OR | -2.919 |
lif | -2.869 |
Token |
|
Token ID | 198 |
Feature activation | +3.17e+00 |
Pos logit contributions | |
usefulness | +0.608 |
IFF | +0.607 |
Unch | +0.606 |
OR | +0.588 |
lif | +0.568 |
Neg logit contributions | |
azines | -0.737 |
culosis | -0.727 |
excluding | -0.701 |
formance | -0.688 |
Conclusion | -0.667 |
Token | , |
Token ID | 11 |
Feature activation | +5.81e+00 |
Pos logit contributions | |
azines | +1.542 |
culosis | +1.521 |
excluding | +1.457 |
formance | +1.438 |
Conclusion | +1.410 |
Neg logit contributions | |
IFF | -1.454 |
Unch | -1.411 |
OR | -1.407 |
usefulness | -1.384 |
humans | -1.369 |
Token | the |
Token ID | 262 |
Feature activation | +5.20e-01 |
Pos logit contributions | |
azines | +4.244 |
culosis | +4.115 |
excluding | +3.990 |
Conclusion | +3.927 |
formance | +3.899 |
Neg logit contributions | |
IFF | -4.115 |
Unch | -3.997 |
usefulness | -3.964 |
OR | -3.929 |
ellig | -3.854 |
Token | interviewer |
Token ID | 39877 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
azines | +0.396 |
culosis | +0.391 |
excluding | +0.372 |
formance | +0.367 |
Conclusion | +0.358 |
Neg logit contributions | |
IFF | -0.369 |
Unch | -0.362 |
usefulness | -0.359 |
OR | -0.357 |
ellig | -0.346 |
Token | explained |
Token ID | 4893 |
Feature activation | -4.86e+00 |
Pos logit contributions | |
IFF | +0.904 |
usefulness | +0.897 |
Unch | +0.896 |
OR | +0.883 |
lif | +0.848 |
Neg logit contributions | |
azines | -0.975 |
culosis | -0.969 |
excluding | -0.917 |
formance | -0.905 |
Conclusion | -0.871 |
Token | that |
Token ID | 326 |
Feature activation | -4.16e+00 |
Pos logit contributions | |
usefulness | +3.024 |
IFF | +3.003 |
Unch | +2.996 |
OR | +2.938 |
lif | +2.847 |
Neg logit contributions | |
azines | -4.099 |
culosis | -4.099 |
excluding | -3.870 |
formance | -3.834 |
cluding | -3.673 |
Token | as |
Token ID | 355 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
usefulness | +2.786 |
Unch | +2.783 |
IFF | +2.779 |
OR | +2.718 |
lif | +2.638 |
Neg logit contributions | |
azines | -3.308 |
culosis | -3.296 |
excluding | -3.112 |
formance | -3.094 |
cluding | -2.948 |
Token | the |
Token ID | 262 |
Feature activation | +3.95e+00 |
Pos logit contributions | |
IFF | +0.200 |
Unch | +0.197 |
usefulness | +0.197 |
OR | +0.194 |
ellig | +0.186 |
Neg logit contributions | |
azines | -0.260 |
culosis | -0.257 |
excluding | -0.246 |
formance | -0.243 |
Conclusion | -0.236 |
Token | user |
Token ID | 2836 |
Feature activation | +5.50e+00 |
Pos logit contributions | |
azines | +3.063 |
culosis | +3.017 |
excluding | +2.911 |
formance | +2.846 |
Conclusion | +2.808 |
Neg logit contributions | |
IFF | -2.637 |
Unch | -2.553 |
OR | -2.520 |
ellig | -2.501 |
usefulness | -2.472 |
Token | base |
Token ID | 8692 |
Feature activation | +5.62e+00 |
Pos logit contributions | |
culosis | +3.739 |
azines | +3.728 |
formance | +3.514 |
excluding | +3.499 |
Conclusion | +3.334 |
Neg logit contributions | |
IFF | -4.186 |
Unch | -4.087 |
usefulness | -4.025 |
OR | -4.022 |
humans | -3.909 |
Token | gets |
Token ID | 3011 |
Feature activation | +6.90e-01 |
Pos logit contributions | |
azines | +3.864 |
culosis | +3.849 |
excluding | +3.633 |
formance | +3.588 |
cluding | +3.466 |
Neg logit contributions | |
IFF | -4.220 |
usefulness | -4.059 |
OR | -4.054 |
Unch | -4.046 |
humans | -3.904 |
Token | large |
Token ID | 1588 |
Feature activation | +3.18e+00 |
Pos logit contributions | |
azines | +0.506 |
culosis | +0.505 |
excluding | +0.477 |
formance | +0.471 |
Conclusion | +0.455 |
Neg logit contributions | |
IFF | -0.502 |
usefulness | -0.493 |
Unch | -0.492 |
OR | -0.488 |
ellig | -0.469 |
Token | often |
Token ID | 1690 |
Feature activation | +4.22e+00 |
Pos logit contributions | |
IFF | +3.754 |
usefulness | +3.723 |
Unch | +3.691 |
OR | +3.658 |
lif | +3.549 |
Neg logit contributions | |
azines | -4.919 |
culosis | -4.877 |
excluding | -4.649 |
formance | -4.606 |
Conclusion | -4.441 |
Token | characterize |
Token ID | 34404 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
azines | +3.015 |
culosis | +2.984 |
excluding | +2.815 |
formance | +2.743 |
Conclusion | +2.706 |
Neg logit contributions | |
IFF | -3.047 |
Unch | -3.026 |
usefulness | -3.002 |
OR | -2.995 |
ellig | -2.865 |
Token | dialog |
Token ID | 17310 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
IFF | +0.908 |
Unch | +0.900 |
usefulness | +0.899 |
OR | +0.888 |
ellig | +0.853 |
Neg logit contributions | |
azines | -0.938 |
culosis | -0.929 |
excluding | -0.881 |
formance | -0.870 |
Conclusion | -0.838 |
Token | ues |
Token ID | 947 |
Feature activation | +2.94e+00 |
Pos logit contributions | |
IFF | +1.112 |
usefulness | +1.103 |
Unch | +1.101 |
OR | +1.082 |
lif | +1.035 |
Neg logit contributions | |
azines | -1.452 |
culosis | -1.443 |
excluding | -1.372 |
formance | -1.356 |
Conclusion | -1.309 |
Token | in |
Token ID | 287 |
Feature activation | -7.27e+00 |
Pos logit contributions | |
azines | +1.993 |
culosis | +1.986 |
excluding | +1.907 |
formance | +1.858 |
Conclusion | +1.816 |
Neg logit contributions | |
IFF | -2.249 |
usefulness | -2.219 |
Unch | -2.208 |
OR | -2.186 |
ellig | -2.100 |
Token | the |
Token ID | 262 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
usefulness | +5.272 |
Unch | +5.232 |
IFF | +5.228 |
OR | +5.112 |
lif | +5.087 |
Neg logit contributions | |
culosis | -5.303 |
azines | -5.272 |
excluding | -4.961 |
formance | -4.892 |
Conclusion | -4.633 |
Token | field |
Token ID | 2214 |
Feature activation | +4.40e+00 |
Pos logit contributions | |
IFF | +0.842 |
usefulness | +0.833 |
Unch | +0.833 |
OR | +0.822 |
ellig | +0.790 |
Neg logit contributions | |
azines | -0.875 |
culosis | -0.864 |
excluding | -0.821 |
formance | -0.812 |
Conclusion | -0.781 |
Token | of |
Token ID | 286 |
Feature activation | -4.55e+00 |
Pos logit contributions | |
azines | +3.263 |
culosis | +3.240 |
excluding | +3.076 |
formance | +3.047 |
Conclusion | +2.944 |
Neg logit contributions | |
IFF | -3.118 |
usefulness | -3.083 |
Unch | -3.061 |
OR | -3.031 |
humans | -2.910 |
Token | di |
Token ID | 2566 |
Feature activation | -5.59e+00 |
Pos logit contributions | |
IFF | +3.128 |
usefulness | +3.127 |
Unch | +3.107 |
OR | +3.053 |
lif | +2.966 |
Neg logit contributions | |
azines | -3.541 |
culosis | -3.529 |
excluding | -3.328 |
formance | -3.282 |
cluding | -3.148 |
Token | as |
Token ID | 292 |
Feature activation | +4.50e+00 |
Pos logit contributions | |
usefulness | +2.121 |
IFF | +2.108 |
Unch | +2.107 |
OR | +2.066 |
ellig | +1.950 |
Neg logit contributions | |
culosis | -6.018 |
azines | -5.956 |
excluding | -5.743 |
formance | -5.624 |
Conclusion | -5.536 |
Token | pora |
Token ID | 38851 |
Feature activation | -4.56e+00 |
Pos logit contributions | |
azines | +1.961 |
culosis | +1.936 |
formance | +1.753 |
excluding | +1.752 |
cluding | +1.656 |
Neg logit contributions | |
IFF | -4.651 |
usefulness | -4.566 |
Unch | -4.547 |
OR | -4.524 |
lif | -4.346 |
Token | the |
Token ID | 262 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
IFF | +0.119 |
usefulness | +0.118 |
Unch | +0.118 |
OR | +0.116 |
ellig | +0.112 |
Neg logit contributions | |
azines | -0.129 |
culosis | -0.128 |
excluding | -0.122 |
formance | -0.120 |
Conclusion | -0.116 |
Token | syntax |
Token ID | 15582 |
Feature activation | -5.11e+00 |
Pos logit contributions | |
IFF | +0.940 |
Unch | +0.927 |
usefulness | +0.925 |
OR | +0.913 |
ellig | +0.881 |
Neg logit contributions | |
azines | -0.982 |
culosis | -0.974 |
excluding | -0.926 |
formance | -0.911 |
Conclusion | -0.882 |
Token | just |
Token ID | 655 |
Feature activation | -5.32e+00 |
Pos logit contributions | |
IFF | +3.497 |
usefulness | +3.493 |
Unch | +3.480 |
OR | +3.422 |
lif | +3.306 |
Neg logit contributions | |
azines | -3.989 |
culosis | -3.973 |
excluding | -3.719 |
formance | -3.704 |
cluding | -3.540 |
Token | as |
Token ID | 355 |
Feature activation | -1.56e+01 |
Pos logit contributions | |
IFF | +3.640 |
usefulness | +3.632 |
Unch | +3.628 |
OR | +3.558 |
lif | +3.447 |
Neg logit contributions | |
azines | -4.150 |
culosis | -4.131 |
excluding | -3.873 |
formance | -3.847 |
Conclusion | -3.686 |
Token | rich |
Token ID | 5527 |
Feature activation | -3.73e+00 |
Pos logit contributions | |
usefulness | +10.175 |
IFF | +10.065 |
lif | +9.862 |
OR | +9.781 |
Unch | +9.729 |
Neg logit contributions | |
culosis | -11.882 |
azines | -11.332 |
formance | -10.374 |
excluding | -10.351 |
Conclusion | -9.803 |
Token | , |
Token ID | 11 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
IFF | +2.411 |
usefulness | +2.386 |
Unch | +2.380 |
OR | +2.354 |
lif | +2.261 |
Neg logit contributions | |
azines | -3.071 |
culosis | -3.055 |
excluding | -2.889 |
formance | -2.861 |
Conclusion | -2.753 |
Token | can |
Token ID | 460 |
Feature activation | +2.95e+00 |
Pos logit contributions | |
usefulness | +7.930 |
lif | +7.715 |
Unch | +7.714 |
IFF | +7.714 |
OR | +7.702 |
Neg logit contributions | |
culosis | -9.034 |
azines | -8.823 |
formance | -8.159 |
excluding | -8.126 |
cluding | -7.705 |
Token | you |
Token ID | 345 |
Feature activation | +5.49e+00 |
Pos logit contributions | |
azines | +2.184 |
culosis | +2.141 |
excluding | +2.056 |
formance | +2.039 |
Conclusion | +1.965 |
Neg logit contributions | |
IFF | -2.101 |
Unch | -2.096 |
usefulness | -2.070 |
OR | -2.022 |
ellig | -1.958 |
Token | have |
Token ID | 423 |
Feature activation | -2.79e+00 |
Pos logit contributions | |
culosis | +3.777 |
azines | +3.768 |
excluding | +3.656 |
Conclusion | +3.621 |
formance | +3.558 |
Neg logit contributions | |
IFF | -3.985 |
Unch | -3.966 |
usefulness | -3.929 |
OR | -3.860 |
humans | -3.759 |
Token | default |
Token ID | 4277 |
Feature activation | -9.56e-01 |
Pos logit contributions | |
IFF | +1.905 |
usefulness | +1.890 |
Unch | +1.888 |
OR | +1.858 |
lif | +1.783 |
Neg logit contributions | |
azines | -2.199 |
culosis | -2.185 |
excluding | -2.072 |
formance | -2.046 |
Conclusion | -1.972 |
Token | values |
Token ID | 3815 |
Feature activation | -3.70e+00 |
Pos logit contributions | |
IFF | +0.653 |
Unch | +0.645 |
usefulness | +0.644 |
OR | +0.632 |
ellig | +0.610 |
Neg logit contributions | |
azines | -0.751 |
culosis | -0.744 |
excluding | -0.710 |
formance | -0.701 |
Conclusion | -0.677 |
Token | my |
Token ID | 616 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
azines | +2.198 |
culosis | +2.151 |
excluding | +2.067 |
formance | +2.029 |
cluding | +1.981 |
Neg logit contributions | |
IFF | -1.806 |
Unch | -1.774 |
usefulness | -1.771 |
OR | -1.749 |
humans | -1.680 |
Token | shoulder |
Token ID | 8163 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
azines | +6.686 |
excluding | +6.185 |
culosis | +5.871 |
culminating | +5.862 |
Conclusion | +5.828 |
Neg logit contributions | |
IFF | -7.544 |
Unch | -7.446 |
humans | -7.418 |
ellig | -7.401 |
OR | -7.332 |
Token | softly |
Token ID | 26625 |
Feature activation | +3.73e+00 |
Pos logit contributions | |
azines | +1.499 |
culosis | +1.466 |
excluding | +1.406 |
formance | +1.386 |
cluding | +1.338 |
Neg logit contributions | |
IFF | -1.441 |
Unch | -1.429 |
usefulness | -1.424 |
OR | -1.409 |
ellig | -1.359 |
Token | and |
Token ID | 290 |
Feature activation | -7.87e+00 |
Pos logit contributions | |
azines | +2.654 |
culosis | +2.606 |
excluding | +2.498 |
formance | +2.447 |
cluding | +2.397 |
Neg logit contributions | |
IFF | -2.769 |
usefulness | -2.762 |
Unch | -2.736 |
OR | -2.702 |
humans | -2.610 |
Token | responds |
Token ID | 20067 |
Feature activation | -1.89e+01 |
Pos logit contributions | |
Unch | +5.131 |
usefulness | +5.126 |
IFF | +5.067 |
OR | +5.034 |
lif | +4.987 |
Neg logit contributions | |
culosis | -6.227 |
azines | -6.169 |
formance | -5.824 |
excluding | -5.815 |
Conclusion | -5.487 |
Token | , |
Token ID | 11 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
lif | +9.698 |
Unch | +9.663 |
usefulness | +9.473 |
IFF | +9.470 |
standoff | +9.369 |
Neg logit contributions | |
culosis | -15.144 |
azines | -15.062 |
formance | -13.886 |
excluding | -13.522 |
cluding | -13.148 |
Token | " |
Token ID | 366 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
Unch | +5.664 |
lif | +5.552 |
IFF | +5.491 |
usefulness | +5.480 |
OR | +5.376 |
Neg logit contributions | |
azines | -12.453 |
culosis | -12.369 |
formance | -11.568 |
excluding | -11.423 |
Conclusion | -11.106 |
Token | You |
Token ID | 1639 |
Feature activation | -9.25e+00 |
Pos logit contributions | |
OR | +6.549 |
IFF | +6.438 |
Unch | +6.009 |
usefulness | +5.992 |
humans | +5.950 |
Neg logit contributions | |
culosis | -8.706 |
azines | -8.383 |
formance | -7.821 |
excluding | -7.655 |
Conclusion | -7.528 |
Token | are |
Token ID | 389 |
Feature activation | -6.39e+00 |
Pos logit contributions | |
Unch | +5.881 |
usefulness | +5.845 |
OR | +5.805 |
IFF | +5.784 |
lif | +5.659 |
Neg logit contributions | |
culosis | -7.441 |
azines | -7.417 |
formance | -6.953 |
excluding | -6.919 |
Conclusion | -6.569 |
Token | such |
Token ID | 884 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
usefulness | +4.443 |
Unch | +4.426 |
IFF | +4.419 |
OR | +4.407 |
lif | +4.255 |
Neg logit contributions | |
culosis | -4.934 |
azines | -4.901 |
formance | -4.535 |
excluding | -4.511 |
Conclusion | -4.294 |
Token | a |
Token ID | 257 |
Feature activation | -6.81e+00 |
Pos logit contributions | |
azines | +0.085 |
culosis | +0.084 |
excluding | +0.080 |
formance | +0.079 |
Conclusion | +0.076 |
Neg logit contributions | |
IFF | -0.090 |
Unch | -0.089 |
usefulness | -0.089 |
OR | -0.088 |
ellig | -0.084 |
Token | the |
Token ID | 262 |
Feature activation | -7.79e+00 |
Pos logit contributions | |
azines | +0.468 |
culosis | +0.465 |
excluding | +0.444 |
formance | +0.434 |
Conclusion | +0.422 |
Neg logit contributions | |
IFF | -0.436 |
Unch | -0.430 |
usefulness | -0.428 |
OR | -0.424 |
ellig | -0.411 |
Token | potential |
Token ID | 2785 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
usefulness | +5.357 |
Unch | +5.230 |
IFF | +5.214 |
OR | +5.168 |
lif | +5.122 |
Neg logit contributions | |
azines | -6.044 |
culosis | -6.005 |
formance | -5.662 |
excluding | -5.614 |
cluding | -5.290 |
Token | for |
Token ID | 329 |
Feature activation | -2.69e+00 |
Pos logit contributions | |
usefulness | +9.772 |
lif | +9.444 |
Unch | +9.295 |
IFF | +9.049 |
OR | +9.042 |
Neg logit contributions | |
azines | -10.344 |
culosis | -10.217 |
formance | -9.674 |
excluding | -9.553 |
cluding | -9.024 |
Token | infrastructure |
Token ID | 6884 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
IFF | +1.930 |
usefulness | +1.922 |
Unch | +1.916 |
OR | +1.886 |
lif | +1.824 |
Neg logit contributions | |
azines | -2.019 |
culosis | -2.002 |
excluding | -1.893 |
formance | -1.870 |
Conclusion | -1.793 |
Token | cost |
Token ID | 1575 |
Feature activation | -3.52e+00 |
Pos logit contributions | |
azines | +1.722 |
culosis | +1.716 |
excluding | +1.635 |
formance | +1.585 |
Conclusion | +1.542 |
Neg logit contributions | |
IFF | -1.865 |
Unch | -1.835 |
OR | -1.808 |
usefulness | -1.804 |
humans | -1.776 |
Token | overrun |
Token ID | 33713 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
IFF | +2.288 |
usefulness | +2.270 |
Unch | +2.265 |
OR | +2.230 |
lif | +2.142 |
Neg logit contributions | |
azines | -2.876 |
culosis | -2.857 |
excluding | -2.714 |
formance | -2.683 |
Conclusion | -2.588 |
Token | s |
Token ID | 82 |
Feature activation | -4.60e+00 |
Pos logit contributions | |
IFF | +4.229 |
usefulness | +4.192 |
OR | +4.138 |
Unch | +4.136 |
lif | +3.988 |
Neg logit contributions | |
azines | -12.261 |
culosis | -12.100 |
excluding | -11.685 |
formance | -11.665 |
cluding | -11.246 |
Token | , |
Token ID | 11 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
IFF | +3.170 |
Unch | +3.145 |
usefulness | +3.140 |
OR | +3.103 |
lif | +2.989 |
Neg logit contributions | |
azines | -3.587 |
culosis | -3.562 |
excluding | -3.354 |
formance | -3.338 |
Conclusion | -3.180 |
Token | future |
Token ID | 2003 |
Feature activation | -6.99e+00 |
Pos logit contributions | |
IFF | +1.394 |
usefulness | +1.383 |
Unch | +1.382 |
OR | +1.362 |
lif | +1.310 |
Neg logit contributions | |
azines | -1.372 |
culosis | -1.363 |
excluding | -1.287 |
formance | -1.269 |
Conclusion | -1.219 |
Token | transport |
Token ID | 4839 |
Feature activation | -8.58e+00 |
Pos logit contributions | |
usefulness | +5.063 |
Unch | +4.955 |
IFF | +4.947 |
lif | +4.882 |
OR | +4.873 |
Neg logit contributions | |
azines | -5.196 |
culosis | -5.132 |
excluding | -4.830 |
formance | -4.815 |
Conclusion | -4.545 |
Token | cost |
Token ID | 1575 |
Feature activation | -5.89e+00 |
Pos logit contributions | |
usefulness | +5.262 |
IFF | +5.145 |
OR | +5.098 |
Unch | +5.093 |
lif | +5.052 |
Neg logit contributions | |
azines | -7.244 |
culosis | -7.087 |
formance | -6.758 |
excluding | -6.729 |
Conclusion | -6.438 |
Token | f |
Token ID | 69 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
azines | +1.828 |
culosis | +1.816 |
excluding | +1.725 |
formance | +1.714 |
cluding | +1.664 |
Neg logit contributions | |
usefulness | -1.692 |
IFF | -1.687 |
Unch | -1.673 |
OR | -1.620 |
humans | -1.589 |
Token | ica |
Token ID | 3970 |
Feature activation | -5.98e+00 |
Pos logit contributions | |
azines | +1.218 |
culosis | +1.210 |
formance | +1.099 |
excluding | +1.082 |
cluding | +1.004 |
Neg logit contributions | |
usefulness | -2.425 |
IFF | -2.412 |
Unch | -2.402 |
OR | -2.352 |
humans | -2.318 |
Token | still |
Token ID | 991 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
Unch | +4.197 |
IFF | +4.191 |
usefulness | +4.152 |
OR | +4.126 |
lif | +3.973 |
Neg logit contributions | |
azines | -4.497 |
culosis | -4.471 |
excluding | -4.232 |
formance | -4.196 |
cluding | -4.021 |
Token | owns |
Token ID | 12216 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
usefulness | +7.514 |
OR | +7.430 |
Unch | +7.423 |
IFF | +7.414 |
lif | +7.198 |
Neg logit contributions | |
azines | -8.768 |
culosis | -8.750 |
formance | -8.210 |
excluding | -8.181 |
cluding | -7.901 |
Token | my |
Token ID | 616 |
Feature activation | +6.25e-01 |
Pos logit contributions | |
IFF | +0.866 |
usefulness | +0.857 |
Unch | +0.857 |
OR | +0.843 |
ellig | +0.810 |
Neg logit contributions | |
azines | -0.962 |
culosis | -0.953 |
excluding | -0.906 |
formance | -0.894 |
Conclusion | -0.863 |
Token | contract |
Token ID | 2775 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
azines | +0.465 |
culosis | +0.458 |
excluding | +0.437 |
formance | +0.430 |
Conclusion | +0.415 |
Neg logit contributions | |
IFF | -0.453 |
Unch | -0.449 |
usefulness | -0.444 |
OR | -0.438 |
humans | -0.427 |
Token | , |
Token ID | 11 |
Feature activation | -6.54e+00 |
Pos logit contributions | |
IFF | +7.241 |
Unch | +7.229 |
usefulness | +7.195 |
OR | +7.188 |
lif | +6.968 |
Neg logit contributions | |
culosis | -9.470 |
azines | -9.364 |
formance | -8.790 |
excluding | -8.681 |
cluding | -8.296 |
Token | � |
Token ID | 447 |
Feature activation | +5.23e+00 |
Pos logit contributions | |
Unch | +4.413 |
usefulness | +4.401 |
IFF | +4.399 |
OR | +4.359 |
lif | +4.226 |
Neg logit contributions | |
culosis | -5.074 |
azines | -5.072 |
excluding | -4.736 |
formance | -4.718 |
cluding | -4.494 |
Token | � |
Token ID | 251 |
Feature activation | +7.50e-02 |
Pos logit contributions | |
azines | +2.603 |
culosis | +2.512 |
excluding | +2.431 |
formance | +2.352 |
Conclusion | +2.299 |
Neg logit contributions | |
Unch | -4.887 |
usefulness | -4.873 |
IFF | -4.859 |
OR | -4.665 |
ellig | -4.660 |
Token | A |
Token ID | 317 |
Feature activation | -6.62e-01 |
Pos logit contributions | |
azines | +0.060 |
culosis | +0.060 |
excluding | +0.058 |
formance | +0.056 |
Conclusion | +0.055 |
Neg logit contributions | |
usefulness | -0.050 |
IFF | -0.050 |
Unch | -0.049 |
OR | -0.048 |
ellig | -0.046 |
Token | du |
Token ID | 646 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
IFF | +0.368 |
usefulness | +0.364 |
Unch | +0.364 |
OR | +0.357 |
lif | +0.339 |
Neg logit contributions | |
azines | -0.605 |
culosis | -0.602 |
excluding | -0.575 |
formance | -0.569 |
Conclusion | -0.551 |
Token | concert |
Token ID | 10010 |
Feature activation | -3.92e+00 |
Pos logit contributions | |
IFF | +6.064 |
Unch | +5.996 |
usefulness | +5.983 |
OR | +5.916 |
lif | +5.779 |
Neg logit contributions | |
azines | -5.790 |
culosis | -5.671 |
excluding | -5.419 |
formance | -5.413 |
Conclusion | -5.154 |
Token | promoter |
Token ID | 32972 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
IFF | +3.139 |
usefulness | +3.109 |
Unch | +3.102 |
OR | +3.079 |
lif | +2.974 |
Neg logit contributions | |
azines | -2.610 |
culosis | -2.589 |
excluding | -2.438 |
formance | -2.405 |
Conclusion | -2.305 |
Token | were |
Token ID | 547 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
azines | +0.103 |
culosis | +0.103 |
excluding | +0.097 |
formance | +0.095 |
cluding | +0.092 |
Neg logit contributions | |
IFF | -0.112 |
usefulness | -0.111 |
Unch | -0.111 |
OR | -0.109 |
ellig | -0.106 |
Token | halted |
Token ID | 27771 |
Feature activation | -4.94e+00 |
Pos logit contributions | |
azines | +1.530 |
culosis | +1.514 |
excluding | +1.453 |
formance | +1.425 |
cluding | +1.380 |
Neg logit contributions | |
IFF | -1.230 |
Unch | -1.217 |
usefulness | -1.215 |
OR | -1.192 |
ellig | -1.147 |
Token | by |
Token ID | 416 |
Feature activation | -6.89e+00 |
Pos logit contributions | |
IFF | +3.395 |
Unch | +3.373 |
usefulness | +3.362 |
OR | +3.317 |
lif | +3.204 |
Neg logit contributions | |
azines | -3.867 |
culosis | -3.835 |
excluding | -3.625 |
formance | -3.590 |
Conclusion | -3.447 |
Token | a |
Token ID | 257 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
Unch | +4.641 |
usefulness | +4.613 |
IFF | +4.605 |
OR | +4.495 |
lif | +4.380 |
Neg logit contributions | |
culosis | -5.394 |
azines | -5.382 |
excluding | -5.128 |
formance | -5.009 |
Conclusion | -4.751 |
Token | judge |
Token ID | 5052 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
Unch | +7.540 |
IFF | +7.452 |
usefulness | +7.388 |
OR | +7.287 |
lif | +7.177 |
Neg logit contributions | |
azines | -9.300 |
culosis | -9.135 |
excluding | -8.884 |
formance | -8.700 |
ォ | -8.100 |
Token | , |
Token ID | 11 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
Unch | +6.902 |
IFF | +6.857 |
OR | +6.823 |
usefulness | +6.740 |
lif | +6.690 |
Neg logit contributions | |
azines | -8.899 |
culosis | -8.791 |
excluding | -8.298 |
formance | -8.173 |
Conclusion | -7.871 |
Token | so |
Token ID | 523 |
Feature activation | +5.37e-01 |
Pos logit contributions | |
azines | +0.074 |
culosis | +0.074 |
excluding | +0.070 |
formance | +0.069 |
Conclusion | +0.066 |
Neg logit contributions | |
IFF | -0.075 |
usefulness | -0.075 |
Unch | -0.074 |
OR | -0.073 |
ellig | -0.071 |
Token | his |
Token ID | 465 |
Feature activation | -4.70e+00 |
Pos logit contributions | |
azines | +0.401 |
culosis | +0.397 |
excluding | +0.377 |
formance | +0.372 |
cluding | +0.359 |
Neg logit contributions | |
IFF | -0.385 |
usefulness | -0.384 |
Unch | -0.380 |
OR | -0.378 |
ellig | -0.363 |
Token | administration |
Token ID | 3662 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
usefulness | +3.360 |
IFF | +3.339 |
Unch | +3.333 |
OR | +3.269 |
lif | +3.175 |
Neg logit contributions | |
azines | -3.532 |
culosis | -3.523 |
excluding | -3.316 |
formance | -3.287 |
Conclusion | -3.133 |