Token | m |
Token ID | 285 |
Feature activation | +4.35e-01 |
Pos logit contributions | |
Synd | +4.086 |
synd | +4.031 |
anda | +3.964 |
�醒 | +3.871 |
Tad | +3.725 |
Neg logit contributions | |
Guilty | -5.675 |
GH | -4.759 |
naire | -4.614 |
NG | -4.606 |
ready | -4.555 |
Token | 2 |
Token ID | 17 |
Feature activation | +8.59e-01 |
Pos logit contributions | |
anda | +5.061 |
Synd | +4.944 |
synd | +4.824 |
utt | +4.641 |
iliate | +4.558 |
Neg logit contributions | |
Guilty | -5.439 |
GH | -4.272 |
naire | -4.166 |
que | -4.148 |
NG | -4.069 |
Token | k |
Token ID | 74 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
anda | +4.232 |
Synd | +4.070 |
nt | +3.947 |
synd | +3.938 |
utt | +3.605 |
Neg logit contributions | |
Guilty | -15.137 |
� | -13.331 |
proble | -13.218 |
� | -13.159 |
GH | -12.948 |
Token | [ |
Token ID | 685 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
Guilty | +2.404 |
GH | +1.969 |
que | +1.934 |
naire | +1.920 |
NG | +1.906 |
Neg logit contributions | |
�醒 | -2.164 |
Synd | -2.141 |
anda | -2.077 |
synd | -2.076 |
ahime | -1.997 |
Token | 10 |
Token ID | 940 |
Feature activation | +5.17e-01 |
Pos logit contributions | |
Synd | +1.143 |
synd | +1.107 |
anda | +1.106 |
�醒 | +1.043 |
utt | +1.022 |
Neg logit contributions | |
Guilty | -1.838 |
GH | -1.524 |
que | -1.502 |
naire | -1.501 |
NG | -1.483 |
Token | : |
Token ID | 25 |
Feature activation | +3.42e+00 |
Pos logit contributions | |
Synd | +3.678 |
synd | +3.493 |
anda | +3.435 |
Tad | +3.165 |
Mutual | +3.132 |
Neg logit contributions | |
Guilty | -8.614 |
GH | -7.196 |
isSpecialOrderable | -7.137 |
� | -7.131 |
naire | -7.117 |
Token | 48 |
Token ID | 2780 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
48 | +14.841 |
anda | +9.038 |
Synd | +7.919 |
nt | +7.761 |
48 | +7.402 |
Neg logit contributions | |
Guilty | -40.388 |
� | -38.226 |
proble | -36.920 |
� | -36.789 |
� | -36.640 |
Token | ] |
Token ID | 60 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
Synd | +1.362 |
synd | +1.299 |
anda | +1.284 |
Tad | +1.176 |
utt | +1.162 |
Neg logit contributions | |
Guilty | -3.085 |
GH | -2.621 |
naire | -2.588 |
que | -2.578 |
NG | -2.557 |
Token | < |
Token ID | 1279 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
Synd | +1.784 |
synd | +1.699 |
anda | +1.658 |
Tad | +1.531 |
�醒 | +1.524 |
Neg logit contributions | |
Guilty | -4.281 |
GH | -3.702 |
naire | -3.647 |
NG | -3.627 |
que | -3.582 |
Token | min |
Token ID | 1084 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
Synd | +1.375 |
anda | +1.344 |
synd | +1.335 |
�醒 | +1.311 |
utt | +1.248 |
Neg logit contributions | |
Guilty | -1.814 |
GH | -1.488 |
que | -1.456 |
naire | -1.456 |
NG | -1.452 |
Token | ion |
Token ID | 295 |
Feature activation | -5.17e-01 |
Pos logit contributions | |
Guilty | +4.521 |
naire | +3.397 |
GH | +3.357 |
que | +3.314 |
NG | +3.278 |
Neg logit contributions | |
�醒 | -8.948 |
Synd | -8.730 |
synd | -8.607 |
Tad | -8.346 |
Mutual | -8.177 |
Token | m |
Token ID | 76 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
Synd | +0.718 |
synd | +0.700 |
anda | +0.693 |
�醒 | +0.689 |
Tad | +0.653 |
Neg logit contributions | |
Guilty | -0.873 |
GH | -0.719 |
naire | -0.701 |
NG | -0.699 |
que | -0.693 |
Token | 2 |
Token ID | 17 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
Guilty | +3.381 |
GH | +2.807 |
que | +2.738 |
NG | +2.725 |
naire | +2.703 |
Neg logit contributions | |
Synd | -3.035 |
�醒 | -3.007 |
synd | -2.939 |
anda | -2.891 |
ahime | -2.770 |
Token | k |
Token ID | 74 |
Feature activation | +9.06e-02 |
Pos logit contributions | |
Synd | +4.072 |
synd | +3.943 |
anda | +3.940 |
�醒 | +3.638 |
ahime | +3.540 |
Neg logit contributions | |
Guilty | -9.445 |
GH | -8.042 |
NG | -7.884 |
naire | -7.856 |
isSpecialOrderable | -7.762 |
Token | [ |
Token ID | 685 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
Synd | +0.962 |
synd | +0.935 |
anda | +0.928 |
�醒 | +0.919 |
Tad | +0.870 |
Neg logit contributions | |
Guilty | -1.243 |
GH | -1.028 |
naire | -1.005 |
NG | -1.003 |
que | -0.994 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.58e-01 |
Pos logit contributions | |
Guilty | +0.274 |
GH | +0.230 |
naire | +0.224 |
NG | +0.224 |
que | +0.223 |
Neg logit contributions | |
Synd | -0.192 |
synd | -0.186 |
�醒 | -0.185 |
anda | -0.184 |
Tad | -0.172 |
Token | : |
Token ID | 25 |
Feature activation | +3.11e+00 |
Pos logit contributions | |
Synd | +3.388 |
synd | +3.227 |
anda | +3.185 |
Tad | +2.930 |
Mutual | +2.905 |
Neg logit contributions | |
Guilty | -7.571 |
GH | -6.328 |
naire | -6.254 |
que | -6.244 |
isSpecialOrderable | -6.227 |
Token | 48 |
Token ID | 2780 |
Feature activation | +9.78e-02 |
Pos logit contributions | |
48 | +15.399 |
anda | +12.394 |
Synd | +11.089 |
nt | +10.289 |
utt | +10.110 |
Neg logit contributions | |
Guilty | -34.531 |
GH | -28.849 |
Reloaded | -27.601 |
proble | -27.468 |
NG | -27.279 |
Token | ] |
Token ID | 60 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
Synd | +0.766 |
synd | +0.734 |
anda | +0.726 |
�醒 | +0.685 |
Tad | +0.666 |
Neg logit contributions | |
Guilty | -1.618 |
GH | -1.379 |
naire | -1.357 |
que | -1.351 |
NG | -1.347 |
Token | < |
Token ID | 1279 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
Synd | +1.800 |
synd | +1.712 |
anda | +1.670 |
Tad | +1.541 |
�醒 | +1.511 |
Neg logit contributions | |
Guilty | -4.318 |
GH | -3.734 |
naire | -3.675 |
NG | -3.656 |
que | -3.618 |
Token | m |
Token ID | 76 |
Feature activation | -5.17e-01 |
Pos logit contributions | |
Synd | +1.558 |
anda | +1.524 |
synd | +1.511 |
�醒 | +1.482 |
utt | +1.414 |
Neg logit contributions | |
Guilty | -2.056 |
GH | -1.684 |
que | -1.649 |
naire | -1.649 |
NG | -1.644 |
Token | ew |
Token ID | 413 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
Guilty | +7.030 |
GH | +6.066 |
NG | +5.960 |
naire | +5.897 |
ready | +5.855 |
Neg logit contributions | |
�醒 | -5.248 |
Synd | -5.108 |
synd | -4.982 |
Mutual | -4.614 |
Tad | -4.592 |
Token | m |
Token ID | 76 |
Feature activation | -2.50e-01 |
Pos logit contributions | |
Synd | +2.290 |
synd | +2.231 |
anda | +2.218 |
�醒 | +2.157 |
ahime | +2.063 |
Neg logit contributions | |
Guilty | -3.149 |
GH | -2.599 |
naire | -2.557 |
NG | -2.531 |
que | -2.525 |
Token | 4 |
Token ID | 19 |
Feature activation | +3.84e-01 |
Pos logit contributions | |
Guilty | +3.141 |
GH | +2.590 |
NG | +2.518 |
que | +2.518 |
naire | +2.498 |
Neg logit contributions | |
Synd | -2.891 |
�醒 | -2.872 |
synd | -2.809 |
anda | -2.762 |
Tad | -2.654 |
Token | k |
Token ID | 74 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
Synd | +3.700 |
synd | +3.602 |
anda | +3.581 |
�醒 | +3.381 |
utt | +3.305 |
Neg logit contributions | |
Guilty | -5.509 |
GH | -4.525 |
naire | -4.489 |
NG | -4.402 |
que | -4.373 |
Token | [ |
Token ID | 685 |
Feature activation | +1.65e-01 |
Pos logit contributions | |
Synd | +1.552 |
synd | +1.511 |
anda | +1.502 |
�醒 | +1.469 |
Tad | +1.406 |
Neg logit contributions | |
Guilty | -1.875 |
GH | -1.537 |
naire | -1.504 |
NG | -1.495 |
que | -1.485 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.81e-01 |
Pos logit contributions | |
Synd | +1.512 |
anda | +1.467 |
synd | +1.465 |
�醒 | +1.358 |
utt | +1.350 |
Neg logit contributions | |
Guilty | -2.497 |
GH | -2.067 |
que | -2.042 |
naire | -2.041 |
NG | -2.009 |
Token | : |
Token ID | 25 |
Feature activation | +2.98e+00 |
Pos logit contributions | |
Synd | +3.505 |
synd | +3.344 |
anda | +3.310 |
Tad | +3.039 |
Mutual | +3.006 |
Neg logit contributions | |
Guilty | -7.972 |
GH | -6.655 |
naire | -6.591 |
que | -6.588 |
isSpecialOrderable | -6.573 |
Token | 48 |
Token ID | 2780 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
48 | +16.255 |
anda | +14.687 |
Synd | +13.348 |
utt | +12.497 |
nt | +12.163 |
Neg logit contributions | |
Guilty | -30.370 |
GH | -25.324 |
NG | -23.816 |
Reloaded | -23.666 |
naire | -23.285 |
Token | ] |
Token ID | 60 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
Synd | +0.854 |
synd | +0.817 |
anda | +0.809 |
�醒 | +0.757 |
Tad | +0.742 |
Neg logit contributions | |
Guilty | -1.820 |
GH | -1.550 |
naire | -1.526 |
que | -1.520 |
NG | -1.514 |
Token | < |
Token ID | 1279 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
Synd | +3.158 |
synd | +3.032 |
anda | +2.988 |
�醒 | +2.936 |
Tad | +2.731 |
Neg logit contributions | |
Guilty | -7.913 |
GH | -6.847 |
naire | -6.777 |
NG | -6.714 |
itcher | -6.587 |
Token | mom |
Token ID | 32542 |
Feature activation | +2.05e-01 |
Pos logit contributions | |
Synd | +1.156 |
anda | +1.128 |
synd | +1.123 |
�醒 | +1.103 |
Tad | +1.048 |
Neg logit contributions | |
Guilty | -1.524 |
GH | -1.252 |
naire | -1.225 |
que | -1.225 |
NG | -1.221 |
Token | per |
Token ID | 525 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
Synd | +1.507 |
anda | +1.475 |
synd | +1.435 |
�醒 | +1.352 |
utt | +1.329 |
Neg logit contributions | |
Guilty | -3.468 |
GH | -2.970 |
naire | -2.895 |
NG | -2.882 |
que | -2.881 |
Token | m |
Token ID | 285 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
Synd | +2.743 |
synd | +2.687 |
anda | +2.653 |
�醒 | +2.587 |
Tad | +2.509 |
Neg logit contributions | |
Guilty | -3.481 |
GH | -2.887 |
naire | -2.811 |
NG | -2.807 |
ready | -2.758 |
Token | 2 |
Token ID | 17 |
Feature activation | +7.16e-01 |
Pos logit contributions | |
Synd | +2.299 |
anda | +2.285 |
synd | +2.243 |
�醒 | +2.146 |
utt | +2.134 |
Neg logit contributions | |
Guilty | -2.129 |
GH | -1.673 |
naire | -1.629 |
que | -1.614 |
NG | -1.610 |
Token | k |
Token ID | 74 |
Feature activation | -8.79e-03 |
Pos logit contributions | |
anda | +4.017 |
Synd | +3.926 |
synd | +3.847 |
nt | +3.611 |
utt | +3.515 |
Neg logit contributions | |
Guilty | -12.461 |
GH | -10.739 |
isSpecialOrderable | -10.429 |
NG | -10.380 |
Reloaded | -10.340 |
Token | [ |
Token ID | 685 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
Guilty | +0.118 |
GH | +0.098 |
naire | +0.095 |
NG | +0.095 |
que | +0.095 |
Neg logit contributions | |
Synd | -0.096 |
synd | -0.093 |
anda | -0.092 |
�醒 | -0.092 |
Tad | -0.087 |
Token | 10 |
Token ID | 940 |
Feature activation | +5.13e-01 |
Pos logit contributions | |
Synd | +1.235 |
synd | +1.197 |
anda | +1.195 |
�醒 | +1.122 |
utt | +1.104 |
Neg logit contributions | |
Guilty | -1.997 |
GH | -1.655 |
naire | -1.633 |
que | -1.632 |
NG | -1.610 |
Token | : |
Token ID | 25 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
Synd | +3.666 |
synd | +3.483 |
anda | +3.431 |
Tad | +3.159 |
Mutual | +3.119 |
Neg logit contributions | |
Guilty | -8.529 |
GH | -7.122 |
isSpecialOrderable | -7.059 |
naire | -7.050 |
que | -7.041 |
Token | 48 |
Token ID | 2780 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
48 | +16.038 |
anda | +14.126 |
Synd | +12.978 |
utt | +12.095 |
nt | +11.889 |
Neg logit contributions | |
Guilty | -30.811 |
GH | -25.751 |
NG | -24.333 |
Reloaded | -24.113 |
naire | -23.802 |
Token | ] |
Token ID | 60 |
Feature activation | +4.21e-01 |
Pos logit contributions | |
Synd | +0.972 |
synd | +0.930 |
anda | +0.919 |
�醒 | +0.853 |
Tad | +0.844 |
Neg logit contributions | |
Guilty | -2.100 |
GH | -1.788 |
naire | -1.761 |
que | -1.754 |
NG | -1.746 |
Token | < |
Token ID | 1279 |
Feature activation | +8.44e-02 |
Pos logit contributions | |
Synd | +2.890 |
synd | +2.774 |
anda | +2.734 |
�醒 | +2.699 |
Tad | +2.500 |
Neg logit contributions | |
Guilty | -7.161 |
GH | -6.185 |
naire | -6.119 |
NG | -6.068 |
que | -5.950 |
Token | qu |
Token ID | 421 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
Synd | +0.887 |
anda | +0.863 |
synd | +0.861 |
�醒 | +0.849 |
Tad | +0.803 |
Neg logit contributions | |
Guilty | -1.167 |
GH | -0.961 |
naire | -0.940 |
que | -0.939 |
NG | -0.937 |
Token | ij |
Token ID | 2926 |
Feature activation | +6.12e-01 |
Pos logit contributions | |
Guilty | +1.726 |
GH | +1.452 |
naire | +1.427 |
NG | +1.420 |
que | +1.412 |
Neg logit contributions | |
Synd | -1.159 |
synd | -1.124 |
�醒 | -1.119 |
anda | -1.095 |
Tad | -1.041 |
Token | / |
Token ID | 1220 |
Feature activation | +3.51e-02 |
Pos logit contributions | |
Synd | +3.510 |
synd | +3.426 |
anda | +3.360 |
�醒 | +3.228 |
Tad | +3.220 |
Neg logit contributions | |
Guilty | -4.345 |
GH | -3.621 |
naire | -3.574 |
NG | -3.531 |
isSpecialOrderable | -3.477 |
Token | clear |
Token ID | 20063 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
Synd | +0.335 |
synd | +0.323 |
anda | +0.321 |
�醒 | +0.318 |
Tad | +0.299 |
Neg logit contributions | |
Guilty | -0.520 |
GH | -0.437 |
naire | -0.428 |
NG | -0.427 |
que | -0.426 |
Token | chat |
Token ID | 8537 |
Feature activation | +5.99e-01 |
Pos logit contributions | |
Synd | +4.326 |
anda | +4.217 |
synd | +4.212 |
�醒 | +3.994 |
utt | +3.927 |
Neg logit contributions | |
Guilty | -5.087 |
GH | -4.183 |
naire | -4.057 |
NG | -4.036 |
que | -3.966 |
Token | [ |
Token ID | 685 |
Feature activation | +3.69e-01 |
Pos logit contributions | |
Synd | +6.272 |
synd | +6.168 |
anda | +6.108 |
�醒 | +5.689 |
ahime | +5.639 |
Neg logit contributions | |
Guilty | -7.703 |
GH | -6.387 |
naire | -6.258 |
isSpecialOrderable | -6.219 |
NG | -6.174 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
Synd | +3.058 |
anda | +3.009 |
synd | +2.956 |
utt | +2.750 |
Tad | +2.688 |
Neg logit contributions | |
Guilty | -5.836 |
que | -4.766 |
naire | -4.754 |
GH | -4.752 |
itcher | -4.657 |
Token | : |
Token ID | 25 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
Synd | +3.412 |
synd | +3.252 |
anda | +3.210 |
Tad | +2.967 |
Mutual | +2.914 |
Neg logit contributions | |
Guilty | -7.626 |
GH | -6.368 |
naire | -6.304 |
que | -6.295 |
isSpecialOrderable | -6.291 |
Token | 47 |
Token ID | 2857 |
Feature activation | +2.73e-01 |
Pos logit contributions | |
48 | +7.482 |
Synd | +6.225 |
Tad | +6.203 |
Teddy | +5.493 |
synd | +5.335 |
Neg logit contributions | |
Guilty | -32.487 |
� | -29.851 |
pse | -29.799 |
proble | -29.625 |
� | -29.614 |
Token | ] |
Token ID | 60 |
Feature activation | +5.82e-01 |
Pos logit contributions | |
Synd | +1.929 |
synd | +1.834 |
anda | +1.811 |
Tad | +1.653 |
utt | +1.623 |
Neg logit contributions | |
Guilty | -4.692 |
GH | -3.989 |
naire | -3.936 |
que | -3.925 |
NG | -3.882 |
Token | < |
Token ID | 1279 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
Synd | +3.953 |
synd | +3.809 |
anda | +3.720 |
�醒 | +3.684 |
Tad | +3.440 |
Neg logit contributions | |
Guilty | -9.661 |
GH | -8.376 |
naire | -8.285 |
NG | -8.202 |
anted | -8.064 |
Token | her |
Token ID | 372 |
Feature activation | +4.72e-02 |
Pos logit contributions | |
Synd | +1.467 |
anda | +1.434 |
synd | +1.425 |
�醒 | +1.400 |
utt | +1.333 |
Neg logit contributions | |
Guilty | -1.896 |
GH | -1.550 |
que | -1.520 |
naire | -1.520 |
NG | -1.512 |
Token | ret |
Token ID | 1186 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
Synd | +0.478 |
synd | +0.464 |
anda | +0.463 |
�醒 | +0.458 |
ahime | +0.431 |
Neg logit contributions | |
Guilty | -0.669 |
GH | -0.558 |
naire | -0.545 |
NG | -0.543 |
que | -0.543 |
Token | 2 |
Token ID | 17 |
Feature activation | +9.18e-01 |
Pos logit contributions | |
Guilty | +0.495 |
GH | +0.395 |
naire | +0.383 |
NG | +0.382 |
que | +0.381 |
Neg logit contributions | |
Synd | -0.550 |
synd | -0.537 |
�醒 | -0.535 |
anda | -0.532 |
Tad | -0.507 |
Token | k |
Token ID | 74 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
Synd | +5.038 |
anda | +4.968 |
synd | +4.919 |
�醒 | +4.416 |
nt | +4.386 |
Neg logit contributions | |
Guilty | -15.150 |
GH | -13.119 |
NG | -12.793 |
isSpecialOrderable | -12.654 |
naire | -12.586 |
Token | lol |
Token ID | 19462 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
Synd | +3.711 |
synd | +3.626 |
anda | +3.573 |
�醒 | +3.435 |
Tad | +3.347 |
Neg logit contributions | |
Guilty | -5.025 |
GH | -4.164 |
naire | -4.083 |
NG | -4.078 |
ready | -4.000 |
Token | [ |
Token ID | 685 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
Synd | +3.713 |
synd | +3.637 |
anda | +3.614 |
�醒 | +3.511 |
Tad | +3.386 |
Neg logit contributions | |
Guilty | -5.229 |
GH | -4.345 |
naire | -4.252 |
NG | -4.249 |
ready | -4.168 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.91e-01 |
Pos logit contributions | |
Synd | +2.335 |
anda | +2.271 |
synd | +2.263 |
utt | +2.086 |
Tad | +2.057 |
Neg logit contributions | |
Guilty | -4.262 |
GH | -3.487 |
que | -3.480 |
naire | -3.475 |
itcher | -3.385 |
Token | : |
Token ID | 25 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
Synd | +3.561 |
synd | +3.391 |
anda | +3.338 |
Tad | +3.075 |
Mutual | +3.034 |
Neg logit contributions | |
Guilty | -8.145 |
GH | -6.807 |
naire | -6.734 |
isSpecialOrderable | -6.728 |
que | -6.723 |
Token | 47 |
Token ID | 2857 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
48 | +7.133 |
Synd | +5.211 |
Tad | +5.097 |
nt | +4.999 |
anda | +4.562 |
Neg logit contributions | |
� | -34.896 |
� | -34.473 |
� | -33.087 |
proble | -32.746 |
Guilty | -32.708 |
Token | ] |
Token ID | 60 |
Feature activation | +4.99e-01 |
Pos logit contributions | |
Synd | +2.014 |
synd | +1.915 |
anda | +1.893 |
Tad | +1.719 |
utt | +1.690 |
Neg logit contributions | |
Guilty | -4.962 |
GH | -4.216 |
naire | -4.161 |
que | -4.149 |
NG | -4.096 |
Token | < |
Token ID | 1279 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
Synd | +3.412 |
synd | +3.283 |
anda | +3.216 |
�醒 | +3.184 |
Tad | +2.945 |
Neg logit contributions | |
Guilty | -8.389 |
GH | -7.263 |
naire | -7.167 |
NG | -7.103 |
itcher | -6.983 |
Token | m |
Token ID | 76 |
Feature activation | -4.86e-01 |
Pos logit contributions | |
Synd | +1.597 |
anda | +1.564 |
synd | +1.551 |
�醒 | +1.524 |
utt | +1.454 |
Neg logit contributions | |
Guilty | -2.063 |
GH | -1.684 |
que | -1.652 |
naire | -1.650 |
NG | -1.643 |
Token | ik |
Token ID | 1134 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
Guilty | +6.611 |
GH | +5.707 |
NG | +5.587 |
naire | +5.524 |
ready | +5.495 |
Neg logit contributions | |
�醒 | -4.952 |
Synd | -4.853 |
synd | -4.715 |
Mutual | -4.389 |
Tad | -4.358 |
Token | l |
Token ID | 300 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
Synd | +2.190 |
synd | +2.144 |
anda | +2.132 |
�醒 | +2.056 |
Tad | +1.985 |
Neg logit contributions | |
Guilty | -2.951 |
GH | -2.427 |
naire | -2.397 |
NG | -2.367 |
que | -2.349 |
Token | ma |
Token ID | 2611 |
Feature activation | -6.83e-01 |
Pos logit contributions | |
Synd | +1.974 |
anda | +1.944 |
synd | +1.919 |
�醒 | +1.853 |
utt | +1.809 |
Neg logit contributions | |
Guilty | -2.830 |
GH | -2.339 |
naire | -2.313 |
NG | -2.286 |
que | -2.266 |
Token | o |
Token ID | 78 |
Feature activation | +4.04e-02 |
Pos logit contributions | |
Guilty | +7.170 |
GH | +5.894 |
que | +5.768 |
ready | +5.483 |
NG | +5.448 |
Neg logit contributions | |
Synd | -8.807 |
�醒 | -8.565 |
synd | -8.492 |
ahime | -8.169 |
Tad | -8.096 |
Token | [ |
Token ID | 685 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
Synd | +0.434 |
synd | +0.423 |
anda | +0.419 |
�醒 | +0.416 |
Tad | +0.394 |
Neg logit contributions | |
Guilty | -0.549 |
GH | -0.454 |
naire | -0.444 |
NG | -0.442 |
que | -0.440 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.96e-01 |
Pos logit contributions | |
Synd | +2.926 |
anda | +2.867 |
synd | +2.832 |
utt | +2.627 |
Tad | +2.573 |
Neg logit contributions | |
Guilty | -5.577 |
naire | -4.554 |
que | -4.552 |
GH | -4.541 |
itcher | -4.443 |
Token | : |
Token ID | 25 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
Synd | +3.582 |
synd | +3.412 |
anda | +3.365 |
Tad | +3.103 |
Mutual | +3.050 |
Neg logit contributions | |
Guilty | -8.230 |
GH | -6.870 |
isSpecialOrderable | -6.806 |
naire | -6.805 |
que | -6.795 |
Token | 47 |
Token ID | 2857 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
48 | +6.921 |
Synd | +5.134 |
Tad | +5.068 |
Teddy | +4.435 |
anda | +4.390 |
Neg logit contributions | |
� | -33.318 |
Guilty | -32.965 |
� | -32.944 |
proble | -31.849 |
� | -31.807 |
Token | ] |
Token ID | 60 |
Feature activation | +5.58e-01 |
Pos logit contributions | |
Synd | +2.309 |
synd | +2.187 |
anda | +2.162 |
Tad | +1.959 |
utt | +1.923 |
Neg logit contributions | |
Guilty | -5.932 |
GH | -5.035 |
naire | -4.977 |
que | -4.966 |
isSpecialOrderable | -4.896 |
Token | < |
Token ID | 1279 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
Synd | +3.773 |
synd | +3.632 |
anda | +3.551 |
�醒 | +3.501 |
Tad | +3.264 |
Neg logit contributions | |
Guilty | -9.331 |
GH | -8.084 |
naire | -7.993 |
NG | -7.916 |
itcher | -7.789 |
Token | rev |
Token ID | 18218 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
Synd | +1.160 |
anda | +1.131 |
synd | +1.126 |
�醒 | +1.108 |
utt | +1.051 |
Neg logit contributions | |
Guilty | -1.510 |
GH | -1.239 |
naire | -1.213 |
que | -1.213 |
NG | -1.208 |
Token | itle |
Token ID | 2578 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
Guilty | +1.860 |
GH | +1.555 |
naire | +1.518 |
NG | +1.512 |
que | +1.504 |
Neg logit contributions | |
Synd | -1.471 |
�醒 | -1.434 |
synd | -1.433 |
anda | -1.406 |
Tad | -1.340 |
Token | > |
Token ID | 29 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
Synd | +3.338 |
anda | +3.252 |
synd | +3.237 |
�醒 | +3.011 |
utt | +2.945 |
Neg logit contributions | |
Guilty | -6.261 |
GH | -5.253 |
que | -5.189 |
naire | -5.134 |
NG | -5.105 |
Token | H |
Token ID | 367 |
Feature activation | +8.40e-02 |
Pos logit contributions | |
Synd | +3.411 |
synd | +3.327 |
anda | +3.265 |
�醒 | +3.140 |
Tad | +3.119 |
Neg logit contributions | |
Guilty | -4.268 |
GH | -3.556 |
naire | -3.504 |
NG | -3.463 |
isSpecialOrderable | -3.405 |
Token | aha |
Token ID | 12236 |
Feature activation | -3.29e-02 |
Pos logit contributions | |
Synd | +0.913 |
anda | +0.890 |
synd | +0.888 |
�醒 | +0.873 |
utt | +0.831 |
Neg logit contributions | |
Guilty | -1.130 |
GH | -0.921 |
naire | -0.911 |
que | -0.902 |
NG | -0.897 |
Token | [ |
Token ID | 685 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
Guilty | +0.445 |
GH | +0.369 |
naire | +0.359 |
NG | +0.358 |
que | +0.358 |
Neg logit contributions | |
Synd | -0.354 |
synd | -0.344 |
�醒 | -0.342 |
anda | -0.342 |
ahime | -0.321 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.59e-01 |
Pos logit contributions | |
Synd | +2.608 |
anda | +2.550 |
synd | +2.520 |
utt | +2.345 |
Tad | +2.300 |
Neg logit contributions | |
Guilty | -4.863 |
que | -3.963 |
naire | -3.958 |
GH | -3.946 |
itcher | -3.865 |
Token | : |
Token ID | 25 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
Synd | +3.381 |
synd | +3.222 |
anda | +3.188 |
Tad | +2.943 |
utt | +2.897 |
Neg logit contributions | |
Guilty | -7.571 |
GH | -6.316 |
naire | -6.252 |
que | -6.249 |
isSpecialOrderable | -6.227 |
Token | 47 |
Token ID | 2857 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
48 | +6.817 |
Synd | +5.203 |
Tad | +5.191 |
Teddy | +4.741 |
anda | +4.320 |
Neg logit contributions | |
Guilty | -32.779 |
� | -32.200 |
� | -31.831 |
proble | -31.206 |
pse | -30.900 |
Token | ] |
Token ID | 60 |
Feature activation | +5.45e-01 |
Pos logit contributions | |
Synd | +1.808 |
synd | +1.720 |
anda | +1.703 |
Tad | +1.552 |
utt | +1.528 |
Neg logit contributions | |
Guilty | -4.337 |
GH | -3.685 |
naire | -3.634 |
que | -3.626 |
NG | -3.586 |
Token | < |
Token ID | 1279 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
Synd | +3.708 |
synd | +3.564 |
anda | +3.506 |
�醒 | +3.466 |
Tad | +3.234 |
Neg logit contributions | |
Guilty | -9.112 |
GH | -7.881 |
naire | -7.803 |
NG | -7.717 |
itcher | -7.590 |
Token | t |
Token ID | 83 |
Feature activation | -2.19e-01 |
Pos logit contributions | |
Synd | +1.379 |
anda | +1.348 |
synd | +1.339 |
�醒 | +1.317 |
utt | +1.253 |
Neg logit contributions | |
Guilty | -1.789 |
GH | -1.462 |
que | -1.435 |
naire | -1.434 |
NG | -1.426 |
Token | oxic |
Token ID | 18047 |
Feature activation | -8.78e-02 |
Pos logit contributions | |
Guilty | +2.946 |
GH | +2.490 |
NG | +2.418 |
naire | +2.399 |
que | +2.396 |
Neg logit contributions | |
Synd | -2.356 |
�醒 | -2.315 |
synd | -2.280 |
anda | -2.200 |
Mutual | -2.139 |
Token | m |
Token ID | 285 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
Synd | +2.602 |
synd | +2.548 |
anda | +2.521 |
�醒 | +2.462 |
Tad | +2.379 |
Neg logit contributions | |
Guilty | -3.320 |
GH | -2.757 |
naire | -2.688 |
NG | -2.676 |
ready | -2.632 |
Token | 2 |
Token ID | 17 |
Feature activation | +7.66e-01 |
Pos logit contributions | |
Synd | +3.325 |
anda | +3.319 |
synd | +3.237 |
�醒 | +3.155 |
ahime | +3.085 |
Neg logit contributions | |
Guilty | -3.153 |
GH | -2.473 |
naire | -2.421 |
que | -2.398 |
NG | -2.372 |
Token | k |
Token ID | 74 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
anda | +4.096 |
Synd | +3.956 |
synd | +3.833 |
nt | +3.738 |
utt | +3.560 |
Neg logit contributions | |
Guilty | -13.452 |
GH | -11.521 |
� | -11.470 |
proble | -11.438 |
� | -11.337 |
Token | [ |
Token ID | 685 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
Guilty | +1.825 |
GH | +1.497 |
que | +1.467 |
naire | +1.459 |
NG | +1.450 |
Neg logit contributions | |
Synd | -1.568 |
�醒 | -1.562 |
synd | -1.521 |
anda | -1.519 |
ahime | -1.449 |
Token | 10 |
Token ID | 940 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
Synd | +1.585 |
anda | +1.539 |
synd | +1.538 |
utt | +1.418 |
Tad | +1.411 |
Neg logit contributions | |
Guilty | -2.670 |
GH | -2.202 |
que | -2.181 |
naire | -2.179 |
NG | -2.140 |
Token | : |
Token ID | 25 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
Synd | +2.927 |
synd | +2.796 |
anda | +2.758 |
Tad | +2.552 |
Mutual | +2.518 |
Neg logit contributions | |
Guilty | -6.110 |
GH | -5.116 |
naire | -5.048 |
que | -5.039 |
NG | -4.988 |
Token | 47 |
Token ID | 2857 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
48 | +7.326 |
nt | +5.280 |
Synd | +5.279 |
Tad | +5.157 |
anda | +4.707 |
Neg logit contributions | |
� | -34.903 |
� | -34.481 |
� | -33.038 |
proble | -32.594 |
Guilty | -32.439 |
Token | ] |
Token ID | 60 |
Feature activation | +4.96e-01 |
Pos logit contributions | |
Synd | +1.076 |
synd | +1.030 |
anda | +1.020 |
�醒 | +0.941 |
Tad | +0.933 |
Neg logit contributions | |
Guilty | -2.358 |
GH | -2.009 |
naire | -1.975 |
que | -1.970 |
NG | -1.959 |
Token | < |
Token ID | 1279 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
Synd | +3.411 |
synd | +3.274 |
anda | +3.220 |
�醒 | +3.178 |
Tad | +2.952 |
Neg logit contributions | |
Guilty | -8.332 |
GH | -7.216 |
naire | -7.122 |
NG | -7.058 |
itcher | -6.922 |
Token | kw |
Token ID | 46265 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
Synd | +1.388 |
anda | +1.357 |
synd | +1.347 |
�醒 | +1.323 |
utt | +1.260 |
Neg logit contributions | |
Guilty | -1.823 |
GH | -1.494 |
naire | -1.465 |
que | -1.464 |
NG | -1.458 |
Token | ij |
Token ID | 2926 |
Feature activation | +4.04e-01 |
Pos logit contributions | |
Guilty | +2.357 |
GH | +1.978 |
NG | +1.934 |
naire | +1.929 |
que | +1.915 |
Neg logit contributions | |
Synd | -1.811 |
�醒 | -1.770 |
synd | -1.758 |
anda | -1.713 |
Tad | -1.644 |
Token | m |
Token ID | 285 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
Synd | +4.109 |
synd | +4.037 |
anda | +3.988 |
�醒 | +3.850 |
Tad | +3.768 |
Neg logit contributions | |
Guilty | -5.447 |
GH | -4.534 |
naire | -4.425 |
NG | -4.399 |
ready | -4.341 |
Token | 2 |
Token ID | 17 |
Feature activation | +7.68e-01 |
Pos logit contributions | |
Synd | +2.980 |
anda | +2.980 |
synd | +2.902 |
utt | +2.773 |
ahime | +2.758 |
Neg logit contributions | |
Guilty | -2.851 |
GH | -2.236 |
naire | -2.186 |
que | -2.165 |
NG | -2.148 |
Token | k |
Token ID | 74 |
Feature activation | -8.05e-02 |
Pos logit contributions | |
anda | +4.148 |
Synd | +4.012 |
synd | +3.912 |
nt | +3.754 |
utt | +3.592 |
Neg logit contributions | |
Guilty | -13.431 |
GH | -11.552 |
isSpecialOrderable | -11.271 |
proble | -11.244 |
� | -11.213 |
Token | [ |
Token ID | 685 |
Feature activation | +2.12e-01 |
Pos logit contributions | |
Guilty | +1.067 |
GH | +0.879 |
que | +0.857 |
naire | +0.856 |
NG | +0.852 |
Neg logit contributions | |
Synd | -0.892 |
�醒 | -0.875 |
synd | -0.866 |
anda | -0.862 |
ahime | -0.817 |
Token | 10 |
Token ID | 940 |
Feature activation | +3.99e-01 |
Pos logit contributions | |
Synd | +1.886 |
anda | +1.832 |
synd | +1.830 |
utt | +1.689 |
Tad | +1.674 |
Neg logit contributions | |
Guilty | -3.285 |
GH | -2.699 |
que | -2.683 |
naire | -2.679 |
NG | -2.623 |
Token | : |
Token ID | 25 |
Feature activation | +2.21e+00 |
Pos logit contributions | |
Synd | +3.068 |
synd | +2.928 |
anda | +2.884 |
Tad | +2.669 |
Mutual | +2.635 |
Neg logit contributions | |
Guilty | -6.516 |
GH | -5.453 |
naire | -5.389 |
que | -5.379 |
isSpecialOrderable | -5.329 |
Token | 47 |
Token ID | 2857 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
48 | +7.061 |
Synd | +5.208 |
Tad | +5.016 |
nt | +4.923 |
anda | +4.516 |
Neg logit contributions | |
� | -34.466 |
� | -34.008 |
� | -32.701 |
Guilty | -32.527 |
proble | -32.343 |
Token | ] |
Token ID | 60 |
Feature activation | +4.39e-01 |
Pos logit contributions | |
Synd | +1.261 |
synd | +1.205 |
anda | +1.193 |
Tad | +1.090 |
�醒 | +1.082 |
Neg logit contributions | |
Guilty | -2.821 |
GH | -2.401 |
naire | -2.364 |
que | -2.357 |
NG | -2.340 |
Token | < |
Token ID | 1279 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
Synd | +3.085 |
synd | +2.965 |
anda | +2.914 |
�醒 | +2.892 |
Tad | +2.679 |
Neg logit contributions | |
Guilty | -7.365 |
GH | -6.364 |
naire | -6.280 |
NG | -6.226 |
que | -6.108 |
Token | sn |
Token ID | 16184 |
Feature activation | +2.36e-02 |
Pos logit contributions | |
Synd | +1.275 |
anda | +1.245 |
synd | +1.238 |
�醒 | +1.217 |
utt | +1.157 |
Neg logit contributions | |
Guilty | -1.674 |
GH | -1.372 |
naire | -1.345 |
que | -1.345 |
NG | -1.338 |
Token | iping |
Token ID | 34690 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
Synd | +0.266 |
synd | +0.259 |
anda | +0.258 |
�醒 | +0.256 |
Tad | +0.242 |
Neg logit contributions | |
Guilty | -0.309 |
GH | -0.253 |
naire | -0.247 |
NG | -0.246 |
que | -0.246 |
Token | w |
Token ID | 86 |
Feature activation | -2.60e-01 |
Pos logit contributions | |
Guilty | +2.815 |
GH | +2.371 |
NG | +2.321 |
naire | +2.313 |
que | +2.300 |
Neg logit contributions | |
Synd | -2.046 |
�醒 | -1.994 |
synd | -1.978 |
anda | -1.932 |
Tad | -1.840 |
Token | > |
Token ID | 29 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
Guilty | +3.540 |
GH | +2.973 |
NG | +2.921 |
naire | +2.909 |
que | +2.895 |
Neg logit contributions | |
Synd | -2.699 |
�醒 | -2.652 |
synd | -2.607 |
anda | -2.521 |
Tad | -2.456 |
Token | save |
Token ID | 3613 |
Feature activation | -3.04e-01 |
Pos logit contributions | |
Synd | +3.776 |
synd | +3.688 |
anda | +3.613 |
�醒 | +3.462 |
Tad | +3.457 |
Neg logit contributions | |
Guilty | -4.651 |
GH | -3.874 |
naire | -3.821 |
NG | -3.775 |
isSpecialOrderable | -3.712 |
Token | [ |
Token ID | 685 |
Feature activation | +3.03e-01 |
Pos logit contributions | |
Guilty | +4.102 |
GH | +3.394 |
que | +3.387 |
NG | +3.350 |
naire | +3.290 |
Neg logit contributions | |
Synd | -3.210 |
�醒 | -3.198 |
synd | -3.098 |
anda | -3.084 |
ahime | -2.904 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.67e-01 |
Pos logit contributions | |
Synd | +2.607 |
anda | +2.566 |
synd | +2.522 |
utt | +2.340 |
Tad | +2.299 |
Neg logit contributions | |
Guilty | -4.729 |
GH | -3.869 |
que | -3.851 |
naire | -3.848 |
NG | -3.769 |
Token | : |
Token ID | 25 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
Synd | +3.424 |
synd | +3.268 |
anda | +3.231 |
Tad | +2.982 |
utt | +2.933 |
Neg logit contributions | |
Guilty | -7.704 |
GH | -6.429 |
naire | -6.370 |
isSpecialOrderable | -6.353 |
que | -6.349 |
Token | 47 |
Token ID | 2857 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
48 | +6.782 |
Synd | +5.032 |
Tad | +5.031 |
nt | +4.676 |
Teddy | +4.510 |
Neg logit contributions | |
� | -34.193 |
� | -33.859 |
� | -32.652 |
Guilty | -32.613 |
proble | -32.498 |
Token | ] |
Token ID | 60 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
Synd | +1.911 |
synd | +1.816 |
anda | +1.798 |
Tad | +1.640 |
utt | +1.608 |
Neg logit contributions | |
Guilty | -4.643 |
GH | -3.945 |
naire | -3.894 |
que | -3.880 |
NG | -3.839 |
Token | < |
Token ID | 1279 |
Feature activation | +8.89e-02 |
Pos logit contributions | |
Synd | +3.682 |
synd | +3.552 |
anda | +3.495 |
�醒 | +3.450 |
Tad | +3.201 |
Neg logit contributions | |
Guilty | -9.183 |
GH | -7.938 |
naire | -7.858 |
NG | -7.782 |
itcher | -7.652 |
Token | f |
Token ID | 69 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
Synd | +0.936 |
anda | +0.911 |
synd | +0.909 |
�醒 | +0.895 |
Tad | +0.848 |
Neg logit contributions | |
Guilty | -1.226 |
GH | -1.009 |
naire | -0.987 |
que | -0.986 |
NG | -0.983 |
Token | gt |
Token ID | 13655 |
Feature activation | -8.85e-02 |
Pos logit contributions | |
Guilty | +3.543 |
GH | +2.998 |
naire | +2.905 |
NG | +2.897 |
que | +2.868 |
Neg logit contributions | |
Synd | -2.779 |
�醒 | -2.716 |
synd | -2.673 |
anda | -2.590 |
Tad | -2.500 |
Token | lol |
Token ID | 19462 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
Synd | +3.763 |
synd | +3.666 |
anda | +3.592 |
�醒 | +3.440 |
Tad | +3.437 |
Neg logit contributions | |
Guilty | -4.623 |
GH | -3.861 |
naire | -3.807 |
NG | -3.756 |
isSpecialOrderable | -3.704 |
Token | j |
Token ID | 474 |
Feature activation | +3.57e-01 |
Pos logit contributions | |
Synd | +4.012 |
synd | +3.937 |
anda | +3.891 |
�醒 | +3.747 |
Tad | +3.673 |
Neg logit contributions | |
Guilty | -5.256 |
GH | -4.375 |
naire | -4.260 |
NG | -4.238 |
ready | -4.184 |
Token | ason |
Token ID | 888 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
anda | +4.562 |
Synd | +4.530 |
synd | +4.437 |
�醒 | +4.299 |
utt | +4.289 |
Neg logit contributions | |
Guilty | -4.000 |
GH | -3.055 |
naire | -3.045 |
que | -2.978 |
NG | -2.939 |
Token | [ |
Token ID | 685 |
Feature activation | +5.24e-02 |
Pos logit contributions | |
Guilty | +2.570 |
GH | +2.110 |
que | +2.073 |
NG | +2.055 |
naire | +2.055 |
Neg logit contributions | |
Synd | -2.181 |
�醒 | -2.122 |
synd | -2.104 |
anda | -2.092 |
ahime | -1.991 |
Token | 10 |
Token ID | 940 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
Synd | +0.506 |
synd | +0.491 |
anda | +0.488 |
�醒 | +0.474 |
Tad | +0.454 |
Neg logit contributions | |
Guilty | -0.770 |
GH | -0.641 |
naire | -0.629 |
que | -0.628 |
NG | -0.624 |
Token | : |
Token ID | 25 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
Synd | +2.978 |
synd | +2.859 |
anda | +2.821 |
Tad | +2.601 |
utt | +2.578 |
Neg logit contributions | |
Guilty | -6.305 |
GH | -5.270 |
naire | -5.199 |
que | -5.196 |
isSpecialOrderable | -5.146 |
Token | 47 |
Token ID | 2857 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
48 | +6.526 |
Synd | +4.822 |
Tad | +4.534 |
Teddy | +4.100 |
synd | +4.065 |
Neg logit contributions | |
� | -33.501 |
� | -33.111 |
Guilty | -33.107 |
proble | -32.021 |
� | -31.969 |
Token | ] |
Token ID | 60 |
Feature activation | +4.85e-01 |
Pos logit contributions | |
Synd | +2.132 |
synd | +2.030 |
anda | +2.003 |
Tad | +1.817 |
utt | +1.794 |
Neg logit contributions | |
Guilty | -5.354 |
GH | -4.545 |
naire | -4.483 |
que | -4.476 |
NG | -4.413 |
Token | < |
Token ID | 1279 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
Synd | +3.341 |
synd | +3.222 |
anda | +3.145 |
�醒 | +3.121 |
Tad | +2.888 |
Neg logit contributions | |
Guilty | -8.160 |
GH | -7.063 |
naire | -6.973 |
NG | -6.899 |
itcher | -6.784 |
Token | fen |
Token ID | 41037 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
Synd | +1.308 |
anda | +1.277 |
synd | +1.270 |
�醒 | +1.248 |
utt | +1.187 |
Neg logit contributions | |
Guilty | -1.699 |
GH | -1.391 |
que | -1.363 |
naire | -1.363 |
NG | -1.357 |
Token | ren |
Token ID | 918 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
Synd | +1.524 |
anda | +1.491 |
synd | +1.480 |
�醒 | +1.453 |
ahime | +1.389 |
Neg logit contributions | |
Guilty | -1.879 |
GH | -1.539 |
NG | -1.500 |
naire | -1.500 |
que | -1.494 |
Token | m |
Token ID | 285 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
Synd | +3.411 |
synd | +3.343 |
anda | +3.305 |
�醒 | +3.203 |
Tad | +3.125 |
Neg logit contributions | |
Guilty | -4.398 |
GH | -3.649 |
naire | -3.562 |
NG | -3.543 |
ready | -3.491 |
Token | 2 |
Token ID | 17 |
Feature activation | +6.84e-01 |
Pos logit contributions | |
Synd | +3.220 |
anda | +3.215 |
synd | +3.133 |
�醒 | +3.047 |
ahime | +2.994 |
Neg logit contributions | |
Guilty | -3.062 |
GH | -2.398 |
naire | -2.348 |
que | -2.327 |
NG | -2.303 |
Token | k |
Token ID | 74 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
anda | +3.955 |
Synd | +3.895 |
synd | +3.810 |
nt | +3.519 |
utt | +3.454 |
Neg logit contributions | |
Guilty | -11.851 |
GH | -10.235 |
isSpecialOrderable | -9.907 |
NG | -9.899 |
Reloaded | -9.809 |
Token | [ |
Token ID | 685 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
Synd | +2.486 |
synd | +2.420 |
anda | +2.398 |
�醒 | +2.360 |
Tad | +2.248 |
Neg logit contributions | |
Guilty | -3.419 |
GH | -2.838 |
NG | -2.784 |
naire | -2.781 |
ready | -2.736 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.18e-01 |
Pos logit contributions | |
Synd | +1.796 |
anda | +1.744 |
synd | +1.743 |
utt | +1.609 |
Tad | +1.595 |
Neg logit contributions | |
Guilty | -3.094 |
GH | -2.544 |
que | -2.526 |
naire | -2.523 |
NG | -2.473 |
Token | : |
Token ID | 25 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
Synd | +3.182 |
synd | +3.037 |
anda | +2.989 |
Tad | +2.763 |
Mutual | +2.727 |
Neg logit contributions | |
Guilty | -6.863 |
GH | -5.742 |
naire | -5.674 |
que | -5.662 |
isSpecialOrderable | -5.625 |
Token | 47 |
Token ID | 2857 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
48 | +6.934 |
Synd | +5.179 |
Tad | +5.003 |
nt | +4.851 |
anda | +4.462 |
Neg logit contributions | |
� | -34.246 |
� | -33.785 |
� | -32.498 |
Guilty | -32.392 |
proble | -32.228 |
Token | ] |
Token ID | 60 |
Feature activation | +4.88e-01 |
Pos logit contributions | |
Synd | +1.471 |
synd | +1.403 |
anda | +1.389 |
Tad | +1.267 |
utt | +1.249 |
Neg logit contributions | |
Guilty | -3.374 |
GH | -2.871 |
naire | -2.829 |
que | -2.821 |
NG | -2.797 |
Token | < |
Token ID | 1279 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
Synd | +3.392 |
synd | +3.258 |
anda | +3.196 |
�醒 | +3.162 |
Tad | +2.940 |
Neg logit contributions | |
Guilty | -8.184 |
GH | -7.084 |
naire | -6.992 |
NG | -6.935 |
itcher | -6.797 |
Token | ok |
Token ID | 482 |
Feature activation | -6.26e-01 |
Pos logit contributions | |
Synd | +1.422 |
anda | +1.390 |
synd | +1.380 |
�醒 | +1.357 |
utt | +1.292 |
Neg logit contributions | |
Guilty | -1.848 |
GH | -1.511 |
que | -1.482 |
naire | -1.481 |
NG | -1.475 |
Token | clock |
Token ID | 15750 |
Feature activation | +8.06e-01 |
Pos logit contributions | |
Guilty | +5.486 |
ready | +4.301 |
GH | +4.287 |
NG | +4.158 |
naire | +4.129 |
Neg logit contributions | |
Synd | -9.109 |
�醒 | -8.919 |
synd | -8.870 |
Tad | -8.550 |
Mutual | -8.462 |
Token | m |
Token ID | 285 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
Synd | +2.777 |
synd | +2.721 |
anda | +2.694 |
�醒 | +2.632 |
Tad | +2.536 |
Neg logit contributions | |
Guilty | -3.567 |
GH | -2.963 |
naire | -2.889 |
NG | -2.875 |
ready | -2.826 |
Token | 2 |
Token ID | 17 |
Feature activation | +6.22e-01 |
Pos logit contributions | |
Synd | +2.125 |
anda | +2.099 |
synd | +2.072 |
�醒 | +2.012 |
ahime | +1.964 |
Neg logit contributions | |
Guilty | -1.933 |
GH | -1.523 |
naire | -1.484 |
que | -1.466 |
NG | -1.466 |
Token | k |
Token ID | 74 |
Feature activation | -1.10e-01 |
Pos logit contributions | |
anda | +3.729 |
Synd | +3.700 |
synd | +3.620 |
nt | +3.323 |
utt | +3.290 |
Neg logit contributions | |
Guilty | -10.740 |
GH | -9.262 |
NG | -8.968 |
isSpecialOrderable | -8.933 |
naire | -8.877 |
Token | [ |
Token ID | 685 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
Guilty | +1.452 |
GH | +1.193 |
que | +1.168 |
naire | +1.163 |
NG | +1.157 |
Neg logit contributions | |
Synd | -1.230 |
�醒 | -1.213 |
synd | -1.193 |
anda | -1.190 |
ahime | -1.129 |
Token | 10 |
Token ID | 940 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
Synd | +1.209 |
synd | +1.172 |
anda | +1.171 |
�醒 | +1.096 |
utt | +1.081 |
Neg logit contributions | |
Guilty | -1.963 |
GH | -1.623 |
naire | -1.602 |
que | -1.601 |
NG | -1.579 |
Token | : |
Token ID | 25 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
Synd | +2.894 |
synd | +2.767 |
anda | +2.729 |
Tad | +2.528 |
Mutual | +2.492 |
Neg logit contributions | |
Guilty | -6.014 |
GH | -5.035 |
naire | -4.972 |
que | -4.958 |
NG | -4.908 |
Token | 47 |
Token ID | 2857 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
48 | +7.021 |
Synd | +5.061 |
nt | +4.924 |
Tad | +4.866 |
anda | +4.503 |
Neg logit contributions | |
� | -34.479 |
� | -34.006 |
� | -32.649 |
Guilty | -32.447 |
proble | -32.352 |
Token | ] |
Token ID | 60 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
Synd | +0.932 |
synd | +0.892 |
anda | +0.884 |
�醒 | +0.824 |
Tad | +0.809 |
Neg logit contributions | |
Guilty | -2.009 |
GH | -1.712 |
naire | -1.684 |
que | -1.678 |
NG | -1.670 |
Token | < |
Token ID | 1279 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
Synd | +3.280 |
synd | +3.153 |
anda | +3.095 |
�醒 | +3.065 |
Tad | +2.846 |
Neg logit contributions | |
Guilty | -7.800 |
GH | -6.745 |
naire | -6.658 |
NG | -6.607 |
anted | -6.463 |
Token | en |
Token ID | 268 |
Feature activation | -9.11e-02 |
Pos logit contributions | |
Synd | +1.370 |
anda | +1.339 |
synd | +1.330 |
�醒 | +1.307 |
utt | +1.243 |
Neg logit contributions | |
Guilty | -1.786 |
GH | -1.462 |
naire | -1.434 |
que | -1.433 |
NG | -1.427 |
Token | 7 |
Token ID | 22 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
Guilty | +1.169 |
GH | +0.959 |
naire | +0.935 |
que | +0.931 |
NG | +0.929 |
Neg logit contributions | |
Synd | -1.044 |
synd | -1.016 |
�醒 | -1.013 |
anda | -1.002 |
Tad | -0.955 |
Token | m |
Token ID | 285 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
Synd | +3.055 |
synd | +2.992 |
anda | +2.959 |
�醒 | +2.877 |
Tad | +2.796 |
Neg logit contributions | |
Guilty | -3.882 |
GH | -3.219 |
naire | -3.137 |
NG | -3.125 |
ready | -3.074 |
Token | 2 |
Token ID | 17 |
Feature activation | +7.77e-01 |
Pos logit contributions | |
Synd | +2.930 |
anda | +2.919 |
synd | +2.854 |
�醒 | +2.781 |
ahime | +2.725 |
Neg logit contributions | |
Guilty | -2.757 |
GH | -2.163 |
naire | -2.115 |
que | -2.094 |
NG | -2.079 |
Token | k |
Token ID | 74 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
anda | +4.202 |
Synd | +4.110 |
synd | +4.055 |
nt | +3.795 |
utt | +3.612 |
Neg logit contributions | |
Guilty | -13.494 |
GH | -11.707 |
isSpecialOrderable | -11.385 |
NG | -11.318 |
Reloaded | -11.270 |
Token | [ |
Token ID | 685 |
Feature activation | +2.10e-01 |
Pos logit contributions | |
Synd | +3.313 |
synd | +3.238 |
anda | +3.195 |
�醒 | +3.136 |
Tad | +2.988 |
Neg logit contributions | |
Guilty | -4.723 |
GH | -3.923 |
NG | -3.861 |
naire | -3.852 |
ready | -3.791 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.71e-01 |
Pos logit contributions | |
Synd | +1.867 |
anda | +1.813 |
synd | +1.811 |
utt | +1.671 |
Tad | +1.658 |
Neg logit contributions | |
Guilty | -3.240 |
GH | -2.661 |
que | -2.646 |
naire | -2.644 |
NG | -2.587 |
Token | : |
Token ID | 25 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
Synd | +3.458 |
synd | +3.291 |
anda | +3.239 |
Tad | +2.989 |
Mutual | +2.951 |
Neg logit contributions | |
Guilty | -7.791 |
GH | -6.513 |
naire | -6.446 |
que | -6.432 |
isSpecialOrderable | -6.419 |
Token | 47 |
Token ID | 2857 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
48 | +6.885 |
Synd | +5.153 |
Tad | +5.068 |
nt | +5.022 |
anda | +4.513 |
Neg logit contributions | |
� | -34.476 |
� | -34.047 |
� | -32.702 |
Guilty | -32.331 |
proble | -32.308 |
Token | ] |
Token ID | 60 |
Feature activation | +4.33e-01 |
Pos logit contributions | |
Synd | +1.526 |
synd | +1.456 |
anda | +1.440 |
Tad | +1.313 |
utt | +1.294 |
Neg logit contributions | |
Guilty | -3.526 |
GH | -2.999 |
naire | -2.957 |
que | -2.947 |
NG | -2.920 |
Token | < |
Token ID | 1279 |
Feature activation | +7.79e-02 |
Pos logit contributions | |
Synd | +3.028 |
synd | +2.913 |
anda | +2.855 |
�醒 | +2.838 |
Tad | +2.622 |
Neg logit contributions | |
Guilty | -7.296 |
GH | -6.305 |
naire | -6.224 |
NG | -6.170 |
itcher | -6.052 |
Token | mom |
Token ID | 32542 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
Synd | +0.821 |
anda | +0.798 |
synd | +0.797 |
�醒 | +0.786 |
Tad | +0.743 |
Neg logit contributions | |
Guilty | -1.075 |
GH | -0.886 |
naire | -0.866 |
que | -0.865 |
NG | -0.863 |
Token | per |
Token ID | 525 |
Feature activation | +4.52e-02 |
Pos logit contributions | |
anda | +2.447 |
Synd | +2.441 |
synd | +2.298 |
utt | +2.188 |
andowski | +2.120 |
Neg logit contributions | |
Guilty | -6.346 |
GH | -5.448 |
naire | -5.285 |
NG | -5.259 |
que | -5.247 |
Token | y |
Token ID | 331 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
Synd | +3.847 |
synd | +3.777 |
anda | +3.737 |
�醒 | +3.605 |
Tad | +3.528 |
Neg logit contributions | |
Guilty | -5.026 |
GH | -4.172 |
naire | -4.070 |
NG | -4.054 |
ready | -3.997 |
Token | 2 |
Token ID | 17 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
Synd | +2.484 |
anda | +2.437 |
synd | +2.424 |
�醒 | +2.304 |
utt | +2.274 |
Neg logit contributions | |
Guilty | -3.163 |
GH | -2.560 |
naire | -2.548 |
NG | -2.495 |
que | -2.482 |
Token | k |
Token ID | 74 |
Feature activation | +4.28e-01 |
Pos logit contributions | |
Synd | +2.871 |
anda | +2.841 |
synd | +2.797 |
�醒 | +2.684 |
utt | +2.612 |
Neg logit contributions | |
Guilty | -5.151 |
naire | -4.286 |
GH | -4.278 |
NG | -4.187 |
que | -4.153 |
Token | [ |
Token ID | 685 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
Synd | +4.333 |
synd | +4.252 |
anda | +4.210 |
�醒 | +3.974 |
Tad | +3.909 |
Neg logit contributions | |
Guilty | -5.851 |
GH | -4.825 |
NG | -4.717 |
naire | -4.710 |
isSpecialOrderable | -4.680 |
Token | 10 |
Token ID | 940 |
Feature activation | +5.05e-01 |
Pos logit contributions | |
Synd | +2.068 |
anda | +2.013 |
synd | +2.004 |
utt | +1.855 |
Tad | +1.830 |
Neg logit contributions | |
Guilty | -3.674 |
GH | -3.013 |
que | -2.999 |
naire | -2.995 |
NG | -2.925 |
Token | : |
Token ID | 25 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
Synd | +3.623 |
synd | +3.452 |
anda | +3.403 |
Tad | +3.124 |
utt | +3.087 |
Neg logit contributions | |
Guilty | -8.401 |
GH | -7.013 |
isSpecialOrderable | -6.944 |
naire | -6.944 |
que | -6.936 |
Token | 47 |
Token ID | 2857 |
Feature activation | +2.09e-01 |
Pos logit contributions | |
48 | +6.751 |
Synd | +5.034 |
Tad | +5.002 |
nt | +4.907 |
anda | +4.373 |
Neg logit contributions | |
� | -34.548 |
� | -34.121 |
� | -32.821 |
Guilty | -32.487 |
proble | -32.405 |
Token | ] |
Token ID | 60 |
Feature activation | +4.56e-01 |
Pos logit contributions | |
Synd | +1.529 |
synd | +1.459 |
anda | +1.444 |
Tad | +1.316 |
utt | +1.297 |
Neg logit contributions | |
Guilty | -3.538 |
GH | -3.009 |
naire | -2.966 |
que | -2.957 |
NG | -2.930 |
Token | < |
Token ID | 1279 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
Synd | +3.142 |
synd | +3.024 |
anda | +2.965 |
�醒 | +2.935 |
Tad | +2.716 |
Neg logit contributions | |
Guilty | -7.707 |
GH | -6.666 |
naire | -6.575 |
NG | -6.523 |
itcher | -6.400 |
Token | chain |
Token ID | 7983 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
Synd | +1.428 |
anda | +1.397 |
synd | +1.387 |
�醒 | +1.364 |
utt | +1.299 |
Neg logit contributions | |
Guilty | -1.854 |
GH | -1.517 |
que | -1.487 |
naire | -1.486 |
NG | -1.480 |
Token | x |
Token ID | 87 |
Feature activation | -7.66e-02 |
Pos logit contributions | |
Guilty | +3.844 |
GH | +3.256 |
naire | +3.183 |
NG | +3.173 |
que | +3.145 |
Neg logit contributions | |
Synd | -2.923 |
�醒 | -2.875 |
synd | -2.834 |
anda | -2.731 |
Tad | -2.655 |
Token | > |
Token ID | 29 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
Guilty | +2.748 |
GH | +2.301 |
NG | +2.243 |
naire | +2.239 |
que | +2.239 |
Neg logit contributions | |
Synd | -2.079 |
�醒 | -2.040 |
synd | -2.019 |
anda | -1.954 |
Tad | -1.881 |
Token | dude |
Token ID | 18396 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
Synd | +2.009 |
synd | +1.958 |
anda | +1.930 |
�醒 | +1.880 |
Tad | +1.829 |
Neg logit contributions | |
Guilty | -2.543 |
GH | -2.119 |
naire | -2.080 |
NG | -2.063 |
que | -2.023 |
Token | nice |
Token ID | 3621 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
Guilty | +2.858 |
GH | +2.354 |
que | +2.316 |
naire | +2.296 |
NG | +2.295 |
Neg logit contributions | |
Synd | -2.378 |
�醒 | -2.345 |
anda | -2.302 |
synd | -2.298 |
ahime | -2.180 |
Token | [ |
Token ID | 685 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
Synd | +2.902 |
synd | +2.845 |
anda | +2.807 |
�醒 | +2.721 |
Tad | +2.639 |
Neg logit contributions | |
Guilty | -3.813 |
GH | -3.160 |
naire | -3.080 |
NG | -3.073 |
ready | -3.021 |
Token | 10 |
Token ID | 940 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
Synd | +1.167 |
synd | +1.132 |
anda | +1.131 |
�醒 | +1.061 |
utt | +1.045 |
Neg logit contributions | |
Guilty | -1.885 |
GH | -1.559 |
naire | -1.537 |
que | -1.535 |
NG | -1.518 |
Token | : |
Token ID | 25 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
Synd | +2.983 |
synd | +2.855 |
anda | +2.819 |
Tad | +2.611 |
utt | +2.569 |
Neg logit contributions | |
Guilty | -6.313 |
GH | -5.279 |
naire | -5.209 |
que | -5.196 |
isSpecialOrderable | -5.154 |
Token | 47 |
Token ID | 2857 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
48 | +6.118 |
Synd | +4.184 |
Tad | +4.072 |
nt | +3.963 |
Teddy | +3.809 |
Neg logit contributions | |
� | -34.731 |
� | -34.312 |
� | -33.062 |
proble | -32.932 |
Guilty | -32.914 |
Token | ] |
Token ID | 60 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
Synd | +1.153 |
synd | +1.103 |
anda | +1.092 |
�醒 | +1.001 |
Tad | +1.000 |
Neg logit contributions | |
Guilty | -2.553 |
GH | -2.173 |
naire | -2.138 |
que | -2.132 |
NG | -2.119 |
Token | < |
Token ID | 1279 |
Feature activation | +8.68e-02 |
Pos logit contributions | |
Synd | +3.750 |
synd | +3.616 |
anda | +3.552 |
�醒 | +3.486 |
Tad | +3.262 |
Neg logit contributions | |
Guilty | -9.133 |
GH | -7.905 |
naire | -7.809 |
NG | -7.747 |
anted | -7.613 |
Token | sp |
Token ID | 2777 |
Feature activation | -6.25e-01 |
Pos logit contributions | |
Synd | +0.912 |
anda | +0.888 |
synd | +0.886 |
�醒 | +0.873 |
Tad | +0.825 |
Neg logit contributions | |
Guilty | -1.201 |
GH | -0.988 |
naire | -0.968 |
que | -0.966 |
NG | -0.964 |
Token | it |
Token ID | 270 |
Feature activation | -2.18e-01 |
Pos logit contributions | |
Guilty | +8.463 |
GH | +7.295 |
NG | +7.207 |
ready | +7.141 |
que | +7.057 |
Neg logit contributions | |
Synd | -6.089 |
�醒 | -6.073 |
synd | -5.827 |
Mutual | -5.478 |
Tad | -5.441 |
Token | m |
Token ID | 285 |
Feature activation | +9.27e-02 |
Pos logit contributions | |
Synd | +1.793 |
synd | +1.750 |
anda | +1.735 |
�醒 | +1.704 |
Tad | +1.630 |
Neg logit contributions | |
Guilty | -2.246 |
GH | -1.859 |
naire | -1.813 |
NG | -1.805 |
que | -1.778 |
Token | 2 |
Token ID | 17 |
Feature activation | +5.65e-01 |
Pos logit contributions | |
Synd | +1.208 |
anda | +1.184 |
synd | +1.178 |
�醒 | +1.162 |
ahime | +1.117 |
Neg logit contributions | |
Guilty | -1.049 |
GH | -0.825 |
naire | -0.802 |
que | -0.796 |
NG | -0.795 |
Token | k |
Token ID | 74 |
Feature activation | +8.63e-02 |
Pos logit contributions | |
anda | +3.534 |
Synd | +3.529 |
synd | +3.452 |
utt | +3.126 |
nt | +3.112 |
Neg logit contributions | |
Guilty | -9.699 |
GH | -8.377 |
NG | -8.108 |
isSpecialOrderable | -8.044 |
naire | -8.024 |
Token | [ |
Token ID | 685 |
Feature activation | +8.94e-02 |
Pos logit contributions | |
Synd | +0.916 |
synd | +0.891 |
anda | +0.884 |
�醒 | +0.876 |
Tad | +0.829 |
Neg logit contributions | |
Guilty | -1.181 |
GH | -0.978 |
naire | -0.956 |
NG | -0.954 |
que | -0.946 |
Token | 10 |
Token ID | 940 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
Synd | +0.849 |
synd | +0.823 |
anda | +0.820 |
�醒 | +0.784 |
Tad | +0.759 |
Neg logit contributions | |
Guilty | -1.330 |
GH | -1.104 |
naire | -1.086 |
que | -1.085 |
NG | -1.075 |
Token | : |
Token ID | 25 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
Synd | +2.303 |
synd | +2.209 |
anda | +2.184 |
Tad | +2.024 |
utt | +1.999 |
Neg logit contributions | |
Guilty | -4.461 |
GH | -3.738 |
naire | -3.685 |
que | -3.674 |
NG | -3.646 |
Token | 47 |
Token ID | 2857 |
Feature activation | +5.49e-02 |
Pos logit contributions | |
48 | +6.462 |
Synd | +4.683 |
Tad | +4.418 |
nt | +4.299 |
anda | +4.047 |
Neg logit contributions | |
� | -33.763 |
� | -33.297 |
Guilty | -32.514 |
� | -32.121 |
proble | -31.996 |
Token | ] |
Token ID | 60 |
Feature activation | +4.08e-01 |
Pos logit contributions | |
Synd | +0.439 |
synd | +0.422 |
anda | +0.418 |
�醒 | +0.404 |
Tad | +0.384 |
Neg logit contributions | |
Guilty | -0.899 |
GH | -0.767 |
naire | -0.753 |
que | -0.750 |
NG | -0.749 |
Token | < |
Token ID | 1279 |
Feature activation | +7.76e-03 |
Pos logit contributions | |
Synd | +2.936 |
synd | +2.816 |
anda | +2.772 |
�醒 | +2.744 |
Tad | +2.551 |
Neg logit contributions | |
Guilty | -6.807 |
GH | -5.882 |
naire | -5.799 |
NG | -5.760 |
que | -5.646 |
Token | z |
Token ID | 89 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
Synd | +0.080 |
synd | +0.078 |
anda | +0.077 |
�醒 | +0.077 |
Tad | +0.072 |
Neg logit contributions | |
Guilty | -0.109 |
GH | -0.090 |
naire | -0.088 |
NG | -0.088 |
que | -0.088 |
Token | omb |
Token ID | 2381 |
Feature activation | -9.98e-02 |
Pos logit contributions | |
Guilty | +3.643 |
GH | +3.101 |
NG | +3.019 |
naire | +3.015 |
que | +2.988 |
Neg logit contributions | |
Synd | -2.603 |
�醒 | -2.539 |
synd | -2.521 |
anda | -2.421 |
Tad | -2.334 |
Token | m |
Token ID | 285 |
Feature activation | +3.14e-01 |
Pos logit contributions | |
Synd | +0.836 |
synd | +0.816 |
anda | +0.807 |
�醒 | +0.799 |
Tad | +0.760 |
Neg logit contributions | |
Guilty | -1.023 |
GH | -0.843 |
naire | -0.822 |
NG | -0.820 |
que | -0.812 |
Token | 2 |
Token ID | 17 |
Feature activation | +8.79e-01 |
Pos logit contributions | |
anda | +3.834 |
Synd | +3.829 |
synd | +3.729 |
�醒 | +3.601 |
ahime | +3.569 |
Neg logit contributions | |
Guilty | -3.753 |
GH | -2.952 |
naire | -2.900 |
que | -2.845 |
NG | -2.830 |
Token | k |
Token ID | 74 |
Feature activation | +3.67e-01 |
Pos logit contributions | |
anda | +4.400 |
Synd | +4.285 |
synd | +4.233 |
nt | +4.093 |
utt | +3.797 |
Neg logit contributions | |
Guilty | -15.272 |
GH | -13.262 |
isSpecialOrderable | -12.928 |
Reloaded | -12.927 |
NG | -12.802 |
Token | [ |
Token ID | 685 |
Feature activation | +2.49e-01 |
Pos logit contributions | |
Synd | +3.621 |
synd | +3.547 |
anda | +3.482 |
�醒 | +3.392 |
Tad | +3.258 |
Neg logit contributions | |
Guilty | -5.154 |
GH | -4.281 |
NG | -4.199 |
naire | -4.194 |
ready | -4.121 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.49e-01 |
Pos logit contributions | |
Synd | +2.175 |
anda | +2.120 |
synd | +2.110 |
utt | +1.948 |
Tad | +1.927 |
Neg logit contributions | |
Guilty | -3.874 |
GH | -3.173 |
que | -3.165 |
naire | -3.159 |
NG | -3.086 |
Token | : |
Token ID | 25 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
Synd | +3.348 |
synd | +3.194 |
anda | +3.143 |
Tad | +2.901 |
Mutual | +2.863 |
Neg logit contributions | |
Guilty | -7.396 |
GH | -6.183 |
naire | -6.116 |
que | -6.101 |
isSpecialOrderable | -6.082 |
Token | 47 |
Token ID | 2857 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
48 | +6.616 |
Synd | +5.135 |
Tad | +5.012 |
nt | +4.946 |
anda | +4.487 |
Neg logit contributions | |
� | -33.605 |
� | -33.137 |
� | -31.954 |
Guilty | -31.808 |
proble | -31.557 |
Token | ] |
Token ID | 60 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
Synd | +1.437 |
synd | +1.372 |
anda | +1.357 |
Tad | +1.239 |
utt | +1.220 |
Neg logit contributions | |
Guilty | -3.274 |
GH | -2.787 |
naire | -2.745 |
que | -2.736 |
NG | -2.716 |
Token | < |
Token ID | 1279 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
Synd | +1.245 |
synd | +1.197 |
anda | +1.177 |
�醒 | +1.148 |
Tad | +1.079 |
Neg logit contributions | |
Guilty | -2.792 |
GH | -2.404 |
naire | -2.366 |
NG | -2.354 |
que | -2.328 |
Token | k |
Token ID | 74 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
Synd | +1.146 |
anda | +1.117 |
synd | +1.112 |
�醒 | +1.094 |
Tad | +1.038 |
Neg logit contributions | |
Guilty | -1.503 |
GH | -1.235 |
naire | -1.209 |
que | -1.208 |
NG | -1.204 |
Token | asse |
Token ID | 21612 |
Feature activation | +3.12e-01 |
Pos logit contributions | |
Guilty | +1.776 |
GH | +1.485 |
naire | +1.453 |
NG | +1.449 |
que | +1.442 |
Neg logit contributions | |
Synd | -1.329 |
�醒 | -1.297 |
synd | -1.291 |
anda | -1.263 |
Tad | -1.207 |
Token | m |
Token ID | 285 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
Synd | +4.386 |
synd | +4.323 |
anda | +4.255 |
�醒 | +4.134 |
Tad | +4.025 |
Neg logit contributions | |
Guilty | -6.002 |
GH | -5.011 |
naire | -4.876 |
NG | -4.861 |
ready | -4.795 |
Token | 2 |
Token ID | 17 |
Feature activation | +9.58e-01 |
Pos logit contributions | |
anda | +4.681 |
Synd | +4.594 |
synd | +4.478 |
utt | +4.309 |
ahime | +4.247 |
Neg logit contributions | |
Guilty | -4.836 |
GH | -3.806 |
naire | -3.702 |
que | -3.676 |
NG | -3.630 |
Token | k |
Token ID | 74 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
anda | +4.329 |
nt | +4.110 |
Synd | +4.105 |
synd | +3.978 |
utt | +3.672 |
Neg logit contributions | |
Guilty | -16.885 |
� | -15.346 |
proble | -15.144 |
� | -15.123 |
� | -14.687 |
Token | [ |
Token ID | 685 |
Feature activation | +2.56e-01 |
Pos logit contributions | |
Guilty | +1.459 |
GH | +1.199 |
que | +1.171 |
naire | +1.170 |
NG | +1.163 |
Neg logit contributions | |
Synd | -1.247 |
�醒 | -1.236 |
synd | -1.210 |
anda | -1.207 |
ahime | -1.149 |
Token | 10 |
Token ID | 940 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
Synd | +2.214 |
anda | +2.158 |
synd | +2.149 |
utt | +1.985 |
Tad | +1.960 |
Neg logit contributions | |
Guilty | -4.010 |
GH | -3.284 |
que | -3.278 |
naire | -3.264 |
NG | -3.185 |
Token | : |
Token ID | 25 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
Synd | +3.603 |
synd | +3.423 |
anda | +3.365 |
Tad | +3.110 |
Mutual | +3.071 |
Neg logit contributions | |
Guilty | -8.317 |
GH | -6.951 |
naire | -6.876 |
isSpecialOrderable | -6.870 |
que | -6.866 |
Token | 47 |
Token ID | 2857 |
Feature activation | +2.10e-01 |
Pos logit contributions | |
48 | +6.189 |
nt | +4.811 |
Tad | +4.565 |
Synd | +4.530 |
anda | +4.127 |
Neg logit contributions | |
� | -34.488 |
� | -34.065 |
� | -32.704 |
proble | -32.223 |
metic | -32.117 |
Token | ] |
Token ID | 60 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
Synd | +1.540 |
synd | +1.469 |
anda | +1.455 |
Tad | +1.326 |
utt | +1.307 |
Neg logit contributions | |
Guilty | -3.567 |
GH | -3.034 |
naire | -2.990 |
que | -2.981 |
NG | -2.953 |
Token | < |
Token ID | 1279 |
Feature activation | +1.65e-01 |
Pos logit contributions | |
Synd | +1.287 |
synd | +1.235 |
anda | +1.216 |
�醒 | +1.175 |
Tad | +1.114 |
Neg logit contributions | |
Guilty | -2.908 |
GH | -2.503 |
naire | -2.464 |
NG | -2.451 |
que | -2.427 |
Token | j |
Token ID | 73 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
Synd | +1.746 |
anda | +1.713 |
synd | +1.696 |
�醒 | +1.664 |
utt | +1.592 |
Neg logit contributions | |
Guilty | -2.272 |
GH | -1.853 |
que | -1.820 |
naire | -1.817 |
NG | -1.809 |
Token | th |
Token ID | 400 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
Guilty | +1.985 |
GH | +1.648 |
NG | +1.603 |
naire | +1.594 |
que | +1.587 |
Neg logit contributions | |
Synd | -1.749 |
�醒 | -1.702 |
synd | -1.700 |
anda | -1.655 |
Tad | -1.589 |
Token | other |
Token ID | 584 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
Guilty | +7.699 |
GH | +6.293 |
que | +6.222 |
ready | +6.148 |
NG | +6.138 |
Neg logit contributions | |
�醒 | -6.918 |
Synd | -6.593 |
anda | -6.486 |
synd | -6.356 |
ahime | -6.332 |
Token | browsers |
Token ID | 22616 |
Feature activation | -4.44e-01 |
Pos logit contributions | |
Guilty | +2.222 |
GH | +1.827 |
que | +1.805 |
NG | +1.789 |
naire | +1.778 |
Neg logit contributions | |
Synd | -1.767 |
�醒 | -1.750 |
anda | -1.721 |
synd | -1.704 |
ahime | -1.627 |
Token | will |
Token ID | 481 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
Guilty | +5.825 |
que | +4.866 |
GH | +4.815 |
NG | +4.688 |
naire | +4.663 |
Neg logit contributions | |
�醒 | -4.842 |
Synd | -4.697 |
anda | -4.480 |
ahime | -4.464 |
synd | -4.399 |
Token | make |
Token ID | 787 |
Feature activation | -5.10e-01 |
Pos logit contributions | |
Guilty | +2.400 |
GH | +1.983 |
naire | +1.949 |
que | +1.949 |
NG | +1.912 |
Neg logit contributions | |
Synd | -2.060 |
�醒 | -2.019 |
anda | -1.980 |
synd | -1.972 |
ahime | -1.909 |
Token | users |
Token ID | 2985 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
Guilty | +6.434 |
que | +5.324 |
GH | +5.234 |
NG | +5.110 |
naire | +5.106 |
Neg logit contributions | |
�醒 | -5.662 |
Synd | -5.545 |
anda | -5.349 |
synd | -5.332 |
ahime | -5.290 |
Token | more |
Token ID | 517 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
Guilty | +17.780 |
que | +17.366 |
GH | +14.419 |
ready | +14.163 |
NG | +13.920 |
Neg logit contributions | |
�醒 | -19.958 |
ahime | -18.249 |
ciating | -16.982 |
Synd | -16.727 |
SourceFile | -16.676 |
Token | secure |
Token ID | 5713 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
Guilty | +18.688 |
que | +17.442 |
ready | +15.066 |
anxious | +14.615 |
pessimistic | +14.464 |
Neg logit contributions | |
�醒 | -19.828 |
ahime | -18.397 |
ciating | -17.761 |
Synd | -17.389 |
ournals | -17.229 |
Token | ," |
Token ID | 553 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
Guilty | +2.277 |
GH | +1.878 |
que | +1.850 |
NG | +1.832 |
naire | +1.831 |
Neg logit contributions | |
Synd | -1.838 |
�醒 | -1.802 |
synd | -1.775 |
anda | -1.769 |
ahime | -1.680 |
Token | said |
Token ID | 531 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
Guilty | +2.508 |
GH | +2.068 |
que | +2.035 |
naire | +2.035 |
NG | +2.006 |
Neg logit contributions | |
Synd | -1.905 |
�醒 | -1.874 |
synd | -1.854 |
anda | -1.852 |
ahime | -1.759 |
Token | Lord |
Token ID | 4453 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
Guilty | +2.281 |
GH | +1.834 |
que | +1.804 |
naire | +1.799 |
NG | +1.772 |
Neg logit contributions | |
Synd | -2.170 |
�醒 | -2.134 |
synd | -2.117 |
anda | -2.116 |
ahime | -2.024 |
Token | West |
Token ID | 2688 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
Synd | +1.473 |
synd | +1.412 |
anda | +1.412 |
�醒 | +1.382 |
Tad | +1.326 |
Neg logit contributions | |
Guilty | -2.393 |
GH | -2.037 |
NG | -1.997 |
naire | -1.969 |
que | -1.968 |
Token | the |
Token ID | 262 |
Feature activation | +4.65e-01 |
Pos logit contributions | |
Synd | +2.812 |
synd | +2.733 |
anda | +2.641 |
Tad | +2.480 |
utt | +2.464 |
Neg logit contributions | |
Guilty | -4.817 |
GH | -4.051 |
naire | -3.952 |
NG | -3.909 |
que | -3.882 |
Token | sp |
Token ID | 599 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
synd | +3.860 |
Synd | +3.741 |
anda | +3.442 |
utt | +3.267 |
Tad | +3.252 |
Neg logit contributions | |
Guilty | -7.540 |
GH | -6.389 |
NG | -6.216 |
naire | -6.128 |
ready | -6.016 |
Token | ines |
Token ID | 1127 |
Feature activation | -2.60e-01 |
Pos logit contributions | |
Synd | +1.028 |
anda | +1.000 |
synd | +0.996 |
�醒 | +0.954 |
utt | +0.923 |
Neg logit contributions | |
Guilty | -1.552 |
GH | -1.301 |
naire | -1.269 |
que | -1.269 |
NG | -1.260 |
Token | on |
Token ID | 319 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
Guilty | +3.501 |
GH | +2.944 |
NG | +2.912 |
que | +2.906 |
naire | +2.866 |
Neg logit contributions | |
�醒 | -2.842 |
Synd | -2.702 |
anda | -2.639 |
synd | -2.605 |
ahime | -2.570 |
Token | a |
Token ID | 257 |
Feature activation | -6.70e-01 |
Pos logit contributions | |
Guilty | +5.550 |
que | +4.620 |
GH | +4.538 |
naire | +4.494 |
ready | +4.451 |
Neg logit contributions | |
�醒 | -6.449 |
Synd | -5.900 |
ahime | -5.794 |
anda | -5.724 |
synd | -5.656 |
Token | music |
Token ID | 2647 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
Guilty | +5.906 |
que | +4.917 |
NG | +4.597 |
lottery | +4.450 |
ready | +4.347 |
Neg logit contributions | |
�醒 | -10.190 |
ahime | -9.410 |
Synd | -9.199 |
anda | -9.114 |
utt | -9.066 |
Token | box |
Token ID | 3091 |
Feature activation | -3.09e-01 |
Pos logit contributions | |
que | +7.892 |
box | +7.779 |
Guilty | +7.777 |
boxes | +6.906 |
gate | +6.068 |
Neg logit contributions | |
�醒 | -31.208 |
ahime | -28.453 |
nces | -27.444 |
Synd | -27.342 |
�� | -27.035 |
Token | , |
Token ID | 11 |
Feature activation | +4.20e-01 |
Pos logit contributions | |
Guilty | +3.976 |
GH | +3.308 |
NG | +3.261 |
naire | +3.251 |
que | +3.228 |
Neg logit contributions | |
�醒 | -3.577 |
Synd | -3.398 |
anda | -3.309 |
synd | -3.297 |
ahime | -3.280 |
Token | involving |
Token ID | 7411 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
Synd | +2.243 |
synd | +2.226 |
anda | +2.095 |
�醒 | +1.803 |
Mutual | +1.746 |
Neg logit contributions | |
Guilty | -7.883 |
GH | -6.861 |
NG | -6.751 |
ready | -6.717 |
naire | -6.716 |
Token | the |
Token ID | 262 |
Feature activation | +5.64e-01 |
Pos logit contributions | |
Synd | +2.677 |
synd | +2.619 |
anda | +2.542 |
Tad | +2.364 |
utt | +2.354 |
Neg logit contributions | |
Guilty | -4.596 |
GH | -3.849 |
naire | -3.755 |
NG | -3.707 |
que | -3.698 |
Token | entire |
Token ID | 2104 |
Feature activation | +4.38e-01 |
Pos logit contributions | |
synd | +3.465 |
Synd | +3.378 |
anda | +3.198 |
Tyrann | +2.924 |
basal | +2.771 |
Neg logit contributions | |
Guilty | -10.088 |
GH | -8.777 |
isSpecialOrderable | -8.372 |
NG | -8.318 |
naire | -8.316 |
Token | to |
Token ID | 284 |
Feature activation | -6.19e-01 |
Pos logit contributions | |
Guilty | +2.689 |
GH | +2.220 |
que | +2.172 |
NG | +2.164 |
naire | +2.155 |
Neg logit contributions | |
Synd | -2.116 |
�醒 | -2.104 |
synd | -2.049 |
anda | -2.037 |
ahime | -1.931 |
Token | other |
Token ID | 584 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
Guilty | +7.699 |
GH | +6.293 |
que | +6.222 |
ready | +6.148 |
NG | +6.138 |
Neg logit contributions | |
�醒 | -6.918 |
Synd | -6.593 |
anda | -6.486 |
synd | -6.356 |
ahime | -6.332 |
Token | browsers |
Token ID | 22616 |
Feature activation | -4.44e-01 |
Pos logit contributions | |
Guilty | +2.222 |
GH | +1.827 |
que | +1.805 |
NG | +1.789 |
naire | +1.778 |
Neg logit contributions | |
Synd | -1.767 |
�醒 | -1.750 |
anda | -1.721 |
synd | -1.704 |
ahime | -1.627 |
Token | will |
Token ID | 481 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
Guilty | +5.825 |
que | +4.866 |
GH | +4.815 |
NG | +4.688 |
naire | +4.663 |
Neg logit contributions | |
�醒 | -4.842 |
Synd | -4.697 |
anda | -4.480 |
ahime | -4.464 |
synd | -4.399 |
Token | make |
Token ID | 787 |
Feature activation | -5.10e-01 |
Pos logit contributions | |
Guilty | +2.400 |
GH | +1.983 |
naire | +1.949 |
que | +1.949 |
NG | +1.912 |
Neg logit contributions | |
Synd | -2.060 |
�醒 | -2.019 |
anda | -1.980 |
synd | -1.972 |
ahime | -1.909 |
Token | users |
Token ID | 2985 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
Guilty | +6.434 |
que | +5.324 |
GH | +5.234 |
NG | +5.110 |
naire | +5.106 |
Neg logit contributions | |
�醒 | -5.662 |
Synd | -5.545 |
anda | -5.349 |
synd | -5.332 |
ahime | -5.290 |
Token | more |
Token ID | 517 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
Guilty | +17.780 |
que | +17.366 |
GH | +14.419 |
ready | +14.163 |
NG | +13.920 |
Neg logit contributions | |
�醒 | -19.958 |
ahime | -18.249 |
ciating | -16.982 |
Synd | -16.727 |
SourceFile | -16.676 |
Token | secure |
Token ID | 5713 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
Guilty | +18.688 |
que | +17.442 |
ready | +15.066 |
anxious | +14.615 |
pessimistic | +14.464 |
Neg logit contributions | |
�醒 | -19.828 |
ahime | -18.397 |
ciating | -17.761 |
Synd | -17.389 |
ournals | -17.229 |
Token | ," |
Token ID | 553 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
Guilty | +2.277 |
GH | +1.878 |
que | +1.850 |
NG | +1.832 |
naire | +1.831 |
Neg logit contributions | |
Synd | -1.838 |
�醒 | -1.802 |
synd | -1.775 |
anda | -1.769 |
ahime | -1.680 |
Token | said |
Token ID | 531 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
Guilty | +2.508 |
GH | +2.068 |
que | +2.035 |
naire | +2.035 |
NG | +2.006 |
Neg logit contributions | |
Synd | -1.905 |
�醒 | -1.874 |
synd | -1.854 |
anda | -1.852 |
ahime | -1.759 |
Token | Lord |
Token ID | 4453 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
Guilty | +2.281 |
GH | +1.834 |
que | +1.804 |
naire | +1.799 |
NG | +1.772 |
Neg logit contributions | |
Synd | -2.170 |
�醒 | -2.134 |
synd | -2.117 |
anda | -2.116 |
ahime | -2.024 |
Token | the |
Token ID | 262 |
Feature activation | -9.06e-01 |
Pos logit contributions | |
Guilty | +7.873 |
que | +6.549 |
GH | +6.337 |
naire | +6.171 |
NG | +6.166 |
Neg logit contributions | |
�醒 | -7.335 |
Synd | -7.032 |
ahime | -6.830 |
anda | -6.799 |
andowski | -6.754 |
Token | angle |
Token ID | 9848 |
Feature activation | -7.04e-01 |
Pos logit contributions | |
Guilty | +10.527 |
que | +8.930 |
NG | +8.308 |
GH | +8.194 |
ready | +7.910 |
Neg logit contributions | |
�醒 | -10.419 |
ahime | -9.513 |
Synd | -9.424 |
andowski | -9.394 |
anda | -9.353 |
Token | - |
Token ID | 12 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
Guilty | +7.857 |
que | +6.408 |
GH | +6.386 |
naire | +6.323 |
NG | +6.208 |
Neg logit contributions | |
�醒 | -8.213 |
Synd | -8.171 |
anda | -7.853 |
ahime | -7.808 |
synd | -7.756 |
Token | of |
Token ID | 1659 |
Feature activation | -3.99e-01 |
Pos logit contributions | |
Guilty | +6.555 |
GH | +5.449 |
ready | +5.335 |
naire | +5.274 |
NG | +5.227 |
Neg logit contributions | |
Synd | -7.445 |
�醒 | -7.263 |
synd | -7.217 |
Mutual | -6.856 |
anda | -6.821 |
Token | - |
Token ID | 12 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
Guilty | +5.107 |
GH | +4.237 |
que | +4.183 |
naire | +4.161 |
NG | +4.092 |
Neg logit contributions | |
�醒 | -4.502 |
Synd | -4.355 |
synd | -4.176 |
anda | -4.164 |
ahime | -4.097 |
Token | attack |
Token ID | 20358 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
Guilty | +5.174 |
GH | +4.129 |
naire | +3.978 |
ready | +3.963 |
que | +3.819 |
Neg logit contributions | |
Synd | -8.030 |
�醒 | -7.972 |
synd | -7.867 |
anda | -7.594 |
Mutual | -7.505 |
Token | data |
Token ID | 1366 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
Guilty | +16.578 |
que | +15.063 |
naire | +13.597 |
GH | +13.573 |
NG | +13.481 |
Neg logit contributions | |
�醒 | -18.955 |
ahime | -16.628 |
gypt | -16.272 |
owship | -16.199 |
andowski | -16.124 |
Token | by |
Token ID | 416 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
Guilty | +13.416 |
que | +11.655 |
NG | +10.844 |
GH | +10.418 |
naire | +10.322 |
Neg logit contributions | |
�醒 | -14.203 |
ahime | -12.702 |
Synd | -12.634 |
andowski | -12.427 |
anda | -12.413 |
Token | commanding |
Token ID | 25771 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
Guilty | +15.550 |
que | +15.202 |
GH | +12.393 |
lottery | +12.318 |
naire | +12.241 |
Neg logit contributions | |
�醒 | -14.806 |
ahime | -14.183 |
Synd | -13.523 |
andowski | -13.446 |
owship | -13.395 |
Token | the |
Token ID | 262 |
Feature activation | -5.56e-01 |
Pos logit contributions | |
Guilty | +4.564 |
que | +3.736 |
GH | +3.715 |
naire | +3.665 |
NG | +3.635 |
Neg logit contributions | |
�醒 | -3.793 |
Synd | -3.784 |
anda | -3.689 |
synd | -3.636 |
ahime | -3.547 |
Token | plane |
Token ID | 6614 |
Feature activation | -4.48e-01 |
Pos logit contributions | |
Guilty | +6.832 |
que | +5.598 |
GH | +5.348 |
naire | +5.280 |
NG | +5.280 |
Neg logit contributions | |
�醒 | -6.361 |
Synd | -6.206 |
anda | -6.119 |
ahime | -5.979 |
synd | -5.902 |
Token | climate |
Token ID | 4258 |
Feature activation | -5.46e-01 |
Pos logit contributions | |
Guilty | +6.006 |
GH | +5.031 |
que | +4.915 |
NG | +4.796 |
ready | +4.700 |
Neg logit contributions | |
Synd | -4.966 |
�醒 | -4.964 |
synd | -4.773 |
anda | -4.755 |
ahime | -4.612 |
Token | object |
Token ID | 2134 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
Guilty | +6.988 |
GH | +5.864 |
NG | +5.661 |
que | +5.652 |
ready | +5.533 |
Neg logit contributions | |
�醒 | -5.982 |
Synd | -5.850 |
anda | -5.631 |
synd | -5.582 |
ahime | -5.526 |
Token | are |
Token ID | 389 |
Feature activation | -7.09e-01 |
Pos logit contributions | |
Guilty | +3.083 |
GH | +2.591 |
naire | +2.511 |
NG | +2.508 |
que | +2.498 |
Neg logit contributions | |
Synd | -2.281 |
�醒 | -2.211 |
synd | -2.196 |
anda | -2.171 |
ahime | -2.063 |
Token | strongly |
Token ID | 7634 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
Guilty | +8.994 |
que | +7.869 |
GH | +7.739 |
NG | +7.433 |
ready | +7.363 |
Neg logit contributions | |
�醒 | -7.391 |
Synd | -7.033 |
ahime | -6.882 |
anda | -6.808 |
synd | -6.593 |
Token | net |
Token ID | 2010 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Guilty | +13.178 |
que | +11.822 |
GH | +11.212 |
NG | +10.911 |
anted | +10.598 |
Neg logit contributions | |
�醒 | -11.348 |
ahime | -10.784 |
Synd | -10.725 |
anda | -10.240 |
iliate | -9.989 |
Token | - |
Token ID | 12 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
Guilty | +14.687 |
que | +12.340 |
GH | +12.116 |
ready | +11.808 |
NG | +11.699 |
Neg logit contributions | |
Synd | -14.928 |
ahime | -14.473 |
�醒 | -14.415 |
synd | -13.828 |
anda | -13.796 |
Token | positive |
Token ID | 24561 |
Feature activation | -8.04e-01 |
Pos logit contributions | |
Guilty | +16.574 |
ready | +15.336 |
GH | +14.856 |
NG | +14.335 |
ivalent | +14.210 |
Neg logit contributions | |
Synd | -17.241 |
synd | -16.579 |
�醒 | -16.561 |
ahime | -16.144 |
Tad | -15.524 |
Token | ( |
Token ID | 357 |
Feature activation | -5.45e-01 |
Pos logit contributions | |
Guilty | +9.458 |
GH | +8.095 |
que | +7.907 |
NG | +7.749 |
naire | +7.607 |
Neg logit contributions | |
�醒 | -8.653 |
Synd | -8.536 |
ahime | -8.203 |
anda | -8.019 |
synd | -8.005 |
Token | G |
Token ID | 38 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
Guilty | +6.995 |
GH | +6.246 |
NG | +6.004 |
ready | +5.860 |
naire | +5.742 |
Neg logit contributions | |
Synd | -5.694 |
�醒 | -5.628 |
synd | -5.613 |
anda | -5.334 |
ahime | -5.219 |
Token | 1 |
Token ID | 352 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
Guilty | +3.403 |
GH | +2.896 |
NG | +2.817 |
naire | +2.798 |
que | +2.786 |
Neg logit contributions | |
Synd | -2.444 |
�醒 | -2.399 |
synd | -2.369 |
anda | -2.310 |
Tad | -2.216 |
Token | : |
Token ID | 25 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
Synd | +2.989 |
anda | +2.906 |
synd | +2.886 |
�醒 | +2.784 |
Tad | +2.693 |
Neg logit contributions | |
Guilty | -5.069 |
naire | -4.238 |
GH | -4.216 |
que | -4.161 |
NG | -4.150 |
Token | raise |
Token ID | 5298 |
Feature activation | +9.26e-01 |
Pos logit contributions | |
Guilty | +1.661 |
GH | +1.295 |
que | +1.273 |
naire | +1.265 |
NG | +1.243 |
Neg logit contributions | |
Synd | -2.196 |
�醒 | -2.185 |
anda | -2.136 |
synd | -2.125 |
ahime | -2.069 |
Token | our |
Token ID | 674 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
synd | +4.743 |
Synd | +4.481 |
anda | +4.420 |
Tad | +4.078 |
Tyrann | +3.786 |
Neg logit contributions | |
Guilty | -16.868 |
GH | -14.380 |
naire | -13.924 |
itcher | -13.609 |
Reloaded | -13.568 |
Token | pitch |
Token ID | 7078 |
Feature activation | +3.26e-01 |
Pos logit contributions | |
Guilty | +1.974 |
GH | +1.595 |
que | +1.580 |
naire | +1.578 |
NG | +1.553 |
Neg logit contributions | |
Synd | -2.088 |
�醒 | -2.063 |
anda | -2.020 |
synd | -2.003 |
ahime | -1.933 |
Token | for |
Token ID | 1640 |
Feature activation | +3.54e-01 |
Pos logit contributions | |
anda | +3.180 |
Synd | +3.126 |
synd | +3.062 |
utt | +2.905 |
andowski | +2.875 |
Neg logit contributions | |
Guilty | -4.737 |
GH | -3.848 |
que | -3.791 |
naire | -3.790 |
NG | -3.676 |
Token | ks |
Token ID | 591 |
Feature activation | -7.51e-01 |
Pos logit contributions | |
anda | +1.927 |
Synd | +1.892 |
synd | +1.807 |
utt | +1.694 |
andowski | +1.611 |
Neg logit contributions | |
Guilty | -6.608 |
GH | -5.700 |
naire | -5.653 |
que | -5.526 |
NG | -5.505 |
Token | over |
Token ID | 625 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
Guilty | +6.902 |
que | +6.254 |
GH | +5.805 |
naire | +5.678 |
NG | +5.626 |
Neg logit contributions | |
�醒 | -10.688 |
Synd | -9.752 |
ahime | -9.396 |
anda | -9.212 |
Tad | -9.157 |
Token | right |
Token ID | 826 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
que | +9.275 |
Guilty | +9.115 |
ready | +7.440 |
wrong | +7.301 |
NG | +6.587 |
Neg logit contributions | |
�醒 | -29.444 |
ahime | -25.531 |
gypt | -23.567 |
Tad | -23.195 |
nces | -23.163 |
Token | ? |
Token ID | 30 |
Feature activation | -9.57e-01 |
Pos logit contributions | |
Synd | +0.872 |
synd | +0.835 |
anda | +0.831 |
�醒 | +0.791 |
Tad | +0.764 |
Neg logit contributions | |
Guilty | -1.704 |
GH | -1.447 |
naire | -1.415 |
que | -1.414 |
NG | -1.410 |
Token | Any |
Token ID | 7149 |
Feature activation | -4.96e-01 |
Pos logit contributions | |
Guilty | +8.947 |
NG | +7.298 |
naire | +7.005 |
GH | +6.998 |
que | +6.812 |
Neg logit contributions | |
synd | -11.825 |
utt | -11.729 |
ahime | -11.686 |
anda | -11.670 |
Synd | -11.556 |
Token | ways |
Token ID | 1322 |
Feature activation | -7.85e-01 |
Pos logit contributions | |
Guilty | +4.943 |
ready | +4.164 |
que | +4.101 |
GH | +4.043 |
NG | +3.980 |
Neg logit contributions | |
�醒 | -6.899 |
Synd | -6.742 |
synd | -6.455 |
Tad | -6.288 |
ahime | -6.222 |
Token | , |
Token ID | 11 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
Guilty | +7.847 |
GH | +6.726 |
NG | +6.590 |
ready | +6.420 |
que | +6.416 |
Neg logit contributions | |
�醒 | -11.038 |
ahime | -9.792 |
Synd | -9.607 |
commer | -9.552 |
anda | -9.365 |
Token | the |
Token ID | 262 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
Guilty | +7.802 |
que | +6.472 |
GH | +6.380 |
NG | +6.349 |
naire | +6.115 |
Neg logit contributions | |
�醒 | -7.452 |
Synd | -7.349 |
anda | -7.238 |
synd | -7.147 |
ahime | -7.110 |
Token | world |
Token ID | 995 |
Feature activation | -6.13e-01 |
Pos logit contributions | |
Guilty | +12.026 |
que | +10.572 |
NG | +9.899 |
GH | +9.590 |
ready | +9.289 |
Neg logit contributions | |
�醒 | -11.543 |
iliate | -10.971 |
anda | -10.948 |
rint | -10.835 |
andowski | -10.790 |
Token | , |
Token ID | 11 |
Feature activation | -8.45e-01 |
Pos logit contributions | |
Guilty | +7.289 |
que | +6.060 |
GH | +5.993 |
NG | +5.947 |
naire | +5.870 |
Neg logit contributions | |
Synd | -6.913 |
�醒 | -6.832 |
synd | -6.544 |
anda | -6.466 |
ahime | -6.405 |
Token | not |
Token ID | 407 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
Guilty | +10.641 |
que | +9.157 |
GH | +8.564 |
NG | +8.559 |
ready | +8.512 |
Neg logit contributions | |
�醒 | -8.833 |
Synd | -8.161 |
ahime | -8.019 |
anda | -7.864 |
synd | -7.719 |
Token | solely |
Token ID | 9944 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Guilty | +13.839 |
que | +11.778 |
NG | +11.183 |
GH | +10.986 |
ready | +10.885 |
Neg logit contributions | |
�醒 | -10.345 |
ahime | -10.268 |
Synd | -9.831 |
anda | -9.691 |
arta | -9.246 |
Token | to |
Token ID | 284 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
Guilty | +14.981 |
que | +12.962 |
GH | +11.569 |
NG | +11.549 |
anted | +11.468 |
Neg logit contributions | |
�醒 | -15.547 |
ahime | -14.894 |
anda | -14.042 |
Synd | -13.821 |
utt | -13.638 |
Token | the |
Token ID | 262 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
Guilty | +17.546 |
que | +15.977 |
GH | +14.668 |
NG | +14.370 |
ready | +14.156 |
Neg logit contributions | |
�醒 | -16.628 |
ahime | -14.623 |
anda | -14.133 |
SourceFile | -14.123 |
owship | -14.017 |
Token | people |
Token ID | 661 |
Feature activation | -8.63e-01 |
Pos logit contributions | |
Guilty | +14.476 |
que | +12.903 |
NG | +11.952 |
GH | +11.551 |
lottery | +11.508 |
Neg logit contributions | |
�醒 | -11.446 |
iliate | -10.146 |
anda | -10.052 |
andowski | -10.026 |
ahime | -10.003 |
Token | he |
Token ID | 339 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
Guilty | +9.929 |
que | +8.883 |
NG | +8.354 |
GH | +8.153 |
naire | +8.064 |
Neg logit contributions | |
�醒 | -9.666 |
Synd | -8.963 |
anda | -8.746 |
ahime | -8.698 |
synd | -8.634 |
Token | governs |
Token ID | 47049 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
Guilty | +6.612 |
que | +5.630 |
GH | +5.592 |
naire | +5.460 |
NG | +5.457 |
Neg logit contributions | |
�醒 | -6.491 |
Synd | -6.465 |
synd | -6.149 |
anda | -6.060 |
ahime | -5.973 |
Token | : |
Token ID | 25 |
Feature activation | -7.32e-01 |
Pos logit contributions | |
Guilty | +8.234 |
GH | +6.969 |
que | +6.947 |
NG | +6.805 |
ready | +6.684 |
Neg logit contributions | |
�醒 | -7.696 |
Synd | -7.589 |
synd | -7.233 |
anda | -7.226 |
ahime | -7.176 |
Token | ], |
Token ID | 4357 |
Feature activation | -2.25e-01 |
Pos logit contributions | |
Guilty | +1.111 |
GH | +0.926 |
naire | +0.902 |
que | +0.902 |
NG | +0.901 |
Neg logit contributions | |
Synd | -0.847 |
synd | -0.820 |
�醒 | -0.820 |
anda | -0.814 |
ahime | -0.772 |
Token | � |
Token ID | 447 |
Feature activation | -7.37e-02 |
Pos logit contributions | |
Guilty | +3.094 |
GH | +2.576 |
que | +2.519 |
NG | +2.502 |
naire | +2.488 |
Neg logit contributions | |
Synd | -2.339 |
�醒 | -2.287 |
synd | -2.271 |
anda | -2.225 |
ahime | -2.151 |
Token | � |
Token ID | 251 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
Guilty | +1.155 |
GH | +0.983 |
naire | +0.962 |
que | +0.960 |
NG | +0.960 |
Neg logit contributions | |
Synd | -0.639 |
synd | -0.618 |
anda | -0.610 |
�醒 | -0.607 |
ahime | -0.563 |
Token | D |
Token ID | 360 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
Synd | +2.790 |
anda | +2.723 |
synd | +2.706 |
�醒 | +2.578 |
Tad | +2.549 |
Neg logit contributions | |
Guilty | -3.668 |
GH | -3.081 |
naire | -3.003 |
NG | -2.962 |
que | -2.926 |
Token | ang |
Token ID | 648 |
Feature activation | -6.44e-01 |
Pos logit contributions | |
Guilty | +1.724 |
GH | +1.456 |
NG | +1.418 |
naire | +1.406 |
que | +1.403 |
Neg logit contributions | |
Synd | -1.239 |
synd | -1.201 |
�醒 | -1.189 |
anda | -1.168 |
Tad | -1.108 |
Token | - |
Token ID | 12 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
Guilty | +7.886 |
GH | +6.513 |
naire | +6.500 |
que | +6.311 |
NG | +6.177 |
Neg logit contributions | |
Synd | -7.035 |
�醒 | -6.888 |
synd | -6.836 |
ahime | -6.714 |
anda | -6.575 |
Token | Hall |
Token ID | 34194 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
Guilty | +10.065 |
GH | +9.944 |
naire | +9.318 |
NG | +9.151 |
Hall | +9.136 |
Neg logit contributions | |
�醒 | -26.104 |
commer | -22.850 |
ahime | -22.552 |
Synd | -22.232 |
mathemat | -22.005 |
Token | er |
Token ID | 263 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
Guilty | +3.265 |
GH | +2.669 |
naire | +2.642 |
NG | +2.621 |
ready | +2.610 |
Neg logit contributions | |
�醒 | -3.103 |
Synd | -3.097 |
synd | -2.997 |
anda | -2.915 |
ahime | -2.858 |
Token | says |
Token ID | 1139 |
Feature activation | -4.75e-01 |
Pos logit contributions | |
Guilty | +2.519 |
GH | +2.026 |
que | +1.986 |
naire | +1.973 |
NG | +1.954 |
Neg logit contributions | |
Synd | -2.586 |
�醒 | -2.534 |
synd | -2.498 |
anda | -2.484 |
ahime | -2.397 |
Token | . |
Token ID | 13 |
Feature activation | -4.62e-02 |
Pos logit contributions | |
Guilty | +6.024 |
GH | +4.970 |
que | +4.891 |
naire | +4.864 |
NG | +4.795 |
Neg logit contributions | |
Synd | -5.200 |
synd | -4.998 |
�醒 | -4.966 |
anda | -4.913 |
ahime | -4.909 |
Token | � |
Token ID | 564 |
Feature activation | +5.69e-01 |
Pos logit contributions | |
Guilty | +0.641 |
GH | +0.532 |
naire | +0.519 |
NG | +0.518 |
que | +0.517 |
Neg logit contributions | |
Synd | -0.483 |
synd | -0.470 |
�醒 | -0.466 |
anda | -0.466 |
ahime | -0.438 |
Token | i |
Token ID | 1312 |
Feature activation | -4.22e-01 |
Pos logit contributions | |
Guilty | +6.135 |
que | +5.096 |
GH | +5.020 |
NG | +4.989 |
naire | +4.910 |
Neg logit contributions | |
�醒 | -4.686 |
Synd | -4.537 |
anda | -4.391 |
synd | -4.343 |
ahime | -4.305 |
Token | . |
Token ID | 13 |
Feature activation | -6.24e-02 |
Pos logit contributions | |
Guilty | +5.377 |
GH | +4.562 |
NG | +4.448 |
que | +4.380 |
ready | +4.295 |
Neg logit contributions | |
Synd | -4.646 |
�醒 | -4.640 |
synd | -4.535 |
anda | -4.433 |
ahime | -4.371 |
Token | e |
Token ID | 68 |
Feature activation | -3.64e-01 |
Pos logit contributions | |
Guilty | +1.000 |
GH | +0.857 |
naire | +0.839 |
NG | +0.839 |
que | +0.836 |
Neg logit contributions | |
Synd | -0.518 |
�醒 | -0.501 |
synd | -0.498 |
anda | -0.492 |
ahime | -0.457 |
Token | . |
Token ID | 13 |
Feature activation | -6.69e-01 |
Pos logit contributions | |
Guilty | +4.234 |
GH | +3.455 |
NG | +3.346 |
que | +3.343 |
naire | +3.294 |
Neg logit contributions | |
Synd | -4.483 |
synd | -4.356 |
anda | -4.321 |
�醒 | -4.273 |
ahime | -4.184 |
Token | those |
Token ID | 883 |
Feature activation | -5.95e-01 |
Pos logit contributions | |
Guilty | +8.689 |
que | +7.242 |
GH | +7.053 |
NG | +7.024 |
ready | +6.884 |
Neg logit contributions | |
�醒 | -7.108 |
Synd | -6.851 |
anda | -6.624 |
ahime | -6.558 |
synd | -6.447 |
Token | who |
Token ID | 508 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
Guilty | +7.998 |
que | +6.751 |
GH | +6.525 |
NG | +6.481 |
naire | +6.425 |
Neg logit contributions | |
�醒 | -6.211 |
Synd | -5.934 |
anda | -5.791 |
ahime | -5.632 |
synd | -5.604 |
Token | voted |
Token ID | 7052 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
Guilty | +15.784 |
que | +15.051 |
NG | +12.938 |
ready | +12.874 |
GH | +12.833 |
Neg logit contributions | |
�醒 | -19.253 |
ahime | -16.530 |
Synd | -16.364 |
SourceFile | -15.959 |
anda | -15.499 |
Token | in |
Token ID | 287 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
Guilty | +14.771 |
que | +12.097 |
lottery | +11.194 |
NG | +11.088 |
ready | +10.912 |
Neg logit contributions | |
�醒 | -14.005 |
ahime | -13.384 |
Synd | -12.565 |
anda | -12.535 |
gypt | -12.519 |
Token | the |
Token ID | 262 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
Guilty | +13.066 |
que | +11.151 |
NG | +10.328 |
lottery | +10.323 |
ready | +10.126 |
Neg logit contributions | |
�醒 | -11.330 |
anda | -10.534 |
Synd | -10.364 |
andowski | -10.349 |
ahime | -10.294 |
Token | previous |
Token ID | 2180 |
Feature activation | -8.59e-01 |
Pos logit contributions | |
Guilty | +7.931 |
que | +6.425 |
GH | +6.274 |
ready | +6.175 |
naire | +6.165 |
Neg logit contributions | |
�醒 | -6.679 |
Synd | -6.532 |
anda | -6.378 |
synd | -6.275 |
ahime | -6.130 |
Token | election |
Token ID | 3071 |
Feature activation | -6.68e-01 |
Pos logit contributions | |
Guilty | +9.842 |
que | +8.056 |
GH | +7.608 |
naire | +7.478 |
lottery | +7.470 |
Neg logit contributions | |
�醒 | -9.907 |
Synd | -9.648 |
anda | -9.396 |
synd | -9.237 |
andowski | -9.080 |
Token | tracking |
Token ID | 9646 |
Feature activation | +2.73e-01 |
Pos logit contributions | |
synd | +6.792 |
Synd | +6.670 |
anda | +6.570 |
utt | +6.097 |
andowski | +6.039 |
Neg logit contributions | |
Guilty | -8.995 |
isSpecialOrderable | -7.293 |
GH | -7.264 |
NG | -7.054 |
naire | -7.041 |
Token | of |
Token ID | 286 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
Synd | +2.677 |
synd | +2.646 |
anda | +2.630 |
�醒 | +2.535 |
utt | +2.447 |
Neg logit contributions | |
Guilty | -3.913 |
GH | -3.238 |
NG | -3.164 |
naire | -3.160 |
que | -3.116 |
Token | homeless |
Token ID | 10463 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
Guilty | +2.509 |
GH | +2.042 |
que | +2.019 |
naire | +1.987 |
NG | +1.978 |
Neg logit contributions | |
Synd | -2.339 |
�醒 | -2.314 |
anda | -2.258 |
synd | -2.253 |
ahime | -2.175 |
Token | people |
Token ID | 661 |
Feature activation | -3.67e-01 |
Pos logit contributions | |
Guilty | +3.360 |
GH | +2.855 |
que | +2.827 |
naire | +2.795 |
NG | +2.782 |
Neg logit contributions | |
Synd | -2.116 |
�醒 | -2.097 |
anda | -2.015 |
synd | -2.013 |
ahime | -1.930 |
Token | as |
Token ID | 355 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
Guilty | +4.812 |
que | +4.045 |
GH | +4.001 |
naire | +3.959 |
NG | +3.913 |
Neg logit contributions | |
Synd | -3.938 |
�醒 | -3.888 |
synd | -3.757 |
anda | -3.689 |
ahime | -3.622 |
Token | they |
Token ID | 484 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
Synd | +0.932 |
synd | +0.906 |
anda | +0.893 |
�醒 | +0.879 |
Tad | +0.830 |
Neg logit contributions | |
Guilty | -1.535 |
GH | -1.298 |
NG | -1.267 |
naire | -1.266 |
que | -1.251 |
Token | seek |
Token ID | 5380 |
Feature activation | +4.38e-02 |
Pos logit contributions | |
que | +16.241 |
Guilty | +15.631 |
naire | +13.919 |
GH | +13.637 |
anted | +13.533 |
Neg logit contributions | |
�醒 | -18.293 |
Synd | -15.507 |
ahime | -15.193 |
SourceFile | -14.978 |
owship | -14.539 |
Token | services |
Token ID | 2594 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
Synd | +0.464 |
synd | +0.451 |
anda | +0.448 |
�醒 | +0.443 |
Tad | +0.420 |
Neg logit contributions | |
Guilty | -0.603 |
GH | -0.501 |
naire | -0.488 |
NG | -0.487 |
que | -0.484 |
Token | and |
Token ID | 290 |
Feature activation | -4.02e-01 |
Pos logit contributions | |
Guilty | +4.749 |
que | +3.963 |
GH | +3.924 |
NG | +3.868 |
naire | +3.829 |
Neg logit contributions | |
Synd | -3.925 |
�醒 | -3.889 |
synd | -3.741 |
anda | -3.721 |
ahime | -3.638 |
Token | better |
Token ID | 1365 |
Feature activation | +5.50e-01 |
Pos logit contributions | |
Guilty | +5.244 |
que | +4.369 |
GH | +4.306 |
naire | +4.278 |
NG | +4.220 |
Neg logit contributions | |
�醒 | -4.449 |
Synd | -4.346 |
anda | -4.190 |
ahime | -4.144 |
synd | -4.114 |
Token | tracking |
Token ID | 9646 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
synd | +5.856 |
Synd | +5.781 |
anda | +5.671 |
utt | +5.274 |
andowski | +5.209 |
Neg logit contributions | |
Guilty | -7.196 |
GH | -5.857 |
isSpecialOrderable | -5.660 |
NG | -5.613 |
naire | -5.546 |
Token | Old |
Token ID | 5706 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Guilty | +4.992 |
GH | +4.069 |
naire | +3.995 |
NG | +3.964 |
que | +3.925 |
Neg logit contributions | |
�醒 | -3.465 |
synd | -3.453 |
Synd | -3.448 |
anda | -3.389 |
ahime | -3.286 |
Token | gift |
Token ID | 6979 |
Feature activation | +2.68e-02 |
Pos logit contributions | |
Guilty | +12.384 |
naire | +10.070 |
GH | +9.865 |
que | +9.772 |
NG | +9.609 |
Neg logit contributions | |
Synd | -12.797 |
ahime | -12.206 |
anda | -11.935 |
synd | -11.861 |
�醒 | -11.845 |
Token | – |
Token ID | 1906 |
Feature activation | +7.47e-02 |
Pos logit contributions | |
Synd | +0.255 |
synd | +0.247 |
anda | +0.245 |
�醒 | +0.244 |
Tad | +0.228 |
Neg logit contributions | |
Guilty | -0.398 |
GH | -0.335 |
naire | -0.327 |
NG | -0.326 |
que | -0.326 |
Token | be |
Token ID | 1350 |
Feature activation | +3.55e-01 |
Pos logit contributions | |
Synd | +0.393 |
anda | +0.372 |
synd | +0.371 |
�醒 | +0.355 |
Tad | +0.320 |
Neg logit contributions | |
Guilty | -1.426 |
GH | -1.246 |
que | -1.222 |
NG | -1.221 |
naire | -1.220 |
Token | arer |
Token ID | 11258 |
Feature activation | +8.28e-02 |
Pos logit contributions | |
anda | +3.462 |
Synd | +3.392 |
synd | +3.321 |
Tad | +3.167 |
�醒 | +3.163 |
Neg logit contributions | |
Guilty | -5.100 |
GH | -4.323 |
que | -4.082 |
NG | -4.055 |
naire | -4.041 |
Token | setting |
Token ID | 4634 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
Synd | +0.777 |
synd | +0.758 |
anda | +0.744 |
�醒 | +0.727 |
Tad | +0.693 |
Neg logit contributions | |
Guilty | -1.243 |
GH | -1.050 |
naire | -1.024 |
NG | -1.018 |
que | -1.009 |
Token | box |
Token ID | 3091 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
Guilty | +6.986 |
que | +6.369 |
box | +5.953 |
naire | +5.392 |
boxes | +5.335 |
Neg logit contributions | |
�醒 | -28.270 |
ahime | -25.587 |
Synd | -25.527 |
ciating | -24.249 |
nces | -24.178 |
Token | underneath |
Token ID | 14638 |
Feature activation | -6.93e-01 |
Pos logit contributions | |
Guilty | +3.094 |
GH | +2.529 |
que | +2.521 |
naire | +2.509 |
NG | +2.475 |
Neg logit contributions | |
Synd | -2.608 |
synd | -2.521 |
�醒 | -2.512 |
anda | -2.482 |
ahime | -2.387 |
Token | roughly |
Token ID | 7323 |
Feature activation | -6.13e-01 |
Pos logit contributions | |
Guilty | +6.742 |
que | +5.421 |
GH | +5.361 |
naire | +5.291 |
ready | +5.279 |
Neg logit contributions | |
Synd | -9.166 |
�醒 | -8.948 |
ahime | -8.849 |
synd | -8.816 |
anda | -8.758 |
Token | ( |
Token ID | 357 |
Feature activation | -9.82e-01 |
Pos logit contributions | |
Guilty | +7.214 |
GH | +6.091 |
que | +6.038 |
naire | +5.894 |
ready | +5.852 |
Neg logit contributions | |
�醒 | -7.043 |
Synd | -6.946 |
synd | -6.719 |
ahime | -6.639 |
anda | -6.440 |
Token | 6 |
Token ID | 21 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
Guilty | +7.181 |
GH | +6.128 |
NG | +5.848 |
ready | +5.514 |
naire | +5.355 |
Neg logit contributions | |
Synd | -14.233 |
synd | -14.056 |
�醒 | -13.968 |
Mutual | -13.578 |
Tad | -13.405 |
Token | the |
Token ID | 262 |
Feature activation | -8.57e-01 |
Pos logit contributions | |
Guilty | +8.278 |
que | +6.705 |
NG | +6.600 |
GH | +6.584 |
naire | +6.449 |
Neg logit contributions | |
�醒 | -8.347 |
Synd | -7.576 |
ahime | -7.542 |
anda | -7.488 |
andowski | -7.454 |
Token | same |
Token ID | 976 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
Guilty | +9.565 |
que | +7.730 |
GH | +7.419 |
NG | +7.269 |
lottery | +7.262 |
Neg logit contributions | |
�醒 | -9.937 |
ahime | -9.728 |
Synd | -9.437 |
anda | -9.296 |
gypt | -9.177 |
Token | rink |
Token ID | 47925 |
Feature activation | -8.89e-01 |
Pos logit contributions | |
Guilty | +6.525 |
que | +5.308 |
GH | +5.139 |
NG | +5.050 |
naire | +4.971 |
Neg logit contributions | |
�醒 | -6.938 |
Synd | -6.857 |
ahime | -6.665 |
anda | -6.630 |
utt | -6.452 |
Token | each |
Token ID | 1123 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
Guilty | +10.053 |
que | +8.653 |
NG | +8.185 |
GH | +8.008 |
ready | +8.007 |
Neg logit contributions | |
�醒 | -10.414 |
ahime | -9.574 |
Synd | -9.388 |
anda | -9.210 |
iliate | -8.951 |
Token | and |
Token ID | 290 |
Feature activation | -3.84e-01 |
Pos logit contributions | |
Guilty | +12.283 |
que | +10.553 |
NG | +10.385 |
lottery | +10.117 |
GH | +9.993 |
Neg logit contributions | |
�醒 | -16.778 |
andowski | -15.829 |
ahime | -15.827 |
Synd | -15.504 |
anda | -15.335 |
Token | every |
Token ID | 790 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
Guilty | +3.976 |
GH | +3.154 |
que | +3.141 |
naire | +3.059 |
NG | +3.046 |
Neg logit contributions | |
�醒 | -5.189 |
Synd | -5.142 |
anda | -4.990 |
synd | -4.946 |
ahime | -4.876 |
Token | day |
Token ID | 1110 |
Feature activation | -7.48e-01 |
Pos logit contributions | |
Guilty | +12.410 |
NG | +10.804 |
que | +10.586 |
lottery | +10.301 |
naire | +10.073 |
Neg logit contributions | |
�醒 | -19.892 |
andowski | -19.435 |
ahime | -18.958 |
gypt | -18.714 |
Synd | -18.513 |
Token | , |
Token ID | 11 |
Feature activation | -7.71e-01 |
Pos logit contributions | |
Guilty | +8.849 |
que | +7.588 |
NG | +7.196 |
GH | +7.064 |
ready | +7.022 |
Neg logit contributions | |
�醒 | -8.641 |
ahime | -8.129 |
Synd | -8.094 |
anda | -7.791 |
synd | -7.651 |
Token | and |
Token ID | 290 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
Guilty | +9.656 |
que | +8.186 |
NG | +7.709 |
GH | +7.677 |
ready | +7.591 |
Neg logit contributions | |
�醒 | -8.567 |
ahime | -7.942 |
Synd | -7.902 |
anda | -7.676 |
synd | -7.487 |
Token | now |
Token ID | 783 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
Guilty | +3.626 |
GH | +2.991 |
que | +2.980 |
NG | +2.938 |
naire | +2.918 |
Neg logit contributions | |
�醒 | -2.693 |
Synd | -2.620 |
anda | -2.542 |
synd | -2.533 |
ahime | -2.464 |
Token | to |
Token ID | 284 |
Feature activation | -3.69e-01 |
Pos logit contributions | |
Guilty | +3.158 |
GH | +2.617 |
que | +2.584 |
NG | +2.569 |
naire | +2.546 |
Neg logit contributions | |
�醒 | -2.275 |
Synd | -2.233 |
anda | -2.166 |
synd | -2.160 |
ahime | -2.089 |
Token | sequence |
Token ID | 8379 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
Synd | +0.055 |
synd | +0.053 |
anda | +0.053 |
�醒 | +0.053 |
Tad | +0.049 |
Neg logit contributions | |
Guilty | -0.078 |
GH | -0.066 |
naire | -0.064 |
NG | -0.064 |
que | -0.064 |
Token | takes |
Token ID | 2753 |
Feature activation | +6.06e-01 |
Pos logit contributions | |
Guilty | +1.742 |
GH | +1.376 |
que | +1.366 |
naire | +1.343 |
NG | +1.327 |
Neg logit contributions | |
Synd | -2.056 |
�醒 | -2.038 |
anda | -1.997 |
synd | -1.990 |
ahime | -1.920 |
Token | place |
Token ID | 1295 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
Synd | +5.035 |
synd | +5.013 |
anda | +4.689 |
Tad | +4.583 |
utt | +4.425 |
Neg logit contributions | |
Guilty | -9.446 |
naire | -7.847 |
GH | -7.775 |
NG | -7.699 |
isSpecialOrderable | -7.556 |
Token | in |
Token ID | 287 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
Guilty | +2.432 |
GH | +2.013 |
que | +1.987 |
naire | +1.976 |
NG | +1.967 |
Neg logit contributions | |
�醒 | -1.923 |
Synd | -1.903 |
anda | -1.845 |
synd | -1.845 |
ahime | -1.764 |
Token | the |
Token ID | 262 |
Feature activation | +8.27e-01 |
Pos logit contributions | |
Synd | +1.873 |
synd | +1.806 |
anda | +1.775 |
Tad | +1.684 |
�醒 | +1.667 |
Neg logit contributions | |
Guilty | -2.872 |
GH | -2.426 |
naire | -2.365 |
NG | -2.357 |
que | -2.335 |
Token | library |
Token ID | 5888 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
Synd | +6.382 |
synd | +6.331 |
anda | +6.123 |
Carnegie | +5.897 |
Berkshire | +5.870 |
Neg logit contributions | |
Guilty | -12.536 |
GH | -10.962 |
NG | -10.507 |
naire | -10.469 |
anted | -9.980 |
Token | inside |
Token ID | 2641 |
Feature activation | +4.25e-01 |
Pos logit contributions | |
Guilty | +10.765 |
que | +9.626 |
ready | +8.388 |
gates | +8.290 |
NG | +7.754 |
Neg logit contributions | |
�醒 | -25.074 |
ahime | -22.238 |
Synd | -21.190 |
gypt | -20.576 |
utt | -20.560 |
Token | the |
Token ID | 262 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
Synd | +3.738 |
synd | +3.528 |
anda | +3.425 |
Tad | +3.351 |
Mutual | +3.290 |
Neg logit contributions | |
Guilty | -6.488 |
GH | -5.532 |
naire | -5.407 |
NG | -5.406 |
que | -5.326 |
Token | in |
Token ID | 259 |
Feature activation | +7.27e-01 |
Pos logit contributions | |
Synd | +7.799 |
anda | +6.939 |
Mutual | +6.922 |
Berkshire | +6.909 |
synd | +6.810 |
Neg logit contributions | |
Guilty | -22.194 |
GH | -19.881 |
NG | -19.604 |
� | -19.211 |
proble | -19.124 |
Token | Border |
Token ID | 15443 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
anda | +7.557 |
Synd | +7.553 |
synd | +7.357 |
Mutual | +7.040 |
Berkshire | +7.007 |
Neg logit contributions | |
Guilty | -9.176 |
GH | -7.474 |
naire | -7.333 |
NG | -7.252 |
que | -7.198 |
Token | land |
Token ID | 1044 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
anda | +5.958 |
Synd | +5.726 |
synd | +5.084 |
nt | +4.929 |
ter | +4.635 |
Neg logit contributions | |
� | -26.960 |
Guilty | -26.387 |
� | -25.773 |
� | -25.762 |
proble | -25.093 |
Token | i |
Token ID | 72 |
Feature activation | -5.80e-01 |
Pos logit contributions | |
Guilty | +8.217 |
GH | +7.234 |
NG | +7.206 |
ready | +6.955 |
naire | +6.871 |
Neg logit contributions | |
Synd | -6.782 |
�醒 | -6.653 |
synd | -6.602 |
ahime | -6.217 |
anda | -6.148 |
Token | . |
Token ID | 13 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
Guilty | +6.683 |
GH | +5.720 |
NG | +5.630 |
naire | +5.395 |
ready | +5.383 |
Neg logit contributions | |
�醒 | -7.277 |
Synd | -6.778 |
ahime | -6.635 |
synd | -6.618 |
anda | -6.431 |
Token | e |
Token ID | 68 |
Feature activation | -7.63e-01 |
Pos logit contributions | |
Guilty | +3.940 |
GH | +3.397 |
NG | +3.340 |
naire | +3.314 |
ready | +3.306 |
Neg logit contributions | |
�醒 | -2.493 |
Synd | -2.402 |
synd | -2.324 |
anda | -2.255 |
ahime | -2.207 |
Token | . |
Token ID | 13 |
Feature activation | -8.72e-01 |
Pos logit contributions | |
Guilty | +8.310 |
GH | +6.816 |
que | +6.742 |
NG | +6.667 |
ready | +6.442 |
Neg logit contributions | |
Synd | -9.018 |
synd | -8.721 |
ahime | -8.654 |
anda | -8.565 |
�醒 | -8.409 |
Token | those |
Token ID | 883 |
Feature activation | -9.45e-01 |
Pos logit contributions | |
Guilty | +9.952 |
que | +8.348 |
GH | +8.040 |
NG | +8.025 |
ready | +7.814 |
Neg logit contributions | |
�醒 | -9.913 |
Synd | -9.436 |
ahime | -9.303 |
anda | -9.174 |
synd | -8.996 |
Token | who |
Token ID | 508 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Guilty | +11.262 |
que | +9.697 |
NG | +9.104 |
GH | +9.068 |
ready | +8.979 |
Neg logit contributions | |
�醒 | -10.366 |
Synd | -9.578 |
ahime | -9.490 |
anda | -9.297 |
synd | -9.030 |
Token | voted |
Token ID | 7052 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
Guilty | +14.141 |
que | +13.797 |
GH | +11.621 |
naire | +11.464 |
ready | +11.339 |
Neg logit contributions | |
�醒 | -19.247 |
ahime | -17.108 |
Synd | -16.980 |
SourceFile | -16.079 |
rint | -16.019 |
Token | in |
Token ID | 287 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
Guilty | +12.287 |
que | +10.197 |
NG | +9.518 |
ready | +9.518 |
GH | +9.331 |
Neg logit contributions | |
�醒 | -12.487 |
ahime | -11.889 |
Synd | -11.845 |
anda | -11.661 |
gypt | -11.617 |
Token | the |
Token ID | 262 |
Feature activation | -9.77e-01 |
Pos logit contributions | |
Guilty | +11.049 |
que | +9.210 |
NG | +8.851 |
GH | +8.751 |
lottery | +8.617 |
Neg logit contributions | |
�醒 | -11.686 |
Synd | -11.470 |
anda | -11.238 |
andowski | -11.222 |
gypt | -11.079 |
Token | previous |
Token ID | 2180 |
Feature activation | -5.88e-01 |
Pos logit contributions | |
Guilty | +8.886 |
que | +6.992 |
lottery | +6.665 |
GH | +6.493 |
NG | +6.467 |
Neg logit contributions | |
�醒 | -12.568 |
Synd | -12.486 |
anda | -12.164 |
synd | -11.995 |
gypt | -11.976 |
Token | election |
Token ID | 3071 |
Feature activation | -8.22e-01 |
Pos logit contributions | |
Guilty | +4.574 |
GH | +3.286 |
que | +3.240 |
naire | +3.128 |
NG | +3.124 |
Neg logit contributions | |
Synd | -9.225 |
synd | -8.886 |
�醒 | -8.867 |
anda | -8.791 |
andowski | -8.594 |
Token | fun |
Token ID | 1257 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
Guilty | +8.895 |
que | +7.473 |
GH | +7.454 |
NG | +7.162 |
ready | +6.987 |
Neg logit contributions | |
�醒 | -7.400 |
Synd | -6.780 |
ahime | -6.586 |
anda | -6.559 |
synd | -6.487 |
Token | . |
Token ID | 13 |
Feature activation | -3.73e-01 |
Pos logit contributions | |
Guilty | +1.893 |
GH | +1.581 |
que | +1.544 |
naire | +1.539 |
NG | +1.539 |
Neg logit contributions | |
Synd | -1.385 |
�醒 | -1.346 |
synd | -1.344 |
anda | -1.327 |
ahime | -1.260 |
Token |
|
Token ID | 198 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
Guilty | +5.075 |
GH | +4.116 |
NG | +4.011 |
naire | +3.948 |
que | +3.934 |
Neg logit contributions | |
�醒 | -3.980 |
synd | -3.929 |
Synd | -3.915 |
anda | -3.842 |
ahime | -3.821 |
Token |
|
Token ID | 198 |
Feature activation | +3.55e-02 |
Pos logit contributions | |
Guilty | +1.667 |
GH | +1.391 |
NG | +1.356 |
naire | +1.348 |
que | +1.342 |
Neg logit contributions | |
�醒 | -1.354 |
Synd | -1.352 |
synd | -1.316 |
anda | -1.305 |
ahime | -1.255 |
Token | X |
Token ID | 55 |
Feature activation | -5.89e-01 |
Pos logit contributions | |
Synd | +0.457 |
synd | +0.446 |
anda | +0.445 |
�醒 | +0.443 |
Tad | +0.421 |
Neg logit contributions | |
Guilty | -0.406 |
GH | -0.321 |
naire | -0.313 |
que | -0.312 |
NG | -0.310 |
Token | avier |
Token ID | 19492 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
Guilty | +5.762 |
GH | +4.707 |
NG | +4.567 |
que | +4.490 |
naire | +4.418 |
Neg logit contributions | |
Synd | -8.028 |
�醒 | -8.024 |
synd | -7.801 |
ahime | -7.559 |
Tad | -7.434 |
Token | Gu |
Token ID | 1962 |
Feature activation | -5.26e-01 |
Pos logit contributions | |
Guilty | +12.634 |
GH | +9.228 |
naire | +7.822 |
NG | +7.661 |
que | +7.655 |
Neg logit contributions | |
�醒 | -25.591 |
ahime | -22.165 |
ntil | -21.896 |
owship | -21.570 |
commer | -21.330 |
Token | il |
Token ID | 346 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
Guilty | +5.471 |
GH | +4.482 |
NG | +4.323 |
naire | +4.242 |
itcher | +4.181 |
Neg logit contributions | |
�醒 | -7.347 |
Synd | -7.047 |
synd | -6.830 |
Tad | -6.574 |
ahime | -6.500 |
Token | bert |
Token ID | 4835 |
Feature activation | -5.09e-01 |
Pos logit contributions | |
anda | +2.638 |
Synd | +2.587 |
synd | +2.505 |
utt | +2.380 |
andowski | +2.344 |
Neg logit contributions | |
Guilty | -5.141 |
GH | -4.250 |
que | -4.177 |
NG | -4.176 |
naire | -4.173 |
Token | : |
Token ID | 1058 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
Guilty | +6.855 |
GH | +5.725 |
naire | +5.691 |
que | +5.682 |
NG | +5.563 |
Neg logit contributions | |
�醒 | -5.434 |
Synd | -4.974 |
ahime | -4.915 |
synd | -4.873 |
anda | -4.829 |
Token | Well |
Token ID | 3894 |
Feature activation | -6.52e-01 |
Pos logit contributions | |
Guilty | +1.831 |
GH | +1.497 |
naire | +1.456 |
NG | +1.455 |
que | +1.448 |
Neg logit contributions | |
Synd | -1.452 |
�醒 | -1.447 |
synd | -1.428 |
anda | -1.419 |
ahime | -1.356 |
Token | professor |
Token ID | 6240 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
Synd | +3.697 |
synd | +3.576 |
anda | +3.543 |
utt | +3.246 |
Tyrann | +3.140 |
Neg logit contributions | |
Guilty | -7.581 |
GH | -6.463 |
naire | -6.373 |
NG | -6.308 |
isSpecialOrderable | -6.264 |
Token | at |
Token ID | 379 |
Feature activation | +9.42e-02 |
Pos logit contributions | |
Guilty | +5.074 |
GH | +3.826 |
que | +3.822 |
ready | +3.768 |
naire | +3.686 |
Neg logit contributions | |
�醒 | -9.375 |
ahime | -8.847 |
Synd | -8.731 |
synd | -8.549 |
anda | -8.421 |
Token | Columbia |
Token ID | 9309 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
Synd | +1.054 |
anda | +1.022 |
synd | +1.021 |
�醒 | +1.005 |
Tad | +0.955 |
Neg logit contributions | |
Guilty | -1.240 |
GH | -1.018 |
naire | -0.996 |
que | -0.987 |
NG | -0.987 |
Token | University |
Token ID | 2059 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
Synd | +3.757 |
University | +3.304 |
Mutual | +3.153 |
anda | +3.000 |
Carnegie | +2.973 |
Neg logit contributions | |
Guilty | -24.864 |
isSpecialOrderable | -23.651 |
GH | -23.330 |
pse | -23.031 |
naire | -23.013 |
Token | , |
Token ID | 11 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
Guilty | +4.317 |
GH | +3.572 |
que | +3.503 |
NG | +3.484 |
naire | +3.462 |
Neg logit contributions | |
�醒 | -3.718 |
Synd | -3.590 |
synd | -3.499 |
anda | -3.489 |
ahime | -3.419 |
Token | where |
Token ID | 810 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
Guilty | +2.100 |
GH | +1.738 |
que | +1.705 |
NG | +1.704 |
naire | +1.688 |
Neg logit contributions | |
Synd | -1.644 |
�醒 | -1.631 |
synd | -1.592 |
anda | -1.582 |
ahime | -1.507 |
Token | some |
Token ID | 617 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
Guilty | +6.369 |
que | +4.998 |
NG | +4.476 |
GH | +4.215 |
gays | +3.612 |
Neg logit contributions | |
�醒 | -28.362 |
ahime | -25.927 |
anda | -24.378 |
iliate | -24.241 |
owship | -24.202 |
Token | filming |
Token ID | 17691 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
Guilty | +2.340 |
GH | +1.970 |
que | +1.944 |
NG | +1.926 |
naire | +1.908 |
Neg logit contributions | |
Synd | -1.631 |
�醒 | -1.615 |
synd | -1.564 |
anda | -1.555 |
ahime | -1.484 |
Token | took |
Token ID | 1718 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
Guilty | +4.778 |
que | +4.427 |
anted | +2.898 |
GH | +2.749 |
ready | +2.726 |
Neg logit contributions | |
�醒 | -20.235 |
Synd | -18.373 |
anda | -18.263 |
ahime | -18.189 |
iliate | -17.607 |
Token | place |
Token ID | 1295 |
Feature activation | -1.43e-02 |
Pos logit contributions | |
Synd | +3.050 |
synd | +3.031 |
anda | +2.926 |
Tad | +2.778 |
utt | +2.731 |
Neg logit contributions | |
Guilty | -4.742 |
GH | -3.924 |
naire | -3.881 |
NG | -3.835 |
isSpecialOrderable | -3.702 |
Token | near |
Token ID | 1474 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
Guilty | +0.204 |
GH | +0.170 |
naire | +0.166 |
NG | +0.166 |
que | +0.166 |
Neg logit contributions | |
Synd | -0.144 |
synd | -0.139 |
anda | -0.138 |
�醒 | -0.138 |
Tad | -0.129 |
Token | around |
Token ID | 1088 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
Synd | +4.632 |
synd | +4.501 |
anda | +4.369 |
�醒 | +4.127 |
Mutual | +4.071 |
Neg logit contributions | |
Guilty | -6.540 |
GH | -5.456 |
naire | -5.315 |
NG | -5.202 |
ready | -5.154 |
Token | 150 |
Token ID | 6640 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
Synd | +1.802 |
synd | +1.751 |
anda | +1.722 |
�醒 | +1.673 |
Tad | +1.604 |
Neg logit contributions | |
Guilty | -2.772 |
GH | -2.333 |
naire | -2.281 |
NG | -2.254 |
que | -2.236 |
Token | , |
Token ID | 11 |
Feature activation | -2.73e-02 |
Pos logit contributions | |
Guilty | +1.549 |
GH | +1.293 |
que | +1.264 |
NG | +1.262 |
naire | +1.259 |
Neg logit contributions | |
Synd | -1.144 |
�醒 | -1.106 |
synd | -1.106 |
anda | -1.105 |
ahime | -1.042 |
Token | 000 |
Token ID | 830 |
Feature activation | -4.89e-01 |
Pos logit contributions | |
Guilty | +0.416 |
GH | +0.352 |
naire | +0.344 |
NG | +0.344 |
que | +0.343 |
Neg logit contributions | |
Synd | -0.249 |
synd | -0.241 |
�醒 | -0.239 |
anda | -0.239 |
Tad | -0.222 |
Token | immigrants |
Token ID | 7971 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
Guilty | +6.599 |
que | +5.640 |
GH | +5.491 |
NG | +5.467 |
naire | +5.457 |
Neg logit contributions | |
�醒 | -4.931 |
Synd | -4.858 |
anda | -4.695 |
synd | -4.634 |
ahime | -4.619 |
Token | who |
Token ID | 508 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
Guilty | +11.432 |
que | +10.480 |
naire | +9.338 |
NG | +9.331 |
GH | +9.311 |
Neg logit contributions | |
�醒 | -11.998 |
Synd | -11.118 |
ahime | -10.857 |
SourceFile | -10.372 |
anda | -10.367 |
Token | are |
Token ID | 389 |
Feature activation | -8.23e-01 |
Pos logit contributions | |
Guilty | +14.488 |
que | +14.370 |
naire | +13.186 |
NG | +12.502 |
illegally | +12.310 |
Neg logit contributions | |
�醒 | -17.819 |
Synd | -16.234 |
ahime | -15.616 |
SourceFile | -15.430 |
rint | -15.350 |
Token | in |
Token ID | 287 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
Guilty | +9.627 |
que | +8.605 |
ready | +8.034 |
NG | +8.025 |
naire | +7.891 |
Neg logit contributions | |
�醒 | -8.966 |
Synd | -8.556 |
ahime | -8.455 |
anda | -8.346 |
synd | -8.216 |
Token | Spain |
Token ID | 8602 |
Feature activation | -9.80e-01 |
Pos logit contributions | |
Guilty | +5.574 |
que | +4.660 |
NG | +4.588 |
naire | +4.536 |
GH | +4.534 |
Neg logit contributions | |
Synd | -4.561 |
�醒 | -4.469 |
anda | -4.418 |
synd | -4.351 |
ahime | -4.239 |
Token | but |
Token ID | 475 |
Feature activation | -7.89e-01 |
Pos logit contributions | |
Guilty | +11.009 |
que | +9.914 |
ready | +9.215 |
naire | +8.909 |
NG | +8.869 |
Neg logit contributions | |
�醒 | -10.708 |
Synd | -10.358 |
ahime | -9.991 |
synd | -9.772 |
anda | -9.653 |
Token | do |
Token ID | 466 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
Guilty | +9.597 |
que | +8.496 |
ready | +8.002 |
GH | +7.962 |
NG | +7.942 |
Neg logit contributions | |
�醒 | -8.670 |
Synd | -8.052 |
anda | -7.753 |
synd | -7.702 |
ahime | -7.610 |
Token | the |
Token ID | 262 |
Feature activation | -7.87e-01 |
Pos logit contributions | |
Guilty | +10.507 |
que | +8.674 |
NG | +8.130 |
naire | +8.052 |
GH | +8.052 |
Neg logit contributions | |
�醒 | -10.611 |
anda | -9.628 |
Synd | -9.553 |
andowski | -9.234 |
ahime | -9.216 |
Token | time |
Token ID | 640 |
Feature activation | -4.03e-01 |
Pos logit contributions | |
Guilty | +9.489 |
que | +7.704 |
NG | +7.354 |
GH | +7.340 |
ready | +7.267 |
Neg logit contributions | |
�醒 | -9.220 |
Synd | -8.381 |
anda | -8.346 |
ahime | -7.964 |
andowski | -7.956 |
Token | Mason |
Token ID | 14737 |
Feature activation | -9.20e-01 |
Pos logit contributions | |
Guilty | +5.421 |
GH | +4.462 |
que | +4.431 |
naire | +4.407 |
NG | +4.354 |
Neg logit contributions | |
�醒 | -4.241 |
Synd | -4.138 |
anda | -4.069 |
synd | -4.020 |
ahime | -3.982 |
Token | was |
Token ID | 373 |
Feature activation | +4.14e-03 |
Pos logit contributions | |
Guilty | +10.274 |
que | +8.618 |
naire | +8.196 |
ready | +8.060 |
GH | +8.049 |
Neg logit contributions | |
�醒 | -10.763 |
Synd | -9.907 |
ahime | -9.658 |
anda | -9.474 |
iliate | -9.402 |
Token | ready |
Token ID | 3492 |
Feature activation | -5.19e-01 |
Pos logit contributions | |
Synd | +0.045 |
synd | +0.043 |
anda | +0.043 |
�醒 | +0.043 |
Tad | +0.040 |
Neg logit contributions | |
Guilty | -0.056 |
GH | -0.047 |
naire | -0.045 |
NG | -0.045 |
que | -0.045 |
Token | to |
Token ID | 284 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
Guilty | +6.320 |
GH | +5.096 |
que | +5.064 |
NG | +5.019 |
naire | +4.944 |
Neg logit contributions | |
�醒 | -5.958 |
Synd | -5.901 |
ahime | -5.747 |
anda | -5.730 |
synd | -5.691 |
Token | step |
Token ID | 2239 |
Feature activation | -6.28e-01 |
Pos logit contributions | |
Guilty | +16.002 |
que | +14.225 |
naire | +13.170 |
gamble | +13.009 |
GH | +12.573 |
Neg logit contributions | |
�醒 | -18.399 |
ahime | -15.566 |
anda | -15.105 |
SourceFile | -15.087 |
Synd | -14.659 |
Token | down |
Token ID | 866 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
Guilty | +9.570 |
que | +8.023 |
GH | +7.974 |
NG | +7.917 |
naire | +7.764 |
Neg logit contributions | |
�醒 | -5.467 |
Synd | -5.029 |
anda | -4.850 |
synd | -4.742 |
ahime | -4.655 |
Token | as |
Token ID | 355 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
Synd | +1.256 |
synd | +1.214 |
anda | +1.198 |
�醒 | +1.172 |
Tad | +1.124 |
Neg logit contributions | |
Guilty | -1.990 |
GH | -1.679 |
naire | -1.641 |
NG | -1.638 |
que | -1.626 |
Token | leader |
Token ID | 3554 |
Feature activation | -2.46e-01 |
Pos logit contributions | |
Synd | +3.132 |
synd | +3.038 |
anda | +2.963 |
�醒 | +2.896 |
Tad | +2.854 |
Neg logit contributions | |
Guilty | -3.696 |
GH | -3.040 |
naire | -2.987 |
NG | -2.948 |
que | -2.906 |
Token | , |
Token ID | 11 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
Guilty | +3.319 |
GH | +2.747 |
que | +2.693 |
naire | +2.689 |
NG | +2.672 |
Neg logit contributions | |
Synd | -2.602 |
�醒 | -2.563 |
anda | -2.520 |
synd | -2.514 |
ahime | -2.413 |
Token | 75 |
Token ID | 2425 |
Feature activation | +4.86e-01 |
Pos logit contributions | |
Synd | +3.397 |
synd | +3.270 |
anda | +3.268 |
Tad | +3.081 |
Mutual | +3.033 |
Neg logit contributions | |
Guilty | -6.272 |
GH | -5.230 |
naire | -5.219 |
NG | -5.195 |
que | -5.191 |
Token | Author |
Token ID | 6434 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
Synd | +4.813 |
synd | +4.606 |
anda | +4.586 |
Tad | +4.410 |
�醒 | +4.409 |
Neg logit contributions | |
Guilty | -6.710 |
GH | -5.636 |
naire | -5.557 |
que | -5.457 |
ready | -5.394 |
Token | : |
Token ID | 25 |
Feature activation | -2.54e-01 |
Pos logit contributions | |
Guilty | +3.155 |
GH | +2.630 |
naire | +2.573 |
NG | +2.570 |
que | +2.561 |
Neg logit contributions | |
Synd | -2.216 |
synd | -2.145 |
�醒 | -2.144 |
anda | -2.119 |
ahime | -2.023 |
Token | E |
Token ID | 412 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
Guilty | +3.495 |
GH | +2.892 |
que | +2.822 |
NG | +2.816 |
naire | +2.808 |
Neg logit contributions | |
Synd | -2.617 |
�醒 | -2.612 |
synd | -2.558 |
anda | -2.555 |
ahime | -2.461 |
Token | . |
Token ID | 13 |
Feature activation | -5.29e-01 |
Pos logit contributions | |
Guilty | +3.537 |
GH | +2.991 |
NG | +2.900 |
naire | +2.869 |
que | +2.858 |
Neg logit contributions | |
Synd | -2.831 |
synd | -2.740 |
�醒 | -2.734 |
anda | -2.688 |
ahime | -2.598 |
Token | S |
Token ID | 50 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
Guilty | +5.325 |
GH | +4.275 |
NG | +4.082 |
que | +3.869 |
naire | +3.844 |
Neg logit contributions | |
�醒 | -7.141 |
ahime | -7.008 |
Synd | -6.997 |
synd | -6.968 |
anda | -6.946 |
Token | . |
Token ID | 13 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
Guilty | +13.417 |
GH | +11.026 |
NG | +10.379 |
naire | +9.772 |
itcher | +9.710 |
Neg logit contributions | |
�醒 | -18.791 |
ahime | -17.708 |
synd | -17.536 |
andowski | -17.424 |
Synd | -17.365 |
Token | Glover |
Token ID | 43487 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
Guilty | +12.161 |
GH | +10.386 |
NG | +9.850 |
que | +8.926 |
naire | +8.827 |
Neg logit contributions | |
�醒 | -14.349 |
ahime | -14.185 |
Synd | -14.040 |
utt | -13.971 |
anda | -13.850 |
Token | D |
Token ID | 360 |
Feature activation | +6.77e-02 |
Pos logit contributions | |
Guilty | +1.441 |
GH | +1.201 |
NG | +1.176 |
naire | +1.174 |
que | +1.172 |
Neg logit contributions | |
Synd | -1.017 |
synd | -0.988 |
�醒 | -0.986 |
anda | -0.982 |
ahime | -0.925 |
Token | wn |
Token ID | 675 |
Feature activation | +1.66e-03 |
Pos logit contributions | |
Synd | +0.760 |
synd | +0.740 |
anda | +0.740 |
�醒 | +0.732 |
utt | +0.694 |
Neg logit contributions | |
Guilty | -0.886 |
GH | -0.722 |
naire | -0.710 |
que | -0.704 |
NG | -0.698 |
Token | ld |
Token ID | 335 |
Feature activation | -6.04e-02 |
Pos logit contributions | |
Synd | +0.017 |
synd | +0.017 |
anda | +0.016 |
�醒 | +0.016 |
Tad | +0.015 |
Neg logit contributions | |
Guilty | -0.023 |
GH | -0.020 |
naire | -0.019 |
NG | -0.019 |
que | -0.019 |
Token | , |
Token ID | 11 |
Feature activation | -3.02e-01 |
Pos logit contributions | |
Synd | +0.319 |
synd | +0.310 |
anda | +0.307 |
�醒 | +0.304 |
Tad | +0.287 |
Neg logit contributions | |
Guilty | -0.458 |
GH | -0.384 |
naire | -0.375 |
NG | -0.373 |
que | -0.372 |
Token | which |
Token ID | 543 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
Guilty | +4.213 |
GH | +3.505 |
que | +3.495 |
NG | +3.443 |
naire | +3.404 |
Neg logit contributions | |
Synd | -3.048 |
�醒 | -3.017 |
synd | -2.925 |
anda | -2.914 |
ahime | -2.800 |
Token | is |
Token ID | 318 |
Feature activation | -3.31e-01 |
Pos logit contributions | |
Guilty | +4.853 |
que | +4.025 |
GH | +4.023 |
naire | +3.955 |
NG | +3.930 |
Neg logit contributions | |
�醒 | -3.757 |
Synd | -3.736 |
anda | -3.586 |
synd | -3.555 |
ahime | -3.504 |
Token | probably |
Token ID | 2192 |
Feature activation | -4.32e-01 |
Pos logit contributions | |
Guilty | +4.387 |
que | +3.627 |
GH | +3.602 |
NG | +3.515 |
naire | +3.509 |
Neg logit contributions | |
�醒 | -3.580 |
Synd | -3.567 |
anda | -3.459 |
synd | -3.379 |
ahime | -3.334 |
Token | not |
Token ID | 407 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
Guilty | +5.603 |
que | +4.642 |
GH | +4.579 |
NG | +4.419 |
naire | +4.401 |
Neg logit contributions | |
�醒 | -4.823 |
Synd | -4.698 |
anda | -4.584 |
ahime | -4.441 |
synd | -4.422 |
Token | terribly |
Token ID | 22121 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
Guilty | +4.607 |
GH | +3.785 |
que | +3.779 |
ready | +3.642 |
naire | +3.631 |
Neg logit contributions | |
�醒 | -3.822 |
Synd | -3.756 |
anda | -3.647 |
synd | -3.550 |
ahime | -3.500 |
Token | mature |
Token ID | 15345 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
Guilty | +16.561 |
que | +14.844 |
GH | +13.416 |
naire | +13.027 |
lottery | +12.755 |
Neg logit contributions | |
�醒 | -16.717 |
iliate | -14.994 |
anda | -14.915 |
rint | -14.427 |
ahime | -14.393 |
Token | on |
Token ID | 319 |
Feature activation | -5.45e-01 |
Pos logit contributions | |
Guilty | +2.673 |
GH | +2.224 |
que | +2.200 |
NG | +2.179 |
naire | +2.174 |
Neg logit contributions | |
Synd | -2.002 |
�醒 | -1.974 |
synd | -1.935 |
anda | -1.930 |
ahime | -1.822 |
Token | the |
Token ID | 262 |
Feature activation | -4.59e-01 |
Pos logit contributions | |
Guilty | +7.144 |
que | +5.927 |
GH | +5.899 |
NG | +5.679 |
ready | +5.675 |
Neg logit contributions | |
�醒 | -5.725 |
Synd | -5.663 |
anda | -5.410 |
synd | -5.372 |
ahime | -5.207 |
Token | boy |
Token ID | 2933 |
Feature activation | -3.76e-01 |
Pos logit contributions | |
Guilty | +5.957 |
que | +4.864 |
GH | +4.842 |
naire | +4.711 |
NG | +4.677 |
Neg logit contributions | |
�醒 | -4.987 |
Synd | -4.979 |
anda | -4.810 |
synd | -4.715 |
ahime | -4.633 |
Token | � |
Token ID | 447 |
Feature activation | +5.92e-02 |
Pos logit contributions | |
Guilty | +4.653 |
GH | +3.843 |
que | +3.798 |
naire | +3.745 |
NG | +3.722 |
Neg logit contributions | |
Synd | -4.304 |
�醒 | -4.237 |
synd | -4.113 |
anda | -4.100 |
ahime | -3.948 |
Token | w |
Token ID | 86 |
Feature activation | -2.60e-01 |
Pos logit contributions | |
Guilty | +2.815 |
GH | +2.371 |
NG | +2.321 |
naire | +2.313 |
que | +2.300 |
Neg logit contributions | |
Synd | -2.046 |
�醒 | -1.994 |
synd | -1.978 |
anda | -1.932 |
Tad | -1.840 |
Token | > |
Token ID | 29 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
Guilty | +3.540 |
GH | +2.973 |
NG | +2.921 |
naire | +2.909 |
que | +2.895 |
Neg logit contributions | |
Synd | -2.699 |
�醒 | -2.652 |
synd | -2.607 |
anda | -2.521 |
Tad | -2.456 |
Token | save |
Token ID | 3613 |
Feature activation | -3.04e-01 |
Pos logit contributions | |
Synd | +3.776 |
synd | +3.688 |
anda | +3.613 |
�醒 | +3.462 |
Tad | +3.457 |
Neg logit contributions | |
Guilty | -4.651 |
GH | -3.874 |
naire | -3.821 |
NG | -3.775 |
isSpecialOrderable | -3.712 |
Token | [ |
Token ID | 685 |
Feature activation | +3.03e-01 |
Pos logit contributions | |
Guilty | +4.102 |
GH | +3.394 |
que | +3.387 |
NG | +3.350 |
naire | +3.290 |
Neg logit contributions | |
Synd | -3.210 |
�醒 | -3.198 |
synd | -3.098 |
anda | -3.084 |
ahime | -2.904 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.67e-01 |
Pos logit contributions | |
Synd | +2.607 |
anda | +2.566 |
synd | +2.522 |
utt | +2.340 |
Tad | +2.299 |
Neg logit contributions | |
Guilty | -4.729 |
GH | -3.869 |
que | -3.851 |
naire | -3.848 |
NG | -3.769 |
Token | : |
Token ID | 25 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
Synd | +3.424 |
synd | +3.268 |
anda | +3.231 |
Tad | +2.982 |
utt | +2.933 |
Neg logit contributions | |
Guilty | -7.704 |
GH | -6.429 |
naire | -6.370 |
isSpecialOrderable | -6.353 |
que | -6.349 |
Token | 47 |
Token ID | 2857 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
48 | +6.782 |
Synd | +5.032 |
Tad | +5.031 |
nt | +4.676 |
Teddy | +4.510 |
Neg logit contributions | |
� | -34.193 |
� | -33.859 |
� | -32.652 |
Guilty | -32.613 |
proble | -32.498 |
Token | ] |
Token ID | 60 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
Synd | +1.911 |
synd | +1.816 |
anda | +1.798 |
Tad | +1.640 |
utt | +1.608 |
Neg logit contributions | |
Guilty | -4.643 |
GH | -3.945 |
naire | -3.894 |
que | -3.880 |
NG | -3.839 |
Token | < |
Token ID | 1279 |
Feature activation | +8.89e-02 |
Pos logit contributions | |
Synd | +3.682 |
synd | +3.552 |
anda | +3.495 |
�醒 | +3.450 |
Tad | +3.201 |
Neg logit contributions | |
Guilty | -9.183 |
GH | -7.938 |
naire | -7.858 |
NG | -7.782 |
itcher | -7.652 |
Token | f |
Token ID | 69 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
Synd | +0.936 |
anda | +0.911 |
synd | +0.909 |
�醒 | +0.895 |
Tad | +0.848 |
Neg logit contributions | |
Guilty | -1.226 |
GH | -1.009 |
naire | -0.987 |
que | -0.986 |
NG | -0.983 |
Token | gt |
Token ID | 13655 |
Feature activation | -8.85e-02 |
Pos logit contributions | |
Guilty | +3.543 |
GH | +2.998 |
naire | +2.905 |
NG | +2.897 |
que | +2.868 |
Neg logit contributions | |
Synd | -2.779 |
�醒 | -2.716 |
synd | -2.673 |
anda | -2.590 |
Tad | -2.500 |
Token | m |
Token ID | 285 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
Synd | +1.721 |
synd | +1.681 |
anda | +1.667 |
�醒 | +1.639 |
Tad | +1.566 |
Neg logit contributions | |
Guilty | -2.156 |
GH | -1.783 |
naire | -1.740 |
NG | -1.734 |
que | -1.707 |
Token | 2 |
Token ID | 17 |
Feature activation | +5.94e-01 |
Pos logit contributions | |
Synd | +1.518 |
anda | +1.492 |
synd | +1.482 |
�醒 | +1.458 |
ahime | +1.405 |
Neg logit contributions | |
Guilty | -1.336 |
GH | -1.051 |
naire | -1.022 |
que | -1.014 |
NG | -1.012 |
Token | k |
Token ID | 74 |
Feature activation | -6.57e-02 |
Pos logit contributions | |
anda | +3.626 |
Synd | +3.612 |
synd | +3.534 |
utt | +3.210 |
nt | +3.210 |
Neg logit contributions | |
Guilty | -10.238 |
GH | -8.819 |
NG | -8.552 |
isSpecialOrderable | -8.512 |
naire | -8.466 |
Token | [ |
Token ID | 685 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
Guilty | +0.874 |
GH | +0.721 |
naire | +0.702 |
que | +0.702 |
NG | +0.700 |
Neg logit contributions | |
Synd | -0.724 |
�醒 | -0.704 |
synd | -0.702 |
anda | -0.699 |
ahime | -0.660 |
Token | 10 |
Token ID | 940 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
Synd | +1.260 |
synd | +1.222 |
anda | +1.219 |
�醒 | +1.141 |
utt | +1.126 |
Neg logit contributions | |
Guilty | -2.050 |
GH | -1.695 |
naire | -1.674 |
que | -1.673 |
NG | -1.650 |
Token | : |
Token ID | 25 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
Synd | +2.362 |
synd | +2.264 |
anda | +2.236 |
Tad | +2.075 |
Mutual | +2.046 |
Neg logit contributions | |
Guilty | -4.594 |
GH | -3.849 |
naire | -3.796 |
que | -3.784 |
NG | -3.754 |
Token | 47 |
Token ID | 2857 |
Feature activation | +6.70e-02 |
Pos logit contributions | |
48 | +5.876 |
Synd | +4.328 |
Tad | +4.109 |
nt | +3.747 |
anda | +3.617 |
Neg logit contributions | |
� | -33.293 |
� | -32.813 |
Guilty | -32.516 |
proble | -31.729 |
� | -31.727 |
Token | ] |
Token ID | 60 |
Feature activation | +4.11e-01 |
Pos logit contributions | |
Synd | +0.532 |
synd | +0.511 |
anda | +0.506 |
�醒 | +0.487 |
Tad | +0.464 |
Neg logit contributions | |
Guilty | -1.100 |
GH | -0.938 |
naire | -0.921 |
que | -0.918 |
NG | -0.916 |
Token | < |
Token ID | 1279 |
Feature activation | -5.83e-03 |
Pos logit contributions | |
Synd | +2.948 |
synd | +2.830 |
anda | +2.782 |
�醒 | +2.751 |
Tad | +2.561 |
Neg logit contributions | |
Guilty | -6.878 |
GH | -5.946 |
naire | -5.863 |
NG | -5.824 |
que | -5.708 |
Token | fr |
Token ID | 8310 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
Guilty | +0.081 |
GH | +0.068 |
naire | +0.066 |
NG | +0.066 |
que | +0.066 |
Neg logit contributions | |
Synd | -0.060 |
synd | -0.059 |
anda | -0.058 |
�醒 | -0.058 |
Tad | -0.055 |
Token | ank |
Token ID | 962 |
Feature activation | -4.34e-01 |
Pos logit contributions | |
Synd | +1.531 |
anda | +1.507 |
synd | +1.491 |
�醒 | +1.460 |
utt | +1.411 |
Neg logit contributions | |
Guilty | -1.896 |
GH | -1.547 |
naire | -1.519 |
NG | -1.508 |
que | -1.506 |
Token | m |
Token ID | 285 |
Feature activation | +3.14e-01 |
Pos logit contributions | |
Synd | +0.836 |
synd | +0.816 |
anda | +0.807 |
�醒 | +0.799 |
Tad | +0.760 |
Neg logit contributions | |
Guilty | -1.023 |
GH | -0.843 |
naire | -0.822 |
NG | -0.820 |
que | -0.812 |
Token | 2 |
Token ID | 17 |
Feature activation | +8.79e-01 |
Pos logit contributions | |
anda | +3.834 |
Synd | +3.829 |
synd | +3.729 |
�醒 | +3.601 |
ahime | +3.569 |
Neg logit contributions | |
Guilty | -3.753 |
GH | -2.952 |
naire | -2.900 |
que | -2.845 |
NG | -2.830 |
Token | k |
Token ID | 74 |
Feature activation | +3.67e-01 |
Pos logit contributions | |
anda | +4.400 |
Synd | +4.285 |
synd | +4.233 |
nt | +4.093 |
utt | +3.797 |
Neg logit contributions | |
Guilty | -15.272 |
GH | -13.262 |
isSpecialOrderable | -12.928 |
Reloaded | -12.927 |
NG | -12.802 |
Token | [ |
Token ID | 685 |
Feature activation | +2.49e-01 |
Pos logit contributions | |
Synd | +3.621 |
synd | +3.547 |
anda | +3.482 |
�醒 | +3.392 |
Tad | +3.258 |
Neg logit contributions | |
Guilty | -5.154 |
GH | -4.281 |
NG | -4.199 |
naire | -4.194 |
ready | -4.121 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.49e-01 |
Pos logit contributions | |
Synd | +2.175 |
anda | +2.120 |
synd | +2.110 |
utt | +1.948 |
Tad | +1.927 |
Neg logit contributions | |
Guilty | -3.874 |
GH | -3.173 |
que | -3.165 |
naire | -3.159 |
NG | -3.086 |
Token | : |
Token ID | 25 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
Synd | +3.348 |
synd | +3.194 |
anda | +3.143 |
Tad | +2.901 |
Mutual | +2.863 |
Neg logit contributions | |
Guilty | -7.396 |
GH | -6.183 |
naire | -6.116 |
que | -6.101 |
isSpecialOrderable | -6.082 |
Token | 47 |
Token ID | 2857 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
48 | +6.616 |
Synd | +5.135 |
Tad | +5.012 |
nt | +4.946 |
anda | +4.487 |
Neg logit contributions | |
� | -33.605 |
� | -33.137 |
� | -31.954 |
Guilty | -31.808 |
proble | -31.557 |
Token | ] |
Token ID | 60 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
Synd | +1.437 |
synd | +1.372 |
anda | +1.357 |
Tad | +1.239 |
utt | +1.220 |
Neg logit contributions | |
Guilty | -3.274 |
GH | -2.787 |
naire | -2.745 |
que | -2.736 |
NG | -2.716 |
Token | < |
Token ID | 1279 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
Synd | +1.245 |
synd | +1.197 |
anda | +1.177 |
�醒 | +1.148 |
Tad | +1.079 |
Neg logit contributions | |
Guilty | -2.792 |
GH | -2.404 |
naire | -2.366 |
NG | -2.354 |
que | -2.328 |
Token | k |
Token ID | 74 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
Synd | +1.146 |
anda | +1.117 |
synd | +1.112 |
�醒 | +1.094 |
Tad | +1.038 |
Neg logit contributions | |
Guilty | -1.503 |
GH | -1.235 |
naire | -1.209 |
que | -1.208 |
NG | -1.204 |
Token | asse |
Token ID | 21612 |
Feature activation | +3.12e-01 |
Pos logit contributions | |
Guilty | +1.776 |
GH | +1.485 |
naire | +1.453 |
NG | +1.449 |
que | +1.442 |
Neg logit contributions | |
Synd | -1.329 |
�醒 | -1.297 |
synd | -1.291 |
anda | -1.263 |
Tad | -1.207 |
Token | lol |
Token ID | 19462 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
Synd | +3.763 |
synd | +3.666 |
anda | +3.592 |
�醒 | +3.440 |
Tad | +3.437 |
Neg logit contributions | |
Guilty | -4.623 |
GH | -3.861 |
naire | -3.807 |
NG | -3.756 |
isSpecialOrderable | -3.704 |
Token | j |
Token ID | 474 |
Feature activation | +3.57e-01 |
Pos logit contributions | |
Synd | +4.012 |
synd | +3.937 |
anda | +3.891 |
�醒 | +3.747 |
Tad | +3.673 |
Neg logit contributions | |
Guilty | -5.256 |
GH | -4.375 |
naire | -4.260 |
NG | -4.238 |
ready | -4.184 |
Token | ason |
Token ID | 888 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
anda | +4.562 |
Synd | +4.530 |
synd | +4.437 |
�醒 | +4.299 |
utt | +4.289 |
Neg logit contributions | |
Guilty | -4.000 |
GH | -3.055 |
naire | -3.045 |
que | -2.978 |
NG | -2.939 |
Token | [ |
Token ID | 685 |
Feature activation | +5.24e-02 |
Pos logit contributions | |
Guilty | +2.570 |
GH | +2.110 |
que | +2.073 |
NG | +2.055 |
naire | +2.055 |
Neg logit contributions | |
Synd | -2.181 |
�醒 | -2.122 |
synd | -2.104 |
anda | -2.092 |
ahime | -1.991 |
Token | 10 |
Token ID | 940 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
Synd | +0.506 |
synd | +0.491 |
anda | +0.488 |
�醒 | +0.474 |
Tad | +0.454 |
Neg logit contributions | |
Guilty | -0.770 |
GH | -0.641 |
naire | -0.629 |
que | -0.628 |
NG | -0.624 |
Token | : |
Token ID | 25 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
Synd | +2.978 |
synd | +2.859 |
anda | +2.821 |
Tad | +2.601 |
utt | +2.578 |
Neg logit contributions | |
Guilty | -6.305 |
GH | -5.270 |
naire | -5.199 |
que | -5.196 |
isSpecialOrderable | -5.146 |
Token | 47 |
Token ID | 2857 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
48 | +6.526 |
Synd | +4.822 |
Tad | +4.534 |
Teddy | +4.100 |
synd | +4.065 |
Neg logit contributions | |
� | -33.501 |
� | -33.111 |
Guilty | -33.107 |
proble | -32.021 |
� | -31.969 |
Token | ] |
Token ID | 60 |
Feature activation | +4.85e-01 |
Pos logit contributions | |
Synd | +2.132 |
synd | +2.030 |
anda | +2.003 |
Tad | +1.817 |
utt | +1.794 |
Neg logit contributions | |
Guilty | -5.354 |
GH | -4.545 |
naire | -4.483 |
que | -4.476 |
NG | -4.413 |
Token | < |
Token ID | 1279 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
Synd | +3.341 |
synd | +3.222 |
anda | +3.145 |
�醒 | +3.121 |
Tad | +2.888 |
Neg logit contributions | |
Guilty | -8.160 |
GH | -7.063 |
naire | -6.973 |
NG | -6.899 |
itcher | -6.784 |
Token | fen |
Token ID | 41037 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
Synd | +1.308 |
anda | +1.277 |
synd | +1.270 |
�醒 | +1.248 |
utt | +1.187 |
Neg logit contributions | |
Guilty | -1.699 |
GH | -1.391 |
que | -1.363 |
naire | -1.363 |
NG | -1.357 |
Token | ren |
Token ID | 918 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
Synd | +1.524 |
anda | +1.491 |
synd | +1.480 |
�醒 | +1.453 |
ahime | +1.389 |
Neg logit contributions | |
Guilty | -1.879 |
GH | -1.539 |
NG | -1.500 |
naire | -1.500 |
que | -1.494 |
Token | m |
Token ID | 285 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
Synd | +3.411 |
synd | +3.343 |
anda | +3.305 |
�醒 | +3.203 |
Tad | +3.125 |
Neg logit contributions | |
Guilty | -4.398 |
GH | -3.649 |
naire | -3.562 |
NG | -3.543 |
ready | -3.491 |
Token | 2 |
Token ID | 17 |
Feature activation | +6.84e-01 |
Pos logit contributions | |
Synd | +3.220 |
anda | +3.215 |
synd | +3.133 |
�醒 | +3.047 |
ahime | +2.994 |
Neg logit contributions | |
Guilty | -3.062 |
GH | -2.398 |
naire | -2.348 |
que | -2.327 |
NG | -2.303 |
Token | k |
Token ID | 74 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
anda | +3.955 |
Synd | +3.895 |
synd | +3.810 |
nt | +3.519 |
utt | +3.454 |
Neg logit contributions | |
Guilty | -11.851 |
GH | -10.235 |
isSpecialOrderable | -9.907 |
NG | -9.899 |
Reloaded | -9.809 |
Token | [ |
Token ID | 685 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
Synd | +2.486 |
synd | +2.420 |
anda | +2.398 |
�醒 | +2.360 |
Tad | +2.248 |
Neg logit contributions | |
Guilty | -3.419 |
GH | -2.838 |
NG | -2.784 |
naire | -2.781 |
ready | -2.736 |
Token | 10 |
Token ID | 940 |
Feature activation | +4.18e-01 |
Pos logit contributions | |
Synd | +1.796 |
anda | +1.744 |
synd | +1.743 |
utt | +1.609 |
Tad | +1.595 |
Neg logit contributions | |
Guilty | -3.094 |
GH | -2.544 |
que | -2.526 |
naire | -2.523 |
NG | -2.473 |
Token | : |
Token ID | 25 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
Synd | +3.182 |
synd | +3.037 |
anda | +2.989 |
Tad | +2.763 |
Mutual | +2.727 |
Neg logit contributions | |
Guilty | -6.863 |
GH | -5.742 |
naire | -5.674 |
que | -5.662 |
isSpecialOrderable | -5.625 |
Token | 47 |
Token ID | 2857 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
48 | +6.934 |
Synd | +5.179 |
Tad | +5.003 |
nt | +4.851 |
anda | +4.462 |
Neg logit contributions | |
� | -34.246 |
� | -33.785 |
� | -32.498 |
Guilty | -32.392 |
proble | -32.228 |
Token | ] |
Token ID | 60 |
Feature activation | +4.88e-01 |
Pos logit contributions | |
Synd | +1.471 |
synd | +1.403 |
anda | +1.389 |
Tad | +1.267 |
utt | +1.249 |
Neg logit contributions | |
Guilty | -3.374 |
GH | -2.871 |
naire | -2.829 |
que | -2.821 |
NG | -2.797 |
Token | < |
Token ID | 1279 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
Synd | +3.392 |
synd | +3.258 |
anda | +3.196 |
�醒 | +3.162 |
Tad | +2.940 |
Neg logit contributions | |
Guilty | -8.184 |
GH | -7.084 |
naire | -6.992 |
NG | -6.935 |
itcher | -6.797 |
Token | ok |
Token ID | 482 |
Feature activation | -6.26e-01 |
Pos logit contributions | |
Synd | +1.422 |
anda | +1.390 |
synd | +1.380 |
�醒 | +1.357 |
utt | +1.292 |
Neg logit contributions | |
Guilty | -1.848 |
GH | -1.511 |
que | -1.482 |
naire | -1.481 |
NG | -1.475 |
Token | clock |
Token ID | 15750 |
Feature activation | +8.06e-01 |
Pos logit contributions | |
Guilty | +5.486 |
ready | +4.301 |
GH | +4.287 |
NG | +4.158 |
naire | +4.129 |
Neg logit contributions | |
Synd | -9.109 |
�醒 | -8.919 |
synd | -8.870 |
Tad | -8.550 |
Mutual | -8.462 |
Token | . |
Token ID | 13 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
Guilty | +3.588 |
GH | +2.952 |
que | +2.948 |
naire | +2.921 |
NG | +2.905 |
Neg logit contributions | |
Synd | -2.779 |
�醒 | -2.726 |
synd | -2.674 |
anda | -2.644 |
ahime | -2.545 |
Token | I |
Token ID | 314 |
Feature activation | -2.20e-01 |
Pos logit contributions | |
Synd | +2.369 |
anda | +2.237 |
synd | +2.230 |
�醒 | +2.144 |
Tad | +2.140 |
Neg logit contributions | |
Guilty | -3.248 |
GH | -2.768 |
naire | -2.704 |
que | -2.694 |
NG | -2.679 |
Token | loved |
Token ID | 6151 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
Guilty | +2.934 |
GH | +2.441 |
que | +2.428 |
NG | +2.373 |
naire | +2.370 |
Neg logit contributions | |
�醒 | -2.375 |
Synd | -2.373 |
synd | -2.280 |
anda | -2.276 |
ahime | -2.185 |
Token | the |
Token ID | 262 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
Synd | +2.951 |
anda | +2.858 |
synd | +2.844 |
Tad | +2.697 |
�醒 | +2.666 |
Neg logit contributions | |
Guilty | -4.159 |
GH | -3.546 |
naire | -3.475 |
NG | -3.416 |
ready | -3.361 |
Token | moments |
Token ID | 7188 |
Feature activation | +9.21e-01 |
Pos logit contributions | |
Synd | +1.470 |
synd | +1.438 |
anda | +1.419 |
�醒 | +1.387 |
Tad | +1.341 |
Neg logit contributions | |
Guilty | -1.820 |
GH | -1.521 |
naire | -1.482 |
NG | -1.477 |
que | -1.441 |
Token | of |
Token ID | 286 |
Feature activation | +6.53e-01 |
Pos logit contributions | |
Synd | +7.358 |
anda | +7.188 |
synd | +7.097 |
Tad | +6.886 |
Mutual | +6.438 |
Neg logit contributions | |
Guilty | -13.121 |
GH | -11.422 |
naire | -11.093 |
isSpecialOrderable | -10.903 |
eligible | -10.742 |
Token | le |
Token ID | 443 |
Feature activation | +3.26e-01 |
Pos logit contributions | |
Synd | +7.124 |
synd | +6.909 |
anda | +6.764 |
Tad | +6.634 |
Mutual | +6.562 |
Neg logit contributions | |
Guilty | -7.939 |
GH | -6.857 |
naire | -6.822 |
NG | -6.564 |
isSpecialOrderable | -6.418 |
Token | vity |
Token ID | 21319 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
Synd | +2.439 |
anda | +2.386 |
synd | +2.360 |
�醒 | +2.293 |
utt | +2.150 |
Neg logit contributions | |
Guilty | -5.343 |
GH | -4.611 |
NG | -4.522 |
naire | -4.517 |
que | -4.403 |
Token | that |
Token ID | 326 |
Feature activation | +6.93e-01 |
Pos logit contributions | |
Synd | +8.730 |
synd | +8.434 |
anda | +8.409 |
Tad | +8.003 |
Mutual | +7.669 |
Neg logit contributions | |
Guilty | -13.574 |
GH | -11.605 |
naire | -11.447 |
isSpecialOrderable | -11.077 |
ready | -11.010 |
Token | followed |
Token ID | 3940 |
Feature activation | +7.83e-01 |
Pos logit contributions | |
Synd | +7.502 |
synd | +7.373 |
anda | +7.205 |
Tad | +6.990 |
Mutual | +6.802 |
Neg logit contributions | |
Guilty | -8.508 |
GH | -7.040 |
naire | -6.944 |
isSpecialOrderable | -6.866 |
NG | -6.810 |
Token | that |
Token ID | 326 |
Feature activation | +6.68e-01 |
Pos logit contributions | |
Synd | +6.595 |
anda | +6.539 |
synd | +6.401 |
Tad | +6.207 |
Mutual | +5.937 |
Neg logit contributions | |
Guilty | -11.113 |
GH | -9.587 |
naire | -9.498 |
NG | -9.140 |
itcher | -9.110 |
Token | stride |
Token ID | 33769 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
Guilty | +1.859 |
GH | +1.543 |
que | +1.515 |
naire | +1.508 |
NG | +1.501 |
Neg logit contributions | |
Synd | -1.392 |
�醒 | -1.346 |
synd | -1.343 |
anda | -1.342 |
ahime | -1.260 |
Token | . |
Token ID | 13 |
Feature activation | +8.64e-02 |
Pos logit contributions | |
Synd | +2.972 |
synd | +2.911 |
anda | +2.883 |
�醒 | +2.788 |
Tad | +2.668 |
Neg logit contributions | |
Guilty | -4.632 |
GH | -3.894 |
NG | -3.796 |
naire | -3.791 |
que | -3.717 |
Token | Cricket |
Token ID | 34761 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
Synd | +0.887 |
synd | +0.852 |
anda | +0.847 |
�醒 | +0.836 |
Tad | +0.801 |
Neg logit contributions | |
Guilty | -1.211 |
GH | -1.016 |
naire | -0.997 |
NG | -0.991 |
que | -0.990 |
Token | nerd |
Token ID | 34712 |
Feature activation | +4.30e-01 |
Pos logit contributions | |
Synd | +2.157 |
synd | +2.119 |
anda | +2.081 |
�醒 | +2.024 |
Tad | +1.953 |
Neg logit contributions | |
Guilty | -2.771 |
GH | -2.281 |
naire | -2.235 |
NG | -2.224 |
que | -2.186 |
Token | os |
Token ID | 418 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
Synd | +4.763 |
anda | +4.703 |
synd | +4.690 |
�醒 | +4.485 |
Tad | +4.402 |
Neg logit contributions | |
Guilty | -5.432 |
GH | -4.456 |
NG | -4.377 |
naire | -4.342 |
que | -4.210 |
Token | could |
Token ID | 714 |
Feature activation | +6.68e-01 |
Pos logit contributions | |
Synd | +2.098 |
synd | +2.059 |
anda | +2.041 |
�醒 | +1.972 |
Tad | +1.914 |
Neg logit contributions | |
Guilty | -2.566 |
GH | -2.106 |
naire | -2.056 |
NG | -2.048 |
ready | -2.001 |
Token | look |
Token ID | 804 |
Feature activation | -2.99e-01 |
Pos logit contributions | |
Synd | +6.953 |
anda | +6.940 |
synd | +6.920 |
utt | +6.558 |
�醒 | +6.474 |
Neg logit contributions | |
Guilty | -8.494 |
GH | -6.860 |
isSpecialOrderable | -6.834 |
naire | -6.666 |
NG | -6.641 |
Token | at |
Token ID | 379 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
Guilty | +4.115 |
que | +3.408 |
GH | +3.361 |
NG | +3.297 |
ready | +3.246 |
Neg logit contributions | |
Synd | -3.128 |
�醒 | -3.083 |
synd | -3.010 |
anda | -2.967 |
ahime | -2.895 |
Token | him |
Token ID | 683 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
Synd | +0.122 |
synd | +0.118 |
anda | +0.118 |
�醒 | +0.117 |
Tad | +0.110 |
Neg logit contributions | |
Guilty | -0.165 |
GH | -0.137 |
naire | -0.134 |
NG | -0.134 |
que | -0.133 |
Token | forever |
Token ID | 8097 |
Feature activation | -5.61e-01 |
Pos logit contributions | |
Guilty | +7.189 |
que | +6.053 |
GH | +5.885 |
NG | +5.772 |
ready | +5.680 |
Neg logit contributions | |
�醒 | -5.958 |
Synd | -5.919 |
synd | -5.668 |
anda | -5.596 |
ahime | -5.590 |
Token | . |
Token ID | 13 |
Feature activation | +8.87e-02 |
Pos logit contributions | |
Guilty | +7.177 |
que | +6.021 |
GH | +5.821 |
NG | +5.764 |
ready | +5.722 |
Neg logit contributions | |
�醒 | -6.023 |
Synd | -5.977 |
synd | -5.702 |
ahime | -5.601 |
anda | -5.564 |
Token | . |
Token ID | 13 |
Feature activation | +6.72e-02 |
Pos logit contributions | |
synd | +8.874 |
Synd | +8.450 |
anda | +8.420 |
Tad | +7.991 |
Berkshire | +7.831 |
Neg logit contributions | |
Guilty | -14.470 |
isSpecialOrderable | -12.547 |
GH | -12.452 |
naire | -11.923 |
itcher | -11.667 |
Token |
|
Token ID | 198 |
Feature activation | +2.98e-01 |
Pos logit contributions | |
Synd | +0.687 |
synd | +0.662 |
anda | +0.656 |
�醒 | +0.651 |
Tad | +0.620 |
Neg logit contributions | |
Guilty | -0.947 |
GH | -0.792 |
naire | -0.775 |
que | -0.774 |
NG | -0.772 |
Token |
|
Token ID | 198 |
Feature activation | +4.97e-01 |
Pos logit contributions | |
Synd | +2.668 |
synd | +2.562 |
anda | +2.529 |
Tad | +2.356 |
utt | +2.343 |
Neg logit contributions | |
Guilty | -4.541 |
GH | -3.789 |
naire | -3.723 |
que | -3.718 |
NG | -3.683 |
Token | " |
Token ID | 1 |
Feature activation | +6.12e-01 |
Pos logit contributions | |
anda | +4.802 |
Synd | +4.744 |
synd | +4.594 |
�醒 | +4.427 |
Tad | +4.332 |
Neg logit contributions | |
Guilty | -6.911 |
que | -5.717 |
naire | -5.571 |
anted | -5.357 |
GH | -5.353 |
Token | People |
Token ID | 8061 |
Feature activation | +7.16e-01 |
Pos logit contributions | |
Synd | +5.842 |
anda | +5.735 |
synd | +5.574 |
Tad | +5.396 |
Mutual | +5.304 |
Neg logit contributions | |
Guilty | -8.199 |
que | -6.992 |
naire | -6.722 |
anted | -6.586 |
isSpecialOrderable | -6.541 |
Token | have |
Token ID | 423 |
Feature activation | +6.92e-01 |
Pos logit contributions | |
synd | +6.766 |
Synd | +6.533 |
anda | +6.446 |
Tad | +6.192 |
utt | +5.922 |
Neg logit contributions | |
Guilty | -9.803 |
GH | -8.183 |
isSpecialOrderable | -8.111 |
naire | -8.086 |
Reloaded | -8.082 |
Token | lost |
Token ID | 2626 |
Feature activation | +9.79e-01 |
Pos logit contributions | |
synd | +6.682 |
Synd | +6.527 |
anda | +6.258 |
Tad | +6.129 |
Tyrann | +5.883 |
Neg logit contributions | |
Guilty | -9.507 |
GH | -8.114 |
naire | -7.844 |
isSpecialOrderable | -7.811 |
NG | -7.712 |
Token | fingers |
Token ID | 9353 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
synd | +8.929 |
Synd | +8.428 |
Tad | +8.258 |
anda | +8.102 |
Tyrann | +7.943 |
Neg logit contributions | |
Guilty | -13.321 |
GH | -11.030 |
NG | -10.768 |
naire | -10.756 |
itcher | -10.637 |
Token | -- |
Token ID | 1377 |
Feature activation | +8.98e-01 |
Pos logit contributions | |
synd | +8.311 |
Synd | +7.992 |
anda | +7.968 |
Tad | +7.153 |
Tyrann | +7.035 |
Neg logit contributions | |
Guilty | -16.009 |
isSpecialOrderable | -13.584 |
GH | -13.408 |
naire | -13.334 |
Reloaded | -13.210 |
Token | that |
Token ID | 326 |
Feature activation | +5.55e-01 |
Pos logit contributions | |
synd | +8.329 |
Synd | +8.118 |
anda | +7.887 |
Tad | +7.651 |
Tyrann | +7.569 |
Neg logit contributions | |
Guilty | -11.573 |
GH | -9.763 |
isSpecialOrderable | -9.713 |
naire | -9.564 |
NG | -9.526 |
Token | 's |
Token ID | 338 |
Feature activation | +6.78e-01 |
Pos logit contributions | |
synd | +4.982 |
Synd | +4.865 |
anda | +4.744 |
Tad | +4.565 |
Tyrann | +4.428 |
Neg logit contributions | |
Guilty | -8.089 |
GH | -6.852 |
naire | -6.711 |
ready | -6.691 |
NG | -6.654 |
Token | reports |
Token ID | 3136 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
synd | +4.892 |
Synd | +4.745 |
anda | +4.461 |
�醒 | +4.108 |
andowski | +4.076 |
Neg logit contributions | |
Guilty | -9.136 |
GH | -7.697 |
naire | -7.614 |
itcher | -7.358 |
NG | -7.321 |
Token | after |
Token ID | 706 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
synd | +10.490 |
Synd | +9.922 |
anda | +9.731 |
Tad | +9.440 |
utt | +9.219 |
Neg logit contributions | |
Guilty | -14.401 |
NG | -11.713 |
GH | -11.708 |
naire | -11.457 |
isSpecialOrderable | -11.374 |
Token | the |
Token ID | 262 |
Feature activation | -9.98e-02 |
Pos logit contributions | |
Guilty | +3.914 |
GH | +3.241 |
que | +3.194 |
NG | +3.160 |
naire | +3.152 |
Neg logit contributions | |
Synd | -3.188 |
�醒 | -3.175 |
anda | -3.101 |
synd | -3.074 |
ahime | -3.045 |
Token | Des |
Token ID | 2935 |
Feature activation | -1.86e-01 |
Pos logit contributions | |
Guilty | +1.174 |
GH | +0.936 |
que | +0.911 |
naire | +0.909 |
NG | +0.906 |
Neg logit contributions | |
Synd | -1.250 |
�醒 | -1.223 |
anda | -1.217 |
synd | -1.216 |
ahime | -1.162 |
Token | Moines |
Token ID | 36576 |
Feature activation | +4.15e-01 |
Pos logit contributions | |
Guilty | +3.050 |
GH | +2.620 |
naire | +2.595 |
que | +2.576 |
NG | +2.561 |
Neg logit contributions | |
Synd | -1.448 |
synd | -1.392 |
�醒 | -1.386 |
anda | -1.358 |
ahime | -1.279 |
Token | debate |
Token ID | 4384 |
Feature activation | +6.42e-01 |
Pos logit contributions | |
Synd | +5.110 |
synd | +5.001 |
anda | +4.906 |
�醒 | +4.818 |
Mutual | +4.711 |
Neg logit contributions | |
Guilty | -4.848 |
GH | -3.941 |
naire | -3.842 |
NG | -3.803 |
que | -3.727 |
Token | last |
Token ID | 938 |
Feature activation | +8.36e-02 |
Pos logit contributions | |
synd | +6.457 |
Synd | +6.372 |
anda | +6.203 |
andowski | +5.881 |
Tad | +5.865 |
Neg logit contributions | |
Guilty | -8.494 |
GH | -7.051 |
NG | -6.907 |
naire | -6.709 |
isSpecialOrderable | -6.664 |
Token | month |
Token ID | 1227 |
Feature activation | +8.00e-01 |
Pos logit contributions | |
Synd | +0.955 |
synd | +0.935 |
anda | +0.922 |
�醒 | +0.908 |
Tad | +0.875 |
Neg logit contributions | |
Guilty | -1.078 |
GH | -0.885 |
naire | -0.863 |
NG | -0.857 |
que | -0.850 |
Token | said |
Token ID | 531 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
synd | +7.850 |
Synd | +7.672 |
anda | +7.451 |
utt | +7.201 |
Tad | +7.152 |
Neg logit contributions | |
Guilty | -10.410 |
GH | -8.664 |
NG | -8.610 |
naire | -8.233 |
isSpecialOrderable | -8.205 |
Token | his |
Token ID | 465 |
Feature activation | +3.40e-01 |
Pos logit contributions | |
Synd | +1.855 |
synd | +1.816 |
anda | +1.788 |
�醒 | +1.760 |
Tad | +1.692 |
Neg logit contributions | |
Guilty | -2.546 |
GH | -2.133 |
NG | -2.072 |
naire | -2.059 |
que | -2.055 |
Token | campaign |
Token ID | 1923 |
Feature activation | +8.30e-01 |
Pos logit contributions | |
Synd | +3.431 |
synd | +3.410 |
anda | +3.261 |
�醒 | +3.151 |
Tad | +3.142 |
Neg logit contributions | |
Guilty | -4.732 |
GH | -3.999 |
naire | -3.883 |
NG | -3.852 |
que | -3.794 |
Token | Business |
Token ID | 7320 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
Synd | +5.323 |
synd | +4.827 |
Mutual | +4.808 |
anda | +4.623 |
Tad | +4.606 |
Neg logit contributions | |
Guilty | -7.938 |
que | -6.869 |
GH | -6.861 |
anted | -6.806 |
naire | -6.794 |
Token | es |
Token ID | 274 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
Synd | +1.269 |
synd | +1.245 |
anda | +1.224 |
�醒 | +1.202 |
Mutual | +1.139 |
Neg logit contributions | |
Guilty | -1.789 |
GH | -1.494 |
naire | -1.450 |
NG | -1.445 |
que | -1.444 |
Token | cease |
Token ID | 13468 |
Feature activation | +3.13e-01 |
Pos logit contributions | |
synd | +3.419 |
Synd | +3.408 |
anda | +3.268 |
Tad | +3.094 |
Mutual | +3.085 |
Neg logit contributions | |
Guilty | -5.029 |
GH | -4.229 |
naire | -4.132 |
NG | -4.065 |
ready | -4.020 |
Token | to |
Token ID | 284 |
Feature activation | -1.68e-03 |
Pos logit contributions | |
Synd | +3.043 |
synd | +3.028 |
anda | +2.888 |
�醒 | +2.823 |
Tad | +2.732 |
Neg logit contributions | |
Guilty | -4.506 |
GH | -3.789 |
naire | -3.671 |
NG | -3.643 |
ready | -3.631 |
Token | expand |
Token ID | 4292 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
Guilty | +0.023 |
GH | +0.020 |
naire | +0.019 |
NG | +0.019 |
que | +0.019 |
Neg logit contributions | |
Synd | -0.017 |
synd | -0.017 |
anda | -0.017 |
�醒 | -0.017 |
Tad | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
Synd | +2.038 |
synd | +2.006 |
anda | +1.941 |
�醒 | +1.848 |
Tad | +1.819 |
Neg logit contributions | |
Guilty | -3.301 |
GH | -2.786 |
naire | -2.717 |
NG | -2.698 |
que | -2.670 |
Token | unemployment |
Token ID | 10681 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
synd | +6.688 |
Synd | +6.660 |
anda | +6.137 |
Mutual | +5.980 |
Berkshire | +5.960 |
Neg logit contributions | |
Guilty | -8.749 |
GH | -7.248 |
naire | -6.982 |
NG | -6.832 |
ready | -6.824 |
Token | rises |
Token ID | 16736 |
Feature activation | +5.95e-01 |
Pos logit contributions | |
synd | +3.440 |
Synd | +3.428 |
anda | +3.268 |
�醒 | +3.124 |
Tad | +3.099 |
Neg logit contributions | |
Guilty | -4.389 |
GH | -3.592 |
NG | -3.498 |
naire | -3.492 |
ready | -3.422 |
Token | . |
Token ID | 13 |
Feature activation | +5.37e-01 |
Pos logit contributions | |
Synd | +5.002 |
synd | +4.982 |
anda | +4.782 |
�醒 | +4.414 |
Tad | +4.366 |
Neg logit contributions | |
Guilty | -9.151 |
GH | -7.578 |
naire | -7.415 |
NG | -7.319 |
ready | -7.292 |
Token |
|
Token ID | 198 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
Synd | +5.276 |
synd | +4.802 |
Mutual | +4.774 |
anda | +4.612 |
Tad | +4.575 |
Neg logit contributions | |
Guilty | -7.453 |
GH | -6.429 |
que | -6.387 |
anted | -6.334 |
naire | -6.311 |
Token |
|
Token ID | 198 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
Synd | +1.576 |
synd | +1.525 |
anda | +1.510 |
�醒 | +1.413 |
Tad | +1.407 |
Neg logit contributions | |
Guilty | -2.427 |
GH | -2.019 |
naire | -1.983 |
que | -1.978 |
NG | -1.962 |
Token | dopamine |
Token ID | 26252 |
Feature activation | +5.56e-02 |
Pos logit contributions | |
Synd | +1.742 |
synd | +1.718 |
anda | +1.688 |
�醒 | +1.639 |
Tad | +1.588 |
Neg logit contributions | |
Guilty | -2.133 |
GH | -1.777 |
NG | -1.722 |
naire | -1.717 |
que | -1.682 |
Token | levels |
Token ID | 2974 |
Feature activation | +4.17e-01 |
Pos logit contributions | |
Synd | +0.576 |
synd | +0.562 |
anda | +0.554 |
�醒 | +0.548 |
Tad | +0.519 |
Neg logit contributions | |
Guilty | -0.778 |
GH | -0.649 |
naire | -0.635 |
NG | -0.630 |
que | -0.627 |
Token | to |
Token ID | 284 |
Feature activation | -3.07e-01 |
Pos logit contributions | |
synd | +3.835 |
Synd | +3.808 |
anda | +3.686 |
Tad | +3.426 |
�醒 | +3.342 |
Neg logit contributions | |
Guilty | -6.147 |
GH | -5.224 |
naire | -5.089 |
NG | -5.048 |
ready | -4.955 |
Token | symptoms |
Token ID | 7460 |
Feature activation | +6.63e-02 |
Pos logit contributions | |
Guilty | +3.946 |
que | +3.266 |
GH | +3.203 |
naire | +3.169 |
NG | +3.110 |
Neg logit contributions | |
�醒 | -3.418 |
Synd | -3.398 |
anda | -3.312 |
ahime | -3.241 |
synd | -3.220 |
Token | of |
Token ID | 286 |
Feature activation | -4.35e-01 |
Pos logit contributions | |
Synd | +0.696 |
synd | +0.680 |
anda | +0.670 |
�醒 | +0.661 |
Tad | +0.629 |
Neg logit contributions | |
Guilty | -0.922 |
GH | -0.766 |
naire | -0.746 |
NG | -0.744 |
que | -0.737 |
Token | schizophrenia |
Token ID | 22794 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
Guilty | +5.013 |
que | +4.108 |
naire | +3.926 |
GH | +3.925 |
NG | +3.760 |
Neg logit contributions | |
�醒 | -5.402 |
Synd | -5.232 |
anda | -5.222 |
ahime | -5.124 |
synd | -4.969 |
Token | . |
Token ID | 13 |
Feature activation | -2.69e-01 |
Pos logit contributions | |
Synd | +1.532 |
synd | +1.505 |
anda | +1.463 |
�醒 | +1.416 |
Tad | +1.362 |
Neg logit contributions | |
Guilty | -2.320 |
GH | -1.956 |
NG | -1.894 |
naire | -1.892 |
que | -1.867 |
Token | Indeed |
Token ID | 9676 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
Guilty | +3.675 |
GH | +3.003 |
naire | +2.931 |
que | +2.899 |
NG | +2.885 |
Neg logit contributions | |
�醒 | -2.880 |
Synd | -2.802 |
anda | -2.793 |
synd | -2.788 |
ahime | -2.697 |
Token | , |
Token ID | 11 |
Feature activation | +3.29e-02 |
Pos logit contributions | |
Guilty | +4.161 |
GH | +3.442 |
que | +3.442 |
naire | +3.365 |
NG | +3.347 |
Neg logit contributions | |
�醒 | -3.435 |
Synd | -3.331 |
anda | -3.239 |
ahime | -3.187 |
synd | -3.186 |
Token | a |
Token ID | 257 |
Feature activation | +6.49e-01 |
Pos logit contributions | |
Synd | +0.344 |
synd | +0.335 |
anda | +0.331 |
�醒 | +0.328 |
Tad | +0.312 |
Neg logit contributions | |
Guilty | -0.457 |
GH | -0.380 |
naire | -0.371 |
NG | -0.371 |
que | -0.368 |
Token | flood |
Token ID | 6947 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
synd | +7.007 |
Synd | +6.773 |
anda | +6.480 |
Tad | +6.173 |
�醒 | +6.170 |
Neg logit contributions | |
Guilty | -8.185 |
GH | -6.954 |
NG | -6.750 |
isSpecialOrderable | -6.719 |
ready | -6.556 |
Token | s |
Token ID | 82 |
Feature activation | -9.52e-01 |
Pos logit contributions | |
Synd | +0.563 |
synd | +0.547 |
anda | +0.546 |
�醒 | +0.541 |
Tad | +0.511 |
Neg logit contributions | |
Guilty | -0.704 |
GH | -0.581 |
naire | -0.567 |
NG | -0.564 |
que | -0.563 |
Token | obviously |
Token ID | 6189 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
Guilty | +11.373 |
que | +9.538 |
GH | +9.342 |
NG | +9.154 |
ready | +8.897 |
Neg logit contributions | |
�醒 | -10.911 |
Synd | -9.500 |
anda | -9.251 |
ahime | -9.237 |
synd | -9.125 |
Token | not |
Token ID | 407 |
Feature activation | -6.47e-01 |
Pos logit contributions | |
Guilty | +12.908 |
que | +10.964 |
GH | +10.762 |
NG | +10.268 |
ready | +10.036 |
Neg logit contributions | |
�醒 | -13.385 |
anda | -11.182 |
Synd | -11.049 |
ahime | -11.010 |
andowski | -10.839 |
Token | impossible |
Token ID | 5340 |
Feature activation | -6.69e-01 |
Pos logit contributions | |
Guilty | +8.126 |
que | +6.682 |
GH | +6.643 |
ready | +6.366 |
NG | +6.334 |
Neg logit contributions | |
�醒 | -7.433 |
Synd | -6.783 |
anda | -6.610 |
synd | -6.544 |
andowski | -6.405 |
Token | that |
Token ID | 326 |
Feature activation | -2.25e-01 |
Pos logit contributions | |
Guilty | +7.943 |
GH | +6.546 |
que | +6.459 |
NG | +6.367 |
naire | +6.160 |
Neg logit contributions | |
�醒 | -7.663 |
Synd | -7.333 |
synd | -7.206 |
anda | -7.107 |
ahime | -6.987 |
Token | this |
Token ID | 428 |
Feature activation | -9.61e-02 |
Pos logit contributions | |
Guilty | +3.182 |
GH | +2.678 |
que | +2.607 |
NG | +2.589 |
naire | +2.576 |
Neg logit contributions | |
�醒 | -2.260 |
Synd | -2.250 |
synd | -2.177 |
anda | -2.171 |
ahime | -2.060 |
Token | could |
Token ID | 714 |
Feature activation | +3.31e-01 |
Pos logit contributions | |
Guilty | +1.334 |
GH | +1.111 |
que | +1.085 |
NG | +1.083 |
naire | +1.081 |
Neg logit contributions | |
Synd | -1.001 |
�醒 | -0.977 |
synd | -0.967 |
anda | -0.965 |
ahime | -0.909 |
Token | happen |
Token ID | 1645 |
Feature activation | +7.45e-02 |
Pos logit contributions | |
Synd | +3.577 |
synd | +3.528 |
anda | +3.476 |
�醒 | +3.302 |
utt | +3.255 |
Neg logit contributions | |
Guilty | -4.419 |
GH | -3.576 |
naire | -3.525 |
NG | -3.505 |
ready | -3.441 |
Token | again |
Token ID | 757 |
Feature activation | +2.09e-01 |
Pos logit contributions | |
Synd | +0.744 |
synd | +0.722 |
anda | +0.717 |
�醒 | +0.707 |
Tad | +0.667 |
Neg logit contributions | |
Guilty | -1.069 |
GH | -0.894 |
naire | -0.875 |
NG | -0.871 |
que | -0.866 |
Token | . |
Token ID | 13 |
Feature activation | -1.91e-01 |
Pos logit contributions | |
Synd | +1.983 |
synd | +1.933 |
anda | +1.923 |
�醒 | +1.844 |
Tad | +1.773 |
Neg logit contributions | |
Guilty | -3.081 |
GH | -2.591 |
naire | -2.546 |
NG | -2.520 |
que | -2.503 |
Token |
|
Token ID | 198 |
Feature activation | +5.04e-02 |
Pos logit contributions | |
Guilty | +2.582 |
GH | +2.137 |
NG | +2.071 |
naire | +2.061 |
que | +2.053 |
Neg logit contributions | |
Synd | -2.042 |
�醒 | -2.026 |
synd | -2.007 |
anda | -1.991 |
ahime | -1.891 |
Token | ing |
Token ID | 278 |
Feature activation | +3.24e-01 |
Pos logit contributions | |
Guilty | +3.873 |
GH | +3.148 |
naire | +3.123 |
NG | +3.081 |
que | +3.066 |
Neg logit contributions | |
Synd | -3.746 |
�醒 | -3.693 |
synd | -3.591 |
anda | -3.563 |
ahime | -3.450 |
Token | whether |
Token ID | 1771 |
Feature activation | +6.60e-01 |
Pos logit contributions | |
Synd | +3.344 |
synd | +3.341 |
anda | +3.208 |
�醒 | +3.080 |
Tad | +3.078 |
Neg logit contributions | |
Guilty | -4.440 |
GH | -3.753 |
NG | -3.624 |
naire | -3.584 |
ready | -3.572 |
Token | to |
Token ID | 284 |
Feature activation | +4.23e-01 |
Pos logit contributions | |
synd | +5.773 |
Synd | +5.729 |
anda | +5.401 |
Tad | +5.266 |
andowski | +5.139 |
Neg logit contributions | |
Guilty | -9.476 |
GH | -8.142 |
naire | -7.966 |
NG | -7.956 |
ready | -7.922 |
Token | fire |
Token ID | 2046 |
Feature activation | +7.30e-01 |
Pos logit contributions | |
synd | +4.715 |
Synd | +4.600 |
anda | +4.443 |
Tad | +4.208 |
Mutual | +4.191 |
Neg logit contributions | |
Guilty | -5.463 |
GH | -4.520 |
NG | -4.458 |
ready | -4.363 |
isSpecialOrderable | -4.309 |
Token | its |
Token ID | 663 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
Synd | +6.894 |
synd | +6.736 |
Tad | +6.367 |
anda | +6.321 |
Tyrann | +6.053 |
Neg logit contributions | |
Guilty | -9.921 |
GH | -8.404 |
naire | -8.340 |
NG | -8.330 |
isSpecialOrderable | -8.262 |
Token | controversial |
Token ID | 8381 |
Feature activation | -9.09e-02 |
Pos logit contributions | |
Synd | +1.231 |
synd | +1.204 |
anda | +1.181 |
�醒 | +1.159 |
Tad | +1.121 |
Neg logit contributions | |
Guilty | -1.444 |
GH | -1.190 |
naire | -1.164 |
NG | -1.161 |
que | -1.148 |
Token | editor |
Token ID | 5464 |
Feature activation | +8.55e-01 |
Pos logit contributions | |
Guilty | +1.165 |
GH | +0.947 |
que | +0.925 |
naire | +0.922 |
NG | +0.919 |
Neg logit contributions | |
Synd | -1.042 |
�醒 | -1.024 |
anda | -1.015 |
synd | -1.011 |
ahime | -0.964 |
Token | . |
Token ID | 13 |
Feature activation | -5.58e-03 |
Pos logit contributions | |
Synd | +7.424 |
synd | +7.359 |
anda | +7.141 |
Tad | +6.995 |
Tyrann | +6.604 |
Neg logit contributions | |
Guilty | -11.657 |
GH | -10.310 |
naire | -10.216 |
NG | -10.173 |
isSpecialOrderable | -9.938 |
Token | Some |
Token ID | 2773 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
Guilty | +0.075 |
GH | +0.062 |
naire | +0.061 |
NG | +0.060 |
que | +0.060 |
Neg logit contributions | |
Synd | -0.061 |
synd | -0.059 |
anda | -0.059 |
�醒 | -0.059 |
Tad | -0.055 |
Token | of |
Token ID | 286 |
Feature activation | -3.88e-02 |
Pos logit contributions | |
Synd | +1.464 |
synd | +1.436 |
anda | +1.406 |
�醒 | +1.362 |
Tad | +1.329 |
Neg logit contributions | |
Guilty | -1.859 |
GH | -1.548 |
naire | -1.511 |
NG | -1.505 |
que | -1.482 |
Token | Milo |
Token ID | 32662 |
Feature activation | +5.58e-02 |
Pos logit contributions | |
Guilty | +0.522 |
GH | +0.431 |
naire | +0.420 |
que | +0.419 |
NG | +0.419 |
Neg logit contributions | |
Synd | -0.422 |
synd | -0.410 |
�醒 | -0.409 |
anda | -0.408 |
ahime | -0.385 |
Token | � |
Token ID | 251 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
�醒 | +3.458 |
Synd | +3.411 |
anda | +3.353 |
synd | +3.246 |
Tad | +3.113 |
Neg logit contributions | |
Guilty | -7.288 |
GH | -6.284 |
que | -6.155 |
naire | -6.125 |
NG | -6.111 |
Token | No |
Token ID | 1400 |
Feature activation | -4.83e-02 |
Pos logit contributions | |
Synd | +3.641 |
anda | +3.592 |
synd | +3.481 |
�醒 | +3.383 |
Tad | +3.360 |
Neg logit contributions | |
Guilty | -5.146 |
GH | -4.313 |
naire | -4.274 |
que | -4.229 |
NG | -4.176 |
Token | sooner |
Token ID | 14556 |
Feature activation | +5.38e-01 |
Pos logit contributions | |
Guilty | +0.620 |
GH | +0.507 |
naire | +0.492 |
que | +0.492 |
NG | +0.491 |
Neg logit contributions | |
Synd | -0.558 |
synd | -0.542 |
�醒 | -0.539 |
anda | -0.537 |
ahime | -0.510 |
Token | had |
Token ID | 550 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
Synd | +4.920 |
synd | +4.916 |
anda | +4.898 |
Tad | +4.630 |
utt | +4.426 |
Neg logit contributions | |
Guilty | -7.713 |
GH | -6.465 |
NG | -6.423 |
naire | -6.380 |
itcher | -6.155 |
Token | Donna |
Token ID | 29216 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
anda | +8.088 |
Synd | +8.017 |
synd | +7.651 |
Tad | +7.547 |
Teddy | +7.215 |
Neg logit contributions | |
Guilty | -14.156 |
naire | -12.161 |
GH | -12.092 |
isSpecialOrderable | -11.994 |
NG | -11.968 |
Token | and |
Token ID | 290 |
Feature activation | +5.04e-01 |
Pos logit contributions | |
Synd | +3.335 |
anda | +3.272 |
synd | +3.263 |
Tad | +3.090 |
�醒 | +3.057 |
Neg logit contributions | |
Guilty | -3.867 |
GH | -3.192 |
NG | -3.108 |
naire | -3.106 |
ready | -2.982 |
Token | her |
Token ID | 607 |
Feature activation | +4.63e-01 |
Pos logit contributions | |
Synd | +4.400 |
anda | +4.282 |
synd | +4.269 |
Tad | +4.088 |
Tyrann | +3.924 |
Neg logit contributions | |
Guilty | -7.429 |
GH | -6.376 |
naire | -6.345 |
NG | -6.194 |
ready | -6.090 |
Token | family |
Token ID | 1641 |
Feature activation | +6.80e-01 |
Pos logit contributions | |
Synd | +4.786 |
synd | +4.754 |
anda | +4.703 |
Tad | +4.487 |
�醒 | +4.420 |
Neg logit contributions | |
Guilty | -6.117 |
GH | -5.183 |
naire | -5.018 |
NG | -4.960 |
ready | -4.846 |
Token | left |
Token ID | 1364 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
synd | +7.767 |
Synd | +7.762 |
anda | +7.665 |
Tad | +7.316 |
Berkshire | +7.011 |
Neg logit contributions | |
Guilty | -7.967 |
GH | -6.624 |
NG | -6.318 |
isSpecialOrderable | -6.227 |
naire | -6.224 |
Token | when |
Token ID | 618 |
Feature activation | +9.74e-01 |
Pos logit contributions | |
Tad | +10.529 |
anda | +10.266 |
synd | +10.002 |
Synd | +9.990 |
Teddy | +9.851 |
Neg logit contributions | |
Guilty | -14.954 |
GH | -13.110 |
naire | -13.083 |
NG | -12.861 |
itcher | -12.522 |
Token | we |
Token ID | 356 |
Feature activation | -4.07e-03 |
Pos logit contributions | |
anda | +8.758 |
Synd | +8.421 |
synd | +8.320 |
Tad | +8.249 |
Teddy | +7.892 |
Neg logit contributions | |
Guilty | -12.603 |
GH | -10.848 |
naire | -10.710 |
NG | -10.499 |
itcher | -10.342 |
Token | one |
Token ID | 530 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
Guilty | +3.457 |
GH | +2.770 |
que | +2.712 |
naire | +2.668 |
NG | +2.636 |
Neg logit contributions | |
Synd | -3.492 |
�醒 | -3.448 |
synd | -3.357 |
anda | -3.353 |
ahime | -3.268 |
Token | equals |
Token ID | 21767 |
Feature activation | -6.26e-01 |
Pos logit contributions | |
Synd | +1.292 |
synd | +1.266 |
anda | +1.246 |
�醒 | +1.220 |
Tad | +1.163 |
Neg logit contributions | |
Guilty | -1.943 |
GH | -1.632 |
naire | -1.604 |
NG | -1.601 |
ready | -1.573 |
Token | " |
Token ID | 366 |
Feature activation | -8.33e-01 |
Pos logit contributions | |
Guilty | +7.100 |
que | +5.641 |
GH | +5.430 |
naire | +5.418 |
NG | +5.310 |
Neg logit contributions | |
�醒 | -7.811 |
Synd | -7.543 |
ahime | -7.267 |
anda | -7.187 |
synd | -7.151 |
Token | That |
Token ID | 2504 |
Feature activation | -4.32e-01 |
Pos logit contributions | |
Guilty | +10.583 |
GH | +9.211 |
ready | +9.093 |
NG | +9.075 |
naire | +8.578 |
Neg logit contributions | |
�醒 | -8.281 |
Synd | -8.094 |
synd | -7.936 |
ahime | -7.551 |
iliate | -7.409 |
Token | 's |
Token ID | 338 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
Guilty | +5.813 |
GH | +4.741 |
que | +4.683 |
NG | +4.611 |
naire | +4.589 |
Neg logit contributions | |
�醒 | -4.523 |
Synd | -4.520 |
synd | -4.393 |
anda | -4.304 |
ahime | -4.272 |
Token | unfair |
Token ID | 11675 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
Guilty | +4.031 |
GH | +3.279 |
que | +3.235 |
NG | +3.199 |
naire | +3.167 |
Neg logit contributions | |
�醒 | -3.079 |
Synd | -3.040 |
synd | -2.964 |
anda | -2.959 |
ahime | -2.852 |
Token | !" |
Token ID | 2474 |
Feature activation | -4.93e-01 |
Pos logit contributions | |
Guilty | +2.196 |
GH | +1.831 |
que | +1.792 |
NG | +1.785 |
naire | +1.783 |
Neg logit contributions | |
Synd | -1.611 |
�醒 | -1.578 |
synd | -1.559 |
anda | -1.552 |
ahime | -1.477 |
Token |
|
Token ID | 198 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
Guilty | +6.621 |
que | +5.285 |
GH | +5.265 |
NG | +5.239 |
naire | +5.150 |
Neg logit contributions | |
�醒 | -5.242 |
Synd | -5.067 |
anda | -4.966 |
ahime | -4.946 |
synd | -4.936 |
Token |
|
Token ID | 198 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
Synd | +1.445 |
synd | +1.397 |
anda | +1.387 |
�醒 | +1.300 |
Tad | +1.292 |
Neg logit contributions | |
Guilty | -2.201 |
GH | -1.835 |
naire | -1.800 |
que | -1.794 |
NG | -1.783 |
Token | New |
Token ID | 3791 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
Guilty | +3.430 |
GH | +2.890 |
NG | +2.820 |
ready | +2.713 |
naire | +2.702 |
Neg logit contributions | |
Synd | -3.315 |
�醒 | -3.246 |
synd | -3.240 |
anda | -3.138 |
ahime | -3.107 |
Token | York |
Token ID | 1971 |
Feature activation | +2.87e-02 |
Pos logit contributions | |
Synd | +2.073 |
synd | +2.019 |
anda | +2.009 |
�醒 | +1.945 |
Tad | +1.891 |
Neg logit contributions | |
Guilty | -2.827 |
GH | -2.375 |
naire | -2.332 |
NG | -2.317 |
que | -2.298 |
Token | the |
Token ID | 262 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
Guilty | +8.035 |
GH | +6.722 |
que | +6.687 |
NG | +6.597 |
naire | +6.480 |
Neg logit contributions | |
�醒 | -6.112 |
Synd | -5.841 |
anda | -5.663 |
synd | -5.602 |
andowski | -5.537 |
Token | primary |
Token ID | 4165 |
Feature activation | -4.53e-01 |
Pos logit contributions | |
Guilty | +3.130 |
GH | +2.636 |
que | +2.609 |
NG | +2.573 |
naire | +2.568 |
Neg logit contributions | |
Synd | -1.866 |
�醒 | -1.846 |
anda | -1.804 |
synd | -1.788 |
ahime | -1.695 |
Token | culprit |
Token ID | 26581 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
Guilty | +6.164 |
GH | +5.113 |
que | +5.086 |
NG | +4.914 |
ready | +4.879 |
Neg logit contributions | |
�醒 | -4.736 |
Synd | -4.631 |
anda | -4.531 |
synd | -4.377 |
ahime | -4.285 |
Token | is |
Token ID | 318 |
Feature activation | -3.47e-01 |
Pos logit contributions | |
Guilty | +3.366 |
GH | +2.772 |
que | +2.712 |
NG | +2.688 |
naire | +2.687 |
Neg logit contributions | |
Synd | -2.666 |
�醒 | -2.639 |
anda | -2.574 |
synd | -2.550 |
ahime | -2.454 |
Token | injection |
Token ID | 16954 |
Feature activation | -5.12e-01 |
Pos logit contributions | |
Guilty | +4.564 |
GH | +3.799 |
que | +3.762 |
NG | +3.695 |
naire | +3.682 |
Neg logit contributions | |
�醒 | -3.761 |
Synd | -3.729 |
anda | -3.619 |
synd | -3.561 |
andowski | -3.462 |
Token | - |
Token ID | 12 |
Feature activation | -8.36e-01 |
Pos logit contributions | |
Guilty | +4.854 |
que | +3.900 |
GH | +3.742 |
NG | +3.706 |
ready | +3.610 |
Neg logit contributions | |
�醒 | -7.283 |
Synd | -7.074 |
anda | -6.984 |
andowski | -6.846 |
Mutual | -6.803 |
Token | drug |
Token ID | 30349 |
Feature activation | -3.73e-01 |
Pos logit contributions | |
Guilty | +9.000 |
ready | +7.861 |
NG | +7.586 |
GH | +7.560 |
eligible | +7.451 |
Neg logit contributions | |
�醒 | -10.419 |
Synd | -9.835 |
andowski | -9.338 |
Mutual | -9.269 |
synd | -9.240 |
Token | use |
Token ID | 779 |
Feature activation | -4.47e-01 |
Pos logit contributions | |
Guilty | +4.955 |
GH | +4.087 |
que | +4.040 |
NG | +3.943 |
ready | +3.876 |
Neg logit contributions | |
�醒 | -4.036 |
Synd | -3.935 |
anda | -3.894 |
synd | -3.746 |
ahime | -3.677 |
Token | , |
Token ID | 11 |
Feature activation | -2.68e-01 |
Pos logit contributions | |
Guilty | +5.839 |
que | +4.817 |
GH | +4.801 |
NG | +4.712 |
naire | +4.676 |
Neg logit contributions | |
�醒 | -4.855 |
Synd | -4.720 |
anda | -4.521 |
synd | -4.436 |
ahime | -4.353 |
Token | and |
Token ID | 290 |
Feature activation | -4.54e-01 |
Pos logit contributions | |
Guilty | +3.683 |
GH | +3.067 |
que | +3.028 |
NG | +2.991 |
naire | +2.980 |
Neg logit contributions | |
�醒 | -2.800 |
Synd | -2.760 |
anda | -2.677 |
synd | -2.655 |
ahime | -2.530 |
Token | heterosexual |
Token ID | 24026 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
Guilty | +6.034 |
que | +5.030 |
GH | +5.015 |
NG | +4.963 |
naire | +4.855 |
Neg logit contributions | |
�醒 | -4.842 |
Synd | -4.664 |
anda | -4.539 |
synd | -4.434 |
ahime | -4.363 |
Token | from |
Token ID | 422 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
Guilty | +3.990 |
GH | +3.294 |
que | +3.261 |
NG | +3.243 |
naire | +3.228 |
Neg logit contributions | |
�醒 | -3.335 |
Synd | -3.278 |
anda | -3.171 |
synd | -3.126 |
utt | -3.001 |
Token | 2 |
Token ID | 362 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
Guilty | +1.982 |
GH | +1.657 |
que | +1.623 |
NG | +1.621 |
naire | +1.619 |
Neg logit contributions | |
Synd | -1.390 |
�醒 | -1.372 |
anda | -1.347 |
synd | -1.342 |
ahime | -1.262 |
Token | to |
Token ID | 284 |
Feature activation | -2.08e-01 |
Pos logit contributions | |
Guilty | +6.975 |
GH | +5.891 |
NG | +5.751 |
que | +5.690 |
naire | +5.557 |
Neg logit contributions | |
Synd | -6.045 |
�醒 | -5.864 |
synd | -5.799 |
anda | -5.766 |
ahime | -5.644 |
Token | 10 |
Token ID | 838 |
Feature activation | -7.19e-01 |
Pos logit contributions | |
Guilty | +2.991 |
GH | +2.506 |
que | +2.460 |
NG | +2.454 |
naire | +2.450 |
Neg logit contributions | |
�醒 | -2.044 |
Synd | -2.030 |
anda | -1.973 |
synd | -1.958 |
ahime | -1.868 |
Token | months |
Token ID | 1933 |
Feature activation | -5.98e-01 |
Pos logit contributions | |
Guilty | +8.866 |
GH | +7.627 |
que | +7.484 |
NG | +7.469 |
naire | +7.161 |
Neg logit contributions | |
�醒 | -7.527 |
Synd | -7.313 |
anda | -7.115 |
ahime | -7.029 |
synd | -7.003 |
Token | per |
Token ID | 583 |
Feature activation | -8.35e-01 |
Pos logit contributions | |
Guilty | +7.474 |
que | +6.329 |
GH | +6.279 |
naire | +6.136 |
NG | +6.064 |
Neg logit contributions | |
�醒 | -6.620 |
Synd | -6.242 |
anda | -6.112 |
synd | -5.967 |
ahime | -5.951 |
Token | year |
Token ID | 614 |
Feature activation | -5.16e-01 |
Pos logit contributions | |
Guilty | +7.542 |
GH | +6.075 |
que | +5.881 |
NG | +5.779 |
ready | +5.677 |
Neg logit contributions | |
�醒 | -11.446 |
Synd | -10.985 |
anda | -10.584 |
ahime | -10.424 |
andowski | -10.372 |
Token | , |
Token ID | 11 |
Feature activation | -5.49e-02 |
Pos logit contributions | |
Guilty | +6.539 |
que | +5.449 |
GH | +5.440 |
naire | +5.299 |
NG | +5.288 |
Neg logit contributions | |
�醒 | -5.699 |
Synd | -5.487 |
anda | -5.297 |
synd | -5.258 |
ahime | -5.077 |
Token | and |
Token ID | 290 |
Feature activation | -3.04e-01 |
Pos logit contributions | |
Guilty | +0.788 |
GH | +0.661 |
naire | +0.645 |
que | +0.644 |
NG | +0.644 |
Neg logit contributions | |
Synd | -0.546 |
�醒 | -0.530 |
synd | -0.529 |
anda | -0.526 |
ahime | -0.491 |
Token | in |
Token ID | 287 |
Feature activation | -9.55e-01 |
Pos logit contributions | |
Guilty | +4.059 |
GH | +3.380 |
que | +3.342 |
NG | +3.332 |
naire | +3.301 |
Neg logit contributions | |
�醒 | -3.255 |
Synd | -3.192 |
anda | -3.106 |
synd | -3.072 |
ahime | -2.947 |
Token | the |
Token ID | 262 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
Guilty | +10.771 |
que | +9.020 |
GH | +9.001 |
NG | +8.907 |
ready | +8.612 |
Neg logit contributions | |
�醒 | -10.854 |
Synd | -9.743 |
anda | -9.733 |
andowski | -9.430 |
owship | -9.244 |
Token | only |
Token ID | 691 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
Guilty | +0.681 |
GH | +0.567 |
naire | +0.554 |
que | +0.554 |
NG | +0.553 |
Neg logit contributions | |
Synd | -0.504 |
synd | -0.488 |
�醒 | -0.488 |
anda | -0.486 |
ahime | -0.456 |
Token | , |
Token ID | 11 |
Feature activation | +3.26e-01 |
Pos logit contributions | |
Guilty | +2.156 |
GH | +1.793 |
que | +1.766 |
NG | +1.753 |
naire | +1.748 |
Neg logit contributions | |
Synd | -1.605 |
�醒 | -1.575 |
synd | -1.551 |
anda | -1.551 |
ahime | -1.475 |
Token | after |
Token ID | 706 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
Synd | +3.373 |
synd | +3.271 |
anda | +3.162 |
Tad | +3.032 |
Mutual | +2.975 |
Neg logit contributions | |
Guilty | -4.521 |
GH | -3.850 |
naire | -3.724 |
NG | -3.687 |
ready | -3.629 |
Token | dozens |
Token ID | 9264 |
Feature activation | -1.90e-01 |
Pos logit contributions | |
Guilty | +2.121 |
GH | +1.762 |
que | +1.744 |
NG | +1.725 |
naire | +1.719 |
Neg logit contributions | |
Synd | -1.589 |
�醒 | -1.544 |
anda | -1.539 |
synd | -1.533 |
ahime | -1.456 |
Token | of |
Token ID | 286 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
Guilty | +2.458 |
GH | +2.027 |
que | +2.008 |
naire | +1.990 |
NG | +1.978 |
Neg logit contributions | |
Synd | -2.156 |
�醒 | -2.082 |
synd | -2.071 |
anda | -2.066 |
ahime | -1.976 |
Token | people |
Token ID | 661 |
Feature activation | -7.63e-01 |
Pos logit contributions | |
Guilty | +3.726 |
que | +3.098 |
GH | +3.082 |
NG | +3.021 |
naire | +3.012 |
Neg logit contributions | |
Synd | -2.798 |
�醒 | -2.768 |
anda | -2.712 |
synd | -2.655 |
ahime | -2.586 |
Token | began |
Token ID | 2540 |
Feature activation | -8.63e-01 |
Pos logit contributions | |
Guilty | +8.644 |
que | +7.954 |
GH | +6.992 |
naire | +6.983 |
NG | +6.909 |
Neg logit contributions | |
�醒 | -9.209 |
Synd | -8.450 |
anda | -8.125 |
ahime | -8.092 |
iliate | -7.944 |
Token | sleeping |
Token ID | 11029 |
Feature activation | -9.25e-02 |
Pos logit contributions | |
Guilty | +9.862 |
que | +9.045 |
naire | +7.948 |
NG | +7.809 |
GH | +7.790 |
Neg logit contributions | |
�醒 | -9.771 |
ahime | -9.163 |
Synd | -9.078 |
anda | -8.998 |
iliate | -8.833 |
Token | outside |
Token ID | 2354 |
Feature activation | -4.49e-02 |
Pos logit contributions | |
Guilty | +1.267 |
GH | +1.049 |
que | +1.032 |
NG | +1.026 |
naire | +1.023 |
Neg logit contributions | |
Synd | -0.979 |
�醒 | -0.952 |
synd | -0.948 |
anda | -0.946 |
ahime | -0.894 |
Token | the |
Token ID | 262 |
Feature activation | -2.12e-01 |
Pos logit contributions | |
Guilty | +0.640 |
GH | +0.535 |
que | +0.523 |
naire | +0.522 |
NG | +0.522 |
Neg logit contributions | |
Synd | -0.452 |
synd | -0.437 |
�醒 | -0.437 |
anda | -0.435 |
ahime | -0.409 |
Token | premises |
Token ID | 17095 |
Feature activation | -5.84e-01 |
Pos logit contributions | |
Guilty | +2.841 |
GH | +2.337 |
que | +2.311 |
NG | +2.274 |
naire | +2.261 |
Neg logit contributions | |
Synd | -2.274 |
�醒 | -2.249 |
anda | -2.213 |
synd | -2.193 |
ahime | -2.107 |
Token | Y |
Token ID | 575 |
Feature activation | -4.88e-01 |
Pos logit contributions | |
Guilty | +3.077 |
GH | +2.560 |
que | +2.516 |
NG | +2.486 |
naire | +2.483 |
Neg logit contributions | |
Synd | -2.318 |
�醒 | -2.299 |
anda | -2.251 |
synd | -2.247 |
ahime | -2.126 |
Token | Ba |
Token ID | 34458 |
Feature activation | -9.79e-01 |
Pos logit contributions | |
Guilty | +6.463 |
GH | +5.676 |
NG | +5.508 |
que | +5.401 |
naire | +5.288 |
Neg logit contributions | |
Synd | -5.019 |
�醒 | -4.938 |
synd | -4.784 |
anda | -4.561 |
Mutual | -4.517 |
Token | 2 |
Token ID | 17 |
Feature activation | -6.07e-01 |
Pos logit contributions | |
Guilty | +11.269 |
GH | +9.948 |
NG | +9.562 |
que | +9.412 |
ready | +8.731 |
Neg logit contributions | |
Synd | -10.131 |
�醒 | -10.002 |
synd | -9.832 |
ahime | -9.731 |
anda | -9.320 |
Token | Cu |
Token ID | 46141 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
Guilty | +7.555 |
GH | +6.398 |
NG | +6.250 |
que | +6.209 |
ready | +5.947 |
Neg logit contributions | |
Synd | -6.704 |
synd | -6.506 |
�醒 | -6.406 |
anda | -6.306 |
ahime | -6.110 |
Token | 3 |
Token ID | 18 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
Guilty | +11.760 |
GH | +10.253 |
NG | +10.078 |
que | +9.474 |
osite | +8.980 |
Neg logit contributions | |
Synd | -13.560 |
�醒 | -13.544 |
synd | -13.099 |
ahime | -12.922 |
anda | -12.828 |
Token | O |
Token ID | 46 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
Guilty | +10.277 |
GH | +8.981 |
NG | +8.784 |
que | +8.413 |
osite | +8.195 |
Neg logit contributions | |
Synd | -15.552 |
synd | -14.943 |
anda | -14.798 |
�醒 | -14.479 |
ahime | -14.348 |
Token | 6 |
Token ID | 21 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
Guilty | +11.026 |
GH | +9.660 |
NG | +8.916 |
que | +8.847 |
osite | +8.659 |
Neg logit contributions | |
Synd | -15.515 |
�醒 | -15.062 |
synd | -14.635 |
anda | -14.133 |
Mutual | -13.980 |
Token | + |
Token ID | 10 |
Feature activation | -7.86e-01 |
Pos logit contributions | |
Guilty | +11.359 |
GH | +9.786 |
que | +9.337 |
NG | +9.128 |
ready | +8.871 |
Neg logit contributions | |
Synd | -12.280 |
�醒 | -11.861 |
synd | -11.770 |
anda | -11.519 |
ahime | -11.111 |
Token | x |
Token ID | 87 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
Guilty | +9.448 |
GH | +8.296 |
NG | +8.070 |
que | +7.862 |
ready | +7.826 |
Neg logit contributions | |
�醒 | -8.206 |
Synd | -8.071 |
synd | -7.920 |
anda | -7.748 |
Mutual | -7.379 |
Token | , |
Token ID | 11 |
Feature activation | -6.51e-01 |
Pos logit contributions | |
Guilty | +11.886 |
GH | +10.269 |
que | +10.059 |
NG | +9.741 |
anted | +9.561 |
Neg logit contributions | |
Synd | -11.051 |
�醒 | -10.982 |
synd | -10.554 |
anda | -10.179 |
ahime | -9.957 |
Token | is |
Token ID | 318 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
Guilty | +8.103 |
que | +6.691 |
GH | +6.629 |
NG | +6.435 |
naire | +6.346 |
Neg logit contributions | |
�醒 | -7.122 |
Synd | -6.966 |
synd | -6.653 |
anda | -6.650 |
ahime | -6.499 |
Token | at |
Token ID | 379 |
Feature activation | -5.41e-01 |
Pos logit contributions | |
Guilty | +7.795 |
que | +6.355 |
GH | +6.193 |
ready | +6.155 |
NG | +6.116 |
Neg logit contributions | |
�醒 | -7.415 |
Synd | -7.101 |
anda | -6.878 |
synd | -6.864 |
ahime | -6.773 |
Token | the |
Token ID | 262 |
Feature activation | -4.39e-01 |
Pos logit contributions | |
Guilty | +6.623 |
GH | +5.262 |
que | +5.241 |
NG | +5.231 |
naire | +5.192 |
Neg logit contributions | |
�醒 | -6.124 |
Synd | -5.905 |
anda | -5.892 |
synd | -5.743 |
andowski | -5.717 |
Token | bottom |
Token ID | 4220 |
Feature activation | -6.38e-01 |
Pos logit contributions | |
Guilty | +5.395 |
GH | +4.245 |
que | +4.230 |
NG | +4.179 |
naire | +4.156 |
Neg logit contributions | |
�醒 | -5.140 |
Synd | -4.954 |
anda | -4.914 |
synd | -4.860 |
ahime | -4.739 |
Token | of |
Token ID | 286 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
Guilty | +7.149 |
que | +5.640 |
GH | +5.569 |
naire | +5.500 |
ready | +5.492 |
Neg logit contributions | |
�醒 | -7.554 |
Synd | -7.535 |
synd | -7.284 |
anda | -7.194 |
ahime | -7.192 |
Token | any |
Token ID | 597 |
Feature activation | -9.24e-01 |
Pos logit contributions | |
Guilty | +9.315 |
que | +7.404 |
naire | +7.239 |
GH | +7.165 |
NG | +7.089 |
Neg logit contributions | |
�醒 | -9.208 |
anda | -8.680 |
andowski | -8.636 |
Synd | -8.442 |
utt | -8.404 |
Token | game |
Token ID | 983 |
Feature activation | -9.29e-01 |
Pos logit contributions | |
Guilty | +10.554 |
que | +8.676 |
naire | +8.121 |
GH | +8.104 |
NG | +8.082 |
Neg logit contributions | |
�醒 | -10.455 |
anda | -9.772 |
andowski | -9.623 |
Synd | -9.473 |
utt | -9.330 |
Token | page |
Token ID | 2443 |
Feature activation | -2.75e-01 |
Pos logit contributions | |
Guilty | +10.463 |
que | +8.841 |
NG | +8.545 |
naire | +8.359 |
GH | +8.279 |
Neg logit contributions | |
�醒 | -10.436 |
andowski | -9.652 |
anda | -9.577 |
Synd | -9.571 |
ahime | -9.465 |
Token | , |
Token ID | 11 |
Feature activation | -5.21e-01 |
Pos logit contributions | |
Guilty | +3.725 |
GH | +3.060 |
que | +3.032 |
NG | +3.015 |
naire | +3.012 |
Neg logit contributions | |
Synd | -2.900 |
�醒 | -2.869 |
synd | -2.804 |
anda | -2.793 |
ahime | -2.675 |
Token | then |
Token ID | 788 |
Feature activation | -9.13e-01 |
Pos logit contributions | |
Guilty | +6.557 |
que | +5.404 |
GH | +5.272 |
ready | +5.187 |
NG | +5.173 |
Neg logit contributions | |
�醒 | -5.901 |
Synd | -5.633 |
anda | -5.580 |
ahime | -5.408 |
andowski | -5.372 |
Token | " |
Token ID | 366 |
Feature activation | -5.88e-01 |
Pos logit contributions | |
Guilty | +10.239 |
que | +8.685 |
ready | +8.080 |
GH | +8.046 |
NG | +7.826 |
Neg logit contributions | |
�醒 | -10.651 |
anda | -10.021 |
ahime | -9.950 |
Synd | -9.632 |
andowski | -9.616 |
Token | Print |
Token ID | 18557 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
Guilty | +7.757 |
GH | +6.773 |
NG | +6.665 |
ready | +6.558 |
que | +6.307 |
Neg logit contributions | |
�醒 | -5.854 |
Synd | -5.853 |
anda | -5.691 |
synd | -5.666 |
ahime | -5.477 |