Token | along |
Token ID | 1863 |
Feature activation | +5.15e-01 |
Pos logit contributions | |
zzle | +5.647 |
mble | +4.768 |
uers | +4.659 |
IRE | +4.657 |
reckoning | +4.266 |
Neg logit contributions | |
enh | -8.494 |
practice | -8.445 |
adapt | -8.243 |
ゴン | -8.241 |
Occupations | -8.146 |
Token | the |
Token ID | 262 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
zzle | +1.994 |
mble | +1.740 |
uers | +1.708 |
IRE | +1.703 |
reckoning | +1.560 |
Neg logit contributions | |
enh | -2.340 |
practice | -2.320 |
adapt | -2.255 |
ゴン | -2.231 |
Occupations | -2.226 |
Token | city |
Token ID | 1748 |
Feature activation | +9.75e-01 |
Pos logit contributions | |
zzle | +1.271 |
mble | +1.112 |
uers | +1.087 |
IRE | +1.080 |
reckoning | +0.983 |
Neg logit contributions | |
enh | -1.534 |
practice | -1.516 |
adapt | -1.476 |
Occupations | -1.459 |
theless | -1.447 |
Token | 's |
Token ID | 338 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
zzle | +4.347 |
mble | +3.853 |
uers | +3.799 |
IRE | +3.795 |
reckoning | +3.531 |
Neg logit contributions | |
enh | -3.841 |
practice | -3.812 |
adapt | -3.693 |
ゴン | -3.653 |
Occupations | -3.642 |
Token | broad |
Token ID | 3154 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
zzle | +5.663 |
mble | +5.012 |
IRE | +4.929 |
uers | +4.925 |
reckoning | +4.594 |
Neg logit contributions | |
enh | -5.179 |
practice | -5.142 |
adapt | -4.973 |
ゴン | -4.955 |
Occupations | -4.909 |
Token | bou |
Token ID | 35833 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
zzle | +4.585 |
mble | +4.039 |
uers | +3.997 |
IRE | +3.963 |
reckoning | +3.629 |
Neg logit contributions | |
enh | -4.978 |
practice | -4.930 |
adapt | -4.769 |
Occupations | -4.700 |
theless | -4.677 |
Token | lev |
Token ID | 2768 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
zzle | +9.955 |
uers | +7.824 |
IRE | +7.437 |
mble | +7.268 |
htar | +6.687 |
Neg logit contributions | |
ゴン | -18.649 |
theless | -17.549 |
Occupations | -17.518 |
practice | -17.250 |
Provided | -16.761 |
Token | ards |
Token ID | 1371 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
zzle | +5.258 |
uers | +4.658 |
mble | +4.639 |
IRE | +4.603 |
reckoning | +4.274 |
Neg logit contributions | |
enh | -4.341 |
practice | -4.309 |
ゴン | -4.236 |
adapt | -4.157 |
Occupations | -4.120 |
Token | in |
Token ID | 287 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
zzle | +7.331 |
IRE | +6.153 |
mble | +6.093 |
uers | +6.058 |
reckoning | +5.661 |
Neg logit contributions | |
practice | -9.841 |
enh | -9.841 |
ゴン | -9.769 |
adapt | -9.638 |
odor | -9.420 |
Token | support |
Token ID | 1104 |
Feature activation | +6.26e-02 |
Pos logit contributions | |
zzle | +7.469 |
mble | +6.616 |
IRE | +6.525 |
uers | +6.439 |
reckoning | +6.099 |
Neg logit contributions | |
enh | -7.399 |
practice | -7.262 |
ゴン | -7.140 |
adapt | -7.086 |
Occupations | -7.010 |
Token | , |
Token ID | 11 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
zzle | +0.289 |
mble | +0.258 |
uers | +0.255 |
IRE | +0.254 |
reckoning | +0.236 |
Neg logit contributions | |
enh | -0.238 |
practice | -0.235 |
adapt | -0.227 |
ゴン | -0.224 |
Occupations | -0.224 |
Token | to |
Token ID | 284 |
Feature activation | +2.42e-01 |
Pos logit contributions | |
zzle | +3.278 |
mble | +2.959 |
uers | +2.889 |
IRE | +2.884 |
reckoning | +2.665 |
Neg logit contributions | |
enh | -2.934 |
practice | -2.898 |
adapt | -2.809 |
ゴン | -2.751 |
Occupations | -2.749 |
Token | attend |
Token ID | 5262 |
Feature activation | -7.75e-01 |
Pos logit contributions | |
zzle | +1.068 |
mble | +0.959 |
IRE | +0.951 |
uers | +0.937 |
reckoning | +0.859 |
Neg logit contributions | |
practice | -0.973 |
enh | -0.973 |
adapt | -0.939 |
theless | -0.912 |
odor | -0.901 |
Token | a |
Token ID | 257 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
enh | +2.980 |
practice | +2.961 |
Occupations | +2.822 |
adapt | +2.804 |
theless | +2.787 |
Neg logit contributions | |
zzle | -3.332 |
mble | -3.133 |
uers | -3.026 |
IRE | -2.901 |
reckoning | -2.631 |
Token | meeting |
Token ID | 3249 |
Feature activation | -2.18e-01 |
Pos logit contributions | |
zzle | +0.974 |
mble | +0.869 |
uers | +0.852 |
IRE | +0.835 |
reckoning | +0.750 |
Neg logit contributions | |
practice | -1.102 |
enh | -1.098 |
adapt | -1.050 |
Occupations | -1.044 |
theless | -1.036 |
Token | , |
Token ID | 11 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
enh | +0.865 |
practice | +0.852 |
adapt | +0.827 |
theless | +0.811 |
Occupations | +0.811 |
Neg logit contributions | |
zzle | -0.950 |
mble | -0.885 |
IRE | -0.848 |
uers | -0.843 |
reckoning | -0.756 |
Token | Pu |
Token ID | 11634 |
Feature activation | +3.44e+00 |
Pos logit contributions | |
zzle | +7.736 |
mble | +6.912 |
IRE | +6.833 |
uers | +6.825 |
reckoning | +6.396 |
Neg logit contributions | |
enh | -5.772 |
practice | -5.729 |
adapt | -5.505 |
ゴン | -5.503 |
Occupations | -5.415 |
Token | ig |
Token ID | 328 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
zzle | +10.132 |
uers | +8.077 |
IRE | +7.552 |
mble | +7.363 |
htar | +7.039 |
Neg logit contributions | |
ゴン | -17.271 |
practice | -16.961 |
theless | -16.662 |
Occupations | -16.323 |
adapt | -16.236 |
Token | dem |
Token ID | 9536 |
Feature activation | +5.57e-02 |
Pos logit contributions | |
zzle | +7.068 |
uers | +6.294 |
mble | +6.240 |
IRE | +6.095 |
reckoning | +5.747 |
Neg logit contributions | |
practice | -5.284 |
enh | -5.274 |
Occupations | -5.119 |
ゴン | -5.077 |
adapt | -5.057 |
Token | ont |
Token ID | 756 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
zzle | +0.258 |
mble | +0.237 |
IRE | +0.235 |
uers | +0.230 |
reckoning | +0.217 |
Neg logit contributions | |
enh | -0.215 |
practice | -0.206 |
adapt | -0.202 |
odor | -0.196 |
theless | -0.190 |
Token | said |
Token ID | 531 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
enh | +0.544 |
practice | +0.519 |
adapt | +0.512 |
theless | +0.507 |
Provided | +0.504 |
Neg logit contributions | |
zzle | -0.417 |
mble | -0.381 |
uers | -0.365 |
IRE | -0.364 |
reckoning | -0.325 |
Token | : |
Token ID | 25 |
Feature activation | -6.22e-01 |
Pos logit contributions | |
zzle | +2.247 |
mble | +2.021 |
uers | +1.979 |
IRE | +1.976 |
reckoning | +1.832 |
Neg logit contributions | |
enh | -1.978 |
practice | -1.958 |
adapt | -1.890 |
Occupations | -1.863 |
ゴン | -1.849 |
Token | First |
Token ID | 5962 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
zzle | +0.231 |
mble | +0.211 |
uers | +0.205 |
IRE | +0.197 |
reckoning | +0.193 |
Neg logit contributions | |
enh | -0.178 |
practice | -0.176 |
adapt | -0.172 |
odor | -0.161 |
Occupations | -0.161 |
Token | , |
Token ID | 11 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
zzle | +6.831 |
mble | +5.928 |
IRE | +5.921 |
uers | +5.867 |
reckoning | +5.495 |
Neg logit contributions | |
enh | -6.564 |
practice | -6.527 |
adapt | -6.313 |
ゴン | -6.249 |
Occupations | -6.166 |
Token | the |
Token ID | 262 |
Feature activation | -7.49e-01 |
Pos logit contributions | |
enh | +0.628 |
practice | +0.615 |
Occupations | +0.600 |
adapt | +0.597 |
theless | +0.586 |
Neg logit contributions | |
zzle | -0.662 |
mble | -0.598 |
uers | -0.588 |
IRE | -0.574 |
reckoning | -0.518 |
Token | address |
Token ID | 2209 |
Feature activation | +9.71e-01 |
Pos logit contributions | |
enh | +2.828 |
practice | +2.799 |
Occupations | +2.721 |
odor | +2.690 |
adapt | +2.688 |
Neg logit contributions | |
zzle | -3.363 |
mble | -3.007 |
uers | -2.971 |
IRE | -2.866 |
htar | -2.617 |
Token | by |
Token ID | 416 |
Feature activation | +6.30e-01 |
Pos logit contributions | |
zzle | +3.939 |
mble | +3.462 |
uers | +3.396 |
IRE | +3.379 |
reckoning | +3.094 |
Neg logit contributions | |
enh | -4.309 |
practice | -4.244 |
adapt | -4.140 |
Occupations | -4.055 |
ゴン | -4.042 |
Token | Pu |
Token ID | 11634 |
Feature activation | +3.44e+00 |
Pos logit contributions | |
zzle | +2.793 |
mble | +2.485 |
uers | +2.427 |
IRE | +2.422 |
reckoning | +2.211 |
Neg logit contributions | |
enh | -2.553 |
practice | -2.528 |
Occupations | -2.450 |
adapt | -2.446 |
theless | -2.421 |
Token | ig |
Token ID | 328 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
zzle | +10.176 |
uers | +8.077 |
IRE | +7.972 |
mble | +7.397 |
reckoning | +7.145 |
Neg logit contributions | |
ゴン | -17.335 |
practice | -16.842 |
theless | -16.554 |
Occupations | -16.302 |
adapt | -15.988 |
Token | dem |
Token ID | 9536 |
Feature activation | +4.02e-01 |
Pos logit contributions | |
zzle | +6.860 |
mble | +6.168 |
uers | +6.116 |
IRE | +6.075 |
reckoning | +5.707 |
Neg logit contributions | |
enh | -4.538 |
practice | -4.494 |
adapt | -4.321 |
ゴン | -4.307 |
Occupations | -4.281 |
Token | ont |
Token ID | 756 |
Feature activation | -4.59e-01 |
Pos logit contributions | |
zzle | +1.814 |
mble | +1.641 |
IRE | +1.611 |
uers | +1.597 |
reckoning | +1.491 |
Neg logit contributions | |
enh | -1.608 |
practice | -1.566 |
adapt | -1.526 |
odor | -1.477 |
Occupations | -1.452 |
Token | before |
Token ID | 878 |
Feature activation | -3.19e-02 |
Pos logit contributions | |
enh | +1.744 |
practice | +1.648 |
adapt | +1.617 |
theless | +1.603 |
odor | +1.575 |
Neg logit contributions | |
zzle | -2.092 |
mble | -1.954 |
IRE | -1.877 |
uers | -1.872 |
reckoning | -1.651 |
Token | the |
Token ID | 262 |
Feature activation | +4.51e-03 |
Pos logit contributions | |
enh | +0.129 |
practice | +0.128 |
adapt | +0.124 |
Occupations | +0.123 |
theless | +0.122 |
Neg logit contributions | |
zzle | -0.138 |
mble | -0.123 |
uers | -0.121 |
IRE | -0.119 |
reckoning | -0.107 |
Token | hate |
Token ID | 5465 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
zzle | +2.133 |
mble | +1.920 |
uers | +1.857 |
IRE | +1.856 |
reckoning | +1.686 |
Neg logit contributions | |
enh | -2.373 |
practice | -2.335 |
adapt | -2.248 |
Occupations | -2.213 |
odor | -2.195 |
Token | the |
Token ID | 262 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
enh | +4.204 |
practice | +4.040 |
odor | +3.947 |
adapt | +3.802 |
bid | +3.751 |
Neg logit contributions | |
zzle | -4.532 |
mble | -4.148 |
uers | -4.060 |
IRE | -4.049 |
reckoning | -3.559 |
Token | taste |
Token ID | 6938 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
enh | +3.814 |
practice | +3.651 |
odor | +3.566 |
adapt | +3.499 |
Occupations | +3.365 |
Neg logit contributions | |
zzle | -4.815 |
mble | -4.511 |
IRE | -4.283 |
uers | -4.233 |
reckoning | -3.882 |
Token | of |
Token ID | 286 |
Feature activation | +5.17e-01 |
Pos logit contributions | |
zzle | +1.537 |
mble | +1.366 |
IRE | +1.315 |
uers | +1.310 |
reckoning | +1.200 |
Neg logit contributions | |
enh | -1.986 |
practice | -1.932 |
adapt | -1.882 |
ゴン | -1.861 |
odor | -1.850 |
Token | their |
Token ID | 511 |
Feature activation | +9.32e-01 |
Pos logit contributions | |
zzle | +2.317 |
mble | +2.084 |
IRE | +2.042 |
uers | +2.042 |
reckoning | +1.855 |
Neg logit contributions | |
enh | -2.080 |
practice | -2.036 |
adapt | -1.962 |
Occupations | -1.939 |
odor | -1.938 |
Token | ejac |
Token ID | 39426 |
Feature activation | +3.36e+00 |
Pos logit contributions | |
zzle | +4.404 |
mble | +3.947 |
uers | +3.867 |
IRE | +3.861 |
reckoning | +3.570 |
Neg logit contributions | |
enh | -3.520 |
practice | -3.464 |
adapt | -3.336 |
Occupations | -3.281 |
ゴン | -3.278 |
Token | ulate |
Token ID | 5039 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
zzle | +10.106 |
uers | +9.209 |
IRE | +8.446 |
mble | +8.233 |
reckoning | +7.625 |
Neg logit contributions | |
ゴン | -16.042 |
practice | -15.770 |
Occupations | -15.738 |
theless | -15.629 |
enh | -15.540 |
Token | . |
Token ID | 13 |
Feature activation | +2.08e-02 |
Pos logit contributions | |
zzle | +7.694 |
mble | +6.584 |
uers | +6.567 |
IRE | +6.522 |
reckoning | +6.101 |
Neg logit contributions | |
practice | -8.228 |
enh | -8.093 |
ゴン | -7.930 |
adapt | -7.916 |
Occupations | -7.906 |
Token | And |
Token ID | 843 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
zzle | +0.115 |
mble | +0.107 |
uers | +0.104 |
IRE | +0.103 |
reckoning | +0.098 |
Neg logit contributions | |
enh | -0.062 |
practice | -0.060 |
Occupations | -0.059 |
adapt | -0.058 |
Provided | -0.056 |
Token | there |
Token ID | 612 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
enh | +0.422 |
practice | +0.407 |
adapt | +0.395 |
odor | +0.393 |
Occupations | +0.391 |
Neg logit contributions | |
zzle | -0.464 |
mble | -0.421 |
IRE | -0.410 |
uers | -0.407 |
reckoning | -0.375 |
Token | � |
Token ID | 447 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
enh | +3.901 |
practice | +3.767 |
adapt | +3.663 |
bid | +3.593 |
theless | +3.583 |
Neg logit contributions | |
zzle | -4.607 |
IRE | -4.218 |
mble | -4.176 |
uers | -4.088 |
reckoning | -3.854 |
Token | imagine |
Token ID | 5967 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
enh | +1.619 |
practice | +1.596 |
adapt | +1.536 |
bid | +1.530 |
abil | +1.508 |
Neg logit contributions | |
zzle | -1.248 |
mble | -1.110 |
IRE | -1.073 |
uers | -1.071 |
reckoning | -0.959 |
Token | how |
Token ID | 703 |
Feature activation | +7.72e-01 |
Pos logit contributions | |
zzle | +5.459 |
mble | +4.848 |
uers | +4.778 |
IRE | +4.765 |
reckoning | +4.417 |
Neg logit contributions | |
enh | -5.012 |
practice | -4.950 |
adapt | -4.784 |
Occupations | -4.730 |
ゴン | -4.707 |
Token | many |
Token ID | 867 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
zzle | +3.676 |
mble | +3.307 |
uers | +3.237 |
IRE | +3.212 |
reckoning | +2.978 |
Neg logit contributions | |
enh | -2.891 |
practice | -2.847 |
adapt | -2.744 |
Occupations | -2.723 |
theless | -2.676 |
Token | more |
Token ID | 517 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
zzle | +6.574 |
mble | +5.882 |
uers | +5.794 |
IRE | +5.782 |
reckoning | +5.391 |
Neg logit contributions | |
enh | -5.238 |
practice | -5.182 |
adapt | -5.004 |
ゴン | -4.935 |
Occupations | -4.928 |
Token | people |
Token ID | 661 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
zzle | +7.238 |
mble | +6.485 |
uers | +6.390 |
IRE | +6.380 |
reckoning | +5.956 |
Neg logit contributions | |
enh | -5.588 |
practice | -5.530 |
adapt | -5.340 |
ゴン | -5.270 |
Occupations | -5.248 |
Token | would |
Token ID | 561 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
zzle | +6.519 |
mble | +5.706 |
uers | +5.602 |
IRE | +5.596 |
reckoning | +5.146 |
Neg logit contributions | |
enh | -7.234 |
practice | -7.169 |
adapt | -6.969 |
ゴン | -6.919 |
Occupations | -6.863 |
Token | � |
Token ID | 447 |
Feature activation | +7.56e-01 |
Pos logit contributions | |
zzle | +12.502 |
mble | +10.945 |
IRE | +10.538 |
uers | +10.447 |
reckoning | +9.734 |
Neg logit contributions | |
ゴン | -14.154 |
enh | -13.436 |
practice | -13.098 |
Occupations | -13.017 |
adapt | -12.918 |
Token | � |
Token ID | 247 |
Feature activation | +8.37e-01 |
Pos logit contributions | |
zzle | +3.279 |
mble | +2.962 |
uers | +2.886 |
IRE | +2.866 |
reckoning | +2.688 |
Neg logit contributions | |
enh | -3.103 |
practice | -3.058 |
adapt | -2.941 |
ゴン | -2.936 |
Occupations | -2.924 |
Token | ve |
Token ID | 303 |
Feature activation | +6.37e-01 |
Pos logit contributions | |
zzle | +4.155 |
mble | +3.728 |
uers | +3.714 |
IRE | +3.693 |
reckoning | +3.480 |
Neg logit contributions | |
enh | -2.937 |
practice | -2.920 |
adapt | -2.797 |
theless | -2.720 |
Occupations | -2.708 |
Token | been |
Token ID | 587 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
zzle | +2.885 |
mble | +2.552 |
uers | +2.544 |
IRE | +2.531 |
reckoning | +2.354 |
Neg logit contributions | |
enh | -2.518 |
practice | -2.497 |
adapt | -2.400 |
theless | -2.391 |
Occupations | -2.373 |
Token | protesting |
Token ID | 23655 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
zzle | +6.565 |
mble | +5.722 |
uers | +5.642 |
IRE | +5.635 |
reckoning | +5.192 |
Neg logit contributions | |
enh | -7.094 |
practice | -7.052 |
ゴン | -6.852 |
adapt | -6.851 |
Occupations | -6.759 |
Token | Laurent |
Token ID | 39734 |
Feature activation | -4.63e-02 |
Pos logit contributions | |
enh | +3.314 |
adapt | +3.189 |
practice | +3.106 |
Provided | +3.049 |
odor | +3.019 |
Neg logit contributions | |
zzle | -4.921 |
mble | -4.448 |
IRE | -4.323 |
uers | -4.249 |
reckoning | -3.948 |
Token | Fab |
Token ID | 14236 |
Feature activation | +9.95e-01 |
Pos logit contributions | |
enh | +0.159 |
practice | +0.153 |
adapt | +0.152 |
Provided | +0.148 |
theless | +0.147 |
Neg logit contributions | |
zzle | -0.233 |
mble | -0.212 |
uers | -0.208 |
IRE | -0.202 |
reckoning | -0.192 |
Token | ius |
Token ID | 3754 |
Feature activation | +7.40e-02 |
Pos logit contributions | |
zzle | +4.987 |
mble | +4.496 |
uers | +4.432 |
IRE | +4.426 |
reckoning | +4.149 |
Neg logit contributions | |
enh | -3.396 |
practice | -3.357 |
adapt | -3.233 |
ゴン | -3.182 |
Occupations | -3.173 |
Token | told |
Token ID | 1297 |
Feature activation | -7.32e-02 |
Pos logit contributions | |
zzle | +0.306 |
mble | +0.276 |
IRE | +0.266 |
uers | +0.265 |
reckoning | +0.241 |
Neg logit contributions | |
enh | -0.322 |
practice | -0.307 |
adapt | -0.302 |
theless | -0.298 |
odor | -0.293 |
Token | the |
Token ID | 262 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
enh | +0.270 |
practice | +0.264 |
adapt | +0.260 |
Occupations | +0.250 |
odor | +0.249 |
Neg logit contributions | |
zzle | -0.347 |
mble | -0.310 |
IRE | -0.298 |
uers | -0.292 |
reckoning | -0.282 |
Token | opening |
Token ID | 4756 |
Feature activation | +3.29e+00 |
Pos logit contributions | |
enh | +1.052 |
practice | +1.018 |
odor | +0.986 |
adapt | +0.985 |
Occupations | +0.985 |
Neg logit contributions | |
zzle | -1.577 |
mble | -1.422 |
IRE | -1.374 |
uers | -1.355 |
reckoning | -1.284 |
Token | of |
Token ID | 286 |
Feature activation | +1.72e+00 |
Pos logit contributions | |
zzle | +12.252 |
uers | +10.801 |
mble | +10.682 |
IRE | +10.568 |
reckoning | +9.917 |
Neg logit contributions | |
enh | -13.403 |
practice | -13.307 |
adapt | -13.093 |
ゴン | -13.015 |
Occupations | -12.894 |
Token | a |
Token ID | 257 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
zzle | +6.901 |
mble | +6.107 |
uers | +6.008 |
IRE | +5.974 |
reckoning | +5.512 |
Neg logit contributions | |
enh | -7.377 |
practice | -7.326 |
ゴン | -7.095 |
adapt | -7.070 |
Occupations | -7.025 |
Token | two |
Token ID | 734 |
Feature activation | +2.76e-01 |
Pos logit contributions | |
zzle | +7.590 |
mble | +6.784 |
uers | +6.687 |
IRE | +6.661 |
reckoning | +6.222 |
Neg logit contributions | |
enh | -6.806 |
practice | -6.752 |
ゴン | -6.529 |
adapt | -6.525 |
Occupations | -6.463 |
Token | - |
Token ID | 12 |
Feature activation | -6.10e-01 |
Pos logit contributions | |
zzle | +1.211 |
mble | +1.070 |
IRE | +1.047 |
uers | +1.043 |
reckoning | +0.968 |
Neg logit contributions | |
enh | -1.122 |
practice | -1.113 |
adapt | -1.070 |
ゴン | -1.065 |
Occupations | -1.053 |
Token | day |
Token ID | 820 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
practice | +1.533 |
enh | +1.530 |
adapt | +1.379 |
standard | +1.325 |
bid | +1.280 |
Neg logit contributions | |
zzle | -3.666 |
mble | -3.378 |
IRE | -3.309 |
uers | -3.282 |
reckoning | -3.152 |
Token | UP |
Token ID | 8577 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
zzle | +1.493 |
mble | +1.293 |
uers | +1.226 |
IRE | +1.214 |
reckoning | +1.135 |
Neg logit contributions | |
enh | -2.253 |
practice | -2.215 |
adapt | -2.160 |
odor | -2.131 |
Occupations | -2.117 |
Token | will |
Token ID | 481 |
Feature activation | +6.33e-01 |
Pos logit contributions | |
zzle | +4.536 |
mble | +4.022 |
uers | +3.972 |
IRE | +3.933 |
reckoning | +3.629 |
Neg logit contributions | |
enh | -4.281 |
practice | -4.222 |
adapt | -4.099 |
Occupations | -4.042 |
theless | -4.023 |
Token | continue |
Token ID | 2555 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
zzle | +2.724 |
mble | +2.422 |
IRE | +2.389 |
uers | +2.383 |
reckoning | +2.156 |
Neg logit contributions | |
enh | -2.644 |
practice | -2.623 |
adapt | -2.552 |
theless | -2.517 |
odor | -2.455 |
Token | to |
Token ID | 284 |
Feature activation | -5.89e-01 |
Pos logit contributions | |
enh | +0.918 |
practice | +0.913 |
adapt | +0.868 |
theless | +0.865 |
Occupations | +0.852 |
Neg logit contributions | |
zzle | -1.061 |
uers | -0.959 |
mble | -0.955 |
IRE | -0.928 |
reckoning | -0.823 |
Token | support |
Token ID | 1104 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
practice | +2.442 |
enh | +2.417 |
theless | +2.371 |
adapt | +2.334 |
bid | +2.265 |
Neg logit contributions | |
zzle | -2.428 |
mble | -2.213 |
uers | -2.174 |
IRE | -2.143 |
reckoning | -1.890 |
Token | Pu |
Token ID | 11634 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
enh | +3.136 |
practice | +3.054 |
adapt | +3.002 |
Occupations | +2.974 |
theless | +2.938 |
Neg logit contributions | |
zzle | -3.499 |
mble | -3.161 |
uers | -3.131 |
IRE | -3.027 |
reckoning | -2.724 |
Token | ig |
Token ID | 328 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
zzle | +9.241 |
uers | +7.190 |
IRE | +6.777 |
mble | +6.396 |
unci | +6.213 |
Neg logit contributions | |
ゴン | -17.373 |
practice | -16.616 |
theless | -16.437 |
Occupations | -16.331 |
adapt | -15.799 |
Token | dem |
Token ID | 9536 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
zzle | +5.914 |
mble | +5.335 |
uers | +5.271 |
IRE | +5.255 |
reckoning | +4.933 |
Neg logit contributions | |
enh | -3.848 |
practice | -3.805 |
adapt | -3.659 |
ゴン | -3.617 |
Occupations | -3.602 |
Token | ont |
Token ID | 756 |
Feature activation | -9.24e-01 |
Pos logit contributions | |
zzle | +1.690 |
mble | +1.535 |
IRE | +1.503 |
uers | +1.487 |
reckoning | +1.392 |
Neg logit contributions | |
enh | -1.485 |
practice | -1.443 |
adapt | -1.407 |
odor | -1.361 |
theless | -1.336 |
Token | and |
Token ID | 290 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
enh | +3.207 |
practice | +3.038 |
adapt | +2.983 |
theless | +2.943 |
bid | +2.934 |
Neg logit contributions | |
zzle | -4.372 |
mble | -4.178 |
uers | -4.065 |
IRE | -3.995 |
reckoning | -3.512 |
Token | his |
Token ID | 465 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
enh | +1.103 |
practice | +1.079 |
adapt | +1.050 |
theless | +1.045 |
Occupations | +1.044 |
Neg logit contributions | |
zzle | -1.225 |
mble | -1.100 |
uers | -1.085 |
IRE | -1.069 |
reckoning | -0.958 |
Token | , |
Token ID | 11 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
zzle | +7.407 |
IRE | +6.464 |
mble | +6.453 |
uers | +6.431 |
reckoning | +6.049 |
Neg logit contributions | |
practice | -6.999 |
enh | -6.931 |
adapt | -6.742 |
ゴン | -6.690 |
Occupations | -6.625 |
Token | one |
Token ID | 530 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
zzle | +6.248 |
mble | +5.579 |
uers | +5.483 |
IRE | +5.476 |
reckoning | +5.083 |
Neg logit contributions | |
enh | -5.318 |
practice | -5.260 |
adapt | -5.089 |
Occupations | -5.011 |
ゴン | -5.011 |
Token | of |
Token ID | 286 |
Feature activation | +6.25e-01 |
Pos logit contributions | |
zzle | +6.672 |
mble | +5.814 |
uers | +5.708 |
IRE | +5.696 |
reckoning | +5.216 |
Neg logit contributions | |
enh | -7.888 |
practice | -7.822 |
adapt | -7.606 |
ゴン | -7.525 |
Occupations | -7.506 |
Token | the |
Token ID | 262 |
Feature activation | -2.03e-02 |
Pos logit contributions | |
zzle | +2.726 |
mble | +2.435 |
IRE | +2.386 |
uers | +2.377 |
reckoning | +2.168 |
Neg logit contributions | |
enh | -2.579 |
practice | -2.545 |
adapt | -2.462 |
Occupations | -2.433 |
theless | -2.404 |
Token | most |
Token ID | 749 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
enh | +0.076 |
practice | +0.075 |
odor | +0.072 |
Occupations | +0.072 |
adapt | +0.071 |
Neg logit contributions | |
zzle | -0.095 |
mble | -0.086 |
IRE | -0.084 |
uers | -0.083 |
reckoning | -0.075 |
Token | vocal |
Token ID | 12435 |
Feature activation | +3.19e+00 |
Pos logit contributions | |
zzle | +5.223 |
mble | +4.675 |
uers | +4.579 |
IRE | +4.554 |
reckoning | +4.197 |
Neg logit contributions | |
enh | -4.538 |
practice | -4.481 |
adapt | -4.331 |
Occupations | -4.263 |
ゴン | -4.241 |
Token | # |
Token ID | 1303 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
zzle | +12.285 |
uers | +10.643 |
IRE | +10.473 |
mble | +10.427 |
reckoning | +10.081 |
Neg logit contributions | |
ゴン | -12.706 |
enh | -12.632 |
practice | -12.578 |
adapt | -12.398 |
theless | -11.777 |
Token | Never |
Token ID | 12295 |
Feature activation | -3.95e-01 |
Pos logit contributions | |
zzle | +3.512 |
mble | +3.038 |
IRE | +2.935 |
uers | +2.935 |
reckoning | +2.659 |
Neg logit contributions | |
enh | -5.041 |
practice | -5.004 |
adapt | -4.874 |
ゴン | -4.778 |
Occupations | -4.772 |
Token | Trump |
Token ID | 6170 |
Feature activation | +7.76e-01 |
Pos logit contributions | |
practice | +1.422 |
enh | +1.405 |
adapt | +1.357 |
odor | +1.303 |
bid | +1.292 |
Neg logit contributions | |
zzle | -1.915 |
mble | -1.839 |
uers | -1.708 |
IRE | -1.669 |
reckoning | -1.594 |
Token | ers |
Token ID | 364 |
Feature activation | +2.12e+00 |
Pos logit contributions | |
zzle | +3.282 |
mble | +2.922 |
IRE | +2.849 |
uers | +2.823 |
reckoning | +2.606 |
Neg logit contributions | |
enh | -3.308 |
practice | -3.253 |
adapt | -3.162 |
Occupations | -3.128 |
odor | -3.088 |
Token | of |
Token ID | 286 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
zzle | +8.803 |
mble | +7.609 |
IRE | +7.516 |
uers | +7.508 |
reckoning | +7.087 |
Neg logit contributions | |
enh | -8.814 |
practice | -8.762 |
adapt | -8.515 |
ゴン | -8.472 |
Occupations | -8.373 |
Token | kitten |
Token ID | 42143 |
Feature activation | -5.14e-02 |
Pos logit contributions | |
zzle | +0.918 |
mble | +0.822 |
uers | +0.809 |
IRE | +0.809 |
reckoning | +0.732 |
Neg logit contributions | |
enh | -0.731 |
practice | -0.722 |
adapt | -0.698 |
Occupations | -0.682 |
odor | -0.671 |
Token | . |
Token ID | 13 |
Feature activation | -7.01e-01 |
Pos logit contributions | |
enh | +0.199 |
practice | +0.198 |
adapt | +0.192 |
Occupations | +0.183 |
Provided | +0.182 |
Neg logit contributions | |
zzle | -0.233 |
mble | -0.212 |
IRE | -0.207 |
uers | -0.205 |
reckoning | -0.189 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +9.98e-01 |
Pos logit contributions | |
enh | +2.063 |
practice | +1.995 |
adapt | +1.985 |
Provided | +1.960 |
Occupations | +1.904 |
Neg logit contributions | |
zzle | -3.827 |
mble | -3.534 |
uers | -3.447 |
IRE | -3.400 |
reckoning | -3.248 |
Token | In |
Token ID | 818 |
Feature activation | +6.97e-01 |
Pos logit contributions | |
zzle | +4.632 |
mble | +4.175 |
uers | +4.070 |
IRE | +4.025 |
reckoning | +3.817 |
Neg logit contributions | |
enh | -3.871 |
practice | -3.823 |
adapt | -3.701 |
ゴン | -3.591 |
Occupations | -3.581 |
Token | this |
Token ID | 428 |
Feature activation | +1.76e-01 |
Pos logit contributions | |
zzle | +3.136 |
mble | +2.795 |
IRE | +2.743 |
uers | +2.731 |
reckoning | +2.511 |
Neg logit contributions | |
enh | -2.803 |
practice | -2.795 |
adapt | -2.709 |
Occupations | -2.647 |
ゴン | -2.610 |
Token | inaugural |
Token ID | 26851 |
Feature activation | +3.19e+00 |
Pos logit contributions | |
zzle | +0.757 |
mble | +0.667 |
IRE | +0.650 |
uers | +0.649 |
unci | +0.583 |
Neg logit contributions | |
enh | -0.738 |
practice | -0.732 |
Occupations | -0.708 |
adapt | -0.708 |
Provided | -0.680 |
Token | episode |
Token ID | 4471 |
Feature activation | +2.21e-01 |
Pos logit contributions | |
zzle | +13.547 |
mble | +12.126 |
IRE | +12.076 |
uers | +11.898 |
reckoning | +11.532 |
Neg logit contributions | |
enh | -11.295 |
practice | -11.159 |
ゴン | -11.012 |
adapt | -10.863 |
theless | -10.566 |
Token | of |
Token ID | 286 |
Feature activation | +7.30e-01 |
Pos logit contributions | |
zzle | +0.805 |
mble | +0.688 |
uers | +0.681 |
IRE | +0.668 |
reckoning | +0.608 |
Neg logit contributions | |
enh | -1.061 |
practice | -1.045 |
adapt | -1.030 |
Occupations | -1.019 |
ゴン | -1.015 |
Token | the |
Token ID | 262 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
zzle | +3.575 |
mble | +3.203 |
uers | +3.158 |
IRE | +3.138 |
reckoning | +2.905 |
Neg logit contributions | |
enh | -2.640 |
practice | -2.612 |
adapt | -2.530 |
Occupations | -2.512 |
ゴン | -2.460 |
Token | Nov |
Token ID | 5267 |
Feature activation | -6.35e-01 |
Pos logit contributions | |
enh | +0.504 |
practice | +0.493 |
Occupations | +0.479 |
adapt | +0.477 |
theless | +0.473 |
Neg logit contributions | |
zzle | -0.665 |
mble | -0.591 |
uers | -0.583 |
IRE | -0.577 |
reckoning | -0.524 |
Token | ice |
Token ID | 501 |
Feature activation | +6.31e-01 |
Pos logit contributions | |
enh | +2.265 |
practice | +2.227 |
adapt | +2.154 |
odor | +2.118 |
abil | +2.092 |
Neg logit contributions | |
zzle | -2.991 |
mble | -2.718 |
IRE | -2.680 |
uers | -2.612 |
reckoning | -2.524 |
Token | has |
Token ID | 468 |
Feature activation | +1.90e-01 |
Pos logit contributions | |
zzle | +3.256 |
mble | +2.928 |
uers | +2.876 |
IRE | +2.857 |
reckoning | +2.650 |
Neg logit contributions | |
enh | -2.652 |
practice | -2.613 |
adapt | -2.509 |
Occupations | -2.492 |
odor | -2.437 |
Token | been |
Token ID | 587 |
Feature activation | -3.28e-01 |
Pos logit contributions | |
zzle | +0.838 |
mble | +0.750 |
uers | +0.742 |
IRE | +0.734 |
reckoning | +0.670 |
Neg logit contributions | |
enh | -0.771 |
practice | -0.753 |
Occupations | -0.720 |
adapt | -0.715 |
odor | -0.715 |
Token | chosen |
Token ID | 7147 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
enh | +1.416 |
practice | +1.372 |
adapt | +1.321 |
Occupations | +1.295 |
odor | +1.293 |
Neg logit contributions | |
zzle | -1.338 |
mble | -1.242 |
uers | -1.192 |
IRE | -1.177 |
reckoning | -1.055 |
Token | as |
Token ID | 355 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
enh | +0.973 |
practice | +0.945 |
adapt | +0.918 |
theless | +0.898 |
Occupations | +0.898 |
Neg logit contributions | |
zzle | -1.405 |
IRE | -1.267 |
mble | -1.267 |
uers | -1.262 |
reckoning | -1.145 |
Token | a |
Token ID | 257 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
zzle | +1.560 |
mble | +1.368 |
IRE | +1.367 |
uers | +1.358 |
reckoning | +1.227 |
Neg logit contributions | |
enh | -1.578 |
practice | -1.571 |
adapt | -1.515 |
Occupations | -1.485 |
theless | -1.471 |
Token | ur |
Token ID | 2956 |
Feature activation | +3.18e+00 |
Pos logit contributions | |
zzle | +1.023 |
IRE | +0.914 |
mble | +0.911 |
uers | +0.903 |
reckoning | +0.810 |
Neg logit contributions | |
enh | -0.910 |
practice | -0.905 |
adapt | -0.861 |
theless | -0.846 |
Occupations | -0.845 |
Token | inal |
Token ID | 1292 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
zzle | +11.772 |
mble | +10.478 |
uers | +9.674 |
IRE | +9.429 |
reckoning | +8.994 |
Neg logit contributions | |
ゴン | -13.416 |
practice | -13.316 |
Occupations | -13.200 |
enh | -12.973 |
theless | -12.973 |
Token | . |
Token ID | 13 |
Feature activation | -7.42e-02 |
Pos logit contributions | |
zzle | +5.396 |
mble | +4.826 |
IRE | +4.751 |
uers | +4.735 |
reckoning | +4.370 |
Neg logit contributions | |
enh | -4.851 |
practice | -4.799 |
adapt | -4.635 |
Occupations | -4.556 |
ゴン | -4.547 |
Token | Pretty |
Token ID | 20090 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
enh | +0.220 |
practice | +0.218 |
Occupations | +0.217 |
Provided | +0.209 |
adapt | +0.206 |
Neg logit contributions | |
zzle | -0.408 |
mble | -0.383 |
uers | -0.369 |
IRE | -0.363 |
reckoning | -0.347 |
Token | much |
Token ID | 881 |
Feature activation | -3.85e-02 |
Pos logit contributions | |
zzle | +1.484 |
mble | +1.341 |
uers | +1.323 |
IRE | +1.308 |
reckoning | +1.189 |
Neg logit contributions | |
enh | -1.199 |
practice | -1.191 |
adapt | -1.145 |
Occupations | -1.126 |
odor | -1.117 |
Token | every |
Token ID | 790 |
Feature activation | +7.72e-01 |
Pos logit contributions | |
enh | +0.152 |
practice | +0.151 |
Occupations | +0.146 |
theless | +0.143 |
odor | +0.142 |
Neg logit contributions | |
zzle | -0.169 |
mble | -0.157 |
uers | -0.154 |
IRE | -0.149 |
unci | -0.135 |
Token | for |
Token ID | 329 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
practice | +1.743 |
enh | +1.726 |
adapt | +1.695 |
odor | +1.607 |
bid | +1.599 |
Neg logit contributions | |
zzle | -1.872 |
mble | -1.671 |
uers | -1.661 |
IRE | -1.617 |
unci | -1.468 |
Token | Fox |
Token ID | 5426 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
zzle | +0.636 |
mble | +0.560 |
uers | +0.557 |
IRE | +0.556 |
reckoning | +0.498 |
Neg logit contributions | |
practice | -0.611 |
enh | -0.597 |
adapt | -0.583 |
odor | -0.574 |
Occupations | -0.573 |
Token | News |
Token ID | 3000 |
Feature activation | +6.00e-01 |
Pos logit contributions | |
zzle | +1.771 |
mble | +1.620 |
IRE | +1.600 |
uers | +1.576 |
reckoning | +1.464 |
Neg logit contributions | |
enh | -1.228 |
practice | -1.200 |
adapt | -1.138 |
Occupations | -1.135 |
ゴン | -1.125 |
Token | . |
Token ID | 13 |
Feature activation | +6.81e-02 |
Pos logit contributions | |
zzle | +2.709 |
mble | +2.414 |
IRE | +2.377 |
uers | +2.373 |
reckoning | +2.159 |
Neg logit contributions | |
enh | -2.373 |
practice | -2.363 |
adapt | -2.263 |
Occupations | -2.238 |
ゴン | -2.229 |
Token | The |
Token ID | 383 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
zzle | +0.373 |
mble | +0.344 |
uers | +0.338 |
IRE | +0.330 |
reckoning | +0.314 |
Neg logit contributions | |
enh | -0.205 |
practice | -0.203 |
Occupations | -0.196 |
adapt | -0.195 |
Provided | -0.194 |
Token | First |
Token ID | 3274 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
enh | +0.441 |
practice | +0.440 |
odor | +0.427 |
Occupations | +0.422 |
adapt | +0.420 |
Neg logit contributions | |
zzle | -0.558 |
mble | -0.501 |
uers | -0.496 |
IRE | -0.492 |
unci | -0.444 |
Token | Family |
Token ID | 7884 |
Feature activation | +7.50e-01 |
Pos logit contributions | |
zzle | +11.638 |
IRE | +10.124 |
mble | +9.967 |
uers | +9.905 |
respectively | +9.283 |
Neg logit contributions | |
practice | -12.675 |
enh | -12.533 |
adapt | -12.357 |
ゴン | -12.186 |
theless | -12.108 |
Token | would |
Token ID | 561 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
zzle | +3.275 |
mble | +2.935 |
uers | +2.881 |
IRE | +2.860 |
reckoning | +2.599 |
Neg logit contributions | |
enh | -3.083 |
practice | -3.052 |
Occupations | -2.932 |
adapt | -2.929 |
theless | -2.893 |
Token | have |
Token ID | 423 |
Feature activation | +9.90e-01 |
Pos logit contributions | |
zzle | +7.746 |
mble | +6.703 |
uers | +6.594 |
IRE | +6.556 |
reckoning | +6.044 |
Neg logit contributions | |
enh | -9.175 |
practice | -9.077 |
ゴン | -8.894 |
adapt | -8.851 |
Occupations | -8.798 |
Token | been |
Token ID | 587 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
zzle | +4.364 |
mble | +3.907 |
uers | +3.842 |
IRE | +3.821 |
reckoning | +3.497 |
Neg logit contributions | |
enh | -4.012 |
practice | -3.970 |
adapt | -3.835 |
theless | -3.780 |
Occupations | -3.778 |
Token | denounced |
Token ID | 26443 |
Feature activation | -5.01e-01 |
Pos logit contributions | |
zzle | +5.113 |
mble | +4.531 |
uers | +4.423 |
IRE | +4.414 |
reckoning | +4.022 |
Neg logit contributions | |
enh | -5.534 |
practice | -5.478 |
adapt | -5.311 |
Occupations | -5.231 |
ゴン | -5.230 |
Token | The |
Token ID | 464 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
zzle | +2.266 |
mble | +2.061 |
uers | +1.978 |
IRE | +1.920 |
reckoning | +1.865 |
Neg logit contributions | |
enh | -1.917 |
practice | -1.897 |
adapt | -1.869 |
odor | -1.780 |
ゴン | -1.769 |
Token | final |
Token ID | 2457 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
enh | +0.891 |
practice | +0.874 |
adapt | +0.870 |
odor | +0.869 |
theless | +0.853 |
Neg logit contributions | |
zzle | -1.121 |
mble | -1.008 |
uers | -0.986 |
IRE | -0.978 |
unci | -0.883 |
Token | pages |
Token ID | 5468 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
zzle | +6.193 |
mble | +5.512 |
uers | +5.400 |
IRE | +5.384 |
reckoning | +4.959 |
Neg logit contributions | |
enh | -5.780 |
practice | -5.724 |
adapt | -5.560 |
Occupations | -5.473 |
ゴン | -5.471 |
Token | of |
Token ID | 286 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
zzle | +3.850 |
mble | +3.290 |
uers | +3.212 |
IRE | +3.205 |
reckoning | +2.877 |
Neg logit contributions | |
enh | -5.832 |
practice | -5.782 |
adapt | -5.651 |
ゴン | -5.573 |
Occupations | -5.570 |
Token | the |
Token ID | 262 |
Feature activation | +5.03e-01 |
Pos logit contributions | |
zzle | +5.808 |
mble | +5.096 |
IRE | +5.012 |
uers | +5.011 |
reckoning | +4.618 |
Neg logit contributions | |
enh | -6.276 |
practice | -6.217 |
adapt | -6.025 |
ゴン | -5.977 |
Occupations | -5.945 |
Token | opening |
Token ID | 4756 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
zzle | +2.434 |
mble | +2.202 |
uers | +2.157 |
IRE | +2.125 |
reckoning | +1.953 |
Neg logit contributions | |
enh | -1.826 |
practice | -1.791 |
adapt | -1.771 |
theless | -1.733 |
Occupations | -1.718 |
Token | issue |
Token ID | 2071 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
zzle | +12.616 |
IRE | +11.098 |
mble | +10.864 |
uers | +10.850 |
reckoning | +10.485 |
Neg logit contributions | |
enh | -12.376 |
practice | -12.302 |
ゴン | -12.067 |
adapt | -11.816 |
Occupations | -11.572 |
Token | of |
Token ID | 286 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
zzle | +5.252 |
mble | +4.656 |
uers | +4.573 |
IRE | +4.569 |
reckoning | +4.213 |
Neg logit contributions | |
enh | -5.103 |
practice | -5.048 |
adapt | -4.906 |
Occupations | -4.825 |
ゴン | -4.810 |
Token | the |
Token ID | 262 |
Feature activation | +3.40e-01 |
Pos logit contributions | |
zzle | +4.552 |
mble | +3.994 |
uers | +3.923 |
IRE | +3.911 |
reckoning | +3.595 |
Neg logit contributions | |
enh | -4.952 |
practice | -4.908 |
adapt | -4.772 |
ゴン | -4.713 |
Occupations | -4.705 |
Token | series |
Token ID | 2168 |
Feature activation | +4.84e-01 |
Pos logit contributions | |
zzle | +1.640 |
mble | +1.476 |
uers | +1.452 |
IRE | +1.427 |
reckoning | +1.311 |
Neg logit contributions | |
enh | -1.246 |
practice | -1.217 |
adapt | -1.203 |
theless | -1.178 |
Occupations | -1.170 |
Token | sent |
Token ID | 1908 |
Feature activation | +8.08e-01 |
Pos logit contributions | |
zzle | +2.128 |
mble | +1.908 |
IRE | +1.871 |
uers | +1.869 |
reckoning | +1.711 |
Neg logit contributions | |
enh | -1.963 |
practice | -1.926 |
adapt | -1.891 |
theless | -1.840 |
Occupations | -1.834 |
Token | option |
Token ID | 3038 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
zzle | +1.800 |
mble | +1.627 |
uers | +1.602 |
IRE | +1.571 |
reckoning | +1.442 |
Neg logit contributions | |
enh | -1.526 |
practice | -1.498 |
adapt | -1.453 |
Occupations | -1.441 |
ゴン | -1.424 |
Token | � |
Token ID | 447 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
zzle | +4.937 |
mble | +4.417 |
uers | +4.345 |
IRE | +4.331 |
reckoning | +4.019 |
Neg logit contributions | |
enh | -4.176 |
practice | -4.119 |
adapt | -3.990 |
Occupations | -3.925 |
ゴン | -3.918 |
Token | � |
Token ID | 247 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
zzle | +1.023 |
mble | +0.940 |
uers | +0.899 |
IRE | +0.888 |
reckoning | +0.867 |
Neg logit contributions | |
enh | -0.717 |
practice | -0.708 |
adapt | -0.672 |
Occupations | -0.670 |
ゴン | -0.657 |
Token | adopted |
Token ID | 8197 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
zzle | +2.518 |
mble | +2.256 |
uers | +2.224 |
IRE | +2.203 |
reckoning | +2.037 |
Neg logit contributions | |
enh | -2.217 |
practice | -2.175 |
adapt | -2.112 |
theless | -2.067 |
Occupations | -2.061 |
Token | by |
Token ID | 416 |
Feature activation | +4.97e-01 |
Pos logit contributions | |
zzle | +0.548 |
mble | +0.501 |
IRE | +0.492 |
uers | +0.488 |
reckoning | +0.450 |
Neg logit contributions | |
enh | -0.360 |
practice | -0.355 |
adapt | -0.346 |
theless | -0.338 |
Occupations | -0.332 |
Token | Pu |
Token ID | 11634 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
zzle | +2.200 |
mble | +1.956 |
uers | +1.910 |
IRE | +1.899 |
reckoning | +1.745 |
Neg logit contributions | |
enh | -2.015 |
practice | -1.990 |
Occupations | -1.936 |
adapt | -1.933 |
theless | -1.911 |
Token | ig |
Token ID | 328 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
zzle | +9.149 |
uers | +7.374 |
IRE | +6.940 |
mble | +6.543 |
unci | +6.282 |
Neg logit contributions | |
ゴン | -16.484 |
practice | -15.834 |
theless | -15.695 |
Occupations | -15.498 |
adapt | -15.100 |
Token | dem |
Token ID | 9536 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
zzle | +6.027 |
mble | +5.448 |
uers | +5.370 |
IRE | +5.365 |
reckoning | +5.036 |
Neg logit contributions | |
enh | -3.884 |
practice | -3.837 |
adapt | -3.690 |
ゴン | -3.628 |
Occupations | -3.616 |
Token | ont |
Token ID | 756 |
Feature activation | -8.13e-01 |
Pos logit contributions | |
zzle | +1.872 |
mble | +1.692 |
IRE | +1.661 |
uers | +1.642 |
reckoning | +1.537 |
Neg logit contributions | |
enh | -1.654 |
practice | -1.606 |
adapt | -1.566 |
odor | -1.514 |
theless | -1.490 |
Token | and |
Token ID | 290 |
Feature activation | -2.77e-01 |
Pos logit contributions | |
enh | +3.013 |
practice | +2.829 |
theless | +2.784 |
adapt | +2.770 |
Occupations | +2.724 |
Neg logit contributions | |
zzle | -3.740 |
mble | -3.467 |
IRE | -3.342 |
uers | -3.317 |
reckoning | -2.954 |
Token | his |
Token ID | 465 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
enh | +0.991 |
practice | +0.959 |
Occupations | +0.949 |
adapt | +0.941 |
theless | +0.936 |
Neg logit contributions | |
zzle | -1.344 |
mble | -1.209 |
uers | -1.166 |
IRE | -1.156 |
reckoning | -1.075 |
Token | eliminated |
Token ID | 15254 |
Feature activation | +6.88e-01 |
Pos logit contributions | |
zzle | +1.255 |
mble | +1.119 |
uers | +1.079 |
IRE | +1.078 |
reckoning | +0.999 |
Neg logit contributions | |
enh | -1.426 |
practice | -1.388 |
adapt | -1.353 |
Occupations | -1.323 |
theless | -1.319 |
Token | via |
Token ID | 2884 |
Feature activation | +4.31e-01 |
Pos logit contributions | |
zzle | +2.891 |
mble | +2.550 |
uers | +2.508 |
IRE | +2.502 |
reckoning | +2.310 |
Neg logit contributions | |
enh | -2.902 |
practice | -2.876 |
adapt | -2.788 |
ゴン | -2.758 |
Occupations | -2.750 |
Token | optics |
Token ID | 36237 |
Feature activation | +6.07e-03 |
Pos logit contributions | |
zzle | +2.743 |
mble | +2.564 |
uers | +2.520 |
IRE | +2.511 |
reckoning | +2.374 |
Neg logit contributions | |
enh | -0.896 |
practice | -0.873 |
adapt | -0.843 |
theless | -0.778 |
Occupations | -0.772 |
Token | and |
Token ID | 290 |
Feature activation | +4.07e-01 |
Pos logit contributions | |
zzle | +0.029 |
mble | +0.027 |
uers | +0.025 |
IRE | +0.025 |
reckoning | +0.024 |
Neg logit contributions | |
enh | -0.023 |
practice | -0.022 |
adapt | -0.022 |
Provided | -0.021 |
odor | -0.021 |
Token | i |
Token ID | 1312 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
zzle | +1.613 |
mble | +1.468 |
uers | +1.412 |
IRE | +1.392 |
reckoning | +1.255 |
Neg logit contributions | |
enh | -1.809 |
practice | -1.805 |
adapt | -1.762 |
Occupations | -1.703 |
theless | -1.688 |
Token | 'd |
Token ID | 1549 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
zzle | +4.119 |
mble | +3.311 |
uers | +3.294 |
IRE | +3.269 |
reckoning | +2.852 |
Neg logit contributions | |
enh | -8.023 |
practice | -7.944 |
ゴン | -7.860 |
adapt | -7.786 |
Occupations | -7.776 |
Token | hope |
Token ID | 2911 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
zzle | +5.113 |
uers | +3.497 |
mble | +3.413 |
hoping | +3.354 |
IRE | +3.309 |
Neg logit contributions | |
ゴン | -20.453 |
Occupations | -19.490 |
theless | -19.170 |
adapt | -19.121 |
practice | -18.752 |
Token | that |
Token ID | 326 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
zzle | +4.478 |
mble | +3.854 |
uers | +3.806 |
IRE | +3.794 |
reckoning | +3.466 |
Neg logit contributions | |
enh | -5.608 |
practice | -5.558 |
adapt | -5.417 |
ゴン | -5.389 |
Occupations | -5.358 |
Token | a |
Token ID | 257 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
zzle | +4.544 |
mble | +3.939 |
uers | +3.876 |
IRE | +3.867 |
reckoning | +3.541 |
Neg logit contributions | |
enh | -5.502 |
practice | -5.454 |
adapt | -5.303 |
ゴン | -5.270 |
Occupations | -5.245 |
Token | com |
Token ID | 401 |
Feature activation | -5.25e-01 |
Pos logit contributions | |
zzle | +5.501 |
uers | +4.465 |
IRE | +4.377 |
mble | +4.331 |
reckoning | +4.097 |
Neg logit contributions | |
enh | -10.616 |
practice | -10.516 |
ゴン | -10.493 |
Occupations | -10.361 |
theless | -10.330 |
Token | er |
Token ID | 263 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
enh | +1.724 |
adapt | +1.645 |
practice | +1.619 |
odor | +1.533 |
abil | +1.510 |
Neg logit contributions | |
zzle | -2.675 |
mble | -2.562 |
IRE | -2.469 |
millenn | -2.340 |
uers | -2.340 |
Token | I |
Token ID | 314 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
enh | +1.632 |
practice | +1.561 |
Occupations | +1.550 |
adapt | +1.538 |
odor | +1.510 |
Neg logit contributions | |
zzle | -1.761 |
IRE | -1.573 |
mble | -1.568 |
uers | -1.529 |
unci | -1.364 |
Token | think |
Token ID | 892 |
Feature activation | +8.30e-01 |
Pos logit contributions | |
zzle | +1.256 |
mble | +1.130 |
IRE | +1.090 |
uers | +1.087 |
reckoning | +0.977 |
Neg logit contributions | |
enh | -1.459 |
practice | -1.438 |
adapt | -1.400 |
theless | -1.378 |
bid | -1.356 |
Token | even |
Token ID | 772 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
zzle | +3.504 |
mble | +3.089 |
IRE | +3.042 |
uers | +3.036 |
reckoning | +2.773 |
Neg logit contributions | |
enh | -3.551 |
practice | -3.480 |
adapt | -3.402 |
Occupations | -3.360 |
theless | -3.296 |
Token | the |
Token ID | 262 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
enh | +0.674 |
practice | +0.651 |
adapt | +0.645 |
Occupations | +0.634 |
odor | +0.628 |
Neg logit contributions | |
zzle | -0.766 |
mble | -0.684 |
IRE | -0.672 |
uers | -0.662 |
reckoning | -0.594 |
Token | most |
Token ID | 749 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
enh | +1.732 |
practice | +1.671 |
adapt | +1.641 |
odor | +1.636 |
Occupations | +1.604 |
Neg logit contributions | |
zzle | -2.167 |
mble | -1.926 |
IRE | -1.909 |
uers | -1.853 |
unci | -1.697 |
Token | shameless |
Token ID | 41564 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
zzle | +6.034 |
mble | +5.368 |
uers | +5.279 |
IRE | +5.271 |
reckoning | +4.873 |
Neg logit contributions | |
enh | -5.265 |
practice | -5.196 |
adapt | -5.045 |
Occupations | -4.937 |
ゴン | -4.935 |
Token | per |
Token ID | 583 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
zzle | +13.593 |
mble | +12.183 |
uers | +11.926 |
IRE | +11.608 |
reckoning | +11.199 |
Neg logit contributions | |
practice | -11.159 |
ゴン | -11.145 |
enh | -10.850 |
theless | -10.547 |
adapt | -10.456 |
Token | vert |
Token ID | 1851 |
Feature activation | +8.74e-01 |
Pos logit contributions | |
zzle | +5.158 |
mble | +4.460 |
uers | +4.374 |
IRE | +4.334 |
reckoning | +3.953 |
Neg logit contributions | |
enh | -6.677 |
practice | -6.629 |
adapt | -6.443 |
ゴン | -6.416 |
Occupations | -6.386 |
Token | would |
Token ID | 561 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
zzle | +3.632 |
mble | +3.232 |
IRE | +3.182 |
uers | +3.182 |
reckoning | +2.896 |
Neg logit contributions | |
enh | -3.782 |
practice | -3.692 |
adapt | -3.621 |
Occupations | -3.537 |
odor | -3.504 |
Token | find |
Token ID | 1064 |
Feature activation | +9.89e-02 |
Pos logit contributions | |
zzle | +7.587 |
mble | +6.579 |
uers | +6.487 |
IRE | +6.432 |
reckoning | +5.974 |
Neg logit contributions | |
enh | -8.753 |
practice | -8.684 |
ゴン | -8.559 |
Occupations | -8.432 |
adapt | -8.428 |
Token | it |
Token ID | 340 |
Feature activation | -4.93e-01 |
Pos logit contributions | |
zzle | +0.412 |
IRE | +0.364 |
mble | +0.363 |
uers | +0.355 |
reckoning | +0.320 |
Neg logit contributions | |
enh | -0.432 |
practice | -0.419 |
adapt | -0.410 |
Occupations | -0.408 |
odor | -0.397 |
Token | both |
Token ID | 1111 |
Feature activation | -4.18e-01 |
Pos logit contributions | |
zzle | +0.636 |
mble | +0.566 |
uers | +0.555 |
IRE | +0.555 |
reckoning | +0.506 |
Neg logit contributions | |
enh | -0.573 |
practice | -0.564 |
adapt | -0.543 |
theless | -0.542 |
Occupations | -0.540 |
Token | Cull |
Token ID | 31289 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
enh | +1.508 |
practice | +1.473 |
theless | +1.434 |
Occupations | +1.418 |
adapt | +1.409 |
Neg logit contributions | |
zzle | -1.998 |
mble | -1.779 |
IRE | -1.754 |
uers | -1.744 |
reckoning | -1.601 |
Token | in |
Token ID | 259 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
zzle | +0.999 |
mble | +0.955 |
IRE | +0.925 |
uers | +0.922 |
reckoning | +0.883 |
Neg logit contributions | |
enh | -0.366 |
practice | -0.335 |
adapt | -0.324 |
odor | -0.301 |
bid | -0.284 |
Token | an |
Token ID | 272 |
Feature activation | -3.90e-02 |
Pos logit contributions | |
zzle | +0.613 |
mble | +0.582 |
IRE | +0.564 |
uers | +0.555 |
reckoning | +0.537 |
Neg logit contributions | |
enh | -0.279 |
practice | -0.269 |
adapt | -0.257 |
odor | -0.242 |
bid | -0.237 |
Token | and |
Token ID | 290 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
enh | +0.157 |
practice | +0.154 |
adapt | +0.149 |
ゴン | +0.148 |
Occupations | +0.147 |
Neg logit contributions | |
zzle | -0.173 |
mble | -0.154 |
IRE | -0.151 |
uers | -0.151 |
reckoning | -0.140 |
Token | Ru |
Token ID | 11667 |
Feature activation | +3.13e+00 |
Pos logit contributions | |
enh | +0.446 |
practice | +0.432 |
Occupations | +0.419 |
adapt | +0.418 |
theless | +0.415 |
Neg logit contributions | |
zzle | -0.587 |
mble | -0.518 |
uers | -0.512 |
IRE | -0.511 |
reckoning | -0.471 |
Token | iz |
Token ID | 528 |
Feature activation | -3.95e-01 |
Pos logit contributions | |
zzle | +12.329 |
uers | +10.010 |
IRE | +9.790 |
htar | +9.146 |
reckoning | +8.943 |
Neg logit contributions | |
ゴン | -13.681 |
theless | -13.242 |
Occupations | -12.574 |
practice | -12.466 |
enh | -12.059 |
Token | , |
Token ID | 11 |
Feature activation | +9.56e-01 |
Pos logit contributions | |
enh | +1.575 |
practice | +1.541 |
theless | +1.469 |
adapt | +1.467 |
Provided | +1.429 |
Neg logit contributions | |
zzle | -1.733 |
mble | -1.593 |
IRE | -1.532 |
uers | -1.526 |
reckoning | -1.405 |
Token | who |
Token ID | 508 |
Feature activation | -3.33e-01 |
Pos logit contributions | |
zzle | +3.888 |
mble | +3.429 |
IRE | +3.358 |
uers | +3.351 |
reckoning | +3.048 |
Neg logit contributions | |
enh | -4.221 |
practice | -4.170 |
adapt | -4.054 |
Occupations | -3.994 |
ゴン | -3.967 |
Token | had |
Token ID | 550 |
Feature activation | -9.34e-02 |
Pos logit contributions | |
enh | +1.271 |
practice | +1.270 |
adapt | +1.216 |
Occupations | +1.185 |
theless | +1.172 |
Neg logit contributions | |
zzle | -1.513 |
mble | -1.354 |
uers | -1.330 |
IRE | -1.328 |
reckoning | -1.226 |
Token | memor |
Token ID | 16181 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
enh | +0.364 |
practice | +0.363 |
adapt | +0.343 |
theless | +0.339 |
Occupations | +0.338 |
Neg logit contributions | |
zzle | -0.425 |
mble | -0.378 |
uers | -0.374 |
IRE | -0.372 |
reckoning | -0.338 |
Token | s |
Token ID | 82 |
Feature activation | +6.65e-01 |
Pos logit contributions | |
zzle | +2.626 |
mble | +2.418 |
IRE | +2.365 |
uers | +2.355 |
reckoning | +2.246 |
Neg logit contributions | |
enh | -1.454 |
practice | -1.434 |
adapt | -1.374 |
theless | -1.326 |
Occupations | -1.317 |
Token | President |
Token ID | 1992 |
Feature activation | +7.05e-01 |
Pos logit contributions | |
zzle | +2.943 |
mble | +2.590 |
uers | +2.556 |
IRE | +2.496 |
reckoning | +2.333 |
Neg logit contributions | |
enh | -2.695 |
practice | -2.678 |
Occupations | -2.598 |
adapt | -2.583 |
theless | -2.551 |
Token | , |
Token ID | 11 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
zzle | +3.390 |
mble | +3.016 |
uers | +2.987 |
IRE | +2.960 |
reckoning | +2.763 |
Neg logit contributions | |
enh | -2.628 |
practice | -2.560 |
adapt | -2.473 |
Occupations | -2.457 |
theless | -2.431 |
Token | Car |
Token ID | 1879 |
Feature activation | -3.56e-01 |
Pos logit contributions | |
zzle | +5.677 |
mble | +5.088 |
uers | +5.006 |
IRE | +4.976 |
reckoning | +4.633 |
Neg logit contributions | |
enh | -4.297 |
practice | -4.234 |
adapt | -4.094 |
Occupations | -4.034 |
ゴン | -3.992 |
Token | les |
Token ID | 829 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
enh | +1.614 |
practice | +1.569 |
adapt | +1.541 |
odor | +1.540 |
abil | +1.490 |
Neg logit contributions | |
zzle | -1.412 |
mble | -1.307 |
IRE | -1.235 |
uers | -1.176 |
reckoning | -1.089 |
Token | Pu |
Token ID | 11634 |
Feature activation | +3.11e+00 |
Pos logit contributions | |
enh | +3.439 |
practice | +3.355 |
Provided | +3.318 |
odor | +3.313 |
Occupations | +3.251 |
Neg logit contributions | |
zzle | -5.525 |
mble | -5.197 |
IRE | -4.844 |
uers | -4.605 |
igible | -4.305 |
Token | ig |
Token ID | 328 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
zzle | +7.896 |
IRE | +6.250 |
uers | +5.857 |
reckoning | +5.655 |
mble | +4.981 |
Neg logit contributions | |
ゴン | -17.519 |
practice | -17.124 |
theless | -16.824 |
Occupations | -16.358 |
adapt | -15.922 |
Token | dem |
Token ID | 9536 |
Feature activation | -2.26e-01 |
Pos logit contributions | |
zzle | +6.647 |
mble | +5.978 |
uers | +5.940 |
IRE | +5.910 |
reckoning | +5.545 |
Neg logit contributions | |
enh | -4.405 |
practice | -4.376 |
adapt | -4.196 |
ゴン | -4.161 |
Occupations | -4.134 |
Token | ont |
Token ID | 756 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
enh | +0.833 |
adapt | +0.766 |
practice | +0.751 |
odor | +0.722 |
theless | +0.716 |
Neg logit contributions | |
zzle | -1.128 |
mble | -1.037 |
IRE | -0.987 |
reckoning | -0.937 |
uers | -0.927 |
Token | , |
Token ID | 11 |
Feature activation | +6.66e-01 |
Pos logit contributions | |
enh | +1.356 |
practice | +1.268 |
adapt | +1.260 |
Provided | +1.228 |
theless | +1.225 |
Neg logit contributions | |
zzle | -1.862 |
mble | -1.711 |
uers | -1.676 |
IRE | -1.663 |
reckoning | -1.546 |
Token | announced |
Token ID | 3414 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
zzle | +2.954 |
mble | +2.651 |
uers | +2.593 |
IRE | +2.581 |
reckoning | +2.343 |
Neg logit contributions | |
enh | -2.716 |
practice | -2.670 |
adapt | -2.593 |
theless | -2.552 |
Occupations | -2.525 |
Token | transit |
Token ID | 11168 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
zzle | +0.212 |
uers | +0.189 |
mble | +0.189 |
IRE | +0.187 |
reckoning | +0.172 |
Neg logit contributions | |
enh | -0.184 |
practice | -0.179 |
Occupations | -0.175 |
adapt | -0.173 |
Provided | -0.169 |
Token | corridors |
Token ID | 32807 |
Feature activation | +9.67e-01 |
Pos logit contributions | |
enh | +0.400 |
practice | +0.384 |
adapt | +0.376 |
Occupations | +0.365 |
ゴン | +0.358 |
Neg logit contributions | |
zzle | -0.519 |
mble | -0.471 |
uers | -0.464 |
IRE | -0.456 |
reckoning | -0.424 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e-03 |
Pos logit contributions | |
zzle | +4.338 |
mble | +3.886 |
uers | +3.821 |
IRE | +3.799 |
reckoning | +3.522 |
Neg logit contributions | |
enh | -3.853 |
practice | -3.776 |
adapt | -3.668 |
ゴン | -3.613 |
Occupations | -3.613 |
Token | major |
Token ID | 1688 |
Feature activation | +3.50e-01 |
Pos logit contributions | |
enh | +0.039 |
practice | +0.038 |
adapt | +0.037 |
Occupations | +0.037 |
theless | +0.036 |
Neg logit contributions | |
zzle | -0.044 |
uers | -0.039 |
IRE | -0.039 |
mble | -0.039 |
reckoning | -0.035 |
Token | commercial |
Token ID | 5068 |
Feature activation | +6.93e-01 |
Pos logit contributions | |
zzle | +1.568 |
mble | +1.395 |
uers | +1.389 |
IRE | +1.381 |
reckoning | +1.251 |
Neg logit contributions | |
enh | -1.400 |
practice | -1.362 |
Occupations | -1.339 |
adapt | -1.322 |
theless | -1.297 |
Token | bou |
Token ID | 35833 |
Feature activation | +3.10e+00 |
Pos logit contributions | |
zzle | +3.404 |
mble | +3.082 |
uers | +3.048 |
IRE | +3.027 |
reckoning | +2.787 |
Neg logit contributions | |
enh | -2.490 |
practice | -2.435 |
adapt | -2.330 |
Occupations | -2.323 |
ゴン | -2.284 |
Token | lev |
Token ID | 2768 |
Feature activation | +7.83e-01 |
Pos logit contributions | |
zzle | +9.028 |
uers | +7.377 |
mble | +7.026 |
IRE | +6.839 |
reckoning | +6.250 |
Neg logit contributions | |
ゴン | -15.926 |
theless | -15.580 |
practice | -15.557 |
Occupations | -15.466 |
enh | -15.324 |
Token | ards |
Token ID | 1371 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
zzle | +3.831 |
mble | +3.462 |
IRE | +3.382 |
uers | +3.343 |
reckoning | +3.163 |
Neg logit contributions | |
enh | -2.817 |
practice | -2.776 |
adapt | -2.681 |
Occupations | -2.623 |
odor | -2.591 |
Token | . |
Token ID | 13 |
Feature activation | -1.51e-03 |
Pos logit contributions | |
zzle | +7.910 |
mble | +6.797 |
IRE | +6.763 |
uers | +6.717 |
reckoning | +6.214 |
Neg logit contributions | |
practice | -8.236 |
enh | -8.173 |
adapt | -7.987 |
theless | -7.955 |
ゴン | -7.929 |
Token | This |
Token ID | 770 |
Feature activation | +4.82e-01 |
Pos logit contributions | |
enh | +0.004 |
practice | +0.004 |
Occupations | +0.004 |
adapt | +0.004 |
Provided | +0.004 |
Neg logit contributions | |
zzle | -0.008 |
mble | -0.008 |
uers | -0.008 |
IRE | -0.008 |
reckoning | -0.007 |
Token | proposal |
Token ID | 6961 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
zzle | +1.994 |
mble | +1.765 |
uers | +1.730 |
IRE | +1.711 |
reckoning | +1.534 |
Neg logit contributions | |
enh | -2.103 |
practice | -2.077 |
adapt | -2.028 |
theless | -1.983 |
Occupations | -1.972 |
Token | - |
Token ID | 12 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
zzle | +4.911 |
mble | +4.363 |
IRE | +4.248 |
uers | +4.246 |
reckoning | +3.817 |
Neg logit contributions | |
enh | -5.288 |
practice | -5.257 |
adapt | -5.096 |
ゴン | -4.983 |
Occupations | -4.968 |
Token | minute |
Token ID | 11374 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
enh | +2.506 |
practice | +2.497 |
adapt | +2.367 |
odor | +2.235 |
bid | +2.209 |
Neg logit contributions | |
zzle | -5.819 |
mble | -5.785 |
IRE | -5.531 |
uers | -5.477 |
unci | -5.006 |
Token | marketing |
Token ID | 7124 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
zzle | +6.377 |
mble | +5.663 |
uers | +5.573 |
IRE | +5.562 |
reckoning | +5.157 |
Neg logit contributions | |
enh | -5.804 |
practice | -5.748 |
adapt | -5.566 |
ゴン | -5.497 |
Occupations | -5.482 |
Token | for |
Token ID | 329 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
zzle | +1.653 |
mble | +1.498 |
uers | +1.491 |
IRE | +1.491 |
reckoning | +1.314 |
Neg logit contributions | |
enh | -1.673 |
practice | -1.653 |
adapt | -1.600 |
Occupations | -1.532 |
ゴン | -1.522 |
Token | The |
Token ID | 383 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
zzle | +1.100 |
mble | +0.985 |
IRE | +0.975 |
uers | +0.969 |
reckoning | +0.879 |
Neg logit contributions | |
enh | -0.992 |
practice | -0.975 |
adapt | -0.956 |
Occupations | -0.937 |
odor | -0.934 |
Token | Pur |
Token ID | 9330 |
Feature activation | +3.09e+00 |
Pos logit contributions | |
zzle | +0.854 |
mble | +0.779 |
uers | +0.770 |
IRE | +0.766 |
reckoning | +0.710 |
Neg logit contributions | |
enh | -0.576 |
practice | -0.564 |
Occupations | -0.547 |
adapt | -0.546 |
odor | -0.546 |
Token | ge |
Token ID | 469 |
Feature activation | +7.71e-01 |
Pos logit contributions | |
zzle | +12.037 |
uers | +10.670 |
mble | +10.518 |
IRE | +9.992 |
unci | +9.136 |
Neg logit contributions | |
ゴン | -12.510 |
theless | -12.182 |
enh | -12.156 |
practice | -12.078 |
Occupations | -11.982 |
Token | : |
Token ID | 25 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
zzle | +3.548 |
mble | +3.191 |
uers | +3.133 |
IRE | +3.131 |
reckoning | +2.894 |
Neg logit contributions | |
enh | -2.976 |
practice | -2.921 |
adapt | -2.848 |
Occupations | -2.806 |
ゴン | -2.777 |
Token | Anarchy |
Token ID | 38899 |
Feature activation | +3.03e-01 |
Pos logit contributions | |
enh | +0.926 |
practice | +0.897 |
Occupations | +0.881 |
adapt | +0.880 |
Provided | +0.850 |
Neg logit contributions | |
zzle | -1.362 |
mble | -1.237 |
IRE | -1.218 |
uers | -1.195 |
reckoning | -1.125 |
Token | , |
Token ID | 11 |
Feature activation | +6.17e-01 |
Pos logit contributions | |
zzle | +1.455 |
mble | +1.316 |
uers | +1.299 |
IRE | +1.298 |
reckoning | +1.192 |
Neg logit contributions | |
enh | -1.111 |
practice | -1.076 |
adapt | -1.056 |
Occupations | -1.044 |
ゴン | -1.023 |
Token | now |
Token ID | 783 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
zzle | +2.785 |
mble | +2.501 |
uers | +2.462 |
IRE | +2.461 |
reckoning | +2.219 |
Neg logit contributions | |
enh | -2.466 |
practice | -2.403 |
adapt | -2.394 |
Occupations | -2.354 |
theless | -2.265 |
Token | a |
Token ID | 257 |
Feature activation | +3.92e-01 |
Pos logit contributions | |
enh | +0.309 |
practice | +0.305 |
adapt | +0.300 |
Occupations | +0.295 |
odor | +0.289 |
Neg logit contributions | |
zzle | -0.351 |
mble | -0.312 |
IRE | -0.311 |
uers | -0.308 |
reckoning | -0.274 |
Token | nutshell |
Token ID | 43875 |
Feature activation | +7.63e-01 |
Pos logit contributions | |
zzle | +1.507 |
mble | +1.310 |
uers | +1.293 |
IRE | +1.289 |
reckoning | +1.156 |
Neg logit contributions | |
enh | -1.798 |
practice | -1.787 |
adapt | -1.731 |
theless | -1.705 |
ゴン | -1.704 |
Token | . |
Token ID | 13 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
zzle | +3.304 |
mble | +2.929 |
uers | +2.886 |
IRE | +2.883 |
reckoning | +2.658 |
Neg logit contributions | |
enh | -3.150 |
practice | -3.116 |
adapt | -3.022 |
Occupations | -2.971 |
ゴン | -2.966 |
Token | Given |
Token ID | 11259 |
Feature activation | -5.14e-01 |
Pos logit contributions | |
enh | +0.961 |
practice | +0.951 |
Occupations | +0.932 |
adapt | +0.926 |
Provided | +0.920 |
Neg logit contributions | |
zzle | -1.828 |
mble | -1.701 |
uers | -1.660 |
IRE | -1.610 |
reckoning | -1.560 |
Token | the |
Token ID | 262 |
Feature activation | -8.32e-01 |
Pos logit contributions | |
enh | +1.992 |
practice | +1.973 |
adapt | +1.950 |
theless | +1.889 |
odor | +1.889 |
Neg logit contributions | |
zzle | -2.243 |
IRE | -1.990 |
uers | -1.966 |
mble | -1.947 |
reckoning | -1.827 |
Token | outp |
Token ID | 38701 |
Feature activation | +3.08e+00 |
Pos logit contributions | |
enh | +2.969 |
practice | +2.957 |
adapt | +2.906 |
Occupations | +2.833 |
odor | +2.821 |
Neg logit contributions | |
zzle | -3.791 |
mble | -3.393 |
IRE | -3.362 |
uers | -3.342 |
unci | -3.050 |
Token | ouring |
Token ID | 21823 |
Feature activation | +2.31e+00 |
Pos logit contributions | |
zzle | +8.970 |
uers | +7.633 |
mble | +7.223 |
IRE | +6.988 |
unci | +6.309 |
Neg logit contributions | |
ゴン | -16.375 |
Occupations | -15.497 |
theless | -15.375 |
practice | -15.272 |
enh | -15.174 |
Token | of |
Token ID | 286 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
zzle | +6.064 |
mble | +4.804 |
IRE | +4.719 |
uers | +4.684 |
reckoning | +4.086 |
Neg logit contributions | |
enh | -12.710 |
practice | -12.586 |
ゴン | -12.415 |
adapt | -12.341 |
Occupations | -12.204 |
Token | glowing |
Token ID | 21377 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
zzle | +6.720 |
mble | +5.986 |
uers | +5.898 |
IRE | +5.886 |
reckoning | +5.481 |
Neg logit contributions | |
enh | -5.738 |
practice | -5.680 |
adapt | -5.498 |
ゴン | -5.441 |
Occupations | -5.411 |
Token | praise |
Token ID | 13463 |
Feature activation | +7.26e-01 |
Pos logit contributions | |
zzle | +7.241 |
mble | +6.617 |
uers | +6.538 |
IRE | +6.528 |
reckoning | +6.175 |
Neg logit contributions | |
enh | -3.389 |
practice | -3.339 |
adapt | -3.181 |
ゴン | -3.119 |
Occupations | -3.108 |
Token | for |
Token ID | 329 |
Feature activation | +5.35e-02 |
Pos logit contributions | |
zzle | +3.267 |
mble | +2.937 |
uers | +2.892 |
IRE | +2.874 |
reckoning | +2.666 |
Neg logit contributions | |
enh | -2.865 |
practice | -2.807 |
adapt | -2.732 |
Occupations | -2.679 |
odor | -2.651 |
Token | implementing |
Token ID | 15427 |
Feature activation | +4.68e-02 |
Pos logit contributions | |
enh | +3.598 |
adapt | +3.427 |
practice | +3.411 |
theless | +3.299 |
Occupations | +3.289 |
Neg logit contributions | |
zzle | -3.566 |
IRE | -3.189 |
mble | -3.110 |
uers | -3.000 |
unci | -2.769 |
Token | a |
Token ID | 257 |
Feature activation | -9.91e-02 |
Pos logit contributions | |
zzle | +0.202 |
mble | +0.180 |
uers | +0.178 |
IRE | +0.175 |
reckoning | +0.161 |
Neg logit contributions | |
enh | -0.197 |
practice | -0.190 |
adapt | -0.186 |
Occupations | -0.183 |
theless | -0.179 |
Token | balanced |
Token ID | 12974 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
enh | +0.404 |
practice | +0.395 |
adapt | +0.384 |
theless | +0.378 |
Occupations | +0.373 |
Neg logit contributions | |
zzle | -0.434 |
mble | -0.388 |
uers | -0.380 |
IRE | -0.378 |
unci | -0.339 |
Token | yet |
Token ID | 1865 |
Feature activation | -7.24e-01 |
Pos logit contributions | |
enh | +0.435 |
practice | +0.425 |
adapt | +0.415 |
Occupations | +0.406 |
ゴン | +0.401 |
Neg logit contributions | |
zzle | -0.513 |
uers | -0.459 |
mble | -0.458 |
IRE | -0.452 |
unci | -0.407 |
Token | skill |
Token ID | 5032 |
Feature activation | -2.37e+00 |
Pos logit contributions | |
enh | +2.805 |
practice | +2.722 |
adapt | +2.715 |
theless | +2.580 |
odor | +2.560 |
Neg logit contributions | |
zzle | -3.245 |
mble | -2.857 |
uers | -2.839 |
IRE | -2.814 |
unci | -2.551 |
Token | - |
Token ID | 12 |
Feature activation | -4.07e+00 |
Pos logit contributions | |
enh | +7.984 |
adapt | +7.681 |
practice | +7.499 |
tested | +7.124 |
standard | +7.088 |
Neg logit contributions | |
zzle | -10.595 |
uers | -9.269 |
IRE | -9.233 |
mble | -9.207 |
unci | -8.413 |
Token | focused |
Token ID | 18143 |
Feature activation | +8.89e-01 |
Pos logit contributions | |
enh | +11.420 |
adapt | +9.926 |
practice | +9.789 |
tested | +9.332 |
standard | +8.934 |
Neg logit contributions | |
zzle | -18.932 |
mble | -17.234 |
IRE | -17.197 |
millenn | -16.813 |
uers | -16.609 |
Token | take |
Token ID | 1011 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
zzle | +4.327 |
mble | +3.885 |
uers | +3.846 |
IRE | +3.825 |
reckoning | +3.549 |
Neg logit contributions | |
enh | -3.218 |
practice | -3.162 |
adapt | -3.050 |
Occupations | -3.009 |
ゴン | -2.997 |
Token | on |
Token ID | 319 |
Feature activation | +3.97e-01 |
Pos logit contributions | |
zzle | +4.279 |
mble | +3.779 |
uers | +3.703 |
IRE | +3.697 |
reckoning | +3.415 |
Neg logit contributions | |
enh | -4.336 |
practice | -4.301 |
adapt | -4.174 |
Occupations | -4.108 |
ゴン | -4.102 |
Token | shooting |
Token ID | 4395 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
zzle | +1.747 |
mble | +1.549 |
uers | +1.523 |
IRE | +1.514 |
reckoning | +1.392 |
Neg logit contributions | |
enh | -1.638 |
practice | -1.614 |
adapt | -1.554 |
Occupations | -1.542 |
ゴン | -1.515 |
Token | specifically |
Token ID | 5734 |
Feature activation | -3.78e-01 |
Pos logit contributions | |
zzle | +0.740 |
mble | +0.673 |
uers | +0.658 |
IRE | +0.648 |
reckoning | +0.604 |
Neg logit contributions | |
enh | -0.621 |
practice | -0.611 |
adapt | -0.584 |
Occupations | -0.579 |
ゴン | -0.566 |
Token | effects |
Token ID | 3048 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
enh | +0.913 |
practice | +0.868 |
adapt | +0.858 |
Occupations | +0.829 |
ゴン | +0.807 |
Neg logit contributions | |
zzle | -1.386 |
mble | -1.262 |
IRE | -1.241 |
uers | -1.218 |
reckoning | -1.144 |
Token | that |
Token ID | 326 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
enh | +0.415 |
practice | +0.406 |
adapt | +0.392 |
Occupations | +0.382 |
theless | +0.380 |
Neg logit contributions | |
zzle | -0.469 |
mble | -0.426 |
uers | -0.418 |
IRE | -0.416 |
reckoning | -0.378 |
Token | we |
Token ID | 356 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
enh | +1.313 |
practice | +1.276 |
adapt | +1.253 |
theless | +1.222 |
Occupations | +1.208 |
Neg logit contributions | |
zzle | -1.305 |
mble | -1.159 |
IRE | -1.141 |
uers | -1.130 |
reckoning | -1.034 |
Token | were |
Token ID | 547 |
Feature activation | +9.71e-01 |
Pos logit contributions | |
enh | +0.738 |
practice | +0.712 |
adapt | +0.699 |
theless | +0.683 |
odor | +0.665 |
Neg logit contributions | |
zzle | -0.771 |
mble | -0.715 |
uers | -0.690 |
IRE | -0.689 |
reckoning | -0.625 |
Token | play |
Token ID | 711 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
zzle | +4.077 |
mble | +3.658 |
IRE | +3.587 |
uers | +3.567 |
reckoning | +3.194 |
Neg logit contributions | |
enh | -4.174 |
practice | -4.105 |
adapt | -3.973 |
Occupations | -3.886 |
theless | -3.863 |
Token | - |
Token ID | 12 |
Feature activation | -3.80e+00 |
Pos logit contributions | |
tested | +6.406 |
enh | +6.160 |
adapt | +6.017 |
practice | +5.991 |
standard | +5.412 |
Neg logit contributions | |
zzle | -14.163 |
IRE | -13.034 |
mble | -12.935 |
uers | -12.723 |
reckoning | -11.909 |
Token | testing |
Token ID | 33407 |
Feature activation | -3.97e-01 |
Pos logit contributions | |
tested | +7.738 |
enh | +7.608 |
practice | +7.260 |
adapt | +7.065 |
standard | +6.349 |
Neg logit contributions | |
zzle | -20.563 |
mble | -19.323 |
IRE | -19.127 |
uers | -19.033 |
reckoning | -17.848 |
Token | . |
Token ID | 13 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
enh | +1.476 |
practice | +1.442 |
adapt | +1.405 |
Occupations | +1.347 |
theless | +1.332 |
Neg logit contributions | |
zzle | -1.839 |
mble | -1.690 |
uers | -1.668 |
IRE | -1.652 |
reckoning | -1.516 |
Token | One |
Token ID | 1881 |
Feature activation | +6.37e-01 |
Pos logit contributions | |
enh | +1.318 |
practice | +1.287 |
Occupations | +1.287 |
Provided | +1.260 |
adapt | +1.254 |
Neg logit contributions | |
zzle | -2.562 |
mble | -2.418 |
uers | -2.342 |
IRE | -2.280 |
reckoning | -2.208 |
Token | was |
Token ID | 373 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
zzle | +2.960 |
mble | +2.671 |
uers | +2.642 |
IRE | +2.605 |
reckoning | +2.431 |
Neg logit contributions | |
enh | -2.440 |
practice | -2.395 |
adapt | -2.312 |
Occupations | -2.260 |
ゴン | -2.252 |
Token | a |
Token ID | 257 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
zzle | +0.737 |
mble | +0.664 |
uers | +0.656 |
IRE | +0.645 |
reckoning | +0.593 |
Neg logit contributions | |
enh | -0.702 |
practice | -0.687 |
adapt | -0.669 |
Occupations | -0.657 |
odor | -0.650 |
Token |
|
Token ID | 198 |
Feature activation | -9.63e-01 |
Pos logit contributions | |
enh | +3.510 |
practice | +3.489 |
adapt | +3.387 |
Occupations | +3.093 |
Provided | +3.041 |
Neg logit contributions | |
zzle | -9.559 |
mble | -9.479 |
millenn | -8.995 |
uers | -8.747 |
IRE | -8.543 |
Token |
|
Token ID | 198 |
Feature activation | -6.10e-01 |
Pos logit contributions | |
enh | +2.293 |
practice | +2.265 |
adapt | +2.204 |
bid | +1.971 |
odor | +1.960 |
Neg logit contributions | |
mble | -5.763 |
zzle | -5.733 |
millenn | -5.433 |
uers | -5.285 |
IRE | -5.135 |
Token | O |
Token ID | 46 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
practice | +2.141 |
enh | +2.137 |
adapt | +2.046 |
odor | +1.937 |
ゴン | +1.894 |
Neg logit contributions | |
zzle | -3.022 |
mble | -2.813 |
uers | -2.705 |
reckoning | -2.599 |
IRE | -2.529 |
Token | ka |
Token ID | 4914 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
zzle | +2.321 |
mble | +2.087 |
IRE | +2.071 |
uers | +2.050 |
reckoning | +1.931 |
Neg logit contributions | |
enh | -1.849 |
practice | -1.812 |
adapt | -1.743 |
odor | -1.712 |
ゴン | -1.705 |
Token | for |
Token ID | 1640 |
Feature activation | -7.35e-01 |
Pos logit contributions | |
zzle | +2.842 |
mble | +2.623 |
uers | +2.589 |
IRE | +2.587 |
reckoning | +2.462 |
Neg logit contributions | |
enh | -0.874 |
practice | -0.842 |
adapt | -0.797 |
Occupations | -0.760 |
ゴン | -0.749 |
Token | played |
Token ID | 2826 |
Feature activation | -3.70e+00 |
Pos logit contributions | |
enh | +2.652 |
practice | +2.553 |
adapt | +2.440 |
Occupations | +2.431 |
Provided | +2.378 |
Neg logit contributions | |
zzle | -3.518 |
mble | -3.225 |
uers | -3.121 |
IRE | -3.059 |
reckoning | -2.910 |
Token | one |
Token ID | 530 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
extensively | +10.386 |
practice | +10.345 |
enh | +10.087 |
firsthand | +9.649 |
standard | +9.297 |
Neg logit contributions | |
zzle | -15.536 |
mble | -13.784 |
uers | -13.757 |
IRE | -13.607 |
unci | -12.336 |
Token | season |
Token ID | 1622 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
practice | +1.540 |
enh | +1.524 |
adapt | +1.439 |
Occupations | +1.408 |
odor | +1.385 |
Neg logit contributions | |
zzle | -1.730 |
mble | -1.544 |
uers | -1.518 |
IRE | -1.455 |
reckoning | -1.364 |
Token | of |
Token ID | 286 |
Feature activation | -7.68e-01 |
Pos logit contributions | |
practice | +6.411 |
enh | +6.341 |
adapt | +6.222 |
firsthand | +5.920 |
bid | +5.862 |
Neg logit contributions | |
zzle | -8.392 |
mble | -7.579 |
uers | -7.360 |
IRE | -7.238 |
reckoning | -6.575 |
Token | college |
Token ID | 4152 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
enh | +2.662 |
practice | +2.649 |
adapt | +2.527 |
Occupations | +2.482 |
odor | +2.419 |
Neg logit contributions | |
zzle | -3.774 |
mble | -3.328 |
uers | -3.324 |
IRE | -3.307 |
htar | -3.014 |
Token | basketball |
Token ID | 9669 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
practice | +4.042 |
enh | +4.038 |
adapt | +3.796 |
Occupations | +3.610 |
firsthand | +3.595 |
Neg logit contributions | |
zzle | -6.574 |
mble | -5.888 |
uers | -5.821 |
IRE | -5.788 |
htar | -5.267 |
Token | liver |
Token ID | 14383 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
enh | +0.921 |
practice | +0.919 |
adapt | +0.866 |
odor | +0.859 |
Occupations | +0.843 |
Neg logit contributions | |
zzle | -1.287 |
mble | -1.165 |
uers | -1.156 |
IRE | -1.142 |
unci | -1.040 |
Token | disease |
Token ID | 4369 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
enh | +3.245 |
practice | +3.158 |
adapt | +3.063 |
odor | +2.947 |
bid | +2.943 |
Neg logit contributions | |
zzle | -5.219 |
mble | -4.866 |
uers | -4.678 |
IRE | -4.585 |
reckoning | -4.282 |
Token | and |
Token ID | 290 |
Feature activation | -7.04e-01 |
Pos logit contributions | |
enh | +3.688 |
practice | +3.620 |
bid | +3.442 |
adapt | +3.438 |
firsthand | +3.417 |
Neg logit contributions | |
zzle | -5.242 |
mble | -4.868 |
uers | -4.769 |
IRE | -4.757 |
unci | -4.348 |
Token | other |
Token ID | 584 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
enh | +2.448 |
practice | +2.377 |
adapt | +2.265 |
odor | +2.252 |
bid | +2.229 |
Neg logit contributions | |
zzle | -3.434 |
mble | -3.101 |
uers | -3.067 |
IRE | -3.041 |
unci | -2.802 |
Token | alcohol |
Token ID | 5548 |
Feature activation | -8.39e-01 |
Pos logit contributions | |
enh | +3.447 |
practice | +3.322 |
bid | +3.297 |
Occupations | +3.154 |
adapt | +3.120 |
Neg logit contributions | |
zzle | -6.589 |
mble | -6.030 |
uers | -5.935 |
IRE | -5.822 |
unci | -5.428 |
Token | - |
Token ID | 12 |
Feature activation | -3.69e+00 |
Pos logit contributions | |
enh | +3.032 |
practice | +2.827 |
adapt | +2.791 |
odor | +2.700 |
ゴン | +2.697 |
Neg logit contributions | |
zzle | -4.037 |
mble | -3.779 |
uers | -3.633 |
IRE | -3.619 |
reckoning | -3.308 |
Token | related |
Token ID | 5363 |
Feature activation | -7.12e-01 |
Pos logit contributions | |
enh | +7.350 |
related | +7.012 |
practice | +6.177 |
adapt | +6.136 |
only | +5.575 |
Neg logit contributions | |
mble | -21.083 |
zzle | -20.148 |
uers | -20.042 |
IRE | -18.789 |
millenn | -18.762 |
Token | illnesses |
Token ID | 24024 |
Feature activation | -6.78e-01 |
Pos logit contributions | |
enh | +1.596 |
practice | +1.545 |
bid | +1.483 |
Occupations | +1.458 |
odor | +1.409 |
Neg logit contributions | |
zzle | -4.357 |
mble | -4.095 |
uers | -3.991 |
IRE | -3.973 |
unci | -3.685 |
Token | . |
Token ID | 13 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
enh | +2.390 |
practice | +2.343 |
bid | +2.234 |
adapt | +2.224 |
firsthand | +2.200 |
Neg logit contributions | |
zzle | -3.152 |
mble | -2.944 |
uers | -2.883 |
IRE | -2.869 |
unci | -2.580 |
Token | About |
Token ID | 7994 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
zzle | +0.072 |
mble | +0.067 |
uers | +0.065 |
IRE | +0.063 |
reckoning | +0.060 |
Neg logit contributions | |
enh | -0.037 |
practice | -0.035 |
Occupations | -0.035 |
adapt | -0.034 |
Provided | -0.034 |
Token | a |
Token ID | 257 |
Feature activation | +7.07e-01 |
Pos logit contributions | |
zzle | +0.806 |
mble | +0.729 |
uers | +0.713 |
IRE | +0.706 |
reckoning | +0.639 |
Neg logit contributions | |
enh | -0.686 |
practice | -0.682 |
Occupations | -0.652 |
adapt | -0.650 |
theless | -0.646 |
Token | , |
Token ID | 11 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
enh | +2.405 |
practice | +2.358 |
adapt | +2.269 |
Occupations | +2.205 |
Provided | +2.190 |
Neg logit contributions | |
zzle | -3.076 |
mble | -2.803 |
IRE | -2.771 |
uers | -2.714 |
reckoning | -2.509 |
Token | 2011 |
Token ID | 2813 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
zzle | +0.951 |
mble | +0.865 |
IRE | +0.839 |
uers | +0.835 |
reckoning | +0.766 |
Neg logit contributions | |
practice | -0.602 |
enh | -0.594 |
adapt | -0.576 |
Occupations | -0.562 |
theless | -0.543 |
Token | data |
Token ID | 1366 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
enh | +0.996 |
practice | +0.973 |
adapt | +0.961 |
Occupations | +0.934 |
ゴン | +0.921 |
Neg logit contributions | |
zzle | -1.234 |
mble | -1.113 |
IRE | -1.074 |
uers | -1.073 |
reckoning | -0.983 |
Token | : |
Token ID | 25 |
Feature activation | -6.64e-01 |
Pos logit contributions | |
enh | +3.502 |
practice | +3.443 |
adapt | +3.353 |
Provided | +3.275 |
Occupations | +3.240 |
Neg logit contributions | |
zzle | -4.823 |
IRE | -4.308 |
mble | -4.289 |
uers | -4.163 |
htar | -3.928 |
Token | alcohol |
Token ID | 5548 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
enh | +2.420 |
practice | +2.405 |
adapt | +2.350 |
Occupations | +2.316 |
Provided | +2.250 |
Neg logit contributions | |
zzle | -3.199 |
mble | -2.881 |
IRE | -2.759 |
uers | -2.750 |
reckoning | -2.515 |
Token | - |
Token ID | 12 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
enh | +4.361 |
practice | +4.232 |
adapt | +4.071 |
Provided | +4.019 |
Occupations | +3.996 |
Neg logit contributions | |
zzle | -6.554 |
mble | -6.142 |
uers | -5.904 |
IRE | -5.759 |
unci | -5.331 |
Token | im |
Token ID | 320 |
Feature activation | -7.32e-02 |
Pos logit contributions | |
enh | +9.868 |
practice | +9.502 |
related | +9.418 |
adapt | +9.187 |
only | +8.966 |
Neg logit contributions | |
mble | -17.087 |
zzle | -16.974 |
uers | -16.895 |
IRE | -15.234 |
millenn | -15.034 |
Token | pa |
Token ID | 8957 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
enh | +0.397 |
practice | +0.382 |
adapt | +0.380 |
odor | +0.371 |
bid | +0.366 |
Neg logit contributions | |
zzle | -0.234 |
IRE | -0.205 |
mble | -0.203 |
uers | -0.200 |
reckoning | -0.182 |
Token | ired |
Token ID | 1202 |
Feature activation | +1.60e-03 |
Pos logit contributions | |
zzle | +2.039 |
mble | +1.850 |
uers | +1.788 |
IRE | +1.773 |
reckoning | +1.669 |
Neg logit contributions | |
enh | -1.958 |
practice | -1.933 |
adapt | -1.889 |
odor | -1.832 |
Occupations | -1.819 |
Token | driving |
Token ID | 5059 |
Feature activation | -3.57e-01 |
Pos logit contributions | |
zzle | +0.008 |
uers | +0.007 |
mble | +0.007 |
IRE | +0.007 |
htar | +0.007 |
Neg logit contributions | |
enh | -0.005 |
practice | -0.005 |
adapt | -0.005 |
Occupations | -0.005 |
odor | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
practice | +1.252 |
enh | +1.242 |
adapt | +1.167 |
Occupations | +1.158 |
odor | +1.128 |
Neg logit contributions | |
zzle | -1.751 |
mble | -1.640 |
IRE | -1.577 |
uers | -1.577 |
reckoning | -1.433 |
Token | and |
Token ID | 290 |
Feature activation | -5.36e-01 |
Pos logit contributions | |
enh | +3.133 |
practice | +2.942 |
Occupations | +2.896 |
adapt | +2.827 |
Provided | +2.779 |
Neg logit contributions | |
zzle | -4.135 |
mble | -3.792 |
uers | -3.686 |
IRE | -3.655 |
htar | -3.328 |
Token | retirees |
Token ID | 43731 |
Feature activation | +6.32e-01 |
Pos logit contributions | |
enh | +2.043 |
practice | +1.956 |
Occupations | +1.890 |
adapt | +1.881 |
theless | +1.873 |
Neg logit contributions | |
zzle | -2.439 |
mble | -2.235 |
uers | -2.176 |
IRE | -2.162 |
unci | -1.954 |
Token | � |
Token ID | 447 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
zzle | +2.243 |
mble | +1.950 |
uers | +1.913 |
IRE | +1.869 |
reckoning | +1.675 |
Neg logit contributions | |
enh | -3.122 |
practice | -3.088 |
adapt | -2.991 |
Occupations | -2.967 |
theless | -2.926 |
Token | � |
Token ID | 247 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
zzle | +0.652 |
mble | +0.579 |
uers | +0.568 |
IRE | +0.562 |
reckoning | +0.526 |
Neg logit contributions | |
enh | -0.631 |
practice | -0.625 |
ゴン | -0.606 |
adapt | -0.601 |
Occupations | -0.600 |
Token | health |
Token ID | 1535 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
enh | +0.426 |
practice | +0.422 |
adapt | +0.399 |
Occupations | +0.396 |
theless | +0.388 |
Neg logit contributions | |
zzle | -0.528 |
mble | -0.480 |
uers | -0.471 |
IRE | -0.465 |
reckoning | -0.425 |
Token | - |
Token ID | 12 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
enh | +5.695 |
practice | +5.665 |
adapt | +5.266 |
Occupations | +5.118 |
abil | +5.089 |
Neg logit contributions | |
zzle | -8.326 |
uers | -7.519 |
mble | -7.433 |
IRE | -7.314 |
unci | -6.786 |
Token | plan |
Token ID | 11578 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
enh | +8.273 |
practice | +8.259 |
related | +7.468 |
adapt | +7.324 |
standard | +7.301 |
Neg logit contributions | |
zzle | -19.144 |
uers | -17.805 |
mble | -17.438 |
IRE | -16.934 |
unci | -16.371 |
Token | costs |
Token ID | 3484 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
enh | +0.356 |
practice | +0.348 |
adapt | +0.337 |
theless | +0.322 |
Occupations | +0.320 |
Neg logit contributions | |
zzle | -0.547 |
mble | -0.498 |
uers | -0.493 |
IRE | -0.493 |
reckoning | -0.448 |
Token | . |
Token ID | 13 |
Feature activation | -4.56e-01 |
Pos logit contributions | |
enh | +0.062 |
practice | +0.061 |
adapt | +0.058 |
Occupations | +0.058 |
Provided | +0.057 |
Neg logit contributions | |
zzle | -0.074 |
mble | -0.067 |
uers | -0.066 |
IRE | -0.066 |
reckoning | -0.060 |
Token | The |
Token ID | 383 |
Feature activation | +4.55e-02 |
Pos logit contributions | |
enh | +1.338 |
practice | +1.303 |
Occupations | +1.277 |
adapt | +1.261 |
Provided | +1.242 |
Neg logit contributions | |
zzle | -2.520 |
mble | -2.327 |
uers | -2.292 |
IRE | -2.234 |
reckoning | -2.143 |
Token | Tories |
Token ID | 25098 |
Feature activation | +3.99e-01 |
Pos logit contributions | |
zzle | +0.217 |
mble | +0.195 |
uers | +0.192 |
IRE | +0.190 |
reckoning | +0.173 |
Neg logit contributions | |
enh | -0.167 |
practice | -0.166 |
adapt | -0.159 |
Occupations | -0.157 |
odor | -0.156 |
Token | Hart |
Token ID | 11345 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
enh | +3.445 |
practice | +3.425 |
adapt | +3.382 |
Occupations | +3.332 |
Provided | +3.289 |
Neg logit contributions | |
zzle | -4.238 |
IRE | -3.747 |
mble | -3.734 |
uers | -3.657 |
reckoning | -3.359 |
Token | z |
Token ID | 89 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
enh | +7.799 |
practice | +6.909 |
odor | +6.629 |
adapt | +6.591 |
bid | +6.577 |
Neg logit contributions | |
zzle | -9.917 |
IRE | -8.794 |
mble | -8.731 |
uers | -8.569 |
reckoning | -8.161 |
Token | ell |
Token ID | 695 |
Feature activation | -7.55e-01 |
Pos logit contributions | |
enh | +5.679 |
practice | +5.101 |
odor | +5.026 |
adapt | +4.844 |
abil | +4.699 |
Neg logit contributions | |
zzle | -6.483 |
mble | -5.920 |
IRE | -5.850 |
uers | -5.845 |
reckoning | -5.449 |
Token | House |
Token ID | 2097 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
enh | +2.765 |
practice | +2.591 |
adapt | +2.511 |
Occupations | +2.465 |
odor | +2.420 |
Neg logit contributions | |
zzle | -3.612 |
mble | -3.270 |
IRE | -3.237 |
uers | -3.201 |
reckoning | -2.999 |
Token | Bed |
Token ID | 15585 |
Feature activation | -2.42e+00 |
Pos logit contributions | |
zzle | +0.717 |
uers | +0.638 |
mble | +0.634 |
IRE | +0.631 |
reckoning | +0.586 |
Neg logit contributions | |
enh | -0.599 |
practice | -0.579 |
adapt | -0.563 |
Occupations | -0.553 |
ゴン | -0.541 |
Token | & |
Token ID | 1222 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
enh | +8.135 |
practice | +7.506 |
adapt | +7.330 |
abil | +6.938 |
standard | +6.914 |
Neg logit contributions | |
zzle | -10.883 |
mble | -9.888 |
uers | -9.824 |
IRE | -9.814 |
reckoning | -9.092 |
Token | Breakfast |
Token ID | 32175 |
Feature activation | -4.53e-01 |
Pos logit contributions | |
Occupations | +5.943 |
Provided | +5.942 |
enh | +5.381 |
odor | +5.308 |
Played | +5.194 |
Neg logit contributions | |
zzle | -19.916 |
uers | -19.604 |
IRE | -18.722 |
mble | -18.484 |
reckoning | -17.900 |
Token | in |
Token ID | 287 |
Feature activation | +8.37e-02 |
Pos logit contributions | |
enh | +1.718 |
practice | +1.627 |
adapt | +1.608 |
Occupations | +1.569 |
Provided | +1.549 |
Neg logit contributions | |
zzle | -2.114 |
uers | -1.884 |
mble | -1.878 |
IRE | -1.864 |
reckoning | -1.713 |
Token | Add |
Token ID | 3060 |
Feature activation | +8.58e-01 |
Pos logit contributions | |
zzle | +0.411 |
mble | +0.373 |
uers | +0.369 |
IRE | +0.366 |
reckoning | +0.337 |
Neg logit contributions | |
enh | -0.297 |
practice | -0.291 |
adapt | -0.283 |
Occupations | -0.280 |
theless | -0.273 |
Token | ision |
Token ID | 1166 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
zzle | +4.694 |
mble | +4.256 |
IRE | +4.197 |
uers | +4.181 |
reckoning | +3.980 |
Neg logit contributions | |
enh | -2.630 |
practice | -2.556 |
adapt | -2.438 |
Occupations | -2.371 |
odor | -2.340 |
Token | , |
Token ID | 11 |
Feature activation | +9.21e-01 |
Pos logit contributions | |
zzle | +0.587 |
mble | +0.538 |
uers | +0.530 |
IRE | +0.519 |
reckoning | +0.496 |
Neg logit contributions | |
enh | -0.444 |
practice | -0.428 |
Occupations | -0.411 |
adapt | -0.411 |
odor | -0.396 |
Token | J |
Token ID | 41 |
Feature activation | -6.68e-01 |
Pos logit contributions | |
enh | +3.227 |
practice | +3.151 |
adapt | +3.055 |
ゴン | +3.024 |
Occupations | +2.973 |
Neg logit contributions | |
zzle | -4.072 |
mble | -3.643 |
uers | -3.584 |
IRE | -3.523 |
reckoning | -3.339 |
Token | . |
Token ID | 13 |
Feature activation | -4.55e-01 |
Pos logit contributions | |
enh | +2.545 |
practice | +2.503 |
adapt | +2.428 |
ゴン | +2.405 |
Occupations | +2.390 |
Neg logit contributions | |
zzle | -3.074 |
mble | -2.741 |
uers | -2.698 |
IRE | -2.687 |
reckoning | -2.507 |
Token | Costs |
Token ID | 36845 |
Feature activation | -3.78e-03 |
Pos logit contributions | |
enh | +1.310 |
Occupations | +1.299 |
practice | +1.287 |
adapt | +1.257 |
Provided | +1.236 |
Neg logit contributions | |
zzle | -2.583 |
mble | -2.397 |
uers | -2.292 |
IRE | -2.234 |
reckoning | -2.169 |
Token | of |
Token ID | 286 |
Feature activation | +4.85e-01 |
Pos logit contributions | |
enh | +0.017 |
practice | +0.017 |
adapt | +0.016 |
Occupations | +0.016 |
ゴン | +0.016 |
Neg logit contributions | |
zzle | -0.015 |
mble | -0.014 |
IRE | -0.013 |
uers | -0.013 |
reckoning | -0.012 |
Token | alcohol |
Token ID | 5548 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
zzle | +2.367 |
mble | +2.142 |
uers | +2.100 |
IRE | +2.090 |
reckoning | +1.917 |
Neg logit contributions | |
enh | -1.763 |
practice | -1.747 |
adapt | -1.675 |
Occupations | -1.653 |
theless | -1.621 |
Token | - |
Token ID | 12 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
enh | +4.083 |
practice | +3.979 |
adapt | +3.817 |
Provided | +3.703 |
bid | +3.660 |
Neg logit contributions | |
zzle | -5.643 |
mble | -5.300 |
uers | -5.104 |
IRE | -5.006 |
unci | -4.593 |
Token | involved |
Token ID | 44697 |
Feature activation | -9.54e-02 |
Pos logit contributions | |
enh | +9.285 |
practice | +8.682 |
adapt | +8.669 |
related | +8.344 |
only | +7.902 |
Neg logit contributions | |
zzle | -17.319 |
mble | -17.212 |
uers | -16.586 |
IRE | -15.317 |
reckoning | -14.994 |
Token | crashes |
Token ID | 17616 |
Feature activation | -3.68e-01 |
Pos logit contributions | |
practice | +0.316 |
enh | +0.315 |
Occupations | +0.297 |
adapt | +0.297 |
theless | +0.291 |
Neg logit contributions | |
zzle | -0.490 |
mble | -0.447 |
uers | -0.441 |
IRE | -0.436 |
unci | -0.395 |
Token | , |
Token ID | 11 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
enh | +1.376 |
practice | +1.369 |
adapt | +1.296 |
Occupations | +1.286 |
Provided | +1.259 |
Neg logit contributions | |
zzle | -1.689 |
mble | -1.565 |
IRE | -1.537 |
uers | -1.520 |
reckoning | -1.380 |
Token | United |
Token ID | 1578 |
Feature activation | -3.35e-02 |
Pos logit contributions | |
zzle | +1.539 |
mble | +1.399 |
uers | +1.376 |
IRE | +1.360 |
reckoning | +1.250 |
Neg logit contributions | |
practice | -0.907 |
enh | -0.903 |
adapt | -0.870 |
Occupations | -0.859 |
theless | -0.829 |
Token | States |
Token ID | 1829 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
enh | +0.107 |
practice | +0.106 |
Occupations | +0.106 |
adapt | +0.102 |
Provided | +0.099 |
Neg logit contributions | |
zzle | -0.176 |
mble | -0.164 |
uers | -0.156 |
IRE | -0.155 |
reckoning | -0.147 |
Token | ka |
Token ID | 4914 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
zzle | +2.828 |
mble | +2.586 |
IRE | +2.557 |
uers | +2.508 |
reckoning | +2.374 |
Neg logit contributions | |
enh | -2.340 |
practice | -2.331 |
adapt | -2.240 |
odor | -2.180 |
Occupations | -2.139 |
Token | for |
Token ID | 1640 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
zzle | +2.977 |
mble | +2.777 |
IRE | +2.731 |
uers | +2.724 |
reckoning | +2.599 |
Neg logit contributions | |
enh | -0.939 |
practice | -0.918 |
adapt | -0.861 |
Occupations | -0.792 |
odor | -0.788 |
Token | posted |
Token ID | 4481 |
Feature activation | -1.96e-01 |
Pos logit contributions | |
enh | +0.516 |
practice | +0.504 |
theless | +0.480 |
adapt | +0.476 |
Provided | +0.466 |
Neg logit contributions | |
zzle | -0.681 |
mble | -0.631 |
IRE | -0.601 |
uers | -0.599 |
reckoning | -0.549 |
Token | a |
Token ID | 257 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
enh | +0.751 |
practice | +0.746 |
adapt | +0.704 |
Occupations | +0.701 |
odor | +0.689 |
Neg logit contributions | |
zzle | -0.922 |
mble | -0.816 |
IRE | -0.803 |
uers | -0.794 |
reckoning | -0.716 |
Token | career |
Token ID | 3451 |
Feature activation | -1.76e+00 |
Pos logit contributions | |
practice | +0.564 |
enh | +0.558 |
adapt | +0.525 |
Occupations | +0.522 |
odor | +0.516 |
Neg logit contributions | |
zzle | -0.705 |
mble | -0.636 |
uers | -0.620 |
IRE | -0.617 |
unci | -0.553 |
Token | - |
Token ID | 12 |
Feature activation | -3.51e+00 |
Pos logit contributions | |
enh | +5.567 |
practice | +5.414 |
standard | +5.100 |
bid | +4.946 |
adapt | +4.913 |
Neg logit contributions | |
zzle | -8.673 |
mble | -8.035 |
uers | -7.874 |
IRE | -7.724 |
unci | -7.177 |
Token | high |
Token ID | 8929 |
Feature activation | -7.30e-01 |
Pos logit contributions | |
enh | +5.239 |
practice | +4.457 |
standard | +4.424 |
adapt | +3.537 |
only | +3.523 |
Neg logit contributions | |
zzle | -21.511 |
mble | -20.640 |
uers | -20.476 |
IRE | -20.416 |
unci | -19.129 |
Token | 30 |
Token ID | 1542 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
practice | +2.390 |
enh | +2.369 |
odor | +2.229 |
Occupations | +2.227 |
adapt | +2.212 |
Neg logit contributions | |
zzle | -3.655 |
mble | -3.313 |
IRE | -3.276 |
uers | -3.276 |
unci | -2.976 |
Token | points |
Token ID | 2173 |
Feature activation | -4.29e-01 |
Pos logit contributions | |
practice | +3.271 |
enh | +3.240 |
adapt | +2.971 |
odor | +2.910 |
Occupations | +2.834 |
Neg logit contributions | |
zzle | -7.068 |
mble | -6.527 |
IRE | -6.490 |
uers | -6.454 |
htar | -6.045 |
Token | in |
Token ID | 287 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
practice | +1.550 |
enh | +1.542 |
adapt | +1.419 |
theless | +1.408 |
Occupations | +1.389 |
Neg logit contributions | |
zzle | -2.052 |
mble | -1.890 |
IRE | -1.825 |
uers | -1.821 |
htar | -1.662 |
Token | an |
Token ID | 281 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
practice | +1.472 |
enh | +1.426 |
adapt | +1.357 |
odor | +1.321 |
theless | +1.299 |
Neg logit contributions | |
zzle | -1.683 |
uers | -1.511 |
mble | -1.509 |
IRE | -1.488 |
reckoning | -1.342 |
Token | � |
Token ID | 247 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
zzle | +3.251 |
mble | +2.971 |
uers | +2.851 |
IRE | +2.821 |
reckoning | +2.668 |
Neg logit contributions | |
enh | -2.938 |
practice | -2.910 |
adapt | -2.790 |
Occupations | -2.774 |
ゴン | -2.743 |
Token | s |
Token ID | 82 |
Feature activation | +4.50e-01 |
Pos logit contributions | |
zzle | +1.098 |
mble | +1.008 |
IRE | +0.982 |
uers | +0.981 |
reckoning | +0.937 |
Neg logit contributions | |
enh | -0.611 |
practice | -0.595 |
adapt | -0.576 |
theless | -0.555 |
odor | -0.551 |
Token | called |
Token ID | 1444 |
Feature activation | -3.57e-01 |
Pos logit contributions | |
zzle | +1.745 |
mble | +1.571 |
IRE | +1.509 |
uers | +1.489 |
reckoning | +1.339 |
Neg logit contributions | |
enh | -2.072 |
practice | -2.031 |
adapt | -1.979 |
ゴン | -1.962 |
theless | -1.937 |
Token | a |
Token ID | 257 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
enh | +1.453 |
practice | +1.424 |
adapt | +1.383 |
Occupations | +1.361 |
odor | +1.344 |
Neg logit contributions | |
zzle | -1.529 |
mble | -1.368 |
IRE | -1.366 |
uers | -1.350 |
reckoning | -1.230 |
Token | credit |
Token ID | 3884 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
enh | +0.866 |
practice | +0.860 |
adapt | +0.818 |
odor | +0.802 |
Occupations | +0.799 |
Neg logit contributions | |
zzle | -1.058 |
mble | -0.969 |
IRE | -0.965 |
uers | -0.954 |
reckoning | -0.855 |
Token | - |
Token ID | 12 |
Feature activation | -3.50e+00 |
Pos logit contributions | |
enh | +4.556 |
practice | +4.227 |
abil | +4.163 |
adapt | +4.110 |
bid | +4.014 |
Neg logit contributions | |
zzle | -5.379 |
mble | -5.134 |
IRE | -4.950 |
uers | -4.904 |
unci | -4.456 |
Token | default |
Token ID | 12286 |
Feature activation | -5.29e-01 |
Pos logit contributions | |
enh | +11.655 |
practice | +10.410 |
standard | +9.983 |
only | +9.869 |
adapt | +9.848 |
Neg logit contributions | |
zzle | -14.822 |
mble | -14.639 |
uers | -13.901 |
IRE | -13.750 |
unci | -12.772 |
Token | swap |
Token ID | 16075 |
Feature activation | -9.94e-01 |
Pos logit contributions | |
enh | +1.775 |
practice | +1.712 |
adapt | +1.657 |
abil | +1.617 |
odor | +1.585 |
Neg logit contributions | |
zzle | -2.615 |
mble | -2.476 |
uers | -2.371 |
IRE | -2.356 |
unci | -2.177 |
Token | , |
Token ID | 11 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
enh | +3.651 |
practice | +3.567 |
adapt | +3.382 |
abil | +3.354 |
bid | +3.282 |
Neg logit contributions | |
zzle | -4.450 |
mble | -4.184 |
uers | -4.087 |
IRE | -4.002 |
unci | -3.712 |
Token | essentially |
Token ID | 6986 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
zzle | +1.183 |
mble | +1.089 |
IRE | +1.056 |
uers | +1.043 |
reckoning | +0.918 |
Neg logit contributions | |
enh | -1.252 |
practice | -1.219 |
adapt | -1.198 |
Occupations | -1.166 |
ゴン | -1.154 |
Token | an |
Token ID | 281 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
zzle | +1.608 |
mble | +1.461 |
IRE | +1.428 |
uers | +1.428 |
reckoning | +1.266 |
Neg logit contributions | |
enh | -1.650 |
practice | -1.628 |
adapt | -1.559 |
Occupations | -1.550 |
ゴン | -1.533 |
Token | something |
Token ID | 1223 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
zzle | +1.678 |
mble | +1.521 |
IRE | +1.500 |
uers | +1.491 |
reckoning | +1.363 |
Neg logit contributions | |
enh | -1.373 |
practice | -1.350 |
adapt | -1.300 |
Occupations | -1.287 |
theless | -1.252 |
Token | in |
Token ID | 287 |
Feature activation | +2.42e-01 |
Pos logit contributions | |
enh | +0.545 |
practice | +0.530 |
adapt | +0.510 |
Occupations | +0.500 |
Provided | +0.496 |
Neg logit contributions | |
zzle | -0.682 |
mble | -0.628 |
IRE | -0.612 |
uers | -0.609 |
reckoning | -0.547 |
Token | return |
Token ID | 1441 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
zzle | +1.118 |
mble | +1.034 |
IRE | +1.030 |
uers | +1.014 |
reckoning | +0.915 |
Neg logit contributions | |
enh | -0.909 |
practice | -0.901 |
adapt | -0.861 |
Occupations | -0.844 |
bid | -0.833 |
Token | – |
Token ID | 784 |
Feature activation | -6.22e-01 |
Pos logit contributions | |
enh | +0.423 |
practice | +0.414 |
adapt | +0.398 |
Occupations | +0.393 |
odor | +0.384 |
Neg logit contributions | |
zzle | -0.579 |
mble | -0.528 |
IRE | -0.521 |
uers | -0.519 |
reckoning | -0.477 |
Token | good |
Token ID | 922 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
enh | +2.639 |
practice | +2.564 |
adapt | +2.481 |
Occupations | +2.467 |
Provided | +2.405 |
Neg logit contributions | |
zzle | -2.558 |
mble | -2.349 |
uers | -2.282 |
IRE | -2.277 |
reckoning | -2.065 |
Token | - |
Token ID | 12 |
Feature activation | -3.49e+00 |
Pos logit contributions | |
practice | +4.137 |
enh | +4.123 |
Occupations | +3.950 |
adapt | +3.877 |
firsthand | +3.737 |
Neg logit contributions | |
zzle | -6.068 |
mble | -5.674 |
IRE | -5.575 |
uers | -5.496 |
unci | -4.994 |
Token | paying |
Token ID | 32629 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
practice | +9.026 |
enh | +8.296 |
adapt | +7.883 |
odor | +7.447 |
standard | +7.407 |
Neg logit contributions | |
zzle | -16.901 |
mble | -16.724 |
IRE | -16.295 |
uers | -15.749 |
reckoning | -14.593 |
Token | jobs |
Token ID | 3946 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
zzle | +5.462 |
mble | +4.881 |
uers | +4.814 |
IRE | +4.803 |
reckoning | +4.488 |
Neg logit contributions | |
enh | -4.269 |
practice | -4.226 |
adapt | -4.081 |
ゴン | -4.038 |
Occupations | -4.006 |
Token | , |
Token ID | 11 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
enh | +5.452 |
practice | +4.959 |
Provided | +4.903 |
adapt | +4.898 |
Occupations | +4.880 |
Neg logit contributions | |
zzle | -7.443 |
mble | -7.073 |
IRE | -7.010 |
uers | -6.724 |
unci | -6.227 |
Token | making |
Token ID | 1642 |
Feature activation | +3.91e-01 |
Pos logit contributions | |
zzle | +0.691 |
mble | +0.625 |
IRE | +0.617 |
uers | +0.610 |
reckoning | +0.562 |
Neg logit contributions | |
enh | -0.610 |
practice | -0.589 |
adapt | -0.575 |
Occupations | -0.568 |
Provided | -0.547 |
Token | sure |
Token ID | 1654 |
Feature activation | +4.77e-02 |
Pos logit contributions | |
zzle | +1.681 |
mble | +1.522 |
IRE | +1.494 |
uers | +1.462 |
reckoning | +1.345 |
Neg logit contributions | |
enh | -1.634 |
practice | -1.601 |
adapt | -1.558 |
Occupations | -1.544 |
odor | -1.492 |
Token | P |
Token ID | 350 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
enh | +0.415 |
Occupations | +0.410 |
practice | +0.406 |
adapt | +0.390 |
Provided | +0.388 |
Neg logit contributions | |
zzle | -0.907 |
mble | -0.843 |
uers | -0.816 |
IRE | -0.805 |
reckoning | -0.767 |
Token | unks |
Token ID | 14125 |
Feature activation | -4.17e-02 |
Pos logit contributions | |
zzle | +8.126 |
uers | +7.167 |
mble | +7.153 |
IRE | +7.056 |
reckoning | +6.516 |
Neg logit contributions | |
practice | -7.846 |
enh | -7.831 |
ゴン | -7.700 |
adapt | -7.602 |
Occupations | -7.570 |
Token | are |
Token ID | 389 |
Feature activation | +5.59e-01 |
Pos logit contributions | |
enh | +0.176 |
practice | +0.175 |
adapt | +0.170 |
theless | +0.166 |
Occupations | +0.165 |
Neg logit contributions | |
zzle | -0.175 |
mble | -0.157 |
uers | -0.154 |
IRE | -0.153 |
reckoning | -0.139 |
Token | given |
Token ID | 1813 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
zzle | +2.445 |
mble | +2.183 |
IRE | +2.133 |
uers | +2.116 |
reckoning | +1.884 |
Neg logit contributions | |
enh | -2.327 |
practice | -2.285 |
adapt | -2.245 |
Occupations | -2.206 |
theless | -2.204 |
Token | inferior |
Token ID | 18536 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
enh | +5.450 |
practice | +5.142 |
odor | +5.130 |
firsthand | +5.076 |
Occupations | +5.058 |
Neg logit contributions | |
zzle | -6.826 |
mble | -6.088 |
IRE | -6.065 |
uers | -5.894 |
unci | -5.210 |
Token | service |
Token ID | 2139 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
enh | +3.675 |
practice | +3.546 |
odor | +3.425 |
Occupations | +3.408 |
adapt | +3.381 |
Neg logit contributions | |
zzle | -5.502 |
IRE | -4.948 |
mble | -4.939 |
uers | -4.842 |
htar | -4.371 |
Token | or |
Token ID | 393 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
enh | +10.154 |
Occupations | +9.836 |
firsthand | +9.805 |
practice | +9.594 |
ability | +9.315 |
Neg logit contributions | |
zzle | -14.610 |
mble | -13.830 |
IRE | -13.343 |
uers | -12.880 |
peria | -11.904 |
Token | not |
Token ID | 407 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
enh | +3.866 |
practice | +3.714 |
Occupations | +3.665 |
theless | +3.623 |
adapt | +3.532 |
Neg logit contributions | |
zzle | -4.619 |
IRE | -4.107 |
mble | -4.103 |
uers | -4.017 |
unci | -3.583 |
Token | served |
Token ID | 4983 |
Feature activation | -2.62e+00 |
Pos logit contributions | |
enh | +4.447 |
practice | +4.319 |
adapt | +4.254 |
theless | +4.171 |
Occupations | +4.126 |
Neg logit contributions | |
zzle | -4.907 |
IRE | -4.511 |
mble | -4.466 |
uers | -4.310 |
reckoning | -3.921 |
Token | at |
Token ID | 379 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
enh | +7.822 |
firsthand | +7.234 |
adapt | +7.153 |
Occupations | +7.081 |
practice | +7.072 |
Neg logit contributions | |
zzle | -12.175 |
mble | -11.370 |
IRE | -11.286 |
uers | -10.652 |
�� | -10.250 |
Token | all |
Token ID | 477 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
enh | +4.763 |
practice | +4.677 |
Occupations | +4.531 |
odor | +4.333 |
adapt | +4.325 |
Neg logit contributions | |
zzle | -7.878 |
mble | -7.144 |
IRE | -6.711 |
uers | -6.628 |
htar | -6.319 |
Token | not |
Token ID | 407 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
enh | +5.242 |
practice | +5.130 |
adapt | +5.061 |
bid | +4.758 |
odor | +4.739 |
Neg logit contributions | |
zzle | -7.175 |
mble | -6.384 |
IRE | -6.330 |
uers | -6.208 |
unci | -5.944 |
Token | appear |
Token ID | 1656 |
Feature activation | -6.25e-01 |
Pos logit contributions | |
enh | +5.079 |
practice | +4.881 |
standard | +4.708 |
adapt | +4.659 |
firsthand | +4.595 |
Neg logit contributions | |
zzle | -8.115 |
mble | -7.659 |
IRE | -7.299 |
uers | -6.896 |
unci | -6.782 |
Token | to |
Token ID | 284 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
enh | +2.329 |
practice | +2.285 |
adapt | +2.187 |
Occupations | +2.142 |
ゴン | +2.123 |
Neg logit contributions | |
zzle | -2.984 |
mble | -2.672 |
uers | -2.613 |
IRE | -2.573 |
reckoning | -2.425 |
Token | be |
Token ID | 307 |
Feature activation | -6.61e-01 |
Pos logit contributions | |
enh | +5.220 |
practice | +5.089 |
adapt | +4.829 |
abil | +4.750 |
standard | +4.644 |
Neg logit contributions | |
zzle | -6.609 |
mble | -5.946 |
IRE | -5.610 |
uers | -5.513 |
unci | -5.269 |
Token | life |
Token ID | 1204 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
enh | +2.087 |
practice | +2.041 |
adapt | +1.927 |
Occupations | +1.895 |
odor | +1.869 |
Neg logit contributions | |
zzle | -3.460 |
mble | -3.147 |
uers | -3.118 |
IRE | -3.040 |
unci | -2.900 |
Token | - |
Token ID | 12 |
Feature activation | -3.47e+00 |
Pos logit contributions | |
enh | +5.670 |
adapt | +5.397 |
practice | +5.371 |
standard | +5.014 |
theless | +4.993 |
Neg logit contributions | |
zzle | -6.001 |
mble | -5.629 |
IRE | -5.382 |
uers | -5.308 |
unci | -4.827 |
Token | threatening |
Token ID | 26159 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
enh | +6.473 |
related | +5.444 |
adapt | +5.390 |
practice | +5.004 |
standard | +4.742 |
Neg logit contributions | |
mble | -20.338 |
zzle | -20.260 |
IRE | -19.067 |
uers | -18.966 |
unci | -18.436 |
Token | , |
Token ID | 11 |
Feature activation | +8.60e-01 |
Pos logit contributions | |
zzle | +0.676 |
mble | +0.600 |
IRE | +0.594 |
uers | +0.593 |
reckoning | +0.550 |
Neg logit contributions | |
enh | -0.590 |
practice | -0.582 |
adapt | -0.563 |
Occupations | -0.556 |
ゴン | -0.553 |
Token | White |
Token ID | 2635 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
zzle | +4.204 |
mble | +3.818 |
IRE | +3.768 |
uers | +3.741 |
reckoning | +3.464 |
Neg logit contributions | |
enh | -3.102 |
practice | -3.035 |
adapt | -2.938 |
Occupations | -2.908 |
theless | -2.869 |
Token | said |
Token ID | 531 |
Feature activation | +3.24e-01 |
Pos logit contributions | |
zzle | +0.702 |
mble | +0.583 |
uers | +0.573 |
IRE | +0.567 |
reckoning | +0.503 |
Neg logit contributions | |
enh | -1.267 |
practice | -1.261 |
adapt | -1.232 |
Occupations | -1.221 |
ゴン | -1.219 |
Token | . |
Token ID | 13 |
Feature activation | -7.01e-01 |
Pos logit contributions | |
zzle | +1.319 |
mble | +1.151 |
uers | +1.140 |
IRE | +1.126 |
reckoning | +1.044 |
Neg logit contributions | |
enh | -1.400 |
practice | -1.394 |
adapt | -1.354 |
Occupations | -1.341 |
theless | -1.334 |
Token | � |
Token ID | 247 |
Feature activation | +3.26e-01 |
Pos logit contributions | |
zzle | +2.110 |
mble | +1.881 |
uers | +1.827 |
IRE | +1.822 |
reckoning | +1.711 |
Neg logit contributions | |
enh | -1.993 |
practice | -1.975 |
adapt | -1.901 |
Occupations | -1.896 |
ゴン | -1.887 |
Token | s |
Token ID | 82 |
Feature activation | +8.08e-02 |
Pos logit contributions | |
zzle | +1.756 |
mble | +1.606 |
IRE | +1.580 |
uers | +1.566 |
reckoning | +1.482 |
Neg logit contributions | |
enh | -1.008 |
practice | -0.981 |
adapt | -0.951 |
theless | -0.914 |
Occupations | -0.912 |
Token | focusing |
Token ID | 10759 |
Feature activation | -3.36e-01 |
Pos logit contributions | |
zzle | +0.343 |
mble | +0.307 |
IRE | +0.299 |
uers | +0.298 |
reckoning | +0.270 |
Neg logit contributions | |
enh | -0.343 |
practice | -0.333 |
adapt | -0.328 |
Occupations | -0.320 |
theless | -0.317 |
Token | on |
Token ID | 319 |
Feature activation | -9.54e-01 |
Pos logit contributions | |
enh | +1.311 |
practice | +1.296 |
adapt | +1.252 |
Occupations | +1.226 |
theless | +1.203 |
Neg logit contributions | |
zzle | -1.525 |
mble | -1.341 |
uers | -1.322 |
IRE | -1.321 |
reckoning | -1.219 |
Token | working |
Token ID | 1762 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
practice | +3.608 |
enh | +3.607 |
Occupations | +3.514 |
adapt | +3.436 |
odor | +3.405 |
Neg logit contributions | |
zzle | -4.191 |
mble | -3.809 |
IRE | -3.732 |
uers | -3.722 |
htar | -3.289 |
Token | - |
Token ID | 12 |
Feature activation | -3.46e+00 |
Pos logit contributions | |
practice | +6.862 |
enh | +6.844 |
Occupations | +6.757 |
adapt | +6.480 |
firsthand | +6.272 |
Neg logit contributions | |
zzle | -8.794 |
mble | -8.401 |
uers | -7.956 |
IRE | -7.673 |
�� | -7.020 |
Token | class |
Token ID | 4871 |
Feature activation | -9.49e-01 |
Pos logit contributions | |
practice | +8.419 |
enh | +8.295 |
standard | +8.059 |
adapt | +7.568 |
Occupations | +6.835 |
Neg logit contributions | |
zzle | -17.251 |
mble | -16.761 |
uers | -16.324 |
IRE | -14.860 |
reckoning | -14.453 |
Token | white |
Token ID | 2330 |
Feature activation | +5.26e-01 |
Pos logit contributions | |
enh | +3.474 |
Occupations | +3.465 |
practice | +3.383 |
odor | +3.260 |
adapt | +3.224 |
Neg logit contributions | |
zzle | -4.304 |
mble | -3.980 |
uers | -3.927 |
IRE | -3.783 |
htar | -3.414 |
Token | Phil |
Token ID | 4543 |
Feature activation | +6.91e-02 |
Pos logit contributions | |
zzle | +2.412 |
mble | +2.174 |
uers | +2.131 |
IRE | +2.119 |
reckoning | +1.947 |
Neg logit contributions | |
enh | -2.047 |
practice | -2.018 |
adapt | -1.953 |
Occupations | -1.945 |
ゴン | -1.897 |
Token | adel |
Token ID | 6959 |
Feature activation | +1.51e-02 |
Pos logit contributions | |
zzle | +0.388 |
mble | +0.359 |
IRE | +0.355 |
uers | +0.349 |
reckoning | +0.334 |
Neg logit contributions | |
enh | -0.194 |
practice | -0.190 |
adapt | -0.183 |
Occupations | -0.175 |
ゴン | -0.173 |
Token | ph |
Token ID | 746 |
Feature activation | -8.91e-02 |
Pos logit contributions | |
zzle | +0.090 |
mble | +0.086 |
IRE | +0.084 |
uers | +0.083 |
reckoning | +0.080 |
Neg logit contributions | |
enh | -0.037 |
practice | -0.037 |
adapt | -0.034 |
bid | -0.031 |
Occupations | -0.031 |
Token | On |
Token ID | 1550 |
Feature activation | +5.54e-01 |
Pos logit contributions | |
zzle | +2.041 |
mble | +1.812 |
IRE | +1.781 |
uers | +1.774 |
reckoning | +1.612 |
Neg logit contributions | |
enh | -1.714 |
practice | -1.705 |
adapt | -1.649 |
Occupations | -1.614 |
odor | -1.582 |
Token | the |
Token ID | 262 |
Feature activation | -3.81e-01 |
Pos logit contributions | |
zzle | +2.704 |
mble | +2.414 |
IRE | +2.386 |
uers | +2.368 |
reckoning | +2.198 |
Neg logit contributions | |
enh | -2.034 |
practice | -2.009 |
adapt | -1.931 |
Occupations | -1.908 |
odor | -1.870 |
Token | Gene |
Token ID | 13005 |
Feature activation | -5.22e-01 |
Pos logit contributions | |
enh | +1.265 |
practice | +1.251 |
Occupations | +1.220 |
adapt | +1.208 |
odor | +1.202 |
Neg logit contributions | |
zzle | -1.939 |
mble | -1.770 |
uers | -1.721 |
IRE | -1.712 |
reckoning | -1.577 |
Token | alogy |
Token ID | 48909 |
Feature activation | -4.84e-01 |
Pos logit contributions | |
enh | +1.601 |
practice | +1.502 |
adapt | +1.457 |
bid | +1.453 |
Occupations | +1.438 |
Neg logit contributions | |
zzle | -2.792 |
mble | -2.512 |
IRE | -2.492 |
uers | -2.485 |
reckoning | -2.343 |
Token | of |
Token ID | 286 |
Feature activation | -3.45e-03 |
Pos logit contributions | |
enh | +2.527 |
practice | +2.469 |
Occupations | +2.444 |
adapt | +2.425 |
ゴン | +2.381 |
Neg logit contributions | |
zzle | -1.536 |
mble | -1.322 |
uers | -1.256 |
IRE | -1.254 |
reckoning | -1.095 |
Token | Mor |
Token ID | 3461 |
Feature activation | -3.42e+00 |
Pos logit contributions | |
enh | +0.012 |
practice | +0.012 |
Occupations | +0.012 |
adapt | +0.011 |
odor | +0.011 |
Neg logit contributions | |
zzle | -0.018 |
mble | -0.016 |
IRE | -0.015 |
uers | -0.015 |
reckoning | -0.014 |
Token | als |
Token ID | 874 |
Feature activation | -4.31e-01 |
Pos logit contributions | |
bid | +9.444 |
practice | +8.452 |
odor | +8.425 |
enh | +8.423 |
adapt | +8.359 |
Neg logit contributions | |
zzle | -15.808 |
IRE | -15.540 |
mble | -15.336 |
�� | -14.671 |
uers | -14.578 |
Token | , |
Token ID | 11 |
Feature activation | +5.85e-01 |
Pos logit contributions | |
enh | +1.533 |
practice | +1.477 |
Occupations | +1.460 |
adapt | +1.446 |
theless | +1.402 |
Neg logit contributions | |
zzle | -2.107 |
mble | -1.901 |
uers | -1.864 |
IRE | -1.833 |
reckoning | -1.692 |
Token | Nietzsche |
Token ID | 40258 |
Feature activation | -7.42e-01 |
Pos logit contributions | |
zzle | +3.261 |
mble | +2.977 |
uers | +2.923 |
IRE | +2.918 |
reckoning | +2.720 |
Neg logit contributions | |
enh | -1.722 |
practice | -1.678 |
adapt | -1.639 |
Occupations | -1.609 |
theless | -1.565 |
Token | discusses |
Token ID | 19451 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
enh | +2.595 |
practice | +2.421 |
adapt | +2.395 |
theless | +2.361 |
odor | +2.313 |
Neg logit contributions | |
zzle | -3.640 |
mble | -3.386 |
IRE | -3.340 |
uers | -3.210 |
htar | -2.915 |
Token | the |
Token ID | 262 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
enh | +4.692 |
practice | +4.612 |
adapt | +4.475 |
Occupations | +4.354 |
odor | +4.283 |
Neg logit contributions | |
zzle | -5.512 |
mble | -4.848 |
IRE | -4.830 |
uers | -4.742 |
reckoning | -4.202 |
Token | players |
Token ID | 1938 |
Feature activation | -6.49e-01 |
Pos logit contributions | |
enh | +1.053 |
practice | +1.036 |
Occupations | +0.998 |
adapt | +0.982 |
odor | +0.970 |
Neg logit contributions | |
zzle | -1.289 |
mble | -1.108 |
uers | -1.101 |
IRE | -1.086 |
reckoning | -1.011 |
Token | will |
Token ID | 481 |
Feature activation | +5.05e-01 |
Pos logit contributions | |
enh | +2.576 |
practice | +2.568 |
adapt | +2.420 |
Occupations | +2.415 |
Provided | +2.410 |
Neg logit contributions | |
zzle | -2.846 |
uers | -2.456 |
mble | -2.451 |
IRE | -2.359 |
unci | -2.189 |
Token | be |
Token ID | 307 |
Feature activation | +6.99e-01 |
Pos logit contributions | |
zzle | +2.271 |
mble | +2.003 |
uers | +1.960 |
IRE | +1.952 |
reckoning | +1.805 |
Neg logit contributions | |
practice | -2.020 |
enh | -2.019 |
adapt | -1.921 |
odor | -1.874 |
Occupations | -1.843 |
Token | joined |
Token ID | 5399 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
zzle | +2.957 |
mble | +2.622 |
uers | +2.540 |
IRE | +2.515 |
reckoning | +2.248 |
Neg logit contributions | |
enh | -2.992 |
practice | -2.989 |
adapt | -2.860 |
Occupations | -2.834 |
Provided | -2.782 |
Token | by |
Token ID | 416 |
Feature activation | +2.76e-01 |
Pos logit contributions | |
enh | +1.293 |
practice | +1.285 |
adapt | +1.237 |
ゴン | +1.195 |
Occupations | +1.194 |
Neg logit contributions | |
zzle | -1.953 |
mble | -1.720 |
IRE | -1.707 |
uers | -1.675 |
reckoning | -1.568 |
Token | Jim |
Token ID | 5395 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
zzle | +1.320 |
mble | +1.167 |
IRE | +1.144 |
uers | +1.138 |
reckoning | +1.040 |
Neg logit contributions | |
enh | -1.033 |
practice | -1.022 |
adapt | -0.980 |
Occupations | -0.972 |
theless | -0.958 |
Token | Hub |
Token ID | 14699 |
Feature activation | +9.65e-02 |
Pos logit contributions | |
enh | +9.692 |
practice | +8.821 |
adapt | +8.552 |
bid | +8.533 |
Cunningham | +8.412 |
Neg logit contributions | |
zzle | -15.170 |
uers | -13.703 |
mble | -13.617 |
IRE | -13.537 |
reckoning | -12.258 |
Token | ay |
Token ID | 323 |
Feature activation | -5.72e-01 |
Pos logit contributions | |
zzle | +0.496 |
mble | +0.450 |
IRE | +0.446 |
uers | +0.439 |
reckoning | +0.422 |
Neg logit contributions | |
enh | -0.329 |
practice | -0.313 |
adapt | -0.301 |
odor | -0.289 |
bid | -0.287 |
Token | and |
Token ID | 290 |
Feature activation | -7.59e-01 |
Pos logit contributions | |
enh | +2.100 |
practice | +1.941 |
adapt | +1.892 |
Occupations | +1.828 |
bid | +1.824 |
Neg logit contributions | |
zzle | -2.739 |
IRE | -2.487 |
uers | -2.453 |
mble | -2.451 |
reckoning | -2.284 |
Token | the |
Token ID | 262 |
Feature activation | -8.99e-01 |
Pos logit contributions | |
enh | +2.653 |
practice | +2.630 |
Occupations | +2.527 |
adapt | +2.522 |
Provided | +2.504 |
Neg logit contributions | |
zzle | -3.665 |
mble | -3.219 |
IRE | -3.190 |
uers | -3.170 |
unci | -2.831 |
Token | late |
Token ID | 2739 |
Feature activation | -6.03e-01 |
Pos logit contributions | |
enh | +3.190 |
practice | +3.081 |
odor | +3.040 |
Occupations | +2.999 |
Provided | +2.922 |
Neg logit contributions | |
zzle | -4.317 |
mble | -3.792 |
uers | -3.735 |
IRE | -3.717 |
reckoning | -3.402 |
Token | who |
Token ID | 508 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
zzle | +2.393 |
mble | +2.148 |
uers | +2.101 |
IRE | +2.091 |
reckoning | +1.865 |
Neg logit contributions | |
enh | -2.207 |
practice | -2.141 |
adapt | -2.101 |
Occupations | -2.071 |
ゴン | -2.057 |
Token | has |
Token ID | 468 |
Feature activation | -5.19e-02 |
Pos logit contributions | |
enh | +0.544 |
practice | +0.532 |
adapt | +0.507 |
Occupations | +0.503 |
theless | +0.501 |
Neg logit contributions | |
zzle | -0.738 |
mble | -0.680 |
IRE | -0.660 |
uers | -0.656 |
reckoning | -0.605 |
Token | followed |
Token ID | 3940 |
Feature activation | -9.01e-01 |
Pos logit contributions | |
enh | +0.207 |
practice | +0.201 |
adapt | +0.192 |
theless | +0.189 |
Occupations | +0.189 |
Neg logit contributions | |
zzle | -0.231 |
mble | -0.210 |
uers | -0.207 |
IRE | -0.205 |
reckoning | -0.184 |
Token | them |
Token ID | 606 |
Feature activation | -1.93e-01 |
Pos logit contributions | |
enh | +3.089 |
practice | +2.921 |
Occupations | +2.887 |
adapt | +2.835 |
odor | +2.811 |
Neg logit contributions | |
zzle | -4.341 |
mble | -4.028 |
IRE | -3.860 |
uers | -3.819 |
reckoning | -3.518 |
Token | from |
Token ID | 422 |
Feature activation | -3.55e-01 |
Pos logit contributions | |
enh | +0.763 |
practice | +0.740 |
adapt | +0.712 |
theless | +0.695 |
Occupations | +0.694 |
Neg logit contributions | |
zzle | -0.870 |
mble | -0.814 |
IRE | -0.775 |
uers | -0.765 |
unci | -0.687 |
Token | Mor |
Token ID | 3461 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
enh | +1.299 |
practice | +1.239 |
adapt | +1.214 |
Occupations | +1.204 |
odor | +1.181 |
Neg logit contributions | |
zzle | -1.700 |
mble | -1.551 |
uers | -1.499 |
IRE | -1.488 |
unci | -1.352 |
Token | ia |
Token ID | 544 |
Feature activation | -2.50e-01 |
Pos logit contributions | |
bid | +9.739 |
enh | +9.704 |
adapt | +9.250 |
practice | +9.235 |
odor | +8.712 |
Neg logit contributions | |
mble | -14.989 |
millenn | -14.729 |
zzle | -14.035 |
IRE | -13.166 |
GBT | -13.078 |
Token | . |
Token ID | 13 |
Feature activation | +9.86e-02 |
Pos logit contributions | |
enh | +0.953 |
practice | +0.920 |
adapt | +0.884 |
Occupations | +0.872 |
ゴン | +0.870 |
Neg logit contributions | |
zzle | -1.150 |
mble | -1.067 |
uers | -1.025 |
IRE | -1.021 |
reckoning | -0.927 |
Token | They |
Token ID | 1119 |
Feature activation | +8.30e-02 |
Pos logit contributions | |
zzle | +0.551 |
mble | +0.514 |
uers | +0.495 |
IRE | +0.489 |
reckoning | +0.465 |
Neg logit contributions | |
enh | -0.290 |
practice | -0.279 |
Occupations | -0.277 |
adapt | -0.272 |
Provided | -0.266 |
Token | force |
Token ID | 2700 |
Feature activation | +3.54e-01 |
Pos logit contributions | |
zzle | +0.346 |
mble | +0.312 |
uers | +0.303 |
IRE | +0.302 |
unci | +0.274 |
Neg logit contributions | |
enh | -0.352 |
practice | -0.348 |
adapt | -0.335 |
theless | -0.329 |
Occupations | -0.324 |
Token | him |
Token ID | 683 |
Feature activation | -5.68e-01 |
Pos logit contributions | |
zzle | +1.699 |
mble | +1.545 |
uers | +1.509 |
IRE | +1.504 |
reckoning | +1.387 |
Neg logit contributions | |
enh | -1.307 |
practice | -1.264 |
Occupations | -1.224 |
adapt | -1.220 |
ゴン | -1.207 |
Token | s |
Token ID | 82 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
enh | +2.452 |
practice | +2.412 |
adapt | +2.298 |
Occupations | +2.206 |
Provided | +2.193 |
Neg logit contributions | |
zzle | -3.455 |
mble | -3.098 |
IRE | -3.036 |
uers | -3.014 |
reckoning | -2.902 |
Token | six |
Token ID | 2237 |
Feature activation | -4.56e-01 |
Pos logit contributions | |
enh | +0.881 |
practice | +0.871 |
adapt | +0.832 |
Occupations | +0.830 |
theless | +0.819 |
Neg logit contributions | |
zzle | -1.137 |
mble | -1.014 |
IRE | -0.982 |
uers | -0.982 |
reckoning | -0.908 |
Token | career |
Token ID | 3451 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
practice | +1.566 |
enh | +1.559 |
Occupations | +1.492 |
adapt | +1.477 |
theless | +1.456 |
Neg logit contributions | |
zzle | -2.258 |
mble | -2.038 |
IRE | -1.993 |
uers | -1.969 |
reckoning | -1.875 |
Token | playoff |
Token ID | 13119 |
Feature activation | -9.28e-01 |
Pos logit contributions | |
enh | +4.794 |
Occupations | +4.755 |
practice | +4.747 |
Provided | +4.511 |
standard | +4.490 |
Neg logit contributions | |
zzle | -5.478 |
mble | -4.876 |
IRE | -4.767 |
uers | -4.689 |
unci | -4.340 |
Token | game |
Token ID | 983 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
enh | +2.776 |
practice | +2.710 |
Occupations | +2.586 |
adapt | +2.584 |
theless | +2.559 |
Neg logit contributions | |
zzle | -4.963 |
mble | -4.433 |
uers | -4.280 |
IRE | -4.271 |
unci | -4.031 |
Token | - |
Token ID | 12 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
enh | +4.166 |
practice | +4.098 |
Occupations | +3.872 |
adapt | +3.864 |
theless | +3.806 |
Neg logit contributions | |
zzle | -6.021 |
mble | -5.287 |
IRE | -5.244 |
uers | -5.219 |
unci | -4.880 |
Token | win |
Token ID | 5404 |
Feature activation | -6.23e-01 |
Pos logit contributions | |
enh | +5.562 |
practice | +5.159 |
adapt | +4.418 |
standard | +4.414 |
only | +3.993 |
Neg logit contributions | |
zzle | -20.185 |
mble | -19.055 |
IRE | -19.045 |
uers | -18.303 |
millenn | -18.222 |
Token | ners |
Token ID | 2741 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
enh | +2.307 |
practice | +2.278 |
adapt | +2.217 |
abil | +2.148 |
Occupations | +2.139 |
Neg logit contributions | |
zzle | -2.899 |
IRE | -2.615 |
mble | -2.564 |
uers | -2.499 |
reckoning | -2.371 |
Token | are |
Token ID | 389 |
Feature activation | +7.93e-01 |
Pos logit contributions | |
enh | +0.073 |
practice | +0.072 |
Occupations | +0.069 |
adapt | +0.068 |
theless | +0.067 |
Neg logit contributions | |
zzle | -0.082 |
mble | -0.073 |
IRE | -0.072 |
uers | -0.071 |
reckoning | -0.065 |
Token | tied |
Token ID | 8165 |
Feature activation | -8.27e-01 |
Pos logit contributions | |
zzle | +3.602 |
mble | +3.211 |
IRE | +3.135 |
uers | +3.131 |
reckoning | +2.883 |
Neg logit contributions | |
enh | -3.129 |
practice | -3.108 |
adapt | -2.993 |
Occupations | -2.967 |
ゴン | -2.920 |
Token | for |
Token ID | 329 |
Feature activation | -3.24e-01 |
Pos logit contributions | |
enh | +2.675 |
practice | +2.607 |
adapt | +2.479 |
Occupations | +2.455 |
ゴン | +2.379 |
Neg logit contributions | |
zzle | -4.237 |
mble | -3.836 |
IRE | -3.785 |
uers | -3.642 |
reckoning | -3.500 |
Token | February |
Token ID | 3945 |
Feature activation | +3.40e-01 |
Pos logit contributions | |
zzle | +1.886 |
mble | +1.689 |
IRE | +1.660 |
uers | +1.647 |
reckoning | +1.508 |
Neg logit contributions | |
enh | -1.591 |
practice | -1.567 |
adapt | -1.517 |
Occupations | -1.471 |
theless | -1.448 |
Token | , |
Token ID | 11 |
Feature activation | +9.60e-01 |
Pos logit contributions | |
zzle | +1.586 |
mble | +1.421 |
uers | +1.396 |
IRE | +1.391 |
reckoning | +1.280 |
Neg logit contributions | |
enh | -1.300 |
practice | -1.254 |
adapt | -1.227 |
theless | -1.209 |
Occupations | -1.199 |
Token | Munich |
Token ID | 22418 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
zzle | +4.338 |
mble | +3.861 |
IRE | +3.790 |
uers | +3.784 |
reckoning | +3.494 |
Neg logit contributions | |
enh | -3.817 |
practice | -3.740 |
adapt | -3.655 |
Occupations | -3.581 |
theless | -3.560 |
Token | design |
Token ID | 1486 |
Feature activation | +5.56e-01 |
Pos logit contributions | |
enh | +5.451 |
adapt | +4.918 |
practice | +4.899 |
theless | +4.882 |
Provided | +4.872 |
Neg logit contributions | |
zzle | -6.340 |
mble | -5.672 |
uers | -5.567 |
IRE | -5.523 |
reckoning | -4.936 |
Token | student |
Token ID | 3710 |
Feature activation | -3.20e-02 |
Pos logit contributions | |
zzle | +2.613 |
mble | +2.326 |
IRE | +2.309 |
uers | +2.282 |
reckoning | +2.130 |
Neg logit contributions | |
enh | -2.108 |
practice | -2.077 |
adapt | -1.998 |
ゴン | -1.965 |
Occupations | -1.954 |
Token | Mor |
Token ID | 3461 |
Feature activation | -3.40e+00 |
Pos logit contributions | |
enh | +0.114 |
practice | +0.110 |
adapt | +0.107 |
Occupations | +0.107 |
odor | +0.105 |
Neg logit contributions | |
zzle | -0.158 |
mble | -0.141 |
IRE | -0.140 |
uers | -0.139 |
reckoning | -0.127 |
Token | itz |
Token ID | 4224 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
enh | +10.179 |
bid | +9.810 |
practice | +9.492 |
odor | +9.462 |
adapt | +9.183 |
Neg logit contributions | |
zzle | -14.658 |
IRE | -14.123 |
mble | -13.521 |
uers | -12.546 |
FontSize | -12.467 |
Token | Bre |
Token ID | 3719 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
enh | +3.668 |
practice | +3.397 |
odor | +3.309 |
adapt | +3.300 |
Occupations | +3.219 |
Neg logit contributions | |
zzle | -5.539 |
mble | -4.947 |
IRE | -4.946 |
uers | -4.865 |
reckoning | -4.571 |
Token | it |
Token ID | 270 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
enh | +5.835 |
adapt | +5.496 |
practice | +5.476 |
odor | +5.398 |
bid | +5.167 |
Neg logit contributions | |
zzle | -6.049 |
IRE | -5.849 |
mble | -5.477 |
reckoning | -5.425 |
respectively | -5.225 |
Token | en |
Token ID | 268 |
Feature activation | -7.24e-01 |
Pos logit contributions | |
enh | +4.864 |
adapt | +4.307 |
practice | +4.149 |
theless | +4.104 |
odor | +3.998 |
Neg logit contributions | |
zzle | -6.215 |
IRE | -5.698 |
mble | -5.552 |
uers | -5.508 |
reckoning | -5.198 |
Token | hu |
Token ID | 13415 |
Feature activation | +9.56e-01 |
Pos logit contributions | |
enh | +2.623 |
practice | +2.402 |
adapt | +2.387 |
theless | +2.317 |
bid | +2.265 |
Neg logit contributions | |
zzle | -3.537 |
IRE | -3.180 |
mble | -3.178 |
uers | -3.165 |
reckoning | -2.941 |
Token |
|
Token ID | 198 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
enh | +0.409 |
Occupations | +0.402 |
practice | +0.401 |
adapt | +0.386 |
Provided | +0.376 |
Neg logit contributions | |
zzle | -0.851 |
mble | -0.801 |
uers | -0.771 |
IRE | -0.762 |
reckoning | -0.727 |
Token |
|
Token ID | 198 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
zzle | +0.749 |
mble | +0.714 |
uers | +0.677 |
IRE | +0.672 |
reckoning | +0.640 |
Neg logit contributions | |
enh | -0.405 |
practice | -0.401 |
adapt | -0.384 |
Occupations | -0.365 |
odor | -0.360 |
Token | Hist |
Token ID | 13749 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
zzle | +1.379 |
mble | +1.276 |
uers | +1.222 |
IRE | +1.196 |
reckoning | +1.151 |
Neg logit contributions | |
enh | -1.113 |
practice | -1.105 |
adapt | -1.069 |
Occupations | -1.023 |
odor | -1.017 |
Token | orian |
Token ID | 22618 |
Feature activation | -6.04e-01 |
Pos logit contributions | |
enh | +5.110 |
practice | +4.804 |
adapt | +4.678 |
odor | +4.478 |
Occupations | +4.431 |
Neg logit contributions | |
zzle | -9.741 |
IRE | -8.735 |
mble | -8.531 |
uers | -8.149 |
reckoning | -8.098 |
Token | Regina |
Token ID | 38739 |
Feature activation | +3.05e-02 |
Pos logit contributions | |
enh | +2.187 |
practice | +2.112 |
Occupations | +2.060 |
adapt | +2.031 |
odor | +2.000 |
Neg logit contributions | |
zzle | -2.876 |
mble | -2.627 |
IRE | -2.567 |
uers | -2.547 |
reckoning | -2.297 |
Token | Mor |
Token ID | 3461 |
Feature activation | -3.39e+00 |
Pos logit contributions | |
zzle | +0.156 |
mble | +0.143 |
uers | +0.139 |
IRE | +0.139 |
reckoning | +0.130 |
Neg logit contributions | |
enh | -0.102 |
practice | -0.099 |
Occupations | -0.096 |
adapt | -0.096 |
odor | -0.094 |
Token | antz |
Token ID | 46269 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
enh | +11.899 |
practice | +11.452 |
bid | +11.422 |
adapt | +11.076 |
oney | +10.799 |
Neg logit contributions | |
zzle | -12.744 |
IRE | -12.505 |
mble | -11.723 |
millenn | -11.198 |
uers | -11.150 |
Token | highlighted |
Token ID | 14537 |
Feature activation | -7.38e-01 |
Pos logit contributions | |
enh | +0.411 |
practice | +0.390 |
adapt | +0.380 |
Occupations | +0.375 |
odor | +0.373 |
Neg logit contributions | |
zzle | -0.464 |
mble | -0.422 |
IRE | -0.414 |
uers | -0.411 |
reckoning | -0.376 |
Token | the |
Token ID | 262 |
Feature activation | -9.17e-01 |
Pos logit contributions | |
enh | +2.966 |
practice | +2.938 |
Occupations | +2.846 |
adapt | +2.825 |
odor | +2.756 |
Neg logit contributions | |
zzle | -3.151 |
mble | -2.865 |
IRE | -2.828 |
uers | -2.779 |
reckoning | -2.549 |
Token | fear |
Token ID | 3252 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
practice | +3.544 |
enh | +3.512 |
odor | +3.385 |
Occupations | +3.380 |
adapt | +3.337 |
Neg logit contributions | |
zzle | -4.060 |
mble | -3.733 |
IRE | -3.574 |
uers | -3.568 |
reckoning | -3.160 |
Token | underlying |
Token ID | 10238 |
Feature activation | +5.11e-01 |
Pos logit contributions | |
zzle | +1.133 |
mble | +1.034 |
uers | +1.010 |
IRE | +0.995 |
reckoning | +0.901 |
Neg logit contributions | |
enh | -1.292 |
practice | -1.279 |
adapt | -1.228 |
Occupations | -1.219 |
odor | -1.204 |
Token | another |
Token ID | 1194 |
Feature activation | +4.35e-01 |
Pos logit contributions | |
zzle | +0.171 |
mble | +0.159 |
uers | +0.153 |
IRE | +0.152 |
reckoning | +0.136 |
Neg logit contributions | |
enh | -0.173 |
practice | -0.170 |
adapt | -0.165 |
Occupations | -0.164 |
odor | -0.161 |
Token | way |
Token ID | 835 |
Feature activation | -4.26e-02 |
Pos logit contributions | |
zzle | +2.042 |
mble | +1.874 |
uers | +1.837 |
IRE | +1.832 |
reckoning | +1.631 |
Neg logit contributions | |
enh | -1.634 |
practice | -1.597 |
adapt | -1.533 |
Occupations | -1.530 |
ゴン | -1.509 |
Token | of |
Token ID | 286 |
Feature activation | +6.27e-01 |
Pos logit contributions | |
enh | +0.207 |
practice | +0.202 |
adapt | +0.198 |
Occupations | +0.197 |
ゴン | +0.195 |
Neg logit contributions | |
zzle | -0.151 |
mble | -0.136 |
IRE | -0.131 |
uers | -0.130 |
reckoning | -0.113 |
Token | saying |
Token ID | 2282 |
Feature activation | +4.40e-01 |
Pos logit contributions | |
zzle | +2.031 |
mble | +1.782 |
IRE | +1.728 |
uers | +1.696 |
htar | +1.408 |
Neg logit contributions | |
enh | -3.293 |
practice | -3.243 |
adapt | -3.163 |
Occupations | -3.133 |
theless | -3.121 |
Token | the |
Token ID | 262 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
zzle | +2.062 |
mble | +1.844 |
uers | +1.825 |
IRE | +1.825 |
reckoning | +1.675 |
Neg logit contributions | |
enh | -1.648 |
practice | -1.637 |
adapt | -1.575 |
Occupations | -1.559 |
theless | -1.532 |
Token | beginning |
Token ID | 3726 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
enh | +1.226 |
practice | +1.201 |
odor | +1.176 |
Occupations | +1.153 |
adapt | +1.152 |
Neg logit contributions | |
zzle | -1.434 |
mble | -1.283 |
uers | -1.247 |
IRE | -1.233 |
htar | -1.120 |
Token | of |
Token ID | 286 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
zzle | +6.916 |
mble | +5.969 |
uers | +5.848 |
IRE | +5.825 |
reckoning | +5.438 |
Neg logit contributions | |
enh | -9.063 |
practice | -9.010 |
adapt | -8.780 |
ゴン | -8.716 |
Occupations | -8.634 |
Token | the |
Token ID | 262 |
Feature activation | +7.94e-01 |
Pos logit contributions | |
zzle | +6.178 |
mble | +5.437 |
uers | +5.344 |
IRE | +5.331 |
reckoning | +4.949 |
Neg logit contributions | |
enh | -6.475 |
practice | -6.418 |
adapt | -6.234 |
ゴン | -6.174 |
Occupations | -6.143 |
Token | end |
Token ID | 886 |
Feature activation | +7.85e-01 |
Pos logit contributions | |
zzle | +3.619 |
mble | +3.213 |
uers | +3.157 |
IRE | +3.149 |
reckoning | +2.847 |
Neg logit contributions | |
enh | -3.129 |
practice | -3.079 |
adapt | -2.988 |
Occupations | -2.960 |
ゴン | -2.929 |
Token | . |
Token ID | 13 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
zzle | +3.004 |
mble | +2.626 |
IRE | +2.564 |
uers | +2.553 |
reckoning | +2.310 |
Neg logit contributions | |
enh | -3.650 |
practice | -3.604 |
adapt | -3.505 |
ゴン | -3.458 |
Occupations | -3.457 |
Token |
|
Token ID | 198 |
Feature activation | +3.66e-01 |
Pos logit contributions | |
zzle | +1.176 |
mble | +1.080 |
uers | +1.053 |
IRE | +1.037 |
reckoning | +0.982 |
Neg logit contributions | |
enh | -0.646 |
practice | -0.629 |
Occupations | -0.620 |
adapt | -0.611 |
Provided | -0.592 |
Token | in |
Token ID | 287 |
Feature activation | +2.02e-01 |
Pos logit contributions | |
enh | +0.625 |
practice | +0.602 |
adapt | +0.592 |
Occupations | +0.589 |
theless | +0.585 |
Neg logit contributions | |
zzle | -0.802 |
mble | -0.734 |
IRE | -0.720 |
uers | -0.709 |
unci | -0.643 |
Token | May |
Token ID | 1737 |
Feature activation | -5.33e-01 |
Pos logit contributions | |
zzle | +0.802 |
mble | +0.720 |
uers | +0.705 |
IRE | +0.699 |
reckoning | +0.615 |
Neg logit contributions | |
practice | -0.898 |
enh | -0.896 |
adapt | -0.867 |
Occupations | -0.845 |
odor | -0.842 |
Token | became |
Token ID | 2627 |
Feature activation | +5.95e-01 |
Pos logit contributions | |
enh | +2.066 |
practice | +1.981 |
theless | +1.951 |
Provided | +1.927 |
bid | +1.919 |
Neg logit contributions | |
zzle | -2.325 |
mble | -2.195 |
IRE | -2.100 |
uers | -2.075 |
reckoning | -1.831 |
Token | the |
Token ID | 262 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
zzle | +2.478 |
mble | +2.210 |
IRE | +2.150 |
uers | +2.138 |
reckoning | +1.954 |
Neg logit contributions | |
enh | -2.546 |
practice | -2.523 |
adapt | -2.455 |
Occupations | -2.427 |
theless | -2.408 |
Token | most |
Token ID | 749 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
practice | +0.641 |
enh | +0.640 |
Occupations | +0.610 |
odor | +0.606 |
adapt | +0.603 |
Neg logit contributions | |
zzle | -0.811 |
IRE | -0.723 |
mble | -0.722 |
uers | -0.706 |
unci | -0.648 |
Token | expensive |
Token ID | 5789 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
zzle | +5.934 |
mble | +5.334 |
uers | +5.246 |
IRE | +5.233 |
reckoning | +4.853 |
Neg logit contributions | |
enh | -4.614 |
practice | -4.556 |
adapt | -4.398 |
Occupations | -4.330 |
ゴン | -4.322 |
Token | congressional |
Token ID | 11702 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
zzle | +6.718 |
mble | +5.869 |
uers | +5.766 |
IRE | +5.761 |
reckoning | +5.367 |
Neg logit contributions | |
enh | -7.201 |
practice | -7.119 |
adapt | -6.947 |
ゴン | -6.916 |
Occupations | -6.822 |
Token | election |
Token ID | 3071 |
Feature activation | +9.64e-01 |
Pos logit contributions | |
zzle | +4.893 |
mble | +4.120 |
uers | +4.022 |
IRE | +4.010 |
reckoning | +3.582 |
Neg logit contributions | |
enh | -8.261 |
practice | -8.198 |
adapt | -8.006 |
ゴン | -7.933 |
Occupations | -7.913 |
Token | ever |
Token ID | 1683 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
zzle | +4.105 |
mble | +3.653 |
uers | +3.581 |
IRE | +3.581 |
reckoning | +3.249 |
Neg logit contributions | |
enh | -4.048 |
practice | -4.024 |
adapt | -3.884 |
Occupations | -3.829 |
ゴン | -3.821 |
Token | . |
Token ID | 13 |
Feature activation | -2.44e-02 |
Pos logit contributions | |
enh | +0.875 |
practice | +0.871 |
adapt | +0.837 |
theless | +0.830 |
Occupations | +0.824 |
Neg logit contributions | |
zzle | -1.083 |
mble | -0.997 |
IRE | -0.984 |
uers | -0.972 |
unci | -0.853 |
Token | With |
Token ID | 2080 |
Feature activation | +9.70e-01 |
Pos logit contributions | |
enh | +0.070 |
practice | +0.069 |
Occupations | +0.068 |
Provided | +0.066 |
adapt | +0.065 |
Neg logit contributions | |
zzle | -0.137 |
mble | -0.128 |
uers | -0.124 |
IRE | -0.122 |
reckoning | -0.115 |
Token | Cape |
Token ID | 15725 |
Feature activation | -6.12e-01 |
Pos logit contributions | |
enh | +1.606 |
practice | +1.572 |
adapt | +1.470 |
Occupations | +1.447 |
odor | +1.432 |
Neg logit contributions | |
zzle | -2.147 |
mble | -1.965 |
uers | -1.918 |
IRE | -1.897 |
reckoning | -1.755 |
Token | llo |
Token ID | 18798 |
Feature activation | -8.97e-02 |
Pos logit contributions | |
enh | +3.311 |
practice | +3.297 |
odor | +3.216 |
adapt | +3.184 |
Occupations | +3.090 |
Neg logit contributions | |
zzle | -1.739 |
mble | -1.483 |
IRE | -1.424 |
uers | -1.373 |
reckoning | -1.309 |
Token | 's |
Token ID | 338 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
enh | +0.325 |
practice | +0.321 |
adapt | +0.301 |
odor | +0.294 |
Occupations | +0.293 |
Neg logit contributions | |
zzle | -0.433 |
mble | -0.399 |
IRE | -0.390 |
uers | -0.387 |
unci | -0.347 |
Token | thoughts |
Token ID | 6066 |
Feature activation | +5.66e-01 |
Pos logit contributions | |
zzle | +1.258 |
mble | +1.089 |
IRE | +1.073 |
uers | +1.071 |
unci | +0.938 |
Neg logit contributions | |
practice | -1.417 |
enh | -1.414 |
adapt | -1.359 |
Occupations | -1.351 |
odor | -1.335 |
Token | ," |
Token ID | 553 |
Feature activation | +7.74e-01 |
Pos logit contributions | |
zzle | +2.497 |
mble | +2.235 |
IRE | +2.222 |
uers | +2.207 |
reckoning | +2.004 |
Neg logit contributions | |
enh | -2.300 |
practice | -2.264 |
adapt | -2.185 |
Occupations | -2.139 |
ゴン | -2.122 |
Token | said |
Token ID | 531 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
zzle | +3.197 |
mble | +2.851 |
IRE | +2.795 |
uers | +2.779 |
reckoning | +2.531 |
Neg logit contributions | |
enh | -3.373 |
practice | -3.315 |
adapt | -3.219 |
theless | -3.158 |
Occupations | -3.152 |
Token | Bruce |
Token ID | 11088 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
zzle | +8.094 |
mble | +7.274 |
uers | +7.188 |
IRE | +7.138 |
reckoning | +6.729 |
Neg logit contributions | |
enh | -5.643 |
practice | -5.607 |
adapt | -5.404 |
ゴン | -5.378 |
Occupations | -5.312 |
Token | . |
Token ID | 13 |
Feature activation | -2.19e-01 |
Pos logit contributions | |
enh | +0.551 |
practice | +0.539 |
adapt | +0.513 |
bid | +0.508 |
theless | +0.504 |
Neg logit contributions | |
zzle | -0.697 |
mble | -0.651 |
IRE | -0.625 |
uers | -0.623 |
reckoning | -0.550 |
Token | " |
Token ID | 366 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
enh | +0.752 |
practice | +0.744 |
adapt | +0.715 |
Occupations | +0.701 |
ゴン | +0.697 |
Neg logit contributions | |
zzle | -1.096 |
mble | -0.987 |
IRE | -0.973 |
uers | -0.972 |
reckoning | -0.910 |
Token | He |
Token ID | 1544 |
Feature activation | -8.68e-01 |
Pos logit contributions | |
enh | +0.044 |
practice | +0.044 |
adapt | +0.042 |
odor | +0.040 |
Occupations | +0.040 |
Neg logit contributions | |
zzle | -0.054 |
mble | -0.050 |
uers | -0.047 |
IRE | -0.046 |
reckoning | -0.045 |
Token | 's |
Token ID | 338 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
enh | +3.065 |
practice | +2.957 |
adapt | +2.794 |
theless | +2.793 |
bid | +2.712 |
Neg logit contributions | |
zzle | -4.097 |
mble | -3.895 |
IRE | -3.778 |
uers | -3.664 |
reckoning | -3.315 |
Token | along |
Token ID | 1863 |
Feature activation | -5.77e-01 |
Pos logit contributions | |
enh | +0.690 |
practice | +0.678 |
adapt | +0.646 |
theless | +0.624 |
Occupations | +0.621 |
Neg logit contributions | |
zzle | -0.855 |
mble | -0.804 |
uers | -0.785 |
IRE | -0.779 |
unci | -0.689 |
Token | the |
Token ID | 262 |
Feature activation | -4.39e-01 |
Pos logit contributions | |
enh | +2.236 |
practice | +2.206 |
adapt | +2.193 |
Occupations | +2.191 |
theless | +2.168 |
Neg logit contributions | |
zzle | -2.522 |
mble | -2.229 |
uers | -2.162 |
IRE | -2.121 |
reckoning | -1.988 |
Token | front |
Token ID | 2166 |
Feature activation | +6.93e-01 |
Pos logit contributions | |
enh | +1.632 |
practice | +1.602 |
Occupations | +1.581 |
adapt | +1.578 |
odor | +1.561 |
Neg logit contributions | |
zzle | -2.016 |
mble | -1.833 |
uers | -1.755 |
IRE | -1.724 |
reckoning | -1.582 |
Token | iers |
Token ID | 3183 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
zzle | +3.580 |
mble | +3.285 |
IRE | +3.163 |
uers | +3.163 |
reckoning | +2.974 |
Neg logit contributions | |
enh | -2.338 |
practice | -2.258 |
adapt | -2.206 |
Occupations | -2.159 |
theless | -2.099 |
Token | of |
Token ID | 286 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
zzle | +4.170 |
mble | +3.639 |
uers | +3.516 |
IRE | +3.480 |
reckoning | +3.098 |
Neg logit contributions | |
enh | -6.185 |
practice | -6.091 |
adapt | -5.960 |
Occupations | -5.879 |
ゴン | -5.847 |
Token | Armenian |
Token ID | 29388 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
zzle | +6.221 |
mble | +5.498 |
uers | +5.407 |
IRE | +5.396 |
reckoning | +4.987 |
Neg logit contributions | |
enh | -6.096 |
practice | -6.039 |
adapt | -5.856 |
ゴン | -5.786 |
Occupations | -5.771 |
Token | freedom |
Token ID | 4925 |
Feature activation | -2.95e-01 |
Pos logit contributions | |
zzle | +7.503 |
mble | +6.694 |
IRE | +6.601 |
uers | +6.598 |
reckoning | +6.171 |
Neg logit contributions | |
enh | -6.190 |
practice | -6.125 |
adapt | -5.930 |
ゴン | -5.877 |
Occupations | -5.829 |
Token |
|
Token ID | 198 |
Feature activation | +4.22e-01 |
Pos logit contributions | |
enh | +1.105 |
practice | +1.071 |
adapt | +1.017 |
Occupations | +0.988 |
bid | +0.984 |
Neg logit contributions | |
zzle | -1.370 |
mble | -1.279 |
uers | -1.246 |
IRE | -1.209 |
unci | -1.118 |
Token |
|
Token ID | 198 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
zzle | +2.274 |
mble | +2.135 |
uers | +2.046 |
IRE | +2.029 |
reckoning | +1.923 |
Neg logit contributions | |
enh | -1.321 |
practice | -1.304 |
adapt | -1.252 |
Occupations | -1.196 |
odor | -1.175 |
Token | But |
Token ID | 1537 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
zzle | +1.998 |
mble | +1.839 |
uers | +1.798 |
IRE | +1.775 |
reckoning | +1.676 |
Neg logit contributions | |
enh | -1.329 |
practice | -1.312 |
adapt | -1.263 |
odor | -1.192 |
ゴン | -1.188 |
Token | the |
Token ID | 262 |
Feature activation | -4.65e-01 |
Pos logit contributions | |
enh | +1.086 |
practice | +1.072 |
adapt | +1.049 |
theless | +1.041 |
Occupations | +1.030 |
Neg logit contributions | |
zzle | -1.048 |
mble | -0.936 |
uers | -0.918 |
IRE | -0.915 |
unci | -0.809 |
Token | hit |
Token ID | 2277 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
practice | +1.707 |
enh | +1.700 |
adapt | +1.620 |
Occupations | +1.578 |
theless | +1.578 |
Neg logit contributions | |
zzle | -2.418 |
mble | -2.157 |
uers | -2.140 |
IRE | -2.134 |
htar | -1.895 |
Token | just |
Token ID | 655 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
practice | +1.111 |
enh | +1.098 |
adapt | +1.054 |
Occupations | +1.045 |
theless | +1.039 |
Neg logit contributions | |
zzle | -1.165 |
mble | -1.044 |
uers | -1.015 |
IRE | -1.005 |
reckoning | -0.901 |
Token | as |
Token ID | 355 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
zzle | +0.846 |
mble | +0.786 |
uers | +0.761 |
IRE | +0.753 |
reckoning | +0.682 |
Neg logit contributions | |
enh | -0.670 |
practice | -0.670 |
adapt | -0.646 |
theless | -0.632 |
Occupations | -0.625 |
Token | Donald |
Token ID | 3759 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
zzle | +2.558 |
mble | +2.291 |
uers | +2.239 |
IRE | +2.199 |
reckoning | +2.012 |
Neg logit contributions | |
practice | -2.308 |
enh | -2.294 |
adapt | -2.195 |
theless | -2.164 |
Occupations | -2.162 |
Token | Trump |
Token ID | 1301 |
Feature activation | +3.06e-01 |
Pos logit contributions | |
zzle | +1.273 |
mble | +1.116 |
uers | +1.098 |
IRE | +1.095 |
reckoning | +1.013 |
Neg logit contributions | |
enh | -1.373 |
practice | -1.362 |
adapt | -1.323 |
ゴン | -1.312 |
Occupations | -1.307 |
Token | is |
Token ID | 318 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
zzle | +1.422 |
mble | +1.286 |
IRE | +1.248 |
uers | +1.247 |
reckoning | +1.134 |
Neg logit contributions | |
enh | -1.184 |
practice | -1.151 |
adapt | -1.111 |
theless | -1.101 |
Occupations | -1.077 |
Token | wreck |
Token ID | 15228 |
Feature activation | -9.39e-01 |
Pos logit contributions | |
zzle | +8.213 |
mble | +7.040 |
uers | +6.972 |
IRE | +6.953 |
reckoning | +6.530 |
Neg logit contributions | |
enh | -10.172 |
practice | -10.128 |
adapt | -9.865 |
ゴン | -9.861 |
Occupations | -9.778 |
Token | ing |
Token ID | 278 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
enh | +2.606 |
practice | +2.500 |
adapt | +2.361 |
abil | +2.287 |
odor | +2.197 |
Neg logit contributions | |
zzle | -5.308 |
mble | -4.997 |
IRE | -4.805 |
uers | -4.712 |
reckoning | -4.343 |
Token | the |
Token ID | 262 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
zzle | +1.710 |
mble | +1.507 |
uers | +1.485 |
IRE | +1.465 |
reckoning | +1.342 |
Neg logit contributions | |
practice | -1.486 |
enh | -1.477 |
adapt | -1.398 |
Occupations | -1.388 |
ゴン | -1.371 |
Token | GOP |
Token ID | 6796 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
zzle | +0.830 |
uers | +0.716 |
mble | +0.709 |
IRE | +0.705 |
reckoning | +0.631 |
Neg logit contributions | |
enh | -0.781 |
practice | -0.771 |
Occupations | -0.734 |
adapt | -0.731 |
odor | -0.715 |
Token | � |
Token ID | 447 |
Feature activation | +5.34e-01 |
Pos logit contributions | |
zzle | +5.638 |
mble | +4.986 |
uers | +4.907 |
IRE | +4.885 |
reckoning | +4.512 |
Neg logit contributions | |
enh | -5.299 |
practice | -5.246 |
adapt | -5.075 |
Occupations | -5.000 |
ゴン | -4.999 |
Token | not |
Token ID | 407 |
Feature activation | -4.83e-01 |
Pos logit contributions | |
zzle | +8.520 |
mble | +7.517 |
uers | +7.418 |
IRE | +7.390 |
reckoning | +6.880 |
Neg logit contributions | |
enh | -7.979 |
practice | -7.947 |
ゴン | -7.841 |
adapt | -7.696 |
Occupations | -7.690 |
Token | be |
Token ID | 307 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
enh | +1.943 |
practice | +1.900 |
adapt | +1.834 |
bid | +1.806 |
theless | +1.788 |
Neg logit contributions | |
zzle | -2.057 |
mble | -1.891 |
IRE | -1.843 |
uers | -1.833 |
reckoning | -1.661 |
Token | able |
Token ID | 1498 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
zzle | +4.033 |
mble | +3.517 |
IRE | +3.429 |
uers | +3.423 |
reckoning | +3.088 |
Neg logit contributions | |
enh | -5.216 |
practice | -5.142 |
adapt | -5.019 |
Occupations | -4.941 |
ゴン | -4.934 |
Token | to |
Token ID | 284 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
enh | +1.472 |
practice | +1.422 |
adapt | +1.376 |
Occupations | +1.320 |
odor | +1.305 |
Neg logit contributions | |
zzle | -1.879 |
mble | -1.759 |
IRE | -1.698 |
uers | -1.668 |
reckoning | -1.528 |
Token | . |
Token ID | 13 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
enh | +0.627 |
practice | +0.611 |
adapt | +0.590 |
theless | +0.563 |
abil | +0.562 |
Neg logit contributions | |
zzle | -0.808 |
mble | -0.744 |
IRE | -0.725 |
uers | -0.715 |
reckoning | -0.666 |
Token | 1 |
Token ID | 16 |
Feature activation | +6.58e-01 |
Pos logit contributions | |
enh | +0.768 |
practice | +0.745 |
adapt | +0.719 |
Provided | +0.716 |
Occupations | +0.699 |
Neg logit contributions | |
zzle | -1.404 |
mble | -1.296 |
uers | -1.269 |
IRE | -1.246 |
reckoning | -1.175 |
Token | . |
Token ID | 13 |
Feature activation | -7.05e-01 |
Pos logit contributions | |
zzle | +3.086 |
mble | +2.765 |
uers | +2.721 |
IRE | +2.713 |
reckoning | +2.531 |
Neg logit contributions | |
enh | -2.498 |
practice | -2.460 |
adapt | -2.381 |
ゴン | -2.329 |
Occupations | -2.324 |
Token | The |
Token ID | 383 |
Feature activation | -5.96e-01 |
Pos logit contributions | |
enh | +2.502 |
adapt | +2.352 |
practice | +2.348 |
Provided | +2.234 |
Occupations | +2.206 |
Neg logit contributions | |
zzle | -3.402 |
mble | -3.159 |
uers | -3.077 |
IRE | -3.026 |
reckoning | -2.852 |
Token | pixels |
Token ID | 17848 |
Feature activation | +5.98e-01 |
Pos logit contributions | |
enh | +2.368 |
practice | +2.245 |
adapt | +2.219 |
Occupations | +2.193 |
Provided | +2.171 |
Neg logit contributions | |
zzle | -2.605 |
mble | -2.353 |
uers | -2.293 |
IRE | -2.241 |
reckoning | -2.073 |
Token | are |
Token ID | 389 |
Feature activation | +6.78e-01 |
Pos logit contributions | |
zzle | +2.490 |
mble | +2.192 |
uers | +2.150 |
IRE | +2.144 |
reckoning | +1.937 |
Neg logit contributions | |
enh | -2.628 |
practice | -2.567 |
adapt | -2.522 |
Occupations | -2.459 |
theless | -2.432 |
Token | large |
Token ID | 1588 |
Feature activation | +4.15e-02 |
Pos logit contributions | |
zzle | +3.069 |
mble | +2.753 |
uers | +2.684 |
IRE | +2.673 |
reckoning | +2.449 |
Neg logit contributions | |
enh | -2.744 |
practice | -2.639 |
adapt | -2.605 |
Occupations | -2.526 |
theless | -2.512 |
Token | ani |
Token ID | 3216 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
enh | +4.453 |
adapt | +4.022 |
practice | +3.972 |
bid | +3.935 |
odor | +3.906 |
Neg logit contributions | |
zzle | -6.266 |
mble | -5.872 |
IRE | -5.809 |
uers | -5.589 |
reckoning | -5.508 |
Token |
|
Token ID | 198 |
Feature activation | -2.03e-01 |
Pos logit contributions | |
zzle | +0.171 |
mble | +0.155 |
IRE | +0.153 |
uers | +0.152 |
reckoning | +0.143 |
Neg logit contributions | |
enh | -0.124 |
practice | -0.119 |
adapt | -0.115 |
Occupations | -0.113 |
ゴン | -0.112 |
Token |
|
Token ID | 198 |
Feature activation | +4.58e-01 |
Pos logit contributions | |
enh | +0.583 |
practice | +0.576 |
adapt | +0.556 |
Occupations | +0.516 |
odor | +0.515 |
Neg logit contributions | |
zzle | -1.141 |
mble | -1.096 |
uers | -1.030 |
IRE | -1.023 |
reckoning | -0.981 |
Token | On |
Token ID | 2202 |
Feature activation | +4.98e-01 |
Pos logit contributions | |
zzle | +2.136 |
mble | +1.956 |
uers | +1.871 |
IRE | +1.829 |
reckoning | +1.777 |
Neg logit contributions | |
enh | -1.787 |
practice | -1.762 |
adapt | -1.716 |
odor | -1.634 |
ゴン | -1.625 |
Token | the |
Token ID | 262 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
zzle | +2.210 |
mble | +1.982 |
IRE | +1.942 |
uers | +1.922 |
reckoning | +1.761 |
Neg logit contributions | |
enh | -2.035 |
practice | -1.998 |
adapt | -1.946 |
Occupations | -1.906 |
theless | -1.884 |
Token | bright |
Token ID | 6016 |
Feature activation | +6.95e-01 |
Pos logit contributions | |
enh | +0.893 |
practice | +0.865 |
adapt | +0.847 |
Occupations | +0.834 |
theless | +0.821 |
Neg logit contributions | |
zzle | -1.318 |
mble | -1.203 |
IRE | -1.157 |
uers | -1.154 |
reckoning | -1.064 |
Token | side |
Token ID | 1735 |
Feature activation | +4.99e-01 |
Pos logit contributions | |
zzle | +3.118 |
mble | +2.777 |
uers | +2.732 |
IRE | +2.718 |
reckoning | +2.475 |
Neg logit contributions | |
enh | -2.822 |
practice | -2.747 |
adapt | -2.683 |
theless | -2.606 |
Occupations | -2.598 |
Token | , |
Token ID | 11 |
Feature activation | +7.92e-01 |
Pos logit contributions | |
zzle | +2.293 |
mble | +2.047 |
uers | +2.015 |
IRE | +2.013 |
reckoning | +1.871 |
Neg logit contributions | |
enh | -1.916 |
practice | -1.894 |
adapt | -1.833 |
ゴン | -1.809 |
Occupations | -1.804 |
Token | growing |
Token ID | 3957 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
zzle | +3.550 |
mble | +3.193 |
IRE | +3.111 |
uers | +3.111 |
reckoning | +2.845 |
Neg logit contributions | |
enh | -3.179 |
practice | -3.118 |
adapt | -3.040 |
Occupations | -2.987 |
theless | -2.955 |
Token | public |
Token ID | 1171 |
Feature activation | +6.27e-01 |
Pos logit contributions | |
zzle | +5.836 |
mble | +5.214 |
uers | +5.140 |
IRE | +5.128 |
reckoning | +4.769 |
Neg logit contributions | |
enh | -4.712 |
practice | -4.663 |
adapt | -4.507 |
ゴン | -4.438 |
Occupations | -4.435 |
Token | awareness |
Token ID | 9359 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
zzle | +2.876 |
mble | +2.549 |
uers | +2.512 |
IRE | +2.479 |
reckoning | +2.242 |
Neg logit contributions | |
enh | -2.481 |
practice | -2.455 |
adapt | -2.385 |
Occupations | -2.328 |
theless | -2.311 |
Token | testing |
Token ID | 4856 |
Feature activation | -4.51e-01 |
Pos logit contributions | |
enh | +5.750 |
practice | +5.662 |
theless | +5.580 |
adapt | +5.452 |
firsthand | +5.426 |
Neg logit contributions | |
zzle | -5.004 |
mble | -4.951 |
IRE | -4.744 |
uers | -4.631 |
htar | -3.826 |
Token | his |
Token ID | 465 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
practice | +1.629 |
enh | +1.618 |
adapt | +1.567 |
firsthand | +1.529 |
Occupations | +1.521 |
Neg logit contributions | |
zzle | -2.127 |
mble | -1.917 |
IRE | -1.882 |
uers | -1.872 |
htar | -1.668 |
Token | tribe |
Token ID | 14893 |
Feature activation | -5.45e-02 |
Pos logit contributions | |
enh | +1.189 |
practice | +1.172 |
adapt | +1.121 |
Occupations | +1.090 |
firsthand | +1.084 |
Neg logit contributions | |
zzle | -1.355 |
mble | -1.220 |
IRE | -1.188 |
uers | -1.163 |
htar | -1.050 |
Token | through |
Token ID | 832 |
Feature activation | -4.80e-01 |
Pos logit contributions | |
enh | +0.203 |
practice | +0.200 |
adapt | +0.194 |
Occupations | +0.185 |
theless | +0.185 |
Neg logit contributions | |
zzle | -0.256 |
mble | -0.235 |
IRE | -0.229 |
uers | -0.228 |
reckoning | -0.208 |
Token | er |
Token ID | 1931 |
Feature activation | +5.23e-01 |
Pos logit contributions | |
practice | +1.881 |
enh | +1.872 |
adapt | +1.768 |
ゴン | +1.736 |
Occupations | +1.733 |
Neg logit contributions | |
zzle | -2.132 |
mble | -1.940 |
IRE | -1.928 |
uers | -1.904 |
htar | -1.683 |
Token | rant |
Token ID | 5250 |
Feature activation | +7.71e-01 |
Pos logit contributions | |
zzle | +2.023 |
mble | +1.776 |
IRE | +1.754 |
uers | +1.697 |
reckoning | +1.574 |
Neg logit contributions | |
enh | -2.429 |
practice | -2.390 |
adapt | -2.308 |
Occupations | -2.262 |
ゴン | -2.261 |
Token | word |
Token ID | 1573 |
Feature activation | +3.64e-01 |
Pos logit contributions | |
zzle | +3.635 |
mble | +3.276 |
IRE | +3.214 |
uers | +3.212 |
reckoning | +2.940 |
Neg logit contributions | |
enh | -2.894 |
practice | -2.879 |
adapt | -2.764 |
Occupations | -2.726 |
ゴン | -2.713 |
Token | and |
Token ID | 290 |
Feature activation | -5.10e-01 |
Pos logit contributions | |
zzle | +1.843 |
mble | +1.684 |
IRE | +1.670 |
uers | +1.649 |
reckoning | +1.516 |
Neg logit contributions | |
enh | -1.243 |
practice | -1.235 |
adapt | -1.182 |
ゴン | -1.131 |
odor | -1.131 |
Token | deed |
Token ID | 28637 |
Feature activation | +8.96e-01 |
Pos logit contributions | |
practice | +1.935 |
enh | +1.924 |
Occupations | +1.761 |
adapt | +1.757 |
firsthand | +1.753 |
Neg logit contributions | |
zzle | -2.312 |
mble | -2.167 |
IRE | -2.123 |
uers | -2.079 |
htar | -1.827 |
Token | . |
Token ID | 13 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
zzle | +3.920 |
mble | +3.502 |
IRE | +3.436 |
uers | +3.432 |
reckoning | +3.162 |
Neg logit contributions | |
enh | -3.647 |
practice | -3.618 |
adapt | -3.489 |
Occupations | -3.442 |
ゴン | -3.436 |
Token | Even |
Token ID | 3412 |
Feature activation | -4.79e-01 |
Pos logit contributions | |
enh | +0.461 |
practice | +0.455 |
Occupations | +0.452 |
adapt | +0.438 |
Provided | +0.434 |
Neg logit contributions | |
zzle | -1.029 |
mble | -0.969 |
uers | -0.934 |
IRE | -0.919 |
reckoning | -0.874 |
Token | credit |
Token ID | 3884 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
zzle | +0.933 |
mble | +0.844 |
IRE | +0.830 |
uers | +0.825 |
reckoning | +0.747 |
Neg logit contributions | |
enh | -0.799 |
practice | -0.770 |
adapt | -0.750 |
Occupations | -0.739 |
theless | -0.722 |
Token | card |
Token ID | 2657 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
enh | +4.114 |
practice | +3.770 |
adapt | +3.652 |
abil | +3.618 |
Provided | +3.563 |
Neg logit contributions | |
zzle | -5.512 |
mble | -5.154 |
IRE | -4.931 |
uers | -4.750 |
htar | -4.393 |
Token | processing |
Token ID | 7587 |
Feature activation | -3.07e-01 |
Pos logit contributions | |
zzle | +0.639 |
mble | +0.578 |
IRE | +0.562 |
uers | +0.558 |
reckoning | +0.504 |
Neg logit contributions | |
enh | -0.551 |
practice | -0.534 |
adapt | -0.519 |
Occupations | -0.508 |
odor | -0.500 |
Token | , |
Token ID | 11 |
Feature activation | +6.87e-02 |
Pos logit contributions | |
enh | +1.085 |
practice | +1.048 |
adapt | +1.010 |
ゴン | +0.994 |
Occupations | +0.990 |
Neg logit contributions | |
zzle | -1.505 |
mble | -1.360 |
IRE | -1.340 |
uers | -1.329 |
reckoning | -1.218 |
Token | and |
Token ID | 290 |
Feature activation | -7.45e-01 |
Pos logit contributions | |
zzle | +0.311 |
mble | +0.280 |
IRE | +0.273 |
uers | +0.273 |
reckoning | +0.247 |
Neg logit contributions | |
enh | -0.271 |
practice | -0.262 |
adapt | -0.256 |
Occupations | -0.252 |
odor | -0.247 |
Token | detailed |
Token ID | 6496 |
Feature activation | +3.14e-02 |
Pos logit contributions | |
enh | +2.886 |
practice | +2.718 |
adapt | +2.674 |
Occupations | +2.626 |
theless | +2.617 |
Neg logit contributions | |
zzle | -3.312 |
mble | -3.009 |
IRE | -2.934 |
uers | -2.911 |
unci | -2.644 |
Token | reporting |
Token ID | 6447 |
Feature activation | -9.20e-05 |
Pos logit contributions | |
zzle | +0.144 |
mble | +0.131 |
IRE | +0.129 |
uers | +0.128 |
htar | +0.116 |
Neg logit contributions | |
enh | -0.120 |
practice | -0.117 |
Occupations | -0.113 |
adapt | -0.113 |
theless | -0.110 |
Token | - |
Token ID | 532 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
enh | +0.000 |
practice | +0.000 |
adapt | +0.000 |
Occupations | +0.000 |
Provided | +0.000 |
Neg logit contributions | |
zzle | -0.000 |
mble | -0.000 |
IRE | -0.000 |
uers | -0.000 |
reckoning | -0.000 |
Token | all |
Token ID | 477 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
enh | +4.529 |
practice | +4.300 |
adapt | +4.160 |
Provided | +4.096 |
Occupations | +4.092 |
Neg logit contributions | |
zzle | -5.205 |
mble | -4.812 |
IRE | -4.645 |
uers | -4.504 |
htar | -4.147 |
Token | bundled |
Token ID | 34358 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
enh | +4.936 |
practice | +4.702 |
Provided | +4.626 |
firsthand | +4.555 |
adapt | +4.514 |
Neg logit contributions | |
zzle | -5.769 |
mble | -5.472 |
IRE | -5.152 |
uers | -5.011 |
htar | -4.560 |
Token | in |
Token ID | 287 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
enh | +4.451 |
practice | +4.213 |
adapt | +4.155 |
Provided | +4.131 |
Occupations | +4.021 |
Neg logit contributions | |
zzle | -4.844 |
mble | -4.269 |
uers | -4.152 |
IRE | -4.150 |
reckoning | -3.802 |
Token | any |
Token ID | 597 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
enh | +0.933 |
practice | +0.904 |
adapt | +0.895 |
Occupations | +0.865 |
Provided | +0.862 |
Neg logit contributions | |
zzle | -1.091 |
mble | -1.018 |
uers | -0.996 |
IRE | -0.985 |
reckoning | -0.907 |
Token | dependencies |
Token ID | 20086 |
Feature activation | -2.20e-01 |
Pos logit contributions | |
enh | +0.514 |
practice | +0.502 |
adapt | +0.498 |
Provided | +0.482 |
Occupations | +0.478 |
Neg logit contributions | |
zzle | -0.521 |
mble | -0.485 |
uers | -0.480 |
IRE | -0.465 |
reckoning | -0.421 |
Token | as |
Token ID | 355 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
enh | +0.895 |
practice | +0.855 |
adapt | +0.850 |
Provided | +0.843 |
theless | +0.825 |
Neg logit contributions | |
zzle | -0.927 |
mble | -0.870 |
uers | -0.835 |
IRE | -0.823 |
reckoning | -0.746 |
Token | needed |
Token ID | 2622 |
Feature activation | -4.32e-02 |
Pos logit contributions | |
zzle | +2.226 |
mble | +2.040 |
uers | +2.008 |
IRE | +1.982 |
reckoning | +1.850 |
Neg logit contributions | |
enh | -2.082 |
practice | -2.038 |
adapt | -2.011 |
Occupations | -1.939 |
theless | -1.920 |
Token | . |
Token ID | 13 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
enh | +0.166 |
practice | +0.161 |
adapt | +0.159 |
Occupations | +0.155 |
theless | +0.154 |
Neg logit contributions | |
zzle | -0.194 |
mble | -0.178 |
uers | -0.176 |
IRE | -0.175 |
reckoning | -0.159 |
Token | Perhaps |
Token ID | 8673 |
Feature activation | +5.95e-01 |
Pos logit contributions | |
zzle | +0.897 |
mble | +0.840 |
uers | +0.821 |
IRE | +0.810 |
reckoning | +0.765 |
Neg logit contributions | |
enh | -0.468 |
practice | -0.456 |
Occupations | -0.442 |
adapt | -0.440 |
Provided | -0.434 |
Token | the |
Token ID | 262 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
zzle | +2.489 |
mble | +2.253 |
uers | +2.194 |
IRE | +2.183 |
reckoning | +1.984 |
Neg logit contributions | |
enh | -2.559 |
practice | -2.504 |
adapt | -2.447 |
Occupations | -2.416 |
theless | -2.405 |
Token | most |
Token ID | 749 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
enh | +0.709 |
practice | +0.697 |
adapt | +0.667 |
odor | +0.666 |
Occupations | +0.657 |
Neg logit contributions | |
zzle | -0.981 |
mble | -0.897 |
IRE | -0.878 |
uers | -0.871 |
reckoning | -0.799 |
Token | popular |
Token ID | 2968 |
Feature activation | +7.97e-01 |
Pos logit contributions | |
zzle | +5.269 |
mble | +4.727 |
uers | +4.640 |
IRE | +4.621 |
reckoning | +4.278 |
Neg logit contributions | |
enh | -4.328 |
practice | -4.259 |
adapt | -4.135 |
Occupations | -4.042 |
ゴン | -4.019 |
Token | is |
Token ID | 318 |
Feature activation | +8.17e-01 |
Pos logit contributions | |
zzle | +3.304 |
mble | +2.973 |
uers | +2.925 |
IRE | +2.910 |
reckoning | +2.617 |
Neg logit contributions | |
enh | -3.459 |
practice | -3.395 |
adapt | -3.285 |
Occupations | -3.272 |
theless | -3.261 |
Token | App |
Token ID | 2034 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
zzle | +3.789 |
mble | +3.431 |
uers | +3.381 |
IRE | +3.359 |
reckoning | +3.103 |
Neg logit contributions | |
enh | -3.113 |
practice | -3.054 |
adapt | -2.988 |
ゴン | -2.928 |
Occupations | -2.926 |
Token | Ichigo |
Token ID | 44547 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
enh | +1.711 |
practice | +1.686 |
adapt | +1.622 |
Occupations | +1.618 |
theless | +1.608 |
Neg logit contributions | |
zzle | -1.710 |
mble | -1.498 |
uers | -1.489 |
IRE | -1.449 |
reckoning | -1.317 |
Token | had |
Token ID | 550 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
zzle | +6.382 |
mble | +5.636 |
uers | +5.565 |
IRE | +5.555 |
reckoning | +5.188 |
Neg logit contributions | |
enh | -5.716 |
practice | -5.687 |
adapt | -5.509 |
ゴン | -5.479 |
Occupations | -5.433 |
Token | managed |
Token ID | 5257 |
Feature activation | -5.57e-01 |
Pos logit contributions | |
zzle | +1.287 |
mble | +1.153 |
uers | +1.130 |
IRE | +1.125 |
reckoning | +1.019 |
Neg logit contributions | |
enh | -1.266 |
practice | -1.248 |
adapt | -1.198 |
theless | -1.187 |
Occupations | -1.178 |
Token | to |
Token ID | 284 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
enh | +2.215 |
practice | +2.201 |
adapt | +2.123 |
ゴン | +2.104 |
Occupations | +2.086 |
Neg logit contributions | |
zzle | -2.425 |
uers | -2.134 |
mble | -2.133 |
IRE | -2.124 |
reckoning | -1.967 |
Token | defeat |
Token ID | 7433 |
Feature activation | -4.04e-01 |
Pos logit contributions | |
practice | +1.167 |
enh | +1.166 |
adapt | +1.107 |
theless | +1.086 |
odor | +1.082 |
Neg logit contributions | |
zzle | -1.156 |
mble | -1.036 |
IRE | -1.028 |
uers | -1.002 |
reckoning | -0.915 |
Token | the |
Token ID | 262 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
enh | +1.521 |
practice | +1.474 |
Occupations | +1.425 |
adapt | +1.416 |
theless | +1.412 |
Neg logit contributions | |
zzle | -1.883 |
mble | -1.673 |
uers | -1.653 |
IRE | -1.643 |
reckoning | -1.513 |
Token | lie |
Token ID | 6486 |
Feature activation | +5.70e-01 |
Pos logit contributions | |
enh | +2.970 |
practice | +2.839 |
odor | +2.796 |
Occupations | +2.763 |
adapt | +2.747 |
Neg logit contributions | |
zzle | -3.432 |
mble | -3.098 |
uers | -3.009 |
IRE | -2.979 |
unci | -2.688 |
Token | uten |
Token ID | 7809 |
Feature activation | +9.52e-02 |
Pos logit contributions | |
zzle | +2.936 |
mble | +2.661 |
IRE | +2.660 |
uers | +2.630 |
reckoning | +2.518 |
Neg logit contributions | |
enh | -1.882 |
practice | -1.810 |
adapt | -1.759 |
ゴン | -1.722 |
odor | -1.721 |
Token | ants |
Token ID | 1187 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
zzle | +0.463 |
mble | +0.418 |
IRE | +0.415 |
uers | +0.398 |
reckoning | +0.386 |
Neg logit contributions | |
enh | -0.348 |
practice | -0.346 |
adapt | -0.329 |
Occupations | -0.313 |
odor | -0.313 |
Token | of |
Token ID | 286 |
Feature activation | +4.67e-01 |
Pos logit contributions | |
zzle | +0.714 |
mble | +0.640 |
uers | +0.624 |
IRE | +0.616 |
reckoning | +0.559 |
Neg logit contributions | |
enh | -0.836 |
practice | -0.821 |
adapt | -0.788 |
Occupations | -0.784 |
ゴン | -0.776 |
Token | the |
Token ID | 262 |
Feature activation | -8.55e-02 |
Pos logit contributions | |
zzle | +2.105 |
mble | +1.870 |
uers | +1.842 |
IRE | +1.827 |
reckoning | +1.679 |
Neg logit contributions | |
enh | -1.858 |
practice | -1.838 |
adapt | -1.768 |
Occupations | -1.757 |
ゴン | -1.741 |
Token | interest |
Token ID | 1393 |
Feature activation | -3.08e-01 |
Pos logit contributions | |
zzle | +1.269 |
mble | +1.163 |
uers | +1.135 |
IRE | +1.133 |
reckoning | +1.038 |
Neg logit contributions | |
enh | -0.854 |
practice | -0.850 |
adapt | -0.795 |
Occupations | -0.774 |
odor | -0.772 |
Token | at |
Token ID | 379 |
Feature activation | -5.30e-01 |
Pos logit contributions | |
enh | +1.134 |
practice | +1.113 |
adapt | +1.058 |
Occupations | +1.043 |
Provided | +1.042 |
Neg logit contributions | |
zzle | -1.399 |
mble | -1.343 |
IRE | -1.290 |
uers | -1.285 |
unci | -1.131 |
Token | Brigham |
Token ID | 37434 |
Feature activation | -8.90e-01 |
Pos logit contributions | |
enh | +2.029 |
practice | +2.015 |
Occupations | +1.979 |
adapt | +1.919 |
Provided | +1.885 |
Neg logit contributions | |
zzle | -2.352 |
mble | -2.112 |
uers | -2.067 |
IRE | -2.048 |
reckoning | -1.916 |
Token | and |
Token ID | 290 |
Feature activation | -6.44e-01 |
Pos logit contributions | |
enh | +2.210 |
practice | +2.170 |
Occupations | +2.149 |
Provided | +1.977 |
theless | +1.904 |
Neg logit contributions | |
zzle | -5.203 |
mble | -4.990 |
uers | -4.760 |
IRE | -4.728 |
htar | -4.385 |
Token | Women |
Token ID | 6926 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
enh | +1.505 |
practice | +1.459 |
Occupations | +1.442 |
bid | +1.268 |
Provided | +1.264 |
Neg logit contributions | |
zzle | -3.970 |
mble | -3.718 |
uers | -3.598 |
IRE | -3.596 |
reckoning | -3.328 |
Token | 's |
Token ID | 338 |
Feature activation | -6.61e-01 |
Pos logit contributions | |
enh | +0.979 |
practice | +0.955 |
Occupations | +0.900 |
adapt | +0.899 |
odor | +0.892 |
Neg logit contributions | |
zzle | -1.374 |
mble | -1.312 |
IRE | -1.267 |
uers | -1.213 |
reckoning | -1.139 |
Token | Hospital |
Token ID | 9256 |
Feature activation | -8.15e-01 |
Pos logit contributions | |
enh | +1.242 |
practice | +1.237 |
Occupations | +1.175 |
adapt | +1.112 |
ゴン | +1.092 |
Neg logit contributions | |
zzle | -4.281 |
mble | -4.012 |
IRE | -3.934 |
uers | -3.880 |
reckoning | -3.658 |
Token | , |
Token ID | 11 |
Feature activation | +8.68e-01 |
Pos logit contributions | |
enh | +3.092 |
practice | +2.973 |
Occupations | +2.827 |
adapt | +2.823 |
Provided | +2.792 |
Neg logit contributions | |
zzle | -3.621 |
uers | -3.367 |
mble | -3.362 |
IRE | -3.320 |
unci | -2.916 |
Token | two |
Token ID | 734 |
Feature activation | +4.10e-01 |
Pos logit contributions | |
zzle | +3.770 |
mble | +3.400 |
IRE | +3.300 |
uers | +3.290 |
reckoning | +2.970 |
Neg logit contributions | |
enh | -3.658 |
practice | -3.580 |
adapt | -3.468 |
Occupations | -3.450 |
ゴン | -3.366 |
Token | miles |
Token ID | 4608 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
zzle | +1.976 |
mble | +1.788 |
IRE | +1.740 |
uers | +1.732 |
reckoning | +1.613 |
Neg logit contributions | |
enh | -1.518 |
practice | -1.492 |
Occupations | -1.441 |
adapt | -1.418 |
ゴン | -1.389 |
Token | from |
Token ID | 422 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
zzle | +1.940 |
mble | +1.738 |
uers | +1.690 |
IRE | +1.680 |
unci | +1.519 |
Neg logit contributions | |
enh | -1.768 |
practice | -1.717 |
adapt | -1.656 |
Occupations | -1.645 |
theless | -1.636 |
Token | new |
Token ID | 649 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
enh | +1.361 |
practice | +1.321 |
adapt | +1.302 |
Occupations | +1.258 |
Provided | +1.243 |
Neg logit contributions | |
zzle | -1.731 |
mble | -1.567 |
uers | -1.561 |
IRE | -1.530 |
htar | -1.391 |
Token | parks |
Token ID | 14860 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
zzle | +0.871 |
mble | +0.787 |
uers | +0.784 |
IRE | +0.775 |
reckoning | +0.717 |
Neg logit contributions | |
enh | -0.540 |
practice | -0.527 |
adapt | -0.513 |
Occupations | -0.502 |
theless | -0.488 |
Token | , |
Token ID | 11 |
Feature activation | +4.78e-01 |
Pos logit contributions | |
enh | +1.022 |
practice | +0.987 |
adapt | +0.969 |
Occupations | +0.939 |
Provided | +0.931 |
Neg logit contributions | |
zzle | -1.262 |
mble | -1.156 |
uers | -1.125 |
IRE | -1.119 |
reckoning | -1.027 |
Token | develop |
Token ID | 1205 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
zzle | +2.128 |
mble | +1.904 |
IRE | +1.857 |
uers | +1.844 |
reckoning | +1.666 |
Neg logit contributions | |
enh | -1.967 |
practice | -1.919 |
adapt | -1.876 |
Occupations | -1.857 |
Provided | -1.818 |
Token | a |
Token ID | 257 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
zzle | +2.065 |
mble | +1.822 |
uers | +1.820 |
IRE | +1.797 |
reckoning | +1.648 |
Neg logit contributions | |
enh | -1.916 |
practice | -1.874 |
adapt | -1.826 |
Occupations | -1.779 |
theless | -1.751 |
Token | park |
Token ID | 3952 |
Feature activation | -5.21e-01 |
Pos logit contributions | |
zzle | +1.176 |
uers | +1.030 |
mble | +1.029 |
IRE | +1.014 |
reckoning | +0.913 |
Neg logit contributions | |
enh | -1.225 |
practice | -1.212 |
adapt | -1.182 |
Occupations | -1.144 |
theless | -1.141 |
Token | or |
Token ID | 393 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
enh | +2.062 |
adapt | +1.965 |
practice | +1.962 |
Occupations | +1.829 |
standard | +1.825 |
Neg logit contributions | |
zzle | -2.372 |
uers | -2.124 |
mble | -2.115 |
IRE | -2.076 |
reckoning | -1.906 |
Token | recreation |
Token ID | 27702 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
zzle | +1.612 |
mble | +1.442 |
uers | +1.432 |
IRE | +1.429 |
reckoning | +1.318 |
Neg logit contributions | |
enh | -1.196 |
practice | -1.161 |
adapt | -1.133 |
Occupations | -1.096 |
theless | -1.067 |
Token | amen |
Token ID | 29448 |
Feature activation | -6.42e-01 |
Pos logit contributions | |
enh | +4.184 |
practice | +4.011 |
adapt | +3.907 |
standard | +3.629 |
Provided | +3.607 |
Neg logit contributions | |
zzle | -5.821 |
uers | -5.286 |
mble | -5.233 |
IRE | -5.204 |
htar | -4.747 |
Token | ity |
Token ID | 414 |
Feature activation | +8.09e-02 |
Pos logit contributions | |
enh | +2.484 |
adapt | +2.381 |
abil | +2.272 |
practice | +2.233 |
bid | +2.224 |
Neg logit contributions | |
zzle | -2.816 |
IRE | -2.708 |
uers | -2.690 |
mble | -2.635 |
htar | -2.541 |
Token | or |
Token ID | 393 |
Feature activation | +8.85e-02 |
Pos logit contributions | |
zzle | +0.379 |
mble | +0.341 |
uers | +0.341 |
IRE | +0.336 |
reckoning | +0.310 |
Neg logit contributions | |
enh | -0.305 |
practice | -0.298 |
adapt | -0.290 |
Occupations | -0.279 |
Provided | -0.276 |
Token | Unfortunately |
Token ID | 8989 |
Feature activation | -9.85e-01 |
Pos logit contributions | |
enh | +0.082 |
practice | +0.080 |
Occupations | +0.079 |
adapt | +0.078 |
Provided | +0.076 |
Neg logit contributions | |
zzle | -0.154 |
mble | -0.144 |
uers | -0.138 |
IRE | -0.138 |
reckoning | -0.129 |
Token | , |
Token ID | 11 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
enh | +3.232 |
practice | +3.107 |
adapt | +3.057 |
Occupations | +2.983 |
odor | +2.970 |
Neg logit contributions | |
zzle | -4.779 |
mble | -4.412 |
IRE | -4.364 |
uers | -4.298 |
reckoning | -3.868 |
Token | Gl |
Token ID | 2671 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
zzle | +1.202 |
mble | +1.090 |
IRE | +1.063 |
uers | +1.048 |
reckoning | +0.944 |
Neg logit contributions | |
enh | -1.102 |
practice | -1.084 |
adapt | -1.052 |
Occupations | -1.049 |
odor | -1.023 |
Token | ü |
Token ID | 9116 |
Feature activation | +1.28e-01 |
Pos logit contributions | |
enh | +4.838 |
practice | +4.428 |
adapt | +4.390 |
odor | +4.228 |
abil | +4.112 |
Neg logit contributions | |
zzle | -6.222 |
mble | -6.120 |
IRE | -6.074 |
millenn | -5.947 |
reckoning | -5.646 |
Token | ck |
Token ID | 694 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
zzle | +0.580 |
mble | +0.545 |
IRE | +0.540 |
uers | +0.518 |
reckoning | +0.491 |
Neg logit contributions | |
enh | -0.495 |
practice | -0.484 |
adapt | -0.468 |
bid | -0.450 |
odor | -0.448 |
Token | doesn |
Token ID | 1595 |
Feature activation | -6.93e-01 |
Pos logit contributions | |
enh | +4.464 |
practice | +4.278 |
adapt | +4.132 |
Occupations | +4.068 |
theless | +4.058 |
Neg logit contributions | |
zzle | -5.771 |
mble | -5.422 |
IRE | -5.290 |
uers | -5.152 |
reckoning | -4.618 |
Token | � |
Token ID | 447 |
Feature activation | +5.98e-01 |
Pos logit contributions | |
enh | +2.534 |
practice | +2.493 |
adapt | +2.464 |
odor | +2.304 |
bid | +2.294 |
Neg logit contributions | |
zzle | -3.225 |
mble | -3.188 |
uers | -2.869 |
millenn | -2.857 |
IRE | -2.848 |
Token | � |
Token ID | 247 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
zzle | +2.672 |
mble | +2.425 |
uers | +2.322 |
IRE | +2.296 |
reckoning | +2.233 |
Neg logit contributions | |
enh | -2.360 |
practice | -2.338 |
adapt | -2.240 |
Occupations | -2.226 |
ゴン | -2.190 |
Token | t |
Token ID | 83 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
enh | +0.356 |
practice | +0.343 |
adapt | +0.326 |
odor | +0.304 |
abil | +0.298 |
Neg logit contributions | |
zzle | -0.819 |
mble | -0.767 |
IRE | -0.756 |
uers | -0.741 |
reckoning | -0.726 |
Token | yet |
Token ID | 1865 |
Feature activation | -7.90e-01 |
Pos logit contributions | |
practice | +5.521 |
enh | +5.504 |
adapt | +5.355 |
bid | +5.163 |
firsthand | +5.144 |
Neg logit contributions | |
zzle | -5.729 |
mble | -5.445 |
IRE | -5.398 |
uers | -5.092 |
�� | -4.663 |
Token | have |
Token ID | 423 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
practice | +3.041 |
enh | +3.034 |
adapt | +2.934 |
bid | +2.802 |
theless | +2.801 |
Neg logit contributions | |
zzle | -3.368 |
mble | -3.077 |
IRE | -3.045 |
uers | -2.957 |
unci | -2.633 |
Token | f |
Token ID | 277 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
enh | +0.963 |
practice | +0.939 |
adapt | +0.929 |
theless | +0.902 |
Occupations | +0.901 |
Neg logit contributions | |
zzle | -1.109 |
mble | -1.005 |
uers | -1.000 |
IRE | -0.982 |
reckoning | -0.895 |
Token | out |
Token ID | 503 |
Feature activation | -2.69e-01 |
Pos logit contributions | |
enh | +3.220 |
adapt | +3.091 |
practice | +3.086 |
theless | +3.000 |
odor | +2.990 |
Neg logit contributions | |
zzle | -3.421 |
mble | -3.155 |
uers | -3.034 |
IRE | -3.007 |
reckoning | -2.732 |
Token | g |
Token ID | 70 |
Feature activation | +6.03e-02 |
Pos logit contributions | |
enh | +0.709 |
practice | +0.689 |
adapt | +0.658 |
Occupations | +0.618 |
odor | +0.615 |
Neg logit contributions | |
zzle | -1.552 |
mble | -1.449 |
IRE | -1.444 |
uers | -1.425 |
reckoning | -1.345 |
Token | assing |
Token ID | 19696 |
Feature activation | -4.92e-01 |
Pos logit contributions | |
zzle | +0.322 |
mble | +0.298 |
IRE | +0.296 |
uers | +0.290 |
reckoning | +0.271 |
Neg logit contributions | |
enh | -0.189 |
practice | -0.186 |
adapt | -0.178 |
Occupations | -0.171 |
odor | -0.168 |
Token | ( |
Token ID | 357 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
enh | +1.749 |
practice | +1.703 |
adapt | +1.668 |
Occupations | +1.622 |
theless | +1.622 |
Neg logit contributions | |
zzle | -2.372 |
mble | -2.131 |
uers | -2.121 |
IRE | -2.113 |
reckoning | -1.902 |
Token | t |
Token ID | 83 |
Feature activation | -8.68e-01 |
Pos logit contributions | |
enh | +3.369 |
practice | +3.258 |
adapt | +3.216 |
odor | +3.012 |
ゴン | +3.004 |
Neg logit contributions | |
zzle | -6.612 |
mble | -6.081 |
uers | -5.998 |
IRE | -5.959 |
reckoning | -5.667 |
Token | ) |
Token ID | 8 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
enh | +3.464 |
practice | +3.389 |
adapt | +3.334 |
ゴン | +3.252 |
Occupations | +3.204 |
Neg logit contributions | |
zzle | -3.755 |
mble | -3.366 |
uers | -3.327 |
IRE | -3.278 |
reckoning | -3.046 |
Token | – |
Token ID | 784 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
enh | +3.743 |
practice | +3.608 |
adapt | +3.593 |
Occupations | +3.446 |
Provided | +3.414 |
Neg logit contributions | |
zzle | -5.264 |
mble | -4.760 |
IRE | -4.697 |
uers | -4.687 |
reckoning | -4.210 |
Token | f |
Token ID | 277 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
enh | +6.266 |
adapt | +6.254 |
practice | +6.023 |
ゴン | +5.897 |
Occupations | +5.810 |
Neg logit contributions | |
zzle | -7.414 |
mble | -6.617 |
uers | -6.572 |
IRE | -6.528 |
reckoning | -5.798 |
Token | absorbed |
Token ID | 19233 |
Feature activation | -3.94e-01 |
Pos logit contributions | |
enh | +4.811 |
adapt | +4.728 |
ゴン | +4.495 |
practice | +4.486 |
theless | +4.479 |
Neg logit contributions | |
zzle | -6.454 |
mble | -5.870 |
uers | -5.792 |
IRE | -5.645 |
reckoning | -5.223 |
Token | ( |
Token ID | 357 |
Feature activation | -9.33e-01 |
Pos logit contributions | |
enh | +1.438 |
practice | +1.412 |
adapt | +1.380 |
ゴン | +1.346 |
Occupations | +1.340 |
Neg logit contributions | |
zzle | -1.884 |
mble | -1.680 |
IRE | -1.663 |
uers | -1.663 |
reckoning | -1.538 |
Token | , |
Token ID | 11 |
Feature activation | +7.98e-02 |
Pos logit contributions | |
enh | +2.705 |
practice | +2.606 |
Occupations | +2.527 |
adapt | +2.476 |
ゴン | +2.424 |
Neg logit contributions | |
zzle | -3.701 |
mble | -3.403 |
uers | -3.352 |
IRE | -3.266 |
reckoning | -3.068 |
Token | a |
Token ID | 257 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
zzle | +0.308 |
mble | +0.279 |
uers | +0.268 |
IRE | +0.268 |
reckoning | +0.237 |
Neg logit contributions | |
enh | -0.367 |
practice | -0.358 |
adapt | -0.355 |
Occupations | -0.349 |
ゴン | -0.342 |
Token | consulting |
Token ID | 18158 |
Feature activation | -8.73e-01 |
Pos logit contributions | |
zzle | +0.054 |
mble | +0.049 |
IRE | +0.048 |
uers | +0.048 |
reckoning | +0.044 |
Neg logit contributions | |
practice | -0.040 |
enh | -0.039 |
adapt | -0.038 |
Occupations | -0.037 |
theless | -0.037 |
Token | group |
Token ID | 1448 |
Feature activation | -6.27e-01 |
Pos logit contributions | |
practice | +2.769 |
enh | +2.656 |
Occupations | +2.547 |
adapt | +2.492 |
Provided | +2.417 |
Neg logit contributions | |
zzle | -4.527 |
mble | -4.155 |
uers | -4.114 |
IRE | -4.009 |
unci | -3.651 |
Token | which |
Token ID | 543 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
enh | +2.464 |
practice | +2.391 |
adapt | +2.339 |
Provided | +2.270 |
Occupations | +2.259 |
Neg logit contributions | |
zzle | -2.745 |
mble | -2.479 |
IRE | -2.436 |
uers | -2.434 |
reckoning | -2.176 |
Token | works |
Token ID | 2499 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
enh | +3.970 |
practice | +3.739 |
adapt | +3.635 |
Occupations | +3.614 |
Provided | +3.564 |
Neg logit contributions | |
zzle | -7.899 |
mble | -7.438 |
IRE | -7.240 |
uers | -7.097 |
reckoning | -6.734 |
Token | for |
Token ID | 329 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
enh | +6.787 |
extensively | +6.632 |
practice | +6.488 |
firsthand | +6.293 |
adapt | +6.197 |
Neg logit contributions | |
zzle | -11.301 |
mble | -10.816 |
uers | -10.193 |
IRE | -10.038 |
reckoning | -9.473 |
Token | foreign |
Token ID | 3215 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
enh | +4.295 |
Occupations | +4.093 |
practice | +4.063 |
adapt | +4.012 |
Provided | +3.932 |
Neg logit contributions | |
zzle | -4.973 |
mble | -4.606 |
uers | -4.418 |
IRE | -4.331 |
reckoning | -4.054 |
Token | governments |
Token ID | 6905 |
Feature activation | -4.59e-01 |
Pos logit contributions | |
enh | +4.666 |
practice | +4.439 |
Occupations | +4.319 |
adapt | +4.314 |
odor | +4.179 |
Neg logit contributions | |
zzle | -6.053 |
mble | -5.477 |
uers | -5.255 |
IRE | -5.146 |
reckoning | -4.762 |
Token | , |
Token ID | 11 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
enh | +1.731 |
practice | +1.660 |
Occupations | +1.609 |
adapt | +1.597 |
Provided | +1.569 |
Neg logit contributions | |
zzle | -2.096 |
mble | -1.980 |
uers | -1.926 |
IRE | -1.886 |
reckoning | -1.741 |
Token | providing |
Token ID | 4955 |
Feature activation | -5.87e-01 |
Pos logit contributions | |
zzle | +0.573 |
mble | +0.536 |
IRE | +0.512 |
uers | +0.508 |
reckoning | +0.462 |
Neg logit contributions | |
enh | -0.497 |
practice | -0.477 |
Occupations | -0.471 |
adapt | -0.464 |
Provided | -0.451 |
Token | Email |
Token ID | 9570 |
Feature activation | +8.45e-01 |
Pos logit contributions | |
zzle | +4.683 |
uers | +3.880 |
mble | +3.820 |
IRE | +3.756 |
reckoning | +3.480 |
Neg logit contributions | |
practice | -6.147 |
enh | -6.066 |
ゴン | -6.062 |
adapt | -5.967 |
theless | -5.877 |
Token | Cancel |
Token ID | 27910 |
Feature activation | -2.91e-01 |
Pos logit contributions | |
zzle | +3.955 |
mble | +3.544 |
uers | +3.491 |
IRE | +3.486 |
reckoning | +3.246 |
Neg logit contributions | |
enh | -3.163 |
practice | -3.128 |
adapt | -3.021 |
ゴン | -2.972 |
Occupations | -2.971 |
Token |
|
Token ID | 198 |
Feature activation | -3.62e-02 |
Pos logit contributions | |
enh | +0.840 |
practice | +0.796 |
Occupations | +0.787 |
adapt | +0.753 |
theless | +0.750 |
Neg logit contributions | |
zzle | -1.618 |
mble | -1.527 |
uers | -1.469 |
IRE | -1.453 |
reckoning | -1.356 |
Token |
|
Token ID | 198 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
enh | +0.105 |
practice | +0.103 |
adapt | +0.099 |
Occupations | +0.094 |
odor | +0.092 |
Neg logit contributions | |
zzle | -0.203 |
mble | -0.195 |
uers | -0.184 |
IRE | -0.181 |
reckoning | -0.175 |
Token | Brown |
Token ID | 20644 |
Feature activation | -8.82e-01 |
Pos logit contributions | |
zzle | +1.450 |
mble | +1.324 |
uers | +1.271 |
IRE | +1.236 |
reckoning | +1.213 |
Neg logit contributions | |
enh | -1.187 |
practice | -1.182 |
adapt | -1.140 |
ゴン | -1.082 |
odor | -1.081 |
Token | - |
Token ID | 12 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
enh | +2.931 |
practice | +2.743 |
adapt | +2.619 |
theless | +2.560 |
Occupations | +2.536 |
Neg logit contributions | |
zzle | -4.549 |
mble | -4.164 |
IRE | -3.977 |
uers | -3.899 |
reckoning | -3.693 |
Token | b |
Token ID | 65 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
enh | +9.934 |
practice | +9.661 |
adapt | +9.275 |
standard | +8.896 |
bid | +8.581 |
Neg logit contributions | |
zzle | -12.159 |
mble | -11.785 |
uers | -11.017 |
IRE | -10.331 |
respectively | -9.832 |
Token | agged |
Token ID | 14655 |
Feature activation | +9.70e-01 |
Pos logit contributions | |
enh | +4.930 |
odor | +4.686 |
practice | +4.624 |
adapt | +4.608 |
abil | +4.486 |
Neg logit contributions | |
zzle | -8.839 |
mble | -8.417 |
IRE | -8.344 |
uers | -8.017 |
reckoning | -7.711 |
Token | lun |
Token ID | 14678 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
zzle | +4.518 |
mble | +4.038 |
IRE | +3.978 |
uers | +3.966 |
reckoning | +3.666 |
Neg logit contributions | |
enh | -3.709 |
practice | -3.660 |
adapt | -3.525 |
Occupations | -3.488 |
ゴン | -3.451 |
Token | ches |
Token ID | 2052 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
zzle | +0.732 |
mble | +0.670 |
IRE | +0.663 |
uers | +0.634 |
reckoning | +0.610 |
Neg logit contributions | |
enh | -0.613 |
practice | -0.603 |
adapt | -0.581 |
odor | -0.562 |
abil | -0.552 |
Token | in |
Token ID | 287 |
Feature activation | +8.13e-02 |
Pos logit contributions | |
enh | +1.115 |
practice | +1.083 |
adapt | +1.066 |
Provided | +1.032 |
theless | +1.027 |
Neg logit contributions | |
zzle | -1.239 |
mble | -1.136 |
IRE | -1.112 |
uers | -1.103 |
reckoning | -1.006 |
Token | fees |
Token ID | 6642 |
Feature activation | -6.41e-01 |
Pos logit contributions | |
practice | +1.336 |
enh | +1.302 |
adapt | +1.236 |
Occupations | +1.216 |
theless | +1.186 |
Neg logit contributions | |
zzle | -2.405 |
mble | -2.224 |
uers | -2.167 |
IRE | -2.156 |
htar | -1.974 |
Token | might |
Token ID | 1244 |
Feature activation | +4.01e-01 |
Pos logit contributions | |
enh | +2.500 |
practice | +2.427 |
adapt | +2.323 |
Provided | +2.291 |
theless | +2.290 |
Neg logit contributions | |
zzle | -2.734 |
uers | -2.534 |
mble | -2.521 |
IRE | -2.520 |
unci | -2.246 |
Token | keep |
Token ID | 1394 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
zzle | +1.749 |
IRE | +1.574 |
mble | +1.569 |
uers | +1.533 |
reckoning | +1.396 |
Neg logit contributions | |
enh | -1.660 |
practice | -1.614 |
adapt | -1.582 |
odor | -1.523 |
theless | -1.513 |
Token | its |
Token ID | 663 |
Feature activation | -4.53e-01 |
Pos logit contributions | |
enh | +0.397 |
practice | +0.390 |
adapt | +0.373 |
Occupations | +0.371 |
theless | +0.364 |
Neg logit contributions | |
zzle | -0.446 |
mble | -0.410 |
IRE | -0.396 |
uers | -0.395 |
reckoning | -0.357 |
Token | drug |
Token ID | 2563 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
practice | +1.641 |
enh | +1.632 |
adapt | +1.542 |
Occupations | +1.534 |
odor | +1.518 |
Neg logit contributions | |
zzle | -2.154 |
mble | -1.972 |
uers | -1.880 |
IRE | -1.865 |
htar | -1.711 |
Token | - |
Token ID | 12 |
Feature activation | -2.24e+00 |
Pos logit contributions | |
practice | +4.431 |
enh | +4.356 |
adapt | +4.238 |
Occupations | +4.095 |
standard | +4.045 |
Neg logit contributions | |
zzle | -5.856 |
mble | -5.277 |
uers | -5.029 |
IRE | -5.011 |
htar | -4.595 |
Token | review |
Token ID | 19023 |
Feature activation | -7.70e-01 |
Pos logit contributions | |
practice | +7.162 |
enh | +7.159 |
adapt | +6.596 |
standard | +6.418 |
bid | +6.243 |
Neg logit contributions | |
zzle | -10.946 |
mble | -10.663 |
uers | -9.754 |
IRE | -9.678 |
reckoning | -9.278 |
Token | pipeline |
Token ID | 11523 |
Feature activation | +7.12e-01 |
Pos logit contributions | |
practice | +2.649 |
enh | +2.612 |
adapt | +2.496 |
Occupations | +2.424 |
theless | +2.388 |
Neg logit contributions | |
zzle | -3.760 |
mble | -3.398 |
IRE | -3.327 |
uers | -3.236 |
htar | -3.026 |
Token | open |
Token ID | 1280 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
zzle | +2.978 |
mble | +2.671 |
IRE | +2.576 |
uers | +2.568 |
reckoning | +2.316 |
Neg logit contributions | |
enh | -3.095 |
practice | -3.008 |
adapt | -2.975 |
Occupations | -2.916 |
theless | -2.881 |
Token | — |
Token ID | 851 |
Feature activation | -7.37e-01 |
Pos logit contributions | |
enh | +0.627 |
practice | +0.600 |
adapt | +0.590 |
Provided | +0.572 |
theless | +0.569 |
Neg logit contributions | |
zzle | -0.807 |
mble | -0.741 |
IRE | -0.728 |
uers | -0.722 |
reckoning | -0.653 |
Token | albeit |
Token ID | 18244 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
enh | +2.911 |
practice | +2.762 |
adapt | +2.712 |
Provided | +2.686 |
Occupations | +2.673 |
Neg logit contributions | |
zzle | -3.220 |
mble | -3.014 |
IRE | -2.892 |
uers | -2.824 |
reckoning | -2.543 |
Token | chance |
Token ID | 2863 |
Feature activation | +5.08e-02 |
Pos logit contributions | |
zzle | +6.034 |
mble | +5.374 |
uers | +5.295 |
IRE | +5.287 |
reckoning | +4.930 |
Neg logit contributions | |
enh | -5.140 |
practice | -5.090 |
adapt | -4.929 |
ゴン | -4.873 |
Occupations | -4.855 |
Token | to |
Token ID | 284 |
Feature activation | +3.07e-01 |
Pos logit contributions | |
zzle | +0.229 |
mble | +0.211 |
uers | +0.205 |
IRE | +0.205 |
reckoning | +0.183 |
Neg logit contributions | |
enh | -0.198 |
practice | -0.195 |
adapt | -0.186 |
theless | -0.184 |
ゴン | -0.182 |
Token | have |
Token ID | 423 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
zzle | +1.349 |
mble | +1.223 |
IRE | +1.196 |
uers | +1.166 |
reckoning | +1.060 |
Neg logit contributions | |
enh | -1.251 |
practice | -1.236 |
adapt | -1.179 |
theless | -1.152 |
odor | -1.149 |
Token | a |
Token ID | 257 |
Feature activation | +5.68e-02 |
Pos logit contributions | |
zzle | +1.675 |
mble | +1.491 |
IRE | +1.464 |
uers | +1.459 |
reckoning | +1.330 |
Neg logit contributions | |
enh | -1.421 |
practice | -1.409 |
adapt | -1.331 |
Occupations | -1.323 |
theless | -1.310 |
Token | none |
Token ID | 4844 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
zzle | +0.227 |
mble | +0.204 |
IRE | +0.196 |
uers | +0.195 |
respectively | +0.169 |
Neg logit contributions | |
enh | -0.250 |
practice | -0.249 |
odor | -0.236 |
firsthand | -0.235 |
adapt | -0.234 |
Token | - |
Token ID | 12 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
practice | +4.420 |
enh | +4.414 |
bid | +4.214 |
adapt | +4.173 |
theless | +4.050 |
Neg logit contributions | |
zzle | -4.640 |
uers | -4.314 |
IRE | -4.169 |
mble | -4.053 |
reckoning | -3.949 |
Token | too |
Token ID | 18820 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
enh | +6.695 |
practice | +6.679 |
bid | +6.127 |
adapt | +5.990 |
standard | +5.754 |
Neg logit contributions | |
zzle | -11.411 |
mble | -10.904 |
uers | -10.696 |
IRE | -10.271 |
reckoning | -9.608 |
Token | - |
Token ID | 12 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
enh | +0.484 |
practice | +0.478 |
adapt | +0.465 |
ゴン | +0.456 |
theless | +0.453 |
Neg logit contributions | |
zzle | -0.563 |
mble | -0.513 |
uers | -0.499 |
IRE | -0.499 |
reckoning | -0.459 |
Token | sub |
Token ID | 7266 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
enh | +3.295 |
practice | +3.173 |
adapt | +3.044 |
odor | +2.844 |
standard | +2.831 |
Neg logit contributions | |
zzle | -6.140 |
mble | -5.720 |
uers | -5.586 |
IRE | -5.526 |
reckoning | -5.278 |
Token | tle |
Token ID | 7100 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
zzle | +5.453 |
mble | +4.940 |
uers | +4.874 |
IRE | +4.868 |
reckoning | +4.576 |
Neg logit contributions | |
enh | -3.317 |
practice | -3.273 |
adapt | -3.146 |
ゴン | -3.089 |
Occupations | -3.077 |
Token | dig |
Token ID | 3100 |
Feature activation | +7.99e-01 |
Pos logit contributions | |
zzle | +5.093 |
mble | +4.485 |
uers | +4.413 |
IRE | +4.397 |
reckoning | +3.999 |
Neg logit contributions | |
enh | -5.530 |
practice | -5.476 |
adapt | -5.302 |
ゴン | -5.240 |
Occupations | -5.217 |
Token | belief |
Token ID | 4901 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
enh | +1.640 |
practice | +1.605 |
adapt | +1.543 |
Occupations | +1.539 |
odor | +1.512 |
Neg logit contributions | |
zzle | -2.012 |
mble | -1.838 |
uers | -1.772 |
IRE | -1.762 |
htar | -1.585 |
Token | that |
Token ID | 326 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
zzle | +1.000 |
mble | +0.899 |
IRE | +0.868 |
uers | +0.868 |
reckoning | +0.785 |
Neg logit contributions | |
enh | -1.122 |
practice | -1.113 |
adapt | -1.077 |
Occupations | -1.063 |
ゴン | -1.055 |
Token | usefulness |
Token ID | 37496 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
zzle | +0.741 |
mble | +0.669 |
IRE | +0.650 |
uers | +0.643 |
reckoning | +0.583 |
Neg logit contributions | |
enh | -0.694 |
practice | -0.677 |
Occupations | -0.658 |
adapt | -0.654 |
theless | -0.638 |
Token | was |
Token ID | 373 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
enh | +2.086 |
practice | +2.021 |
adapt | +1.948 |
Occupations | +1.915 |
theless | +1.885 |
Neg logit contributions | |
zzle | -2.759 |
mble | -2.539 |
IRE | -2.471 |
uers | -2.446 |
unci | -2.212 |
Token | good |
Token ID | 922 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
zzle | +0.870 |
mble | +0.789 |
IRE | +0.766 |
uers | +0.762 |
reckoning | +0.690 |
Neg logit contributions | |
enh | -0.798 |
practice | -0.779 |
adapt | -0.757 |
Occupations | -0.740 |
theless | -0.733 |
Token | - |
Token ID | 12 |
Feature activation | -2.79e+00 |
Pos logit contributions | |
enh | +5.635 |
practice | +5.548 |
adapt | +5.397 |
Occupations | +5.048 |
abil | +5.033 |
Neg logit contributions | |
zzle | -7.343 |
mble | -6.814 |
uers | -6.515 |
IRE | -6.513 |
reckoning | -5.821 |
Token | in |
Token ID | 259 |
Feature activation | -7.62e-02 |
Pos logit contributions | |
enh | +8.098 |
practice | +7.930 |
adapt | +7.876 |
odor | +7.022 |
only | +6.738 |
Neg logit contributions | |
zzle | -13.956 |
mble | -13.363 |
IRE | -12.713 |
uers | -12.394 |
reckoning | -11.634 |
Token | - |
Token ID | 12 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
enh | +0.301 |
practice | +0.297 |
adapt | +0.289 |
Occupations | +0.277 |
abil | +0.272 |
Neg logit contributions | |
zzle | -0.345 |
mble | -0.315 |
IRE | -0.311 |
uers | -0.303 |
reckoning | -0.282 |
Token | it |
Token ID | 270 |
Feature activation | -5.61e-01 |
Pos logit contributions | |
practice | +4.415 |
enh | +4.244 |
adapt | +4.124 |
standard | +3.768 |
odor | +3.752 |
Neg logit contributions | |
zzle | -6.077 |
mble | -5.668 |
uers | -5.367 |
IRE | -5.362 |
respectively | -4.996 |
Token | self |
Token ID | 944 |
Feature activation | +9.04e-02 |
Pos logit contributions | |
enh | +1.533 |
practice | +1.455 |
adapt | +1.374 |
theless | +1.337 |
Occupations | +1.330 |
Neg logit contributions | |
zzle | -3.187 |
mble | -2.907 |
IRE | -2.885 |
uers | -2.839 |
reckoning | -2.757 |
Token | . |
Token ID | 13 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
zzle | +0.412 |
mble | +0.373 |
IRE | +0.363 |
uers | +0.363 |
reckoning | +0.333 |
Neg logit contributions | |
enh | -0.355 |
practice | -0.348 |
adapt | -0.337 |
Occupations | -0.329 |
theless | -0.327 |