Token | into |
Token ID | 656 |
Feature activation | +4.92e+00 |
Pos logit contributions | |
aber | +3.919 |
nl | +3.555 |
Causes | +3.337 |
[' | +3.262 |
owa | +3.177 |
Neg logit contributions | |
ught | -4.414 |
wick | -4.066 |
RG | -3.950 |
wives | -3.920 |
riz | -3.909 |
Token | jail |
Token ID | 7356 |
Feature activation | +5.82e+00 |
Pos logit contributions | |
aber | +3.297 |
nl | +3.001 |
Causes | +2.887 |
[' | +2.742 |
owa | +2.701 |
Neg logit contributions | |
ught | -3.767 |
wick | -3.471 |
CLA | -3.370 |
wives | -3.369 |
RG | -3.320 |
Token | on |
Token ID | 319 |
Feature activation | +5.76e+00 |
Pos logit contributions | |
aber | +3.978 |
nl | +3.549 |
Causes | +3.357 |
[' | +3.332 |
owa | +3.166 |
Neg logit contributions | |
ught | -4.422 |
wick | -4.051 |
RG | -3.914 |
wives | -3.890 |
riz | -3.890 |
Token | a |
Token ID | 257 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
aber | +4.032 |
nl | +3.691 |
Causes | +3.512 |
[' | +3.406 |
owa | +3.317 |
Neg logit contributions | |
ught | -4.143 |
wick | -3.911 |
CLA | -3.778 |
RG | -3.757 |
wives | -3.732 |
Token | domestic |
Token ID | 5928 |
Feature activation | +9.56e+00 |
Pos logit contributions | |
aber | +8.154 |
nl | +7.560 |
Causes | +6.916 |
[' | +6.889 |
owa | +6.777 |
Neg logit contributions | |
ught | -9.647 |
RG | -9.211 |
wick | -9.210 |
CLA | -9.203 |
wives | -9.162 |
Token | battery |
Token ID | 6555 |
Feature activation | +2.22e+01 |
Pos logit contributions | |
aber | +6.791 |
nl | +6.121 |
Causes | +5.826 |
[' | +5.630 |
owa | +5.536 |
Neg logit contributions | |
ught | -6.759 |
wick | -6.190 |
RG | -6.082 |
wives | -5.977 |
elin | -5.975 |
Token | charge |
Token ID | 3877 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
aber | +9.521 |
[' | +7.967 |
nl | +7.852 |
gy | +7.536 |
receiving | +7.453 |
Neg logit contributions | |
ught | -16.751 |
RG | -16.153 |
elin | -15.916 |
riz | -15.913 |
stellar | -15.492 |
Token | following |
Token ID | 1708 |
Feature activation | +4.65e+00 |
Pos logit contributions | |
aber | +7.389 |
nl | +6.276 |
[' | +6.205 |
Causes | +6.062 |
gy | +5.774 |
Neg logit contributions | |
ught | -10.105 |
wick | -9.376 |
RG | -9.361 |
elin | -9.297 |
CLA | -9.155 |
Token | her |
Token ID | 607 |
Feature activation | +5.11e+00 |
Pos logit contributions | |
aber | +3.193 |
nl | +2.913 |
Causes | +2.745 |
[' | +2.676 |
owa | +2.594 |
Neg logit contributions | |
ught | -3.505 |
wick | -3.296 |
RG | -3.137 |
CLA | -3.116 |
wives | -3.094 |
Token | arrest |
Token ID | 3251 |
Feature activation | +9.12e+00 |
Pos logit contributions | |
aber | +3.574 |
nl | +3.286 |
Causes | +3.095 |
[' | +2.983 |
owa | +2.944 |
Neg logit contributions | |
ught | -3.775 |
wick | -3.544 |
RG | -3.373 |
CLA | -3.344 |
wives | -3.311 |
Token | Tuesday |
Token ID | 3431 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
aber | +5.657 |
nl | +4.984 |
Causes | +4.815 |
[' | +4.753 |
gy | +4.511 |
Neg logit contributions | |
ught | -7.123 |
wick | -6.555 |
RG | -6.481 |
elin | -6.326 |
riz | -6.318 |
Token | who |
Token ID | 508 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
aber | +4.780 |
nl | +4.377 |
Causes | +3.963 |
[' | +3.867 |
owa | +3.799 |
Neg logit contributions | |
ught | -5.858 |
wick | -5.390 |
wives | -5.233 |
CLA | -5.038 |
RG | -5.028 |
Token | said |
Token ID | 531 |
Feature activation | +7.72e+00 |
Pos logit contributions | |
aber | +6.822 |
nl | +6.337 |
[' | +5.802 |
Causes | +5.770 |
owa | +5.655 |
Neg logit contributions | |
ught | -7.796 |
wick | -7.318 |
RG | -7.092 |
wives | -7.066 |
riz | -6.925 |
Token | he |
Token ID | 339 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
aber | +5.024 |
nl | +4.549 |
Causes | +4.133 |
[' | +4.118 |
owa | +4.034 |
Neg logit contributions | |
ught | -5.968 |
wick | -5.666 |
wives | -5.446 |
RG | -5.364 |
CLA | -5.318 |
Token | was |
Token ID | 373 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
aber | +1.237 |
nl | +1.125 |
Causes | +1.039 |
[' | +1.008 |
owa | +0.997 |
Neg logit contributions | |
ught | -1.385 |
wick | -1.302 |
wives | -1.241 |
RG | -1.236 |
CLA | -1.216 |
Token | tired |
Token ID | 10032 |
Feature activation | +7.17e+00 |
Pos logit contributions | |
aber | +2.595 |
nl | +2.410 |
Causes | +2.205 |
[' | +2.168 |
owa | +2.133 |
Neg logit contributions | |
ught | -2.517 |
wick | -2.337 |
wives | -2.220 |
RG | -2.201 |
CLA | -2.171 |
Token | after |
Token ID | 706 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
aber | +4.627 |
nl | +4.191 |
[' | +3.726 |
Causes | +3.723 |
owa | +3.666 |
Neg logit contributions | |
ught | -5.692 |
wick | -5.322 |
wives | -5.091 |
RG | -5.084 |
riz | -5.036 |
Token | the |
Token ID | 262 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
aber | +11.186 |
nl | +10.454 |
receiving | +10.004 |
[' | +9.502 |
gy | +9.356 |
Neg logit contributions | |
ught | -13.667 |
wick | -12.837 |
RG | -12.715 |
riz | -12.588 |
wives | -12.588 |
Token | finish |
Token ID | 5461 |
Feature activation | +9.24e+00 |
Pos logit contributions | |
aber | +6.820 |
nl | +6.454 |
Causes | +6.012 |
owa | +5.877 |
[' | +5.743 |
Neg logit contributions | |
ught | -7.095 |
wick | -6.782 |
wives | -6.518 |
RG | -6.405 |
CLA | -6.378 |
Token | but |
Token ID | 475 |
Feature activation | +6.53e+00 |
Pos logit contributions | |
aber | +5.529 |
nl | +5.118 |
[' | +4.505 |
Causes | +4.445 |
owa | +4.388 |
Neg logit contributions | |
ught | -7.443 |
wick | -6.985 |
RG | -6.758 |
wives | -6.729 |
elin | -6.596 |
Token | would |
Token ID | 561 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
aber | +4.293 |
nl | +3.944 |
Causes | +3.597 |
[' | +3.581 |
owa | +3.476 |
Neg logit contributions | |
ught | -4.996 |
wick | -4.765 |
wives | -4.549 |
RG | -4.508 |
CLA | -4.452 |
Token | keep |
Token ID | 1394 |
Feature activation | +6.50e+00 |
Pos logit contributions | |
aber | +1.971 |
nl | +1.824 |
Causes | +1.674 |
[' | +1.652 |
owa | +1.633 |
Neg logit contributions | |
ught | -1.893 |
wick | -1.779 |
wives | -1.695 |
RG | -1.683 |
riz | -1.651 |
Token | three |
Token ID | 1115 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
aber | +8.722 |
nl | +8.660 |
receiving | +8.152 |
[' | +7.953 |
de | +7.647 |
Neg logit contributions | |
ught | -11.756 |
wick | -10.992 |
CLA | -10.882 |
RG | -10.649 |
wives | -10.589 |
Token | counts |
Token ID | 9853 |
Feature activation | +9.61e+00 |
Pos logit contributions | |
aber | +5.624 |
nl | +5.119 |
[' | +4.575 |
Causes | +4.568 |
owa | +4.433 |
Neg logit contributions | |
ught | -9.406 |
wick | -8.955 |
RG | -8.720 |
CLA | -8.620 |
riz | -8.536 |
Token | of |
Token ID | 286 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
aber | +5.266 |
nl | +4.547 |
[' | +4.149 |
gy | +4.069 |
Causes | +4.053 |
Neg logit contributions | |
ught | -8.126 |
wick | -7.733 |
RG | -7.481 |
CLA | -7.478 |
wives | -7.375 |
Token | tresp |
Token ID | 29723 |
Feature activation | +6.90e+00 |
Pos logit contributions | |
aber | +8.374 |
nl | +7.947 |
receiving | +7.612 |
[' | +7.328 |
Causes | +7.240 |
Neg logit contributions | |
ught | -10.083 |
wick | -9.595 |
CLA | -9.432 |
wives | -9.277 |
RG | -9.190 |
Token | assing |
Token ID | 19696 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
aber | +5.010 |
nl | +4.458 |
Causes | +4.106 |
owa | +4.018 |
[' | +4.017 |
Neg logit contributions | |
ught | -4.950 |
wick | -4.671 |
RG | -4.634 |
wives | -4.614 |
CLA | -4.547 |
Token | and |
Token ID | 290 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
aber | +5.741 |
nl | +4.967 |
[' | +4.716 |
Causes | +4.697 |
owa | +4.424 |
Neg logit contributions | |
ught | -8.468 |
wick | -7.898 |
RG | -7.760 |
wives | -7.648 |
riz | -7.609 |
Token | damage |
Token ID | 2465 |
Feature activation | +4.39e+00 |
Pos logit contributions | |
aber | +8.286 |
receiving | +8.160 |
nl | +7.948 |
[' | +7.827 |
Causes | +7.202 |
Neg logit contributions | |
ught | -15.255 |
wick | -14.604 |
CLA | -14.467 |
RG | -14.396 |
wives | -14.311 |
Token | to |
Token ID | 284 |
Feature activation | +2.63e+00 |
Pos logit contributions | |
aber | +2.868 |
nl | +2.577 |
Causes | +2.429 |
[' | +2.328 |
owa | +2.281 |
Neg logit contributions | |
ught | -3.483 |
wick | -3.299 |
RG | -3.172 |
wives | -3.153 |
riz | -3.077 |
Token | property |
Token ID | 3119 |
Feature activation | +4.00e+00 |
Pos logit contributions | |
aber | +2.338 |
nl | +2.182 |
Causes | +2.068 |
[' | +2.022 |
owa | +2.002 |
Neg logit contributions | |
ught | -1.477 |
wick | -1.361 |
wives | -1.270 |
RG | -1.252 |
CLA | -1.241 |
Token | , |
Token ID | 11 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
aber | +2.619 |
nl | +2.369 |
Causes | +2.190 |
[' | +2.150 |
owa | +2.076 |
Neg logit contributions | |
ught | -3.210 |
wick | -3.005 |
RG | -2.859 |
wives | -2.844 |
riz | -2.813 |
Token | stolen |
Token ID | 9909 |
Feature activation | +2.45e+00 |
Pos logit contributions | |
aber | +6.220 |
nl | +5.809 |
Causes | +5.428 |
[' | +5.291 |
owa | +5.038 |
Neg logit contributions | |
ught | -7.973 |
wick | -7.433 |
CLA | -7.073 |
RG | -7.018 |
wives | -6.998 |
Token | - |
Token ID | 12 |
Feature activation | +7.50e+00 |
Pos logit contributions | |
aber | +4.199 |
nl | +3.859 |
Causes | +3.415 |
[' | +3.285 |
owa | +3.265 |
Neg logit contributions | |
ught | -5.605 |
wick | -5.354 |
wives | -5.106 |
RG | -4.934 |
riz | -4.876 |
Token | ethyl |
Token ID | 21610 |
Feature activation | +7.60e+00 |
Pos logit contributions | |
aber | +5.115 |
nl | +4.724 |
Causes | +4.170 |
[' | +4.104 |
owa | +4.027 |
Neg logit contributions | |
ught | -5.631 |
wick | -5.334 |
wives | -5.087 |
RG | -5.041 |
CLA | -4.863 |
Token | - |
Token ID | 12 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
aber | +5.109 |
nl | +4.652 |
Causes | +4.129 |
[' | +3.996 |
owa | +3.978 |
Neg logit contributions | |
ught | -5.783 |
wick | -5.474 |
wives | -5.157 |
RG | -5.137 |
curved | -4.921 |
Token | N |
Token ID | 45 |
Feature activation | +9.02e+00 |
Pos logit contributions | |
aber | +6.553 |
nl | +6.045 |
[' | +5.129 |
Causes | +5.036 |
de | +4.976 |
Neg logit contributions | |
ught | -9.770 |
wick | -9.322 |
wives | -8.765 |
RG | -8.556 |
curved | -8.545 |
Token | -( |
Token ID | 30420 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
aber | +5.550 |
nl | +4.874 |
Causes | +4.333 |
EE | +4.299 |
owa | +4.251 |
Neg logit contributions | |
ught | -7.333 |
wick | -6.917 |
wives | -6.664 |
RG | -6.435 |
riz | -6.285 |
Token | t |
Token ID | 83 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
aber | +8.230 |
nl | +7.427 |
de | +6.330 |
gy | +6.249 |
[' | +6.194 |
Neg logit contributions | |
ught | -11.123 |
wick | -10.577 |
wives | -10.174 |
RG | -9.692 |
elin | -9.675 |
Token | et |
Token ID | 316 |
Feature activation | +4.48e+00 |
Pos logit contributions | |
aber | +12.411 |
nl | +11.814 |
owa | +10.664 |
ys | +10.404 |
iary | +10.234 |
Neg logit contributions | |
ught | -12.913 |
wives | -12.539 |
wick | -11.832 |
RG | -11.828 |
netflix | -11.644 |
Token | rah |
Token ID | 11392 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
aber | +3.538 |
nl | +3.226 |
Causes | +2.974 |
owa | +2.951 |
[' | +2.927 |
Neg logit contributions | |
ught | -3.013 |
wick | -2.731 |
wives | -2.660 |
RG | -2.625 |
CLA | -2.603 |
Token | yd |
Token ID | 5173 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
aber | +3.304 |
nl | +2.471 |
Causes | +1.483 |
xe | +1.455 |
ys | +1.447 |
Neg logit contributions | |
ught | -15.892 |
wives | -15.053 |
tradem | -14.808 |
wick | -14.750 |
RG | -14.722 |
Token | ro |
Token ID | 305 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
aber | +7.774 |
nl | +7.035 |
owa | +6.000 |
[' | +5.873 |
ys | +5.798 |
Neg logit contributions | |
ught | -11.402 |
wives | -10.224 |
wick | -10.141 |
CLA | -10.021 |
RG | -9.993 |
Token | - |
Token ID | 12 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
aber | +7.501 |
nl | +6.790 |
[' | +5.852 |
Causes | +5.835 |
gy | +5.778 |
Neg logit contributions | |
ught | -8.509 |
wick | -8.020 |
RG | -7.749 |
wives | -7.733 |
ewitness | -7.519 |
Token | . |
Token ID | 13 |
Feature activation | -3.63e+00 |
Pos logit contributions | |
aber | +5.733 |
nl | +5.235 |
[' | +5.020 |
Causes | +4.714 |
owa | +4.312 |
Neg logit contributions | |
ught | -9.606 |
wick | -8.829 |
wives | -8.548 |
elin | -8.435 |
CLA | -8.402 |
Token | Draw |
Token ID | 25302 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
ught | +2.448 |
wick | +2.343 |
RG | +2.246 |
wives | +2.182 |
CLA | +2.149 |
Neg logit contributions | |
aber | -2.796 |
nl | -2.543 |
Causes | -2.415 |
owa | -2.331 |
[' | -2.291 |
Token | String |
Token ID | 10100 |
Feature activation | +3.79e+00 |
Pos logit contributions | |
aber | +0.805 |
nl | +0.737 |
Causes | +0.681 |
[' | +0.660 |
owa | +0.651 |
Neg logit contributions | |
ught | -0.859 |
wick | -0.800 |
wives | -0.765 |
CLA | -0.749 |
RG | -0.749 |
Token | ($ |
Token ID | 16763 |
Feature activation | +8.54e+00 |
Pos logit contributions | |
aber | +1.993 |
nl | +1.779 |
Causes | +1.596 |
[' | +1.550 |
owa | +1.474 |
Neg logit contributions | |
ught | -3.536 |
wick | -3.316 |
wives | -3.210 |
CLA | -3.152 |
elin | -3.120 |
Token | art |
Token ID | 433 |
Feature activation | +8.50e+00 |
Pos logit contributions | |
aber | +5.320 |
nl | +4.842 |
[' | +4.226 |
Causes | +4.089 |
owa | +4.013 |
Neg logit contributions | |
ught | -6.891 |
wick | -6.358 |
wives | -6.270 |
elin | -6.078 |
Certified | -5.991 |
Token | ext |
Token ID | 2302 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
aber | +4.839 |
nl | +4.361 |
[' | +3.785 |
xe | +3.580 |
owa | +3.566 |
Neg logit contributions | |
ught | -7.272 |
tradem | -6.920 |
wick | -6.808 |
CLA | -6.771 |
RG | -6.678 |
Token | [ |
Token ID | 58 |
Feature activation | +3.07e+00 |
Pos logit contributions | |
[' | +7.840 |
aber | +7.600 |
nl | +6.937 |
Causes | +5.852 |
xe | +5.535 |
Neg logit contributions | |
ught | -17.056 |
wick | -15.919 |
elin | -15.704 |
wives | -15.584 |
unker | -15.562 |
Token | $ |
Token ID | 3 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
aber | +2.600 |
nl | +2.410 |
Causes | +2.238 |
[' | +2.225 |
owa | +2.168 |
Neg logit contributions | |
ught | -1.881 |
wick | -1.728 |
wives | -1.644 |
RG | -1.593 |
CLA | -1.587 |
Token | i |
Token ID | 72 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
aber | +4.225 |
nl | +3.869 |
[' | +3.130 |
Causes | +2.981 |
owa | +2.917 |
Neg logit contributions | |
ught | -10.046 |
wick | -9.370 |
wives | -9.296 |
CLA | -9.163 |
Certified | -9.160 |
Token | - |
Token ID | 12 |
Feature activation | +9.23e+00 |
Pos logit contributions | |
aber | +6.927 |
nl | +6.152 |
[' | +5.975 |
owa | +5.591 |
Causes | +5.564 |
Neg logit contributions | |
ught | -10.252 |
wick | -9.459 |
wives | -9.415 |
CLA | -9.204 |
RG | -9.155 |
Token | 1 |
Token ID | 16 |
Feature activation | +9.14e+00 |
Pos logit contributions | |
aber | +3.956 |
nl | +3.592 |
[' | +3.041 |
Causes | +2.868 |
owa | +2.767 |
Neg logit contributions | |
ught | -8.973 |
wick | -8.505 |
wives | -8.271 |
RG | -8.159 |
elin | -8.114 |
Token | than |
Token ID | 621 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
aber | +0.229 |
nl | +0.209 |
Causes | +0.193 |
[' | +0.185 |
owa | +0.185 |
Neg logit contributions | |
ught | -0.254 |
wick | -0.239 |
wives | -0.228 |
RG | -0.225 |
CLA | -0.223 |
Token | a |
Token ID | 257 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
aber | +2.239 |
nl | +2.029 |
Causes | +1.901 |
[' | +1.838 |
owa | +1.801 |
Neg logit contributions | |
ught | -2.451 |
wick | -2.321 |
wives | -2.205 |
RG | -2.184 |
CLA | -2.174 |
Token | minute |
Token ID | 5664 |
Feature activation | +1.65e-01 |
Pos logit contributions | |
aber | +1.241 |
nl | +1.140 |
Causes | +1.066 |
[' | +1.029 |
owa | +1.021 |
Neg logit contributions | |
ught | -1.177 |
wick | -1.114 |
wives | -1.057 |
RG | -1.045 |
CLA | -1.031 |
Token | in |
Token ID | 287 |
Feature activation | +6.44e+00 |
Pos logit contributions | |
aber | +0.125 |
nl | +0.115 |
Causes | +0.107 |
[' | +0.103 |
owa | +0.103 |
Neg logit contributions | |
ught | -0.116 |
wick | -0.109 |
wives | -0.103 |
RG | -0.102 |
CLA | -0.101 |
Token | , |
Token ID | 11 |
Feature activation | +9.78e-01 |
Pos logit contributions | |
aber | +3.946 |
nl | +3.602 |
Causes | +3.348 |
[' | +3.230 |
EE | +3.113 |
Neg logit contributions | |
ught | -5.240 |
wick | -4.910 |
wives | -4.712 |
RG | -4.665 |
elin | -4.660 |
Token | when |
Token ID | 618 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
aber | +0.691 |
nl | +0.631 |
Causes | +0.586 |
[' | +0.564 |
owa | +0.559 |
Neg logit contributions | |
ught | -0.740 |
wick | -0.693 |
wives | -0.659 |
RG | -0.652 |
CLA | -0.645 |
Token | Night |
Token ID | 5265 |
Feature activation | +6.97e+00 |
Pos logit contributions | |
aber | +10.836 |
nl | +9.666 |
Causes | +9.237 |
[' | +8.948 |
owa | +8.930 |
Neg logit contributions | |
ught | -13.492 |
wick | -12.706 |
wives | -12.384 |
elin | -12.308 |
CLA | -12.143 |
Token | c |
Token ID | 66 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
aber | +3.558 |
nl | +3.138 |
Causes | +2.716 |
[' | +2.666 |
owa | +2.662 |
Neg logit contributions | |
ught | -6.576 |
wick | -5.960 |
RG | -5.909 |
CLA | -5.865 |
wives | -5.853 |
Token | rawler |
Token ID | 39464 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
aber | +1.059 |
nl | +0.957 |
Causes | +0.878 |
[' | +0.859 |
owa | +0.856 |
Neg logit contributions | |
ught | -1.169 |
wick | -1.091 |
wives | -1.050 |
RG | -1.035 |
CLA | -1.032 |
Token | notices |
Token ID | 19748 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
ught | +1.179 |
wick | +1.109 |
wives | +1.049 |
RG | +1.032 |
CLA | +1.024 |
Neg logit contributions | |
aber | -1.218 |
nl | -1.118 |
Causes | -1.036 |
owa | -1.000 |
[' | -0.996 |
Token | that |
Token ID | 326 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
aber | +10.396 |
nl | +8.897 |
Causes | +8.776 |
owa | +8.369 |
[' | +8.326 |
Neg logit contributions | |
ught | -13.054 |
wick | -12.230 |
CLA | -12.002 |
RG | -11.871 |
wives | -11.825 |
Token | findings |
Token ID | 6373 |
Feature activation | -7.85e-01 |
Pos logit contributions | |
aber | +3.932 |
nl | +3.616 |
Causes | +3.325 |
[' | +3.237 |
owa | +3.215 |
Neg logit contributions | |
ught | -4.125 |
wick | -3.861 |
RG | -3.695 |
wives | -3.685 |
CLA | -3.625 |
Token | showed |
Token ID | 3751 |
Feature activation | +6.83e+00 |
Pos logit contributions | |
ught | +0.582 |
wick | +0.547 |
wives | +0.518 |
RG | +0.513 |
CLA | +0.507 |
Neg logit contributions | |
aber | -0.563 |
nl | -0.516 |
Causes | -0.480 |
[' | -0.459 |
owa | -0.458 |
Token | that |
Token ID | 326 |
Feature activation | +8.61e+00 |
Pos logit contributions | |
aber | +4.427 |
nl | +4.034 |
Causes | +3.638 |
owa | +3.615 |
[' | +3.569 |
Neg logit contributions | |
ught | -5.357 |
wick | -5.054 |
wives | -4.827 |
RG | -4.814 |
CLA | -4.809 |
Token | possessing |
Token ID | 25566 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
aber | +5.588 |
nl | +5.130 |
Causes | +4.660 |
[' | +4.641 |
owa | +4.592 |
Neg logit contributions | |
ught | -6.457 |
wick | -6.094 |
RG | -5.838 |
CLA | -5.804 |
wives | -5.748 |
Token | a |
Token ID | 257 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
aber | +6.419 |
nl | +5.908 |
[' | +5.457 |
Causes | +5.449 |
owa | +5.225 |
Neg logit contributions | |
ught | -7.899 |
wick | -7.298 |
CLA | -7.079 |
wives | -6.975 |
RG | -6.971 |
Token | large |
Token ID | 1588 |
Feature activation | +1.98e+01 |
Pos logit contributions | |
aber | +7.533 |
nl | +7.103 |
[' | +6.336 |
Causes | +6.242 |
owa | +6.212 |
Neg logit contributions | |
ught | -8.410 |
wick | -8.105 |
wives | -7.915 |
RG | -7.827 |
CLA | -7.769 |
Token | complex |
Token ID | 3716 |
Feature activation | +6.36e+00 |
Pos logit contributions | |
aber | +11.149 |
nl | +10.157 |
[' | +9.034 |
dyn | +9.018 |
receiving | +8.977 |
Neg logit contributions | |
ught | -13.126 |
wick | -12.887 |
wives | -12.447 |
CLA | -12.154 |
RG | -12.054 |
Token | brain |
Token ID | 3632 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
aber | +4.422 |
nl | +4.028 |
Causes | +3.621 |
[' | +3.585 |
owa | +3.534 |
Neg logit contributions | |
ught | -4.756 |
wick | -4.448 |
wives | -4.329 |
CLA | -4.220 |
RG | -4.170 |
Token | was |
Token ID | 373 |
Feature activation | -7.65e+00 |
Pos logit contributions | |
ught | +1.277 |
wick | +1.203 |
wives | +1.138 |
RG | +1.130 |
riz | +1.118 |
Neg logit contributions | |
aber | -1.218 |
nl | -1.114 |
Causes | -1.036 |
owa | -0.992 |
[' | -0.991 |
Token | not |
Token ID | 407 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
ught | +4.645 |
wick | +4.324 |
elin | +4.065 |
wives | +4.051 |
riz | +4.034 |
Neg logit contributions | |
aber | -6.142 |
nl | -5.693 |
Causes | -5.443 |
裏� | -5.204 |
owa | -5.190 |
Token | necessary |
Token ID | 3306 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
ught | +0.694 |
wick | +0.647 |
wives | +0.608 |
RG | +0.599 |
CLA | +0.592 |
Neg logit contributions | |
aber | -0.857 |
nl | -0.791 |
Causes | -0.743 |
[' | -0.717 |
owa | -0.716 |
Token | 2 |
Token ID | 17 |
Feature activation | +7.90e+00 |
Pos logit contributions | |
aber | +5.861 |
nl | +5.372 |
[' | +5.010 |
Causes | +4.939 |
owa | +4.706 |
Neg logit contributions | |
ught | -5.171 |
wick | -4.664 |
wives | -4.631 |
elin | -4.393 |
CLA | -4.334 |
Token | + |
Token ID | 1343 |
Feature activation | +2.88e+00 |
Pos logit contributions | |
aber | +4.815 |
nl | +4.403 |
[' | +3.978 |
Causes | +3.944 |
EE | +3.788 |
Neg logit contributions | |
ught | -6.405 |
wick | -5.949 |
wives | -5.820 |
CLA | -5.623 |
elin | -5.594 |
Token | $ |
Token ID | 720 |
Feature activation | +7.86e+00 |
Pos logit contributions | |
aber | +2.095 |
nl | +1.912 |
Causes | +1.776 |
[' | +1.718 |
owa | +1.684 |
Neg logit contributions | |
ught | -2.116 |
wick | -1.970 |
wives | -1.887 |
CLA | -1.841 |
RG | -1.841 |
Token | s |
Token ID | 82 |
Feature activation | +6.61e+00 |
Pos logit contributions | |
aber | +4.435 |
nl | +4.042 |
[' | +3.464 |
Causes | +3.407 |
owa | +3.300 |
Neg logit contributions | |
ught | -6.782 |
wick | -6.264 |
wives | -6.185 |
elin | -6.033 |
CLA | -5.987 |
Token | z |
Token ID | 89 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
aber | +4.756 |
nl | +4.388 |
Causes | +4.004 |
[' | +3.974 |
owa | +3.933 |
Neg logit contributions | |
ught | -4.746 |
wick | -4.336 |
wives | -4.211 |
CLA | -4.113 |
elin | -4.059 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.98e+01 |
Pos logit contributions | |
aber | +6.237 |
nl | +5.551 |
[' | +5.326 |
Causes | +4.580 |
tool | +4.358 |
Neg logit contributions | |
ught | -12.821 |
wick | -11.798 |
wives | -11.660 |
elin | -11.439 |
CLA | -11.279 |
Token | . |
Token ID | 13 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
aber | +8.847 |
[' | +8.590 |
nl | +8.392 |
EE | +7.040 |
owa | +6.895 |
Neg logit contributions | |
ught | -15.524 |
ewitness | -14.342 |
wives | -14.261 |
wick | -14.172 |
tradem | -13.970 |
Token | Height |
Token ID | 23106 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
aber | +6.411 |
nl | +6.133 |
[' | +5.515 |
Causes | +5.416 |
Customer | +5.225 |
Neg logit contributions | |
ught | -7.695 |
wick | -6.967 |
wives | -6.769 |
ewitness | -6.705 |
tradem | -6.684 |
Token | ), |
Token ID | 828 |
Feature activation | +3.98e+00 |
Pos logit contributions | |
aber | +6.828 |
nl | +6.140 |
[' | +5.636 |
Causes | +5.585 |
EE | +5.296 |
Neg logit contributions | |
ught | -8.504 |
wick | -7.608 |
wives | -7.573 |
CLA | -7.382 |
riz | -7.367 |
Token | $ |
Token ID | 3 |
Feature activation | +5.67e+00 |
Pos logit contributions | |
aber | +3.299 |
nl | +3.058 |
Causes | +2.850 |
[' | +2.811 |
owa | +2.748 |
Neg logit contributions | |
ught | -2.496 |
wick | -2.270 |
wives | -2.172 |
RG | -2.098 |
CLA | -2.086 |
Token | SR |
Token ID | 12562 |
Feature activation | +8.45e+00 |
Pos logit contributions | |
aber | +3.936 |
nl | +3.671 |
Causes | +3.260 |
[' | +3.258 |
owa | +3.169 |
Neg logit contributions | |
ught | -4.249 |
wick | -3.902 |
wives | -3.793 |
elin | -3.701 |
riz | -3.631 |
Token | when |
Token ID | 618 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
aber | +0.691 |
nl | +0.631 |
Causes | +0.586 |
[' | +0.564 |
owa | +0.559 |
Neg logit contributions | |
ught | -0.740 |
wick | -0.693 |
wives | -0.659 |
RG | -0.652 |
CLA | -0.645 |
Token | Night |
Token ID | 5265 |
Feature activation | +6.97e+00 |
Pos logit contributions | |
aber | +10.836 |
nl | +9.666 |
Causes | +9.237 |
[' | +8.948 |
owa | +8.930 |
Neg logit contributions | |
ught | -13.492 |
wick | -12.706 |
wives | -12.384 |
elin | -12.308 |
CLA | -12.143 |
Token | c |
Token ID | 66 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
aber | +3.558 |
nl | +3.138 |
Causes | +2.716 |
[' | +2.666 |
owa | +2.662 |
Neg logit contributions | |
ught | -6.576 |
wick | -5.960 |
RG | -5.909 |
CLA | -5.865 |
wives | -5.853 |
Token | rawler |
Token ID | 39464 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
aber | +1.059 |
nl | +0.957 |
Causes | +0.878 |
[' | +0.859 |
owa | +0.856 |
Neg logit contributions | |
ught | -1.169 |
wick | -1.091 |
wives | -1.050 |
RG | -1.035 |
CLA | -1.032 |
Token | notices |
Token ID | 19748 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
ught | +1.179 |
wick | +1.109 |
wives | +1.049 |
RG | +1.032 |
CLA | +1.024 |
Neg logit contributions | |
aber | -1.218 |
nl | -1.118 |
Causes | -1.036 |
owa | -1.000 |
[' | -0.996 |
Token | that |
Token ID | 326 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
aber | +10.396 |
nl | +8.897 |
Causes | +8.776 |
owa | +8.369 |
[' | +8.326 |
Neg logit contributions | |
ught | -13.054 |
wick | -12.230 |
CLA | -12.002 |
RG | -11.871 |
wives | -11.825 |
Token | no |
Token ID | 645 |
Feature activation | +5.16e+00 |
Pos logit contributions | |
aber | +10.335 |
nl | +8.848 |
Causes | +8.762 |
[' | +8.489 |
owa | +8.444 |
Neg logit contributions | |
ught | -13.878 |
wick | -12.957 |
CLA | -12.791 |
RG | -12.698 |
elin | -12.629 |
Token | one |
Token ID | 530 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
aber | +3.290 |
nl | +2.954 |
Causes | +2.761 |
[' | +2.655 |
owa | +2.581 |
Neg logit contributions | |
ught | -4.131 |
wick | -3.927 |
RG | -3.755 |
wives | -3.717 |
CLA | -3.680 |
Token | in |
Token ID | 287 |
Feature activation | +9.26e+00 |
Pos logit contributions | |
ught | +1.246 |
wick | +1.164 |
wives | +1.104 |
RG | +1.084 |
CLA | +1.078 |
Neg logit contributions | |
aber | -1.245 |
nl | -1.136 |
Causes | -1.056 |
owa | -1.010 |
[' | -1.005 |
Token | the |
Token ID | 262 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
aber | +6.032 |
nl | +5.489 |
Causes | +5.254 |
[' | +5.017 |
owa | +4.916 |
Neg logit contributions | |
ught | -6.783 |
wick | -6.475 |
wives | -6.165 |
CLA | -6.164 |
RG | -6.130 |
Token | mall |
Token ID | 17374 |
Feature activation | +3.74e+00 |
Pos logit contributions | |
aber | +0.999 |
nl | +0.918 |
Causes | +0.863 |
[' | +0.830 |
owa | +0.821 |
Neg logit contributions | |
ught | -0.941 |
wick | -0.882 |
wives | -0.836 |
RG | -0.828 |
CLA | -0.819 |
Token | / |
Token ID | 1220 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
aber | +5.881 |
nl | +5.373 |
[' | +4.947 |
Causes | +4.686 |
owa | +4.656 |
Neg logit contributions | |
ught | -7.364 |
wick | -6.805 |
wives | -6.603 |
elin | -6.432 |
CLA | -6.420 |
Token | _ |
Token ID | 4808 |
Feature activation | +8.30e+00 |
Pos logit contributions | |
aber | +2.170 |
nl | +1.964 |
Causes | +1.817 |
[' | +1.760 |
owa | +1.736 |
Neg logit contributions | |
ught | -2.405 |
wick | -2.240 |
wives | -2.178 |
RG | -2.136 |
CLA | -2.119 |
Token | P |
Token ID | 47 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
aber | +5.196 |
nl | +4.716 |
[' | +4.227 |
EE | +4.150 |
Causes | +4.133 |
Neg logit contributions | |
ught | -6.488 |
wick | -6.049 |
wives | -5.949 |
elin | -5.859 |
riz | -5.718 |
Token | ulse |
Token ID | 9615 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
aber | +0.117 |
nl | +0.109 |
Causes | +0.102 |
[' | +0.099 |
owa | +0.099 |
Neg logit contributions | |
ught | -0.078 |
wick | -0.072 |
wives | -0.067 |
RG | -0.066 |
CLA | -0.065 |
Token | Per |
Token ID | 5990 |
Feature activation | +7.44e+00 |
Pos logit contributions | |
aber | +7.030 |
nl | +6.729 |
[' | +6.399 |
EE | +6.010 |
Causes | +5.700 |
Neg logit contributions | |
ught | -12.527 |
tradem | -12.388 |
agos | -11.634 |
ewitness | -11.620 |
wick | -11.582 |
Token | iod |
Token ID | 2101 |
Feature activation | +1.95e+01 |
Pos logit contributions | |
aber | +5.571 |
nl | +5.235 |
Causes | +4.672 |
owa | +4.638 |
[' | +4.595 |
Neg logit contributions | |
ught | -4.910 |
wick | -4.557 |
RG | -4.537 |
tradem | -4.439 |
wives | -4.434 |
Token | * |
Token ID | 1635 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
aber | +9.584 |
[' | +9.069 |
nl | +8.656 |
EE | +7.525 |
Causes | +7.466 |
Neg logit contributions | |
ught | -14.460 |
wives | -13.429 |
wick | -13.258 |
ewitness | -12.998 |
elin | -12.973 |
Token | TA |
Token ID | 21664 |
Feature activation | +7.66e+00 |
Pos logit contributions | |
aber | +1.246 |
nl | +1.125 |
Causes | +1.045 |
[' | +1.004 |
owa | +0.991 |
Neg logit contributions | |
ught | -1.423 |
wick | -1.336 |
wives | -1.286 |
RG | -1.267 |
CLA | -1.256 |
Token | U |
Token ID | 52 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
aber | +3.821 |
nl | +3.439 |
[' | +3.079 |
EE | +2.940 |
Causes | +2.819 |
Neg logit contributions | |
ught | -6.886 |
wick | -6.586 |
wives | -6.574 |
tradem | -6.471 |
elin | -6.464 |
Token | ) |
Token ID | 8 |
Feature activation | +6.91e+00 |
Pos logit contributions | |
aber | +7.505 |
nl | +6.597 |
[' | +6.520 |
EE | +6.055 |
Causes | +5.938 |
Neg logit contributions | |
ught | -11.531 |
wick | -10.628 |
wives | -10.493 |
ewitness | -10.392 |
elin | -10.373 |
Token | + |
Token ID | 1343 |
Feature activation | -4.16e-02 |
Pos logit contributions | |
aber | +4.233 |
nl | +3.824 |
Causes | +3.534 |
[' | +3.451 |
EE | +3.305 |
Neg logit contributions | |
ught | -5.679 |
wick | -5.249 |
wives | -5.063 |
CLA | -5.024 |
elin | -4.975 |
Token | should |
Token ID | 815 |
Feature activation | -2.53e+00 |
Pos logit contributions | |
ught | +2.866 |
wick | +2.678 |
wives | +2.559 |
RG | +2.487 |
CLA | +2.462 |
Neg logit contributions | |
aber | -2.858 |
nl | -2.633 |
Causes | -2.465 |
owa | -2.376 |
[' | -2.350 |
Token | work |
Token ID | 670 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
ught | +1.697 |
wick | +1.582 |
wives | +1.475 |
RG | +1.453 |
CLA | +1.445 |
Neg logit contributions | |
aber | -1.997 |
nl | -1.846 |
Causes | -1.746 |
owa | -1.672 |
[' | -1.666 |
Token | ) |
Token ID | 8 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
aber | +2.357 |
nl | +2.103 |
Causes | +1.922 |
[' | +1.872 |
owa | +1.852 |
Neg logit contributions | |
ught | -3.012 |
wick | -2.849 |
RG | -2.722 |
wives | -2.715 |
riz | -2.690 |
Token |
|
Token ID | 198 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
ught | +0.930 |
wick | +0.871 |
wives | +0.824 |
RG | +0.813 |
CLA | +0.804 |
Neg logit contributions | |
aber | -1.010 |
nl | -0.927 |
Causes | -0.862 |
[' | -0.835 |
owa | -0.834 |
Token |
|
Token ID | 198 |
Feature activation | +7.05e+00 |
Pos logit contributions | |
ught | +0.840 |
wick | +0.788 |
wives | +0.744 |
RG | +0.737 |
CLA | +0.728 |
Neg logit contributions | |
aber | -0.951 |
nl | -0.867 |
Causes | -0.816 |
owa | -0.788 |
[' | -0.780 |
Token | 1 |
Token ID | 16 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
aber | +4.643 |
nl | +4.238 |
[' | +3.773 |
Causes | +3.673 |
owa | +3.652 |
Neg logit contributions | |
ught | -5.339 |
wick | -5.027 |
wives | -4.815 |
elin | -4.810 |
RG | -4.762 |
Token | thumbnail |
Token ID | 40901 |
Feature activation | +4.57e+00 |
Pos logit contributions | |
aber | +11.662 |
nl | +11.114 |
gy | +9.706 |
xe | +9.683 |
de | +9.376 |
Neg logit contributions | |
ught | -11.358 |
wives | -11.202 |
wick | -11.174 |
acci | -10.973 |
agos | -10.832 |
Token | of |
Token ID | 286 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
aber | +3.183 |
nl | +2.891 |
Causes | +2.684 |
[' | +2.580 |
owa | +2.551 |
Neg logit contributions | |
ught | -3.400 |
wick | -3.219 |
wives | -3.057 |
RG | -3.057 |
CLA | -3.019 |
Token | baking |
Token ID | 16871 |
Feature activation | +4.31e+00 |
Pos logit contributions | |
ught | +0.886 |
wick | +0.828 |
wives | +0.785 |
RG | +0.774 |
CLA | +0.767 |
Neg logit contributions | |
aber | -0.908 |
nl | -0.829 |
Causes | -0.770 |
[' | -0.744 |
owa | -0.743 |
Token | yeast |
Token ID | 20146 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
aber | +3.095 |
nl | +2.906 |
Causes | +2.667 |
[' | +2.562 |
owa | +2.547 |
Neg logit contributions | |
ught | -3.098 |
wick | -2.863 |
RG | -2.746 |
wives | -2.731 |
CLA | -2.722 |
Token |
|
Token ID | 198 |
Feature activation | -2.76e+00 |
Pos logit contributions | |
ught | +1.613 |
wick | +1.514 |
wives | +1.431 |
RG | +1.412 |
CLA | +1.398 |
Neg logit contributions | |
aber | -1.653 |
nl | -1.512 |
Causes | -1.399 |
owa | -1.364 |
[' | -1.359 |
Token | � |
Token ID | 447 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
aber | +3.188 |
nl | +2.893 |
Causes | +2.614 |
[' | +2.592 |
owa | +2.543 |
Neg logit contributions | |
ught | -4.426 |
wick | -4.103 |
RG | -4.019 |
wives | -4.001 |
CLA | -3.915 |
Token | � |
Token ID | 247 |
Feature activation | +8.47e+00 |
Pos logit contributions | |
aber | +1.954 |
nl | +1.758 |
Causes | +1.596 |
[' | +1.583 |
owa | +1.498 |
Neg logit contributions | |
ught | -2.976 |
wick | -2.793 |
wives | -2.709 |
RG | -2.648 |
CLA | -2.629 |
Token | s |
Token ID | 82 |
Feature activation | +3.41e+00 |
Pos logit contributions | |
aber | +4.611 |
nl | +4.303 |
[' | +3.794 |
Causes | +3.770 |
owa | +3.579 |
Neg logit contributions | |
ught | -7.222 |
wick | -6.720 |
RG | -6.611 |
wives | -6.592 |
CLA | -6.434 |
Token | late |
Token ID | 2739 |
Feature activation | +4.41e+00 |
Pos logit contributions | |
aber | +2.498 |
nl | +2.302 |
Causes | +2.151 |
[' | +2.093 |
owa | +2.069 |
Neg logit contributions | |
ught | -2.409 |
wick | -2.282 |
wives | -2.173 |
RG | -2.162 |
CLA | -2.129 |
Token | equal |
Token ID | 4961 |
Feature activation | +2.56e+00 |
Pos logit contributions | |
aber | +3.244 |
nl | +2.974 |
Causes | +2.762 |
[' | +2.685 |
owa | +2.660 |
Neg logit contributions | |
ught | -3.072 |
wick | -2.906 |
RG | -2.795 |
wives | -2.781 |
CLA | -2.735 |
Token | iser |
Token ID | 5847 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
aber | +1.112 |
nl | +0.954 |
Causes | +0.829 |
[' | +0.771 |
owa | +0.762 |
Neg logit contributions | |
ught | -2.636 |
wick | -2.512 |
wives | -2.432 |
RG | -2.416 |
CLA | -2.392 |
Token | from |
Token ID | 422 |
Feature activation | +6.30e+00 |
Pos logit contributions | |
aber | +9.583 |
nl | +8.776 |
Causes | +8.088 |
owa | +7.992 |
gy | +7.913 |
Neg logit contributions | |
ught | -14.010 |
RG | -13.007 |
wick | -12.880 |
riz | -12.618 |
wives | -12.565 |
Token | a |
Token ID | 257 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
aber | +4.324 |
nl | +3.972 |
Causes | +3.714 |
[' | +3.540 |
owa | +3.494 |
Neg logit contributions | |
ught | -4.701 |
wick | -4.372 |
RG | -4.231 |
wives | -4.210 |
CLA | -4.129 |
Token | corner |
Token ID | 5228 |
Feature activation | +8.17e+00 |
Pos logit contributions | |
aber | +3.106 |
nl | +2.895 |
Causes | +2.666 |
[' | +2.586 |
owa | +2.564 |
Neg logit contributions | |
ught | -2.809 |
wick | -2.678 |
wives | -2.558 |
RG | -2.520 |
CLA | -2.468 |
Token | , |
Token ID | 11 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
aber | +5.131 |
nl | +4.584 |
Causes | +4.138 |
[' | +4.053 |
owa | +4.037 |
Neg logit contributions | |
ught | -6.505 |
wick | -6.015 |
RG | -5.991 |
CLA | -5.922 |
wives | -5.861 |
Token | it |
Token ID | 340 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
aber | +8.117 |
nl | +7.788 |
Causes | +7.154 |
owa | +6.919 |
[' | +6.901 |
Neg logit contributions | |
ught | -9.505 |
wick | -8.624 |
wives | -8.453 |
RG | -8.452 |
riz | -8.340 |
Token | of |
Token ID | 286 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
ught | +1.329 |
wick | +1.246 |
wives | +1.184 |
RG | +1.171 |
CLA | +1.155 |
Neg logit contributions | |
aber | -1.275 |
nl | -1.156 |
Causes | -1.085 |
owa | -1.035 |
[' | -1.024 |
Token | reaction |
Token ID | 6317 |
Feature activation | +7.09e-01 |
Pos logit contributions | |
aber | +1.222 |
nl | +1.130 |
Causes | +1.053 |
[' | +1.028 |
owa | +1.018 |
Neg logit contributions | |
ught | -1.017 |
wick | -0.952 |
wives | -0.899 |
RG | -0.886 |
CLA | -0.878 |
Token | ," |
Token ID | 553 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
aber | +0.502 |
nl | +0.458 |
Causes | +0.424 |
[' | +0.410 |
owa | +0.407 |
Neg logit contributions | |
ught | -0.534 |
wick | -0.502 |
wives | -0.478 |
RG | -0.473 |
CLA | -0.468 |
Token | Ger |
Token ID | 13573 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
aber | +6.285 |
nl | +5.555 |
Causes | +5.182 |
[' | +4.914 |
gy | +4.748 |
Neg logit contributions | |
ught | -8.993 |
wick | -8.455 |
wives | -8.434 |
elin | -8.190 |
CLA | -8.122 |
Token | ads |
Token ID | 5643 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
aber | +0.148 |
nl | +0.130 |
Causes | +0.116 |
[' | +0.110 |
owa | +0.109 |
Neg logit contributions | |
ught | -0.273 |
wick | -0.260 |
wives | -0.250 |
RG | -0.249 |
CLA | -0.247 |
Token | tells |
Token ID | 4952 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
aber | +1.512 |
nl | +1.367 |
Causes | +1.264 |
[' | +1.227 |
owa | +1.216 |
Neg logit contributions | |
ught | -1.686 |
wick | -1.579 |
wives | -1.514 |
RG | -1.496 |
CLA | -1.479 |
Token | Heat |
Token ID | 12308 |
Feature activation | +2.84e-01 |
Pos logit contributions | |
aber | +11.637 |
nl | +10.288 |
Causes | +9.901 |
EE | +9.328 |
[' | +9.145 |
Neg logit contributions | |
ught | -12.294 |
wives | -11.372 |
elin | -11.232 |
CLA | -11.190 |
wick | -11.149 |
Token | Vision |
Token ID | 19009 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
aber | +0.202 |
nl | +0.184 |
Causes | +0.171 |
[' | +0.164 |
owa | +0.163 |
Neg logit contributions | |
ught | -0.214 |
wick | -0.201 |
wives | -0.191 |
RG | -0.189 |
CLA | -0.187 |
Token | via |
Token ID | 2884 |
Feature activation | +2.85e+00 |
Pos logit contributions | |
aber | +1.323 |
nl | +1.197 |
Causes | +1.097 |
[' | +1.056 |
owa | +1.053 |
Neg logit contributions | |
ught | -1.601 |
wick | -1.503 |
wives | -1.439 |
RG | -1.425 |
CLA | -1.418 |
Token | phone |
Token ID | 3072 |
Feature activation | +5.33e+00 |
Pos logit contributions | |
aber | +2.224 |
nl | +2.027 |
Causes | +1.906 |
[' | +1.828 |
owa | +1.825 |
Neg logit contributions | |
ught | -1.940 |
wick | -1.792 |
wives | -1.722 |
RG | -1.690 |
CLA | -1.685 |
Token | . |
Token ID | 13 |
Feature activation | +7.43e+00 |
Pos logit contributions | |
aber | +3.358 |
nl | +2.981 |
Causes | +2.717 |
[' | +2.575 |
owa | +2.559 |
Neg logit contributions | |
ught | -4.416 |
wick | -4.178 |
wives | -4.011 |
RG | -3.928 |
elin | -3.926 |
Token | Caps |
Token ID | 23534 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
aber | +6.947 |
nl | +6.339 |
Causes | +6.075 |
owa | +5.751 |
[' | +5.718 |
Neg logit contributions | |
ught | -8.447 |
wick | -7.934 |
RG | -7.685 |
wives | -7.667 |
CLA | -7.589 |
Token | knew |
Token ID | 2993 |
Feature activation | +6.38e+00 |
Pos logit contributions | |
aber | +1.282 |
nl | +1.169 |
Causes | +1.081 |
[' | +1.050 |
owa | +1.042 |
Neg logit contributions | |
ught | -1.398 |
wick | -1.313 |
wives | -1.247 |
RG | -1.243 |
CLA | -1.221 |
Token | that |
Token ID | 326 |
Feature activation | +7.20e+00 |
Pos logit contributions | |
aber | +4.057 |
nl | +3.740 |
Causes | +3.421 |
[' | +3.373 |
owa | +3.317 |
Neg logit contributions | |
ught | -4.959 |
wick | -4.774 |
wives | -4.568 |
RG | -4.484 |
CLA | -4.472 |
Token | a |
Token ID | 257 |
Feature activation | +7.77e+00 |
Pos logit contributions | |
aber | +4.683 |
nl | +4.327 |
Causes | +4.001 |
[' | +3.943 |
owa | +3.870 |
Neg logit contributions | |
ught | -5.424 |
wick | -5.145 |
wives | -4.979 |
RG | -4.917 |
CLA | -4.862 |
Token | second |
Token ID | 1218 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
aber | +5.397 |
nl | +5.001 |
Causes | +4.523 |
owa | +4.504 |
[' | +4.467 |
Neg logit contributions | |
ught | -5.422 |
wick | -5.325 |
wives | -5.071 |
RG | -4.932 |
CLA | -4.853 |
Token | goal |
Token ID | 3061 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
aber | +8.552 |
nl | +7.903 |
owa | +7.267 |
Causes | +7.116 |
[' | +7.035 |
Neg logit contributions | |
ught | -8.751 |
wick | -8.535 |
wives | -8.304 |
RG | -8.067 |
CLA | -8.028 |
Token | could |
Token ID | 714 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
aber | +9.716 |
nl | +8.766 |
[' | +8.001 |
owa | +7.945 |
gy | +7.855 |
Neg logit contributions | |
ught | -13.582 |
RG | -13.489 |
wick | -13.479 |
CLA | -12.837 |
agos | -12.732 |
Token | probably |
Token ID | 2192 |
Feature activation | +8.45e-01 |
Pos logit contributions | |
aber | +1.591 |
nl | +1.457 |
Causes | +1.341 |
[' | +1.321 |
owa | +1.310 |
Neg logit contributions | |
ught | -1.588 |
wick | -1.498 |
RG | -1.419 |
wives | -1.419 |
riz | -1.389 |
Token | be |
Token ID | 307 |
Feature activation | -4.00e+00 |
Pos logit contributions | |
aber | +0.632 |
nl | +0.579 |
Causes | +0.537 |
[' | +0.523 |
owa | +0.520 |
Neg logit contributions | |
ught | -0.601 |
wick | -0.565 |
wives | -0.535 |
RG | -0.533 |
CLA | -0.523 |
Token | enough |
Token ID | 1576 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
ught | +2.779 |
wick | +2.616 |
wives | +2.494 |
RG | +2.419 |
CLA | +2.401 |
Neg logit contributions | |
aber | -2.994 |
nl | -2.767 |
Causes | -2.600 |
owa | -2.487 |
[' | -2.483 |
Token | to |
Token ID | 284 |
Feature activation | -7.95e+00 |
Pos logit contributions | |
aber | +1.085 |
nl | +0.992 |
Causes | +0.918 |
[' | +0.884 |
owa | +0.881 |
Neg logit contributions | |
ught | -1.178 |
wick | -1.111 |
wives | -1.055 |
RG | -1.047 |
CLA | -1.032 |
Token | was |
Token ID | 373 |
Feature activation | +2.52e+00 |
Pos logit contributions | |
aber | +2.893 |
nl | +2.645 |
Causes | +2.459 |
[' | +2.370 |
owa | +2.332 |
Neg logit contributions | |
ught | -3.350 |
wick | -3.146 |
wives | -3.013 |
RG | -3.000 |
CLA | -2.956 |
Token | arrested |
Token ID | 5169 |
Feature activation | +5.30e+00 |
Pos logit contributions | |
aber | +1.775 |
nl | +1.631 |
Causes | +1.497 |
[' | +1.454 |
owa | +1.433 |
Neg logit contributions | |
ught | -1.896 |
wick | -1.783 |
wives | -1.697 |
RG | -1.681 |
CLA | -1.664 |
Token | and |
Token ID | 290 |
Feature activation | +7.02e+00 |
Pos logit contributions | |
aber | +3.586 |
nl | +3.224 |
Causes | +3.008 |
[' | +2.959 |
owa | +2.819 |
Neg logit contributions | |
ught | -4.087 |
wick | -3.799 |
wives | -3.627 |
RG | -3.619 |
riz | -3.590 |
Token | charged |
Token ID | 5047 |
Feature activation | +5.94e+00 |
Pos logit contributions | |
aber | +4.299 |
nl | +3.992 |
Causes | +3.710 |
[' | +3.636 |
owa | +3.401 |
Neg logit contributions | |
ught | -5.560 |
wick | -5.312 |
wives | -5.089 |
RG | -5.038 |
riz | -4.997 |
Token | with |
Token ID | 351 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
aber | +3.815 |
nl | +3.356 |
Causes | +3.129 |
[' | +3.063 |
owa | +2.931 |
Neg logit contributions | |
ught | -4.752 |
wick | -4.448 |
RG | -4.245 |
wives | -4.236 |
elin | -4.217 |
Token | felony |
Token ID | 14544 |
Feature activation | +1.87e+01 |
Pos logit contributions | |
aber | +9.426 |
nl | +8.797 |
receiving | +8.711 |
Causes | +8.462 |
[' | +8.155 |
Neg logit contributions | |
ught | -11.633 |
wick | -11.232 |
wives | -11.079 |
CLA | -10.977 |
RG | -10.764 |
Token | theft |
Token ID | 12402 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
aber | +9.992 |
nl | +9.107 |
receiving | +8.896 |
Causes | +8.815 |
[' | +8.639 |
Neg logit contributions | |
ught | -12.786 |
wick | -12.400 |
wives | -12.179 |
RG | -12.170 |
CLA | -12.094 |
Token | . |
Token ID | 13 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
aber | +8.403 |
nl | +7.128 |
[' | +6.921 |
Causes | +6.686 |
receiving | +6.484 |
Neg logit contributions | |
ught | -13.834 |
wick | -12.845 |
RG | -12.683 |
CLA | -12.615 |
agos | -12.392 |
Token |
|
Token ID | 198 |
Feature activation | +3.05e+00 |
Pos logit contributions | |
aber | +1.598 |
nl | +1.477 |
Causes | +1.381 |
[' | +1.325 |
owa | +1.295 |
Neg logit contributions | |
ught | -1.661 |
wick | -1.542 |
wives | -1.470 |
RG | -1.454 |
elin | -1.434 |
Token |
|
Token ID | 198 |
Feature activation | +8.38e-01 |
Pos logit contributions | |
aber | +2.095 |
nl | +1.949 |
Causes | +1.768 |
[' | +1.752 |
owa | +1.685 |
Neg logit contributions | |
ught | -2.335 |
wick | -2.170 |
wives | -2.073 |
RG | -2.049 |
CLA | -2.034 |
Token | According |
Token ID | 4821 |
Feature activation | -4.45e+00 |
Pos logit contributions | |
aber | +0.609 |
nl | +0.559 |
Causes | +0.516 |
[' | +0.503 |
owa | +0.496 |
Neg logit contributions | |
ught | -0.615 |
wick | -0.576 |
wives | -0.547 |
RG | -0.540 |
CLA | -0.534 |
Token | be |
Token ID | 307 |
Feature activation | +2.99e+00 |
Pos logit contributions | |
aber | +1.857 |
nl | +1.697 |
Causes | +1.550 |
[' | +1.519 |
owa | +1.512 |
Neg logit contributions | |
ught | -2.118 |
wick | -1.999 |
RG | -1.925 |
wives | -1.918 |
riz | -1.883 |
Token | seated |
Token ID | 21639 |
Feature activation | -5.33e-01 |
Pos logit contributions | |
aber | +2.280 |
nl | +2.111 |
Causes | +1.946 |
[' | +1.909 |
owa | +1.890 |
Neg logit contributions | |
ught | -2.058 |
wick | -1.925 |
RG | -1.829 |
wives | -1.821 |
riz | -1.790 |
Token | in |
Token ID | 287 |
Feature activation | +6.38e+00 |
Pos logit contributions | |
ught | +0.394 |
wick | +0.370 |
wives | +0.351 |
RG | +0.347 |
CLA | +0.344 |
Neg logit contributions | |
aber | -0.384 |
nl | -0.351 |
Causes | -0.328 |
[' | -0.314 |
owa | -0.314 |
Token | the |
Token ID | 262 |
Feature activation | +6.18e+00 |
Pos logit contributions | |
aber | +4.268 |
nl | +3.903 |
Causes | +3.622 |
[' | +3.528 |
owa | +3.431 |
Neg logit contributions | |
ught | -4.815 |
wick | -4.555 |
wives | -4.393 |
RG | -4.371 |
CLA | -4.362 |
Token | theater |
Token ID | 13766 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
aber | +4.183 |
nl | +3.845 |
Causes | +3.563 |
[' | +3.464 |
owa | +3.390 |
Neg logit contributions | |
ught | -4.608 |
wick | -4.335 |
RG | -4.183 |
wives | -4.182 |
CLA | -4.130 |
Token | after |
Token ID | 706 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
ught | +0.880 |
wick | +0.825 |
wives | +0.782 |
RG | +0.771 |
CLA | +0.763 |
Neg logit contributions | |
aber | -0.867 |
nl | -0.789 |
Causes | -0.739 |
[' | -0.703 |
owa | -0.703 |
Token | Psycho |
Token ID | 38955 |
Feature activation | -2.99e+00 |
Pos logit contributions | |
aber | +10.728 |
nl | +9.797 |
receiving | +9.277 |
[' | +8.962 |
Causes | +8.837 |
Neg logit contributions | |
ught | -12.056 |
RG | -11.661 |
elin | -11.448 |
CLA | -11.410 |
riz | -11.370 |
Token | 's |
Token ID | 338 |
Feature activation | +4.24e+00 |
Pos logit contributions | |
ught | +2.221 |
wick | +2.112 |
wives | +1.986 |
RG | +1.938 |
CLA | +1.935 |
Neg logit contributions | |
aber | -2.132 |
nl | -1.935 |
Causes | -1.794 |
[' | -1.715 |
owa | -1.715 |
Token | opening |
Token ID | 29443 |
Feature activation | +3.96e+00 |
Pos logit contributions | |
aber | +3.086 |
nl | +2.862 |
Causes | +2.666 |
[' | +2.569 |
owa | +2.543 |
Neg logit contributions | |
ught | -3.005 |
wick | -2.849 |
RG | -2.710 |
wives | -2.709 |
CLA | -2.647 |
Token | credits |
Token ID | 10824 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
aber | +2.649 |
nl | +2.442 |
Causes | +2.227 |
[' | +2.167 |
owa | +2.129 |
Neg logit contributions | |
ught | -3.068 |
wick | -2.905 |
RG | -2.761 |
wives | -2.756 |
elin | -2.715 |
Token | , |
Token ID | 11 |
Feature activation | +2.52e+00 |
Pos logit contributions | |
aber | +0.398 |
nl | +0.362 |
Causes | +0.335 |
[' | +0.322 |
owa | +0.321 |
Neg logit contributions | |
ught | -0.445 |
wick | -0.419 |
wives | -0.399 |
RG | -0.395 |
CLA | -0.391 |
Token | the |
Token ID | 262 |
Feature activation | -5.64e+00 |
Pos logit contributions | |
ught | +3.705 |
wick | +3.492 |
wives | +3.347 |
RG | +3.302 |
riz | +3.268 |
Neg logit contributions | |
aber | -2.843 |
nl | -2.553 |
Causes | -2.299 |
owa | -2.248 |
[' | -2.213 |
Token | year |
Token ID | 614 |
Feature activation | +3.35e+00 |
Pos logit contributions | |
ught | +4.030 |
wick | +3.739 |
wives | +3.574 |
RG | +3.477 |
elin | +3.458 |
Neg logit contributions | |
aber | -4.120 |
nl | -3.753 |
Causes | -3.429 |
owa | -3.374 |
[' | -3.339 |
Token | . |
Token ID | 13 |
Feature activation | +2.63e+00 |
Pos logit contributions | |
aber | +2.184 |
nl | +1.979 |
Causes | +1.826 |
[' | +1.755 |
owa | +1.733 |
Neg logit contributions | |
ught | -2.691 |
wick | -2.537 |
RG | -2.414 |
wives | -2.401 |
CLA | -2.377 |
Token | Happy |
Token ID | 14628 |
Feature activation | +9.88e+00 |
Pos logit contributions | |
aber | +1.847 |
nl | +1.718 |
Causes | +1.599 |
[' | +1.520 |
owa | +1.493 |
Neg logit contributions | |
ught | -1.990 |
wick | -1.857 |
wives | -1.764 |
RG | -1.744 |
CLA | -1.730 |
Token | Hol |
Token ID | 6479 |
Feature activation | +6.97e+00 |
Pos logit contributions | |
aber | +6.288 |
nl | +5.813 |
Causes | +5.707 |
[' | +5.253 |
EE | +5.049 |
Neg logit contributions | |
ught | -7.450 |
wick | -6.804 |
CLA | -6.562 |
wives | -6.523 |
RG | -6.516 |
Token | idays |
Token ID | 13842 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
aber | +3.545 |
nl | +3.150 |
Causes | +2.767 |
owa | +2.711 |
[' | +2.671 |
Neg logit contributions | |
ught | -6.483 |
wick | -6.015 |
RG | -5.869 |
wives | -5.831 |
CLA | -5.822 |
Token | ! |
Token ID | 0 |
Feature activation | +7.15e+00 |
Pos logit contributions | |
aber | +9.814 |
nl | +9.137 |
Causes | +8.554 |
[' | +8.222 |
EE | +8.059 |
Neg logit contributions | |
ught | -13.232 |
wick | -11.994 |
CLA | -11.855 |
RG | -11.787 |
riz | -11.597 |
Token | -- |
Token ID | 1377 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
aber | +4.648 |
nl | +4.381 |
Causes | +4.065 |
[' | +3.808 |
owa | +3.725 |
Neg logit contributions | |
ught | -5.482 |
wick | -5.088 |
RG | -4.836 |
wives | -4.818 |
CLA | -4.811 |
Token | Remy |
Token ID | 32912 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
aber | +7.396 |
nl | +7.049 |
Causes | +6.393 |
[' | +6.252 |
EE | +6.142 |
Neg logit contributions | |
ught | -7.249 |
wick | -6.594 |
wives | -6.327 |
agos | -6.217 |
elin | -6.165 |
Token |
|
Token ID | 198 |
Feature activation | +3.13e+00 |
Pos logit contributions | |
aber | +1.085 |
nl | +0.993 |
Causes | +0.922 |
[' | +0.889 |
owa | +0.882 |
Neg logit contributions | |
ught | -1.122 |
wick | -1.049 |
wives | -0.999 |
RG | -0.987 |
CLA | -0.978 |
Token |
|
Token ID | 198 |
Feature activation | +3.07e+00 |
Pos logit contributions | |
aber | +2.184 |
nl | +2.025 |
Causes | +1.847 |
[' | +1.818 |
EE | +1.749 |
Neg logit contributions | |
ught | -2.384 |
wick | -2.207 |
wives | -2.104 |
elin | -2.056 |
riz | -2.051 |
Token | under |
Token ID | 739 |
Feature activation | -4.56e+00 |
Pos logit contributions | |
aber | +2.079 |
nl | +1.893 |
Causes | +1.749 |
[' | +1.710 |
owa | +1.676 |
Neg logit contributions | |
ught | -2.392 |
wick | -2.239 |
wives | -2.132 |
RG | -2.122 |
CLA | -2.099 |
Token | Title |
Token ID | 11851 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
ught | +2.988 |
wick | +2.832 |
RG | +2.652 |
wives | +2.636 |
CLA | +2.626 |
Neg logit contributions | |
aber | -3.605 |
nl | -3.292 |
Causes | -3.013 |
[' | -2.911 |
owa | -2.896 |
Token | VI |
Token ID | 13889 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
ught | +0.569 |
wick | +0.533 |
wives | +0.493 |
CLA | +0.480 |
RG | +0.479 |
Neg logit contributions | |
aber | -1.083 |
nl | -0.994 |
Causes | -0.937 |
[' | -0.918 |
owa | -0.907 |
Token | of |
Token ID | 286 |
Feature activation | -5.90e-01 |
Pos logit contributions | |
aber | +1.061 |
nl | +0.970 |
Causes | +0.899 |
[' | +0.867 |
owa | +0.860 |
Neg logit contributions | |
ught | -1.247 |
wick | -1.177 |
wives | -1.120 |
RG | -1.107 |
CLA | -1.092 |
Token | the |
Token ID | 262 |
Feature activation | +3.88e+00 |
Pos logit contributions | |
ught | +0.414 |
wick | +0.390 |
wives | +0.368 |
RG | +0.365 |
CLA | +0.362 |
Neg logit contributions | |
aber | -0.448 |
nl | -0.408 |
Causes | -0.381 |
[' | -0.366 |
owa | -0.365 |
Token | Civil |
Token ID | 7511 |
Feature activation | +1.84e+01 |
Pos logit contributions | |
aber | +2.468 |
nl | +2.281 |
Causes | +2.122 |
[' | +2.024 |
owa | +2.019 |
Neg logit contributions | |
ught | -3.184 |
wick | -2.962 |
wives | -2.859 |
RG | -2.828 |
elin | -2.770 |
Token | Rights |
Token ID | 6923 |
Feature activation | +6.88e+00 |
Pos logit contributions | |
aber | +5.657 |
Causes | +5.195 |
nl | +4.383 |
[' | +3.934 |
Notification | +3.290 |
Neg logit contributions | |
ught | -19.660 |
wives | -17.836 |
agos | -17.713 |
acci | -17.617 |
amination | -17.550 |
Token | Act |
Token ID | 2191 |
Feature activation | +8.42e+00 |
Pos logit contributions | |
aber | +3.366 |
nl | +2.909 |
Causes | +2.688 |
[' | +2.525 |
owa | +2.360 |
Neg logit contributions | |
ught | -6.720 |
wick | -6.352 |
wives | -6.179 |
RG | -6.127 |
elin | -6.045 |
Token | of |
Token ID | 286 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
aber | +4.812 |
nl | +4.353 |
Causes | +4.039 |
[' | +4.036 |
owa | +3.874 |
Neg logit contributions | |
ught | -7.184 |
wick | -6.643 |
RG | -6.439 |
wives | -6.339 |
elin | -6.289 |
Token | 1964 |
Token ID | 17575 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
aber | +3.615 |
nl | +3.498 |
Causes | +3.345 |
[' | +3.163 |
owa | +2.897 |
Neg logit contributions | |
ught | -10.865 |
wives | -10.143 |
RG | -10.132 |
wick | -10.009 |
elin | -9.918 |
Token | . |
Token ID | 13 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
ught | +0.897 |
wick | +0.845 |
wives | +0.805 |
RG | +0.794 |
CLA | +0.787 |
Neg logit contributions | |
aber | -0.833 |
nl | -0.760 |
Causes | -0.704 |
owa | -0.673 |
[' | -0.672 |
Token | owed |
Token ID | 6972 |
Feature activation | +5.83e+00 |
Pos logit contributions | |
aber | +1.855 |
nl | +1.619 |
Causes | +1.436 |
owa | +1.402 |
[' | +1.386 |
Neg logit contributions | |
ught | -3.209 |
wick | -3.061 |
wives | -2.960 |
RG | -2.928 |
CLA | -2.920 |
Token | only |
Token ID | 691 |
Feature activation | +8.87e+00 |
Pos logit contributions | |
aber | +3.904 |
nl | +3.604 |
Causes | +3.320 |
owa | +3.208 |
[' | +3.201 |
Neg logit contributions | |
ught | -4.446 |
wick | -4.189 |
wives | -3.990 |
RG | -3.987 |
CLA | -3.887 |
Token | a |
Token ID | 257 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
aber | +5.589 |
nl | +5.145 |
Causes | +4.748 |
owa | +4.567 |
[' | +4.532 |
Neg logit contributions | |
ught | -6.890 |
wick | -6.417 |
RG | -6.167 |
wives | -6.118 |
CLA | -6.033 |
Token | brief |
Token ID | 4506 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
aber | +7.361 |
nl | +6.993 |
Causes | +6.360 |
owa | +6.302 |
gy | +6.180 |
Neg logit contributions | |
ught | -6.834 |
wick | -6.625 |
wives | -6.360 |
RG | -6.264 |
CLA | -6.060 |
Token | , |
Token ID | 11 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
aber | +9.190 |
nl | +8.584 |
gy | +7.797 |
owa | +7.762 |
Causes | +7.681 |
Neg logit contributions | |
ught | -8.798 |
wick | -8.522 |
wives | -8.312 |
RG | -8.114 |
CLA | -7.839 |
Token | non |
Token ID | 1729 |
Feature activation | +1.84e+01 |
Pos logit contributions | |
aber | +7.854 |
nl | +7.292 |
Causes | +6.693 |
owa | +6.578 |
gy | +6.557 |
Neg logit contributions | |
ught | -7.723 |
wick | -7.384 |
wives | -6.937 |
RG | -6.918 |
CLA | -6.750 |
Token | - |
Token ID | 12 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
aber | +10.480 |
nl | +9.831 |
de | +8.744 |
gy | +8.707 |
owa | +8.566 |
Neg logit contributions | |
ught | -12.680 |
wick | -11.822 |
wives | -11.635 |
RG | -11.509 |
unker | -11.323 |
Token | prime |
Token ID | 35505 |
Feature activation | +6.44e+00 |
Pos logit contributions | |
aber | +10.845 |
nl | +10.176 |
de | +9.192 |
gy | +9.050 |
tool | +8.891 |
Neg logit contributions | |
ught | -9.931 |
wick | -9.133 |
curved | -8.775 |
unker | -8.592 |
Certified | -8.577 |
Token | - |
Token ID | 12 |
Feature activation | +7.79e+00 |
Pos logit contributions | |
aber | +4.271 |
nl | +3.909 |
Causes | +3.606 |
owa | +3.518 |
[' | +3.448 |
Neg logit contributions | |
ught | -4.966 |
wick | -4.683 |
wives | -4.512 |
RG | -4.415 |
CLA | -4.373 |
Token | time |
Token ID | 2435 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
aber | +3.540 |
nl | +3.056 |
[' | +2.539 |
Causes | +2.523 |
EE | +2.502 |
Neg logit contributions | |
ught | -7.730 |
wick | -7.219 |
RG | -6.971 |
CLA | -6.935 |
wives | -6.898 |
Token | video |
Token ID | 2008 |
Feature activation | +3.44e+00 |
Pos logit contributions | |
aber | +8.605 |
nl | +8.115 |
Causes | +7.455 |
owa | +7.432 |
[' | +7.267 |
Neg logit contributions | |
ught | -8.443 |
wick | -8.226 |
wives | -8.015 |
RG | -7.754 |
riz | -7.537 |
Token | court |
Token ID | 2184 |
Feature activation | -2.40e+00 |
Pos logit contributions | |
aber | +3.665 |
nl | +3.243 |
Causes | +3.026 |
[' | +2.840 |
EE | +2.763 |
Neg logit contributions | |
ught | -6.671 |
wick | -6.224 |
wives | -6.094 |
CLA | -6.066 |
RG | -5.931 |
Token | on |
Token ID | 319 |
Feature activation | -6.04e+00 |
Pos logit contributions | |
ught | +1.627 |
wick | +1.522 |
wives | +1.450 |
RG | +1.416 |
CLA | +1.404 |
Neg logit contributions | |
aber | -1.877 |
nl | -1.727 |
Causes | -1.602 |
owa | -1.553 |
[' | -1.537 |
Token | the |
Token ID | 262 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
ught | +3.798 |
wick | +3.489 |
wives | +3.267 |
RG | +3.178 |
elin | +3.175 |
Neg logit contributions | |
aber | -4.993 |
nl | -4.555 |
Causes | -4.185 |
owa | -4.169 |
[' | -4.085 |
Token | inter |
Token ID | 987 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
aber | +0.398 |
nl | +0.363 |
Causes | +0.337 |
[' | +0.323 |
owa | +0.321 |
Neg logit contributions | |
ught | -0.437 |
wick | -0.411 |
wives | -0.392 |
RG | -0.388 |
CLA | -0.384 |
Token | lock |
Token ID | 5354 |
Feature activation | +5.50e+00 |
Pos logit contributions | |
aber | +1.454 |
nl | +1.349 |
Causes | +1.271 |
[' | +1.237 |
owa | +1.234 |
Neg logit contributions | |
ught | -0.957 |
wick | -0.872 |
wives | -0.823 |
RG | -0.816 |
CLA | -0.796 |
Token | violation |
Token ID | 8747 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
aber | +3.931 |
nl | +3.601 |
Causes | +3.372 |
[' | +3.243 |
owa | +3.220 |
Neg logit contributions | |
ught | -3.972 |
wick | -3.723 |
RG | -3.569 |
wives | -3.554 |
riz | -3.502 |
Token | on |
Token ID | 319 |
Feature activation | -2.19e+00 |
Pos logit contributions | |
aber | +10.001 |
nl | +9.076 |
Causes | +8.705 |
[' | +8.554 |
EE | +8.427 |
Neg logit contributions | |
ught | -12.718 |
wick | -12.219 |
riz | -12.174 |
RG | -12.051 |
agos | -11.891 |
Token | May |
Token ID | 1737 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
ught | +1.424 |
wick | +1.317 |
wives | +1.238 |
RG | +1.217 |
CLA | +1.204 |
Neg logit contributions | |
aber | -1.785 |
nl | -1.644 |
Causes | -1.526 |
owa | -1.492 |
[' | -1.482 |
Token | 26 |
Token ID | 2608 |
Feature activation | +8.77e+00 |
Pos logit contributions | |
aber | +0.101 |
nl | +0.092 |
Causes | +0.085 |
[' | +0.082 |
owa | +0.082 |
Neg logit contributions | |
ught | -0.114 |
wick | -0.107 |
wives | -0.102 |
RG | -0.101 |
CLA | -0.100 |
Token | . |
Token ID | 13 |
Feature activation | +9.02e+00 |
Pos logit contributions | |
aber | +4.700 |
nl | +4.211 |
Causes | +3.652 |
owa | +3.608 |
[' | +3.503 |
Neg logit contributions | |
ught | -7.698 |
wick | -7.234 |
RG | -7.013 |
wives | -6.973 |
riz | -6.874 |
Token |
|
Token ID | 198 |
Feature activation | -7.31e-01 |
Pos logit contributions | |
aber | +5.472 |
nl | +5.044 |
Causes | +4.743 |
EE | +4.341 |
[' | +4.278 |
Neg logit contributions | |
ught | -7.329 |
wick | -6.634 |
CLA | -6.522 |
RG | -6.448 |
riz | -6.414 |
Token | in |
Token ID | 287 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
ught | +2.337 |
wick | +2.193 |
wives | +2.069 |
RG | +2.058 |
CLA | +2.026 |
Neg logit contributions | |
aber | -2.689 |
nl | -2.461 |
Causes | -2.318 |
owa | -2.224 |
[' | -2.207 |
Token | us |
Token ID | 514 |
Feature activation | -3.81e+00 |
Pos logit contributions | |
aber | +1.046 |
nl | +0.961 |
Causes | +0.893 |
[' | +0.866 |
owa | +0.858 |
Neg logit contributions | |
ught | -1.018 |
wick | -0.956 |
wives | -0.906 |
RG | -0.895 |
CLA | -0.884 |
Token | as |
Token ID | 355 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
ught | +2.750 |
wick | +2.596 |
wives | +2.464 |
RG | +2.436 |
CLA | +2.421 |
Neg logit contributions | |
aber | -2.772 |
nl | -2.519 |
Causes | -2.374 |
owa | -2.262 |
[' | -2.225 |
Token | much |
Token ID | 881 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
aber | +1.301 |
nl | +1.198 |
Causes | +1.105 |
[' | +1.071 |
owa | +1.065 |
Neg logit contributions | |
ught | -1.391 |
wick | -1.308 |
wives | -1.235 |
RG | -1.229 |
riz | -1.215 |
Token | as |
Token ID | 355 |
Feature activation | -3.96e+00 |
Pos logit contributions | |
ught | +1.266 |
wick | +1.189 |
wives | +1.131 |
RG | +1.117 |
CLA | +1.107 |
Neg logit contributions | |
aber | -1.266 |
nl | -1.152 |
Causes | -1.079 |
[' | -1.030 |
owa | -1.030 |
Token | I |
Token ID | 314 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
ught | +2.856 |
wick | +2.652 |
wives | +2.545 |
RG | +2.510 |
CLA | +2.482 |
Neg logit contributions | |
aber | -2.937 |
nl | -2.638 |
Causes | -2.475 |
owa | -2.366 |
[' | -2.356 |
Token | do |
Token ID | 466 |
Feature activation | -8.07e+00 |
Pos logit contributions | |
ught | +10.746 |
riz | +8.749 |
wick | +8.667 |
CLA | +8.434 |
RG | +8.407 |
Neg logit contributions | |
aber | -19.926 |
裏� | -18.040 |
nl | -17.715 |
Causes | -17.509 |
iary | -17.110 |
Token | , |
Token ID | 11 |
Feature activation | -2.36e+00 |
Pos logit contributions | |
ught | +5.496 |
wick | +5.086 |
wives | +4.875 |
RG | +4.868 |
CLA | +4.812 |
Neg logit contributions | |
aber | -5.978 |
nl | -5.339 |
Causes | -5.085 |
owa | -4.804 |
[' | -4.701 |
Token | but |
Token ID | 475 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
ught | +1.753 |
wick | +1.654 |
wives | +1.576 |
RG | +1.568 |
CLA | +1.543 |
Neg logit contributions | |
aber | -1.691 |
nl | -1.524 |
Causes | -1.426 |
owa | -1.370 |
[' | -1.359 |
Token | I |
Token ID | 314 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
ught | +1.157 |
wick | +1.092 |
wives | +1.032 |
RG | +1.030 |
CLA | +1.014 |
Neg logit contributions | |
aber | -1.153 |
nl | -1.047 |
Causes | -0.978 |
[' | -0.935 |
owa | -0.933 |
Token | think |
Token ID | 892 |
Feature activation | -6.64e-03 |
Pos logit contributions | |
ught | +1.469 |
wick | +1.369 |
wives | +1.290 |
RG | +1.277 |
CLA | +1.266 |
Neg logit contributions | |
aber | -1.778 |
nl | -1.638 |
Causes | -1.542 |
[' | -1.464 |
owa | -1.461 |
Token | aud |
Token ID | 3885 |
Feature activation | -5.45e+00 |
Pos logit contributions | |
wick | +7.953 |
ught | +7.952 |
riz | +7.088 |
RG | +6.928 |
CLA | +6.723 |
Neg logit contributions | |
Causes | -15.897 |
裏� | -15.373 |
aber | -14.847 |
nl | -14.412 |
JPM | -13.928 |
Token | Lav |
Token ID | 21438 |
Feature activation | -8.25e-01 |
Pos logit contributions | |
ught | +2.864 |
wick | +2.705 |
CLA | +2.461 |
RG | +2.457 |
wives | +2.406 |
Neg logit contributions | |
aber | -5.002 |
nl | -4.581 |
Causes | -4.319 |
owa | -4.272 |
[' | -4.143 |
Token | o |
Token ID | 78 |
Feature activation | +6.26e+00 |
Pos logit contributions | |
ught | +0.685 |
wick | +0.650 |
wives | +0.619 |
RG | +0.613 |
CLA | +0.606 |
Neg logit contributions | |
aber | -0.520 |
nl | -0.468 |
Causes | -0.434 |
[' | -0.411 |
owa | -0.410 |
Token | ie |
Token ID | 494 |
Feature activation | -4.43e-01 |
Pos logit contributions | |
aber | +2.183 |
nl | +1.920 |
[' | +1.559 |
Causes | +1.426 |
EE | +1.377 |
Neg logit contributions | |
ught | -6.744 |
wick | -6.423 |
tradem | -6.308 |
wives | -6.268 |
RG | -6.263 |
Token | (@ |
Token ID | 4275 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
ught | +0.288 |
wick | +0.268 |
wives | +0.253 |
RG | +0.250 |
CLA | +0.247 |
Neg logit contributions | |
aber | -0.360 |
nl | -0.332 |
Causes | -0.312 |
owa | -0.301 |
[' | -0.301 |
Token | ren |
Token ID | 918 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
ught | +8.333 |
wick | +8.299 |
riz | +7.837 |
elin | +7.716 |
bern | +7.679 |
Neg logit contributions | |
Causes | -9.271 |
aber | -8.932 |
裏� | -8.917 |
UPS | -8.253 |
baskets | -8.090 |
Token | lav |
Token ID | 18809 |
Feature activation | -3.24e+00 |
Pos logit contributions | |
ught | +9.505 |
wick | +9.054 |
CLA | +7.969 |
elin | +7.813 |
wives | +7.635 |
Neg logit contributions | |
裏� | -19.129 |
Causes | -18.363 |
� | -18.258 |
aber | -17.433 |
vertisement | -17.428 |
Token | o |
Token ID | 78 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
ught | +2.545 |
wick | +2.435 |
wives | +2.284 |
RG | +2.252 |
riz | +2.245 |
Neg logit contributions | |
aber | -2.140 |
nl | -1.908 |
Causes | -1.866 |
裏� | -1.716 |
[' | -1.706 |
Token | iet |
Token ID | 1155 |
Feature activation | -8.96e+00 |
Pos logit contributions | |
ught | +0.992 |
wick | +0.944 |
wives | +0.904 |
RG | +0.895 |
CLA | +0.888 |
Neg logit contributions | |
aber | -0.517 |
nl | -0.448 |
Causes | -0.411 |
owa | -0.379 |
[' | -0.376 |
Token | va |
Token ID | 6862 |
Feature activation | +6.03e+00 |
Pos logit contributions | |
ught | +5.600 |
wick | +5.340 |
wives | +4.896 |
CLA | +4.757 |
elin | +4.738 |
Neg logit contributions | |
aber | -7.064 |
Causes | -6.299 |
nl | -6.221 |
裏� | -6.113 |
Customer | -5.842 |
Token | ) |
Token ID | 8 |
Feature activation | -6.35e+00 |
Pos logit contributions | |
aber | +3.123 |
nl | +2.936 |
[' | +2.577 |
Causes | +2.467 |
EE | +2.328 |
Neg logit contributions | |
ught | -5.545 |
tradem | -5.195 |
wick | -5.170 |
wives | -5.003 |
elin | -4.925 |
Token | breaths |
Token ID | 45576 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
ught | +1.649 |
wick | +1.561 |
wives | +1.487 |
RG | +1.457 |
CLA | +1.438 |
Neg logit contributions | |
aber | -1.678 |
nl | -1.538 |
Causes | -1.438 |
[' | -1.381 |
owa | -1.379 |
Token | and |
Token ID | 290 |
Feature activation | +7.56e-01 |
Pos logit contributions | |
ught | +0.946 |
wick | +0.887 |
wives | +0.843 |
RG | +0.826 |
CLA | +0.821 |
Neg logit contributions | |
aber | -0.970 |
nl | -0.890 |
Causes | -0.831 |
[' | -0.797 |
owa | -0.795 |
Token | feeling |
Token ID | 4203 |
Feature activation | -5.30e+00 |
Pos logit contributions | |
aber | +0.575 |
nl | +0.529 |
Causes | +0.493 |
[' | +0.477 |
owa | +0.475 |
Neg logit contributions | |
ught | -0.528 |
wick | -0.495 |
wives | -0.468 |
RG | -0.464 |
CLA | -0.458 |
Token | my |
Token ID | 616 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
ught | +3.567 |
wick | +3.333 |
wives | +3.158 |
RG | +3.097 |
CLA | +3.080 |
Neg logit contributions | |
aber | -4.170 |
nl | -3.723 |
Causes | -3.516 |
owa | -3.343 |
[' | -3.334 |
Token | own |
Token ID | 898 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
ught | +3.180 |
wick | +2.951 |
wives | +2.827 |
riz | +2.762 |
RG | +2.750 |
Neg logit contributions | |
aber | -3.259 |
nl | -2.946 |
Causes | -2.749 |
[' | -2.635 |
owa | -2.609 |
Token | eyes |
Token ID | 2951 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
ught | +7.337 |
wick | +6.651 |
wives | +6.427 |
riz | +6.221 |
CLA | +6.196 |
Neg logit contributions | |
aber | -8.327 |
nl | -7.316 |
Causes | -6.909 |
裏� | -6.579 |
owa | -6.542 |
Token | fill |
Token ID | 6070 |
Feature activation | +2.87e+00 |
Pos logit contributions | |
wick | +12.209 |
ught | +11.988 |
curved | +11.534 |
blaze | +11.069 |
wives | +10.887 |
Neg logit contributions | |
aber | -14.200 |
nl | -13.293 |
Causes | -13.043 |
裏� | -12.881 |
OTAL | -12.452 |
Token | with |
Token ID | 351 |
Feature activation | -5.58e+00 |
Pos logit contributions | |
aber | +1.972 |
nl | +1.782 |
Causes | +1.649 |
[' | +1.602 |
owa | +1.584 |
Neg logit contributions | |
ught | -2.209 |
wick | -2.067 |
wives | -1.989 |
RG | -1.963 |
CLA | -1.951 |
Token | tears |
Token ID | 10953 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
ught | +3.544 |
wick | +3.269 |
wives | +3.089 |
RG | +2.986 |
CLA | +2.969 |
Neg logit contributions | |
aber | -4.555 |
nl | -4.151 |
Causes | -3.922 |
[' | -3.759 |
owa | -3.740 |
Token | . |
Token ID | 13 |
Feature activation | +9.23e-01 |
Pos logit contributions | |
aber | +1.142 |
nl | +1.035 |
Causes | +0.955 |
[' | +0.922 |
owa | +0.917 |
Neg logit contributions | |
ught | -1.344 |
wick | -1.263 |
wives | -1.207 |
RG | -1.200 |
CLA | -1.188 |
Token | The |
Token ID | 383 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
aber | +0.644 |
nl | +0.590 |
Causes | +0.548 |
[' | +0.525 |
owa | +0.520 |
Neg logit contributions | |
ught | -0.706 |
wick | -0.661 |
wives | -0.629 |
RG | -0.623 |
CLA | -0.616 |
Token | Scholar |
Token ID | 11713 |
Feature activation | +2.99e+00 |
Pos logit contributions | |
aber | +2.060 |
nl | +1.926 |
Causes | +1.823 |
[' | +1.772 |
owa | +1.746 |
Neg logit contributions | |
ught | -1.289 |
wick | -1.165 |
wives | -1.101 |
RG | -1.059 |
CLA | -1.057 |
Token | Crossref |
Token ID | 23613 |
Feature activation | -4.84e+00 |
Pos logit contributions | |
aber | +1.752 |
nl | +1.591 |
Causes | +1.467 |
[' | +1.372 |
owa | +1.365 |
Neg logit contributions | |
ught | -2.606 |
wick | -2.440 |
wives | -2.366 |
RG | -2.305 |
CLA | -2.298 |
Token | | |
Token ID | 930 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
ught | +3.146 |
wick | +2.962 |
RG | +2.784 |
wives | +2.757 |
CLA | +2.744 |
Neg logit contributions | |
aber | -3.810 |
nl | -3.474 |
Causes | -3.250 |
owa | -3.158 |
[' | -3.106 |
Token | ISI |
Token ID | 22048 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
ught | +1.059 |
wick | +1.001 |
RG | +0.949 |
wives | +0.942 |
CLA | +0.936 |
Neg logit contributions | |
aber | -1.210 |
nl | -1.089 |
Causes | -1.015 |
owa | -1.001 |
[' | -0.982 |
Token |
|
Token ID | 198 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
wick | +5.169 |
ught | +5.134 |
RG | +4.878 |
CLA | +4.649 |
wives | +4.572 |
Neg logit contributions | |
aber | -9.321 |
nl | -8.291 |
owa | -7.993 |
裏� | -7.921 |
Causes | -7.824 |
Token |
|
Token ID | 198 |
Feature activation | -2.15e+01 |
Pos logit contributions | |
ught | +5.496 |
wick | +5.447 |
RG | +4.985 |
wives | +4.725 |
riz | +4.655 |
Neg logit contributions | |
aber | -11.841 |
vertisement | -10.963 |
nl | -10.545 |
裏� | -10.457 |
� | -10.456 |
Token | Sch |
Token ID | 14874 |
Feature activation | -6.32e+00 |
Pos logit contributions | |
RG | +11.861 |
ught | +11.446 |
wick | +11.204 |
riz | +10.581 |
CLA | +10.384 |
Neg logit contributions | |
aber | -13.960 |
nl | -13.087 |
Causes | -12.967 |
JPM | -12.336 |
owa | -12.114 |
Token | w |
Token ID | 86 |
Feature activation | +8.95e+00 |
Pos logit contributions | |
ught | +4.661 |
wick | +4.456 |
riz | +4.080 |
wives | +4.040 |
elin | +4.021 |
Neg logit contributions | |
aber | -4.290 |
nl | -3.983 |
Causes | -3.928 |
裏� | -3.712 |
[' | -3.702 |
Token | artz |
Token ID | 13636 |
Feature activation | -9.92e-01 |
Pos logit contributions | |
aber | +6.166 |
nl | +5.296 |
owa | +4.844 |
[' | +4.637 |
Causes | +4.632 |
Neg logit contributions | |
ught | -6.709 |
wick | -6.381 |
wives | -6.337 |
CLA | -6.239 |
RG | -6.108 |
Token | , |
Token ID | 11 |
Feature activation | +6.69e-01 |
Pos logit contributions | |
ught | +0.754 |
wick | +0.713 |
wives | +0.674 |
RG | +0.668 |
CLA | +0.660 |
Neg logit contributions | |
aber | -0.694 |
nl | -0.632 |
Causes | -0.588 |
[' | -0.565 |
owa | -0.561 |
Token | D |
Token ID | 360 |
Feature activation | -8.02e-01 |
Pos logit contributions | |
aber | +0.439 |
nl | +0.398 |
Causes | +0.367 |
[' | +0.351 |
owa | +0.350 |
Neg logit contributions | |
ught | -0.538 |
wick | -0.508 |
wives | -0.485 |
RG | -0.480 |
CLA | -0.475 |
Token | y |
Token ID | 88 |
Feature activation | -4.39e+00 |
Pos logit contributions | |
aber | +0.273 |
nl | +0.240 |
Causes | +0.215 |
[' | +0.203 |
owa | +0.201 |
Neg logit contributions | |
ught | -0.512 |
wick | -0.488 |
wives | -0.469 |
RG | -0.465 |
CLA | -0.461 |
Token | , |
Token ID | 11 |
Feature activation | -3.50e+00 |
Pos logit contributions | |
ught | +3.165 |
wick | +2.996 |
wives | +2.840 |
CLA | +2.727 |
RG | +2.725 |
Neg logit contributions | |
aber | -3.200 |
nl | -2.910 |
Causes | -2.729 |
[' | -2.621 |
owa | -2.612 |
Token | he |
Token ID | 339 |
Feature activation | -4.26e+00 |
Pos logit contributions | |
ught | +2.495 |
wick | +2.340 |
wives | +2.221 |
RG | +2.168 |
CLA | +2.167 |
Neg logit contributions | |
aber | -2.603 |
nl | -2.356 |
Causes | -2.209 |
owa | -2.122 |
[' | -2.115 |
Token | should |
Token ID | 815 |
Feature activation | -8.27e-01 |
Pos logit contributions | |
ught | +2.979 |
wick | +2.771 |
wives | +2.612 |
CLA | +2.551 |
RG | +2.546 |
Neg logit contributions | |
aber | -3.224 |
nl | -2.941 |
Causes | -2.723 |
owa | -2.653 |
[' | -2.611 |
Token | proceed |
Token ID | 5120 |
Feature activation | -6.93e+00 |
Pos logit contributions | |
ught | +0.601 |
wick | +0.562 |
wives | +0.531 |
RG | +0.525 |
CLA | +0.519 |
Neg logit contributions | |
aber | -0.610 |
nl | -0.558 |
Causes | -0.521 |
owa | -0.499 |
[' | -0.499 |
Token | most |
Token ID | 749 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
ught | +4.534 |
wick | +4.180 |
wives | +3.879 |
curved | +3.740 |
RG | +3.734 |
Neg logit contributions | |
aber | -5.392 |
nl | -5.011 |
Causes | -4.705 |
owa | -4.577 |
[' | -4.428 |
Token | carefully |
Token ID | 7773 |
Feature activation | -5.66e+00 |
Pos logit contributions | |
ught | +12.395 |
wick | +10.696 |
curved | +10.389 |
nob | +9.343 |
RG | +9.342 |
Neg logit contributions | |
aber | -13.821 |
nl | -13.046 |
Causes | -12.748 |
裏� | -12.090 |
icket | -11.904 |
Token | — |
Token ID | 960 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
ught | +3.836 |
wick | +3.593 |
wives | +3.357 |
RG | +3.238 |
CLA | +3.222 |
Neg logit contributions | |
aber | -4.272 |
nl | -3.998 |
Causes | -3.789 |
owa | -3.646 |
[' | -3.550 |
Token | h |
Token ID | 71 |
Feature activation | -7.19e+00 |
Pos logit contributions | |
ught | +2.891 |
wick | +2.730 |
wives | +2.618 |
RG | +2.574 |
CLA | +2.541 |
Neg logit contributions | |
aber | -2.400 |
nl | -2.168 |
Causes | -2.046 |
owa | -1.946 |
[' | -1.921 |
Token | aste |
Token ID | 4594 |
Feature activation | -6.86e+00 |
Pos logit contributions | |
ught | +5.509 |
wick | +5.074 |
wives | +4.740 |
onest | +4.737 |
riz | +4.689 |
Neg logit contributions | |
aber | -4.812 |
nl | -4.462 |
Causes | -4.316 |
裏� | -4.065 |
[' | -4.006 |
Token | would |
Token ID | 561 |
Feature activation | -6.02e+00 |
Pos logit contributions | |
ught | +4.837 |
wick | +4.566 |
wives | +4.287 |
riz | +4.216 |
RG | +4.184 |
Neg logit contributions | |
aber | -4.894 |
nl | -4.466 |
Causes | -4.207 |
owa | -4.059 |
[' | -4.023 |
Token | done |
Token ID | 1760 |
Feature activation | -6.54e+00 |
Pos logit contributions | |
ught | +3.437 |
wick | +3.219 |
RG | +3.045 |
wives | +3.034 |
elin | +2.989 |
Neg logit contributions | |
aber | -3.595 |
nl | -3.239 |
Causes | -3.074 |
[' | -2.888 |
owa | -2.882 |
Token | well |
Token ID | 880 |
Feature activation | -8.66e+00 |
Pos logit contributions | |
ught | +4.548 |
wick | +4.218 |
RG | +3.969 |
wives | +3.875 |
CLA | +3.873 |
Neg logit contributions | |
aber | -4.880 |
nl | -4.431 |
Causes | -4.183 |
[' | -3.979 |
owa | -3.949 |
Token | against |
Token ID | 1028 |
Feature activation | -6.91e+00 |
Pos logit contributions | |
ught | +5.759 |
wick | +5.516 |
RG | +5.096 |
wives | +5.074 |
CLA | +5.019 |
Neg logit contributions | |
aber | -6.326 |
nl | -5.816 |
Causes | -5.524 |
owa | -5.195 |
[' | -5.135 |
Token | the |
Token ID | 262 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
ught | +4.415 |
wick | +4.091 |
RG | +3.933 |
wives | +3.816 |
CLA | +3.732 |
Neg logit contributions | |
aber | -5.567 |
nl | -5.062 |
Causes | -4.712 |
owa | -4.591 |
[' | -4.579 |
Token | Ravens |
Token ID | 20091 |
Feature activation | -7.23e+00 |
Pos logit contributions | |
aber | +0.259 |
nl | +0.236 |
Causes | +0.219 |
[' | +0.210 |
owa | +0.209 |
Neg logit contributions | |
ught | -0.283 |
wick | -0.266 |
wives | -0.253 |
RG | -0.250 |
CLA | -0.248 |
Token | this |
Token ID | 428 |
Feature activation | -2.08e+01 |
Pos logit contributions | |
ught | +4.848 |
wick | +4.637 |
RG | +4.360 |
wives | +4.288 |
CLA | +4.239 |
Neg logit contributions | |
aber | -5.468 |
nl | -5.005 |
Causes | -4.675 |
owa | -4.490 |
[' | -4.391 |
Token | year |
Token ID | 614 |
Feature activation | -9.58e+00 |
Pos logit contributions | |
ught | +7.742 |
wick | +7.319 |
elin | +6.701 |
wives | +6.662 |
curved | +6.587 |
Neg logit contributions | |
aber | -18.128 |
Causes | -16.576 |
nl | -16.507 |
owa | -15.429 |
裏� | -15.257 |
Token | , |
Token ID | 11 |
Feature activation | -5.52e+00 |
Pos logit contributions | |
ught | +5.924 |
wick | +5.637 |
RG | +5.126 |
wives | +5.126 |
CLA | +5.119 |
Neg logit contributions | |
aber | -7.347 |
nl | -6.755 |
Causes | -6.509 |
owa | -6.166 |
[' | -6.010 |
Token | and |
Token ID | 290 |
Feature activation | -8.27e+00 |
Pos logit contributions | |
ught | +3.647 |
wick | +3.459 |
RG | +3.277 |
wives | +3.197 |
CLA | +3.172 |
Neg logit contributions | |
aber | -4.288 |
nl | -3.876 |
Causes | -3.679 |
[' | -3.502 |
owa | -3.502 |
Token | Baltimore |
Token ID | 10346 |
Feature activation | -2.84e+00 |
Pos logit contributions | |
ught | +5.209 |
wick | +4.896 |
RG | +4.640 |
wives | +4.544 |
CLA | +4.377 |
Neg logit contributions | |
aber | -6.512 |
nl | -5.979 |
Causes | -5.497 |
[' | -5.331 |
owa | -5.287 |
Token | has |
Token ID | 468 |
Feature activation | -3.81e+00 |
Pos logit contributions | |
ught | +2.054 |
wick | +1.932 |
RG | +1.813 |
wives | +1.809 |
CLA | +1.782 |
Neg logit contributions | |
aber | -2.098 |
nl | -1.917 |
Causes | -1.788 |
owa | -1.705 |
[' | -1.702 |
Token | at |
Token ID | 379 |
Feature activation | -6.04e+00 |
Pos logit contributions | |
ught | +1.763 |
wick | +1.675 |
wives | +1.587 |
RG | +1.577 |
CLA | +1.560 |
Neg logit contributions | |
aber | -1.542 |
nl | -1.398 |
Causes | -1.296 |
owa | -1.240 |
[' | -1.237 |
Token | least |
Token ID | 1551 |
Feature activation | -8.89e+00 |
Pos logit contributions | |
ught | +3.672 |
wick | +3.451 |
RG | +3.162 |
CLA | +3.119 |
wives | +3.114 |
Neg logit contributions | |
aber | -4.975 |
nl | -4.702 |
Causes | -4.322 |
owa | -4.199 |
[' | -4.170 |
Token | 20 |
Token ID | 1160 |
Feature activation | -3.92e+00 |
Pos logit contributions | |
ught | +6.397 |
wick | +6.183 |
RG | +5.818 |
wives | +5.715 |
CLA | +5.699 |
Neg logit contributions | |
aber | -5.988 |
nl | -5.565 |
Causes | -5.058 |
owa | -4.882 |
裏� | -4.842 |
Token | Fantasy |
Token ID | 10982 |
Feature activation | -3.70e+00 |
Pos logit contributions | |
ught | +2.313 |
wick | +2.209 |
RG | +2.030 |
wives | +2.010 |
CLA | +1.983 |
Neg logit contributions | |
aber | -3.373 |
nl | -3.134 |
Causes | -2.930 |
[' | -2.842 |
owa | -2.840 |
Token | points |
Token ID | 2173 |
Feature activation | -3.18e+00 |
Pos logit contributions | |
ught | +1.834 |
wick | +1.697 |
wives | +1.573 |
RG | +1.542 |
CLA | +1.499 |
Neg logit contributions | |
aber | -3.515 |
nl | -3.307 |
Causes | -3.127 |
owa | -3.046 |
[' | -3.011 |
Token | this |
Token ID | 428 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
ught | +2.195 |
wick | +2.070 |
wives | +1.926 |
CLA | +1.901 |
RG | +1.900 |
Neg logit contributions | |
aber | -2.437 |
nl | -2.243 |
Causes | -2.110 |
owa | -2.014 |
[' | -1.993 |
Token | season |
Token ID | 1622 |
Feature activation | -4.76e+00 |
Pos logit contributions | |
ught | +7.995 |
wick | +7.622 |
wives | +6.788 |
riz | +6.736 |
curved | +6.690 |
Neg logit contributions | |
aber | -17.366 |
Causes | -15.838 |
nl | -15.687 |
owa | -14.635 |
裏� | -14.483 |
Token | , |
Token ID | 11 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
ught | +3.442 |
wick | +3.282 |
wives | +3.050 |
CLA | +3.024 |
RG | +3.019 |
Neg logit contributions | |
aber | -3.404 |
nl | -3.128 |
Causes | -2.947 |
owa | -2.789 |
[' | -2.763 |
Token | including |
Token ID | 1390 |
Feature activation | -6.08e+00 |
Pos logit contributions | |
aber | +0.076 |
nl | +0.069 |
Causes | +0.064 |
[' | +0.062 |
owa | +0.062 |
Neg logit contributions | |
ught | -0.078 |
wick | -0.074 |
wives | -0.070 |
RG | -0.069 |
CLA | -0.068 |
Token | last |
Token ID | 938 |
Feature activation | -5.30e+00 |
Pos logit contributions | |
ught | +4.246 |
wick | +4.008 |
RG | +3.852 |
wives | +3.775 |
riz | +3.680 |
Neg logit contributions | |
aber | -4.506 |
nl | -4.114 |
Causes | -3.792 |
[' | -3.625 |
owa | -3.617 |
Token | week |
Token ID | 1285 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
ught | +3.512 |
wick | +3.313 |
wives | +3.134 |
RG | +3.078 |
elin | +3.035 |
Neg logit contributions | |
aber | -4.118 |
nl | -3.758 |
Causes | -3.596 |
[' | -3.409 |
owa | -3.364 |
Token | to |
Token ID | 284 |
Feature activation | -2.13e-01 |
Pos logit contributions | |
aber | +4.944 |
nl | +4.549 |
Causes | +4.040 |
[' | +4.016 |
owa | +3.961 |
Neg logit contributions | |
ught | -6.166 |
wick | -5.804 |
wives | -5.614 |
CLA | -5.450 |
riz | -5.430 |
Token | learn |
Token ID | 2193 |
Feature activation | +3.27e+00 |
Pos logit contributions | |
ught | +0.157 |
wick | +0.148 |
wives | +0.140 |
RG | +0.139 |
CLA | +0.137 |
Neg logit contributions | |
aber | -0.154 |
nl | -0.141 |
Causes | -0.131 |
[' | -0.126 |
owa | -0.126 |
Token | as |
Token ID | 355 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
aber | +2.157 |
nl | +1.968 |
Causes | +1.788 |
[' | +1.742 |
owa | +1.711 |
Neg logit contributions | |
ught | -2.621 |
wick | -2.458 |
wives | -2.351 |
CLA | -2.326 |
RG | -2.320 |
Token | much |
Token ID | 881 |
Feature activation | +5.96e+00 |
Pos logit contributions | |
aber | +1.563 |
nl | +1.424 |
Causes | +1.294 |
[' | +1.256 |
owa | +1.249 |
Neg logit contributions | |
ught | -1.907 |
wick | -1.803 |
wives | -1.711 |
RG | -1.709 |
CLA | -1.689 |
Token | as |
Token ID | 355 |
Feature activation | +3.97e-01 |
Pos logit contributions | |
aber | +4.004 |
nl | +3.678 |
Causes | +3.323 |
[' | +3.295 |
owa | +3.218 |
Neg logit contributions | |
ught | -4.554 |
wick | -4.345 |
wives | -4.106 |
CLA | -4.082 |
RG | -4.082 |
Token | we |
Token ID | 356 |
Feature activation | -2.00e+01 |
Pos logit contributions | |
aber | +0.277 |
nl | +0.253 |
Causes | +0.234 |
[' | +0.225 |
owa | +0.224 |
Neg logit contributions | |
ught | -0.303 |
wick | -0.285 |
wives | -0.271 |
RG | -0.269 |
CLA | -0.266 |
Token | can |
Token ID | 460 |
Feature activation | +2.90e+00 |
Pos logit contributions | |
ught | +10.614 |
wick | +8.466 |
wives | +8.365 |
RG | +8.159 |
elin | +8.135 |
Neg logit contributions | |
aber | -15.021 |
nl | -13.970 |
裏� | -13.950 |
Causes | -13.822 |
EE | -12.679 |
Token | ahead |
Token ID | 4058 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
aber | +1.971 |
nl | +1.788 |
Causes | +1.634 |
[' | +1.598 |
owa | +1.569 |
Neg logit contributions | |
ught | -2.267 |
wick | -2.145 |
wives | -2.039 |
RG | -2.022 |
riz | -1.999 |
Token | of |
Token ID | 286 |
Feature activation | -3.74e+00 |
Pos logit contributions | |
ught | +2.120 |
wick | +1.994 |
wives | +1.906 |
RG | +1.868 |
CLA | +1.846 |
Neg logit contributions | |
aber | -2.076 |
nl | -1.894 |
Causes | -1.786 |
[' | -1.694 |
owa | -1.691 |
Token | the |
Token ID | 262 |
Feature activation | -5.12e+00 |
Pos logit contributions | |
ught | +2.534 |
wick | +2.367 |
wives | +2.225 |
RG | +2.212 |
elin | +2.187 |
Neg logit contributions | |
aber | -2.896 |
nl | -2.633 |
Causes | -2.485 |
owa | -2.393 |
[' | -2.374 |
Token | UEFA |
Token ID | 40858 |
Feature activation | -4.15e+00 |
Pos logit contributions | |
ught | +3.473 |
wick | +3.204 |
elin | +3.005 |
wives | +2.999 |
RG | +2.968 |
Neg logit contributions | |
aber | -3.970 |
nl | -3.583 |
Causes | -3.404 |
[' | -3.268 |
owa | -3.234 |
Token | Ik |
Token ID | 32840 |
Feature activation | -4.16e+00 |
Pos logit contributions | |
ught | +1.386 |
wick | +1.306 |
wives | +1.232 |
RG | +1.223 |
CLA | +1.206 |
Neg logit contributions | |
aber | -1.514 |
nl | -1.375 |
Causes | -1.272 |
owa | -1.249 |
[' | -1.236 |
Token | ki |
Token ID | 4106 |
Feature activation | -9.50e+00 |
Pos logit contributions | |
ught | +2.875 |
wick | +2.739 |
wives | +2.522 |
riz | +2.518 |
elin | +2.499 |
Neg logit contributions | |
aber | -3.112 |
nl | -2.871 |
Causes | -2.787 |
裏� | -2.605 |
[' | -2.572 |
Token | , |
Token ID | 11 |
Feature activation | -8.48e+00 |
Pos logit contributions | |
ught | +6.430 |
wick | +5.991 |
wives | +5.535 |
curved | +5.522 |
CLA | +5.379 |
Neg logit contributions | |
aber | -6.985 |
nl | -6.544 |
Causes | -6.136 |
裏� | -5.751 |
tool | -5.637 |
Token | who |
Token ID | 508 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
ught | +5.494 |
wick | +5.098 |
wives | +4.796 |
RG | +4.729 |
riz | +4.714 |
Neg logit contributions | |
aber | -6.465 |
nl | -5.923 |
Causes | -5.503 |
[' | -5.280 |
owa | -5.275 |
Token | caught |
Token ID | 4978 |
Feature activation | -9.84e+00 |
Pos logit contributions | |
ught | +0.935 |
wick | +0.876 |
wives | +0.834 |
RG | +0.820 |
CLA | +0.815 |
Neg logit contributions | |
aber | -0.873 |
nl | -0.798 |
Causes | -0.743 |
[' | -0.705 |
owa | -0.702 |
Token | her |
Token ID | 607 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
ught | +6.189 |
wick | +5.802 |
wives | +5.253 |
riz | +5.213 |
RG | +5.161 |
Neg logit contributions | |
aber | -7.642 |
nl | -7.002 |
Causes | -6.524 |
owa | -6.218 |
tool | -6.144 |
Token | on |
Token ID | 319 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
ught | +11.262 |
wick | +10.074 |
curved | +9.997 |
gaze | +9.832 |
wives | +9.304 |
Neg logit contributions | |
aber | -14.184 |
nl | -12.805 |
Causes | -12.176 |
裏� | -11.914 |
OTAL | -11.490 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+00 |
Pos logit contributions | |
ught | +6.217 |
wick | +5.910 |
wives | +5.437 |
RG | +5.293 |
curved | +5.277 |
Neg logit contributions | |
aber | -8.297 |
nl | -7.597 |
Causes | -7.240 |
[' | -6.903 |
owa | -6.836 |
Token | chest |
Token ID | 7721 |
Feature activation | -6.78e+00 |
Pos logit contributions | |
ught | +2.917 |
wick | +2.701 |
wives | +2.547 |
RG | +2.500 |
riz | +2.495 |
Neg logit contributions | |
aber | -3.384 |
nl | -3.134 |
Causes | -2.938 |
[' | -2.786 |
owa | -2.763 |
Token | before |
Token ID | 878 |
Feature activation | -9.94e-02 |
Pos logit contributions | |
ught | +4.635 |
wick | +4.380 |
wives | +4.087 |
CLA | +3.958 |
riz | +3.947 |
Neg logit contributions | |
aber | -5.067 |
nl | -4.693 |
Causes | -4.458 |
owa | -4.169 |
[' | -4.147 |
Token | she |
Token ID | 673 |
Feature activation | -9.07e+00 |
Pos logit contributions | |
ught | +0.073 |
wick | +0.068 |
wives | +0.065 |
RG | +0.064 |
CLA | +0.063 |
Neg logit contributions | |
aber | -0.073 |
nl | -0.066 |
Causes | -0.062 |
[' | -0.059 |
owa | -0.059 |
Token | Scholar |
Token ID | 11713 |
Feature activation | +3.60e+00 |
Pos logit contributions | |
aber | +2.160 |
nl | +2.021 |
Causes | +1.912 |
[' | +1.859 |
owa | +1.830 |
Neg logit contributions | |
ught | -1.360 |
wick | -1.228 |
wives | -1.162 |
RG | -1.116 |
elin | -1.115 |
Token | Crossref |
Token ID | 23613 |
Feature activation | -3.88e+00 |
Pos logit contributions | |
aber | +2.070 |
nl | +1.876 |
Causes | +1.725 |
[' | +1.608 |
owa | +1.602 |
Neg logit contributions | |
ught | -3.180 |
wick | -2.966 |
wives | -2.898 |
RG | -2.808 |
CLA | -2.806 |
Token | | |
Token ID | 930 |
Feature activation | +5.41e-01 |
Pos logit contributions | |
ught | +2.626 |
wick | +2.471 |
RG | +2.323 |
wives | +2.309 |
CLA | +2.291 |
Neg logit contributions | |
aber | -2.989 |
nl | -2.725 |
Causes | -2.539 |
owa | -2.467 |
[' | -2.439 |
Token | ISI |
Token ID | 22048 |
Feature activation | -9.16e+00 |
Pos logit contributions | |
aber | +0.408 |
nl | +0.374 |
Causes | +0.348 |
[' | +0.336 |
owa | +0.335 |
Neg logit contributions | |
ught | -0.383 |
wick | -0.359 |
wives | -0.340 |
RG | -0.337 |
CLA | -0.333 |
Token |
|
Token ID | 198 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
ught | +4.744 |
wick | +4.719 |
RG | +4.475 |
CLA | +4.306 |
wives | +4.195 |
Neg logit contributions | |
aber | -7.904 |
nl | -7.047 |
owa | -6.754 |
Causes | -6.676 |
裏� | -6.674 |
Token |
|
Token ID | 198 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
ught | +4.953 |
wick | +4.805 |
RG | +4.472 |
wives | +4.296 |
CLA | +4.228 |
Neg logit contributions | |
aber | -9.168 |
nl | -8.153 |
Causes | -8.003 |
裏� | -8.000 |
vertisement | -7.988 |
Token | Sal |
Token ID | 19221 |
Feature activation | -4.01e-01 |
Pos logit contributions | |
RG | +12.772 |
ught | +11.963 |
wick | +11.755 |
riz | +11.398 |
CLA | +11.186 |
Neg logit contributions | |
aber | -12.229 |
Causes | -11.266 |
nl | -11.096 |
JPM | -10.629 |
owa | -10.337 |
Token | m |
Token ID | 76 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
ught | +0.295 |
wick | +0.278 |
wives | +0.263 |
RG | +0.260 |
CLA | +0.257 |
Neg logit contributions | |
aber | -0.290 |
nl | -0.266 |
Causes | -0.248 |
[' | -0.238 |
owa | -0.237 |
Token | iv |
Token ID | 452 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
ught | +0.920 |
wick | +0.872 |
wives | +0.818 |
RG | +0.812 |
CLA | +0.802 |
Neg logit contributions | |
aber | -0.923 |
nl | -0.846 |
Causes | -0.790 |
[' | -0.761 |
owa | -0.751 |
Token | alli |
Token ID | 36546 |
Feature activation | +3.58e+00 |
Pos logit contributions | |
aber | +7.506 |
nl | +6.705 |
owa | +6.077 |
Causes | +6.062 |
[' | +5.901 |
Neg logit contributions | |
ught | -7.196 |
wives | -6.377 |
wick | -6.324 |
RG | -6.244 |
CLA | -6.048 |
Token | , |
Token ID | 11 |
Feature activation | +6.27e-01 |
Pos logit contributions | |
aber | +2.345 |
nl | +2.121 |
Causes | +1.963 |
owa | +1.884 |
[' | +1.866 |
Neg logit contributions | |
ught | -2.874 |
wick | -2.684 |
wives | -2.580 |
RG | -2.554 |
CLA | -2.530 |
Token | fried |
Token ID | 23018 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
ught | +3.516 |
wick | +3.213 |
curved | +2.996 |
wives | +2.994 |
riz | +2.959 |
Neg logit contributions | |
aber | -5.205 |
nl | -4.832 |
Causes | -4.663 |
owa | -4.416 |
裏� | -4.301 |
Token | and |
Token ID | 290 |
Feature activation | +4.28e+00 |
Pos logit contributions | |
ught | +1.336 |
wick | +1.263 |
wives | +1.192 |
RG | +1.178 |
riz | +1.159 |
Neg logit contributions | |
aber | -1.493 |
nl | -1.357 |
Causes | -1.284 |
owa | -1.237 |
[' | -1.211 |
Token | not |
Token ID | 407 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
aber | +2.535 |
nl | +2.312 |
[' | +2.062 |
Causes | +2.047 |
owa | +1.954 |
Neg logit contributions | |
ught | -3.650 |
wick | -3.487 |
wives | -3.340 |
RG | -3.288 |
CLA | -3.264 |
Token | deep |
Token ID | 2769 |
Feature activation | -8.06e+00 |
Pos logit contributions | |
ught | +2.721 |
wick | +2.474 |
wives | +2.338 |
RG | +2.316 |
riz | +2.271 |
Neg logit contributions | |
aber | -3.625 |
nl | -3.325 |
Causes | -3.226 |
owa | -3.012 |
裏� | -2.984 |
Token | fried |
Token ID | 23018 |
Feature activation | -3.85e+00 |
Pos logit contributions | |
ught | +4.557 |
wick | +4.105 |
wives | +3.848 |
curved | +3.822 |
riz | +3.749 |
Neg logit contributions | |
aber | -7.097 |
nl | -6.423 |
Causes | -6.246 |
owa | -5.932 |
裏� | -5.869 |
Token | . |
Token ID | 13 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
ught | +2.809 |
wick | +2.665 |
wives | +2.523 |
RG | +2.498 |
CLA | +2.459 |
Neg logit contributions | |
aber | -2.795 |
nl | -2.491 |
Causes | -2.377 |
owa | -2.299 |
裏� | -2.201 |
Token | 6 |
Token ID | 718 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
wick | +10.337 |
ught | +9.814 |
wives | +9.232 |
Closed | +8.813 |
RG | +8.805 |
Neg logit contributions | |
aber | -14.452 |
nl | -12.738 |
owa | -12.389 |
[' | -11.960 |
icket | -11.713 |
Token | . |
Token ID | 13 |
Feature activation | -3.56e-01 |
Pos logit contributions | |
ught | +0.836 |
wick | +0.794 |
wives | +0.754 |
RG | +0.748 |
CLA | +0.738 |
Neg logit contributions | |
aber | -0.728 |
nl | -0.654 |
Causes | -0.611 |
owa | -0.585 |
[' | -0.578 |
Token | Drain |
Token ID | 36024 |
Feature activation | +5.25e+00 |
Pos logit contributions | |
ught | +0.213 |
wick | +0.197 |
wives | +0.184 |
RG | +0.182 |
CLA | +0.180 |
Neg logit contributions | |
aber | -0.308 |
nl | -0.285 |
Causes | -0.267 |
owa | -0.260 |
[' | -0.260 |
Token | on |
Token ID | 319 |
Feature activation | -6.16e-01 |
Pos logit contributions | |
aber | +3.555 |
nl | +3.343 |
[' | +3.023 |
Causes | +3.006 |
owa | +2.825 |
Neg logit contributions | |
ught | -4.038 |
wick | -3.756 |
RG | -3.566 |
CLA | -3.537 |
wives | -3.518 |
Token | a |
Token ID | 257 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
ught | +0.432 |
wick | +0.405 |
wives | +0.383 |
RG | +0.378 |
CLA | +0.374 |
Neg logit contributions | |
aber | -0.468 |
nl | -0.429 |
Causes | -0.401 |
[' | -0.386 |
owa | -0.385 |
Token | but |
Token ID | 475 |
Feature activation | +9.93e+00 |
Pos logit contributions | |
aber | +2.324 |
nl | +2.122 |
Causes | +1.961 |
[' | +1.896 |
owa | +1.879 |
Neg logit contributions | |
ught | -2.545 |
wick | -2.371 |
wives | -2.266 |
RG | -2.228 |
elin | -2.206 |
Token | much |
Token ID | 881 |
Feature activation | +8.90e-01 |
Pos logit contributions | |
aber | +6.570 |
nl | +6.044 |
Causes | +5.613 |
[' | +5.597 |
owa | +5.360 |
Neg logit contributions | |
ught | -7.283 |
wick | -6.860 |
wives | -6.517 |
RG | -6.485 |
CLA | -6.388 |
Token | of |
Token ID | 286 |
Feature activation | +5.99e+00 |
Pos logit contributions | |
aber | +0.607 |
nl | +0.554 |
Causes | +0.509 |
[' | +0.492 |
owa | +0.489 |
Neg logit contributions | |
ught | -0.694 |
wick | -0.654 |
wives | -0.623 |
RG | -0.617 |
CLA | -0.611 |
Token | that |
Token ID | 326 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
aber | +3.981 |
nl | +3.714 |
Causes | +3.373 |
[' | +3.296 |
owa | +3.192 |
Neg logit contributions | |
ught | -4.595 |
wick | -4.336 |
wives | -4.203 |
RG | -4.119 |
CLA | -4.099 |
Token | has |
Token ID | 468 |
Feature activation | -9.75e+00 |
Pos logit contributions | |
aber | +1.139 |
nl | +1.053 |
Causes | +0.980 |
[' | +0.956 |
owa | +0.944 |
Neg logit contributions | |
ught | -0.990 |
wick | -0.923 |
wives | -0.876 |
RG | -0.863 |
CLA | -0.852 |
Token | to |
Token ID | 284 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
ught | +5.626 |
wick | +5.441 |
riz | +5.130 |
wives | +5.101 |
curved | +4.943 |
Neg logit contributions | |
aber | -7.970 |
nl | -7.163 |
Causes | -6.936 |
owa | -6.668 |
[' | -6.468 |
Token | do |
Token ID | 466 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
ught | +6.346 |
wick | +6.336 |
riz | +5.443 |
wives | +5.322 |
curved | +4.959 |
Neg logit contributions | |
aber | -17.543 |
nl | -16.775 |
Causes | -16.443 |
owa | -16.024 |
裏� | -15.568 |
Token | with |
Token ID | 351 |
Feature activation | +2.31e+00 |
Pos logit contributions | |
ught | +5.625 |
wick | +5.252 |
wives | +5.009 |
RG | +4.958 |
riz | +4.899 |
Neg logit contributions | |
aber | -8.397 |
nl | -7.752 |
Causes | -7.482 |
owa | -7.286 |
裏� | -6.972 |
Token | where |
Token ID | 810 |
Feature activation | +5.22e+00 |
Pos logit contributions | |
aber | +1.723 |
nl | +1.596 |
Causes | +1.485 |
[' | +1.438 |
owa | +1.414 |
Neg logit contributions | |
ught | -1.650 |
wick | -1.542 |
wives | -1.462 |
RG | -1.445 |
CLA | -1.437 |
Token | they |
Token ID | 484 |
Feature activation | -4.08e-02 |
Pos logit contributions | |
aber | +3.363 |
nl | +3.118 |
Causes | +2.841 |
[' | +2.810 |
owa | +2.708 |
Neg logit contributions | |
ught | -4.118 |
wick | -3.884 |
wives | -3.689 |
CLA | -3.661 |
RG | -3.660 |
Token | were |
Token ID | 547 |
Feature activation | +2.80e+00 |
Pos logit contributions | |
ught | +0.032 |
wick | +0.030 |
wives | +0.028 |
RG | +0.028 |
CLA | +0.028 |
Neg logit contributions | |
aber | -0.028 |
nl | -0.025 |
Causes | -0.024 |
[' | -0.023 |
owa | -0.023 |
Token | love |
Token ID | 1842 |
Feature activation | +3.45e+00 |
Pos logit contributions | |
ught | +2.021 |
wick | +1.879 |
wives | +1.751 |
RG | +1.717 |
CLA | +1.716 |
Neg logit contributions | |
aber | -2.311 |
nl | -2.106 |
Causes | -2.004 |
owa | -1.900 |
[' | -1.893 |
Token | it |
Token ID | 340 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
aber | +2.398 |
nl | +2.188 |
Causes | +2.037 |
[' | +1.966 |
owa | +1.941 |
Neg logit contributions | |
ught | -2.606 |
wick | -2.447 |
RG | -2.334 |
wives | -2.334 |
CLA | -2.316 |
Token | as |
Token ID | 355 |
Feature activation | +2.60e-02 |
Pos logit contributions | |
ught | +1.916 |
wick | +1.804 |
wives | +1.711 |
RG | +1.688 |
CLA | +1.675 |
Neg logit contributions | |
aber | -1.860 |
nl | -1.698 |
Causes | -1.593 |
owa | -1.520 |
[' | -1.510 |
Token | much |
Token ID | 881 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
aber | +0.017 |
nl | +0.015 |
Causes | +0.014 |
[' | +0.013 |
owa | +0.013 |
Neg logit contributions | |
ught | -0.021 |
wick | -0.020 |
wives | -0.019 |
RG | -0.019 |
CLA | -0.019 |
Token | as |
Token ID | 355 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
aber | +1.638 |
nl | +1.504 |
Causes | +1.390 |
[' | +1.345 |
owa | +1.342 |
Neg logit contributions | |
ught | -1.604 |
wick | -1.501 |
wives | -1.421 |
RG | -1.414 |
CLA | -1.398 |
Token | I |
Token ID | 314 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
ught | +1.210 |
wick | +1.131 |
wives | +1.077 |
RG | +1.062 |
CLA | +1.044 |
Neg logit contributions | |
aber | -1.194 |
nl | -1.088 |
Causes | -1.015 |
[' | -0.974 |
owa | -0.971 |
Token | did |
Token ID | 750 |
Feature activation | -5.62e+00 |
Pos logit contributions | |
ught | +9.329 |
wick | +8.407 |
riz | +8.256 |
wives | +7.513 |
CLA | +7.485 |
Neg logit contributions | |
aber | -15.649 |
Causes | -14.189 |
nl | -13.906 |
裏� | -13.708 |
tool | -13.346 |
Token | – |
Token ID | 784 |
Feature activation | -6.24e-01 |
Pos logit contributions | |
ught | +3.994 |
wick | +3.757 |
wives | +3.550 |
RG | +3.499 |
CLA | +3.453 |
Neg logit contributions | |
aber | -4.112 |
nl | -3.708 |
Causes | -3.525 |
owa | -3.361 |
[' | -3.286 |
Token | we |
Token ID | 356 |
Feature activation | +2.58e+00 |
Pos logit contributions | |
ught | +0.461 |
wick | +0.433 |
wives | +0.412 |
RG | +0.408 |
CLA | +0.402 |
Neg logit contributions | |
aber | -0.450 |
nl | -0.410 |
Causes | -0.382 |
[' | -0.367 |
owa | -0.367 |
Token | managed |
Token ID | 5257 |
Feature activation | -2.48e+00 |
Pos logit contributions | |
aber | +1.751 |
nl | +1.590 |
Causes | +1.459 |
[' | +1.427 |
owa | +1.406 |
Neg logit contributions | |
ught | -2.013 |
wick | -1.895 |
wives | -1.808 |
RG | -1.793 |
CLA | -1.772 |
Token | to |
Token ID | 284 |
Feature activation | -5.71e+00 |
Pos logit contributions | |
ught | +1.754 |
wick | +1.654 |
wives | +1.567 |
RG | +1.538 |
riz | +1.527 |
Neg logit contributions | |
aber | -1.863 |
nl | -1.702 |
Causes | -1.594 |
owa | -1.533 |
[' | -1.524 |
Token | Sony |
Token ID | 10184 |
Feature activation | -7.76e+00 |
Pos logit contributions | |
ught | +1.735 |
wick | +1.643 |
wives | +1.564 |
RG | +1.546 |
CLA | +1.535 |
Neg logit contributions | |
aber | -1.376 |
nl | -1.237 |
Causes | -1.138 |
owa | -1.088 |
[' | -1.085 |
Token | 's |
Token ID | 338 |
Feature activation | -6.03e+00 |
Pos logit contributions | |
ught | +5.650 |
wick | +5.293 |
Certified | +5.055 |
RG | +5.004 |
CLA | +4.942 |
Neg logit contributions | |
aber | -5.345 |
nl | -4.767 |
Causes | -4.418 |
裏� | -4.256 |
owa | -4.216 |
Token | next |
Token ID | 1306 |
Feature activation | -5.40e+00 |
Pos logit contributions | |
ught | +4.523 |
wick | +4.194 |
wives | +3.996 |
RG | +3.948 |
elin | +3.946 |
Neg logit contributions | |
aber | -4.126 |
nl | -3.739 |
Causes | -3.486 |
[' | -3.354 |
owa | -3.320 |
Token | - |
Token ID | 12 |
Feature activation | -5.05e+00 |
Pos logit contributions | |
ught | +3.555 |
wick | +3.352 |
wives | +3.193 |
RG | +3.102 |
elin | +3.087 |
Neg logit contributions | |
aber | -4.180 |
nl | -3.854 |
Causes | -3.644 |
[' | -3.505 |
owa | -3.446 |
Token | generation |
Token ID | 20158 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
ught | +2.786 |
wick | +2.602 |
wives | +2.467 |
RG | +2.351 |
riz | +2.342 |
Neg logit contributions | |
aber | -4.498 |
nl | -4.137 |
Causes | -4.035 |
owa | -3.850 |
[' | -3.821 |
Token | PlayStation |
Token ID | 14047 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
ught | +7.300 |
wick | +6.612 |
wives | +6.410 |
curved | +6.385 |
Certified | +6.311 |
Neg logit contributions | |
aber | -7.572 |
nl | -6.919 |
Causes | -6.377 |
[' | -6.165 |
Customer | -6.105 |
Token | is |
Token ID | 318 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
ught | +8.631 |
Certified | +8.201 |
curved | +8.148 |
wick | +7.903 |
equivalent | +7.770 |
Neg logit contributions | |
aber | -14.930 |
nl | -13.607 |
裏� | -13.134 |
Causes | -13.081 |
owa | -12.962 |
Token | dated |
Token ID | 14567 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
aber | +0.884 |
nl | +0.807 |
Causes | +0.747 |
[' | +0.722 |
owa | +0.719 |
Neg logit contributions | |
ught | -0.914 |
wick | -0.857 |
wives | -0.815 |
RG | -0.807 |
CLA | -0.799 |
Token | for |
Token ID | 329 |
Feature activation | +3.10e+00 |
Pos logit contributions | |
aber | +0.763 |
nl | +0.701 |
Causes | +0.655 |
[' | +0.632 |
owa | +0.628 |
Neg logit contributions | |
ught | -0.709 |
wick | -0.663 |
wives | -0.628 |
RG | -0.622 |
CLA | -0.614 |
Token | fall |
Token ID | 2121 |
Feature activation | +6.03e+00 |
Pos logit contributions | |
aber | +2.196 |
nl | +2.015 |
Causes | +1.885 |
[' | +1.811 |
owa | +1.793 |
Neg logit contributions | |
ught | -2.306 |
wick | -2.171 |
wives | -2.064 |
RG | -2.042 |
CLA | -2.019 |
Token | 2014 |
Token ID | 1946 |
Feature activation | +6.48e-01 |
Pos logit contributions | |
aber | +2.885 |
nl | +2.504 |
Causes | +2.308 |
[' | +2.230 |
owa | +2.146 |
Neg logit contributions | |
ught | -5.763 |
wick | -5.484 |
wives | -5.297 |
RG | -5.286 |
CLA | -5.221 |
Token | the |
Token ID | 262 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
ught | +2.521 |
wick | +2.362 |
wives | +2.205 |
RG | +2.184 |
riz | +2.153 |
Neg logit contributions | |
aber | -2.899 |
nl | -2.673 |
Causes | -2.516 |
owa | -2.429 |
[' | -2.402 |
Token | console |
Token ID | 8624 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
ught | +0.784 |
wick | +0.734 |
wives | +0.695 |
RG | +0.688 |
riz | +0.679 |
Neg logit contributions | |
aber | -0.765 |
nl | -0.700 |
Causes | -0.651 |
[' | -0.625 |
owa | -0.625 |
Token | as |
Token ID | 355 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
ught | +2.543 |
wick | +2.392 |
wives | +2.244 |
RG | +2.228 |
CLA | +2.208 |
Neg logit contributions | |
aber | -2.356 |
nl | -2.131 |
Causes | -2.009 |
owa | -1.916 |
[' | -1.895 |
Token | it |
Token ID | 340 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
ught | +2.890 |
wick | +2.710 |
wives | +2.557 |
RG | +2.522 |
elin | +2.470 |
Neg logit contributions | |
aber | -3.115 |
nl | -2.842 |
Causes | -2.656 |
owa | -2.566 |
[' | -2.559 |
Token | should |
Token ID | 815 |
Feature activation | -6.18e+00 |
Pos logit contributions | |
ught | +8.395 |
wick | +7.631 |
curved | +7.521 |
acci | +6.776 |
curves | +6.721 |
Neg logit contributions | |
aber | -10.465 |
nl | -9.477 |
裏� | -9.068 |
Causes | -8.977 |
owa | -8.674 |
Token | have |
Token ID | 423 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
ught | +4.041 |
wick | +3.724 |
wives | +3.392 |
CLA | +3.382 |
RG | +3.367 |
Neg logit contributions | |
aber | -4.865 |
nl | -4.483 |
Causes | -4.304 |
owa | -4.095 |
[' | -4.094 |
Token | been |
Token ID | 587 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
ught | +10.093 |
wick | +9.268 |
curved | +8.865 |
wives | +8.044 |
CLA | +7.723 |
Neg logit contributions | |
aber | -14.348 |
Causes | -13.343 |
nl | -13.207 |
owa | -12.681 |
裏� | -12.573 |
Token | . |
Token ID | 13 |
Feature activation | -2.46e+00 |
Pos logit contributions | |
ught | +6.942 |
wick | +6.530 |
wives | +6.057 |
curved | +6.053 |
CLA | +5.855 |
Neg logit contributions | |
aber | -7.660 |
nl | -7.091 |
Causes | -6.776 |
owa | -6.611 |
[' | -6.443 |
Token | " |
Token ID | 366 |
Feature activation | -4.82e+00 |
Pos logit contributions | |
ught | +1.791 |
wick | +1.696 |
RG | +1.604 |
wives | +1.603 |
CLA | +1.577 |
Neg logit contributions | |
aber | -1.781 |
nl | -1.606 |
Causes | -1.477 |
owa | -1.465 |
[' | -1.442 |
Token | Sh |
Token ID | 2484 |
Feature activation | -7.38e+00 |
Pos logit contributions | |
ught | +3.437 |
wick | +3.235 |
RG | +3.159 |
CLA | +3.060 |
wives | +3.056 |
Neg logit contributions | |
aber | -3.530 |
nl | -3.165 |
Causes | -3.030 |
owa | -2.919 |
[' | -2.813 |
Token | it |
Token ID | 270 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
ught | +5.896 |
wick | +5.607 |
elin | +5.178 |
RG | +5.174 |
riz | +5.137 |
Neg logit contributions | |
aber | -4.536 |
nl | -4.229 |
Causes | -4.032 |
裏� | -3.832 |
[' | -3.730 |
Token | Fle |
Token ID | 12005 |
Feature activation | +8.56e+00 |
Pos logit contributions | |
aber | +2.214 |
nl | +2.026 |
Causes | +1.885 |
[' | +1.833 |
owa | +1.811 |
Neg logit contributions | |
ught | -2.151 |
wick | -2.011 |
wives | -1.933 |
RG | -1.891 |
riz | -1.868 |
Token | ury |
Token ID | 1601 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
aber | +4.980 |
nl | +4.452 |
[' | +3.889 |
owa | +3.860 |
gy | +3.831 |
Neg logit contributions | |
ught | -7.108 |
wick | -6.732 |
tradem | -6.625 |
CLA | -6.572 |
wives | -6.559 |
Token | agreed |
Token ID | 4987 |
Feature activation | +5.80e+00 |
Pos logit contributions | |
ught | +0.270 |
wick | +0.255 |
wives | +0.242 |
RG | +0.239 |
CLA | +0.237 |
Neg logit contributions | |
aber | -0.252 |
nl | -0.230 |
Causes | -0.214 |
[' | -0.205 |
owa | -0.204 |
Token | . |
Token ID | 13 |
Feature activation | +6.24e+00 |
Pos logit contributions | |
aber | +3.798 |
nl | +3.420 |
Causes | +3.104 |
[' | +3.087 |
owa | +3.034 |
Neg logit contributions | |
ught | -4.577 |
wick | -4.274 |
wives | -4.105 |
RG | -4.045 |
riz | -4.026 |
Token | — |
Token ID | 851 |
Feature activation | +4.31e+00 |
Pos logit contributions | |
aber | +4.122 |
nl | +3.855 |
Causes | +3.620 |
[' | +3.393 |
owa | +3.267 |
Neg logit contributions | |
ught | -4.824 |
wick | -4.480 |
wives | -4.297 |
riz | -4.197 |
elin | -4.171 |
Token | Ren |
Token ID | 7152 |
Feature activation | -1.95e+01 |
Pos logit contributions | |
aber | +3.205 |
nl | +2.943 |
Causes | +2.759 |
[' | +2.655 |
owa | +2.626 |
Neg logit contributions | |
ught | -3.034 |
wick | -2.815 |
wives | -2.708 |
RG | -2.621 |
CLA | -2.616 |
Token | aud |
Token ID | 3885 |
Feature activation | -5.45e+00 |
Pos logit contributions | |
wick | +7.953 |
ught | +7.952 |
riz | +7.088 |
RG | +6.928 |
CLA | +6.723 |
Neg logit contributions | |
Causes | -15.897 |
裏� | -15.373 |
aber | -14.847 |
nl | -14.412 |
JPM | -13.928 |
Token | Lav |
Token ID | 21438 |
Feature activation | -8.25e-01 |
Pos logit contributions | |
ught | +2.864 |
wick | +2.705 |
CLA | +2.461 |
RG | +2.457 |
wives | +2.406 |
Neg logit contributions | |
aber | -5.002 |
nl | -4.581 |
Causes | -4.319 |
owa | -4.272 |
[' | -4.143 |
Token | o |
Token ID | 78 |
Feature activation | +6.26e+00 |
Pos logit contributions | |
ught | +0.685 |
wick | +0.650 |
wives | +0.619 |
RG | +0.613 |
CLA | +0.606 |
Neg logit contributions | |
aber | -0.520 |
nl | -0.468 |
Causes | -0.434 |
[' | -0.411 |
owa | -0.410 |
Token | ie |
Token ID | 494 |
Feature activation | -4.43e-01 |
Pos logit contributions | |
aber | +2.183 |
nl | +1.920 |
[' | +1.559 |
Causes | +1.426 |
EE | +1.377 |
Neg logit contributions | |
ught | -6.744 |
wick | -6.423 |
tradem | -6.308 |
wives | -6.268 |
RG | -6.263 |
Token | (@ |
Token ID | 4275 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
ught | +0.288 |
wick | +0.268 |
wives | +0.253 |
RG | +0.250 |
CLA | +0.247 |
Neg logit contributions | |
aber | -0.360 |
nl | -0.332 |
Causes | -0.312 |
owa | -0.301 |
[' | -0.301 |
Token | Ruk |
Token ID | 49037 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
ught | +5.027 |
wick | +4.723 |
wives | +4.505 |
RG | +4.481 |
riz | +4.430 |
Neg logit contributions | |
aber | -5.281 |
nl | -4.765 |
owa | -4.299 |
[' | -4.275 |
Causes | -4.249 |
Token | mini |
Token ID | 45313 |
Feature activation | +3.93e-01 |
Pos logit contributions | |
ught | +2.725 |
wick | +2.678 |
riz | +2.134 |
wives | +2.069 |
elin | +2.057 |
Neg logit contributions | |
aber | -14.184 |
裏� | -13.223 |
nl | -13.212 |
Causes | -12.990 |
EE | -12.795 |
Token | Temple |
Token ID | 10857 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
aber | +0.255 |
nl | +0.231 |
Causes | +0.213 |
[' | +0.203 |
owa | +0.203 |
Neg logit contributions | |
ught | -0.319 |
wick | -0.302 |
wives | -0.288 |
RG | -0.285 |
CLA | -0.283 |
Token | Here |
Token ID | 3423 |
Feature activation | -6.67e+00 |
Pos logit contributions | |
ught | +2.405 |
wick | +2.246 |
wives | +2.159 |
RG | +2.118 |
CLA | +2.090 |
Neg logit contributions | |
aber | -2.296 |
nl | -2.095 |
Causes | -1.906 |
[' | -1.867 |
owa | -1.861 |
Token |
|
Token ID | 198 |
Feature activation | -7.14e-01 |
Pos logit contributions | |
ught | +4.183 |
wick | +3.907 |
wives | +3.718 |
RG | +3.686 |
CLA | +3.547 |
Neg logit contributions | |
aber | -5.282 |
nl | -4.884 |
Causes | -4.504 |
owa | -4.475 |
[' | -4.449 |
Token |
|
Token ID | 198 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
ught | +0.498 |
wick | +0.467 |
wives | +0.442 |
RG | +0.437 |
CLA | +0.432 |
Neg logit contributions | |
aber | -0.546 |
nl | -0.499 |
Causes | -0.468 |
owa | -0.451 |
[' | -0.449 |
Token | 6 |
Token ID | 21 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
ught | +10.226 |
RG | +10.076 |
wick | +9.702 |
CLA | +9.381 |
wives | +9.141 |
Neg logit contributions | |
aber | -13.805 |
Causes | -12.168 |
nl | -11.987 |
owa | -11.733 |
receiving | -11.132 |
Token | . |
Token ID | 13 |
Feature activation | -4.72e+00 |
Pos logit contributions | |
ught | +0.150 |
wick | +0.142 |
wives | +0.135 |
RG | +0.134 |
CLA | +0.133 |
Neg logit contributions | |
aber | -0.125 |
nl | -0.113 |
Causes | -0.105 |
owa | -0.100 |
[' | -0.100 |
Token | B |
Token ID | 347 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
ught | +3.423 |
wick | +3.228 |
RG | +3.065 |
wives | +3.055 |
riz | +3.016 |
Neg logit contributions | |
aber | -3.405 |
nl | -3.086 |
Causes | -2.811 |
[' | -2.773 |
owa | -2.766 |
Token | ala |
Token ID | 6081 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
ught | +0.822 |
wick | +0.770 |
wives | +0.729 |
RG | +0.723 |
CLA | +0.715 |
Neg logit contributions | |
aber | -0.809 |
nl | -0.741 |
Causes | -0.691 |
[' | -0.665 |
owa | -0.659 |
Token | Han |
Token ID | 9530 |
Feature activation | -6.77e+00 |
Pos logit contributions | |
aber | +1.405 |
nl | +1.275 |
Causes | +1.188 |
owa | +1.139 |
[' | +1.134 |
Neg logit contributions | |
ught | -1.521 |
wick | -1.437 |
wives | -1.368 |
RG | -1.349 |
CLA | -1.347 |
Token | 2 |
Token ID | 362 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
ught | +8.753 |
Closed | +7.873 |
riz | +7.791 |
wick | +7.566 |
Certified | +7.475 |
Neg logit contributions | |
aber | -13.999 |
nl | -13.125 |
icket | -12.479 |
xe | -12.134 |
owa | -12.114 |
Token | of |
Token ID | 286 |
Feature activation | -8.69e+00 |
Pos logit contributions | |
ught | +7.887 |
wives | +7.327 |
wick | +7.315 |
RG | +7.124 |
bern | +7.037 |
Neg logit contributions | |
aber | -10.807 |
nl | -10.365 |
Causes | -9.541 |
icket | -9.441 |
owa | -9.196 |
Token | 15 |
Token ID | 1315 |
Feature activation | -8.03e+00 |
Pos logit contributions | |
ught | +5.207 |
wick | +4.933 |
wives | +4.701 |
CLA | +4.521 |
RG | +4.497 |
Neg logit contributions | |
aber | -7.110 |
nl | -6.631 |
owa | -6.105 |
Causes | -5.928 |
tool | -5.860 |
Token | Photo |
Token ID | 5555 |
Feature activation | -7.48e+00 |
Pos logit contributions | |
ught | +3.982 |
wick | +3.589 |
wives | +3.388 |
RG | +3.367 |
riz | +3.355 |
Neg logit contributions | |
aber | -7.248 |
nl | -6.682 |
owa | -6.452 |
Causes | -6.269 |
icket | -6.267 |
Token | : |
Token ID | 25 |
Feature activation | -2.47e+00 |
Pos logit contributions | |
ught | +3.944 |
wick | +3.795 |
RG | +3.593 |
wives | +3.443 |
CLA | +3.424 |
Neg logit contributions | |
aber | -6.575 |
nl | -5.935 |
Causes | -5.683 |
owa | -5.666 |
icket | -5.448 |
Token | Le |
Token ID | 1004 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
ught | +1.915 |
wick | +1.804 |
wives | +1.718 |
RG | +1.708 |
CLA | +1.690 |
Neg logit contributions | |
aber | -1.690 |
nl | -1.514 |
Causes | -1.390 |
owa | -1.358 |
[' | -1.355 |
Token | a |
Token ID | 64 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
ught | +6.924 |
wick | +6.489 |
wives | +5.672 |
elin | +5.633 |
riz | +5.592 |
Neg logit contributions | |
裏� | -16.026 |
aber | -15.834 |
nl | -15.527 |
vertisement | -15.512 |
Causes | -15.364 |
Token | Suzuki |
Token ID | 35807 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
ught | +5.451 |
wick | +5.260 |
riz | +4.843 |
wives | +4.751 |
RG | +4.748 |
Neg logit contributions | |
aber | -10.155 |
nl | -9.485 |
icket | -8.805 |
[' | -8.721 |
owa | -8.644 |
Token | , |
Token ID | 11 |
Feature activation | -5.59e+00 |
Pos logit contributions | |
ught | +2.832 |
wick | +2.706 |
RG | +2.536 |
wives | +2.528 |
CLA | +2.510 |
Neg logit contributions | |
aber | -3.114 |
nl | -2.794 |
Causes | -2.618 |
owa | -2.602 |
[' | -2.494 |
Token | The |
Token ID | 383 |
Feature activation | -6.57e-01 |
Pos logit contributions | |
ught | +3.767 |
wick | +3.628 |
RG | +3.449 |
wives | +3.380 |
CLA | +3.371 |
Neg logit contributions | |
aber | -4.243 |
nl | -3.746 |
owa | -3.585 |
Causes | -3.464 |
[' | -3.420 |
Token | Chronicle |
Token ID | 14160 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
ught | +0.441 |
wick | +0.413 |
wives | +0.389 |
RG | +0.387 |
CLA | +0.381 |
Neg logit contributions | |
aber | -0.520 |
nl | -0.477 |
Causes | -0.446 |
owa | -0.432 |
[' | -0.431 |
Token | coordinator |
Token ID | 16052 |
Feature activation | -3.09e+00 |
Pos logit contributions | |
ught | +2.327 |
wick | +2.133 |
wives | +1.986 |
RG | +1.986 |
riz | +1.928 |
Neg logit contributions | |
aber | -3.422 |
nl | -3.123 |
Causes | -2.975 |
[' | -2.866 |
owa | -2.863 |
Token | Dennis |
Token ID | 16902 |
Feature activation | -9.25e-01 |
Pos logit contributions | |
ught | +2.180 |
wick | +2.025 |
wives | +1.941 |
RG | +1.923 |
CLA | +1.885 |
Neg logit contributions | |
aber | -2.296 |
nl | -2.083 |
Causes | -1.957 |
[' | -1.899 |
owa | -1.883 |
Token | Allen |
Token ID | 9659 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
ught | +0.505 |
wick | +0.467 |
wives | +0.434 |
RG | +0.428 |
CLA | +0.420 |
Neg logit contributions | |
aber | -0.849 |
nl | -0.786 |
Causes | -0.741 |
[' | -0.722 |
owa | -0.722 |
Token | the |
Token ID | 262 |
Feature activation | -9.78e+00 |
Pos logit contributions | |
aber | +0.889 |
nl | +0.808 |
Causes | +0.746 |
[' | +0.719 |
owa | +0.716 |
Neg logit contributions | |
ught | -1.020 |
wick | -0.959 |
wives | -0.915 |
RG | -0.907 |
CLA | -0.897 |
Token | past |
Token ID | 1613 |
Feature activation | -8.09e+00 |
Pos logit contributions | |
ught | +4.434 |
wick | +4.011 |
wives | +3.560 |
CLA | +3.497 |
RG | +3.448 |
Neg logit contributions | |
aber | -9.572 |
nl | -8.685 |
Causes | -8.350 |
[' | -8.010 |
owa | -7.973 |
Token | three |
Token ID | 1115 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
ught | +5.309 |
wick | +5.004 |
wives | +4.782 |
elin | +4.760 |
RG | +4.747 |
Neg logit contributions | |
aber | -6.217 |
nl | -5.575 |
Causes | -5.237 |
owa | -5.022 |
[' | -4.984 |
Token | games |
Token ID | 1830 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
ught | +8.158 |
wick | +7.746 |
RG | +7.588 |
wives | +7.190 |
riz | +7.187 |
Neg logit contributions | |
aber | -15.821 |
nl | -13.955 |
Causes | -13.619 |
裏� | -12.964 |
owa | -12.927 |
Token | than |
Token ID | 621 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
ught | +2.655 |
wick | +2.526 |
wives | +2.356 |
RG | +2.353 |
CLA | +2.327 |
Neg logit contributions | |
aber | -2.678 |
nl | -2.446 |
Causes | -2.317 |
owa | -2.186 |
[' | -2.173 |
Token | at |
Token ID | 379 |
Feature activation | -8.30e+00 |
Pos logit contributions | |
ught | +3.361 |
wick | +3.122 |
wives | +2.935 |
RG | +2.926 |
CLA | +2.882 |
Neg logit contributions | |
aber | -3.576 |
nl | -3.262 |
Causes | -3.063 |
owa | -2.931 |
[' | -2.924 |
Token | any |
Token ID | 597 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
ught | +6.181 |
wick | +5.827 |
RG | +5.453 |
riz | +5.426 |
wives | +5.350 |
Neg logit contributions | |
aber | -5.676 |
nl | -5.199 |
Causes | -4.754 |
owa | -4.554 |
[' | -4.521 |
Token | point |
Token ID | 966 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
ught | +5.294 |
wick | +4.754 |
RG | +4.407 |
wives | +4.262 |
CLA | +4.250 |
Neg logit contributions | |
aber | -9.000 |
nl | -8.237 |
Causes | -7.829 |
owa | -7.695 |
[' | -7.492 |
Token | ing |
Token ID | 278 |
Feature activation | -5.83e+00 |
Pos logit contributions | |
ught | +5.646 |
wick | +5.457 |
riz | +5.037 |
RG | +5.007 |
CLA | +4.862 |
Neg logit contributions | |
aber | -7.638 |
nl | -7.231 |
[' | -6.613 |
Causes | -6.552 |
裏� | -6.528 |
Token | contributor |
Token ID | 18920 |
Feature activation | -6.78e+00 |
Pos logit contributions | |
ught | +4.038 |
wick | +3.873 |
RG | +3.673 |
wives | +3.591 |
riz | +3.561 |
Neg logit contributions | |
aber | -4.329 |
nl | -3.880 |
[' | -3.478 |
owa | -3.463 |
Causes | -3.453 |
Token | : |
Token ID | 25 |
Feature activation | -7.42e+00 |
Pos logit contributions | |
ught | +4.240 |
wick | +3.985 |
wives | +3.731 |
RG | +3.707 |
CLA | +3.693 |
Neg logit contributions | |
aber | -5.483 |
nl | -4.979 |
Causes | -4.619 |
owa | -4.513 |
[' | -4.476 |
Token | David |
Token ID | 3271 |
Feature activation | -8.68e+00 |
Pos logit contributions | |
ught | +5.200 |
wick | +4.949 |
CLA | +4.692 |
RG | +4.676 |
wives | +4.675 |
Neg logit contributions | |
aber | -5.354 |
nl | -4.736 |
Causes | -4.318 |
[' | -4.304 |
owa | -4.298 |
Token | A |
Token ID | 317 |
Feature activation | -4.48e+00 |
Pos logit contributions | |
ught | +6.057 |
wick | +5.954 |
riz | +5.495 |
RG | +5.471 |
CLA | +5.466 |
Neg logit contributions | |
aber | -5.914 |
nl | -5.433 |
owa | -4.882 |
Causes | -4.858 |
[' | -4.851 |
Token | . |
Token ID | 13 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
ught | +3.324 |
wick | +3.142 |
wives | +2.936 |
riz | +2.920 |
CLA | +2.900 |
Neg logit contributions | |
aber | -3.140 |
nl | -2.851 |
Causes | -2.697 |
owa | -2.589 |
[' | -2.572 |
Token | Sle |
Token ID | 19498 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
wick | +7.710 |
ught | +7.457 |
riz | +6.434 |
Certified | +6.385 |
elin | +6.383 |
Neg logit contributions | |
aber | -15.760 |
nl | -14.538 |
owa | -13.932 |
tool | -13.776 |
[' | -13.314 |
Token | et |
Token ID | 316 |
Feature activation | -3.80e+00 |
Pos logit contributions | |
ught | +1.811 |
wick | +1.711 |
wives | +1.584 |
elin | +1.577 |
RG | +1.554 |
Neg logit contributions | |
aber | -1.747 |
nl | -1.603 |
Causes | -1.549 |
[' | -1.447 |
owa | -1.441 |
Token | , |
Token ID | 11 |
Feature activation | -8.11e+00 |
Pos logit contributions | |
ught | +2.734 |
wick | +2.608 |
RG | +2.460 |
wives | +2.440 |
CLA | +2.427 |
Neg logit contributions | |
aber | -2.758 |
nl | -2.487 |
Causes | -2.317 |
[' | -2.229 |
owa | -2.226 |
Token | d |
Token ID | 288 |
Feature activation | -5.44e+00 |
Pos logit contributions | |
ught | +5.204 |
wick | +4.929 |
wives | +4.706 |
RG | +4.705 |
CLA | +4.703 |
Neg logit contributions | |
aber | -6.247 |
nl | -5.447 |
Causes | -5.030 |
[' | -5.026 |
owa | -4.958 |
Token | sle |
Token ID | 26738 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
ught | +4.326 |
wick | +4.084 |
elin | +3.885 |
wives | +3.873 |
riz | +3.850 |
Neg logit contributions | |
aber | -3.438 |
nl | -3.054 |
Causes | -2.989 |
owa | -2.753 |
[' | -2.753 |
Token | racism |
Token ID | 10713 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
ught | +0.143 |
wick | +0.133 |
wives | +0.126 |
RG | +0.125 |
CLA | +0.123 |
Neg logit contributions | |
aber | -0.164 |
nl | -0.151 |
Causes | -0.141 |
[' | -0.136 |
owa | -0.135 |
Token | and |
Token ID | 290 |
Feature activation | +3.87e+00 |
Pos logit contributions | |
aber | +0.122 |
nl | +0.112 |
Causes | +0.104 |
[' | +0.100 |
owa | +0.100 |
Neg logit contributions | |
ught | -0.123 |
wick | -0.115 |
wives | -0.110 |
RG | -0.108 |
CLA | -0.107 |
Token | sexism |
Token ID | 24953 |
Feature activation | -6.26e-01 |
Pos logit contributions | |
aber | +3.311 |
nl | +3.127 |
Causes | +2.938 |
[' | +2.872 |
owa | +2.854 |
Neg logit contributions | |
ught | -2.254 |
wick | -2.107 |
wives | -1.978 |
RG | -1.953 |
CLA | -1.933 |
Token | I |
Token ID | 314 |
Feature activation | +7.27e+00 |
Pos logit contributions | |
ught | +0.449 |
wick | +0.420 |
wives | +0.400 |
RG | +0.394 |
CLA | +0.390 |
Neg logit contributions | |
aber | -0.466 |
nl | -0.426 |
Causes | -0.397 |
owa | -0.381 |
[' | -0.381 |
Token | was |
Token ID | 373 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
aber | +4.694 |
nl | +4.267 |
[' | +3.918 |
Causes | +3.902 |
owa | +3.842 |
Neg logit contributions | |
ught | -5.601 |
wick | -5.275 |
wives | -5.080 |
RG | -5.025 |
CLA | -4.908 |
Token | telling |
Token ID | 5149 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
aber | +1.075 |
nl | +0.980 |
Causes | +0.906 |
[' | +0.879 |
owa | +0.866 |
Neg logit contributions | |
ught | -1.208 |
wick | -1.132 |
wives | -1.077 |
RG | -1.072 |
CLA | -1.059 |
Token | you |
Token ID | 345 |
Feature activation | +9.73e+00 |
Pos logit contributions | |
aber | +6.861 |
nl | +6.232 |
Causes | +5.913 |
[' | +5.886 |
ys | +5.264 |
Neg logit contributions | |
ught | -10.538 |
wick | -10.194 |
elin | -9.498 |
CLA | -9.453 |
wives | -9.430 |
Token | about |
Token ID | 546 |
Feature activation | +3.39e-01 |
Pos logit contributions | |
aber | +5.686 |
nl | +5.102 |
[' | +4.707 |
Causes | +4.681 |
owa | +4.417 |
Neg logit contributions | |
ught | -7.851 |
wick | -7.458 |
CLA | -7.139 |
RG | -7.131 |
elin | -7.077 |
Token | ? |
Token ID | 30 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
aber | +0.245 |
nl | +0.224 |
Causes | +0.209 |
[' | +0.201 |
owa | +0.200 |
Neg logit contributions | |
ught | -0.251 |
wick | -0.235 |
wives | -0.223 |
RG | -0.221 |
CLA | -0.219 |
Token | Well |
Token ID | 3894 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
aber | +2.824 |
nl | +2.632 |
Causes | +2.480 |
[' | +2.352 |
owa | +2.260 |
Neg logit contributions | |
ught | -3.286 |
wick | -3.048 |
wives | -2.892 |
elin | -2.869 |
RG | -2.857 |
Token | , |
Token ID | 11 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
aber | +2.019 |
nl | +1.824 |
Causes | +1.679 |
[' | +1.627 |
owa | +1.606 |
Neg logit contributions | |
ught | -2.522 |
wick | -2.361 |
wives | -2.258 |
RG | -2.237 |
CLA | -2.217 |
Token | minute |
Token ID | 5664 |
Feature activation | +6.40e+00 |
Pos logit contributions | |
aber | +4.215 |
nl | +3.911 |
Causes | +3.606 |
owa | +3.451 |
[' | +3.437 |
Neg logit contributions | |
ught | -4.668 |
wick | -4.546 |
wives | -4.363 |
RG | -4.295 |
CLA | -4.246 |
Token | and |
Token ID | 290 |
Feature activation | +5.91e+00 |
Pos logit contributions | |
aber | +4.316 |
nl | +3.910 |
[' | +3.622 |
Causes | +3.581 |
owa | +3.486 |
Neg logit contributions | |
ught | -4.820 |
wick | -4.554 |
RG | -4.377 |
wives | -4.339 |
CLA | -4.268 |
Token | nineteen |
Token ID | 43063 |
Feature activation | +6.41e+00 |
Pos logit contributions | |
aber | +3.845 |
nl | +3.536 |
Causes | +3.320 |
[' | +3.213 |
owa | +3.154 |
Neg logit contributions | |
ught | -4.538 |
wick | -4.292 |
wives | -4.095 |
CLA | -4.067 |
RG | -4.064 |
Token | seconds |
Token ID | 4201 |
Feature activation | +7.69e+00 |
Pos logit contributions | |
aber | +3.938 |
nl | +3.602 |
Causes | +3.342 |
[' | +3.255 |
owa | +3.230 |
Neg logit contributions | |
ught | -5.111 |
wick | -4.814 |
RG | -4.620 |
wives | -4.616 |
CLA | -4.593 |
Token | into |
Token ID | 656 |
Feature activation | +5.82e+00 |
Pos logit contributions | |
aber | +4.950 |
nl | +4.484 |
[' | +4.199 |
Causes | +4.145 |
owa | +4.001 |
Neg logit contributions | |
ught | -5.917 |
wick | -5.553 |
RG | -5.323 |
wives | -5.306 |
CLA | -5.245 |
Token | launch |
Token ID | 4219 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
aber | +3.663 |
nl | +3.332 |
Causes | +3.079 |
[' | +2.956 |
owa | +2.909 |
Neg logit contributions | |
ught | -4.586 |
wick | -4.400 |
wives | -4.230 |
CLA | -4.178 |
RG | -4.128 |
Token | . |
Token ID | 13 |
Feature activation | +5.05e+00 |
Pos logit contributions | |
aber | +5.693 |
nl | +5.347 |
[' | +4.748 |
Causes | +4.666 |
gy | +4.530 |
Neg logit contributions | |
ught | -8.870 |
wick | -8.396 |
wives | -8.048 |
CLA | -7.976 |
RG | -7.964 |
Token | The |
Token ID | 383 |
Feature activation | +4.43e+00 |
Pos logit contributions | |
aber | +3.271 |
nl | +3.064 |
Causes | +2.901 |
[' | +2.709 |
EE | +2.596 |
Neg logit contributions | |
ught | -4.048 |
wick | -3.757 |
wives | -3.578 |
CLA | -3.507 |
RG | -3.504 |
Token | rocket |
Token ID | 10701 |
Feature activation | +4.09e+00 |
Pos logit contributions | |
aber | +3.207 |
nl | +2.948 |
Causes | +2.799 |
[' | +2.671 |
owa | +2.639 |
Neg logit contributions | |
ught | -3.174 |
wick | -2.990 |
wives | -2.826 |
CLA | -2.812 |
RG | -2.808 |
Token | had |
Token ID | 550 |
Feature activation | +1.78e+00 |
Pos logit contributions | |
aber | +2.762 |
nl | +2.537 |
Causes | +2.338 |
[' | +2.275 |
owa | +2.248 |
Neg logit contributions | |
ught | -3.154 |
wick | -2.965 |
wives | -2.821 |
RG | -2.810 |
CLA | -2.790 |
Token | to |
Token ID | 284 |
Feature activation | +5.61e+00 |
Pos logit contributions | |
aber | +1.268 |
nl | +1.162 |
Causes | +1.076 |
[' | +1.042 |
owa | +1.033 |
Neg logit contributions | |
ught | -1.326 |
wick | -1.247 |
wives | -1.187 |
RG | -1.179 |
CLA | -1.167 |
Token | double |
Token ID | 4274 |
Feature activation | +5.64e-01 |
Pos logit contributions | |
aber | +5.790 |
nl | +5.336 |
Causes | +4.899 |
[' | +4.825 |
owa | +4.794 |
Neg logit contributions | |
ught | -5.468 |
wick | -5.131 |
wives | -4.888 |
RG | -4.869 |
CLA | -4.766 |
Token | - |
Token ID | 12 |
Feature activation | +5.46e+00 |
Pos logit contributions | |
aber | +0.411 |
nl | +0.376 |
Causes | +0.349 |
[' | +0.337 |
owa | +0.335 |
Neg logit contributions | |
ught | -0.414 |
wick | -0.389 |
wives | -0.369 |
RG | -0.365 |
CLA | -0.361 |
Token | o |
Token ID | 78 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
aber | +3.404 |
nl | +3.033 |
[' | +2.630 |
Causes | +2.629 |
owa | +2.603 |
Neg logit contributions | |
ught | -4.542 |
wick | -4.239 |
wives | -4.082 |
RG | -4.063 |
CLA | -4.033 |
Token | vert |
Token ID | 1851 |
Feature activation | +6.19e+00 |
Pos logit contributions | |
aber | +0.846 |
nl | +0.747 |
Causes | +0.665 |
[' | +0.639 |
owa | +0.638 |
Neg logit contributions | |
ught | -1.418 |
wick | -1.363 |
wives | -1.307 |
RG | -1.300 |
CLA | -1.284 |
Token | ime |
Token ID | 524 |
Feature activation | +8.31e+00 |
Pos logit contributions | |
aber | +3.665 |
nl | +3.040 |
[' | +2.707 |
Causes | +2.695 |
owa | +2.643 |
Neg logit contributions | |
ught | -5.403 |
wick | -5.109 |
wives | -5.053 |
CLA | -4.918 |
RG | -4.897 |
Token | goal |
Token ID | 3061 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
aber | +5.604 |
nl | +5.146 |
Causes | +4.654 |
[' | +4.565 |
owa | +4.540 |
Neg logit contributions | |
ught | -6.028 |
wick | -5.817 |
wives | -5.624 |
RG | -5.543 |
CLA | -5.492 |
Token | clin |
Token ID | 5327 |
Feature activation | -2.48e+00 |
Pos logit contributions | |
aber | +6.407 |
nl | +5.909 |
Causes | +5.255 |
owa | +5.181 |
[' | +5.175 |
Neg logit contributions | |
ught | -7.663 |
wick | -7.216 |
RG | -7.089 |
wives | -6.889 |
CLA | -6.803 |
Token | ched |
Token ID | 1740 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
ught | +1.560 |
wick | +1.462 |
wives | +1.352 |
RG | +1.319 |
riz | +1.316 |
Neg logit contributions | |
aber | -2.074 |
nl | -1.900 |
Causes | -1.815 |
[' | -1.738 |
owa | -1.730 |
Token | New |
Token ID | 968 |
Feature activation | +3.87e+00 |
Pos logit contributions | |
aber | +2.904 |
nl | +2.662 |
Causes | +2.432 |
[' | +2.363 |
owa | +2.342 |
Neg logit contributions | |
ught | -3.210 |
wick | -3.021 |
wives | -2.893 |
RG | -2.851 |
riz | -2.792 |
Token | Jersey |
Token ID | 8221 |
Feature activation | +4.04e+00 |
Pos logit contributions | |
aber | +2.684 |
nl | +2.450 |
Causes | +2.194 |
owa | +2.112 |
[' | +2.079 |
Neg logit contributions | |
ught | -2.976 |
wick | -2.770 |
RG | -2.678 |
wives | -2.672 |
CLA | -2.630 |
Token | � |
Token ID | 447 |
Feature activation | -2.21e-04 |
Pos logit contributions | |
aber | +2.593 |
nl | +2.369 |
Causes | +2.162 |
[' | +2.124 |
owa | +2.072 |
Neg logit contributions | |
ught | -3.279 |
wick | -3.054 |
wives | -2.932 |
RG | -2.899 |
CLA | -2.861 |
Token | in |
Token ID | 287 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
aber | +0.670 |
nl | +0.612 |
Causes | +0.571 |
[' | +0.551 |
owa | +0.548 |
Neg logit contributions | |
ught | -0.652 |
wick | -0.610 |
wives | -0.577 |
RG | -0.572 |
CLA | -0.567 |
Token | how |
Token ID | 703 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
aber | +1.081 |
nl | +0.988 |
Causes | +0.920 |
[' | +0.886 |
owa | +0.880 |
Neg logit contributions | |
ught | -1.143 |
wick | -1.075 |
wives | -1.019 |
RG | -1.009 |
CLA | -1.001 |
Token | Good |
Token ID | 4599 |
Feature activation | -3.32e-01 |
Pos logit contributions | |
ught | +1.000 |
wick | +0.935 |
wives | +0.890 |
RG | +0.879 |
CLA | +0.868 |
Neg logit contributions | |
aber | -1.021 |
nl | -0.931 |
Causes | -0.863 |
[' | -0.833 |
owa | -0.831 |
Token | will |
Token ID | 10594 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
ught | +0.243 |
wick | +0.229 |
wives | +0.217 |
RG | +0.214 |
CLA | +0.212 |
Neg logit contributions | |
aber | -0.242 |
nl | -0.221 |
Causes | -0.205 |
[' | -0.198 |
owa | -0.197 |
Token | determines |
Token ID | 15947 |
Feature activation | +7.23e+00 |
Pos logit contributions | |
aber | +2.075 |
nl | +1.896 |
Causes | +1.755 |
[' | +1.702 |
owa | +1.680 |
Neg logit contributions | |
ught | -2.387 |
wick | -2.234 |
wives | -2.126 |
RG | -2.113 |
CLA | -2.096 |
Token | what |
Token ID | 644 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
aber | +4.538 |
nl | +4.188 |
Causes | +3.956 |
[' | +3.806 |
owa | +3.704 |
Neg logit contributions | |
ught | -5.648 |
wick | -5.419 |
CLA | -5.106 |
RG | -5.097 |
riz | -5.051 |
Token | it |
Token ID | 340 |
Feature activation | +3.33e+00 |
Pos logit contributions | |
aber | +7.297 |
nl | +6.977 |
Causes | +6.753 |
[' | +6.521 |
owa | +6.333 |
Neg logit contributions | |
ught | -7.811 |
wick | -7.506 |
RG | -7.004 |
agos | -6.942 |
riz | -6.905 |
Token | pays |
Token ID | 13831 |
Feature activation | +8.01e-01 |
Pos logit contributions | |
aber | +2.346 |
nl | +2.148 |
Causes | +2.002 |
[' | +1.952 |
owa | +1.926 |
Neg logit contributions | |
ught | -2.493 |
wick | -2.341 |
wives | -2.224 |
RG | -2.210 |
CLA | -2.174 |
Token | in |
Token ID | 287 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
aber | +0.570 |
nl | +0.521 |
Causes | +0.485 |
[' | +0.468 |
owa | +0.464 |
Neg logit contributions | |
ught | -0.600 |
wick | -0.564 |
wives | -0.533 |
RG | -0.531 |
CLA | -0.525 |
Token | executive |
Token ID | 4640 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
ught | +1.234 |
wick | +1.141 |
wives | +1.078 |
RG | +1.060 |
CLA | +1.040 |
Neg logit contributions | |
aber | -1.636 |
nl | -1.506 |
Causes | -1.410 |
owa | -1.364 |
[' | -1.362 |
Token | bonuses |
Token ID | 17568 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
aber | +0.237 |
nl | +0.218 |
Causes | +0.203 |
[' | +0.196 |
owa | +0.196 |
Neg logit contributions | |
ught | -0.213 |
wick | -0.199 |
wives | -0.188 |
RG | -0.186 |
CLA | -0.184 |
Token | > |
Token ID | 29 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
aber | +1.612 |
nl | +1.482 |
Causes | +1.374 |
[' | +1.347 |
owa | +1.321 |
Neg logit contributions | |
ught | -1.607 |
wick | -1.506 |
wives | -1.445 |
RG | -1.414 |
CLA | -1.404 |
Token | |
Token ID | 7359 |
Feature activation | -4.22e+00 |
Pos logit contributions | |
ught | +2.171 |
wick | +2.032 |
wives | +1.915 |
RG | +1.904 |
CLA | +1.865 |
Neg logit contributions | |
aber | -2.702 |
nl | -2.462 |
Causes | -2.296 |
owa | -2.240 |
[' | -2.226 |
Token | li |
Token ID | 4528 |
Feature activation | +4.62e+00 |
Pos logit contributions | |
ught | +3.408 |
wick | +3.226 |
RG | +3.040 |
CLA | +3.040 |
wives | +3.038 |
Neg logit contributions | |
aber | -2.671 |
nl | -2.377 |
Causes | -2.300 |
owa | -2.141 |
[' | -2.110 |
Token | > |
Token ID | 29 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
aber | +3.183 |
nl | +2.915 |
[' | +2.694 |
Causes | +2.680 |
owa | +2.561 |
Neg logit contributions | |
ught | -3.513 |
wick | -3.306 |
wives | -3.189 |
CLA | -3.089 |
elin | -3.086 |
Token | |
Token ID | 7359 |
Feature activation | -2.31e+00 |
Pos logit contributions | |
ught | +0.933 |
wick | +0.872 |
wives | +0.825 |
RG | +0.817 |
CLA | +0.804 |
Neg logit contributions | |
aber | -1.080 |
nl | -0.989 |
Causes | -0.924 |
owa | -0.894 |
[' | -0.893 |
Token | ul |
Token ID | 377 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
ught | +1.285 |
wick | +1.190 |
wives | +1.095 |
RG | +1.087 |
CLA | +1.066 |
Neg logit contributions | |
aber | -2.073 |
nl | -1.912 |
Causes | -1.852 |
owa | -1.781 |
[' | -1.764 |
Token | > |
Token ID | 29 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
aber | +5.897 |
nl | +5.561 |
[' | +5.190 |
Causes | +4.751 |
xe | +4.631 |
Neg logit contributions | |
ught | -8.332 |
tradem | -7.984 |
wick | -7.761 |
wives | -7.703 |
elin | -7.512 |
Token | |
Token ID | 7359 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
aber | +0.189 |
nl | +0.173 |
Causes | +0.162 |
[' | +0.156 |
owa | +0.156 |
Neg logit contributions | |
ught | -0.172 |
wick | -0.161 |
wives | -0.152 |
RG | -0.150 |
CLA | -0.149 |
Token | body |
Token ID | 2618 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
aber | +1.682 |
nl | +1.556 |
Causes | +1.402 |
[' | +1.386 |
owa | +1.359 |
Neg logit contributions | |
ught | -1.715 |
wick | -1.610 |
wives | -1.536 |
RG | -1.513 |
riz | -1.493 |
Token | > |
Token ID | 29 |
Feature activation | -2.88e-01 |
Pos logit contributions | |
aber | +6.083 |
nl | +5.839 |
[' | +5.614 |
Causes | +4.836 |
xe | +4.779 |
Neg logit contributions | |
ught | -9.422 |
tradem | -9.106 |
wives | -8.691 |
wick | -8.643 |
ewitness | -8.405 |
Token |
|
Token ID | 198 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
ught | +0.202 |
wick | +0.189 |
wives | +0.179 |
RG | +0.177 |
CLA | +0.175 |
Neg logit contributions | |
aber | -0.219 |
nl | -0.201 |
Causes | -0.188 |
[' | -0.181 |
owa | -0.181 |
Token | manage |
Token ID | 6687 |
Feature activation | -5.53e+00 |
Pos logit contributions | |
ught | +0.155 |
wick | +0.146 |
wives | +0.138 |
RG | +0.137 |
CLA | +0.135 |
Neg logit contributions | |
aber | -0.148 |
nl | -0.135 |
Causes | -0.126 |
[' | -0.121 |
owa | -0.121 |
Token | electronic |
Token ID | 7914 |
Feature activation | -4.00e+00 |
Pos logit contributions | |
ught | +3.694 |
wick | +3.471 |
wives | +3.265 |
RG | +3.233 |
elin | +3.161 |
Neg logit contributions | |
aber | -4.277 |
nl | -3.883 |
Causes | -3.651 |
owa | -3.500 |
[' | -3.499 |
Token | and |
Token ID | 290 |
Feature activation | +5.95e-01 |
Pos logit contributions | |
ught | +2.547 |
wick | +2.348 |
wives | +2.233 |
RG | +2.193 |
CLA | +2.148 |
Neg logit contributions | |
aber | -3.283 |
nl | -3.008 |
Causes | -2.829 |
[' | -2.724 |
owa | -2.715 |
Token | print |
Token ID | 3601 |
Feature activation | +1.72e+00 |
Pos logit contributions | |
aber | +0.460 |
nl | +0.424 |
Causes | +0.396 |
[' | +0.382 |
owa | +0.381 |
Neg logit contributions | |
ught | -0.409 |
wick | -0.382 |
wives | -0.362 |
RG | -0.357 |
CLA | -0.354 |
Token | collections |
Token ID | 17268 |
Feature activation | +8.47e-01 |
Pos logit contributions | |
aber | +1.370 |
nl | +1.274 |
Causes | +1.183 |
[' | +1.151 |
owa | +1.147 |
Neg logit contributions | |
ught | -1.136 |
wick | -1.060 |
wives | -0.999 |
RG | -0.982 |
CLA | -0.977 |
Token | . |
Token ID | 13 |
Feature activation | +4.59e+00 |
Pos logit contributions | |
aber | +0.585 |
nl | +0.533 |
Causes | +0.492 |
[' | +0.474 |
owa | +0.471 |
Neg logit contributions | |
ught | -0.654 |
wick | -0.616 |
wives | -0.585 |
RG | -0.580 |
CLA | -0.574 |
Token | These |
Token ID | 2312 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
aber | +3.115 |
nl | +2.889 |
Causes | +2.708 |
[' | +2.551 |
owa | +2.491 |
Neg logit contributions | |
ught | -3.578 |
wick | -3.317 |
wives | -3.177 |
elin | -3.122 |
RG | -3.089 |
Token | platforms |
Token ID | 9554 |
Feature activation | -3.90e+00 |
Pos logit contributions | |
aber | +0.146 |
nl | +0.134 |
Causes | +0.124 |
[' | +0.119 |
owa | +0.119 |
Neg logit contributions | |
ught | -0.152 |
wick | -0.142 |
wives | -0.135 |
RG | -0.134 |
CLA | -0.132 |
Token | follow |
Token ID | 1061 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
ught | +2.749 |
wick | +2.551 |
wives | +2.426 |
RG | +2.386 |
riz | +2.359 |
Neg logit contributions | |
aber | -2.930 |
nl | -2.675 |
Causes | -2.521 |
owa | -2.399 |
[' | -2.365 |
Token | the |
Token ID | 262 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
ught | +2.984 |
wick | +2.793 |
wives | +2.648 |
RG | +2.633 |
CLA | +2.580 |
Neg logit contributions | |
aber | -3.374 |
nl | -3.130 |
Causes | -2.902 |
[' | -2.808 |
owa | -2.805 |
Token | services |
Token ID | 2594 |
Feature activation | -2.71e+00 |
Pos logit contributions | |
ught | +0.950 |
wick | +0.886 |
wives | +0.838 |
RG | +0.829 |
riz | +0.818 |
Neg logit contributions | |
aber | -1.049 |
nl | -0.968 |
Causes | -0.899 |
[' | -0.869 |
owa | -0.868 |
Token | s |
Token ID | 82 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
aber | +2.730 |
nl | +2.512 |
Causes | +2.302 |
[' | +2.187 |
owa | +2.122 |
Neg logit contributions | |
ught | -4.672 |
wick | -4.458 |
wives | -4.266 |
RG | -4.261 |
CLA | -4.199 |
Token | her |
Token ID | 607 |
Feature activation | -4.73e+00 |
Pos logit contributions | |
aber | +2.362 |
nl | +2.169 |
Causes | +2.039 |
[' | +1.965 |
owa | +1.933 |
Neg logit contributions | |
ught | -2.334 |
wick | -2.197 |
RG | -2.069 |
wives | -2.062 |
CLA | -2.049 |
Token | burned |
Token ID | 11544 |
Feature activation | -4.89e-01 |
Pos logit contributions | |
ught | +2.674 |
wick | +2.439 |
wives | +2.307 |
RG | +2.254 |
riz | +2.247 |
Neg logit contributions | |
aber | -4.195 |
nl | -3.863 |
Causes | -3.602 |
owa | -3.514 |
[' | -3.451 |
Token | arm |
Token ID | 3211 |
Feature activation | +7.07e-01 |
Pos logit contributions | |
ught | +0.368 |
wick | +0.346 |
wives | +0.328 |
RG | +0.325 |
CLA | +0.322 |
Neg logit contributions | |
aber | -0.347 |
nl | -0.317 |
Causes | -0.293 |
[' | -0.282 |
owa | -0.281 |
Token |
|
Token ID | 198 |
Feature activation | -2.73e+00 |
Pos logit contributions | |
aber | +0.514 |
nl | +0.470 |
Causes | +0.438 |
[' | +0.421 |
owa | +0.419 |
Neg logit contributions | |
ught | -0.519 |
wick | -0.487 |
wives | -0.462 |
RG | -0.458 |
CLA | -0.452 |
Token |
|
Token ID | 198 |
Feature activation | +6.06e-01 |
Pos logit contributions | |
ught | +1.795 |
wick | +1.693 |
wives | +1.596 |
RG | +1.580 |
CLA | +1.558 |
Neg logit contributions | |
aber | -2.189 |
nl | -1.983 |
Causes | -1.882 |
owa | -1.826 |
[' | -1.773 |
Token | T |
Token ID | 51 |
Feature activation | -4.71e+00 |
Pos logit contributions | |
aber | +0.421 |
nl | +0.384 |
Causes | +0.354 |
[' | +0.343 |
owa | +0.339 |
Neg logit contributions | |
ught | -0.465 |
wick | -0.438 |
wives | -0.416 |
RG | -0.411 |
CLA | -0.407 |
Token | ori |
Token ID | 10145 |
Feature activation | -3.75e+00 |
Pos logit contributions | |
ught | +1.893 |
wick | +1.702 |
riz | +1.496 |
wives | +1.490 |
RG | +1.468 |
Neg logit contributions | |
aber | -4.917 |
nl | -4.643 |
Causes | -4.489 |
[' | -4.332 |
裏� | -4.275 |
Token | and |
Token ID | 290 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
ught | +2.797 |
wick | +2.619 |
wives | +2.485 |
CLA | +2.424 |
RG | +2.418 |
Neg logit contributions | |
aber | -2.680 |
nl | -2.441 |
Causes | -2.222 |
owa | -2.150 |
[' | -2.120 |
Token | family |
Token ID | 1641 |
Feature activation | -3.77e-01 |
Pos logit contributions | |
aber | +0.164 |
nl | +0.150 |
Causes | +0.140 |
[' | +0.135 |
owa | +0.134 |
Neg logit contributions | |
ught | -0.161 |
wick | -0.151 |
wives | -0.143 |
RG | -0.141 |
CLA | -0.140 |
Token | and |
Token ID | 290 |
Feature activation | +6.71e+00 |
Pos logit contributions | |
ught | +0.263 |
wick | +0.246 |
wives | +0.233 |
RG | +0.229 |
CLA | +0.227 |
Neg logit contributions | |
aber | -0.290 |
nl | -0.265 |
Causes | -0.248 |
owa | -0.238 |
[' | -0.237 |
Token | This |
Token ID | 1212 |
Feature activation | -7.38e+00 |
Pos logit contributions | |
ught | +4.677 |
wick | +4.398 |
wives | +4.221 |
RG | +4.137 |
CLA | +4.086 |
Neg logit contributions | |
aber | -4.264 |
nl | -3.896 |
Causes | -3.740 |
owa | -3.535 |
[' | -3.429 |
Token | means |
Token ID | 1724 |
Feature activation | -7.91e+00 |
Pos logit contributions | |
ught | +5.144 |
wick | +4.761 |
wives | +4.392 |
RG | +4.337 |
riz | +4.325 |
Neg logit contributions | |
aber | -5.371 |
nl | -4.993 |
Causes | -4.555 |
owa | -4.442 |
[' | -4.360 |
Token | that |
Token ID | 326 |
Feature activation | -7.98e+00 |
Pos logit contributions | |
ught | +5.033 |
wick | +4.800 |
wives | +4.546 |
riz | +4.439 |
RG | +4.425 |
Neg logit contributions | |
aber | -6.065 |
nl | -5.594 |
Causes | -5.296 |
owa | -5.025 |
[' | -4.944 |
Token | the |
Token ID | 262 |
Feature activation | -4.33e+00 |
Pos logit contributions | |
ught | +5.152 |
wick | +4.908 |
wives | +4.722 |
riz | +4.511 |
RG | +4.476 |
Neg logit contributions | |
aber | -6.082 |
nl | -5.622 |
Causes | -5.218 |
owa | -5.019 |
[' | -4.906 |
Token | Government |
Token ID | 5070 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
ught | +3.039 |
wick | +2.853 |
wives | +2.706 |
riz | +2.629 |
RG | +2.615 |
Neg logit contributions | |
aber | -3.240 |
nl | -2.995 |
Causes | -2.746 |
owa | -2.670 |
[' | -2.658 |
Token | itself |
Token ID | 2346 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
ught | +1.382 |
wick | +1.311 |
wives | +1.248 |
RG | +1.229 |
riz | +1.214 |
Neg logit contributions | |
aber | -1.315 |
nl | -1.198 |
Causes | -1.110 |
owa | -1.067 |
[' | -1.059 |
Token | will |
Token ID | 481 |
Feature activation | -8.01e-01 |
Pos logit contributions | |
aber | +1.444 |
nl | +1.314 |
Causes | +1.214 |
[' | +1.179 |
owa | +1.160 |
Neg logit contributions | |
ught | -1.682 |
wick | -1.580 |
wives | -1.502 |
RG | -1.496 |
CLA | -1.480 |
Token | be |
Token ID | 307 |
Feature activation | -8.36e-01 |
Pos logit contributions | |
ught | +0.576 |
wick | +0.541 |
wives | +0.511 |
RG | +0.505 |
CLA | +0.500 |
Neg logit contributions | |
aber | -0.596 |
nl | -0.545 |
Causes | -0.510 |
owa | -0.487 |
[' | -0.487 |
Token | subject |
Token ID | 2426 |
Feature activation | -5.54e+00 |
Pos logit contributions | |
ught | +0.573 |
wick | +0.538 |
wives | +0.508 |
RG | +0.502 |
CLA | +0.495 |
Neg logit contributions | |
aber | -0.647 |
nl | -0.594 |
Causes | -0.557 |
owa | -0.535 |
[' | -0.534 |
Token | to |
Token ID | 284 |
Feature activation | -6.40e+00 |
Pos logit contributions | |
ught | +3.668 |
wick | +3.445 |
wives | +3.262 |
RG | +3.211 |
riz | +3.206 |
Neg logit contributions | |
aber | -4.271 |
nl | -3.883 |
Causes | -3.694 |
owa | -3.508 |
[' | -3.474 |
Token | sh |
Token ID | 427 |
Feature activation | -5.82e+00 |
Pos logit contributions | |
ught | +4.202 |
wick | +3.959 |
wives | +3.742 |
riz | +3.683 |
RG | +3.660 |
Neg logit contributions | |
aber | -4.919 |
nl | -4.534 |
Causes | -4.231 |
owa | -4.108 |
[' | -3.980 |
Token | ition |
Token ID | 653 |
Feature activation | +3.66e+00 |
Pos logit contributions | |
aber | +2.683 |
nl | +2.357 |
Causes | +2.043 |
owa | +2.016 |
[' | +2.013 |
Neg logit contributions | |
ught | -4.279 |
wick | -4.191 |
wives | -4.055 |
RG | -4.007 |
CLA | -3.939 |
Token | standing |
Token ID | 5055 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
aber | +2.509 |
nl | +2.288 |
Causes | +2.106 |
[' | +2.069 |
owa | +2.029 |
Neg logit contributions | |
ught | -2.766 |
wick | -2.655 |
RG | -2.523 |
wives | -2.506 |
CLA | -2.468 |
Token | in |
Token ID | 287 |
Feature activation | +2.44e+00 |
Pos logit contributions | |
aber | +0.791 |
nl | +0.721 |
Causes | +0.669 |
[' | +0.646 |
owa | +0.642 |
Neg logit contributions | |
ught | -0.830 |
wick | -0.781 |
wives | -0.741 |
RG | -0.736 |
CLA | -0.726 |
Token | the |
Token ID | 262 |
Feature activation | +2.72e+00 |
Pos logit contributions | |
aber | +1.593 |
nl | +1.454 |
Causes | +1.330 |
[' | +1.278 |
owa | +1.276 |
Neg logit contributions | |
ught | -1.963 |
wick | -1.835 |
wives | -1.776 |
RG | -1.738 |
CLA | -1.727 |
Token | security |
Token ID | 2324 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
aber | +2.016 |
nl | +1.861 |
Causes | +1.733 |
[' | +1.674 |
owa | +1.668 |
Neg logit contributions | |
ught | -1.931 |
wick | -1.786 |
wives | -1.723 |
RG | -1.695 |
CLA | -1.685 |
Token | line |
Token ID | 1627 |
Feature activation | +3.68e+00 |
Pos logit contributions | |
aber | +2.895 |
nl | +2.713 |
Causes | +2.524 |
[' | +2.478 |
owa | +2.455 |
Neg logit contributions | |
ught | -2.415 |
wick | -2.244 |
wives | -2.155 |
RG | -2.124 |
CLA | -2.081 |
Token | : |
Token ID | 25 |
Feature activation | +6.03e+00 |
Pos logit contributions | |
aber | +2.410 |
nl | +2.186 |
Causes | +1.993 |
[' | +1.960 |
owa | +1.933 |
Neg logit contributions | |
ught | -2.924 |
wick | -2.756 |
wives | -2.630 |
RG | -2.627 |
CLA | -2.590 |
Token | a |
Token ID | 257 |
Feature activation | +7.72e+00 |
Pos logit contributions | |
aber | +4.127 |
nl | +3.788 |
Causes | +3.547 |
[' | +3.411 |
owa | +3.318 |
Neg logit contributions | |
ught | -4.521 |
wick | -4.193 |
wives | -3.990 |
RG | -3.978 |
riz | -3.911 |
Token | tall |
Token ID | 7331 |
Feature activation | +8.14e+00 |
Pos logit contributions | |
aber | +5.344 |
nl | +4.979 |
Causes | +4.568 |
[' | +4.486 |
owa | +4.402 |
Neg logit contributions | |
ught | -5.361 |
wick | -5.100 |
wives | -4.972 |
RG | -4.874 |
CLA | -4.818 |
Token | , |
Token ID | 11 |
Feature activation | +9.16e+00 |
Pos logit contributions | |
aber | +5.308 |
nl | +4.702 |
Causes | +4.276 |
[' | +4.261 |
owa | +4.227 |
Neg logit contributions | |
ught | -6.226 |
wick | -5.755 |
wives | -5.679 |
RG | -5.618 |
CLA | -5.541 |
Token | pale |
Token ID | 14005 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
aber | +6.163 |
nl | +5.606 |
gy | +5.165 |
Causes | +5.133 |
[' | +5.123 |
Neg logit contributions | |
ught | -6.456 |
wick | -6.017 |
wives | -5.873 |
CLA | -5.826 |
RG | -5.808 |
Token | locking |
Token ID | 48331 |
Feature activation | +8.47e+00 |
Pos logit contributions | |
aber | +7.709 |
nl | +7.174 |
Causes | +6.703 |
[' | +6.520 |
owa | +6.402 |
Neg logit contributions | |
ught | -7.272 |
wick | -6.418 |
CLA | -6.175 |
wives | -6.152 |
RG | -6.131 |
Token | intellectual |
Token ID | 9028 |
Feature activation | +3.98e+00 |
Pos logit contributions | |
aber | +5.865 |
nl | +5.376 |
Causes | +5.224 |
[' | +4.980 |
owa | +4.913 |
Neg logit contributions | |
ught | -6.095 |
wick | -5.711 |
CLA | -5.382 |
wives | -5.306 |
RG | -5.286 |
Token | , |
Token ID | 11 |
Feature activation | +6.55e+00 |
Pos logit contributions | |
aber | +2.998 |
nl | +2.742 |
Causes | +2.568 |
[' | +2.478 |
owa | +2.471 |
Neg logit contributions | |
ught | -2.805 |
wick | -2.642 |
wives | -2.469 |
RG | -2.456 |
CLA | -2.430 |
Token | legal |
Token ID | 2742 |
Feature activation | +6.88e+00 |
Pos logit contributions | |
aber | +4.651 |
nl | +4.305 |
Causes | +3.977 |
[' | +3.824 |
owa | +3.811 |
Neg logit contributions | |
ught | -4.822 |
wick | -4.539 |
wives | -4.227 |
CLA | -4.158 |
RG | -4.131 |
Token | and |
Token ID | 290 |
Feature activation | +7.19e+00 |
Pos logit contributions | |
aber | +4.208 |
nl | +3.749 |
Causes | +3.458 |
[' | +3.385 |
owa | +3.311 |
Neg logit contributions | |
ught | -5.687 |
wick | -5.399 |
CLA | -5.055 |
wives | -5.041 |
RG | -5.032 |
Token | political |
Token ID | 1964 |
Feature activation | +7.27e+00 |
Pos logit contributions | |
aber | +4.964 |
nl | +4.630 |
Causes | +4.251 |
[' | +4.126 |
owa | +4.075 |
Neg logit contributions | |
ught | -5.347 |
wick | -5.022 |
wives | -4.728 |
CLA | -4.638 |
riz | -4.583 |
Token | institutions |
Token ID | 6712 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
aber | +5.101 |
nl | +4.650 |
Causes | +4.459 |
[' | +4.256 |
owa | +4.207 |
Neg logit contributions | |
ught | -5.264 |
wick | -4.963 |
wives | -4.684 |
RG | -4.668 |
CLA | -4.594 |
Token | and |
Token ID | 290 |
Feature activation | +6.87e+00 |
Pos logit contributions | |
ught | +1.014 |
wick | +0.952 |
wives | +0.906 |
RG | +0.893 |
CLA | +0.883 |
Neg logit contributions | |
aber | -0.995 |
nl | -0.911 |
Causes | -0.849 |
owa | -0.811 |
[' | -0.810 |
Token | mobilized |
Token ID | 50166 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
aber | +4.739 |
nl | +4.416 |
Causes | +4.134 |
[' | +4.045 |
owa | +3.995 |
Neg logit contributions | |
ught | -4.996 |
wick | -4.702 |
CLA | -4.437 |
wives | -4.419 |
RG | -4.404 |
Token | every |
Token ID | 790 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
aber | +1.547 |
nl | +1.422 |
Causes | +1.324 |
[' | +1.282 |
owa | +1.270 |
Neg logit contributions | |
ught | -1.557 |
wick | -1.458 |
wives | -1.380 |
RG | -1.368 |
CLA | -1.358 |
Token | four |
Token ID | 1440 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
ught | +0.894 |
wick | +0.831 |
wives | +0.786 |
RG | +0.777 |
CLA | +0.767 |
Neg logit contributions | |
aber | -0.993 |
nl | -0.912 |
Causes | -0.855 |
[' | -0.821 |
owa | -0.820 |
Token | Mary |
Token ID | 5335 |
Feature activation | +6.48e-01 |
Pos logit contributions | |
ught | +1.900 |
wick | +1.790 |
wives | +1.698 |
RG | +1.673 |
CLA | +1.667 |
Neg logit contributions | |
aber | -1.808 |
nl | -1.652 |
Causes | -1.524 |
owa | -1.466 |
[' | -1.460 |
Token | Elizabeth |
Token ID | 10674 |
Feature activation | -4.27e+00 |
Pos logit contributions | |
aber | +0.453 |
nl | +0.410 |
Causes | +0.380 |
owa | +0.366 |
[' | +0.365 |
Neg logit contributions | |
ught | -0.497 |
wick | -0.466 |
wives | -0.444 |
RG | -0.440 |
CLA | -0.434 |
Token | Williams |
Token ID | 6484 |
Feature activation | -4.21e+00 |
Pos logit contributions | |
ught | +2.954 |
wick | +2.804 |
wives | +2.615 |
riz | +2.562 |
RG | +2.553 |
Neg logit contributions | |
aber | -3.262 |
nl | -2.999 |
Causes | -2.766 |
owa | -2.679 |
[' | -2.672 |
Token | did |
Token ID | 750 |
Feature activation | +3.76e-01 |
Pos logit contributions | |
ught | +3.009 |
wick | +2.839 |
wives | +2.658 |
RG | +2.631 |
CLA | +2.625 |
Neg logit contributions | |
aber | -3.087 |
nl | -2.851 |
Causes | -2.622 |
owa | -2.499 |
[' | -2.483 |
Token | tear |
Token ID | 11626 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
aber | +0.261 |
nl | +0.237 |
Causes | +0.220 |
[' | +0.211 |
owa | +0.210 |
Neg logit contributions | |
ught | -0.289 |
wick | -0.272 |
wives | -0.259 |
RG | -0.257 |
CLA | -0.254 |
Token | into |
Token ID | 656 |
Feature activation | -7.41e+00 |
Pos logit contributions | |
ught | +1.723 |
wick | +1.627 |
wives | +1.538 |
RG | +1.532 |
CLA | +1.512 |
Neg logit contributions | |
aber | -1.692 |
nl | -1.544 |
Causes | -1.435 |
[' | -1.373 |
owa | -1.373 |
Token | the |
Token ID | 262 |
Feature activation | -5.13e+00 |
Pos logit contributions | |
ught | +4.262 |
wick | +3.935 |
wives | +3.736 |
CLA | +3.652 |
RG | +3.646 |
Neg logit contributions | |
aber | -6.339 |
nl | -5.845 |
Causes | -5.351 |
owa | -5.263 |
[' | -5.177 |
Token | transgender |
Token ID | 10637 |
Feature activation | -3.80e-01 |
Pos logit contributions | |
ught | +3.561 |
wick | +3.306 |
wives | +3.149 |
RG | +3.091 |
CLA | +3.078 |
Neg logit contributions | |
aber | -3.879 |
nl | -3.580 |
Causes | -3.239 |
owa | -3.164 |
[' | -3.148 |
Token | analogy |
Token ID | 23970 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
ught | +0.258 |
wick | +0.241 |
wives | +0.227 |
RG | +0.225 |
CLA | +0.222 |
Neg logit contributions | |
aber | -0.297 |
nl | -0.274 |
Causes | -0.256 |
[' | -0.247 |
owa | -0.246 |
Token | in |
Token ID | 287 |
Feature activation | +8.36e+00 |
Pos logit contributions | |
ught | +2.339 |
wick | +2.176 |
wives | +2.074 |
RG | +2.036 |
CLA | +2.036 |
Neg logit contributions | |
aber | -2.494 |
nl | -2.298 |
Causes | -2.136 |
owa | -2.047 |
[' | -2.019 |
Token | 2015 |
Token ID | 1853 |
Feature activation | -6.28e+00 |
Pos logit contributions | |
aber | +5.355 |
nl | +4.940 |
Causes | +4.707 |
[' | +4.530 |
owa | +4.349 |
Neg logit contributions | |
ught | -6.331 |
wick | -6.007 |
wives | -5.814 |
RG | -5.683 |
elin | -5.595 |
Token | will |
Token ID | 481 |
Feature activation | -6.93e+00 |
Pos logit contributions | |
ught | +1.477 |
wick | +1.393 |
wives | +1.309 |
RG | +1.299 |
CLA | +1.293 |
Neg logit contributions | |
aber | -1.499 |
nl | -1.367 |
Causes | -1.267 |
owa | -1.221 |
[' | -1.217 |
Token | be |
Token ID | 307 |
Feature activation | -7.48e+00 |
Pos logit contributions | |
ught | +4.251 |
wick | +4.064 |
CLA | +3.705 |
wives | +3.658 |
RG | +3.656 |
Neg logit contributions | |
aber | -5.625 |
nl | -5.109 |
Causes | -4.880 |
[' | -4.705 |
owa | -4.645 |
Token | two |
Token ID | 734 |
Feature activation | -3.74e+00 |
Pos logit contributions | |
ught | +4.853 |
wick | +4.558 |
curved | +4.190 |
RG | +4.183 |
wives | +4.180 |
Neg logit contributions | |
aber | -5.914 |
nl | -5.247 |
Causes | -4.881 |
owa | -4.755 |
[' | -4.725 |
Token | clips |
Token ID | 19166 |
Feature activation | -3.13e+00 |
Pos logit contributions | |
ught | +2.608 |
wick | +2.415 |
wives | +2.285 |
RG | +2.251 |
CLA | +2.225 |
Neg logit contributions | |
aber | -2.879 |
nl | -2.588 |
Causes | -2.420 |
[' | -2.341 |
owa | -2.334 |
Token | on |
Token ID | 319 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
ught | +2.220 |
wick | +2.083 |
wives | +1.961 |
RG | +1.945 |
CLA | +1.926 |
Neg logit contributions | |
aber | -2.341 |
nl | -2.133 |
Causes | -2.008 |
owa | -1.927 |
[' | -1.917 |
Token | the |
Token ID | 262 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
ught | +1.339 |
wick | +1.251 |
wives | +1.176 |
RG | +1.167 |
CLA | +1.150 |
Neg logit contributions | |
aber | -1.560 |
nl | -1.429 |
Causes | -1.345 |
[' | -1.293 |
owa | -1.291 |
Token | front |
Token ID | 2166 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
ught | +1.877 |
wick | +1.751 |
wives | +1.637 |
RG | +1.635 |
riz | +1.612 |
Neg logit contributions | |
aber | -2.041 |
nl | -1.861 |
Causes | -1.745 |
[' | -1.684 |
owa | -1.682 |
Token | and |
Token ID | 290 |
Feature activation | +2.99e+00 |
Pos logit contributions | |
aber | +0.896 |
nl | +0.819 |
Causes | +0.758 |
[' | +0.730 |
owa | +0.727 |
Neg logit contributions | |
ught | -0.925 |
wick | -0.869 |
wives | -0.828 |
RG | -0.817 |
CLA | -0.809 |
Token | back |
Token ID | 736 |
Feature activation | -4.47e-01 |
Pos logit contributions | |
aber | +2.169 |
nl | +1.996 |
Causes | +1.836 |
[' | +1.779 |
owa | +1.766 |
Neg logit contributions | |
ught | -2.179 |
wick | -2.038 |
wives | -1.955 |
RG | -1.927 |
CLA | -1.905 |
Token | of |
Token ID | 286 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
ught | +0.333 |
wick | +0.313 |
wives | +0.297 |
RG | +0.295 |
CLA | +0.291 |
Neg logit contributions | |
aber | -0.320 |
nl | -0.292 |
Causes | -0.272 |
[' | -0.262 |
owa | -0.261 |
Token | the |
Token ID | 262 |
Feature activation | -2.66e+00 |
Pos logit contributions | |
ught | +2.368 |
wick | +2.223 |
RG | +2.081 |
wives | +2.079 |
riz | +2.042 |
Neg logit contributions | |
aber | -2.689 |
nl | -2.457 |
Causes | -2.321 |
owa | -2.238 |
[' | -2.230 |
Token | worlds |
Token ID | 11621 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
ught | +0.821 |
wick | +0.764 |
wives | +0.729 |
RG | +0.716 |
CLA | +0.707 |
Neg logit contributions | |
aber | -0.842 |
nl | -0.770 |
Causes | -0.714 |
[' | -0.692 |
owa | -0.689 |
Token | : |
Token ID | 25 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
ught | +0.115 |
wick | +0.108 |
wives | +0.103 |
RG | +0.102 |
CLA | +0.100 |
Neg logit contributions | |
aber | -0.106 |
nl | -0.096 |
Causes | -0.089 |
[' | -0.086 |
owa | -0.085 |
Token |
|
Token ID | 198 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
ught | +0.821 |
wick | +0.766 |
wives | +0.731 |
RG | +0.719 |
CLA | +0.710 |
Neg logit contributions | |
aber | -0.851 |
nl | -0.778 |
Causes | -0.725 |
[' | -0.700 |
owa | -0.697 |
Token |
|
Token ID | 198 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
aber | +0.281 |
nl | +0.258 |
Causes | +0.240 |
[' | +0.232 |
owa | +0.230 |
Neg logit contributions | |
ught | -0.274 |
wick | -0.256 |
wives | -0.243 |
RG | -0.241 |
CLA | -0.238 |
Token | how |
Token ID | 4919 |
Feature activation | -5.24e+00 |
Pos logit contributions | |
aber | +0.698 |
nl | +0.633 |
Causes | +0.577 |
[' | +0.558 |
owa | +0.554 |
Neg logit contributions | |
ught | -0.860 |
wick | -0.812 |
wives | -0.771 |
RG | -0.767 |
CLA | -0.760 |
Token | much |
Token ID | 881 |
Feature activation | -4.04e+00 |
Pos logit contributions | |
ught | +3.857 |
wick | +3.513 |
wives | +3.382 |
CLA | +3.295 |
RG | +3.280 |
Neg logit contributions | |
aber | -3.787 |
nl | -3.438 |
Causes | -3.222 |
[' | -3.100 |
owa | -3.066 |
Token | less |
Token ID | 1342 |
Feature activation | -7.40e+00 |
Pos logit contributions | |
ught | +2.942 |
wick | +2.679 |
wives | +2.574 |
CLA | +2.497 |
RG | +2.495 |
Neg logit contributions | |
aber | -3.017 |
nl | -2.700 |
Causes | -2.553 |
[' | -2.438 |
owa | -2.423 |
Token | for |
Token ID | 329 |
Feature activation | -3.03e+00 |
Pos logit contributions | |
ught | +5.191 |
wick | +4.627 |
wives | +4.464 |
RG | +4.338 |
CLA | +4.334 |
Neg logit contributions | |
aber | -5.541 |
nl | -5.007 |
Causes | -4.726 |
[' | -4.553 |
裏� | -4.467 |
Token | a |
Token ID | 257 |
Feature activation | -5.74e+00 |
Pos logit contributions | |
ught | +2.121 |
wick | +1.953 |
wives | +1.876 |
RG | +1.823 |
CLA | +1.801 |
Neg logit contributions | |
aber | -2.324 |
nl | -2.112 |
Causes | -1.979 |
[' | -1.918 |
owa | -1.898 |
Token | kingdom |
Token ID | 13239 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
ught | +4.310 |
wick | +3.850 |
wives | +3.709 |
elin | +3.576 |
RG | +3.575 |
Neg logit contributions | |
aber | -4.162 |
nl | -3.753 |
Causes | -3.553 |
[' | -3.391 |
owa | -3.335 |
Token | of |
Token ID | 286 |
Feature activation | -3.06e+00 |
Pos logit contributions | |
aber | +2.354 |
nl | +2.139 |
Causes | +1.970 |
[' | +1.916 |
owa | +1.900 |
Neg logit contributions | |
ught | -2.716 |
wick | -2.586 |
RG | -2.465 |
wives | -2.430 |
riz | -2.429 |
Token | , |
Token ID | 11 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
aber | +3.674 |
nl | +3.356 |
Causes | +3.008 |
[' | +2.930 |
owa | +2.912 |
Neg logit contributions | |
ught | -4.851 |
wick | -4.584 |
wives | -4.422 |
RG | -4.369 |
CLA | -4.351 |
Token | says |
Token ID | 1139 |
Feature activation | +2.26e+00 |
Pos logit contributions | |
ught | +1.051 |
wick | +0.984 |
wives | +0.932 |
RG | +0.923 |
CLA | +0.914 |
Neg logit contributions | |
aber | -1.041 |
nl | -0.952 |
Causes | -0.883 |
[' | -0.849 |
owa | -0.848 |
Token | that |
Token ID | 326 |
Feature activation | -9.57e-01 |
Pos logit contributions | |
aber | +1.606 |
nl | +1.470 |
Causes | +1.366 |
[' | +1.326 |
owa | +1.310 |
Neg logit contributions | |
ught | -1.682 |
wick | -1.580 |
wives | -1.506 |
RG | -1.482 |
CLA | -1.466 |
Token | the |
Token ID | 262 |
Feature activation | -3.11e+00 |
Pos logit contributions | |
ught | +0.696 |
wick | +0.652 |
wives | +0.618 |
RG | +0.613 |
CLA | +0.605 |
Neg logit contributions | |
aber | -0.704 |
nl | -0.644 |
Causes | -0.598 |
[' | -0.574 |
owa | -0.574 |
Token | J |
Token ID | 449 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
ught | +2.125 |
wick | +1.986 |
wives | +1.872 |
RG | +1.854 |
riz | +1.830 |
Neg logit contributions | |
aber | -2.406 |
nl | -2.219 |
Causes | -2.045 |
[' | -1.975 |
owa | -1.973 |
Token | H |
Token ID | 39 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
ught | +1.193 |
wick | +1.129 |
wives | +1.074 |
RG | +1.070 |
CLA | +1.058 |
Neg logit contributions | |
aber | -0.939 |
nl | -0.851 |
Causes | -0.785 |
[' | -0.745 |
owa | -0.743 |
Token | 15 |
Token ID | 1314 |
Feature activation | -6.33e+00 |
Pos logit contributions | |
ught | +3.205 |
wick | +3.085 |
wives | +2.932 |
RG | +2.912 |
CLA | +2.884 |
Neg logit contributions | |
aber | -2.749 |
nl | -2.525 |
Causes | -2.291 |
owa | -2.196 |
[' | -2.137 |
Token | mission |
Token ID | 4365 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
ught | +4.227 |
wick | +3.991 |
RG | +3.782 |
wives | +3.751 |
CLA | +3.704 |
Neg logit contributions | |
aber | -4.782 |
nl | -4.383 |
Causes | -4.087 |
[' | -3.897 |
owa | -3.885 |
Token | objectives |
Token ID | 15221 |
Feature activation | +8.97e-02 |
Pos logit contributions | |
ught | +0.960 |
wick | +0.904 |
wives | +0.861 |
RG | +0.846 |
CLA | +0.839 |
Neg logit contributions | |
aber | -0.930 |
nl | -0.845 |
Causes | -0.787 |
[' | -0.752 |
owa | -0.751 |
Token | may |
Token ID | 743 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
aber | +0.064 |
nl | +0.059 |
Causes | +0.055 |
[' | +0.052 |
owa | +0.052 |
Neg logit contributions | |
ught | -0.067 |
wick | -0.063 |
wives | -0.060 |
RG | -0.059 |
CLA | -0.058 |
Token | go |
Token ID | 467 |
Feature activation | -4.59e+00 |
Pos logit contributions | |
ught | +1.609 |
wick | +1.498 |
wives | +1.412 |
RG | +1.388 |
CLA | +1.385 |
Neg logit contributions | |
aber | -1.748 |
nl | -1.610 |
Causes | -1.516 |
owa | -1.442 |
[' | -1.436 |
Token | v |
Token ID | 85 |
Feature activation | +9.19e+00 |
Pos logit contributions | |
ught | +0.417 |
wick | +0.385 |
wives | +0.359 |
RG | +0.355 |
CLA | +0.349 |
Neg logit contributions | |
aber | -0.635 |
nl | -0.590 |
Causes | -0.558 |
[' | -0.539 |
owa | -0.539 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
aber | +4.137 |
nl | +3.945 |
[' | +3.505 |
xe | +2.981 |
gy | +2.951 |
Neg logit contributions | |
ught | -8.778 |
tradem | -8.497 |
wick | -8.205 |
wives | -8.061 |
ewitness | -7.922 |
Token | . |
Token ID | 13 |
Feature activation | -5.25e-02 |
Pos logit contributions | |
nl | +5.337 |
aber | +5.296 |
[' | +5.237 |
xe | +3.980 |
gy | +3.929 |
Neg logit contributions | |
tradem | -13.007 |
ught | -12.358 |
ewitness | -11.596 |
agos | -11.385 |
wick | -11.319 |
Token | get |
Token ID | 1136 |
Feature activation | -3.99e+00 |
Pos logit contributions | |
ught | +0.043 |
wick | +0.041 |
wives | +0.039 |
RG | +0.039 |
CLA | +0.038 |
Neg logit contributions | |
aber | -0.033 |
nl | -0.030 |
Causes | -0.028 |
[' | -0.026 |
owa | -0.026 |
Token | Struct |
Token ID | 44909 |
Feature activation | -9.38e+00 |
Pos logit contributions | |
ught | +2.908 |
wick | +2.779 |
RG | +2.718 |
wives | +2.616 |
CLA | +2.602 |
Neg logit contributions | |
aber | -2.877 |
nl | -2.555 |
Causes | -2.440 |
owa | -2.326 |
[' | -2.247 |
Token | uring |
Token ID | 870 |
Feature activation | -2.79e+00 |
Pos logit contributions | |
ught | +3.313 |
wick | +3.028 |
RG | +2.802 |
riz | +2.693 |
wives | +2.626 |
Neg logit contributions | |
aber | -9.795 |
nl | -9.149 |
Causes | -8.932 |
裏� | -8.707 |
owa | -8.663 |
Token | Element |
Token ID | 20180 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
ught | +2.025 |
wick | +1.927 |
RG | +1.851 |
wives | +1.811 |
CLA | +1.804 |
Neg logit contributions | |
aber | -2.031 |
nl | -1.822 |
Causes | -1.713 |
owa | -1.676 |
[' | -1.605 |
Token | ( |
Token ID | 7 |
Feature activation | -2.44e+00 |
Pos logit contributions | |
aber | +1.106 |
nl | +0.987 |
Causes | +0.871 |
[' | +0.855 |
owa | +0.813 |
Neg logit contributions | |
ught | -1.985 |
wick | -1.867 |
wives | -1.801 |
elin | -1.769 |
RG | -1.763 |
Token | cv |
Token ID | 33967 |
Feature activation | +9.96e+00 |
Pos logit contributions | |
ught | +1.716 |
wick | +1.619 |
RG | +1.521 |
wives | +1.512 |
CLA | +1.490 |
Neg logit contributions | |
aber | -1.841 |
nl | -1.674 |
Causes | -1.592 |
owa | -1.525 |
[' | -1.502 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
aber | +4.202 |
nl | +4.159 |
[' | +3.713 |
de | +3.100 |
xe | +3.040 |
Neg logit contributions | |
tradem | -9.749 |
ught | -9.665 |
wick | -9.001 |
wives | -8.880 |
ewitness | -8.843 |
Token | . |
Token ID | 13 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
nl | +5.341 |
aber | +5.123 |
[' | +5.089 |
de | +3.949 |
EE | +3.948 |
Neg logit contributions | |
tradem | -13.510 |
ught | -12.576 |
ewitness | -11.889 |
agos | -11.622 |
elin | -11.478 |
Token | at |
Token ID | 379 |
Feature activation | -9.45e+00 |
Pos logit contributions | |
ught | +5.281 |
wick | +5.025 |
RG | +4.705 |
wives | +4.670 |
CLA | +4.611 |
Neg logit contributions | |
aber | -5.515 |
nl | -5.086 |
Causes | -4.680 |
owa | -4.563 |
[' | -4.460 |
Token | least |
Token ID | 1551 |
Feature activation | -9.51e+00 |
Pos logit contributions | |
ught | +5.374 |
wick | +5.068 |
RG | +4.594 |
riz | +4.558 |
CLA | +4.470 |
Neg logit contributions | |
aber | -7.814 |
nl | -7.488 |
Causes | -6.801 |
owa | -6.691 |
[' | -6.681 |
Token | 25 |
Token ID | 1679 |
Feature activation | -7.36e+00 |
Pos logit contributions | |
ught | +6.564 |
wick | +6.263 |
RG | +5.876 |
CLA | +5.754 |
wives | +5.753 |
Neg logit contributions | |
aber | -6.633 |
nl | -6.199 |
Causes | -5.608 |
owa | -5.486 |
裏� | -5.478 |
Token | Fantasy |
Token ID | 10982 |
Feature activation | -3.91e+00 |
Pos logit contributions | |
ught | +4.155 |
wick | +4.002 |
RG | +3.688 |
CLA | +3.624 |
wives | +3.607 |
Neg logit contributions | |
aber | -6.266 |
nl | -5.880 |
Causes | -5.463 |
owa | -5.320 |
[' | -5.289 |
Token | points |
Token ID | 2173 |
Feature activation | -4.94e+00 |
Pos logit contributions | |
ught | +1.935 |
wick | +1.782 |
wives | +1.651 |
RG | +1.612 |
CLA | +1.571 |
Neg logit contributions | |
aber | -3.736 |
nl | -3.515 |
Causes | -3.323 |
owa | -3.234 |
[' | -3.190 |
Token | in |
Token ID | 287 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
ught | +3.378 |
wick | +3.178 |
wives | +2.953 |
CLA | +2.920 |
RG | +2.913 |
Neg logit contributions | |
aber | -3.758 |
nl | -3.490 |
Causes | -3.277 |
owa | -3.119 |
[' | -3.068 |
Token | two |
Token ID | 734 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
ught | +8.541 |
wick | +8.165 |
RG | +7.479 |
curved | +7.304 |
elin | +7.278 |
Neg logit contributions | |
aber | -10.924 |
nl | -9.846 |
Causes | -9.113 |
裏� | -8.908 |
owa | -8.886 |
Token | of |
Token ID | 286 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
ught | +6.658 |
wick | +6.255 |
RG | +5.699 |
wives | +5.656 |
curved | +5.627 |
Neg logit contributions | |
aber | -9.296 |
nl | -8.468 |
Causes | -8.013 |
[' | -7.633 |
裏� | -7.558 |
Token | his |
Token ID | 465 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
ught | +6.200 |
wick | +5.777 |
RG | +5.353 |
wives | +5.298 |
riz | +5.170 |
Neg logit contributions | |
aber | -9.162 |
nl | -8.466 |
Causes | -7.849 |
owa | -7.596 |
[' | -7.586 |
Token | past |
Token ID | 1613 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
ught | +4.983 |
wick | +4.660 |
RG | +4.153 |
elin | +4.136 |
wives | +4.102 |
Neg logit contributions | |
aber | -9.708 |
nl | -8.861 |
Causes | -8.235 |
[' | -8.031 |
裏� | -8.017 |
Token | three |
Token ID | 1115 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
ught | +6.992 |
wick | +6.561 |
wives | +6.312 |
elin | +6.248 |
curved | +6.158 |
Neg logit contributions | |
aber | -7.890 |
nl | -7.126 |
Causes | -6.425 |
裏� | -6.284 |
owa | -6.201 |
Token | and |
Token ID | 290 |
Feature activation | -4.70e+00 |
Pos logit contributions | |
ught | +1.583 |
wick | +1.485 |
wives | +1.409 |
RG | +1.397 |
CLA | +1.371 |
Neg logit contributions | |
aber | -1.680 |
nl | -1.536 |
Causes | -1.434 |
owa | -1.382 |
[' | -1.378 |
Token | Snap |
Token ID | 16026 |
Feature activation | -5.61e+00 |
Pos logit contributions | |
ught | +2.339 |
wick | +2.181 |
RG | +1.935 |
wives | +1.930 |
riz | +1.905 |
Neg logit contributions | |
aber | -4.469 |
nl | -4.174 |
Causes | -3.905 |
owa | -3.834 |
[' | -3.829 |
Token | also |
Token ID | 635 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
ught | +3.904 |
wick | +3.686 |
wives | +3.462 |
RG | +3.410 |
riz | +3.353 |
Neg logit contributions | |
aber | -4.143 |
nl | -3.842 |
Causes | -3.555 |
owa | -3.418 |
[' | -3.378 |
Token | claim |
Token ID | 1624 |
Feature activation | -4.69e+00 |
Pos logit contributions | |
ught | +1.338 |
wick | +1.250 |
wives | +1.182 |
RG | +1.165 |
riz | +1.151 |
Neg logit contributions | |
aber | -1.304 |
nl | -1.190 |
Causes | -1.098 |
owa | -1.058 |
[' | -1.053 |
Token | to |
Token ID | 284 |
Feature activation | -9.90e+00 |
Pos logit contributions | |
ught | +3.228 |
wick | +3.018 |
wives | +2.823 |
riz | +2.802 |
RG | +2.797 |
Neg logit contributions | |
aber | -3.561 |
nl | -3.276 |
Causes | -3.048 |
[' | -2.946 |
owa | -2.944 |
Token | be |
Token ID | 307 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
ught | +6.602 |
wick | +6.052 |
elin | +5.543 |
wives | +5.506 |
curved | +5.459 |
Neg logit contributions | |
aber | -7.443 |
nl | -6.789 |
Causes | -6.348 |
owa | -6.177 |
裏� | -6.154 |
Token | ( |
Token ID | 357 |
Feature activation | -3.27e+00 |
Pos logit contributions | |
ught | +9.033 |
wick | +8.555 |
Certified | +8.086 |
wives | +8.045 |
curved | +8.004 |
Neg logit contributions | |
aber | -11.255 |
nl | -10.142 |
[' | -9.432 |
Causes | -9.353 |
裏� | -9.351 |
Token | in |
Token ID | 259 |
Feature activation | -3.91e+00 |
Pos logit contributions | |
ught | +2.456 |
wick | +2.315 |
wives | +2.208 |
RG | +2.190 |
CLA | +2.152 |
Neg logit contributions | |
aber | -2.274 |
nl | -2.074 |
Causes | -1.978 |
owa | -1.875 |
[' | -1.873 |
Token | theory |
Token ID | 4583 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
ught | +2.728 |
wick | +2.539 |
wives | +2.419 |
RG | +2.382 |
CLA | +2.362 |
Neg logit contributions | |
aber | -2.909 |
nl | -2.660 |
Causes | -2.489 |
[' | -2.443 |
owa | -2.422 |
Token | at |
Token ID | 379 |
Feature activation | +2.31e+00 |
Pos logit contributions | |
aber | +0.793 |
nl | +0.713 |
Causes | +0.652 |
[' | +0.625 |
owa | +0.621 |
Neg logit contributions | |
ught | -1.066 |
wick | -1.011 |
wives | -0.964 |
RG | -0.957 |
CLA | -0.947 |
Token | least |
Token ID | 1551 |
Feature activation | -6.20e+00 |
Pos logit contributions | |
aber | +1.660 |
nl | +1.519 |
Causes | +1.412 |
[' | +1.356 |
owa | +1.339 |
Neg logit contributions | |
ught | -1.713 |
wick | -1.610 |
wives | -1.534 |
RG | -1.519 |
CLA | -1.501 |
Token | take |
Token ID | 1011 |
Feature activation | -6.24e+00 |
Pos logit contributions | |
ught | +3.429 |
wick | +3.234 |
wives | +2.979 |
RG | +2.961 |
CLA | +2.950 |
Neg logit contributions | |
aber | -3.719 |
nl | -3.379 |
Causes | -3.145 |
owa | -2.992 |
裏� | -2.986 |
Token | the |
Token ID | 262 |
Feature activation | -7.10e+00 |
Pos logit contributions | |
ught | +4.055 |
wick | +3.803 |
wives | +3.577 |
RG | +3.520 |
elin | +3.501 |
Neg logit contributions | |
aber | -4.925 |
nl | -4.462 |
Causes | -4.196 |
owa | -4.001 |
[' | -3.989 |
Token | string |
Token ID | 4731 |
Feature activation | -4.14e+00 |
Pos logit contributions | |
ught | +4.874 |
wick | +4.580 |
elin | +4.267 |
wives | +4.260 |
RG | +4.226 |
Neg logit contributions | |
aber | -5.362 |
nl | -4.853 |
Causes | -4.471 |
[' | -4.308 |
owa | -4.269 |
Token | and |
Token ID | 290 |
Feature activation | -2.39e+00 |
Pos logit contributions | |
ught | +3.028 |
wick | +2.872 |
wives | +2.711 |
RG | +2.669 |
elin | +2.648 |
Neg logit contributions | |
aber | -3.005 |
nl | -2.700 |
Causes | -2.537 |
owa | -2.412 |
[' | -2.404 |
Token | go |
Token ID | 467 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
ught | +1.658 |
wick | +1.548 |
wives | +1.452 |
RG | +1.443 |
CLA | +1.424 |
Neg logit contributions | |
aber | -1.846 |
nl | -1.681 |
Causes | -1.570 |
owa | -1.507 |
[' | -1.506 |
Token | around |
Token ID | 1088 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
aber | +3.368 |
nl | +3.130 |
Causes | +2.879 |
owa | +2.799 |
[' | +2.797 |
Neg logit contributions | |
ught | -3.719 |
wick | -3.462 |
wives | -3.348 |
RG | -3.285 |
CLA | -3.277 |
Token | and |
Token ID | 290 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
ught | +7.654 |
wick | +7.341 |
curved | +6.792 |
wives | +6.606 |
elin | +6.473 |
Neg logit contributions | |
aber | -11.670 |
nl | -10.155 |
Causes | -9.588 |
owa | -9.500 |
裏� | -9.339 |
Token | around |
Token ID | 1088 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
ught | +1.318 |
wick | +1.233 |
wives | +1.158 |
RG | +1.148 |
CLA | +1.133 |
Neg logit contributions | |
aber | -1.460 |
nl | -1.329 |
Causes | -1.245 |
[' | -1.195 |
owa | -1.195 |
Token | the |
Token ID | 262 |
Feature activation | -6.00e+00 |
Pos logit contributions | |
ught | +6.714 |
wick | +6.347 |
curved | +5.820 |
wives | +5.789 |
RG | +5.619 |
Neg logit contributions | |
aber | -9.300 |
nl | -8.127 |
Causes | -7.655 |
owa | -7.595 |
裏� | -7.421 |
Token | edge |
Token ID | 5743 |
Feature activation | -8.73e+00 |
Pos logit contributions | |
ught | +4.204 |
wick | +3.975 |
wives | +3.699 |
elin | +3.657 |
curved | +3.655 |
Neg logit contributions | |
aber | -4.548 |
nl | -4.053 |
Causes | -3.769 |
owa | -3.623 |
[' | -3.610 |
Token | . |
Token ID | 13 |
Feature activation | -5.96e+00 |
Pos logit contributions | |
ught | +5.687 |
wick | +5.339 |
wives | +4.933 |
curved | +4.840 |
CLA | +4.832 |
Neg logit contributions | |
aber | -6.805 |
nl | -6.077 |
Causes | -5.813 |
owa | -5.565 |
裏� | -5.463 |
Token | x |
Token ID | 2124 |
Feature activation | -4.06e+00 |
Pos logit contributions | |
ught | +1.546 |
wick | +1.470 |
wives | +1.392 |
RG | +1.389 |
CLA | +1.369 |
Neg logit contributions | |
aber | -1.276 |
nl | -1.147 |
Causes | -1.052 |
owa | -1.018 |
[' | -1.001 |
Token | . |
Token ID | 13 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
ught | +2.935 |
wick | +2.826 |
RG | +2.651 |
wives | +2.647 |
CLA | +2.596 |
Neg logit contributions | |
aber | -2.942 |
nl | -2.609 |
Causes | -2.527 |
owa | -2.432 |
裏� | -2.344 |
Token | x |
Token ID | 87 |
Feature activation | -3.60e+00 |
Pos logit contributions | |
aber | +0.759 |
nl | +0.623 |
[' | +0.454 |
Causes | +0.449 |
xe | +0.392 |
Neg logit contributions | |
ught | -2.969 |
wick | -2.824 |
wives | -2.750 |
CLA | -2.732 |
RG | -2.729 |
Token | . |
Token ID | 13 |
Feature activation | -3.20e+00 |
Pos logit contributions | |
ught | +2.635 |
wick | +2.529 |
wives | +2.373 |
RG | +2.366 |
CLA | +2.319 |
Neg logit contributions | |
aber | -2.583 |
nl | -2.297 |
Causes | -2.220 |
owa | -2.126 |
裏� | -2.059 |
Token | x |
Token ID | 87 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
ught | +3.439 |
wick | +3.328 |
wives | +3.194 |
RG | +3.181 |
riz | +3.144 |
Neg logit contributions | |
aber | -1.212 |
nl | -0.984 |
Causes | -0.913 |
owa | -0.817 |
裏� | -0.750 |
Token | . |
Token ID | 13 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
ught | +7.927 |
wick | +7.788 |
RG | +7.315 |
CLA | +7.120 |
wives | +6.939 |
Neg logit contributions | |
aber | -12.514 |
vertisement | -12.177 |
� | -11.735 |
enthusi | -11.454 |
cryst | -11.454 |
Token | 127 |
Token ID | 16799 |
Feature activation | -5.18e+00 |
Pos logit contributions | |
ught | +7.611 |
wick | +6.502 |
CLA | +6.471 |
wives | +6.389 |
riz | +6.302 |
Neg logit contributions | |
aber | -13.178 |
Causes | -12.058 |
nl | -11.637 |
裏� | -11.503 |
vertisement | -11.397 |
Token | 98 |
Token ID | 9661 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
ught | +3.442 |
wick | +3.337 |
wives | +3.109 |
RG | +3.074 |
CLA | +3.017 |
Neg logit contributions | |
aber | -4.018 |
nl | -3.586 |
Causes | -3.325 |
owa | -3.270 |
[' | -3.235 |
Token | 59 |
Token ID | 3270 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
aber | +0.011 |
nl | +0.010 |
Causes | +0.009 |
owa | +0.009 |
[' | +0.009 |
Neg logit contributions | |
ught | -0.015 |
wick | -0.014 |
wives | -0.013 |
RG | -0.013 |
CLA | -0.013 |
Token | 64 |
Token ID | 2414 |
Feature activation | -4.72e+00 |
Pos logit contributions | |
ught | +1.730 |
wick | +1.658 |
RG | +1.575 |
wives | +1.569 |
CLA | +1.549 |
Neg logit contributions | |
aber | -1.496 |
nl | -1.339 |
Causes | -1.248 |
owa | -1.206 |
[' | -1.178 |
Token | x |
Token ID | 2124 |
Feature activation | -4.04e+00 |
Pos logit contributions | |
ught | +3.560 |
wick | +3.395 |
RG | +3.201 |
wives | +3.173 |
CLA | +3.155 |
Neg logit contributions | |
aber | -3.258 |
nl | -2.920 |
Causes | -2.680 |
owa | -2.635 |
[' | -2.559 |
Token | open |
Token ID | 1280 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
ught | +6.341 |
wick | +5.743 |
curved | +5.327 |
CLA | +5.242 |
elin | +5.224 |
Neg logit contributions | |
aber | -8.293 |
nl | -7.595 |
Causes | -7.328 |
裏� | -7.185 |
Customer | -6.671 |
Token | my |
Token ID | 616 |
Feature activation | -4.04e+00 |
Pos logit contributions | |
ught | +3.168 |
wick | +2.972 |
RG | +2.804 |
wives | +2.787 |
elin | +2.744 |
Neg logit contributions | |
aber | -3.710 |
nl | -3.378 |
Causes | -3.199 |
owa | -3.016 |
[' | -3.004 |
Token | mouth |
Token ID | 5422 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
ught | +2.063 |
wick | +1.828 |
RG | +1.722 |
wives | +1.705 |
riz | +1.686 |
Neg logit contributions | |
aber | -3.864 |
nl | -3.555 |
Causes | -3.407 |
owa | -3.246 |
[' | -3.244 |
Token | and |
Token ID | 290 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
ught | +6.550 |
wick | +6.238 |
CLA | +5.684 |
curved | +5.648 |
wives | +5.586 |
Neg logit contributions | |
aber | -8.905 |
nl | -8.169 |
Causes | -7.938 |
裏� | -7.308 |
Customer | -7.280 |
Token | her |
Token ID | 607 |
Feature activation | -9.00e+00 |
Pos logit contributions | |
ught | +7.045 |
wick | +6.389 |
wives | +6.068 |
CLA | +6.051 |
RG | +5.975 |
Neg logit contributions | |
aber | -9.108 |
nl | -8.067 |
Causes | -7.782 |
裏� | -7.461 |
tool | -7.120 |
Token | tongue |
Token ID | 11880 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
ught | +5.669 |
wick | +5.104 |
curved | +4.827 |
wives | +4.794 |
elin | +4.778 |
Neg logit contributions | |
aber | -7.349 |
nl | -6.493 |
Causes | -6.297 |
裏� | -6.091 |
owa | -5.841 |
Token | sl |
Token ID | 1017 |
Feature activation | -8.83e+00 |
Pos logit contributions | |
ught | +8.449 |
wick | +7.631 |
curved | +7.569 |
wives | +7.238 |
curves | +6.959 |
Neg logit contributions | |
aber | -10.803 |
nl | -10.030 |
Causes | -9.231 |
裏� | -9.208 |
OTAL | -8.896 |
Token | ither |
Token ID | 1555 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
ught | +6.716 |
wick | +6.266 |
wives | +5.821 |
riz | +5.668 |
unker | +5.618 |
Neg logit contributions | |
aber | -5.795 |
nl | -5.386 |
Causes | -5.296 |
裏� | -5.264 |
[' | -4.879 |
Token | s |
Token ID | 82 |
Feature activation | -5.88e+00 |
Pos logit contributions | |
ught | +1.277 |
wick | +1.211 |
wives | +1.151 |
RG | +1.134 |
CLA | +1.126 |
Neg logit contributions | |
aber | -0.975 |
nl | -0.878 |
Causes | -0.809 |
[' | -0.767 |
owa | -0.766 |
Token | into |
Token ID | 656 |
Feature activation | -3.42e+00 |
Pos logit contributions | |
ught | +4.097 |
wick | +3.832 |
wives | +3.548 |
curved | +3.519 |
CLA | +3.464 |
Neg logit contributions | |
aber | -4.382 |
nl | -4.038 |
Causes | -3.819 |
owa | -3.606 |
裏� | -3.561 |
Token | mine |
Token ID | 6164 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
ught | +2.226 |
wick | +2.095 |
wives | +1.959 |
RG | +1.940 |
elin | +1.907 |
Neg logit contributions | |
aber | -2.763 |
nl | -2.533 |
Causes | -2.389 |
owa | -2.291 |
[' | -2.263 |