Token | at |
Token ID | 379 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
�� | +2.528 |
ゼ | +2.455 |
dos | +2.445 |
eeper | +2.380 |
verting | +2.360 |
Neg logit contributions | |
Honour | -2.639 |
emin | -2.474 |
MENT | -2.389 |
acceptance | -2.364 |
ODY | -2.359 |
Token | least |
Token ID | 1551 |
Feature activation | +5.04e-01 |
Pos logit contributions | |
Honour | +2.734 |
emin | +2.579 |
acceptance | +2.548 |
MENT | +2.470 |
ODY | +2.440 |
Neg logit contributions | |
�� | -1.934 |
ゼ | -1.835 |
verting | -1.707 |
dos | -1.685 |
eeper | -1.640 |
Token | one |
Token ID | 530 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
Honour | +2.075 |
emin | +1.899 |
acceptance | +1.830 |
MENT | +1.770 |
ODY | +1.709 |
Neg logit contributions | |
�� | -4.905 |
ゼ | -4.749 |
dos | -4.693 |
verting | -4.618 |
eeper | -4.570 |
Token | blank |
Token ID | 9178 |
Feature activation | +7.57e-01 |
Pos logit contributions | |
�� | +0.734 |
ゼ | +0.709 |
dos | +0.699 |
eeper | +0.676 |
verting | +0.674 |
Neg logit contributions | |
Honour | -1.041 |
emin | -0.990 |
acceptance | -0.954 |
MENT | -0.953 |
ODY | -0.947 |
Token | character |
Token ID | 2095 |
Feature activation | +7.30e-01 |
Pos logit contributions | |
Honour | +4.734 |
emin | +4.614 |
acceptance | +4.469 |
MENT | +4.292 |
Expression | +4.279 |
Neg logit contributions | |
�� | -5.585 |
ゼ | -5.437 |
dos | -5.339 |
eeper | -5.135 |
verting | -5.078 |
Token | (< |
Token ID | 38155 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
Honour | +3.756 |
emin | +3.578 |
acceptance | +3.376 |
ODY | +3.307 |
Expression | +3.239 |
Neg logit contributions | |
�� | -6.158 |
ゼ | -6.073 |
dos | -5.864 |
verting | -5.775 |
eeper | -5.606 |
Token | Space |
Token ID | 14106 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
emin | +7.655 |
Honour | +7.541 |
MENT | +7.280 |
Expression | +6.761 |
ODY | +6.621 |
Neg logit contributions | |
�� | -14.199 |
eeper | -13.394 |
arthed | -13.048 |
ゼ | -13.014 |
verting | -12.901 |
Token | > |
Token ID | 29 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
Honour | +1.097 |
emin | +1.056 |
acceptance | +1.008 |
MENT | +1.005 |
ODY | +0.991 |
Neg logit contributions | |
�� | -0.917 |
ゼ | -0.867 |
dos | -0.834 |
eeper | -0.823 |
verting | -0.820 |
Token | or |
Token ID | 393 |
Feature activation | +7.59e-01 |
Pos logit contributions | |
Honour | +3.708 |
emin | +3.291 |
acceptance | +3.111 |
MENT | +2.917 |
ODY | +2.912 |
Neg logit contributions | |
�� | -10.015 |
ゼ | -9.514 |
verting | -9.328 |
dos | -9.310 |
eeper | -9.176 |
Token | < |
Token ID | 1279 |
Feature activation | +9.72e-01 |
Pos logit contributions | |
Honour | +3.561 |
emin | +3.176 |
acceptance | +3.026 |
Expression | +3.012 |
MENT | +2.930 |
Neg logit contributions | |
�� | -7.164 |
ゼ | -6.853 |
dos | -6.622 |
eeper | -6.593 |
verting | -6.550 |
Token | Tab |
Token ID | 33349 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
Honour | +3.551 |
emin | +3.362 |
MENT | +3.328 |
WATCH | +3.125 |
OPS | +3.117 |
Neg logit contributions | |
�� | -9.750 |
eeper | -9.195 |
verting | -8.960 |
olulu | -8.953 |
ゼ | -8.907 |
Token | 20 |
Token ID | 1238 |
Feature activation | +6.65e-01 |
Pos logit contributions | |
Honour | +1.438 |
emin | +1.361 |
MENT | +1.306 |
ODY | +1.296 |
acceptance | +1.287 |
Neg logit contributions | |
�� | -1.465 |
ゼ | -1.380 |
dos | -1.357 |
eeper | -1.341 |
verting | -1.329 |
Token | z |
Token ID | 89 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
Honour | +3.875 |
emin | +3.655 |
ODY | +3.497 |
MENT | +3.487 |
acceptance | +3.459 |
Neg logit contributions | |
�� | -5.249 |
ゼ | -4.953 |
eeper | -4.879 |
verting | -4.846 |
dos | -4.831 |
Token | BLACK |
Token ID | 31963 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
Honour | +1.510 |
emin | +1.358 |
MENT | +1.323 |
ODY | +1.312 |
acceptance | +1.293 |
Neg logit contributions | |
�� | -2.343 |
ゼ | -2.266 |
dos | -2.243 |
eeper | -2.220 |
verting | -2.203 |
Token | FO |
Token ID | 6080 |
Feature activation | -8.21e-02 |
Pos logit contributions | |
Honour | +1.589 |
emin | +1.496 |
MENT | +1.458 |
ODY | +1.442 |
acceptance | +1.430 |
Neg logit contributions | |
�� | -1.714 |
ゼ | -1.659 |
dos | -1.645 |
verting | -1.605 |
eeper | -1.603 |
Token | OT |
Token ID | 2394 |
Feature activation | +5.11e-01 |
Pos logit contributions | |
�� | +0.645 |
ゼ | +0.627 |
dos | +0.622 |
eeper | +0.609 |
verting | +0.608 |
Neg logit contributions | |
Honour | -0.499 |
emin | -0.465 |
MENT | -0.445 |
ODY | -0.444 |
acceptance | -0.441 |
Token | T |
Token ID | 309 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
Honour | +2.903 |
emin | +2.621 |
MENT | +2.606 |
ODY | +2.593 |
OPS | +2.545 |
Neg logit contributions | |
�� | -4.223 |
ゼ | -4.098 |
dos | -3.994 |
eeper | -3.983 |
verting | -3.934 |
Token | OC |
Token ID | 4503 |
Feature activation | +8.87e-01 |
Pos logit contributions | |
OC | +4.467 |
OPS | +4.262 |
ODY | +4.065 |
ONY | +3.722 |
MENT | +3.572 |
Neg logit contributions | |
�� | -18.710 |
verting | -17.583 |
olulu | -17.402 |
eeper | -17.356 |
dos | -17.133 |
Token | NOT |
Token ID | 5626 |
Feature activation | +4.29e-01 |
Pos logit contributions | |
Honour | +4.409 |
MENT | +3.985 |
ODY | +3.969 |
OPS | +3.892 |
acceptance | +3.808 |
Neg logit contributions | |
�� | -7.841 |
ゼ | -7.487 |
dos | -7.407 |
eeper | -7.340 |
verting | -7.215 |
Token | IFIED |
Token ID | 28343 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
Honour | +3.108 |
emin | +2.919 |
ODY | +2.917 |
MENT | +2.898 |
OPS | +2.861 |
Neg logit contributions | |
�� | -2.883 |
ゼ | -2.770 |
dos | -2.712 |
eeper | -2.667 |
verting | -2.648 |
Token | 1 |
Token ID | 352 |
Feature activation | +3.23e-01 |
Pos logit contributions | |
�� | +1.122 |
ゼ | +1.094 |
dos | +1.082 |
eeper | +1.057 |
verting | +1.054 |
Neg logit contributions | |
Honour | -0.908 |
emin | -0.849 |
acceptance | -0.808 |
MENT | -0.807 |
ODY | -0.800 |
Token | GER |
Token ID | 44186 |
Feature activation | +2.00e-01 |
Pos logit contributions | |
Honour | +2.019 |
emin | +1.887 |
MENT | +1.837 |
ODY | +1.834 |
OPS | +1.796 |
Neg logit contributions | |
�� | -2.458 |
ゼ | -2.379 |
dos | -2.340 |
eeper | -2.320 |
verting | -2.301 |
Token | v |
Token ID | 85 |
Feature activation | +2.00e-01 |
Pos logit contributions | |
Honour | +2.075 |
emin | +2.035 |
MENT | +1.891 |
acceptance | +1.849 |
OPS | +1.833 |
Neg logit contributions | |
�� | -2.366 |
ゼ | -2.166 |
eeper | -2.044 |
� | -2.023 |
dos | -1.996 |
Token | 2 |
Token ID | 17 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
Honour | +1.224 |
emin | +1.183 |
MENT | +1.125 |
ODY | +1.084 |
acceptance | +1.082 |
Neg logit contributions | |
�� | -1.637 |
ゼ | -1.499 |
eeper | -1.465 |
dos | -1.449 |
verting | -1.419 |
Token | . |
Token ID | 13 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
�� | +1.623 |
ゼ | +1.574 |
dos | +1.556 |
eeper | +1.519 |
verting | +1.513 |
Neg logit contributions | |
Honour | -1.485 |
emin | -1.396 |
MENT | -1.332 |
acceptance | -1.331 |
ODY | -1.319 |
Token | get |
Token ID | 1136 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
�� | +1.001 |
ゼ | +0.960 |
dos | +0.942 |
eeper | +0.918 |
verting | +0.914 |
Neg logit contributions | |
Honour | -1.402 |
emin | -1.340 |
MENT | -1.290 |
acceptance | -1.285 |
ODY | -1.278 |
Token | Struct |
Token ID | 44909 |
Feature activation | +6.33e-01 |
Pos logit contributions | |
Honour | +7.755 |
MENT | +7.373 |
emin | +7.332 |
OPS | +7.210 |
Ont | +7.184 |
Neg logit contributions | |
�� | -7.042 |
olulu | -5.996 |
eeper | -5.905 |
� | -5.775 |
dos | -5.770 |
Token | uring |
Token ID | 870 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
Honour | +3.650 |
emin | +3.555 |
MENT | +3.298 |
acceptance | +3.260 |
OPS | +3.136 |
Neg logit contributions | |
�� | -5.325 |
ゼ | -5.036 |
dos | -4.930 |
� | -4.653 |
arthed | -4.596 |
Token | Element |
Token ID | 20180 |
Feature activation | +4.50e-01 |
Pos logit contributions | |
MENT | +4.228 |
Honour | +3.816 |
emin | +3.172 |
Ont | +3.152 |
ODY | +2.834 |
Neg logit contributions | |
�� | -19.878 |
olulu | -17.798 |
destro | -17.533 |
verting | -17.490 |
dos | -17.457 |
Token | ( |
Token ID | 7 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
Honour | +3.128 |
emin | +2.956 |
MENT | +2.890 |
ODY | +2.841 |
Ont | +2.777 |
Neg logit contributions | |
�� | -3.376 |
ゼ | -3.015 |
dos | -2.927 |
eeper | -2.920 |
verting | -2.897 |
Token | cv |
Token ID | 33967 |
Feature activation | +6.51e-01 |
Pos logit contributions | |
Honour | +3.548 |
emin | +3.522 |
MENT | +3.414 |
acceptance | +3.327 |
ODY | +3.304 |
Neg logit contributions | |
�� | -2.160 |
ゼ | -1.937 |
eeper | -1.830 |
� | -1.774 |
dos | -1.741 |
Token | 2 |
Token ID | 17 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
Honour | +3.374 |
emin | +3.301 |
MENT | +3.214 |
Ont | +3.016 |
ODY | +2.993 |
Neg logit contributions | |
�� | -5.947 |
ゼ | -5.236 |
eeper | -5.220 |
olulu | -5.074 |
dos | -5.012 |
Token | . |
Token ID | 13 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
Honour | +1.445 |
emin | +1.349 |
MENT | +1.298 |
ODY | +1.252 |
acceptance | +1.249 |
Neg logit contributions | |
�� | -2.121 |
ゼ | -1.940 |
eeper | -1.909 |
dos | -1.909 |
verting | -1.878 |
Token | His |
Token ID | 6653 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
�� | +1.082 |
ゼ | +1.049 |
dos | +1.037 |
eeper | +1.019 |
verting | +1.012 |
Neg logit contributions | |
Honour | -0.830 |
emin | -0.779 |
MENT | -0.742 |
acceptance | -0.735 |
ODY | -0.733 |
Token | comments |
Token ID | 3651 |
Feature activation | +6.17e-01 |
Pos logit contributions | |
Honour | +3.654 |
acceptance | +3.381 |
emin | +3.284 |
MENT | +3.101 |
ODY | +3.055 |
Neg logit contributions | |
�� | -4.812 |
ゼ | -4.652 |
dos | -4.549 |
eeper | -4.434 |
verting | -4.416 |
Token | seemed |
Token ID | 3947 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
Honour | +3.374 |
emin | +3.196 |
acceptance | +3.112 |
MENT | +2.987 |
afety | +2.866 |
Neg logit contributions | |
�� | -5.148 |
dos | -4.888 |
ゼ | -4.848 |
arthed | -4.683 |
eeper | -4.682 |
Token | to |
Token ID | 284 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
Honour | +2.971 |
emin | +2.922 |
acceptance | +2.820 |
MENT | +2.714 |
ODY | +2.557 |
Neg logit contributions | |
�� | -4.831 |
dos | -4.670 |
ゼ | -4.653 |
eeper | -4.580 |
verting | -4.567 |
Token | put |
Token ID | 1234 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
Honour | +2.129 |
emin | +1.989 |
acceptance | +1.964 |
MENT | +1.904 |
ODY | +1.824 |
Neg logit contributions | |
�� | -2.604 |
ゼ | -2.476 |
dos | -2.441 |
verting | -2.408 |
eeper | -2.391 |
Token | McDonnell |
Token ID | 39441 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
Honour | +1.984 |
emin | +1.903 |
acceptance | +1.849 |
MENT | +1.793 |
ODY | +1.733 |
Neg logit contributions | |
�� | -2.638 |
ゼ | -2.548 |
dos | -2.517 |
verting | -2.441 |
eeper | -2.425 |
Token | in |
Token ID | 287 |
Feature activation | +9.88e-01 |
Pos logit contributions | |
Honour | +7.805 |
acceptance | +7.502 |
emin | +7.413 |
MENT | +7.020 |
� | +6.813 |
Neg logit contributions | |
�� | -13.730 |
dos | -12.583 |
verting | -12.241 |
ゼ | -12.127 |
arthed | -12.026 |
Token | line |
Token ID | 1627 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
Honour | +5.463 |
emin | +4.957 |
acceptance | +4.920 |
OPS | +4.539 |
afety | +4.511 |
Neg logit contributions | |
�� | -7.784 |
ゼ | -7.561 |
dos | -7.516 |
arthed | -7.294 |
verting | -7.137 |
Token | with |
Token ID | 351 |
Feature activation | -9.94e-04 |
Pos logit contributions | |
�� | +1.904 |
ゼ | +1.888 |
dos | +1.847 |
eeper | +1.828 |
verting | +1.808 |
Neg logit contributions | |
Honour | -1.704 |
emin | -1.585 |
MENT | -1.518 |
ODY | -1.518 |
acceptance | -1.508 |
Token | the |
Token ID | 262 |
Feature activation | -8.40e-02 |
Pos logit contributions | |
�� | +0.008 |
ゼ | +0.008 |
dos | +0.008 |
eeper | +0.008 |
verting | +0.008 |
Neg logit contributions | |
Honour | -0.006 |
emin | -0.005 |
acceptance | -0.005 |
MENT | -0.005 |
ODY | -0.005 |
Token | police |
Token ID | 1644 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
�� | +0.625 |
ゼ | +0.610 |
dos | +0.601 |
eeper | +0.588 |
verting | +0.585 |
Neg logit contributions | |
Honour | -0.546 |
emin | -0.510 |
acceptance | -0.490 |
MENT | -0.485 |
ODY | -0.481 |
Token | v |
Token ID | 85 |
Feature activation | +1.28e-01 |
Pos logit contributions | |
Honour | +0.491 |
emin | +0.474 |
MENT | +0.446 |
acceptance | +0.441 |
ODY | +0.437 |
Neg logit contributions | |
�� | -0.478 |
ゼ | -0.447 |
eeper | -0.424 |
dos | -0.423 |
verting | -0.413 |
Token | 2 |
Token ID | 17 |
Feature activation | -5.57e-01 |
Pos logit contributions | |
Honour | +0.806 |
emin | +0.774 |
MENT | +0.736 |
acceptance | +0.716 |
ODY | +0.714 |
Neg logit contributions | |
�� | -1.013 |
ゼ | -0.939 |
eeper | -0.917 |
dos | -0.913 |
verting | -0.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.73e-01 |
Pos logit contributions | |
ゼ | +3.547 |
dos | +3.533 |
�� | +3.459 |
verting | +3.416 |
eeper | +3.369 |
Neg logit contributions | |
Honour | -3.984 |
emin | -3.750 |
acceptance | -3.635 |
ODY | -3.623 |
MENT | -3.601 |
Token | get |
Token ID | 1136 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
dos | +2.402 |
�� | +2.387 |
ゼ | +2.368 |
verting | +2.251 |
eeper | +2.245 |
Neg logit contributions | |
Honour | -4.119 |
emin | -3.856 |
acceptance | -3.778 |
ODY | -3.754 |
MENT | -3.739 |
Token | Struct |
Token ID | 44909 |
Feature activation | +4.52e-01 |
Pos logit contributions | |
Honour | +7.314 |
MENT | +7.034 |
emin | +6.936 |
OPS | +6.821 |
Ont | +6.807 |
Neg logit contributions | |
�� | -6.829 |
eeper | -5.833 |
olulu | -5.788 |
� | -5.660 |
ゼ | -5.657 |
Token | uring |
Token ID | 870 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
Honour | +2.692 |
emin | +2.609 |
MENT | +2.446 |
acceptance | +2.405 |
ODY | +2.322 |
Neg logit contributions | |
�� | -3.754 |
ゼ | -3.545 |
dos | -3.507 |
� | -3.282 |
eeper | -3.270 |
Token | Element |
Token ID | 20180 |
Feature activation | +9.52e-02 |
Pos logit contributions | |
MENT | +3.988 |
Honour | +3.499 |
emin | +2.892 |
Ont | +2.874 |
ODY | +2.636 |
Neg logit contributions | |
�� | -19.757 |
olulu | -17.662 |
dos | -17.447 |
verting | -17.428 |
destro | -17.285 |
Token | ( |
Token ID | 7 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
Honour | +0.716 |
emin | +0.680 |
MENT | +0.659 |
ODY | +0.652 |
acceptance | +0.645 |
Neg logit contributions | |
�� | -0.642 |
ゼ | -0.594 |
dos | -0.579 |
eeper | -0.570 |
verting | -0.565 |
Token | cv |
Token ID | 33967 |
Feature activation | +5.98e-01 |
Pos logit contributions | |
Honour | +3.311 |
emin | +3.267 |
MENT | +3.184 |
acceptance | +3.107 |
ODY | +3.089 |
Neg logit contributions | |
�� | -1.981 |
ゼ | -1.782 |
eeper | -1.704 |
� | -1.634 |
dos | -1.624 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
Honour | +3.129 |
emin | +3.078 |
MENT | +2.999 |
ODY | +2.804 |
Ont | +2.799 |
Neg logit contributions | |
�� | -5.421 |
ゼ | -4.786 |
eeper | -4.775 |
olulu | -4.648 |
dos | -4.588 |
Token | . |
Token ID | 13 |
Feature activation | +4.33e-01 |
Pos logit contributions | |
�� | +0.790 |
ゼ | +0.754 |
dos | +0.744 |
eeper | +0.732 |
verting | +0.726 |
Neg logit contributions | |
Honour | -0.670 |
emin | -0.630 |
MENT | -0.602 |
acceptance | -0.597 |
ODY | -0.593 |
Token | K |
Token ID | 42 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
Honour | +0.046 |
emin | +0.043 |
MENT | +0.041 |
ODY | +0.040 |
acceptance | +0.040 |
Neg logit contributions | |
�� | -0.067 |
ゼ | -0.065 |
dos | -0.065 |
eeper | -0.064 |
verting | -0.063 |
Token | AND |
Token ID | 5357 |
Feature activation | +5.87e-01 |
Pos logit contributions | |
Honour | +1.379 |
emin | +1.278 |
MENT | +1.238 |
ODY | +1.224 |
OPS | +1.208 |
Neg logit contributions | |
�� | -1.948 |
ゼ | -1.893 |
dos | -1.865 |
verting | -1.835 |
eeper | -1.826 |
Token | AP |
Token ID | 3486 |
Feature activation | +4.60e-01 |
Pos logit contributions | |
Honour | +3.231 |
emin | +2.916 |
MENT | +2.913 |
ODY | +2.875 |
OPS | +2.860 |
Neg logit contributions | |
�� | -4.929 |
dos | -4.741 |
ゼ | -4.712 |
eeper | -4.678 |
verting | -4.655 |
Token | AC |
Token ID | 2246 |
Feature activation | +9.06e-01 |
Pos logit contributions | |
Honour | +1.927 |
emin | +1.764 |
MENT | +1.699 |
ODY | +1.664 |
OPS | +1.632 |
Neg logit contributions | |
�� | -4.416 |
ゼ | -4.297 |
dos | -4.293 |
eeper | -4.245 |
verting | -4.226 |
Token | HE |
Token ID | 13909 |
Feature activation | +2.80e-01 |
Pos logit contributions | |
Honour | +2.212 |
emin | +2.065 |
MENT | +2.025 |
ODY | +1.878 |
OPS | +1.835 |
Neg logit contributions | |
�� | -10.465 |
dos | -9.986 |
eeper | -9.807 |
verting | -9.770 |
olulu | -9.652 |
Token | T |
Token ID | 309 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
Honour | +1.651 |
emin | +1.520 |
MENT | +1.489 |
ODY | +1.469 |
acceptance | +1.449 |
Neg logit contributions | |
�� | -2.259 |
ゼ | -2.185 |
dos | -2.166 |
eeper | -2.127 |
verting | -2.116 |
Token | OC |
Token ID | 4503 |
Feature activation | +4.16e-02 |
Pos logit contributions | |
OC | +2.751 |
OPS | +2.540 |
ODY | +2.100 |
ONY | +1.917 |
MENT | +1.784 |
Neg logit contributions | |
�� | -19.701 |
verting | -18.527 |
eeper | -18.356 |
olulu | -18.269 |
dos | -18.042 |
Token | RE |
Token ID | 4526 |
Feature activation | +4.00e-01 |
Pos logit contributions | |
Honour | +0.220 |
emin | +0.202 |
MENT | +0.192 |
acceptance | +0.191 |
ODY | +0.190 |
Neg logit contributions | |
�� | -0.361 |
ゼ | -0.351 |
dos | -0.349 |
eeper | -0.342 |
verting | -0.340 |
Token | P |
Token ID | 47 |
Feature activation | +3.91e-02 |
Pos logit contributions | |
Honour | +1.401 |
MENT | +1.333 |
OPS | +1.276 |
emin | +1.269 |
ODY | +1.196 |
Neg logit contributions | |
�� | -4.174 |
eeper | -4.011 |
ゼ | -4.000 |
dos | -3.960 |
olulu | -3.912 |
Token | ORTS |
Token ID | 33002 |
Feature activation | -2.88e-01 |
Pos logit contributions | |
Honour | +0.248 |
emin | +0.232 |
MENT | +0.226 |
ODY | +0.225 |
OPS | +0.223 |
Neg logit contributions | |
�� | -0.300 |
ゼ | -0.290 |
dos | -0.284 |
eeper | -0.279 |
verting | -0.278 |
Token | 100 |
Token ID | 1802 |
Feature activation | -6.11e-01 |
Pos logit contributions | |
�� | +2.002 |
ゼ | +1.960 |
dos | +1.933 |
eeper | +1.880 |
verting | +1.877 |
Neg logit contributions | |
Honour | -1.978 |
emin | -1.867 |
acceptance | -1.781 |
MENT | -1.769 |
ODY | -1.758 |
Token | 505 |
Token ID | 31654 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
Honour | +4.226 |
emin | +3.978 |
MENT | +3.882 |
acceptance | +3.853 |
ODY | +3.852 |
Neg logit contributions | |
�� | -4.894 |
ゼ | -4.614 |
eeper | -4.548 |
verting | -4.543 |
dos | -4.504 |
Token | z |
Token ID | 89 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
Honour | +2.216 |
emin | +2.073 |
MENT | +1.999 |
ODY | +1.995 |
acceptance | +1.977 |
Neg logit contributions | |
�� | -2.697 |
ゼ | -2.586 |
dos | -2.536 |
eeper | -2.519 |
verting | -2.519 |
Token | BLACK |
Token ID | 31963 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
Honour | +1.709 |
emin | +1.583 |
MENT | +1.536 |
ODY | +1.519 |
acceptance | +1.502 |
Neg logit contributions | |
�� | -2.262 |
ゼ | -2.177 |
dos | -2.157 |
eeper | -2.126 |
verting | -2.122 |
Token | FO |
Token ID | 6080 |
Feature activation | -9.96e-02 |
Pos logit contributions | |
Honour | +1.003 |
emin | +0.943 |
MENT | +0.916 |
ODY | +0.905 |
acceptance | +0.902 |
Neg logit contributions | |
�� | -1.099 |
ゼ | -1.065 |
dos | -1.055 |
verting | -1.029 |
eeper | -1.027 |
Token | OT |
Token ID | 2394 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
�� | +0.780 |
ゼ | +0.759 |
dos | +0.753 |
eeper | +0.736 |
verting | +0.735 |
Neg logit contributions | |
Honour | -0.607 |
emin | -0.566 |
MENT | -0.541 |
ODY | -0.540 |
acceptance | -0.537 |
Token | T |
Token ID | 309 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
Honour | +3.100 |
emin | +2.794 |
MENT | +2.779 |
ODY | +2.758 |
acceptance | +2.727 |
Neg logit contributions | |
�� | -4.376 |
ゼ | -4.235 |
dos | -4.131 |
eeper | -4.113 |
verting | -4.078 |
Token | OC |
Token ID | 4503 |
Feature activation | +7.00e-01 |
Pos logit contributions | |
OPS | +6.267 |
ODY | +6.194 |
OC | +6.172 |
ONY | +6.016 |
MENT | +5.879 |
Neg logit contributions | |
�� | -14.199 |
verting | -13.711 |
dos | -13.506 |
ゼ | -13.465 |
eeper | -13.307 |
Token | RE |
Token ID | 4526 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
Honour | +3.800 |
MENT | +3.438 |
ODY | +3.389 |
emin | +3.347 |
OPS | +3.332 |
Neg logit contributions | |
�� | -5.943 |
ゼ | -5.699 |
dos | -5.624 |
eeper | -5.569 |
verting | -5.482 |
Token | P |
Token ID | 47 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
Honour | +1.791 |
MENT | +1.688 |
emin | +1.610 |
OPS | +1.602 |
ODY | +1.499 |
Neg logit contributions | |
�� | -5.194 |
ゼ | -5.058 |
eeper | -5.025 |
dos | -4.997 |
verting | -4.923 |
Token | ORTS |
Token ID | 33002 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
Honour | +2.219 |
MENT | +2.081 |
ODY | +2.075 |
emin | +2.072 |
OPS | +2.053 |
Neg logit contributions | |
�� | -3.069 |
ゼ | -2.976 |
dos | -2.892 |
verting | -2.844 |
eeper | -2.843 |
Token | B |
Token ID | 347 |
Feature activation | -2.52e-01 |
Pos logit contributions | |
�� | +2.819 |
ゼ | +2.761 |
dos | +2.736 |
eeper | +2.665 |
verting | +2.658 |
Neg logit contributions | |
Honour | -2.256 |
emin | -2.131 |
acceptance | -2.012 |
MENT | -1.994 |
ODY | -1.976 |
Token | 1 |
Token ID | 352 |
Feature activation | +1.54e-02 |
Pos logit contributions | |
Honour | +1.058 |
emin | +0.953 |
MENT | +0.923 |
ODY | +0.911 |
acceptance | +0.909 |
Neg logit contributions | |
�� | -1.701 |
ゼ | -1.646 |
dos | -1.636 |
eeper | -1.608 |
verting | -1.601 |
Token | GER |
Token ID | 44186 |
Feature activation | +8.24e-01 |
Pos logit contributions | |
Honour | +0.091 |
emin | +0.085 |
MENT | +0.081 |
acceptance | +0.080 |
ODY | +0.080 |
Neg logit contributions | |
�� | -0.124 |
ゼ | -0.121 |
dos | -0.119 |
eeper | -0.117 |
verting | -0.117 |
Token | ON |
Token ID | 1340 |
Feature activation | +9.00e-01 |
Pos logit contributions | |
Honour | +2.746 |
MENT | +2.547 |
ODY | +2.491 |
emin | +2.448 |
OPS | +2.408 |
Neg logit contributions | |
�� | -8.389 |
ゼ | -8.170 |
dos | -8.075 |
verting | -8.044 |
eeper | -8.036 |
Token | IM |
Token ID | 3955 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
Honour | +2.625 |
MENT | +2.455 |
emin | +2.321 |
OPS | +2.259 |
ODY | +2.174 |
Neg logit contributions | |
�� | -9.884 |
dos | -9.398 |
eeper | -9.391 |
verting | -9.300 |
olulu | -9.280 |
Token | O |
Token ID | 46 |
Feature activation | +3.77e-01 |
Pos logit contributions | |
�� | +1.036 |
ゼ | +1.008 |
dos | +0.998 |
eeper | +0.977 |
verting | +0.974 |
Neg logit contributions | |
Honour | -0.790 |
emin | -0.737 |
MENT | -0.702 |
acceptance | -0.700 |
ODY | -0.696 |
Token | T |
Token ID | 309 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
Honour | +2.201 |
emin | +2.002 |
MENT | +1.962 |
ODY | +1.948 |
acceptance | +1.947 |
Neg logit contributions | |
�� | -3.045 |
ゼ | -2.983 |
dos | -2.935 |
eeper | -2.883 |
verting | -2.859 |
Token | OC |
Token ID | 4503 |
Feature activation | +5.54e-01 |
Pos logit contributions | |
OC | +2.638 |
OPS | +2.259 |
ODY | +2.147 |
MENT | +1.720 |
ONY | +1.655 |
Neg logit contributions | |
�� | -19.346 |
verting | -18.261 |
olulu | -18.111 |
eeper | -18.071 |
dos | -17.960 |
Token | IN |
Token ID | 3268 |
Feature activation | +5.92e-01 |
Pos logit contributions | |
Honour | +3.085 |
ODY | +2.774 |
MENT | +2.763 |
emin | +2.735 |
acceptance | +2.704 |
Neg logit contributions | |
�� | -4.714 |
ゼ | -4.536 |
dos | -4.445 |
eeper | -4.361 |
verting | -4.313 |
Token | IT |
Token ID | 2043 |
Feature activation | +6.52e-01 |
Pos logit contributions | |
Honour | +3.410 |
emin | +3.113 |
MENT | +3.033 |
ODY | +3.026 |
OPS | +2.991 |
Neg logit contributions | |
�� | -4.838 |
ゼ | -4.693 |
dos | -4.621 |
eeper | -4.586 |
verting | -4.440 |
Token | I |
Token ID | 40 |
Feature activation | +3.64e-01 |
Pos logit contributions | |
Honour | +3.260 |
MENT | +3.061 |
emin | +2.964 |
ODY | +2.902 |
OPS | +2.897 |
Neg logit contributions | |
�� | -5.883 |
ゼ | -5.530 |
dos | -5.522 |
eeper | -5.410 |
verting | -5.362 |
Token | ATES |
Token ID | 29462 |
Feature activation | -8.46e-02 |
Pos logit contributions | |
Honour | +2.086 |
emin | +1.964 |
MENT | +1.929 |
ODY | +1.924 |
OPS | +1.880 |
Neg logit contributions | |
�� | -2.984 |
dos | -2.850 |
ゼ | -2.845 |
eeper | -2.767 |
verting | -2.743 |
Token | Ri |
Token ID | 30385 |
Feature activation | -2.26e-01 |
Pos logit contributions | |
�� | +1.051 |
ゼ | +1.030 |
dos | +1.017 |
eeper | +0.999 |
verting | +0.995 |
Neg logit contributions | |
Honour | -0.636 |
emin | -0.591 |
MENT | -0.557 |
acceptance | -0.554 |
ODY | -0.551 |
Token | ks |
Token ID | 591 |
Feature activation | -5.71e-01 |
Pos logit contributions | |
�� | +1.417 |
ゼ | +1.375 |
dos | +1.362 |
eeper | +1.324 |
verting | +1.317 |
Neg logit contributions | |
Honour | -1.713 |
emin | -1.618 |
acceptance | -1.559 |
MENT | -1.559 |
ODY | -1.545 |
Token | bank |
Token ID | 17796 |
Feature activation | -4.59e-01 |
Pos logit contributions | |
dos | +3.959 |
�� | +3.932 |
ゼ | +3.899 |
verting | +3.794 |
eeper | +3.793 |
Neg logit contributions | |
Honour | -3.831 |
emin | -3.566 |
MENT | -3.445 |
ODY | -3.435 |
acceptance | -3.433 |
Token | Prize |
Token ID | 15895 |
Feature activation | -8.59e-02 |
Pos logit contributions | |
�� | +2.069 |
ゼ | +2.000 |
dos | +1.939 |
eeper | +1.908 |
verting | +1.871 |
Neg logit contributions | |
Honour | -4.105 |
emin | -4.007 |
MENT | -3.886 |
ODY | -3.886 |
OPS | -3.845 |
Token | in |
Token ID | 287 |
Feature activation | +9.06e-01 |
Pos logit contributions | |
�� | +0.625 |
ゼ | +0.608 |
dos | +0.601 |
eeper | +0.587 |
verting | +0.584 |
Neg logit contributions | |
Honour | -0.566 |
emin | -0.533 |
MENT | -0.508 |
acceptance | -0.507 |
ODY | -0.505 |
Token | Economic |
Token ID | 11279 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Honour | +4.003 |
emin | +3.319 |
acceptance | +3.205 |
Expression | +3.033 |
ODY | +2.962 |
Neg logit contributions | |
dos | -8.534 |
�� | -8.500 |
ゼ | -8.443 |
eeper | -8.216 |
verting | -8.032 |
Token | Sciences |
Token ID | 13473 |
Feature activation | -3.50e-02 |
Pos logit contributions | |
Honour | +6.150 |
emin | +4.926 |
Expression | +4.869 |
acceptance | +4.425 |
Congratulations | +4.187 |
Neg logit contributions | |
�� | -15.922 |
ゼ | -15.408 |
olulu | -15.105 |
eeper | -14.928 |
dos | -14.400 |
Token | in |
Token ID | 287 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
�� | +0.251 |
ゼ | +0.245 |
dos | +0.242 |
eeper | +0.236 |
verting | +0.235 |
Neg logit contributions | |
Honour | -0.233 |
emin | -0.220 |
MENT | -0.210 |
acceptance | -0.209 |
ODY | -0.208 |
Token | Memory |
Token ID | 14059 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
Honour | +1.678 |
emin | +1.501 |
acceptance | +1.449 |
MENT | +1.430 |
ODY | +1.404 |
Neg logit contributions | |
�� | -1.698 |
ゼ | -1.642 |
dos | -1.609 |
eeper | -1.580 |
verting | -1.540 |
Token | of |
Token ID | 286 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
�� | +1.850 |
ゼ | +1.814 |
dos | +1.795 |
eeper | +1.748 |
verting | +1.743 |
Neg logit contributions | |
Honour | -1.587 |
emin | -1.493 |
acceptance | -1.422 |
MENT | -1.420 |
ODY | -1.411 |
Token | Alfred |
Token ID | 22044 |
Feature activation | +6.82e-01 |
Pos logit contributions | |
Honour | +3.720 |
emin | +3.082 |
acceptance | +2.834 |
MENT | +2.669 |
Expression | +2.580 |
Neg logit contributions | |
�� | -10.304 |
ゼ | -9.956 |
dos | -9.942 |
eeper | -9.774 |
verting | -9.758 |
Token | . |
Token ID | 13 |
Feature activation | +3.06e-01 |
Pos logit contributions | |
�� | +1.141 |
ゼ | +1.098 |
dos | +1.085 |
eeper | +1.064 |
verting | +1.057 |
Neg logit contributions | |
Honour | -1.006 |
emin | -0.944 |
MENT | -0.902 |
acceptance | -0.897 |
ODY | -0.891 |
Token | Solid |
Token ID | 46933 |
Feature activation | +9.38e-01 |
Pos logit contributions | |
Honour | +1.644 |
emin | +1.550 |
MENT | +1.494 |
ODY | +1.449 |
OPS | +1.423 |
Neg logit contributions | |
�� | -2.670 |
eeper | -2.510 |
ゼ | -2.499 |
dos | -2.496 |
verting | -2.438 |
Token | Br |
Token ID | 9414 |
Feature activation | +2.29e-01 |
Pos logit contributions | |
Honour | +3.574 |
emin | +3.244 |
MENT | +3.165 |
Ont | +2.961 |
ODY | +2.937 |
Neg logit contributions | |
�� | -9.505 |
eeper | -8.796 |
olulu | -8.772 |
ゼ | -8.736 |
verting | -8.708 |
Token | ush |
Token ID | 1530 |
Feature activation | +4.80e-01 |
Pos logit contributions | |
Honour | +1.513 |
emin | +1.443 |
acceptance | +1.337 |
MENT | +1.323 |
ODY | +1.307 |
Neg logit contributions | |
�� | -1.738 |
ゼ | -1.651 |
dos | -1.588 |
verting | -1.570 |
eeper | -1.537 |
Token | ( |
Token ID | 357 |
Feature activation | +7.47e-01 |
Pos logit contributions | |
Honour | +2.764 |
emin | +2.513 |
MENT | +2.478 |
ODY | +2.428 |
OPS | +2.356 |
Neg logit contributions | |
�� | -4.152 |
ゼ | -3.811 |
dos | -3.753 |
verting | -3.737 |
eeper | -3.722 |
Token | [ |
Token ID | 685 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
Honour | +4.784 |
emin | +4.562 |
MENT | +4.382 |
ODY | +4.358 |
acceptance | +4.338 |
Neg logit contributions | |
�� | -5.393 |
ゼ | -5.179 |
dos | -5.084 |
eeper | -5.048 |
verting | -4.880 |
Token | System |
Token ID | 11964 |
Feature activation | +3.54e-02 |
Pos logit contributions | |
emin | +5.099 |
MENT | +5.086 |
Ont | +5.000 |
Honour | +4.916 |
GN | +4.720 |
Neg logit contributions | |
�� | -15.439 |
olulu | -14.504 |
eeper | -14.406 |
destro | -14.324 |
ゼ | -13.845 |
Token | . |
Token ID | 13 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
Honour | +0.220 |
emin | +0.206 |
MENT | +0.196 |
acceptance | +0.193 |
ODY | +0.192 |
Neg logit contributions | |
�� | -0.284 |
ゼ | -0.268 |
dos | -0.263 |
eeper | -0.261 |
verting | -0.257 |
Token | Draw |
Token ID | 25302 |
Feature activation | -4.93e-01 |
Pos logit contributions | |
Honour | +2.164 |
emin | +2.044 |
MENT | +1.983 |
ODY | +1.975 |
OPS | +1.955 |
Neg logit contributions | |
�� | -2.510 |
eeper | -2.321 |
ゼ | -2.297 |
dos | -2.234 |
verting | -2.232 |
Token | ing |
Token ID | 278 |
Feature activation | -2.08e-02 |
Pos logit contributions | |
�� | +2.609 |
dos | +2.594 |
ゼ | +2.572 |
verting | +2.507 |
eeper | +2.489 |
Neg logit contributions | |
Honour | -4.114 |
emin | -3.869 |
acceptance | -3.783 |
ODY | -3.747 |
MENT | -3.735 |
Token | . |
Token ID | 13 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
�� | +0.162 |
ゼ | +0.153 |
dos | +0.151 |
eeper | +0.150 |
verting | +0.148 |
Neg logit contributions | |
Honour | -0.132 |
emin | -0.124 |
MENT | -0.118 |
acceptance | -0.117 |
ODY | -0.116 |
Token | ( |
Token ID | 7 |
Feature activation | +3.45e-01 |
Pos logit contributions | |
Honour | +3.222 |
emin | +3.099 |
MENT | +3.002 |
ODY | +2.961 |
OPS | +2.899 |
Neg logit contributions | |
�� | -3.467 |
ゼ | -3.102 |
dos | -3.031 |
verting | -2.961 |
eeper | -2.959 |
Token | cv |
Token ID | 33967 |
Feature activation | +7.49e-01 |
Pos logit contributions | |
Honour | +3.136 |
emin | +3.045 |
MENT | +2.966 |
acceptance | +2.938 |
ODY | +2.915 |
Neg logit contributions | |
�� | -1.635 |
ゼ | -1.513 |
dos | -1.451 |
eeper | -1.430 |
verting | -1.410 |
Token | 2 |
Token ID | 17 |
Feature activation | +2.12e-02 |
Pos logit contributions | |
emin | +3.767 |
Honour | +3.748 |
MENT | +3.535 |
ODY | +3.367 |
Ont | +3.357 |
Neg logit contributions | |
�� | -6.873 |
ゼ | -6.059 |
eeper | -5.990 |
� | -5.828 |
olulu | -5.822 |
Token | . |
Token ID | 13 |
Feature activation | +9.55e-01 |
Pos logit contributions | |
Honour | +0.132 |
emin | +0.124 |
MENT | +0.119 |
acceptance | +0.117 |
ODY | +0.116 |
Neg logit contributions | |
�� | -0.169 |
ゼ | -0.159 |
dos | -0.156 |
eeper | -0.155 |
verting | -0.153 |
Token | M |
Token ID | 44 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
MENT | +4.272 |
Honour | +4.169 |
emin | +4.071 |
ODY | +4.058 |
OPS | +3.955 |
Neg logit contributions | |
�� | -8.445 |
ゼ | -8.044 |
dos | -8.035 |
eeper | -7.979 |
verting | -7.967 |
Token | OR |
Token ID | 1581 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
ODY | +2.091 |
Honour | +2.063 |
MENT | +1.952 |
OPS | +1.909 |
emin | +1.639 |
Neg logit contributions | |
�� | -12.955 |
ゼ | -12.172 |
verting | -12.125 |
dos | -12.045 |
eeper | -11.868 |
Token | PH |
Token ID | 11909 |
Feature activation | +9.99e-01 |
Pos logit contributions | |
MENT | +3.555 |
ODY | +2.809 |
OPS | +2.626 |
Honour | +2.607 |
WATCH | +2.320 |
Neg logit contributions | |
�� | -18.019 |
olulu | -17.337 |
dos | -17.132 |
verting | -16.951 |
eeper | -16.745 |
Token | _ |
Token ID | 62 |
Feature activation | +5.29e-01 |
Pos logit contributions | |
MENT | +3.573 |
Honour | +3.451 |
OPS | +3.297 |
ODY | +3.287 |
emin | +3.241 |
Neg logit contributions | |
�� | -10.371 |
olulu | -9.399 |
ゼ | -9.371 |
verting | -9.253 |
eeper | -9.248 |
Token | RECT |
Token ID | 23988 |
Feature activation | -7.26e-03 |
Pos logit contributions | |
Honour | +2.576 |
MENT | +2.484 |
OPS | +2.424 |
emin | +2.419 |
ODY | +2.418 |
Neg logit contributions | |
�� | -4.718 |
ゼ | -4.475 |
dos | -4.456 |
eeper | -4.407 |
verting | -4.353 |
Token | , |
Token ID | 11 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
�� | +0.054 |
ゼ | +0.053 |
dos | +0.052 |
eeper | +0.051 |
verting | +0.051 |
Neg logit contributions | |
Honour | -0.047 |
emin | -0.043 |
acceptance | -0.042 |
MENT | -0.041 |
ODY | -0.041 |
Token | ( |
Token ID | 357 |
Feature activation | +4.12e-01 |
Pos logit contributions | |
Honour | +1.585 |
emin | +1.480 |
acceptance | +1.429 |
MENT | +1.426 |
ODY | +1.417 |
Neg logit contributions | |
�� | -1.890 |
ゼ | -1.808 |
dos | -1.790 |
verting | -1.750 |
eeper | -1.736 |
Token |
|
Token ID | 198 |
Feature activation | -2.08e-01 |
Pos logit contributions | |
Honour | +0.947 |
emin | +0.865 |
MENT | +0.817 |
acceptance | +0.815 |
ODY | +0.798 |
Neg logit contributions | |
�� | -1.522 |
ゼ | -1.440 |
eeper | -1.409 |
dos | -1.408 |
verting | -1.390 |
Token |
|
Token ID | 198 |
Feature activation | -9.15e-01 |
Pos logit contributions | |
�� | +1.626 |
ゼ | +1.591 |
dos | +1.577 |
eeper | +1.537 |
verting | +1.535 |
Neg logit contributions | |
Honour | -1.258 |
emin | -1.176 |
acceptance | -1.118 |
MENT | -1.115 |
ODY | -1.107 |
Token | 2004 |
Token ID | 15724 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
dos | +5.784 |
ゼ | +5.488 |
�� | +5.484 |
verting | +5.359 |
................................................................ | +5.338 |
Neg logit contributions | |
Honour | -6.540 |
emin | -6.092 |
acceptance | -6.018 |
afety | -5.926 |
Expression | -5.778 |
Token | Matt |
Token ID | 4705 |
Feature activation | +4.98e-02 |
Pos logit contributions | |
�� | +1.294 |
ゼ | +1.261 |
dos | +1.248 |
eeper | +1.219 |
verting | +1.215 |
Neg logit contributions | |
Honour | -1.029 |
emin | -0.962 |
acceptance | -0.915 |
MENT | -0.914 |
ODY | -0.906 |
Token | Le |
Token ID | 1004 |
Feature activation | +7.49e-01 |
Pos logit contributions | |
Honour | +0.348 |
emin | +0.322 |
acceptance | +0.306 |
MENT | +0.305 |
ODY | +0.299 |
Neg logit contributions | |
�� | -0.363 |
ゼ | -0.343 |
dos | -0.338 |
eeper | -0.331 |
verting | -0.327 |
Token | Bl |
Token ID | 3629 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
Honour | +2.746 |
emin | +2.440 |
Ont | +2.177 |
MENT | +2.161 |
OPS | +2.090 |
Neg logit contributions | |
�� | -7.872 |
dos | -7.373 |
eeper | -7.319 |
ゼ | -7.218 |
verting | -7.047 |
Token | anc |
Token ID | 1192 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
Honour | +7.160 |
emin | +7.102 |
abre | +6.574 |
acceptance | +6.065 |
older | +5.949 |
Neg logit contributions | |
�� | -14.012 |
ゼ | -12.574 |
� | -12.452 |
ゴン | -12.247 |
�� | -12.111 |
Token |
|
Token ID | 198 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
�� | +1.844 |
ゼ | +1.804 |
dos | +1.790 |
eeper | +1.743 |
verting | +1.741 |
Neg logit contributions | |
Honour | -1.432 |
emin | -1.341 |
acceptance | -1.273 |
MENT | -1.272 |
ODY | -1.261 |
Token |
|
Token ID | 198 |
Feature activation | -8.79e-01 |
Pos logit contributions | |
�� | +2.318 |
ゼ | +2.298 |
dos | +2.289 |
verting | +2.220 |
eeper | +2.211 |
Neg logit contributions | |
Honour | -1.932 |
emin | -1.812 |
acceptance | -1.732 |
MENT | -1.721 |
ODY | -1.716 |
Token | 2004 |
Token ID | 15724 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
dos | +5.643 |
ゼ | +5.392 |
�� | +5.383 |
verting | +5.275 |
................................................................ | +5.228 |
Neg logit contributions | |
Honour | -6.184 |
emin | -5.770 |
acceptance | -5.688 |
afety | -5.597 |
Expression | -5.421 |
Token | John |
Token ID | 1757 |
Feature activation | +2.68e-02 |
Pos logit contributions | |
�� | +2.670 |
ゼ | +2.621 |
dos | +2.586 |
verting | +2.524 |
eeper | +2.510 |
Neg logit contributions | |
Honour | -2.600 |
emin | -2.464 |
MENT | -2.356 |
acceptance | -2.352 |
ODY | -2.343 |
Token | v |
Token ID | 85 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
Honour | +1.158 |
emin | +1.128 |
acceptance | +1.042 |
MENT | +1.041 |
ODY | +1.025 |
Neg logit contributions | |
�� | -1.223 |
ゼ | -1.147 |
eeper | -1.059 |
dos | -1.058 |
� | -1.057 |
Token | 2 |
Token ID | 17 |
Feature activation | -4.23e-01 |
Pos logit contributions | |
Honour | +2.012 |
emin | +1.976 |
MENT | +1.831 |
acceptance | +1.785 |
OPS | +1.781 |
Neg logit contributions | |
�� | -2.836 |
ゼ | -2.594 |
eeper | -2.510 |
dos | -2.500 |
� | -2.435 |
Token | . |
Token ID | 13 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
�� | +2.846 |
ゼ | +2.824 |
dos | +2.811 |
verting | +2.728 |
eeper | +2.717 |
Neg logit contributions | |
Honour | -2.942 |
emin | -2.760 |
acceptance | -2.663 |
MENT | -2.642 |
ODY | -2.636 |
Token | get |
Token ID | 1136 |
Feature activation | +9.10e-01 |
Pos logit contributions | |
Honour | +2.480 |
emin | +2.397 |
MENT | +2.316 |
ODY | +2.274 |
acceptance | +2.267 |
Neg logit contributions | |
�� | -2.138 |
ゼ | -2.037 |
dos | -1.981 |
eeper | -1.958 |
verting | -1.947 |
Token | Struct |
Token ID | 44909 |
Feature activation | +5.82e-01 |
Pos logit contributions | |
Honour | +6.890 |
MENT | +6.645 |
emin | +6.603 |
ODY | +6.572 |
OPS | +6.501 |
Neg logit contributions | |
�� | -5.568 |
dos | -4.914 |
ゼ | -4.840 |
eeper | -4.816 |
verting | -4.691 |
Token | uring |
Token ID | 870 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
Honour | +3.361 |
emin | +3.256 |
MENT | +3.043 |
acceptance | +2.946 |
afety | +2.899 |
Neg logit contributions | |
�� | -4.919 |
ゼ | -4.624 |
dos | -4.548 |
� | -4.272 |
eeper | -4.254 |
Token | Element |
Token ID | 20180 |
Feature activation | +4.68e-01 |
Pos logit contributions | |
MENT | +5.135 |
Honour | +4.811 |
Ont | +4.378 |
ODY | +4.373 |
emin | +4.172 |
Neg logit contributions | |
�� | -16.435 |
olulu | -14.749 |
dos | -14.657 |
verting | -14.533 |
gettable | -14.350 |
Token | ( |
Token ID | 7 |
Feature activation | +3.45e-01 |
Pos logit contributions | |
Honour | +3.222 |
emin | +3.099 |
MENT | +3.002 |
ODY | +2.961 |
OPS | +2.899 |
Neg logit contributions | |
�� | -3.467 |
ゼ | -3.102 |
dos | -3.031 |
verting | -2.961 |
eeper | -2.959 |
Token | cv |
Token ID | 33967 |
Feature activation | +7.49e-01 |
Pos logit contributions | |
Honour | +3.136 |
emin | +3.045 |
MENT | +2.966 |
acceptance | +2.938 |
ODY | +2.915 |
Neg logit contributions | |
�� | -1.635 |
ゼ | -1.513 |
dos | -1.451 |
eeper | -1.430 |
verting | -1.410 |
Token | 2 |
Token ID | 17 |
Feature activation | +2.12e-02 |
Pos logit contributions | |
emin | +3.767 |
Honour | +3.748 |
MENT | +3.535 |
ODY | +3.367 |
Ont | +3.357 |
Neg logit contributions | |
�� | -6.873 |
ゼ | -6.059 |
eeper | -5.990 |
� | -5.828 |
olulu | -5.822 |
Token | . |
Token ID | 13 |
Feature activation | +9.55e-01 |
Pos logit contributions | |
Honour | +0.132 |
emin | +0.124 |
MENT | +0.119 |
acceptance | +0.117 |
ODY | +0.116 |
Neg logit contributions | |
�� | -0.169 |
ゼ | -0.159 |
dos | -0.156 |
eeper | -0.155 |
verting | -0.153 |
Token | 41 |
Token ID | 3901 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
�� | +0.181 |
ゼ | +0.175 |
dos | +0.173 |
eeper | +0.170 |
verting | +0.169 |
Neg logit contributions | |
Honour | -0.167 |
emin | -0.157 |
MENT | -0.151 |
ODY | -0.150 |
acceptance | -0.149 |
Token | z |
Token ID | 89 |
Feature activation | -8.78e-03 |
Pos logit contributions | |
Honour | +1.596 |
emin | +1.511 |
MENT | +1.417 |
acceptance | +1.407 |
ODY | +1.397 |
Neg logit contributions | |
�� | -2.240 |
ゼ | -2.103 |
dos | -2.041 |
eeper | -2.040 |
verting | -2.025 |
Token | BLACK |
Token ID | 31963 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
�� | +0.071 |
ゼ | +0.069 |
dos | +0.069 |
eeper | +0.067 |
verting | +0.067 |
Neg logit contributions | |
Honour | -0.051 |
emin | -0.048 |
MENT | -0.045 |
acceptance | -0.045 |
ODY | -0.045 |
Token | FO |
Token ID | 6080 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
Honour | +0.751 |
emin | +0.706 |
MENT | +0.682 |
acceptance | +0.675 |
ODY | +0.675 |
Neg logit contributions | |
�� | -0.807 |
ゼ | -0.783 |
dos | -0.775 |
eeper | -0.756 |
verting | -0.755 |
Token | OT |
Token ID | 2394 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
�� | +0.854 |
ゼ | +0.830 |
dos | +0.823 |
eeper | +0.805 |
verting | +0.803 |
Neg logit contributions | |
Honour | -0.668 |
emin | -0.624 |
MENT | -0.595 |
ODY | -0.593 |
acceptance | -0.592 |
Token | T |
Token ID | 309 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
Honour | +1.633 |
emin | +1.498 |
MENT | +1.466 |
ODY | +1.450 |
acceptance | +1.445 |
Neg logit contributions | |
�� | -2.262 |
ゼ | -2.199 |
dos | -2.166 |
eeper | -2.128 |
verting | -2.114 |
Token | OC |
Token ID | 4503 |
Feature activation | +3.67e-01 |
Pos logit contributions | |
OC | +2.464 |
OPS | +2.298 |
ODY | +2.175 |
ONY | +1.821 |
MENT | +1.725 |
Neg logit contributions | |
�� | -18.300 |
verting | -17.295 |
olulu | -17.113 |
eeper | -17.082 |
dos | -17.062 |
Token | AK |
Token ID | 15837 |
Feature activation | +6.92e-01 |
Pos logit contributions | |
Honour | +2.046 |
emin | +1.851 |
MENT | +1.835 |
ODY | +1.824 |
acceptance | +1.793 |
Neg logit contributions | |
�� | -3.117 |
ゼ | -3.006 |
dos | -2.951 |
eeper | -2.910 |
verting | -2.881 |
Token | NOW |
Token ID | 45669 |
Feature activation | +9.11e-01 |
Pos logit contributions | |
Honour | +4.033 |
MENT | +3.841 |
emin | +3.813 |
ODY | +3.813 |
OPS | +3.794 |
Neg logit contributions | |
�� | -5.369 |
dos | -5.184 |
ゼ | -5.151 |
verting | -5.006 |
eeper | -4.971 |
Token | LED |
Token ID | 30465 |
Feature activation | -4.94e-02 |
Pos logit contributions | |
MENT | +3.978 |
Honour | +3.860 |
emin | +3.818 |
ODY | +3.814 |
OPS | +3.677 |
Neg logit contributions | |
�� | -8.457 |
ゼ | -8.070 |
dos | -8.031 |
eeper | -7.833 |
olulu | -7.818 |
Token | G |
Token ID | 38 |
Feature activation | +1.81e-02 |
Pos logit contributions | |
�� | +0.469 |
ゼ | +0.453 |
dos | +0.451 |
eeper | +0.445 |
verting | +0.443 |
Neg logit contributions | |
Honour | -0.222 |
emin | -0.204 |
MENT | -0.193 |
ODY | -0.189 |
acceptance | -0.188 |
Token | estate |
Token ID | 7964 |
Feature activation | +6.39e-04 |
Pos logit contributions | |
Honour | +4.209 |
acceptance | +3.918 |
emin | +3.759 |
MENT | +3.725 |
ODY | +3.527 |
Neg logit contributions | |
�� | -4.348 |
ゼ | -4.036 |
dos | -3.810 |
verting | -3.792 |
eeper | -3.729 |
Token | in |
Token ID | 287 |
Feature activation | +6.27e-01 |
Pos logit contributions | |
Honour | +0.004 |
emin | +0.004 |
acceptance | +0.004 |
MENT | +0.004 |
ODY | +0.004 |
Neg logit contributions | |
�� | -0.005 |
ゼ | -0.005 |
dos | -0.005 |
eeper | -0.005 |
verting | -0.005 |
Token | W |
Token ID | 370 |
Feature activation | +5.51e-01 |
Pos logit contributions | |
Honour | +3.069 |
emin | +2.846 |
acceptance | +2.620 |
ODY | +2.589 |
MENT | +2.577 |
Neg logit contributions | |
�� | -5.502 |
ゼ | -5.328 |
dos | -5.315 |
eeper | -5.282 |
verting | -5.190 |
Token | alth |
Token ID | 1094 |
Feature activation | +4.04e-01 |
Pos logit contributions | |
Honour | +2.731 |
emin | +2.707 |
acceptance | +2.345 |
MENT | +2.344 |
abre | +2.288 |
Neg logit contributions | |
�� | -5.013 |
ゼ | -4.811 |
dos | -4.704 |
eeper | -4.553 |
� | -4.518 |
Token | am |
Token ID | 321 |
Feature activation | +6.82e-01 |
Pos logit contributions | |
Honour | +2.576 |
emin | +2.490 |
acceptance | +2.296 |
MENT | +2.271 |
ODY | +2.228 |
Neg logit contributions | |
�� | -3.105 |
ゼ | -2.989 |
dos | -2.816 |
eeper | -2.813 |
verting | -2.793 |
Token | and |
Token ID | 290 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
Honour | +3.557 |
emin | +3.320 |
acceptance | +3.098 |
MENT | +2.980 |
OPS | +2.898 |
Neg logit contributions | |
�� | -6.241 |
ゼ | -5.625 |
eeper | -5.542 |
dos | -5.486 |
verting | -5.467 |
Token | Som |
Token ID | 9995 |
Feature activation | +4.17e-01 |
Pos logit contributions | |
Honour | +3.000 |
emin | +2.627 |
MENT | +1.886 |
Expression | +1.830 |
acceptance | +1.795 |
Neg logit contributions | |
�� | -17.276 |
eeper | -16.459 |
dos | -16.169 |
arthed | -15.943 |
ゼ | -15.760 |
Token | erville |
Token ID | 33487 |
Feature activation | -6.00e-01 |
Pos logit contributions | |
Honour | +3.503 |
emin | +3.493 |
MENT | +3.322 |
acceptance | +3.278 |
ODY | +3.254 |
Neg logit contributions | |
�� | -2.283 |
ゼ | -2.174 |
dos | -2.126 |
verting | -1.961 |
eeper | -1.944 |
Token | 's |
Token ID | 338 |
Feature activation | +5.27e-01 |
Pos logit contributions | |
ゼ | +3.235 |
dos | +3.202 |
�� | +3.165 |
verting | +3.071 |
eeper | +3.066 |
Neg logit contributions | |
Honour | -4.830 |
emin | -4.628 |
acceptance | -4.468 |
ODY | -4.447 |
MENT | -4.440 |
Token | Union |
Token ID | 4479 |
Feature activation | +7.78e-01 |
Pos logit contributions | |
Honour | +3.976 |
emin | +3.788 |
acceptance | +3.658 |
MENT | +3.628 |
ODY | +3.578 |
Neg logit contributions | |
�� | -3.335 |
ゼ | -3.150 |
dos | -3.123 |
eeper | -3.050 |
verting | -3.034 |
Token | Square |
Token ID | 9276 |
Feature activation | -6.99e-03 |
Pos logit contributions | |
Honour | +3.227 |
emin | +2.764 |
acceptance | +2.572 |
Expression | +2.486 |
OPS | +2.474 |
Neg logit contributions | |
�� | -7.715 |
dos | -7.330 |
ゼ | -7.314 |
eeper | -7.170 |
olulu | -7.008 |
Token | 605 |
Token ID | 32417 |
Feature activation | +1.97e-02 |
Pos logit contributions | |
�� | +2.593 |
ゼ | +2.536 |
dos | +2.526 |
verting | +2.452 |
eeper | +2.433 |
Neg logit contributions | |
Honour | -2.835 |
emin | -2.696 |
acceptance | -2.589 |
MENT | -2.553 |
ODY | -2.540 |
Token | z |
Token ID | 89 |
Feature activation | -4.23e-02 |
Pos logit contributions | |
Honour | +0.124 |
emin | +0.117 |
MENT | +0.111 |
acceptance | +0.111 |
ODY | +0.110 |
Neg logit contributions | |
�� | -0.152 |
ゼ | -0.146 |
dos | -0.143 |
eeper | -0.142 |
verting | -0.141 |
Token | BLACK |
Token ID | 31963 |
Feature activation | +1.39e-02 |
Pos logit contributions | |
�� | +0.356 |
ゼ | +0.347 |
dos | +0.344 |
eeper | +0.337 |
verting | +0.336 |
Neg logit contributions | |
Honour | -0.234 |
emin | -0.216 |
MENT | -0.205 |
acceptance | -0.204 |
ODY | -0.203 |
Token | FO |
Token ID | 6080 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
Honour | +0.097 |
emin | +0.091 |
MENT | +0.087 |
acceptance | +0.087 |
ODY | +0.087 |
Neg logit contributions | |
�� | -0.097 |
ゼ | -0.094 |
dos | -0.093 |
eeper | -0.091 |
verting | -0.090 |
Token | OT |
Token ID | 2394 |
Feature activation | +2.11e-01 |
Pos logit contributions | |
�� | +2.242 |
ゼ | +2.200 |
dos | +2.163 |
eeper | +2.105 |
verting | +2.098 |
Neg logit contributions | |
Honour | -1.948 |
emin | -1.832 |
acceptance | -1.755 |
MENT | -1.726 |
ODY | -1.690 |
Token | T |
Token ID | 309 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
Honour | +1.274 |
emin | +1.180 |
MENT | +1.145 |
ODY | +1.131 |
acceptance | +1.128 |
Neg logit contributions | |
�� | -1.678 |
ゼ | -1.630 |
dos | -1.616 |
eeper | -1.582 |
verting | -1.574 |
Token | OC |
Token ID | 4503 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
OC | +1.504 |
OPS | +1.228 |
ODY | +1.011 |
ONY | +0.705 |
MENT | +0.667 |
Neg logit contributions | |
�� | -19.493 |
verting | -18.451 |
olulu | -18.303 |
eeper | -18.245 |
dos | -18.205 |
Token | RE |
Token ID | 4526 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
Honour | +0.689 |
emin | +0.631 |
MENT | +0.610 |
ODY | +0.605 |
acceptance | +0.603 |
Neg logit contributions | |
�� | -1.064 |
ゼ | -1.031 |
dos | -1.025 |
eeper | -1.004 |
verting | -0.997 |
Token | P |
Token ID | 47 |
Feature activation | +8.91e-02 |
Pos logit contributions | |
Honour | +1.545 |
MENT | +1.499 |
OPS | +1.428 |
emin | +1.397 |
ODY | +1.323 |
Neg logit contributions | |
�� | -4.883 |
eeper | -4.700 |
ゼ | -4.657 |
dos | -4.606 |
olulu | -4.591 |
Token | ORTS |
Token ID | 33002 |
Feature activation | -3.69e-01 |
Pos logit contributions | |
Honour | +0.563 |
emin | +0.527 |
MENT | +0.515 |
ODY | +0.512 |
OPS | +0.505 |
Neg logit contributions | |
�� | -0.683 |
ゼ | -0.661 |
dos | -0.648 |
eeper | -0.635 |
verting | -0.633 |
Token | 100 |
Token ID | 1802 |
Feature activation | -6.72e-01 |
Pos logit contributions | |
�� | +2.592 |
ゼ | +2.542 |
dos | +2.507 |
eeper | +2.435 |
verting | +2.434 |
Neg logit contributions | |
Honour | -2.488 |
emin | -2.353 |
acceptance | -2.239 |
MENT | -2.219 |
ODY | -2.203 |
Token | 3 |
Token ID | 18 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
Honour | +1.744 |
emin | +1.677 |
MENT | +1.576 |
ODY | +1.550 |
OPS | +1.530 |
Neg logit contributions | |
�� | -3.714 |
ゼ | -3.551 |
eeper | -3.488 |
dos | -3.453 |
verting | -3.395 |
Token | minutes |
Token ID | 2431 |
Feature activation | +8.16e-01 |
Pos logit contributions | |
�� | +0.805 |
ゼ | +0.766 |
dos | +0.754 |
verting | +0.723 |
eeper | +0.722 |
Neg logit contributions | |
Honour | -0.825 |
emin | -0.781 |
acceptance | -0.761 |
MENT | -0.747 |
ODY | -0.735 |
Token | until |
Token ID | 1566 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
Honour | +3.390 |
emin | +3.038 |
acceptance | +3.036 |
MENT | +2.776 |
ODY | +2.560 |
Neg logit contributions | |
�� | -8.049 |
ゼ | -7.682 |
dos | -7.596 |
� | -7.400 |
eeper | -7.143 |
Token | golden |
Token ID | 10861 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
Honour | +1.462 |
emin | +1.381 |
acceptance | +1.365 |
MENT | +1.306 |
OPS | +1.272 |
Neg logit contributions | |
�� | -1.470 |
ゼ | -1.406 |
dos | -1.393 |
eeper | -1.358 |
verting | -1.309 |
Token | brown |
Token ID | 7586 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
�� | +1.421 |
ゼ | +1.371 |
dos | +1.354 |
eeper | +1.312 |
verting | +1.304 |
Neg logit contributions | |
Honour | -1.601 |
emin | -1.518 |
acceptance | -1.463 |
MENT | -1.450 |
ODY | -1.439 |
Token | . |
Token ID | 13 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
�� | +1.704 |
ゼ | +1.657 |
dos | +1.638 |
eeper | +1.597 |
verting | +1.592 |
Neg logit contributions | |
Honour | -1.576 |
emin | -1.481 |
acceptance | -1.415 |
MENT | -1.414 |
ODY | -1.401 |
Token | These |
Token ID | 2312 |
Feature activation | +3.83e-01 |
Pos logit contributions | |
Honour | +3.587 |
emin | +2.973 |
Congratulations | +2.738 |
Expression | +2.467 |
ODY | +2.156 |
Neg logit contributions | |
eeper | -16.265 |
�� | -16.175 |
ゼ | -15.886 |
dos | -15.340 |
olulu | -15.274 |
Token | are |
Token ID | 389 |
Feature activation | +3.33e-01 |
Pos logit contributions | |
Honour | +1.760 |
emin | +1.625 |
acceptance | +1.548 |
MENT | +1.463 |
ODY | +1.463 |
Neg logit contributions | |
�� | -3.615 |
ゼ | -3.481 |
eeper | -3.408 |
dos | -3.390 |
verting | -3.357 |
Token | lightly |
Token ID | 15376 |
Feature activation | -4.30e-02 |
Pos logit contributions | |
Honour | +0.783 |
emin | +0.646 |
MENT | +0.581 |
acceptance | +0.566 |
ODY | +0.516 |
Neg logit contributions | |
�� | -3.879 |
ゼ | -3.790 |
dos | -3.781 |
verting | -3.695 |
eeper | -3.676 |
Token | fried |
Token ID | 23018 |
Feature activation | +4.84e-01 |
Pos logit contributions | |
�� | +0.345 |
ゼ | +0.335 |
dos | +0.332 |
eeper | +0.324 |
verting | +0.322 |
Neg logit contributions | |
Honour | -0.255 |
emin | -0.238 |
acceptance | -0.227 |
MENT | -0.225 |
ODY | -0.223 |
Token | and |
Token ID | 290 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
Honour | +2.653 |
emin | +2.459 |
acceptance | +2.377 |
MENT | +2.272 |
ODY | +2.189 |
Neg logit contributions | |
�� | -4.327 |
ゼ | -3.930 |
dos | -3.865 |
eeper | -3.809 |
verting | -3.775 |
Token |
|
Token ID | 198 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
�� | +1.599 |
ゼ | +1.560 |
dos | +1.554 |
eeper | +1.507 |
verting | +1.506 |
Neg logit contributions | |
Honour | -1.343 |
emin | -1.270 |
MENT | -1.211 |
ODY | -1.200 |
acceptance | -1.195 |
Token |
|
Token ID | 198 |
Feature activation | -9.73e-01 |
Pos logit contributions | |
�� | +1.633 |
ゼ | +1.601 |
dos | +1.588 |
eeper | +1.545 |
verting | +1.545 |
Neg logit contributions | |
Honour | -1.281 |
emin | -1.197 |
acceptance | -1.139 |
MENT | -1.136 |
ODY | -1.128 |
Token | 2003 |
Token ID | 16088 |
Feature activation | -3.42e-01 |
Pos logit contributions | |
dos | +6.206 |
�� | +6.193 |
ゼ | +6.127 |
verting | +6.020 |
................................................................ | +5.897 |
Neg logit contributions | |
Honour | -6.785 |
emin | -6.106 |
acceptance | -6.046 |
afety | -6.002 |
ODY | -5.852 |
Token | Matt |
Token ID | 4705 |
Feature activation | -3.56e-01 |
Pos logit contributions | |
�� | +2.580 |
ゼ | +2.535 |
dos | +2.497 |
verting | +2.441 |
eeper | +2.435 |
Neg logit contributions | |
Honour | -2.118 |
emin | -1.997 |
MENT | -1.902 |
acceptance | -1.900 |
ODY | -1.885 |
Token | Le |
Token ID | 1004 |
Feature activation | +4.82e-01 |
Pos logit contributions | |
�� | +2.275 |
ゼ | +2.226 |
dos | +2.209 |
verting | +2.145 |
eeper | +2.145 |
Neg logit contributions | |
Honour | -2.612 |
emin | -2.489 |
MENT | -2.407 |
ODY | -2.394 |
acceptance | -2.392 |
Token | Bl |
Token ID | 3629 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
Honour | +2.080 |
emin | +1.829 |
acceptance | +1.687 |
MENT | +1.657 |
OPS | +1.618 |
Neg logit contributions | |
�� | -4.693 |
dos | -4.522 |
ゼ | -4.443 |
eeper | -4.409 |
verting | -4.300 |
Token | anc |
Token ID | 1192 |
Feature activation | -1.76e-01 |
Pos logit contributions | |
emin | +7.022 |
Honour | +6.944 |
abre | +6.458 |
acceptance | +5.974 |
afety | +5.790 |
Neg logit contributions | |
�� | -13.212 |
ゼ | -11.955 |
� | -11.742 |
ゴン | -11.502 |
�� | -11.422 |
Token |
|
Token ID | 198 |
Feature activation | -3.56e-01 |
Pos logit contributions | |
�� | +1.330 |
ゼ | +1.299 |
dos | +1.293 |
verting | +1.255 |
eeper | +1.253 |
Neg logit contributions | |
Honour | -1.099 |
emin | -1.035 |
MENT | -0.984 |
ODY | -0.975 |
acceptance | -0.974 |
Token |
|
Token ID | 198 |
Feature activation | -8.87e-01 |
Pos logit contributions | |
�� | +2.598 |
ゼ | +2.591 |
dos | +2.586 |
verting | +2.504 |
eeper | +2.487 |
Neg logit contributions | |
Honour | -2.239 |
emin | -2.105 |
acceptance | -2.015 |
MENT | -2.000 |
ODY | -1.999 |
Token | 2003 |
Token ID | 16088 |
Feature activation | -2.52e-01 |
Pos logit contributions | |
dos | +5.824 |
ゼ | +5.787 |
�� | +5.730 |
verting | +5.604 |
................................................................ | +5.570 |
Neg logit contributions | |
Honour | -6.079 |
emin | -5.535 |
acceptance | -5.498 |
afety | -5.419 |
ODY | -5.253 |
Token | Bernie |
Token ID | 10477 |
Feature activation | +4.29e-01 |
Pos logit contributions | |
�� | +1.919 |
ゼ | +1.878 |
dos | +1.855 |
eeper | +1.809 |
verting | +1.809 |
Neg logit contributions | |
Honour | -1.572 |
emin | -1.477 |
MENT | -1.405 |
acceptance | -1.404 |
ODY | -1.392 |
Token | . |
Token ID | 13 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
�� | +0.381 |
ゼ | +0.370 |
dos | +0.363 |
eeper | +0.357 |
verting | +0.356 |
Neg logit contributions | |
Honour | -0.328 |
emin | -0.309 |
MENT | -0.296 |
acceptance | -0.293 |
ODY | -0.293 |
Token | Solid |
Token ID | 46933 |
Feature activation | +7.55e-01 |
Pos logit contributions | |
�� | +0.821 |
ゼ | +0.797 |
dos | +0.787 |
eeper | +0.772 |
verting | +0.768 |
Neg logit contributions | |
Honour | -0.723 |
emin | -0.680 |
MENT | -0.650 |
acceptance | -0.646 |
ODY | -0.644 |
Token | Br |
Token ID | 9414 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
Honour | +3.646 |
emin | +3.390 |
MENT | +3.207 |
ODY | +3.136 |
acceptance | +3.091 |
Neg logit contributions | |
�� | -6.594 |
ゼ | -6.394 |
dos | -6.254 |
verting | -6.252 |
eeper | -6.147 |
Token | ush |
Token ID | 1530 |
Feature activation | +4.70e-01 |
Pos logit contributions | |
Honour | +1.869 |
emin | +1.789 |
acceptance | +1.653 |
MENT | +1.639 |
ODY | +1.624 |
Neg logit contributions | |
�� | -2.193 |
ゼ | -2.093 |
dos | -2.001 |
verting | -1.983 |
eeper | -1.932 |
Token | ( |
Token ID | 357 |
Feature activation | +8.78e-01 |
Pos logit contributions | |
Honour | +3.391 |
emin | +3.222 |
MENT | +3.138 |
ODY | +3.123 |
acceptance | +3.081 |
Neg logit contributions | |
�� | -3.105 |
ゼ | -2.979 |
dos | -2.928 |
verting | -2.867 |
eeper | -2.833 |
Token | [ |
Token ID | 685 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
Honour | +5.460 |
emin | +5.224 |
ODY | +5.042 |
MENT | +5.035 |
acceptance | +4.953 |
Neg logit contributions | |
�� | -6.312 |
ゼ | -6.081 |
eeper | -5.888 |
dos | -5.773 |
verting | -5.734 |
Token | System |
Token ID | 11964 |
Feature activation | +1.86e-01 |
Pos logit contributions | |
Honour | +6.200 |
emin | +5.980 |
MENT | +5.848 |
ODY | +5.796 |
OPS | +5.640 |
Neg logit contributions | |
�� | -12.050 |
ゼ | -11.657 |
eeper | -11.605 |
olulu | -11.287 |
................................................................ | -11.145 |
Token | . |
Token ID | 13 |
Feature activation | +3.88e-01 |
Pos logit contributions | |
Honour | +1.113 |
emin | +1.041 |
MENT | +0.992 |
ODY | +0.963 |
acceptance | +0.961 |
Neg logit contributions | |
�� | -1.559 |
ゼ | -1.453 |
eeper | -1.425 |
dos | -1.422 |
verting | -1.396 |
Token | Draw |
Token ID | 25302 |
Feature activation | -5.16e-01 |
Pos logit contributions | |
Honour | +2.667 |
emin | +2.525 |
MENT | +2.437 |
ODY | +2.432 |
acceptance | +2.396 |
Neg logit contributions | |
�� | -2.710 |
ゼ | -2.595 |
eeper | -2.544 |
dos | -2.539 |
verting | -2.483 |
Token | ing |
Token ID | 278 |
Feature activation | -1.56e-01 |
Pos logit contributions | |
�� | +2.727 |
dos | +2.711 |
ゼ | +2.686 |
verting | +2.621 |
eeper | +2.604 |
Neg logit contributions | |
Honour | -4.311 |
emin | -4.053 |
acceptance | -3.963 |
ODY | -3.928 |
MENT | -3.911 |
Token | . |
Token ID | 13 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
�� | +1.167 |
ゼ | +1.122 |
dos | +1.109 |
eeper | +1.090 |
verting | +1.081 |
Neg logit contributions | |
Honour | -1.025 |
emin | -0.962 |
MENT | -0.920 |
acceptance | -0.915 |
ODY | -0.909 |
Token | ( |
Token ID | 7 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
Honour | +3.128 |
emin | +2.956 |
MENT | +2.890 |
ODY | +2.841 |
Ont | +2.777 |
Neg logit contributions | |
�� | -3.376 |
ゼ | -3.015 |
dos | -2.927 |
eeper | -2.920 |
verting | -2.897 |
Token | cv |
Token ID | 33967 |
Feature activation | +6.51e-01 |
Pos logit contributions | |
Honour | +3.548 |
emin | +3.522 |
MENT | +3.414 |
acceptance | +3.327 |
ODY | +3.304 |
Neg logit contributions | |
�� | -2.160 |
ゼ | -1.937 |
eeper | -1.830 |
� | -1.774 |
dos | -1.741 |
Token | 2 |
Token ID | 17 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
Honour | +3.374 |
emin | +3.301 |
MENT | +3.214 |
Ont | +3.016 |
ODY | +2.993 |
Neg logit contributions | |
�� | -5.947 |
ゼ | -5.236 |
eeper | -5.220 |
olulu | -5.074 |
dos | -5.012 |
Token | . |
Token ID | 13 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
Honour | +1.445 |
emin | +1.349 |
MENT | +1.298 |
ODY | +1.252 |
acceptance | +1.249 |
Neg logit contributions | |
�� | -2.121 |
ゼ | -1.940 |
eeper | -1.909 |
dos | -1.909 |
verting | -1.878 |
Token | M |
Token ID | 44 |
Feature activation | +8.86e-01 |
Pos logit contributions | |
Honour | +2.190 |
MENT | +2.134 |
emin | +2.098 |
ODY | +1.999 |
OPS | +1.959 |
Neg logit contributions | |
�� | -5.202 |
eeper | -4.841 |
dos | -4.812 |
verting | -4.803 |
ゼ | -4.778 |
Token | OR |
Token ID | 1581 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
Honour | +1.536 |
MENT | +1.536 |
ODY | +1.463 |
OPS | +1.293 |
emin | +1.270 |
Neg logit contributions | |
�� | -10.817 |
verting | -10.136 |
ゼ | -10.097 |
eeper | -10.058 |
dos | -9.951 |
Token | PH |
Token ID | 11909 |
Feature activation | +7.36e-01 |
Pos logit contributions | |
MENT | +2.374 |
ODY | +1.495 |
OPS | +1.448 |
Honour | +1.365 |
emin | +1.232 |
Neg logit contributions | |
�� | -17.857 |
olulu | -17.119 |
verting | -16.828 |
eeper | -16.753 |
dos | -16.733 |
Token | _ |
Token ID | 62 |
Feature activation | +7.60e-01 |
Pos logit contributions | |
Honour | +2.913 |
MENT | +2.777 |
emin | +2.664 |
ODY | +2.601 |
OPS | +2.583 |
Neg logit contributions | |
�� | -7.576 |
ゼ | -6.860 |
olulu | -6.806 |
eeper | -6.782 |
verting | -6.751 |
Token | RECT |
Token ID | 23988 |
Feature activation | +2.22e-02 |
Pos logit contributions | |
MENT | +4.361 |
OPS | +4.278 |
Honour | +4.245 |
ODY | +4.210 |
emin | +4.140 |
Neg logit contributions | |
�� | -6.374 |
eeper | -5.725 |
olulu | -5.706 |
ゼ | -5.678 |
dos | -5.655 |
Token | , |
Token ID | 11 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
Honour | +0.131 |
emin | +0.122 |
MENT | +0.118 |
ODY | +0.115 |
acceptance | +0.115 |
Neg logit contributions | |
�� | -0.182 |
ゼ | -0.174 |
dos | -0.171 |
eeper | -0.169 |
verting | -0.168 |
Token | ( |
Token ID | 357 |
Feature activation | +5.42e-01 |
Pos logit contributions | |
�� | +0.142 |
ゼ | +0.135 |
dos | +0.133 |
eeper | +0.131 |
verting | +0.130 |
Neg logit contributions | |
Honour | -0.118 |
emin | -0.110 |
MENT | -0.105 |
acceptance | -0.105 |
ODY | -0.103 |
Token | on |
Token ID | 319 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
�� | +0.409 |
ゼ | +0.398 |
dos | +0.394 |
eeper | +0.385 |
verting | +0.384 |
Neg logit contributions | |
Honour | -0.298 |
emin | -0.277 |
acceptance | -0.264 |
MENT | -0.263 |
ODY | -0.260 |
Token | Twitter |
Token ID | 3009 |
Feature activation | +5.07e-02 |
Pos logit contributions | |
�� | +1.386 |
ゼ | +1.359 |
dos | +1.342 |
eeper | +1.310 |
verting | +1.307 |
Neg logit contributions | |
Honour | -1.086 |
emin | -1.017 |
MENT | -0.966 |
acceptance | -0.965 |
ODY | -0.960 |
Token | . |
Token ID | 13 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
Honour | +0.332 |
emin | +0.312 |
acceptance | +0.298 |
MENT | +0.296 |
ODY | +0.295 |
Neg logit contributions | |
�� | -0.375 |
ゼ | -0.364 |
dos | -0.359 |
eeper | -0.351 |
verting | -0.350 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
�� | +4.173 |
ゼ | +4.162 |
dos | +4.099 |
verting | +3.993 |
eeper | +3.913 |
Neg logit contributions | |
Honour | -3.402 |
emin | -3.227 |
acceptance | -3.183 |
ODY | -3.068 |
MENT | -3.065 |
Token | Media |
Token ID | 13152 |
Feature activation | -2.51e-01 |
Pos logit contributions | |
�� | +1.765 |
ゼ | +1.720 |
dos | +1.701 |
eeper | +1.665 |
verting | +1.659 |
Neg logit contributions | |
Honour | -1.337 |
emin | -1.250 |
MENT | -1.187 |
acceptance | -1.184 |
ODY | -1.175 |
Token | playback |
Token ID | 16388 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
�� | +1.736 |
ゼ | +1.692 |
dos | +1.686 |
eeper | +1.638 |
verting | +1.628 |
Neg logit contributions | |
Honour | -1.713 |
emin | -1.627 |
ODY | -1.549 |
acceptance | -1.543 |
MENT | -1.540 |
Token | is |
Token ID | 318 |
Feature activation | -6.18e-01 |
Pos logit contributions | |
ゼ | +7.622 |
dos | +7.494 |
verting | +7.338 |
�� | +7.241 |
eeper | +6.860 |
Neg logit contributions | |
Honour | -13.596 |
� | -13.516 |
OPS | -13.424 |
emin | -13.375 |
MENT | -13.190 |
Token | unsupported |
Token ID | 24222 |
Feature activation | -6.69e-01 |
Pos logit contributions | |
�� | +3.681 |
ゼ | +3.549 |
dos | +3.474 |
verting | +3.394 |
eeper | +3.363 |
Neg logit contributions | |
Honour | -4.808 |
emin | -4.572 |
MENT | -4.431 |
ODY | -4.419 |
acceptance | -4.387 |
Token | on |
Token ID | 319 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
ゼ | +4.677 |
dos | +4.630 |
�� | +4.612 |
verting | +4.498 |
eeper | +4.414 |
Neg logit contributions | |
Honour | -4.264 |
emin | -4.114 |
ODY | -3.908 |
MENT | -3.906 |
acceptance | -3.892 |
Token | your |
Token ID | 534 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
�� | +0.886 |
ゼ | +0.857 |
dos | +0.847 |
eeper | +0.829 |
verting | +0.821 |
Neg logit contributions | |
Honour | -0.602 |
emin | -0.560 |
MENT | -0.533 |
acceptance | -0.532 |
ODY | -0.522 |
Token | device |
Token ID | 3335 |
Feature activation | -2.55e-01 |
Pos logit contributions | |
�� | +1.433 |
ゼ | +1.368 |
dos | +1.336 |
eeper | +1.291 |
verting | +1.264 |
Neg logit contributions | |
Honour | -2.582 |
emin | -2.451 |
acceptance | -2.397 |
MENT | -2.380 |
ODY | -2.355 |
Token | Hide |
Token ID | 10415 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
�� | +1.829 |
ゼ | +1.783 |
dos | +1.762 |
eeper | +1.714 |
verting | +1.711 |
Neg logit contributions | |
Honour | -1.729 |
emin | -1.629 |
acceptance | -1.560 |
MENT | -1.558 |
ODY | -1.546 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
Honour | +0.086 |
emin | +0.081 |
MENT | +0.078 |
acceptance | +0.077 |
ODY | +0.077 |
Neg logit contributions | |
�� | -0.068 |
ゼ | -0.065 |
dos | -0.063 |
eeper | -0.062 |
verting | -0.061 |
Token | 6 |
Token ID | 718 |
Feature activation | -6.10e-01 |
Pos logit contributions | |
................................................................ | +6.809 |
dos | +6.547 |
verting | +6.403 |
ゼ | +6.152 |
kj | +6.058 |
Neg logit contributions | |
Honour | -10.957 |
emin | -10.832 |
ONY | -10.579 |
ODY | -10.472 |
acceptance | -10.472 |
Token | of |
Token ID | 286 |
Feature activation | -7.33e-01 |
Pos logit contributions | |
ゼ | +3.985 |
dos | +3.972 |
�� | +3.883 |
verting | +3.806 |
eeper | +3.790 |
Neg logit contributions | |
Honour | -4.227 |
emin | -3.984 |
acceptance | -3.845 |
ODY | -3.803 |
MENT | -3.800 |
Token | 15 |
Token ID | 1315 |
Feature activation | -3.51e-01 |
Pos logit contributions | |
dos | +4.221 |
ゼ | +4.207 |
�� | +4.177 |
................................................................ | +4.114 |
eeper | +4.061 |
Neg logit contributions | |
Honour | -5.313 |
emin | -5.224 |
acceptance | -5.058 |
afety | -5.007 |
ODY | -4.990 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.77e+00 |
Pos logit contributions | |
�� | +1.586 |
ゼ | +1.554 |
dos | +1.537 |
eeper | +1.458 |
verting | +1.455 |
Neg logit contributions | |
Honour | -3.218 |
emin | -3.086 |
acceptance | -3.008 |
MENT | -2.991 |
ODY | -2.980 |
Token | : |
Token ID | 25 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
................................................................ | +5.241 |
dos | +4.618 |
kj | +4.312 |
(): | +4.273 |
ゼ | +4.268 |
Neg logit contributions | |
mathemat | -16.518 |
Honour | -16.297 |
carbohyd | -16.176 |
ODY | -15.928 |
afety | -15.809 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
ゼ | +6.604 |
................................................................ | +6.466 |
�� | +6.417 |
dos | +6.365 |
verting | +6.304 |
Neg logit contributions | |
Honour | -6.573 |
emin | -6.360 |
acceptance | -6.337 |
MENT | -6.274 |
ODY | -6.273 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
�� | +1.584 |
ゼ | +1.543 |
dos | +1.529 |
eeper | +1.504 |
verting | +1.494 |
Neg logit contributions | |
Honour | -0.770 |
emin | -0.703 |
acceptance | -0.653 |
MENT | -0.649 |
ODY | -0.635 |
Token | 's |
Token ID | 338 |
Feature activation | +3.54e-01 |
Pos logit contributions | |
ゼ | +3.054 |
�� | +3.047 |
dos | +3.046 |
verting | +2.957 |
eeper | +2.921 |
Neg logit contributions | |
Honour | -4.473 |
emin | -4.272 |
ODY | -4.134 |
MENT | -4.117 |
acceptance | -4.095 |
Token | political |
Token ID | 1964 |
Feature activation | +3.14e-01 |
Pos logit contributions | |
Honour | +2.214 |
acceptance | +2.015 |
emin | +2.015 |
MENT | +1.905 |
abre | +1.825 |
Neg logit contributions | |
�� | -2.848 |
dos | -2.711 |
ゼ | -2.700 |
eeper | -2.617 |
� | -2.516 |
Token | Hide |
Token ID | 10415 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
�� | +0.490 |
ゼ | +0.475 |
dos | +0.469 |
eeper | +0.460 |
verting | +0.457 |
Neg logit contributions | |
Honour | -0.434 |
emin | -0.407 |
MENT | -0.387 |
acceptance | -0.386 |
ODY | -0.382 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
�� | +0.780 |
ゼ | +0.747 |
dos | +0.730 |
eeper | +0.711 |
verting | +0.705 |
Neg logit contributions | |
Honour | -1.087 |
emin | -1.028 |
MENT | -0.994 |
acceptance | -0.988 |
ODY | -0.980 |
Token | 7 |
Token ID | 767 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
................................................................ | +6.588 |
ゼ | +6.335 |
dos | +6.240 |
�� | +5.991 |
kj | +5.899 |
Neg logit contributions | |
emin | -11.522 |
Honour | -11.279 |
afety | -11.219 |
ONY | -11.193 |
abre | -11.140 |
Token | of |
Token ID | 286 |
Feature activation | -7.10e-01 |
Pos logit contributions | |
�� | +1.943 |
ゼ | +1.910 |
dos | +1.893 |
eeper | +1.841 |
verting | +1.838 |
Neg logit contributions | |
Honour | -1.682 |
emin | -1.577 |
acceptance | -1.505 |
MENT | -1.502 |
ODY | -1.489 |
Token | 15 |
Token ID | 1315 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
ゼ | +4.134 |
dos | +4.128 |
�� | +4.084 |
................................................................ | +4.020 |
eeper | +3.963 |
Neg logit contributions | |
Honour | -5.111 |
emin | -5.013 |
acceptance | -4.855 |
afety | -4.819 |
ODY | -4.809 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
�� | +1.385 |
ゼ | +1.349 |
dos | +1.331 |
eeper | +1.268 |
verting | +1.266 |
Neg logit contributions | |
Honour | -2.703 |
emin | -2.590 |
acceptance | -2.517 |
MENT | -2.507 |
ODY | -2.496 |
Token | : |
Token ID | 25 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
................................................................ | +5.221 |
dos | +4.677 |
ゼ | +4.357 |
kj | +4.343 |
verting | +4.302 |
Neg logit contributions | |
mathemat | -15.813 |
Honour | -15.770 |
carbohyd | -15.459 |
ODY | -15.377 |
emin | -15.273 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
ゼ | +6.584 |
................................................................ | +6.489 |
�� | +6.419 |
dos | +6.369 |
verting | +6.321 |
Neg logit contributions | |
Honour | -6.629 |
emin | -6.428 |
acceptance | -6.388 |
ODY | -6.346 |
MENT | -6.335 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -5.80e-01 |
Pos logit contributions | |
�� | +1.439 |
ゼ | +1.401 |
dos | +1.389 |
eeper | +1.366 |
verting | +1.356 |
Neg logit contributions | |
Honour | -0.697 |
emin | -0.636 |
acceptance | -0.590 |
MENT | -0.587 |
ODY | -0.574 |
Token | 's |
Token ID | 338 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
ゼ | +3.137 |
dos | +3.133 |
�� | +3.126 |
verting | +3.046 |
eeper | +3.002 |
Neg logit contributions | |
Honour | -4.647 |
emin | -4.445 |
ODY | -4.301 |
MENT | -4.281 |
acceptance | -4.258 |
Token | political |
Token ID | 1964 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
Honour | +1.844 |
emin | +1.687 |
acceptance | +1.680 |
MENT | +1.598 |
ODY | +1.533 |
Neg logit contributions | |
�� | -2.271 |
dos | -2.162 |
ゼ | -2.158 |
eeper | -2.092 |
verting | -2.010 |
Token | energy |
Token ID | 2568 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
Honour | +0.954 |
emin | +0.876 |
acceptance | +0.852 |
MENT | +0.830 |
ODY | +0.813 |
Neg logit contributions | |
�� | -1.383 |
ゼ | -1.340 |
dos | -1.331 |
eeper | -1.295 |
verting | -1.291 |
Token | goals |
Token ID | 4661 |
Feature activation | +2.23e-01 |
Pos logit contributions | |
Honour | +0.861 |
emin | +0.803 |
acceptance | +0.778 |
MENT | +0.765 |
ODY | +0.748 |
Neg logit contributions | |
�� | -1.042 |
ゼ | -1.004 |
dos | -1.000 |
eeper | -0.977 |
verting | -0.967 |
Token | . |
Token ID | 13 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
Honour | +1.419 |
emin | +1.336 |
acceptance | +1.278 |
MENT | +1.265 |
ODY | +1.247 |
Neg logit contributions | |
�� | -1.688 |
ゼ | -1.629 |
dos | -1.624 |
verting | -1.579 |
eeper | -1.570 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
�� | +1.161 |
ゼ | +1.137 |
dos | +1.121 |
verting | +1.095 |
eeper | +1.095 |
Neg logit contributions | |
Honour | -0.947 |
emin | -0.891 |
acceptance | -0.850 |
MENT | -0.847 |
ODY | -0.839 |
Token | Media |
Token ID | 13152 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
�� | +1.416 |
ゼ | +1.377 |
dos | +1.361 |
eeper | +1.336 |
verting | +1.329 |
Neg logit contributions | |
Honour | -1.075 |
emin | -1.007 |
MENT | -0.958 |
acceptance | -0.952 |
ODY | -0.947 |
Token | playback |
Token ID | 16388 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
�� | +1.468 |
ゼ | +1.429 |
dos | +1.421 |
eeper | +1.384 |
verting | +1.376 |
Neg logit contributions | |
Honour | -1.425 |
emin | -1.351 |
ODY | -1.286 |
acceptance | -1.283 |
MENT | -1.282 |
Token | is |
Token ID | 318 |
Feature activation | -5.72e-01 |
Pos logit contributions | |
ゼ | +7.350 |
dos | +7.182 |
verting | +7.021 |
�� | +6.970 |
eeper | +6.672 |
Neg logit contributions | |
Honour | -12.953 |
� | -12.790 |
OPS | -12.722 |
emin | -12.675 |
MENT | -12.443 |
Token | unsupported |
Token ID | 24222 |
Feature activation | -6.26e-01 |
Pos logit contributions | |
�� | +3.429 |
ゼ | +3.310 |
dos | +3.241 |
verting | +3.164 |
eeper | +3.136 |
Neg logit contributions | |
Honour | -4.434 |
emin | -4.219 |
MENT | -4.085 |
ODY | -4.080 |
acceptance | -4.044 |
Token | on |
Token ID | 319 |
Feature activation | -8.35e-02 |
Pos logit contributions | |
ゼ | +4.436 |
dos | +4.391 |
�� | +4.390 |
verting | +4.264 |
eeper | +4.200 |
Neg logit contributions | |
Honour | -3.959 |
emin | -3.808 |
ODY | -3.622 |
MENT | -3.615 |
acceptance | -3.601 |
Token | your |
Token ID | 534 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
�� | +0.706 |
ゼ | +0.680 |
dos | +0.672 |
eeper | +0.658 |
verting | +0.650 |
Neg logit contributions | |
Honour | -0.469 |
emin | -0.435 |
MENT | -0.415 |
acceptance | -0.414 |
ODY | -0.405 |
Token | device |
Token ID | 3335 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
�� | +1.348 |
ゼ | +1.284 |
dos | +1.254 |
eeper | +1.213 |
verting | +1.185 |
Neg logit contributions | |
Honour | -2.411 |
emin | -2.286 |
acceptance | -2.238 |
MENT | -2.220 |
ODY | -2.195 |
Token | Hide |
Token ID | 10415 |
Feature activation | -4.81e-02 |
Pos logit contributions | |
�� | +2.129 |
ゼ | +2.080 |
dos | +2.055 |
eeper | +1.998 |
verting | +1.994 |
Neg logit contributions | |
Honour | -2.041 |
emin | -1.925 |
acceptance | -1.844 |
MENT | -1.842 |
ODY | -1.829 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
�� | +0.299 |
ゼ | +0.284 |
dos | +0.277 |
eeper | +0.268 |
verting | +0.267 |
Neg logit contributions | |
Honour | -0.386 |
emin | -0.362 |
MENT | -0.351 |
acceptance | -0.347 |
ODY | -0.346 |
Token | 5 |
Token ID | 642 |
Feature activation | -6.40e-01 |
Pos logit contributions | |
dos | +5.986 |
ゼ | +5.881 |
................................................................ | +5.851 |
�� | +5.795 |
verting | +5.608 |
Neg logit contributions | |
emin | -7.678 |
Honour | -7.533 |
abre | -7.456 |
afety | -7.420 |
acceptance | -7.327 |
Token | of |
Token ID | 286 |
Feature activation | -5.46e-01 |
Pos logit contributions | |
ゼ | +4.133 |
dos | +4.115 |
�� | +3.996 |
................................................................ | +3.934 |
verting | +3.932 |
Neg logit contributions | |
Honour | -4.487 |
emin | -4.199 |
acceptance | -4.060 |
MENT | -4.008 |
afety | -4.002 |
Token | 15 |
Token ID | 1315 |
Feature activation | -3.31e-01 |
Pos logit contributions | |
�� | +3.373 |
ゼ | +3.337 |
dos | +3.327 |
eeper | +3.234 |
verting | +3.217 |
Neg logit contributions | |
Honour | -3.904 |
emin | -3.769 |
acceptance | -3.644 |
MENT | -3.605 |
ODY | -3.599 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
�� | +1.520 |
ゼ | +1.479 |
dos | +1.460 |
eeper | +1.390 |
verting | +1.387 |
Neg logit contributions | |
Honour | -3.033 |
emin | -2.907 |
acceptance | -2.831 |
MENT | -2.817 |
ODY | -2.804 |
Token | : |
Token ID | 25 |
Feature activation | -9.73e-01 |
Pos logit contributions | |
................................................................ | +5.396 |
dos | +4.704 |
verting | +4.427 |
ゼ | +4.355 |
kj | +4.342 |
Neg logit contributions | |
Honour | -15.720 |
mathemat | -15.547 |
carbohyd | -15.166 |
acceptance | -15.149 |
ODY | -15.145 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
ゼ | +6.379 |
................................................................ | +6.279 |
�� | +6.220 |
dos | +6.215 |
verting | +6.095 |
Neg logit contributions | |
Honour | -6.097 |
emin | -5.865 |
acceptance | -5.817 |
MENT | -5.747 |
ODY | -5.747 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -5.37e-01 |
Pos logit contributions | |
�� | +1.493 |
ゼ | +1.451 |
dos | +1.436 |
eeper | +1.415 |
verting | +1.404 |
Neg logit contributions | |
Honour | -0.709 |
emin | -0.648 |
acceptance | -0.604 |
MENT | -0.595 |
ODY | -0.581 |
Token | 's |
Token ID | 338 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
�� | +2.987 |
ゼ | +2.977 |
dos | +2.970 |
verting | +2.883 |
eeper | +2.857 |
Neg logit contributions | |
Honour | -4.278 |
emin | -4.061 |
ODY | -3.942 |
MENT | -3.928 |
acceptance | -3.876 |
Token | political |
Token ID | 1964 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
Honour | +1.402 |
emin | +1.301 |
acceptance | +1.290 |
MENT | +1.223 |
ODY | +1.186 |
Neg logit contributions | |
�� | -1.694 |
ゼ | -1.615 |
dos | -1.610 |
eeper | -1.560 |
verting | -1.517 |
Token | Hide |
Token ID | 10415 |
Feature activation | +4.76e-02 |
Pos logit contributions | |
�� | +1.365 |
ゼ | +1.329 |
dos | +1.315 |
eeper | +1.282 |
verting | +1.278 |
Neg logit contributions | |
Honour | -1.218 |
emin | -1.144 |
acceptance | -1.092 |
MENT | -1.091 |
ODY | -1.081 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
Honour | +0.378 |
emin | +0.352 |
MENT | +0.342 |
acceptance | +0.337 |
ODY | +0.335 |
Neg logit contributions | |
�� | -0.304 |
ゼ | -0.286 |
dos | -0.280 |
eeper | -0.273 |
verting | -0.270 |
Token | 11 |
Token ID | 1367 |
Feature activation | -4.77e-01 |
Pos logit contributions | |
dos | +6.332 |
................................................................ | +6.301 |
ゼ | +6.269 |
�� | +6.156 |
verting | +6.062 |
Neg logit contributions | |
Honour | -6.623 |
emin | -6.472 |
ODY | -6.212 |
MENT | -6.201 |
afety | -6.184 |
Token | of |
Token ID | 286 |
Feature activation | -8.07e-01 |
Pos logit contributions | |
ゼ | +3.241 |
dos | +3.219 |
�� | +3.206 |
verting | +3.111 |
eeper | +3.094 |
Neg logit contributions | |
Honour | -3.213 |
emin | -3.032 |
acceptance | -2.906 |
MENT | -2.890 |
ODY | -2.887 |
Token | 15 |
Token ID | 1315 |
Feature activation | -4.38e-01 |
Pos logit contributions | |
dos | +4.554 |
ゼ | +4.521 |
................................................................ | +4.470 |
�� | +4.424 |
verting | +4.346 |
Neg logit contributions | |
Honour | -5.867 |
emin | -5.770 |
afety | -5.599 |
acceptance | -5.597 |
ODY | -5.543 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
�� | +1.860 |
ゼ | +1.858 |
dos | +1.843 |
verting | +1.732 |
eeper | +1.725 |
Neg logit contributions | |
Honour | -4.062 |
emin | -3.907 |
acceptance | -3.824 |
MENT | -3.786 |
ODY | -3.782 |
Token | : |
Token ID | 25 |
Feature activation | -9.18e-01 |
Pos logit contributions | |
................................................................ | +5.054 |
dos | +4.678 |
kj | +4.325 |
ゼ | +4.312 |
verting | +4.290 |
Neg logit contributions | |
Honour | -15.053 |
mathemat | -14.906 |
ODY | -14.674 |
emin | -14.651 |
carbohyd | -14.593 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
ゼ | +6.013 |
�� | +5.914 |
................................................................ | +5.889 |
dos | +5.852 |
verting | +5.788 |
Neg logit contributions | |
Honour | -5.737 |
emin | -5.553 |
acceptance | -5.469 |
ODY | -5.442 |
MENT | -5.442 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -6.69e-01 |
Pos logit contributions | |
�� | +1.355 |
ゼ | +1.319 |
dos | +1.307 |
eeper | +1.286 |
verting | +1.276 |
Neg logit contributions | |
Honour | -0.652 |
emin | -0.594 |
acceptance | -0.551 |
MENT | -0.548 |
ODY | -0.534 |
Token | 's |
Token ID | 338 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
dos | +3.530 |
ゼ | +3.505 |
�� | +3.455 |
verting | +3.426 |
eeper | +3.353 |
Neg logit contributions | |
Honour | -5.414 |
emin | -5.191 |
ODY | -5.035 |
MENT | -5.004 |
acceptance | -4.966 |
Token | political |
Token ID | 1964 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
Honour | +2.177 |
acceptance | +1.993 |
emin | +1.979 |
MENT | +1.870 |
abre | +1.793 |
Neg logit contributions | |
�� | -2.793 |
ゼ | -2.646 |
dos | -2.645 |
eeper | -2.565 |
� | -2.460 |
Token | Hide |
Token ID | 10415 |
Feature activation | -3.56e-02 |
Pos logit contributions | |
�� | +1.721 |
ゼ | +1.683 |
dos | +1.663 |
eeper | +1.614 |
verting | +1.614 |
Neg logit contributions | |
Honour | -1.658 |
emin | -1.564 |
acceptance | -1.499 |
MENT | -1.497 |
ODY | -1.488 |
Token | Caption |
Token ID | 11260 |
Feature activation | -8.03e-01 |
Pos logit contributions | |
�� | +0.221 |
ゼ | +0.208 |
dos | +0.204 |
eeper | +0.199 |
verting | +0.197 |
Neg logit contributions | |
Honour | -0.287 |
emin | -0.269 |
MENT | -0.261 |
acceptance | -0.257 |
ODY | -0.255 |
Token | 12 |
Token ID | 1105 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
dos | +4.735 |
ゼ | +4.732 |
................................................................ | +4.647 |
�� | +4.627 |
verting | +4.589 |
Neg logit contributions | |
Honour | -5.675 |
emin | -5.518 |
ODY | -5.389 |
afety | -5.346 |
acceptance | -5.330 |
Token | of |
Token ID | 286 |
Feature activation | -8.42e-01 |
Pos logit contributions | |
ゼ | +2.967 |
�� | +2.946 |
dos | +2.944 |
verting | +2.846 |
eeper | +2.833 |
Neg logit contributions | |
Honour | -2.873 |
emin | -2.711 |
acceptance | -2.596 |
ODY | -2.584 |
MENT | -2.583 |
Token | 15 |
Token ID | 1315 |
Feature activation | -3.88e-01 |
Pos logit contributions | |
dos | +4.713 |
ゼ | +4.662 |
................................................................ | +4.616 |
�� | +4.573 |
verting | +4.488 |
Neg logit contributions | |
Honour | -6.142 |
emin | -6.052 |
afety | -5.863 |
acceptance | -5.851 |
ODY | -5.792 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
�� | +1.701 |
ゼ | +1.684 |
dos | +1.671 |
verting | +1.574 |
eeper | +1.569 |
Neg logit contributions | |
Honour | -3.580 |
emin | -3.438 |
acceptance | -3.358 |
MENT | -3.331 |
ODY | -3.325 |
Token | : |
Token ID | 25 |
Feature activation | -8.86e-01 |
Pos logit contributions | |
................................................................ | +5.052 |
dos | +4.662 |
ゼ | +4.322 |
kj | +4.322 |
verting | +4.281 |
Neg logit contributions | |
Honour | -14.983 |
mathemat | -14.852 |
ODY | -14.593 |
emin | -14.584 |
carbohyd | -14.541 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
ゼ | +5.874 |
�� | +5.791 |
................................................................ | +5.737 |
dos | +5.719 |
verting | +5.655 |
Neg logit contributions | |
Honour | -5.515 |
emin | -5.331 |
acceptance | -5.243 |
MENT | -5.215 |
ODY | -5.211 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -7.92e-01 |
Pos logit contributions | |
�� | +1.339 |
ゼ | +1.304 |
dos | +1.291 |
eeper | +1.271 |
verting | +1.262 |
Neg logit contributions | |
Honour | -0.645 |
emin | -0.587 |
acceptance | -0.544 |
MENT | -0.542 |
ODY | -0.528 |
Token | 's |
Token ID | 338 |
Feature activation | +3.38e-01 |
Pos logit contributions | |
dos | +3.967 |
ゼ | +3.911 |
verting | +3.859 |
�� | +3.796 |
eeper | +3.735 |
Neg logit contributions | |
Honour | -6.514 |
emin | -6.267 |
ODY | -6.111 |
MENT | -6.052 |
afety | -6.015 |
Token | political |
Token ID | 1964 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
Honour | +2.129 |
acceptance | +1.951 |
emin | +1.941 |
MENT | +1.834 |
abre | +1.757 |
Neg logit contributions | |
�� | -2.706 |
ゼ | -2.564 |
dos | -2.563 |
eeper | -2.487 |
� | -2.385 |
Token | Hide |
Token ID | 10415 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
�� | +1.903 |
ゼ | +1.861 |
dos | +1.841 |
eeper | +1.793 |
verting | +1.791 |
Neg logit contributions | |
Honour | -1.585 |
emin | -1.486 |
acceptance | -1.418 |
MENT | -1.415 |
ODY | -1.406 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
�� | +0.070 |
ゼ | +0.066 |
dos | +0.065 |
eeper | +0.063 |
verting | +0.063 |
Neg logit contributions | |
Honour | -0.091 |
emin | -0.085 |
MENT | -0.082 |
acceptance | -0.081 |
ODY | -0.081 |
Token | 9 |
Token ID | 860 |
Feature activation | -2.48e-01 |
Pos logit contributions | |
................................................................ | +6.376 |
ゼ | +6.145 |
dos | +6.037 |
kj | +5.814 |
eeper | +5.792 |
Neg logit contributions | |
emin | -9.040 |
Honour | -9.014 |
ODY | -8.922 |
afety | -8.918 |
MENT | -8.773 |
Token | of |
Token ID | 286 |
Feature activation | -7.31e-01 |
Pos logit contributions | |
�� | +1.839 |
ゼ | +1.807 |
dos | +1.789 |
eeper | +1.741 |
verting | +1.738 |
Neg logit contributions | |
Honour | -1.582 |
emin | -1.483 |
acceptance | -1.415 |
MENT | -1.412 |
ODY | -1.401 |
Token | 15 |
Token ID | 1315 |
Feature activation | -4.09e-01 |
Pos logit contributions | |
dos | +4.206 |
ゼ | +4.196 |
�� | +4.133 |
................................................................ | +4.106 |
eeper | +4.041 |
Neg logit contributions | |
Honour | -5.283 |
emin | -5.187 |
acceptance | -5.014 |
afety | -4.994 |
ODY | -4.987 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
�� | +1.775 |
ゼ | +1.761 |
dos | +1.746 |
verting | +1.647 |
eeper | +1.641 |
Neg logit contributions | |
Honour | -3.780 |
emin | -3.635 |
acceptance | -3.551 |
MENT | -3.523 |
ODY | -3.518 |
Token | : |
Token ID | 25 |
Feature activation | -9.06e-01 |
Pos logit contributions | |
................................................................ | +5.061 |
dos | +4.677 |
ゼ | +4.353 |
kj | +4.316 |
verting | +4.311 |
Neg logit contributions | |
Honour | -14.840 |
mathemat | -14.650 |
ODY | -14.436 |
emin | -14.398 |
afety | -14.347 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
ゼ | +5.964 |
�� | +5.858 |
................................................................ | +5.828 |
dos | +5.796 |
verting | +5.733 |
Neg logit contributions | |
Honour | -5.656 |
emin | -5.470 |
acceptance | -5.390 |
MENT | -5.370 |
ODY | -5.366 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -6.03e-01 |
Pos logit contributions | |
�� | +1.371 |
ゼ | +1.335 |
dos | +1.322 |
eeper | +1.301 |
verting | +1.291 |
Neg logit contributions | |
Honour | -0.661 |
emin | -0.602 |
acceptance | -0.559 |
MENT | -0.555 |
ODY | -0.542 |
Token | 's |
Token ID | 338 |
Feature activation | +3.57e-01 |
Pos logit contributions | |
dos | +3.241 |
ゼ | +3.231 |
�� | +3.214 |
verting | +3.150 |
eeper | +3.097 |
Neg logit contributions | |
Honour | -4.851 |
emin | -4.643 |
ODY | -4.499 |
MENT | -4.475 |
acceptance | -4.432 |
Token | political |
Token ID | 1964 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
Honour | +2.228 |
acceptance | +2.041 |
emin | +2.024 |
MENT | +1.910 |
abre | +1.829 |
Neg logit contributions | |
�� | -2.880 |
dos | -2.738 |
ゼ | -2.730 |
eeper | -2.648 |
� | -2.539 |
Token | Hide |
Token ID | 10415 |
Feature activation | +9.93e-02 |
Pos logit contributions | |
�� | +2.090 |
ゼ | +2.049 |
dos | +2.027 |
eeper | +1.966 |
verting | +1.965 |
Neg logit contributions | |
Honour | -1.882 |
emin | -1.777 |
acceptance | -1.700 |
MENT | -1.696 |
ODY | -1.692 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
Honour | +0.785 |
emin | +0.730 |
MENT | +0.709 |
acceptance | +0.696 |
ODY | +0.690 |
Neg logit contributions | |
�� | -0.642 |
ゼ | -0.603 |
dos | -0.589 |
eeper | -0.577 |
verting | -0.569 |
Token | 10 |
Token ID | 838 |
Feature activation | -7.37e-01 |
Pos logit contributions | |
ゼ | +5.863 |
................................................................ | +5.681 |
dos | +5.612 |
verting | +5.473 |
� | +5.272 |
Neg logit contributions | |
Honour | -9.021 |
emin | -8.958 |
ODY | -8.737 |
afety | -8.728 |
acceptance | -8.672 |
Token | of |
Token ID | 286 |
Feature activation | -8.23e-01 |
Pos logit contributions | |
ゼ | +4.560 |
dos | +4.544 |
................................................................ | +4.366 |
�� | +4.342 |
verting | +4.341 |
Neg logit contributions | |
Honour | -5.228 |
emin | -4.962 |
acceptance | -4.774 |
ODY | -4.752 |
afety | -4.748 |
Token | 15 |
Token ID | 1315 |
Feature activation | -3.83e-01 |
Pos logit contributions | |
dos | +4.611 |
ゼ | +4.574 |
................................................................ | +4.540 |
�� | +4.495 |
eeper | +4.417 |
Neg logit contributions | |
Honour | -5.988 |
emin | -5.885 |
afety | -5.712 |
acceptance | -5.704 |
ODY | -5.664 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
�� | +1.689 |
ゼ | +1.669 |
dos | +1.655 |
verting | +1.563 |
eeper | +1.559 |
Neg logit contributions | |
Honour | -3.528 |
emin | -3.389 |
acceptance | -3.308 |
MENT | -3.284 |
ODY | -3.277 |
Token | : |
Token ID | 25 |
Feature activation | -8.88e-01 |
Pos logit contributions | |
................................................................ | +5.019 |
dos | +4.665 |
ゼ | +4.326 |
kj | +4.311 |
verting | +4.293 |
Neg logit contributions | |
Honour | -14.693 |
mathemat | -14.452 |
ODY | -14.262 |
emin | -14.254 |
afety | -14.194 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
ゼ | +5.868 |
�� | +5.777 |
................................................................ | +5.737 |
dos | +5.707 |
verting | +5.642 |
Neg logit contributions | |
Honour | -5.539 |
emin | -5.353 |
acceptance | -5.271 |
MENT | -5.244 |
ODY | -5.243 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -6.24e-01 |
Pos logit contributions | |
�� | +1.036 |
ゼ | +1.007 |
dos | +0.997 |
eeper | +0.982 |
verting | +0.974 |
Neg logit contributions | |
Honour | -0.492 |
emin | -0.447 |
acceptance | -0.414 |
MENT | -0.411 |
ODY | -0.400 |
Token | 's |
Token ID | 338 |
Feature activation | +3.67e-01 |
Pos logit contributions | |
dos | +3.340 |
ゼ | +3.321 |
�� | +3.293 |
verting | +3.238 |
eeper | +3.184 |
Neg logit contributions | |
Honour | -5.023 |
emin | -4.812 |
ODY | -4.659 |
MENT | -4.638 |
acceptance | -4.605 |
Token | political |
Token ID | 1964 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
Honour | +2.284 |
acceptance | +2.091 |
emin | +2.070 |
MENT | +1.954 |
abre | +1.874 |
Neg logit contributions | |
�� | -2.982 |
dos | -2.825 |
ゼ | -2.821 |
eeper | -2.736 |
� | -2.625 |
Token | Hide |
Token ID | 10415 |
Feature activation | +5.48e-02 |
Pos logit contributions | |
�� | +0.744 |
ゼ | +0.721 |
dos | +0.714 |
eeper | +0.698 |
verting | +0.694 |
Neg logit contributions | |
Honour | -0.676 |
emin | -0.634 |
MENT | -0.603 |
acceptance | -0.603 |
ODY | -0.597 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
Honour | +0.435 |
emin | +0.406 |
MENT | +0.394 |
acceptance | +0.388 |
ODY | +0.385 |
Neg logit contributions | |
�� | -0.349 |
ゼ | -0.330 |
dos | -0.322 |
eeper | -0.314 |
verting | -0.311 |
Token | 8 |
Token ID | 807 |
Feature activation | -3.56e-01 |
Pos logit contributions | |
................................................................ | +6.483 |
dos | +6.366 |
verting | +6.220 |
ゼ | +6.212 |
eeper | +5.913 |
Neg logit contributions | |
emin | -8.551 |
Honour | -8.500 |
ODY | -8.298 |
acceptance | -8.271 |
MENT | -8.196 |
Token | of |
Token ID | 286 |
Feature activation | -7.17e-01 |
Pos logit contributions | |
�� | +2.532 |
ゼ | +2.521 |
dos | +2.499 |
verting | +2.419 |
eeper | +2.418 |
Neg logit contributions | |
Honour | -2.338 |
emin | -2.200 |
acceptance | -2.103 |
MENT | -2.095 |
ODY | -2.085 |
Token | 15 |
Token ID | 1315 |
Feature activation | -2.96e-01 |
Pos logit contributions | |
dos | +4.167 |
ゼ | +4.161 |
�� | +4.115 |
................................................................ | +4.055 |
eeper | +4.006 |
Neg logit contributions | |
Honour | -5.160 |
emin | -5.066 |
acceptance | -4.887 |
ODY | -4.852 |
afety | -4.849 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
�� | +1.379 |
ゼ | +1.343 |
dos | +1.326 |
eeper | +1.264 |
verting | +1.261 |
Neg logit contributions | |
Honour | -2.691 |
emin | -2.578 |
acceptance | -2.505 |
MENT | -2.495 |
ODY | -2.485 |
Token | : |
Token ID | 25 |
Feature activation | -9.52e-01 |
Pos logit contributions | |
................................................................ | +5.103 |
dos | +4.701 |
ゼ | +4.392 |
verting | +4.347 |
kj | +4.328 |
Neg logit contributions | |
Honour | -14.653 |
mathemat | -14.345 |
ODY | -14.234 |
emin | -14.188 |
acceptance | -14.125 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
ゼ | +6.167 |
�� | +6.068 |
................................................................ | +6.044 |
dos | +5.990 |
verting | +5.937 |
Neg logit contributions | |
Honour | -5.975 |
emin | -5.773 |
acceptance | -5.708 |
MENT | -5.687 |
ODY | -5.677 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -5.93e-01 |
Pos logit contributions | |
�� | +1.224 |
ゼ | +1.191 |
dos | +1.180 |
eeper | +1.161 |
verting | +1.152 |
Neg logit contributions | |
Honour | -0.586 |
emin | -0.533 |
acceptance | -0.494 |
MENT | -0.491 |
ODY | -0.479 |
Token | 's |
Token ID | 338 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
dos | +3.190 |
ゼ | +3.184 |
�� | +3.176 |
verting | +3.104 |
eeper | +3.053 |
Neg logit contributions | |
Honour | -4.768 |
emin | -4.561 |
ODY | -4.415 |
MENT | -4.399 |
acceptance | -4.366 |
Token | political |
Token ID | 1964 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
Honour | +2.245 |
acceptance | +2.047 |
emin | +2.045 |
MENT | +1.929 |
abre | +1.852 |
Neg logit contributions | |
�� | -2.872 |
dos | -2.730 |
ゼ | -2.725 |
eeper | -2.641 |
� | -2.536 |
Token | Hide |
Token ID | 10415 |
Feature activation | -2.38e-02 |
Pos logit contributions | |
�� | +1.272 |
ゼ | +1.239 |
dos | +1.225 |
eeper | +1.195 |
verting | +1.191 |
Neg logit contributions | |
Honour | -1.140 |
emin | -1.070 |
acceptance | -1.021 |
MENT | -1.021 |
ODY | -1.012 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
�� | +0.148 |
ゼ | +0.139 |
dos | +0.136 |
eeper | +0.133 |
verting | +0.132 |
Neg logit contributions | |
Honour | -0.192 |
emin | -0.180 |
MENT | -0.175 |
acceptance | -0.172 |
ODY | -0.171 |
Token | 14 |
Token ID | 1478 |
Feature activation | -2.44e-01 |
Pos logit contributions | |
................................................................ | +5.706 |
dos | +5.642 |
verting | +5.500 |
ゼ | +5.464 |
eeper | +5.391 |
Neg logit contributions | |
emin | -7.211 |
Honour | -7.201 |
ODY | -6.997 |
MENT | -6.908 |
afety | -6.896 |
Token | of |
Token ID | 286 |
Feature activation | -7.96e-01 |
Pos logit contributions | |
�� | +1.800 |
ゼ | +1.773 |
dos | +1.757 |
eeper | +1.707 |
verting | +1.706 |
Neg logit contributions | |
Honour | -1.567 |
emin | -1.471 |
acceptance | -1.404 |
MENT | -1.400 |
ODY | -1.392 |
Token | 15 |
Token ID | 1315 |
Feature activation | -4.73e-01 |
Pos logit contributions | |
dos | +4.597 |
ゼ | +4.563 |
�� | +4.500 |
................................................................ | +4.478 |
verting | +4.377 |
Neg logit contributions | |
Honour | -5.740 |
emin | -5.632 |
acceptance | -5.444 |
afety | -5.434 |
ODY | -5.393 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
ゼ | +1.973 |
�� | +1.960 |
dos | +1.959 |
verting | +1.835 |
eeper | +1.822 |
Neg logit contributions | |
Honour | -4.397 |
emin | -4.238 |
acceptance | -4.151 |
ODY | -4.106 |
MENT | -4.102 |
Token | : |
Token ID | 25 |
Feature activation | -8.65e-01 |
Pos logit contributions | |
................................................................ | +5.045 |
dos | +4.670 |
ゼ | +4.324 |
kj | +4.300 |
verting | +4.299 |
Neg logit contributions | |
Honour | -14.616 |
mathemat | -14.375 |
emin | -14.230 |
ODY | -14.211 |
afety | -14.163 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
ゼ | +5.745 |
�� | +5.655 |
................................................................ | +5.620 |
dos | +5.597 |
verting | +5.529 |
Neg logit contributions | |
Honour | -5.386 |
emin | -5.220 |
acceptance | -5.116 |
MENT | -5.092 |
ODY | -5.083 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -7.80e-01 |
Pos logit contributions | |
�� | +1.628 |
ゼ | +1.586 |
dos | +1.572 |
eeper | +1.545 |
verting | +1.536 |
Neg logit contributions | |
Honour | -0.797 |
emin | -0.726 |
acceptance | -0.675 |
MENT | -0.673 |
ODY | -0.658 |
Token | 's |
Token ID | 338 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
dos | +3.920 |
ゼ | +3.871 |
verting | +3.804 |
�� | +3.744 |
eeper | +3.691 |
Neg logit contributions | |
Honour | -6.404 |
emin | -6.165 |
ODY | -6.004 |
MENT | -5.945 |
afety | -5.914 |
Token | political |
Token ID | 1964 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
Honour | +1.511 |
emin | +1.388 |
acceptance | +1.382 |
MENT | +1.315 |
ODY | +1.267 |
Neg logit contributions | |
�� | -1.805 |
ゼ | -1.716 |
dos | -1.711 |
eeper | -1.663 |
verting | -1.599 |
Token | Hide |
Token ID | 10415 |
Feature activation | +4.83e-03 |
Pos logit contributions | |
�� | +1.204 |
ゼ | +1.173 |
dos | +1.159 |
eeper | +1.129 |
verting | +1.126 |
Neg logit contributions | |
Honour | -1.140 |
emin | -1.073 |
acceptance | -1.026 |
MENT | -1.025 |
ODY | -1.017 |
Token | Caption |
Token ID | 11260 |
Feature activation | -9.95e-01 |
Pos logit contributions | |
Honour | +0.039 |
emin | +0.036 |
MENT | +0.035 |
acceptance | +0.035 |
ODY | +0.034 |
Neg logit contributions | |
�� | -0.030 |
ゼ | -0.029 |
dos | -0.028 |
eeper | -0.027 |
verting | -0.027 |
Token | 13 |
Token ID | 1511 |
Feature activation | -2.47e-01 |
Pos logit contributions | |
................................................................ | +5.608 |
dos | +5.577 |
ゼ | +5.549 |
�� | +5.442 |
eeper | +5.378 |
Neg logit contributions | |
Honour | -7.047 |
emin | -6.895 |
afety | -6.788 |
ODY | -6.773 |
MENT | -6.670 |
Token | of |
Token ID | 286 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
�� | +1.821 |
ゼ | +1.792 |
dos | +1.775 |
eeper | +1.727 |
verting | +1.724 |
Neg logit contributions | |
Honour | -1.578 |
emin | -1.481 |
acceptance | -1.414 |
MENT | -1.410 |
ODY | -1.402 |
Token | 15 |
Token ID | 1315 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
dos | +4.655 |
ゼ | +4.622 |
................................................................ | +4.553 |
�� | +4.548 |
verting | +4.438 |
Neg logit contributions | |
Honour | -5.931 |
emin | -5.835 |
afety | -5.654 |
acceptance | -5.648 |
ODY | -5.580 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
�� | +1.734 |
ゼ | +1.723 |
dos | +1.707 |
verting | +1.609 |
eeper | +1.602 |
Neg logit contributions | |
Honour | -3.688 |
emin | -3.547 |
acceptance | -3.464 |
MENT | -3.434 |
ODY | -3.431 |
Token | : |
Token ID | 25 |
Feature activation | -8.49e-01 |
Pos logit contributions | |
................................................................ | +4.995 |
dos | +4.677 |
ゼ | +4.350 |
kj | +4.304 |
verting | +4.300 |
Neg logit contributions | |
Honour | -14.297 |
mathemat | -13.938 |
emin | -13.909 |
ODY | -13.885 |
afety | -13.828 |
Token | Carly |
Token ID | 35982 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
ゼ | +5.686 |
�� | +5.588 |
................................................................ | +5.549 |
dos | +5.547 |
verting | +5.466 |
Neg logit contributions | |
Honour | -5.270 |
emin | -5.102 |
acceptance | -4.991 |
ODY | -4.973 |
MENT | -4.971 |
Token | Fiorina |
Token ID | 49028 |
Feature activation | -7.93e-01 |
Pos logit contributions | |
�� | +1.448 |
ゼ | +1.410 |
dos | +1.397 |
eeper | +1.374 |
verting | +1.365 |
Neg logit contributions | |
Honour | -0.702 |
emin | -0.639 |
acceptance | -0.594 |
MENT | -0.591 |
ODY | -0.577 |
Token | 's |
Token ID | 338 |
Feature activation | +2.69e-01 |
Pos logit contributions | |
dos | +3.967 |
ゼ | +3.914 |
verting | +3.854 |
�� | +3.787 |
eeper | +3.735 |
Neg logit contributions | |
Honour | -6.523 |
emin | -6.281 |
ODY | -6.120 |
MENT | -6.062 |
afety | -6.028 |
Token | political |
Token ID | 1964 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
Honour | +1.732 |
acceptance | +1.586 |
emin | +1.585 |
MENT | +1.501 |
ODY | +1.440 |
Neg logit contributions | |
�� | -2.122 |
ゼ | -2.015 |
dos | -2.010 |
eeper | -1.952 |
verting | -1.872 |
Token | surface |
Token ID | 4417 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
�� | +0.753 |
ゼ | +0.733 |
dos | +0.726 |
eeper | +0.707 |
verting | +0.705 |
Neg logit contributions | |
Honour | -0.699 |
emin | -0.658 |
MENT | -0.629 |
acceptance | -0.625 |
ODY | -0.623 |
Token | . |
Token ID | 13 |
Feature activation | -3.21e-01 |
Pos logit contributions | |
�� | +1.123 |
ゼ | +1.096 |
dos | +1.084 |
eeper | +1.058 |
verting | +1.054 |
Neg logit contributions | |
Honour | -1.021 |
emin | -0.961 |
MENT | -0.916 |
acceptance | -0.912 |
ODY | -0.908 |
Token |
|
Token ID | 198 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
�� | +2.309 |
ゼ | +2.288 |
dos | +2.258 |
verting | +2.189 |
eeper | +2.164 |
Neg logit contributions | |
Honour | -2.039 |
emin | -1.945 |
acceptance | -1.898 |
MENT | -1.876 |
ODY | -1.854 |
Token |
|
Token ID | 198 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
Honour | +1.370 |
emin | +1.249 |
MENT | +1.187 |
acceptance | +1.157 |
ODY | +1.146 |
Neg logit contributions | |
�� | -2.334 |
ゼ | -2.200 |
eeper | -2.154 |
dos | -2.149 |
verting | -2.108 |
Token | Media |
Token ID | 13152 |
Feature activation | -3.64e-02 |
Pos logit contributions | |
Honour | +1.152 |
emin | +1.090 |
MENT | +1.041 |
OPS | +1.020 |
ODY | +1.020 |
Neg logit contributions | |
�� | -1.598 |
ゼ | -1.526 |
dos | -1.504 |
eeper | -1.503 |
verting | -1.480 |
Token | playback |
Token ID | 16388 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
�� | +0.267 |
ゼ | +0.259 |
dos | +0.256 |
eeper | +0.250 |
verting | +0.249 |
Neg logit contributions | |
Honour | -0.241 |
emin | -0.226 |
acceptance | -0.217 |
MENT | -0.216 |
ODY | -0.214 |
Token | is |
Token ID | 318 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
dos | +7.284 |
ゼ | +7.228 |
verting | +6.961 |
�� | +6.915 |
eeper | +6.745 |
Neg logit contributions | |
Honour | -11.565 |
emin | -11.261 |
OPS | -11.251 |
� | -11.117 |
MENT | -11.023 |
Token | unsupported |
Token ID | 24222 |
Feature activation | -6.36e-01 |
Pos logit contributions | |
�� | +2.601 |
ゼ | +2.522 |
dos | +2.489 |
eeper | +2.418 |
verting | +2.410 |
Neg logit contributions | |
Honour | -3.071 |
emin | -2.908 |
acceptance | -2.792 |
MENT | -2.791 |
ODY | -2.770 |
Token | on |
Token ID | 319 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
ゼ | +4.515 |
dos | +4.478 |
�� | +4.471 |
verting | +4.342 |
eeper | +4.280 |
Neg logit contributions | |
Honour | -4.007 |
emin | -3.863 |
ODY | -3.658 |
MENT | -3.658 |
acceptance | -3.651 |
Token | your |
Token ID | 534 |
Feature activation | -3.53e-01 |
Pos logit contributions | |
�� | +0.957 |
ゼ | +0.927 |
dos | +0.915 |
eeper | +0.896 |
verting | +0.889 |
Neg logit contributions | |
Honour | -0.661 |
emin | -0.615 |
MENT | -0.586 |
acceptance | -0.585 |
ODY | -0.576 |
Token | device |
Token ID | 3335 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
�� | +1.715 |
ゼ | +1.640 |
dos | +1.605 |
eeper | +1.545 |
verting | +1.524 |
Neg logit contributions | |
Honour | -3.230 |
emin | -3.078 |
acceptance | -2.995 |
MENT | -2.982 |
ODY | -2.959 |
Token | 20 |
Token ID | 1160 |
Feature activation | -9.55e-01 |
Pos logit contributions | |
�� | +4.015 |
ゼ | +3.959 |
dos | +3.912 |
verting | +3.847 |
eeper | +3.815 |
Neg logit contributions | |
Honour | -3.808 |
emin | -3.604 |
MENT | -3.393 |
ODY | -3.371 |
acceptance | -3.369 |
Token | 21 |
Token ID | 2310 |
Feature activation | -8.94e-01 |
Pos logit contributions | |
�� | +6.006 |
ゼ | +5.977 |
dos | +5.914 |
eeper | +5.859 |
verting | +5.827 |
Neg logit contributions | |
Honour | -6.505 |
emin | -6.231 |
MENT | -5.810 |
OPS | -5.708 |
afety | -5.686 |
Token | 22 |
Token ID | 2534 |
Feature activation | -7.43e-01 |
Pos logit contributions | |
�� | +5.586 |
dos | +5.512 |
ゼ | +5.496 |
verting | +5.459 |
eeper | +5.439 |
Neg logit contributions | |
Honour | -6.193 |
emin | -5.800 |
MENT | -5.423 |
ODY | -5.399 |
afety | -5.328 |
Token | 23 |
Token ID | 2242 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
�� | +4.720 |
eeper | +4.565 |
ゼ | +4.554 |
................................................................ | +4.469 |
verting | +4.468 |
Neg logit contributions | |
Honour | -5.170 |
emin | -4.918 |
MENT | -4.687 |
OPS | -4.677 |
afety | -4.617 |
Token | 24 |
Token ID | 1987 |
Feature activation | -7.54e-01 |
Pos logit contributions | |
�� | +3.455 |
ゼ | +3.397 |
dos | +3.368 |
verting | +3.338 |
eeper | +3.338 |
Neg logit contributions | |
Honour | -2.928 |
emin | -2.770 |
MENT | -2.613 |
ODY | -2.578 |
acceptance | -2.522 |
Token | 25 |
Token ID | 1679 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
�� | +4.997 |
ゼ | +4.943 |
dos | +4.872 |
eeper | +4.833 |
verting | +4.800 |
Neg logit contributions | |
Honour | -5.152 |
emin | -4.902 |
MENT | -4.631 |
ODY | -4.615 |
afety | -4.599 |
Token | 26 |
Token ID | 2608 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
verting | +7.550 |
................................................................ | +7.434 |
ゼ | +7.315 |
� | +7.279 |
dos | +7.268 |
Neg logit contributions | |
Honour | -11.898 |
emin | -11.171 |
MENT | -10.754 |
ODY | -10.571 |
afety | -10.538 |
Token | 27 |
Token ID | 2681 |
Feature activation | -9.07e-01 |
Pos logit contributions | |
�� | +7.476 |
................................................................ | +7.370 |
verting | +7.360 |
ゼ | +7.357 |
dos | +7.034 |
Neg logit contributions | |
Honour | -9.746 |
emin | -9.421 |
OPS | -9.071 |
afety | -9.056 |
MENT | -9.030 |
Token | # |
Token ID | 1303 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
verting | +5.915 |
�� | +5.863 |
dos | +5.808 |
ゼ | +5.770 |
................................................................ | +5.627 |
Neg logit contributions | |
Honour | -6.065 |
emin | -5.791 |
MENT | -5.502 |
ODY | -5.403 |
afety | -5.351 |
Token | loop |
Token ID | 9052 |
Feature activation | +8.29e-03 |
Pos logit contributions | |
Honour | +1.515 |
emin | +1.418 |
acceptance | +1.366 |
MENT | +1.354 |
ODY | +1.339 |
Neg logit contributions | |
�� | -1.825 |
ゼ | -1.764 |
dos | -1.726 |
eeper | -1.701 |
verting | -1.681 |
Token | over |
Token ID | 625 |
Feature activation | -4.91e-01 |
Pos logit contributions | |
Honour | +0.044 |
emin | +0.041 |
acceptance | +0.039 |
MENT | +0.039 |
ODY | +0.038 |
Neg logit contributions | |
�� | -0.071 |
ゼ | -0.069 |
dos | -0.068 |
eeper | -0.067 |
verting | -0.067 |
Token | ( |
Token ID | 7 |
Feature activation | -8.09e-01 |
Pos logit contributions | |
�� | +1.511 |
ゼ | +1.474 |
dos | +1.458 |
eeper | +1.407 |
verting | +1.404 |
Neg logit contributions | |
Honour | -2.145 |
emin | -2.040 |
acceptance | -1.968 |
MENT | -1.961 |
ODY | -1.951 |
Token | args |
Token ID | 22046 |
Feature activation | +2.97e-03 |
Pos logit contributions | |
dos | +1.470 |
�� | +1.339 |
ゼ | +1.213 |
eeper | +1.200 |
verting | +1.128 |
Neg logit contributions | |
Honour | -9.724 |
emin | -9.173 |
ODY | -9.039 |
acceptance | -9.004 |
MENT | -8.940 |
Token | [" |
Token ID | 14692 |
Feature activation | -1.49e-02 |
Pos logit contributions | |
Honour | +0.027 |
emin | +0.026 |
MENT | +0.025 |
acceptance | +0.025 |
ODY | +0.025 |
Neg logit contributions | |
�� | -0.015 |
ゼ | -0.014 |
dos | -0.014 |
verting | -0.013 |
eeper | -0.013 |
Token | images |
Token ID | 17566 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
�� | +0.116 |
ゼ | +0.111 |
dos | +0.107 |
eeper | +0.106 |
verting | +0.105 |
Neg logit contributions | |
Honour | -0.092 |
emin | -0.090 |
MENT | -0.084 |
acceptance | -0.084 |
ODY | -0.083 |
Token | "] |
Token ID | 8973 |
Feature activation | -7.38e-01 |
Pos logit contributions | |
�� | +0.746 |
ゼ | +0.709 |
dos | +0.694 |
eeper | +0.680 |
verting | +0.679 |
Neg logit contributions | |
Honour | -0.743 |
emin | -0.704 |
MENT | -0.677 |
acceptance | -0.670 |
ODY | -0.665 |
Token | ): |
Token ID | 2599 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
ゼ | +3.481 |
dos | +3.461 |
verting | +3.329 |
�� | +3.321 |
eeper | +3.291 |
Neg logit contributions | |
Honour | -6.411 |
emin | -6.131 |
acceptance | -5.957 |
ODY | -5.932 |
MENT | -5.845 |
Token | # |
Token ID | 1303 |
Feature activation | -6.13e-02 |
Pos logit contributions | |
dos | +5.691 |
................................................................ | +5.419 |
ゼ | +5.415 |
verting | +5.390 |
eeper | +5.144 |
Neg logit contributions | |
Honour | -13.268 |
emin | -12.965 |
MENT | -12.461 |
ODY | -12.393 |
afety | -12.385 |
Token | load |
Token ID | 3440 |
Feature activation | -6.65e-01 |
Pos logit contributions | |
�� | +0.573 |
ゼ | +0.556 |
dos | +0.547 |
eeper | +0.540 |
verting | +0.539 |
Neg logit contributions | |
Honour | -0.286 |
emin | -0.261 |
acceptance | -0.252 |
MENT | -0.244 |
ODY | -0.244 |
Token | the |
Token ID | 262 |
Feature activation | -5.19e-01 |
Pos logit contributions | |
ゼ | +4.422 |
dos | +4.388 |
�� | +4.365 |
verting | +4.243 |
eeper | +4.221 |
Neg logit contributions | |
Honour | -4.522 |
emin | -4.304 |
ODY | -4.092 |
acceptance | -4.083 |
MENT | -4.061 |
Token | image |
Token ID | 2939 |
Feature activation | +2.59e-03 |
Pos logit contributions | |
ゼ | +4.286 |
�� | +4.281 |
dos | +4.249 |
verting | +4.174 |
eeper | +4.174 |
Neg logit contributions | |
Honour | -2.736 |
emin | -2.535 |
MENT | -2.369 |
ODY | -2.365 |
afety | -2.342 |
Token | , |
Token ID | 11 |
Feature activation | +4.30e-01 |
Pos logit contributions | |
Honour | +0.015 |
emin | +0.014 |
acceptance | +0.014 |
MENT | +0.013 |
ODY | +0.013 |
Neg logit contributions | |
�� | -0.021 |
ゼ | -0.020 |
dos | -0.020 |
eeper | -0.020 |
verting | -0.019 |
Token | Women |
Token ID | 6926 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
Honour | +0.070 |
emin | +0.062 |
acceptance | +0.056 |
MENT | +0.056 |
ODY | +0.055 |
Neg logit contributions | |
�� | -0.212 |
ゼ | -0.208 |
dos | -0.206 |
eeper | -0.203 |
verting | -0.202 |
Token | in |
Token ID | 287 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
�� | +0.881 |
ゼ | +0.857 |
dos | +0.847 |
eeper | +0.827 |
verting | +0.824 |
Neg logit contributions | |
Honour | -0.770 |
emin | -0.722 |
acceptance | -0.690 |
MENT | -0.688 |
ODY | -0.681 |
Token | politics |
Token ID | 4819 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
Honour | +1.455 |
emin | +1.348 |
acceptance | +1.298 |
MENT | +1.257 |
ODY | +1.253 |
Neg logit contributions | |
�� | -1.814 |
ゼ | -1.776 |
dos | -1.740 |
eeper | -1.707 |
verting | -1.666 |
Token | . |
Token ID | 13 |
Feature activation | -6.61e-02 |
Pos logit contributions | |
Honour | +1.490 |
emin | +1.393 |
acceptance | +1.347 |
MENT | +1.316 |
ODY | +1.290 |
Neg logit contributions | |
�� | -1.887 |
ゼ | -1.812 |
dos | -1.786 |
eeper | -1.758 |
verting | -1.742 |
Token | Hide |
Token ID | 10415 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
�� | +0.490 |
ゼ | +0.475 |
dos | +0.469 |
eeper | +0.460 |
verting | +0.457 |
Neg logit contributions | |
Honour | -0.434 |
emin | -0.407 |
MENT | -0.387 |
acceptance | -0.386 |
ODY | -0.382 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
�� | +0.780 |
ゼ | +0.747 |
dos | +0.730 |
eeper | +0.711 |
verting | +0.705 |
Neg logit contributions | |
Honour | -1.087 |
emin | -1.028 |
MENT | -0.994 |
acceptance | -0.988 |
ODY | -0.980 |
Token | 7 |
Token ID | 767 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
................................................................ | +6.588 |
ゼ | +6.335 |
dos | +6.240 |
�� | +5.991 |
kj | +5.899 |
Neg logit contributions | |
emin | -11.522 |
Honour | -11.279 |
afety | -11.219 |
ONY | -11.193 |
abre | -11.140 |
Token | of |
Token ID | 286 |
Feature activation | -7.10e-01 |
Pos logit contributions | |
�� | +1.943 |
ゼ | +1.910 |
dos | +1.893 |
eeper | +1.841 |
verting | +1.838 |
Neg logit contributions | |
Honour | -1.682 |
emin | -1.577 |
acceptance | -1.505 |
MENT | -1.502 |
ODY | -1.489 |
Token | 15 |
Token ID | 1315 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
ゼ | +4.134 |
dos | +4.128 |
�� | +4.084 |
................................................................ | +4.020 |
eeper | +3.963 |
Neg logit contributions | |
Honour | -5.111 |
emin | -5.013 |
acceptance | -4.855 |
afety | -4.819 |
ODY | -4.809 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
�� | +1.385 |
ゼ | +1.349 |
dos | +1.331 |
eeper | +1.268 |
verting | +1.266 |
Neg logit contributions | |
Honour | -2.703 |
emin | -2.590 |
acceptance | -2.517 |
MENT | -2.507 |
ODY | -2.496 |
Token | : |
Token ID | 25 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
................................................................ | +5.221 |
dos | +4.677 |
ゼ | +4.357 |
kj | +4.343 |
verting | +4.302 |
Neg logit contributions | |
mathemat | -15.813 |
Honour | -15.770 |
carbohyd | -15.459 |
ODY | -15.377 |
emin | -15.273 |
Token | carried |
Token ID | 5281 |
Feature activation | -5.71e-01 |
Pos logit contributions | |
Honour | +2.597 |
emin | +2.404 |
acceptance | +2.308 |
MENT | +2.267 |
ODY | +2.243 |
Neg logit contributions | |
�� | -4.048 |
ゼ | -3.915 |
dos | -3.906 |
eeper | -3.817 |
verting | -3.810 |
Token | the |
Token ID | 262 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
�� | +3.765 |
ゼ | +3.756 |
dos | +3.709 |
verting | +3.615 |
eeper | +3.575 |
Neg logit contributions | |
Honour | -3.918 |
emin | -3.733 |
ODY | -3.580 |
MENT | -3.565 |
acceptance | -3.481 |
Token | Catalan |
Token ID | 31066 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
Honour | +2.956 |
emin | +2.820 |
acceptance | +2.758 |
MENT | +2.731 |
ODY | +2.694 |
Neg logit contributions | |
�� | -1.196 |
dos | -1.106 |
ゼ | -1.101 |
eeper | -1.049 |
verting | -1.017 |
Token | pro |
Token ID | 386 |
Feature activation | -5.38e-03 |
Pos logit contributions | |
ゼ | +6.842 |
dos | +6.777 |
verting | +6.624 |
�� | +6.615 |
................................................................ | +6.499 |
Neg logit contributions | |
Honour | -8.704 |
ODY | -8.306 |
emin | -8.260 |
MENT | -8.172 |
afety | -8.103 |
Token | - |
Token ID | 12 |
Feature activation | -6.32e-01 |
Pos logit contributions | |
�� | +0.043 |
ゼ | +0.041 |
dos | +0.041 |
eeper | +0.040 |
verting | +0.039 |
Neg logit contributions | |
Honour | -0.033 |
emin | -0.031 |
acceptance | -0.029 |
MENT | -0.029 |
ODY | -0.028 |
Token | independence |
Token ID | 39894 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
�� | +1.666 |
dos | +1.663 |
ゼ | +1.603 |
verting | +1.590 |
eeper | +1.527 |
Neg logit contributions | |
Honour | -6.943 |
emin | -6.497 |
ODY | -6.449 |
MENT | -6.398 |
acceptance | -6.394 |
Token | flag |
Token ID | 6056 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
verting | +3.877 |
dos | +3.727 |
ゼ | +3.670 |
................................................................ | +3.643 |
�� | +3.464 |
Neg logit contributions | |
ODY | -14.120 |
Honour | -14.078 |
emin | -14.052 |
afety | -13.752 |
ONY | -13.649 |
Token | - |
Token ID | 532 |
Feature activation | -5.72e-01 |
Pos logit contributions | |
�� | +1.033 |
ゼ | +1.004 |
dos | +0.996 |
verting | +0.970 |
eeper | +0.968 |
Neg logit contributions | |
Honour | -0.902 |
emin | -0.847 |
MENT | -0.811 |
acceptance | -0.805 |
ODY | -0.802 |
Token | the |
Token ID | 1169 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
�� | +3.839 |
ゼ | +3.744 |
dos | +3.679 |
verting | +3.631 |
eeper | +3.580 |
Neg logit contributions | |
Honour | -3.918 |
emin | -3.649 |
ODY | -3.542 |
MENT | -3.533 |
acceptance | -3.512 |
Token | est |
Token ID | 1556 |
Feature activation | -2.22e-02 |
Pos logit contributions | |
�� | +1.203 |
ゼ | +1.178 |
dos | +1.168 |
eeper | +1.144 |
verting | +1.142 |
Neg logit contributions | |
Honour | -0.673 |
emin | -0.619 |
MENT | -0.581 |
acceptance | -0.580 |
ODY | -0.575 |
Token | el |
Token ID | 417 |
Feature activation | -6.14e-01 |
Pos logit contributions | |
�� | +0.135 |
ゼ | +0.127 |
dos | +0.123 |
eeper | +0.119 |
verting | +0.119 |
Neg logit contributions | |
Honour | -0.179 |
emin | -0.174 |
acceptance | -0.163 |
MENT | -0.162 |
ODY | -0.161 |
Token | , |
Token ID | 11 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
Honour | +3.033 |
emin | +2.837 |
acceptance | +2.672 |
MENT | +2.662 |
OPS | +2.562 |
Neg logit contributions | |
�� | -4.870 |
ゼ | -4.827 |
dos | -4.632 |
eeper | -4.619 |
verting | -4.542 |
Token | New |
Token ID | 968 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
Honour | +1.756 |
emin | +1.640 |
MENT | +1.593 |
acceptance | +1.579 |
ODY | +1.535 |
Neg logit contributions | |
�� | -2.171 |
ゼ | -2.088 |
dos | -2.047 |
eeper | -2.026 |
verting | -1.986 |
Token | Hampshire |
Token ID | 13910 |
Feature activation | +4.04e-01 |
Pos logit contributions | |
Honour | +1.649 |
emin | +1.530 |
MENT | +1.471 |
acceptance | +1.459 |
ODY | +1.424 |
Neg logit contributions | |
�� | -1.889 |
ゼ | -1.831 |
dos | -1.781 |
eeper | -1.765 |
verting | -1.720 |
Token | . |
Token ID | 13 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
Honour | +2.530 |
emin | +2.369 |
acceptance | +2.263 |
MENT | +2.235 |
ODY | +2.202 |
Neg logit contributions | |
�� | -3.095 |
ゼ | -3.003 |
dos | -2.958 |
eeper | -2.887 |
verting | -2.873 |
Token | Hide |
Token ID | 10415 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
�� | +1.829 |
ゼ | +1.783 |
dos | +1.762 |
eeper | +1.714 |
verting | +1.711 |
Neg logit contributions | |
Honour | -1.729 |
emin | -1.629 |
acceptance | -1.560 |
MENT | -1.558 |
ODY | -1.546 |
Token | Caption |
Token ID | 11260 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
Honour | +0.086 |
emin | +0.081 |
MENT | +0.078 |
acceptance | +0.077 |
ODY | +0.077 |
Neg logit contributions | |
�� | -0.068 |
ゼ | -0.065 |
dos | -0.063 |
eeper | -0.062 |
verting | -0.061 |
Token | 6 |
Token ID | 718 |
Feature activation | -6.10e-01 |
Pos logit contributions | |
................................................................ | +6.809 |
dos | +6.547 |
verting | +6.403 |
ゼ | +6.152 |
kj | +6.058 |
Neg logit contributions | |
Honour | -10.957 |
emin | -10.832 |
ONY | -10.579 |
ODY | -10.472 |
acceptance | -10.472 |
Token | of |
Token ID | 286 |
Feature activation | -7.33e-01 |
Pos logit contributions | |
ゼ | +3.985 |
dos | +3.972 |
�� | +3.883 |
verting | +3.806 |
eeper | +3.790 |
Neg logit contributions | |
Honour | -4.227 |
emin | -3.984 |
acceptance | -3.845 |
ODY | -3.803 |
MENT | -3.800 |
Token | 15 |
Token ID | 1315 |
Feature activation | -3.51e-01 |
Pos logit contributions | |
dos | +4.221 |
ゼ | +4.207 |
�� | +4.177 |
................................................................ | +4.114 |
eeper | +4.061 |
Neg logit contributions | |
Honour | -5.313 |
emin | -5.224 |
acceptance | -5.058 |
afety | -5.007 |
ODY | -4.990 |
Token | Photos |
Token ID | 9434 |
Feature activation | -1.77e+00 |
Pos logit contributions | |
�� | +1.586 |
ゼ | +1.554 |
dos | +1.537 |
eeper | +1.458 |
verting | +1.455 |
Neg logit contributions | |
Honour | -3.218 |
emin | -3.086 |
acceptance | -3.008 |
MENT | -2.991 |
ODY | -2.980 |
Token | : |
Token ID | 25 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
................................................................ | +5.241 |
dos | +4.618 |
kj | +4.312 |
(): | +4.273 |
ゼ | +4.268 |
Neg logit contributions | |
mathemat | -16.518 |
Honour | -16.297 |
carbohyd | -16.176 |
ODY | -15.928 |
afety | -15.809 |
Token | 10 |
Token ID | 838 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
ゼ | +5.047 |
�� | +4.940 |
dos | +4.812 |
verting | +4.781 |
eeper | +4.763 |
Neg logit contributions | |
Honour | -5.949 |
emin | -5.567 |
MENT | -5.377 |
ODY | -5.316 |
afety | -5.288 |
Token | 11 |
Token ID | 1367 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
ゼ | +7.649 |
�� | +7.524 |
dos | +7.402 |
verting | +7.395 |
eeper | +7.296 |
Neg logit contributions | |
Honour | -7.939 |
emin | -7.322 |
MENT | -7.114 |
afety | -6.899 |
OPS | -6.845 |
Token | 12 |
Token ID | 1105 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
ゼ | +6.243 |
�� | +6.233 |
verting | +6.149 |
dos | +6.111 |
eeper | +6.020 |
Neg logit contributions | |
Honour | -7.733 |
emin | -7.264 |
MENT | -7.034 |
afety | -7.006 |
ODY | -6.979 |
Token | 13 |
Token ID | 1511 |
Feature activation | -7.52e-01 |
Pos logit contributions | |
�� | +6.319 |
ゼ | +6.221 |
verting | +6.032 |
eeper | +5.983 |
dos | +5.970 |
Neg logit contributions | |
Honour | -7.692 |
emin | -7.310 |
afety | -7.193 |
MENT | -6.988 |
ODY | -6.960 |
Token | 14 |
Token ID | 1478 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
�� | +4.750 |
ゼ | +4.688 |
dos | +4.617 |
verting | +4.615 |
eeper | +4.595 |
Neg logit contributions | |
Honour | -5.203 |
emin | -4.986 |
MENT | -4.737 |
ODY | -4.693 |
afety | -4.589 |
Token | 15 |
Token ID | 1315 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
�� | +6.542 |
ゼ | +6.431 |
dos | +6.373 |
eeper | +6.370 |
verting | +6.281 |
Neg logit contributions | |
Honour | -7.709 |
emin | -7.364 |
afety | -7.060 |
MENT | -6.991 |
OPS | -6.918 |
Token | -- |
Token ID | 1377 |
Feature activation | -3.62e-01 |
Pos logit contributions | |
verting | +7.550 |
dos | +7.457 |
�� | +7.365 |
eeper | +7.206 |
................................................................ | +7.112 |
Neg logit contributions | |
Honour | -10.706 |
emin | -9.982 |
MENT | -9.685 |
OPS | -9.480 |
acceptance | -9.370 |
Token | Save |
Token ID | 12793 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
�� | +2.611 |
ゼ | +2.553 |
dos | +2.530 |
eeper | +2.464 |
verting | +2.462 |
Neg logit contributions | |
Honour | -2.396 |
emin | -2.245 |
MENT | -2.146 |
acceptance | -2.141 |
ODY | -2.125 |
Token | the |
Token ID | 262 |
Feature activation | -2.60e-01 |
Pos logit contributions | |
�� | +1.084 |
ゼ | +1.051 |
dos | +1.041 |
eeper | +1.014 |
verting | +1.011 |
Neg logit contributions | |
Honour | -0.956 |
emin | -0.900 |
acceptance | -0.860 |
MENT | -0.859 |
ODY | -0.851 |
Token | results |
Token ID | 2482 |
Feature activation | -9.90e-02 |
Pos logit contributions | |
�� | +1.653 |
ゼ | +1.605 |
dos | +1.585 |
eeper | +1.540 |
verting | +1.535 |
Neg logit contributions | |
Honour | -1.958 |
emin | -1.852 |
MENT | -1.778 |
acceptance | -1.777 |
ODY | -1.765 |
Token | of |
Token ID | 286 |
Feature activation | +6.40e-02 |
Pos logit contributions | |
�� | +0.765 |
ゼ | +0.743 |
dos | +0.735 |
eeper | +0.717 |
verting | +0.716 |
Neg logit contributions | |
Honour | -0.613 |
emin | -0.576 |
acceptance | -0.548 |
MENT | -0.546 |
ODY | -0.541 |
Token | , |
Token ID | 11 |
Feature activation | -6.25e-02 |
Pos logit contributions | |
Honour | +0.609 |
emin | +0.568 |
acceptance | +0.547 |
MENT | +0.542 |
ODY | +0.530 |
Neg logit contributions | |
�� | -0.796 |
ゼ | -0.773 |
dos | -0.764 |
eeper | -0.744 |
verting | -0.742 |
Token | who |
Token ID | 508 |
Feature activation | -4.02e-02 |
Pos logit contributions | |
�� | +0.446 |
ゼ | +0.432 |
dos | +0.427 |
eeper | +0.415 |
verting | +0.414 |
Neg logit contributions | |
Honour | -0.426 |
emin | -0.401 |
acceptance | -0.385 |
MENT | -0.383 |
ODY | -0.379 |
Token | wasn |
Token ID | 2492 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
�� | +0.310 |
ゼ | +0.302 |
dos | +0.297 |
eeper | +0.290 |
verting | +0.289 |
Neg logit contributions | |
Honour | -0.251 |
emin | -0.235 |
acceptance | -0.224 |
MENT | -0.222 |
ODY | -0.220 |
Token | � |
Token ID | 447 |
Feature activation | -3.44e-01 |
Pos logit contributions | |
ゼ | +4.990 |
dos | +4.975 |
................................................................ | +4.921 |
kj | +4.662 |
verting | +4.646 |
Neg logit contributions | |
Honour | -9.288 |
acceptance | -8.896 |
emin | -8.867 |
ODY | -8.661 |
afety | -8.618 |
Token | � |
Token ID | 247 |
Feature activation | -8.04e-02 |
Pos logit contributions | |
�� | +1.524 |
ゼ | +1.462 |
dos | +1.437 |
eeper | +1.372 |
verting | +1.368 |
Neg logit contributions | |
Honour | -3.259 |
emin | -3.124 |
acceptance | -3.026 |
MENT | -3.025 |
ODY | -3.005 |
Token | t |
Token ID | 83 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
�� | +0.641 |
ゼ | +0.617 |
dos | +0.601 |
verting | +0.587 |
eeper | +0.585 |
Neg logit contributions | |
Honour | -0.490 |
emin | -0.464 |
acceptance | -0.437 |
MENT | -0.436 |
ODY | -0.426 |
Token | authorized |
Token ID | 10435 |
Feature activation | -8.92e-01 |
Pos logit contributions | |
verting | +7.505 |
eeper | +7.469 |
ゼ | +7.450 |
�� | +7.428 |
dos | +7.417 |
Neg logit contributions | |
Honour | -10.564 |
emin | -9.826 |
ODY | -9.822 |
acceptance | -9.530 |
MENT | -9.526 |
Token | to |
Token ID | 284 |
Feature activation | -3.82e-01 |
Pos logit contributions | |
dos | +5.915 |
�� | +5.876 |
ゼ | +5.745 |
verting | +5.743 |
................................................................ | +5.738 |
Neg logit contributions | |
Honour | -5.831 |
emin | -5.463 |
MENT | -5.297 |
ODY | -5.205 |
OPS | -5.136 |
Token | speak |
Token ID | 2740 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
�� | +2.744 |
dos | +2.700 |
ゼ | +2.669 |
eeper | +2.631 |
verting | +2.603 |
Neg logit contributions | |
Honour | -2.501 |
emin | -2.365 |
MENT | -2.249 |
ODY | -2.237 |
acceptance | -2.223 |
Token | to |
Token ID | 284 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
�� | +0.992 |
ゼ | +0.967 |
dos | +0.957 |
eeper | +0.935 |
verting | +0.933 |
Neg logit contributions | |
Honour | -0.783 |
emin | -0.732 |
MENT | -0.695 |
acceptance | -0.695 |
ODY | -0.689 |
Token | the |
Token ID | 262 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
Honour | +0.937 |
emin | +0.862 |
acceptance | +0.837 |
MENT | +0.821 |
ODY | +0.814 |
Neg logit contributions | |
�� | -1.322 |
ゼ | -1.277 |
dos | -1.266 |
eeper | -1.232 |
verting | -1.224 |
Token | companies |
Token ID | 2706 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
Honour | +0.894 |
emin | +0.825 |
acceptance | +0.816 |
MENT | +0.786 |
ODY | +0.777 |
Neg logit contributions | |
�� | -1.021 |
ゼ | -0.987 |
dos | -0.966 |
eeper | -0.953 |
verting | -0.939 |
Token | involved |
Token ID | 2950 |
Feature activation | -3.26e-01 |
Pos logit contributions | |
Honour | +1.052 |
emin | +0.986 |
acceptance | +0.951 |
MENT | +0.939 |
ODY | +0.928 |
Neg logit contributions | |
�� | -1.134 |
ゼ | -1.097 |
dos | -1.081 |
eeper | -1.047 |
verting | -1.043 |
Token | in |
Token ID | 287 |
Feature activation | +2.61e-01 |
Pos logit contributions | |
�� | +2.195 |
ゼ | +2.162 |
dos | +2.122 |
eeper | +2.093 |
verting | +2.071 |
Neg logit contributions | |
Honour | -2.273 |
emin | -2.147 |
MENT | -2.051 |
acceptance | -2.031 |
ODY | -2.024 |
Token | the |
Token ID | 262 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
Honour | +1.593 |
emin | +1.472 |
acceptance | +1.439 |
MENT | +1.383 |
ODY | +1.378 |
Neg logit contributions | |
�� | -2.039 |
ゼ | -1.988 |
dos | -1.965 |
eeper | -1.917 |
verting | -1.896 |
Token | development |
Token ID | 2478 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
Honour | +1.242 |
emin | +1.144 |
acceptance | +1.125 |
MENT | +1.083 |
ODY | +1.074 |
Neg logit contributions | |
�� | -1.533 |
ゼ | -1.497 |
dos | -1.474 |
eeper | -1.443 |
verting | -1.432 |
Token | and |
Token ID | 290 |
Feature activation | +9.02e-01 |
Pos logit contributions | |
�� | +0.763 |
ゼ | +0.747 |
dos | +0.731 |
eeper | +0.718 |
verting | +0.716 |
Neg logit contributions | |
Honour | -0.687 |
emin | -0.643 |
MENT | -0.613 |
ODY | -0.609 |
acceptance | -0.607 |
Token | support |
Token ID | 1104 |
Feature activation | +1.79e-01 |
Pos logit contributions | |
acceptance | +4.935 |
Honour | +4.920 |
emin | +4.484 |
MENT | +4.346 |
OPS | +4.137 |
Neg logit contributions | |
�� | -7.324 |
ゼ | -7.021 |
dos | -6.961 |
eeper | -6.819 |
verting | -6.639 |
Token | for |
Token ID | 329 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
Honour | +1.115 |
emin | +1.044 |
acceptance | +0.997 |
MENT | +0.994 |
ODY | +0.984 |
Neg logit contributions | |
�� | -1.368 |
ゼ | -1.332 |
dos | -1.320 |
eeper | -1.286 |
verting | -1.282 |
Token | Koh |
Token ID | 24754 |
Feature activation | -8.82e-02 |
Pos logit contributions | |
Honour | +1.266 |
emin | +1.167 |
acceptance | +1.139 |
MENT | +1.098 |
ODY | +1.092 |
Neg logit contributions | |
�� | -1.622 |
ゼ | -1.584 |
dos | -1.563 |
eeper | -1.532 |
verting | -1.519 |
Token | a |
Token ID | 64 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
�� | +0.705 |
ゼ | +0.688 |
dos | +0.681 |
eeper | +0.666 |
verting | +0.664 |
Neg logit contributions | |
Honour | -0.521 |
emin | -0.486 |
acceptance | -0.461 |
MENT | -0.461 |
ODY | -0.456 |
Token | , |
Token ID | 11 |
Feature activation | -5.46e-02 |
Pos logit contributions | |
�� | +0.747 |
ゼ | +0.727 |
dos | +0.720 |
eeper | +0.701 |
verting | +0.699 |
Neg logit contributions | |
Honour | -0.655 |
emin | -0.615 |
acceptance | -0.587 |
MENT | -0.585 |
ODY | -0.581 |
Token | has |
Token ID | 468 |
Feature activation | +2.44e-01 |
Pos logit contributions | |
�� | +0.512 |
ゼ | +0.498 |
dos | +0.492 |
eeper | +0.480 |
verting | +0.478 |
Neg logit contributions | |
Honour | -0.489 |
emin | -0.461 |
acceptance | -0.440 |
MENT | -0.440 |
ODY | -0.436 |
Token | not |
Token ID | 407 |
Feature activation | -2.40e-01 |
Pos logit contributions | |
Honour | +1.475 |
emin | +1.381 |
acceptance | +1.339 |
MENT | +1.321 |
ODY | +1.301 |
Neg logit contributions | |
�� | -1.931 |
ゼ | -1.857 |
dos | -1.848 |
eeper | -1.798 |
verting | -1.797 |
Token | wanted |
Token ID | 2227 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
�� | +1.771 |
ゼ | +1.735 |
dos | +1.715 |
eeper | +1.672 |
verting | +1.670 |
Neg logit contributions | |
Honour | -1.557 |
emin | -1.451 |
MENT | -1.385 |
acceptance | -1.379 |
ODY | -1.373 |
Token | to |
Token ID | 284 |
Feature activation | +2.73e-01 |
Pos logit contributions | |
Honour | +0.735 |
emin | +0.681 |
acceptance | +0.649 |
MENT | +0.642 |
ODY | +0.638 |
Neg logit contributions | |
�� | -1.119 |
ゼ | -1.090 |
dos | -1.077 |
eeper | -1.054 |
verting | -1.052 |
Token | believe |
Token ID | 1975 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
Honour | +1.680 |
emin | +1.545 |
acceptance | +1.529 |
MENT | +1.473 |
ODY | +1.464 |
Neg logit contributions | |
�� | -2.163 |
ゼ | -2.075 |
dos | -1.995 |
verting | -1.976 |
eeper | -1.975 |
Token | that |
Token ID | 326 |
Feature activation | +9.37e-01 |
Pos logit contributions | |
Honour | +2.460 |
emin | +2.294 |
acceptance | +2.248 |
MENT | +2.199 |
ODY | +2.177 |
Neg logit contributions | |
�� | -3.051 |
ゼ | -2.920 |
dos | -2.897 |
verting | -2.833 |
eeper | -2.825 |
Token | it |
Token ID | 340 |
Feature activation | +4.56e-01 |
Pos logit contributions | |
Honour | +4.902 |
acceptance | +4.671 |
emin | +4.590 |
MENT | +4.344 |
ODY | +4.330 |
Neg logit contributions | |
�� | -7.996 |
ゼ | -7.508 |
dos | -7.408 |
eeper | -7.365 |
arthed | -7.285 |
Token | � |
Token ID | 447 |
Feature activation | +9.74e-02 |
Pos logit contributions | |
Honour | +2.705 |
emin | +2.608 |
acceptance | +2.461 |
MENT | +2.436 |
ODY | +2.416 |
Neg logit contributions | |
�� | -3.593 |
ゼ | -3.445 |
dos | -3.428 |
verting | -3.370 |
eeper | -3.335 |
Token | � |
Token ID | 247 |
Feature activation | +3.67e-01 |
Pos logit contributions | |
Honour | +0.898 |
emin | +0.877 |
MENT | +0.851 |
acceptance | +0.840 |
ODY | +0.831 |
Neg logit contributions | |
�� | -0.437 |
ゼ | -0.433 |
dos | -0.427 |
verting | -0.398 |
eeper | -0.390 |
Token | s |
Token ID | 82 |
Feature activation | +4.10e-01 |
Pos logit contributions | |
Honour | +2.577 |
emin | +2.560 |
acceptance | +2.369 |
MENT | +2.358 |
OPS | +2.317 |
Neg logit contributions | |
�� | -2.501 |
ゼ | -2.421 |
dos | -2.290 |
verting | -2.251 |
eeper | -2.248 |
Token | something |
Token ID | 1223 |
Feature activation | -6.81e-02 |
Pos logit contributions | |
Honour | +2.573 |
emin | +2.449 |
acceptance | +2.399 |
MENT | +2.295 |
ODY | +2.278 |
Neg logit contributions | |
�� | -3.112 |
ゼ | -3.011 |
dos | -2.993 |
eeper | -2.923 |
verting | -2.889 |
Token | … |
Token ID | 1399 |
Feature activation | +9.26e-02 |
Pos logit contributions | |
Honour | +0.376 |
emin | +0.350 |
acceptance | +0.336 |
MENT | +0.333 |
ODY | +0.330 |
Neg logit contributions | |
�� | -0.472 |
ゼ | -0.459 |
dos | -0.452 |
verting | -0.443 |
eeper | -0.441 |
Token | The |
Token ID | 383 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
Honour | +0.592 |
emin | +0.554 |
MENT | +0.529 |
acceptance | +0.528 |
ODY | +0.521 |
Neg logit contributions | |
�� | -0.701 |
ゼ | -0.681 |
dos | -0.671 |
verting | -0.656 |
eeper | -0.654 |
Token | majority |
Token ID | 3741 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
Honour | +0.943 |
emin | +0.877 |
acceptance | +0.859 |
MENT | +0.840 |
ODY | +0.836 |
Neg logit contributions | |
�� | -0.989 |
ゼ | -0.962 |
dos | -0.944 |
eeper | -0.923 |
verting | -0.920 |
Token | of |
Token ID | 286 |
Feature activation | +4.52e-01 |
Pos logit contributions | |
Honour | +2.022 |
emin | +1.857 |
acceptance | +1.817 |
MENT | +1.770 |
ODY | +1.749 |
Neg logit contributions | |
�� | -2.841 |
ゼ | -2.745 |
dos | -2.681 |
verting | -2.640 |
eeper | -2.631 |
Token | the |
Token ID | 262 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
Honour | +2.690 |
emin | +2.431 |
acceptance | +2.421 |
MENT | +2.323 |
ODY | +2.289 |
Neg logit contributions | |
�� | -3.622 |
ゼ | -3.510 |
dos | -3.422 |
eeper | -3.414 |
verting | -3.343 |
Token | time |
Token ID | 640 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
Honour | +1.699 |
emin | +1.551 |
acceptance | +1.536 |
MENT | +1.481 |
ODY | +1.466 |
Neg logit contributions | |
�� | -2.155 |
ゼ | -2.079 |
dos | -2.041 |
eeper | -2.026 |
verting | -1.992 |
Token | when |
Token ID | 618 |
Feature activation | +2.84e-01 |
Pos logit contributions | |
Honour | +5.652 |
acceptance | +5.105 |
emin | +5.017 |
MENT | +4.920 |
ODY | +4.793 |
Neg logit contributions | |
�� | -9.082 |
ゼ | -8.676 |
arthed | -8.446 |
verting | -8.398 |
dos | -8.374 |
Token | I |
Token ID | 314 |
Feature activation | +8.10e-02 |
Pos logit contributions | |
Honour | +1.744 |
emin | +1.613 |
acceptance | +1.571 |
MENT | +1.541 |
ODY | +1.515 |
Neg logit contributions | |
�� | -2.225 |
ゼ | -2.158 |
dos | -2.119 |
eeper | -2.083 |
verting | -2.065 |
Token | meet |
Token ID | 1826 |
Feature activation | +4.83e-01 |
Pos logit contributions | |
Honour | +0.520 |
emin | +0.485 |
acceptance | +0.464 |
MENT | +0.463 |
ODY | +0.456 |
Neg logit contributions | |
�� | -0.614 |
ゼ | -0.598 |
dos | -0.585 |
eeper | -0.573 |
verting | -0.571 |
Token | somebody |
Token ID | 8276 |
Feature activation | -4.97e-01 |
Pos logit contributions | |
Honour | +2.698 |
emin | +2.480 |
acceptance | +2.429 |
MENT | +2.327 |
ODY | +2.319 |
Neg logit contributions | |
�� | -4.069 |
ゼ | -3.941 |
dos | -3.868 |
eeper | -3.778 |
verting | -3.765 |
Token | from |
Token ID | 422 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
�� | +3.182 |
ゼ | +3.118 |
dos | +3.090 |
eeper | +3.012 |
verting | +2.989 |
Neg logit contributions | |
Honour | -3.598 |
emin | -3.422 |
MENT | -3.268 |
ODY | -3.249 |
acceptance | -3.231 |
Token | Andromeda |
Token ID | 34542 |
Feature activation | +6.82e-01 |
Pos logit contributions | |
Honour | +0.109 |
emin | +0.102 |
acceptance | +0.097 |
MENT | +0.097 |
ODY | +0.096 |
Neg logit contributions | |
�� | -0.121 |
ゼ | -0.118 |
dos | -0.116 |
eeper | -0.113 |
verting | -0.113 |
Token | galaxy |
Token ID | 16161 |
Feature activation | +7.18e-01 |
Pos logit contributions | |
Honour | +4.601 |
emin | +4.284 |
acceptance | +4.187 |
ODY | +4.044 |
Expression | +3.989 |
Neg logit contributions | |
�� | -4.819 |
ゼ | -4.708 |
dos | -4.602 |
eeper | -4.449 |
verting | -4.434 |
Token | ( |
Token ID | 357 |
Feature activation | +5.19e-01 |
Pos logit contributions | |
Honour | +4.209 |
emin | +3.996 |
acceptance | +3.789 |
MENT | +3.727 |
ODY | +3.722 |
Neg logit contributions | |
�� | -5.508 |
dos | -5.396 |
ゼ | -5.393 |
verting | -5.249 |
eeper | -5.206 |
Token | 2 |
Token ID | 17 |
Feature activation | +7.40e-01 |
Pos logit contributions | |
Honour | +3.192 |
emin | +3.110 |
MENT | +2.943 |
OPS | +2.891 |
ODY | +2.891 |
Neg logit contributions | |
�� | -3.932 |
ゼ | -3.678 |
dos | -3.642 |
eeper | -3.629 |
verting | -3.626 |
Token | , |
Token ID | 11 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
Honour | +4.142 |
emin | +3.871 |
MENT | +3.607 |
ODY | +3.589 |
acceptance | +3.588 |
Neg logit contributions | |
�� | -5.881 |
ゼ | -5.715 |
dos | -5.711 |
eeper | -5.614 |
verting | -5.556 |
Token | 000 |
Token ID | 830 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
Honour | +0.729 |
emin | +0.689 |
MENT | +0.659 |
acceptance | +0.655 |
ODY | +0.654 |
Neg logit contributions | |
�� | -0.711 |
ゼ | -0.686 |
dos | -0.678 |
eeper | -0.661 |
verting | -0.660 |
Token | , |
Token ID | 11 |
Feature activation | -5.37e-02 |
Pos logit contributions | |
Honour | +5.028 |
emin | +4.592 |
MENT | +4.212 |
acceptance | +4.166 |
ODY | +4.165 |
Neg logit contributions | |
�� | -9.548 |
ゼ | -9.368 |
dos | -9.320 |
eeper | -9.190 |
arthed | -9.094 |
Token | 000 |
Token ID | 830 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
�� | +0.323 |
ゼ | +0.308 |
dos | +0.303 |
eeper | +0.296 |
verting | +0.294 |
Neg logit contributions | |
Honour | -0.429 |
emin | -0.408 |
MENT | -0.393 |
acceptance | -0.391 |
ODY | -0.390 |
Token | Light |
Token ID | 4401 |
Feature activation | +6.76e-01 |
Pos logit contributions | |
Honour | +4.232 |
emin | +3.813 |
MENT | +3.426 |
acceptance | +3.417 |
OPS | +3.390 |
Neg logit contributions | |
�� | -9.789 |
ゼ | -9.612 |
dos | -9.576 |
eeper | -9.483 |
arthed | -9.332 |
Token | Years |
Token ID | 13212 |
Feature activation | +8.48e-01 |
Pos logit contributions | |
Honour | +4.520 |
emin | +4.236 |
OPS | +3.931 |
acceptance | +3.914 |
Expression | +3.876 |
Neg logit contributions | |
�� | -4.847 |
ゼ | -4.781 |
eeper | -4.642 |
dos | -4.546 |
olulu | -4.415 |
Token | ) |
Token ID | 8 |
Feature activation | +5.87e-01 |
Pos logit contributions | |
Honour | +4.376 |
emin | +4.071 |
acceptance | +3.909 |
MENT | +3.838 |
ODY | +3.794 |
Neg logit contributions | |
�� | -7.021 |
ゼ | -6.890 |
dos | -6.878 |
verting | -6.688 |
eeper | -6.600 |
Token | in |
Token ID | 287 |
Feature activation | +1.92e-01 |
Pos logit contributions | |
Honour | +0.077 |
emin | +0.072 |
acceptance | +0.069 |
MENT | +0.069 |
ODY | +0.068 |
Neg logit contributions | |
�� | -0.087 |
ゼ | -0.084 |
dos | -0.083 |
eeper | -0.081 |
verting | -0.081 |
Token | Canada |
Token ID | 3340 |
Feature activation | +2.89e-02 |
Pos logit contributions | |
Honour | +0.912 |
emin | +0.819 |
acceptance | +0.770 |
MENT | +0.755 |
ODY | +0.748 |
Neg logit contributions | |
�� | -1.783 |
ゼ | -1.750 |
dos | -1.714 |
eeper | -1.700 |
verting | -1.668 |
Token | found |
Token ID | 1043 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
Honour | +0.187 |
emin | +0.175 |
acceptance | +0.168 |
MENT | +0.167 |
ODY | +0.165 |
Neg logit contributions | |
�� | -0.218 |
ゼ | -0.212 |
dos | -0.208 |
eeper | -0.203 |
verting | -0.203 |
Token | 73 |
Token ID | 8854 |
Feature activation | +4.85e-01 |
Pos logit contributions | |
Honour | +2.129 |
emin | +1.969 |
acceptance | +1.927 |
MENT | +1.879 |
ODY | +1.843 |
Neg logit contributions | |
�� | -2.881 |
ゼ | -2.787 |
dos | -2.725 |
verting | -2.678 |
eeper | -2.667 |
Token | per |
Token ID | 583 |
Feature activation | -4.05e-01 |
Pos logit contributions | |
Honour | +3.868 |
emin | +3.659 |
acceptance | +3.615 |
MENT | +3.553 |
ODY | +3.528 |
Neg logit contributions | |
�� | -2.855 |
ゼ | -2.751 |
dos | -2.659 |
eeper | -2.616 |
verting | -2.590 |
Token | cent |
Token ID | 1247 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
�� | +2.108 |
ゼ | +2.049 |
dos | +2.022 |
verting | +1.950 |
eeper | +1.948 |
Neg logit contributions | |
Honour | -3.488 |
emin | -3.319 |
MENT | -3.207 |
acceptance | -3.200 |
ODY | -3.196 |
Token | of |
Token ID | 286 |
Feature activation | +4.99e-01 |
Pos logit contributions | |
Honour | +5.734 |
acceptance | +5.298 |
MENT | +5.012 |
emin | +4.951 |
OPS | +4.836 |
Neg logit contributions | |
�� | -9.412 |
ゼ | -8.996 |
dos | -8.718 |
verting | -8.713 |
eeper | -8.620 |
Token | Saskatchewan |
Token ID | 31346 |
Feature activation | +3.27e-01 |
Pos logit contributions | |
Honour | +3.073 |
emin | +2.803 |
acceptance | +2.752 |
MENT | +2.698 |
ODY | +2.633 |
Neg logit contributions | |
�� | -3.953 |
ゼ | -3.850 |
eeper | -3.730 |
dos | -3.702 |
verting | -3.634 |
Token | respondents |
Token ID | 14502 |
Feature activation | +5.90e-01 |
Pos logit contributions | |
Honour | +2.021 |
emin | +1.884 |
acceptance | +1.804 |
MENT | +1.787 |
ODY | +1.753 |
Neg logit contributions | |
�� | -2.579 |
ゼ | -2.489 |
dos | -2.439 |
eeper | -2.400 |
verting | -2.386 |
Token | weren |
Token ID | 6304 |
Feature activation | +3.36e-02 |
Pos logit contributions | |
Honour | +3.452 |
acceptance | +3.186 |
emin | +3.145 |
MENT | +3.049 |
ODY | +2.976 |
Neg logit contributions | |
�� | -4.813 |
ゼ | -4.612 |
dos | -4.472 |
eeper | -4.433 |
verting | -4.390 |
Token | � |
Token ID | 447 |
Feature activation | -8.92e-02 |
Pos logit contributions | |
Honour | +0.255 |
emin | +0.242 |
MENT | +0.233 |
acceptance | +0.230 |
ODY | +0.230 |
Neg logit contributions | |
�� | -0.219 |
ゼ | -0.207 |
dos | -0.204 |
eeper | -0.200 |
verting | -0.198 |
Token | Saul |
Token ID | 31603 |
Feature activation | +4.20e-01 |
Pos logit contributions | |
�� | +3.475 |
ゼ | +3.422 |
dos | +3.385 |
eeper | +3.278 |
verting | +3.276 |
Neg logit contributions | |
Honour | -2.664 |
emin | -2.505 |
acceptance | -2.368 |
MENT | -2.350 |
ODY | -2.316 |
Token | LO |
Token ID | 17579 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
Honour | +2.396 |
emin | +2.290 |
acceptance | +2.127 |
ODY | +2.098 |
MENT | +2.087 |
Neg logit contributions | |
�� | -3.407 |
dos | -3.335 |
ゼ | -3.313 |
verting | -3.256 |
eeper | -3.252 |
Token | EB |
Token ID | 30195 |
Feature activation | +4.84e-01 |
Pos logit contributions | |
Honour | +0.655 |
emin | +0.581 |
acceptance | +0.534 |
MENT | +0.528 |
ODY | +0.520 |
Neg logit contributions | |
�� | -1.665 |
ゼ | -1.624 |
dos | -1.621 |
verting | -1.588 |
eeper | -1.586 |
Token | SA |
Token ID | 4090 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
Honour | +2.863 |
emin | +2.606 |
MENT | +2.577 |
ODY | +2.557 |
acceptance | +2.508 |
Neg logit contributions | |
�� | -3.932 |
ゼ | -3.779 |
dos | -3.684 |
eeper | -3.675 |
verting | -3.657 |
Token | UL |
Token ID | 6239 |
Feature activation | +4.01e-02 |
Pos logit contributions | |
Honour | +0.086 |
emin | +0.080 |
MENT | +0.077 |
acceptance | +0.076 |
ODY | +0.076 |
Neg logit contributions | |
�� | -0.100 |
ゼ | -0.097 |
dos | -0.096 |
eeper | -0.094 |
verting | -0.094 |
Token | LO |
Token ID | 17579 |
Feature activation | +3.95e-01 |
Pos logit contributions | |
Honour | +0.233 |
emin | +0.215 |
MENT | +0.210 |
ODY | +0.206 |
acceptance | +0.204 |
Neg logit contributions | |
�� | -0.330 |
ゼ | -0.319 |
dos | -0.314 |
eeper | -0.311 |
verting | -0.309 |
Token | EB |
Token ID | 30195 |
Feature activation | +2.55e-01 |
Pos logit contributions | |
Honour | +1.125 |
emin | +0.994 |
ODY | +0.991 |
MENT | +0.950 |
OPS | +0.916 |
Neg logit contributions | |
�� | -4.341 |
dos | -4.264 |
ゼ | -4.246 |
eeper | -4.222 |
verting | -4.155 |
Token | / |
Token ID | 14 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
Honour | +1.462 |
emin | +1.359 |
ODY | +1.299 |
MENT | +1.298 |
acceptance | +1.285 |
Neg logit contributions | |
�� | -2.102 |
ゼ | -2.042 |
dos | -2.024 |
eeper | -1.979 |
verting | -1.974 |
Token | AFP |
Token ID | 17449 |
Feature activation | -8.30e-03 |
Pos logit contributions | |
�� | +0.913 |
ゼ | +0.890 |
dos | +0.881 |
eeper | +0.862 |
verting | +0.859 |
Neg logit contributions | |
Honour | -0.673 |
emin | -0.628 |
MENT | -0.596 |
acceptance | -0.595 |
ODY | -0.589 |
Token | / |
Token ID | 14 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
�� | +0.071 |
ゼ | +0.070 |
dos | +0.069 |
eeper | +0.068 |
verting | +0.067 |
Neg logit contributions | |
Honour | -0.044 |
emin | -0.041 |
MENT | -0.039 |
acceptance | -0.039 |
ODY | -0.038 |
Token | Getty |
Token ID | 6633 |
Feature activation | -3.75e-01 |
Pos logit contributions | |
�� | +1.693 |
ゼ | +1.684 |
dos | +1.664 |
verting | +1.587 |
eeper | +1.575 |
Neg logit contributions | |
Honour | -2.185 |
emin | -2.059 |
acceptance | -1.995 |
ODY | -1.953 |
MENT | -1.946 |
Token | Sean |
Token ID | 11465 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
Honour | +1.688 |
emin | +1.527 |
acceptance | +1.495 |
MENT | +1.468 |
ODY | +1.455 |
Neg logit contributions | |
�� | -2.278 |
ゼ | -2.199 |
dos | -2.153 |
verting | -2.119 |
eeper | -2.107 |
Token | , |
Token ID | 11 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
Honour | +0.755 |
emin | +0.705 |
MENT | +0.672 |
acceptance | +0.669 |
ODY | +0.662 |
Neg logit contributions | |
�� | -0.924 |
ゼ | -0.899 |
dos | -0.881 |
eeper | -0.864 |
verting | -0.863 |
Token | found |
Token ID | 1043 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
Honour | +1.205 |
emin | +1.127 |
acceptance | +1.092 |
MENT | +1.089 |
ODY | +1.074 |
Neg logit contributions | |
�� | -1.356 |
ゼ | -1.303 |
dos | -1.280 |
verting | -1.258 |
eeper | -1.250 |
Token | his |
Token ID | 465 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
Honour | +1.243 |
emin | +1.150 |
acceptance | +1.126 |
MENT | +1.106 |
ODY | +1.100 |
Neg logit contributions | |
�� | -1.397 |
ゼ | -1.347 |
dos | -1.325 |
verting | -1.297 |
eeper | -1.292 |
Token | father |
Token ID | 2988 |
Feature activation | +4.26e-01 |
Pos logit contributions | |
Honour | +1.350 |
emin | +1.230 |
acceptance | +1.227 |
MENT | +1.196 |
ODY | +1.193 |
Neg logit contributions | |
�� | -1.433 |
ゼ | -1.391 |
dos | -1.359 |
eeper | -1.331 |
verting | -1.319 |
Token | after |
Token ID | 706 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
Honour | +2.700 |
emin | +2.493 |
acceptance | +2.449 |
MENT | +2.406 |
ODY | +2.373 |
Neg logit contributions | |
�� | -3.286 |
ゼ | -3.100 |
dos | -3.091 |
eeper | -3.021 |
verting | -2.970 |
Token | hearing |
Token ID | 4854 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
Honour | +1.607 |
emin | +1.486 |
acceptance | +1.455 |
ODY | +1.411 |
MENT | +1.410 |
Neg logit contributions | |
�� | -2.116 |
ゼ | -2.044 |
dos | -1.979 |
eeper | -1.960 |
verting | -1.942 |
Token | " |
Token ID | 366 |
Feature activation | -3.80e-01 |
Pos logit contributions | |
�� | +1.684 |
ゼ | +1.647 |
dos | +1.630 |
eeper | +1.587 |
verting | +1.582 |
Neg logit contributions | |
Honour | -1.495 |
emin | -1.411 |
MENT | -1.338 |
acceptance | -1.334 |
ODY | -1.327 |
Token | f |
Token ID | 69 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
�� | +2.859 |
dos | +2.808 |
ゼ | +2.804 |
eeper | +2.708 |
verting | +2.706 |
Neg logit contributions | |
Honour | -2.394 |
emin | -2.184 |
acceptance | -2.124 |
MENT | -2.098 |
ODY | -2.096 |
Token | aint |
Token ID | 2913 |
Feature activation | -7.13e-01 |
Pos logit contributions | |
Honour | +0.728 |
emin | +0.701 |
acceptance | +0.662 |
ODY | +0.650 |
MENT | +0.647 |
Neg logit contributions | |
�� | -0.748 |
ゼ | -0.735 |
dos | -0.714 |
verting | -0.686 |
eeper | -0.685 |
Token | yells |
Token ID | 42675 |
Feature activation | -5.51e-01 |
Pos logit contributions | |
�� | +4.629 |
ゼ | +4.550 |
dos | +4.391 |
verting | +4.382 |
eeper | +4.319 |
Neg logit contributions | |
Honour | -4.930 |
emin | -4.733 |
afety | -4.452 |
MENT | -4.447 |
OPS | -4.444 |
Token | Will |
Token ID | 2561 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
Honour | +0.426 |
emin | +0.395 |
MENT | +0.376 |
acceptance | +0.376 |
ODY | +0.372 |
Neg logit contributions | |
�� | -0.537 |
ゼ | -0.518 |
dos | -0.514 |
eeper | -0.504 |
verting | -0.501 |
Token | has |
Token ID | 468 |
Feature activation | +4.85e-02 |
Pos logit contributions | |
Honour | +1.472 |
emin | +1.395 |
acceptance | +1.335 |
MENT | +1.328 |
ODY | +1.307 |
Neg logit contributions | |
�� | -1.704 |
ゼ | -1.641 |
dos | -1.624 |
verting | -1.590 |
eeper | -1.574 |
Token | used |
Token ID | 973 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
Honour | +0.308 |
emin | +0.289 |
acceptance | +0.278 |
MENT | +0.276 |
ODY | +0.271 |
Neg logit contributions | |
�� | -0.368 |
ゼ | -0.357 |
dos | -0.354 |
verting | -0.344 |
eeper | -0.344 |
Token | his |
Token ID | 465 |
Feature activation | +2.74e-01 |
Pos logit contributions | |
Honour | +0.716 |
emin | +0.662 |
acceptance | +0.641 |
MENT | +0.625 |
ODY | +0.620 |
Neg logit contributions | |
�� | -0.932 |
ゼ | -0.908 |
dos | -0.899 |
eeper | -0.877 |
verting | -0.872 |
Token | experiences |
Token ID | 6461 |
Feature activation | -6.53e-02 |
Pos logit contributions | |
Honour | +1.957 |
emin | +1.840 |
acceptance | +1.823 |
MENT | +1.760 |
ODY | +1.726 |
Neg logit contributions | |
�� | -1.865 |
ゼ | -1.814 |
dos | -1.794 |
eeper | -1.737 |
verting | -1.728 |
Token | to |
Token ID | 284 |
Feature activation | +7.93e-02 |
Pos logit contributions | |
�� | +0.500 |
ゼ | +0.485 |
dos | +0.482 |
eeper | +0.469 |
verting | +0.468 |
Neg logit contributions | |
Honour | -0.408 |
emin | -0.385 |
acceptance | -0.366 |
MENT | -0.364 |
ODY | -0.361 |
Token | help |
Token ID | 1037 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
Honour | +0.527 |
emin | +0.494 |
acceptance | +0.477 |
MENT | +0.473 |
ODY | +0.466 |
Neg logit contributions | |
�� | -0.580 |
ゼ | -0.563 |
dos | -0.554 |
eeper | -0.542 |
verting | -0.540 |
Token | teach |
Token ID | 4545 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
Honour | +1.228 |
emin | +1.127 |
acceptance | +1.093 |
MENT | +1.068 |
ODY | +1.051 |
Neg logit contributions | |
�� | -1.989 |
ゼ | -1.932 |
dos | -1.906 |
eeper | -1.874 |
verting | -1.864 |
Token | others |
Token ID | 1854 |
Feature activation | -6.98e-02 |
Pos logit contributions | |
Honour | +0.587 |
emin | +0.534 |
acceptance | +0.510 |
MENT | +0.498 |
ODY | +0.491 |
Neg logit contributions | |
�� | -1.133 |
ゼ | -1.109 |
dos | -1.095 |
eeper | -1.077 |
verting | -1.068 |
Token | to |
Token ID | 284 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
�� | +0.535 |
ゼ | +0.522 |
dos | +0.517 |
eeper | +0.505 |
verting | +0.504 |
Neg logit contributions | |
Honour | -0.434 |
emin | -0.406 |
MENT | -0.386 |
acceptance | -0.385 |
ODY | -0.382 |
Token | follow |
Token ID | 1061 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
Honour | +0.935 |
emin | +0.866 |
acceptance | +0.840 |
MENT | +0.814 |
ODY | +0.807 |
Neg logit contributions | |
�� | -1.402 |
ゼ | -1.367 |
dos | -1.332 |
eeper | -1.313 |
verting | -1.307 |
Token | � |
Token ID | 447 |
Feature activation | +2.49e-01 |
Pos logit contributions | |
Honour | +1.267 |
emin | +1.188 |
acceptance | +1.136 |
MENT | +1.132 |
ODY | +1.122 |
Neg logit contributions | |
�� | -1.586 |
ゼ | -1.530 |
dos | -1.505 |
verting | -1.477 |
eeper | -1.468 |
Token | � |
Token ID | 251 |
Feature activation | -9.81e-02 |
Pos logit contributions | |
Honour | +2.409 |
emin | +2.323 |
acceptance | +2.263 |
MENT | +2.260 |
ODY | +2.231 |
Neg logit contributions | |
dos | -0.978 |
ゼ | -0.973 |
�� | -0.948 |
verting | -0.893 |
eeper | -0.884 |
Token | and |
Token ID | 290 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
�� | +0.716 |
ゼ | +0.698 |
dos | +0.690 |
eeper | +0.673 |
verting | +0.671 |
Neg logit contributions | |
Honour | -0.646 |
emin | -0.607 |
MENT | -0.579 |
acceptance | -0.578 |
ODY | -0.575 |
Token | � |
Token ID | 564 |
Feature activation | -6.41e-02 |
Pos logit contributions | |
�� | +0.769 |
ゼ | +0.749 |
dos | +0.741 |
eeper | +0.722 |
verting | +0.721 |
Neg logit contributions | |
Honour | -0.665 |
emin | -0.625 |
MENT | -0.595 |
acceptance | -0.594 |
ODY | -0.590 |
Token | � |
Token ID | 250 |
Feature activation | +3.64e-01 |
Pos logit contributions | |
�� | +0.109 |
ゼ | +0.100 |
dos | +0.097 |
eeper | +0.085 |
verting | +0.081 |
Neg logit contributions | |
Honour | -0.779 |
emin | -0.755 |
MENT | -0.737 |
acceptance | -0.736 |
ODY | -0.731 |
Token | My |
Token ID | 3666 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
Honour | +2.064 |
emin | +1.914 |
MENT | +1.838 |
acceptance | +1.807 |
ODY | +1.787 |
Neg logit contributions | |
�� | -3.002 |
ゼ | -2.888 |
eeper | -2.844 |
dos | -2.838 |
verting | -2.802 |
Token | girlfriend |
Token ID | 11077 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
Honour | +1.739 |
emin | +1.619 |
acceptance | +1.573 |
MENT | +1.559 |
ODY | +1.554 |
Neg logit contributions | |
�� | -1.709 |
ゼ | -1.653 |
dos | -1.628 |
eeper | -1.598 |
verting | -1.590 |
Token | thinks |
Token ID | 6834 |
Feature activation | +6.11e-01 |
Pos logit contributions | |
Honour | +1.265 |
emin | +1.191 |
acceptance | +1.147 |
MENT | +1.136 |
ODY | +1.120 |
Neg logit contributions | |
�� | -1.463 |
ゼ | -1.404 |
dos | -1.390 |
verting | -1.360 |
eeper | -1.355 |
Token | I |
Token ID | 314 |
Feature activation | +3.37e-01 |
Pos logit contributions | |
Honour | +3.619 |
emin | +3.342 |
acceptance | +3.266 |
MENT | +3.189 |
ODY | +3.151 |
Neg logit contributions | |
�� | -4.822 |
ゼ | -4.635 |
dos | -4.570 |
verting | -4.507 |
eeper | -4.491 |
Token | � |
Token ID | 447 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
Honour | +2.183 |
emin | +2.071 |
acceptance | +1.980 |
MENT | +1.980 |
ODY | +1.940 |
Neg logit contributions | |
�� | -2.492 |
ゼ | -2.401 |
dos | -2.353 |
verting | -2.311 |
eeper | -2.302 |
Token | � |
Token ID | 247 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
�� | +1.235 |
ゼ | +1.189 |
dos | +1.167 |
verting | +1.100 |
eeper | +1.097 |
Neg logit contributions | |
Honour | -3.104 |
emin | -2.995 |
MENT | -2.906 |
acceptance | -2.900 |
ODY | -2.879 |
Token | firm |
Token ID | 4081 |
Feature activation | -3.82e-01 |
Pos logit contributions | |
Honour | +0.613 |
emin | +0.565 |
acceptance | +0.546 |
MENT | +0.543 |
ODY | +0.534 |
Neg logit contributions | |
�� | -0.730 |
ゼ | -0.692 |
dos | -0.690 |
eeper | -0.671 |
verting | -0.670 |
Token | was |
Token ID | 373 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
�� | +2.659 |
ゼ | +2.614 |
dos | +2.579 |
eeper | +2.525 |
verting | +2.517 |
Neg logit contributions | |
Honour | -2.599 |
emin | -2.446 |
MENT | -2.339 |
ODY | -2.328 |
acceptance | -2.326 |
Token | let |
Token ID | 1309 |
Feature activation | -3.88e-01 |
Pos logit contributions | |
�� | +1.952 |
ゼ | +1.904 |
dos | +1.886 |
eeper | +1.839 |
verting | +1.837 |
Neg logit contributions | |
Honour | -1.717 |
emin | -1.614 |
MENT | -1.539 |
acceptance | -1.538 |
ODY | -1.526 |
Token | off |
Token ID | 572 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
�� | +2.578 |
ゼ | +2.538 |
dos | +2.525 |
eeper | +2.443 |
verting | +2.429 |
Neg logit contributions | |
Honour | -2.745 |
emin | -2.613 |
acceptance | -2.476 |
MENT | -2.473 |
ODY | -2.467 |
Token | because |
Token ID | 780 |
Feature activation | -3.97e-01 |
Pos logit contributions | |
�� | +2.881 |
ゼ | +2.828 |
dos | +2.792 |
eeper | +2.750 |
verting | +2.727 |
Neg logit contributions | |
Honour | -2.456 |
emin | -2.318 |
acceptance | -2.198 |
ODY | -2.198 |
MENT | -2.189 |
Token | it |
Token ID | 340 |
Feature activation | +4.63e-02 |
Pos logit contributions | |
ゼ | +2.772 |
�� | +2.769 |
dos | +2.753 |
eeper | +2.654 |
verting | +2.642 |
Neg logit contributions | |
Honour | -2.610 |
emin | -2.507 |
MENT | -2.367 |
ODY | -2.354 |
acceptance | -2.319 |
Token | had |
Token ID | 550 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
Honour | +0.302 |
emin | +0.280 |
acceptance | +0.273 |
MENT | +0.270 |
ODY | +0.265 |
Neg logit contributions | |
�� | -0.350 |
ゼ | -0.334 |
dos | -0.328 |
eeper | -0.324 |
verting | -0.320 |
Token | blown |
Token ID | 16318 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
Honour | +1.003 |
emin | +0.925 |
acceptance | +0.915 |
MENT | +0.900 |
ODY | +0.878 |
Neg logit contributions | |
�� | -1.153 |
ゼ | -1.091 |
dos | -1.079 |
eeper | -1.061 |
verting | -1.047 |
Token | the |
Token ID | 262 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
�� | +1.268 |
ゼ | +1.238 |
dos | +1.225 |
eeper | +1.198 |
verting | +1.194 |
Neg logit contributions | |
Honour | -0.936 |
emin | -0.873 |
acceptance | -0.828 |
MENT | -0.827 |
ODY | -0.819 |
Token | whistle |
Token ID | 16121 |
Feature activation | -7.94e-03 |
Pos logit contributions | |
�� | +1.667 |
ゼ | +1.630 |
dos | +1.613 |
verting | +1.568 |
eeper | +1.567 |
Neg logit contributions | |
Honour | -1.511 |
emin | -1.429 |
MENT | -1.361 |
ODY | -1.353 |
acceptance | -1.352 |
Token | on |
Token ID | 319 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
�� | +0.064 |
ゼ | +0.062 |
dos | +0.062 |
eeper | +0.060 |
verting | +0.060 |
Neg logit contributions | |
Honour | -0.047 |
emin | -0.043 |
acceptance | -0.041 |
MENT | -0.041 |
ODY | -0.041 |
Token | something |
Token ID | 1223 |
Feature activation | -9.46e-02 |
Pos logit contributions | |
Honour | +1.125 |
emin | +1.047 |
acceptance | +1.015 |
MENT | +0.987 |
ODY | +0.976 |
Neg logit contributions | |
�� | -1.499 |
ゼ | -1.453 |
dos | -1.426 |
eeper | -1.391 |
verting | -1.388 |
Token | more |
Token ID | 517 |
Feature activation | -9.71e-02 |
Pos logit contributions | |
�� | +0.795 |
ゼ | +0.777 |
dos | +0.769 |
eeper | +0.754 |
verting | +0.751 |
Neg logit contributions | |
Honour | -0.520 |
emin | -0.482 |
MENT | -0.455 |
acceptance | -0.455 |
ODY | -0.450 |
Token | like |
Token ID | 588 |
Feature activation | +5.26e-01 |
Pos logit contributions | |
�� | +0.720 |
ゼ | +0.701 |
dos | +0.694 |
eeper | +0.677 |
verting | +0.675 |
Neg logit contributions | |
Honour | -0.630 |
emin | -0.591 |
acceptance | -0.564 |
MENT | -0.563 |
ODY | -0.558 |
Token | the |
Token ID | 262 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
Honour | +3.015 |
emin | +2.692 |
acceptance | +2.679 |
ODY | +2.525 |
MENT | +2.520 |
Neg logit contributions | |
�� | -4.396 |
ゼ | -4.233 |
dos | -4.112 |
eeper | -4.054 |
verting | -3.984 |
Token | dead |
Token ID | 2636 |
Feature activation | +6.65e-01 |
Pos logit contributions | |
Honour | +1.993 |
emin | +1.806 |
acceptance | +1.782 |
MENT | +1.716 |
ODY | +1.715 |
Neg logit contributions | |
�� | -2.479 |
ゼ | -2.405 |
dos | -2.347 |
eeper | -2.313 |
verting | -2.271 |
Token | lier |
Token ID | 2505 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
Honour | +3.646 |
emin | +3.335 |
acceptance | +3.298 |
MENT | +3.150 |
ODY | +3.149 |
Neg logit contributions | |
�� | -5.435 |
ゼ | -5.265 |
dos | -5.169 |
eeper | -5.119 |
arthed | -5.098 |
Token | bird |
Token ID | 6512 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
�� | +0.975 |
ゼ | +0.948 |
dos | +0.935 |
eeper | +0.913 |
verting | +0.908 |
Neg logit contributions | |
Honour | -0.944 |
emin | -0.887 |
acceptance | -0.851 |
MENT | -0.848 |
ODY | -0.841 |
Token | flu |
Token ID | 6562 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
Honour | +1.770 |
emin | +1.656 |
acceptance | +1.618 |
MENT | +1.592 |
ODY | +1.572 |
Neg logit contributions | |
�� | -1.608 |
ゼ | -1.562 |
dos | -1.534 |
eeper | -1.507 |
verting | -1.465 |
Token | . |
Token ID | 13 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
Honour | +1.184 |
emin | +1.108 |
acceptance | +1.066 |
MENT | +1.045 |
ODY | +1.038 |
Neg logit contributions | |
�� | -1.490 |
ゼ | -1.438 |
dos | -1.420 |
eeper | -1.390 |
verting | -1.371 |
Token | " |
Token ID | 366 |
Feature activation | +2.09e-01 |
Pos logit contributions | |
�� | +1.129 |
ゼ | +1.104 |
dos | +1.093 |
eeper | +1.063 |
verting | +1.063 |
Neg logit contributions | |
Honour | -0.949 |
emin | -0.894 |
acceptance | -0.853 |
MENT | -0.850 |
ODY | -0.841 |
Token | It |
Token ID | 1026 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
Honour | +1.199 |
emin | +1.117 |
MENT | +1.070 |
ODY | +1.059 |
acceptance | +1.040 |
Neg logit contributions | |
�� | -1.727 |
ゼ | -1.658 |
dos | -1.643 |
eeper | -1.634 |
verting | -1.610 |
Token |
|
Token ID | 198 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
�� | +0.416 |
ゼ | +0.403 |
dos | +0.401 |
eeper | +0.391 |
verting | +0.390 |
Neg logit contributions | |
Honour | -0.335 |
emin | -0.312 |
MENT | -0.297 |
acceptance | -0.296 |
ODY | -0.294 |
Token |
|
Token ID | 198 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
�� | +1.995 |
ゼ | +1.967 |
dos | +1.954 |
verting | +1.898 |
eeper | +1.896 |
Neg logit contributions | |
Honour | -1.623 |
emin | -1.520 |
acceptance | -1.451 |
MENT | -1.442 |
ODY | -1.435 |
Token | 13 |
Token ID | 1485 |
Feature activation | +9.64e-02 |
Pos logit contributions | |
�� | +3.144 |
ゼ | +3.127 |
dos | +3.064 |
verting | +2.949 |
eeper | +2.947 |
Neg logit contributions | |
Honour | -3.170 |
emin | -2.974 |
acceptance | -2.886 |
ODY | -2.824 |
afety | -2.808 |
Token | . |
Token ID | 13 |
Feature activation | -2.76e-01 |
Pos logit contributions | |
Honour | +0.610 |
emin | +0.567 |
MENT | +0.542 |
acceptance | +0.533 |
ODY | +0.531 |
Neg logit contributions | |
�� | -0.758 |
ゼ | -0.714 |
dos | -0.710 |
eeper | -0.704 |
verting | -0.693 |
Token | Resident |
Token ID | 22373 |
Feature activation | +4.90e-01 |
Pos logit contributions | |
�� | +2.063 |
ゼ | +2.021 |
dos | +1.988 |
eeper | +1.937 |
verting | +1.935 |
Neg logit contributions | |
Honour | -1.751 |
emin | -1.652 |
acceptance | -1.575 |
MENT | -1.570 |
ODY | -1.559 |
Token | Evil |
Token ID | 10461 |
Feature activation | -9.80e-02 |
Pos logit contributions | |
Honour | +2.429 |
emin | +2.126 |
acceptance | +2.082 |
MENT | +2.033 |
ODY | +1.987 |
Neg logit contributions | |
�� | -4.450 |
ゼ | -4.338 |
dos | -4.240 |
eeper | -4.182 |
verting | -4.179 |
Token | 4 |
Token ID | 604 |
Feature activation | +3.50e-01 |
Pos logit contributions | |
�� | +0.735 |
ゼ | +0.714 |
dos | +0.707 |
eeper | +0.691 |
verting | +0.688 |
Neg logit contributions | |
Honour | -0.632 |
emin | -0.590 |
acceptance | -0.563 |
MENT | -0.563 |
ODY | -0.556 |
Token |
|
Token ID | 198 |
Feature activation | +3.13e-02 |
Pos logit contributions | |
Honour | +2.175 |
emin | +1.997 |
MENT | +1.921 |
acceptance | +1.920 |
ODY | +1.867 |
Neg logit contributions | |
�� | -2.711 |
ゼ | -2.601 |
dos | -2.571 |
eeper | -2.553 |
verting | -2.536 |
Token |
|
Token ID | 198 |
Feature activation | +9.25e-02 |
Pos logit contributions | |
Honour | +0.177 |
emin | +0.163 |
MENT | +0.155 |
acceptance | +0.154 |
ODY | +0.152 |
Neg logit contributions | |
�� | -0.267 |
ゼ | -0.255 |
dos | -0.251 |
eeper | -0.249 |
verting | -0.246 |
Token | Mis |
Token ID | 31281 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
Honour | +0.544 |
emin | +0.513 |
MENT | +0.493 |
ODY | +0.482 |
acceptance | +0.479 |
Neg logit contributions | |
�� | -0.747 |
ゼ | -0.712 |
dos | -0.710 |
eeper | -0.704 |
verting | -0.699 |
Token | ao |
Token ID | 5488 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
Honour | +0.088 |
emin | +0.084 |
acceptance | +0.080 |
MENT | +0.080 |
ODY | +0.079 |
Neg logit contributions | |
�� | -0.074 |
ゼ | -0.072 |
dos | -0.070 |
eeper | -0.068 |
verting | -0.068 |
Token | , |
Token ID | 11 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
�� | +1.097 |
ゼ | +1.064 |
dos | +1.047 |
eeper | +1.026 |
verting | +1.020 |
Neg logit contributions | |
Honour | -1.041 |
emin | -0.977 |
acceptance | -0.937 |
MENT | -0.930 |
ODY | -0.922 |
Token | Prophet |
Token ID | 13583 |
Feature activation | +4.11e-02 |
Pos logit contributions | |
Honour | +1.076 |
emin | +0.983 |
acceptance | +0.955 |
MENT | +0.935 |
ODY | +0.922 |
Neg logit contributions | |
�� | -1.240 |
ゼ | -1.203 |
dos | -1.180 |
eeper | -1.162 |
verting | -1.148 |
Token | of |
Token ID | 286 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
Honour | +0.258 |
emin | +0.241 |
acceptance | +0.229 |
MENT | +0.227 |
ODY | +0.224 |
Neg logit contributions | |
�� | -0.316 |
ゼ | -0.307 |
dos | -0.304 |
eeper | -0.298 |
verting | -0.296 |
Token | God |
Token ID | 1793 |
Feature activation | -6.85e-01 |
Pos logit contributions | |
Honour | +0.850 |
emin | +0.773 |
acceptance | +0.740 |
MENT | +0.721 |
ODY | +0.707 |
Neg logit contributions | |
�� | -1.110 |
ゼ | -1.086 |
dos | -1.074 |
eeper | -1.062 |
verting | -1.043 |
Token | � |
Token ID | 447 |
Feature activation | +8.83e-02 |
Pos logit contributions | |
�� | +4.477 |
ゼ | +4.420 |
dos | +4.365 |
eeper | +4.232 |
verting | +4.229 |
Neg logit contributions | |
Honour | -4.661 |
emin | -4.450 |
ODY | -4.298 |
MENT | -4.255 |
acceptance | -4.241 |
Token | � |
Token ID | 251 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
Honour | +0.814 |
emin | +0.775 |
acceptance | +0.754 |
MENT | +0.754 |
ODY | +0.743 |
Neg logit contributions | |
�� | -0.402 |
ゼ | -0.397 |
dos | -0.393 |
eeper | -0.375 |
verting | -0.370 |
Token | , |
Token ID | 11 |
Feature activation | +5.23e-02 |
Pos logit contributions | |
�� | +1.715 |
ゼ | +1.669 |
dos | +1.660 |
eeper | +1.612 |
verting | +1.612 |
Neg logit contributions | |
Honour | -1.547 |
emin | -1.458 |
MENT | -1.387 |
acceptance | -1.387 |
ODY | -1.382 |
Token | page |
Token ID | 2443 |
Feature activation | -4.07e-01 |
Pos logit contributions | |
Honour | +0.345 |
emin | +0.320 |
acceptance | +0.309 |
MENT | +0.306 |
ODY | +0.302 |
Neg logit contributions | |
�� | -0.388 |
ゼ | -0.378 |
dos | -0.371 |
eeper | -0.364 |
verting | -0.361 |
Token | 127 |
Token ID | 18112 |
Feature activation | +3.46e-01 |
Pos logit contributions | |
�� | +2.910 |
ゼ | +2.863 |
dos | +2.847 |
verting | +2.752 |
eeper | +2.751 |
Neg logit contributions | |
Honour | -2.656 |
emin | -2.519 |
MENT | -2.399 |
acceptance | -2.389 |
ODY | -2.387 |
Token | , |
Token ID | 11 |
Feature activation | +3.09e-01 |
Pos logit contributions | |
Honour | +2.199 |
emin | +2.042 |
acceptance | +1.959 |
MENT | +1.954 |
ODY | +1.922 |
Neg logit contributions | |
�� | -2.631 |
ゼ | -2.560 |
dos | -2.492 |
eeper | -2.459 |
verting | -2.438 |
Token | said |
Token ID | 531 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
Honour | +1.952 |
emin | +1.800 |
acceptance | +1.750 |
MENT | +1.719 |
ODY | +1.694 |
Neg logit contributions | |
�� | -2.357 |
ゼ | -2.310 |
dos | -2.244 |
eeper | -2.208 |
verting | -2.194 |
Token | an |
Token ID | 281 |
Feature activation | +4.17e-02 |
Pos logit contributions | |
�� | +1.928 |
ゼ | +1.884 |
dos | +1.863 |
eeper | +1.827 |
verting | +1.815 |
Neg logit contributions | |
Honour | -1.716 |
emin | -1.610 |
MENT | -1.539 |
acceptance | -1.535 |
ODY | -1.535 |
Token | order |
Token ID | 1502 |
Feature activation | +2.95e-01 |
Pos logit contributions | |
Honour | +0.256 |
emin | +0.240 |
MENT | +0.228 |
acceptance | +0.227 |
ODY | +0.226 |
Neg logit contributions | |
�� | -0.322 |
ゼ | -0.314 |
dos | -0.311 |
eeper | -0.305 |
verting | -0.302 |
Token | of |
Token ID | 286 |
Feature activation | +6.64e-02 |
Pos logit contributions | |
Honour | +1.806 |
emin | +1.688 |
acceptance | +1.608 |
MENT | +1.607 |
ODY | +1.584 |
Neg logit contributions | |
�� | -2.288 |
ゼ | -2.223 |
dos | -2.210 |
verting | -2.148 |
eeper | -2.142 |
Token | magnitude |
Token ID | 14735 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
Honour | +0.350 |
emin | +0.323 |
acceptance | +0.305 |
MENT | +0.304 |
ODY | +0.301 |
Neg logit contributions | |
�� | -0.574 |
ゼ | -0.561 |
dos | -0.555 |
eeper | -0.544 |
verting | -0.542 |
Token | smaller |
Token ID | 4833 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
Honour | +2.302 |
emin | +2.148 |
acceptance | +2.087 |
MENT | +2.046 |
OPS | +2.000 |
Neg logit contributions | |
�� | -2.592 |
ゼ | -2.452 |
dos | -2.428 |
verting | -2.349 |
arthed | -2.311 |
Token | , |
Token ID | 11 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
�� | +0.921 |
ゼ | +0.896 |
dos | +0.886 |
eeper | +0.864 |
verting | +0.861 |
Neg logit contributions | |
Honour | -0.902 |
emin | -0.849 |
MENT | -0.812 |
acceptance | -0.812 |
ODY | -0.805 |
Token | creating |
Token ID | 4441 |
Feature activation | -3.71e-02 |
Pos logit contributions | |
�� | +1.916 |
ゼ | +1.875 |
dos | +1.855 |
eeper | +1.813 |
verting | +1.806 |
Neg logit contributions | |
Honour | -1.658 |
emin | -1.551 |
MENT | -1.486 |
acceptance | -1.477 |
ODY | -1.472 |
Token | a |
Token ID | 257 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
�� | +0.292 |
ゼ | +0.284 |
dos | +0.282 |
eeper | +0.274 |
verting | +0.274 |
Neg logit contributions | |
Honour | -0.224 |
emin | -0.210 |
acceptance | -0.201 |
MENT | -0.199 |
ODY | -0.196 |
Token | greater |
Token ID | 3744 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
�� | +2.251 |
ゼ | +2.195 |
dos | +2.168 |
eeper | +2.125 |
verting | +2.122 |
Neg logit contributions | |
Honour | -2.089 |
emin | -1.967 |
MENT | -1.874 |
ODY | -1.869 |
acceptance | -1.867 |
Token | information |
Token ID | 1321 |
Feature activation | +3.17e-02 |
Pos logit contributions | |
Honour | +1.562 |
emin | +1.437 |
acceptance | +1.435 |
MENT | +1.374 |
ODY | +1.340 |
Neg logit contributions | |
�� | -1.974 |
ゼ | -1.915 |
dos | -1.896 |
eeper | -1.837 |
verting | -1.822 |
Token | processing |
Token ID | 7587 |
Feature activation | -9.04e-02 |
Pos logit contributions | |
Honour | +0.208 |
emin | +0.195 |
acceptance | +0.190 |
MENT | +0.186 |
ODY | +0.183 |
Neg logit contributions | |
�� | -0.235 |
ゼ | -0.226 |
dos | -0.225 |
eeper | -0.219 |
verting | -0.218 |
Token | have |
Token ID | 423 |
Feature activation | -2.70e-03 |
Pos logit contributions | |
Honour | +2.558 |
emin | +2.334 |
acceptance | +2.308 |
MENT | +2.221 |
OPS | +2.169 |
Neg logit contributions | |
�� | -3.291 |
ゼ | -3.195 |
arthed | -2.979 |
verting | -2.971 |
eeper | -2.958 |
Token | got |
Token ID | 1392 |
Feature activation | -2.87e-02 |
Pos logit contributions | |
�� | +0.020 |
ゼ | +0.020 |
dos | +0.019 |
eeper | +0.019 |
verting | +0.019 |
Neg logit contributions | |
Honour | -0.018 |
emin | -0.016 |
acceptance | -0.016 |
MENT | -0.016 |
ODY | -0.016 |
Token | a |
Token ID | 257 |
Feature activation | -2.48e-01 |
Pos logit contributions | |
�� | +0.226 |
ゼ | +0.220 |
dos | +0.217 |
eeper | +0.212 |
verting | +0.212 |
Neg logit contributions | |
Honour | -0.175 |
emin | -0.163 |
acceptance | -0.156 |
MENT | -0.155 |
ODY | -0.154 |
Token | draw |
Token ID | 3197 |
Feature activation | -2.33e-01 |
Pos logit contributions | |
�� | +1.773 |
ゼ | +1.725 |
dos | +1.705 |
eeper | +1.662 |
verting | +1.657 |
Neg logit contributions | |
Honour | -1.674 |
emin | -1.575 |
acceptance | -1.504 |
MENT | -1.504 |
ODY | -1.491 |
Token | or |
Token ID | 393 |
Feature activation | +2.44e-01 |
Pos logit contributions | |
�� | +1.723 |
ゼ | +1.683 |
dos | +1.668 |
eeper | +1.628 |
verting | +1.624 |
Neg logit contributions | |
Honour | -1.503 |
emin | -1.410 |
MENT | -1.342 |
acceptance | -1.340 |
ODY | -1.333 |
Token | even |
Token ID | 772 |
Feature activation | -4.40e-01 |
Pos logit contributions | |
Honour | +1.228 |
emin | +1.115 |
acceptance | +1.087 |
MENT | +1.054 |
ODY | +1.031 |
Neg logit contributions | |
�� | -2.173 |
ゼ | -2.126 |
dos | -2.091 |
verting | -2.054 |
eeper | -2.048 |
Token | won |
Token ID | 1839 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
�� | +3.308 |
dos | +3.252 |
ゼ | +3.252 |
eeper | +3.161 |
verting | +3.133 |
Neg logit contributions | |
Honour | -2.696 |
emin | -2.566 |
MENT | -2.417 |
ODY | -2.410 |
acceptance | -2.365 |
Token | , |
Token ID | 11 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
�� | +0.085 |
ゼ | +0.083 |
dos | +0.082 |
eeper | +0.080 |
verting | +0.080 |
Neg logit contributions | |
Honour | -0.068 |
emin | -0.063 |
acceptance | -0.061 |
MENT | -0.060 |
ODY | -0.059 |
Token | but |
Token ID | 475 |
Feature activation | -5.06e-01 |
Pos logit contributions | |
Honour | +1.295 |
emin | +1.191 |
acceptance | +1.156 |
MENT | +1.130 |
ODY | +1.126 |
Neg logit contributions | |
�� | -1.687 |
ゼ | -1.639 |
dos | -1.611 |
verting | -1.573 |
eeper | -1.570 |
Token | at |
Token ID | 379 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
�� | +3.561 |
dos | +3.510 |
ゼ | +3.470 |
eeper | +3.394 |
verting | +3.361 |
Neg logit contributions | |
Honour | -3.302 |
emin | -3.165 |
MENT | -3.005 |
ODY | -2.976 |
acceptance | -2.943 |
Token | that |
Token ID | 326 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
�� | +2.840 |
dos | +2.776 |
ゼ | +2.775 |
eeper | +2.694 |
verting | +2.678 |
Neg logit contributions | |
Honour | -2.608 |
emin | -2.463 |
MENT | -2.347 |
acceptance | -2.328 |
ODY | -2.327 |
Token | 10 |
Token ID | 838 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
�� | +3.443 |
ゼ | +3.400 |
dos | +3.282 |
verting | +3.249 |
eeper | +3.238 |
Neg logit contributions | |
Honour | -3.954 |
emin | -3.735 |
afety | -3.561 |
acceptance | -3.555 |
MENT | -3.552 |
Token | 11 |
Token ID | 1367 |
Feature activation | -9.79e-01 |
Pos logit contributions | |
�� | +6.865 |
ゼ | +6.739 |
dos | +6.626 |
verting | +6.588 |
................................................................ | +6.524 |
Neg logit contributions | |
Honour | -6.891 |
emin | -6.502 |
afety | -6.263 |
MENT | -6.188 |
acceptance | -6.063 |
Token | 12 |
Token ID | 1105 |
Feature activation | -9.12e-01 |
Pos logit contributions | |
�� | +5.722 |
ゼ | +5.609 |
verting | +5.566 |
dos | +5.546 |
................................................................ | +5.484 |
Neg logit contributions | |
Honour | -6.913 |
emin | -6.548 |
afety | -6.380 |
MENT | -6.204 |
acceptance | -6.191 |
Token | 13 |
Token ID | 1511 |
Feature activation | -8.27e-01 |
Pos logit contributions | |
�� | +5.526 |
ゼ | +5.234 |
................................................................ | +5.158 |
verting | +5.110 |
eeper | +5.105 |
Neg logit contributions | |
Honour | -6.434 |
emin | -6.163 |
afety | -6.084 |
ODY | -5.815 |
MENT | -5.811 |
Token | 14 |
Token ID | 1478 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
�� | +5.214 |
dos | +4.977 |
ゼ | +4.960 |
verting | +4.939 |
eeper | +4.912 |
Neg logit contributions | |
Honour | -5.662 |
emin | -5.429 |
MENT | -5.151 |
afety | -5.134 |
ODY | -5.060 |
Token | 15 |
Token ID | 1315 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
�� | +6.083 |
dos | +5.796 |
verting | +5.716 |
eeper | +5.700 |
ゼ | +5.678 |
Neg logit contributions | |
Honour | -7.823 |
emin | -7.492 |
afety | -7.250 |
acceptance | -7.105 |
MENT | -7.041 |
Token | 16 |
Token ID | 1467 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
�� | +6.899 |
verting | +6.842 |
dos | +6.744 |
................................................................ | +6.530 |
eeper | +6.453 |
Neg logit contributions | |
Honour | -9.385 |
emin | -8.811 |
afety | -8.477 |
MENT | -8.452 |
acceptance | -8.387 |
Token | 17 |
Token ID | 1596 |
Feature activation | -6.69e-01 |
Pos logit contributions | |
�� | +6.389 |
verting | +6.016 |
ゼ | +5.911 |
................................................................ | +5.880 |
eeper | +5.806 |
Neg logit contributions | |
Honour | -6.974 |
emin | -6.671 |
afety | -6.465 |
OPS | -6.388 |
MENT | -6.379 |
Token | 18 |
Token ID | 1248 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
�� | +5.184 |
verting | +5.025 |
ゼ | +5.017 |
eeper | +4.886 |
................................................................ | +4.885 |
Neg logit contributions | |
Honour | -3.719 |
emin | -3.495 |
MENT | -3.290 |
ODY | -3.277 |
acceptance | -3.265 |
Token | 19 |
Token ID | 678 |
Feature activation | -4.40e-01 |
Pos logit contributions | |
�� | +4.040 |
ゼ | +3.935 |
verting | +3.783 |
eeper | +3.760 |
dos | +3.751 |
Neg logit contributions | |
Honour | -3.565 |
emin | -3.377 |
afety | -3.140 |
ODY | -3.139 |
MENT | -3.135 |
Token | 20 |
Token ID | 1160 |
Feature activation | -7.90e-01 |
Pos logit contributions | |
�� | +3.001 |
ゼ | +2.953 |
dos | +2.863 |
verting | +2.860 |
eeper | +2.814 |
Neg logit contributions | |
Honour | -2.996 |
emin | -2.829 |
acceptance | -2.666 |
MENT | -2.660 |
afety | -2.645 |
Token | " |
Token ID | 1 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
�� | +1.641 |
ゼ | +1.608 |
dos | +1.583 |
verting | +1.537 |
eeper | +1.536 |
Neg logit contributions | |
Honour | -1.753 |
emin | -1.655 |
acceptance | -1.591 |
MENT | -1.578 |
ODY | -1.570 |
Token | O |
Token ID | 46 |
Feature activation | +2.12e-01 |
Pos logit contributions | |
Honour | +0.628 |
emin | +0.584 |
MENT | +0.554 |
acceptance | +0.552 |
ODY | +0.547 |
Neg logit contributions | |
�� | -0.836 |
ゼ | -0.811 |
dos | -0.801 |
eeper | -0.789 |
verting | -0.784 |
Token | God |
Token ID | 1793 |
Feature activation | -2.18e-01 |
Pos logit contributions | |
Honour | +1.443 |
emin | +1.341 |
acceptance | +1.291 |
MENT | +1.279 |
OPS | +1.272 |
Neg logit contributions | |
�� | -1.502 |
ゼ | -1.480 |
dos | -1.452 |
eeper | -1.416 |
verting | -1.399 |
Token | ! |
Token ID | 0 |
Feature activation | +3.87e-01 |
Pos logit contributions | |
�� | +1.580 |
ゼ | +1.539 |
dos | +1.529 |
eeper | +1.485 |
verting | +1.480 |
Neg logit contributions | |
Honour | -1.437 |
emin | -1.355 |
MENT | -1.293 |
acceptance | -1.290 |
ODY | -1.280 |
Token | O |
Token ID | 440 |
Feature activation | +2.44e-01 |
Pos logit contributions | |
Honour | +2.445 |
emin | +2.217 |
acceptance | +2.149 |
ODY | +2.098 |
MENT | +2.089 |
Neg logit contributions | |
�� | -2.968 |
ゼ | -2.918 |
dos | -2.835 |
eeper | -2.799 |
verting | -2.790 |
Token | God |
Token ID | 1793 |
Feature activation | -9.25e-01 |
Pos logit contributions | |
Honour | +1.661 |
emin | +1.549 |
acceptance | +1.484 |
MENT | +1.459 |
ODY | +1.456 |
Neg logit contributions | |
�� | -1.732 |
ゼ | -1.703 |
dos | -1.684 |
eeper | -1.630 |
verting | -1.626 |
Token | ! |
Token ID | 0 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
dos | +5.150 |
�� | +5.148 |
ゼ | +5.016 |
eeper | +4.819 |
verting | +4.767 |
Neg logit contributions | |
Honour | -7.015 |
emin | -6.686 |
acceptance | -6.395 |
MENT | -6.391 |
afety | -6.382 |
Token |
|
Token ID | 198 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
Honour | +2.326 |
emin | +2.087 |
acceptance | +2.004 |
ODY | +1.982 |
MENT | +1.979 |
Neg logit contributions | |
�� | -3.129 |
ゼ | -3.047 |
dos | -2.997 |
eeper | -2.954 |
verting | -2.943 |
Token |
|
Token ID | 198 |
Feature activation | -2.87e-01 |
Pos logit contributions | |
�� | +1.015 |
ゼ | +0.986 |
dos | +0.974 |
eeper | +0.955 |
verting | +0.951 |
Neg logit contributions | |
Honour | -0.750 |
emin | -0.698 |
MENT | -0.662 |
acceptance | -0.662 |
ODY | -0.654 |
Token | How |
Token ID | 2437 |
Feature activation | +3.95e-02 |
Pos logit contributions | |
�� | +2.275 |
ゼ | +2.236 |
dos | +2.224 |
verting | +2.154 |
eeper | +2.152 |
Neg logit contributions | |
Honour | -1.683 |
emin | -1.564 |
acceptance | -1.501 |
MENT | -1.480 |
ODY | -1.470 |
Token | weary |
Token ID | 34730 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
Honour | +0.252 |
emin | +0.235 |
acceptance | +0.226 |
MENT | +0.223 |
ODY | +0.221 |
Neg logit contributions | |
�� | -0.299 |
ゼ | -0.291 |
dos | -0.286 |
eeper | -0.281 |
verting | -0.278 |
Token | ' |
Token ID | 705 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
Honour | +1.841 |
emin | +1.687 |
MENT | +1.581 |
acceptance | +1.558 |
ODY | +1.548 |
Neg logit contributions | |
�� | -3.700 |
ゼ | -3.578 |
dos | -3.529 |
eeper | -3.469 |
verting | -3.459 |
Token | \ |
Token ID | 59 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
�� | +1.395 |
ゼ | +1.350 |
dos | +1.332 |
eeper | +1.289 |
verting | +1.285 |
Neg logit contributions | |
Honour | -1.894 |
emin | -1.799 |
acceptance | -1.732 |
MENT | -1.731 |
ODY | -1.718 |
Token | [ |
Token ID | 58 |
Feature activation | -6.15e-01 |
Pos logit contributions | |
Honour | +1.407 |
emin | +1.359 |
MENT | +1.320 |
acceptance | +1.310 |
ODY | +1.306 |
Neg logit contributions | |
�� | -0.727 |
ゼ | -0.682 |
dos | -0.664 |
eeper | -0.648 |
verting | -0.635 |
Token | + |
Token ID | 10 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
�� | +3.558 |
ゼ | +3.512 |
dos | +3.501 |
verting | +3.371 |
eeper | +3.347 |
Neg logit contributions | |
Honour | -4.832 |
emin | -4.531 |
acceptance | -4.371 |
MENT | -4.355 |
ODY | -4.313 |
Token | \ |
Token ID | 59 |
Feature activation | +2.17e-01 |
Pos logit contributions | |
�� | +1.664 |
ゼ | +1.615 |
dos | +1.595 |
eeper | +1.543 |
verting | +1.540 |
Neg logit contributions | |
Honour | -2.227 |
emin | -2.111 |
acceptance | -2.034 |
MENT | -2.030 |
ODY | -2.017 |
Token | S |
Token ID | 50 |
Feature activation | -9.78e-01 |
Pos logit contributions | |
Honour | +1.258 |
emin | +1.194 |
MENT | +1.141 |
ODY | +1.111 |
OPS | +1.111 |
Neg logit contributions | |
�� | -1.762 |
ゼ | -1.692 |
dos | -1.656 |
eeper | -1.652 |
verting | -1.623 |
Token | + |
Token ID | 10 |
Feature activation | +2.43e-02 |
Pos logit contributions | |
dos | +3.234 |
ゼ | +3.196 |
�� | +3.166 |
verting | +3.015 |
eeper | +2.867 |
Neg logit contributions | |
Honour | -9.595 |
emin | -9.099 |
acceptance | -8.928 |
MENT | -8.884 |
afety | -8.758 |
Token | \ |
Token ID | 59 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
Honour | +0.192 |
emin | +0.183 |
MENT | +0.176 |
acceptance | +0.176 |
ODY | +0.175 |
Neg logit contributions | |
�� | -0.148 |
ゼ | -0.142 |
dos | -0.139 |
eeper | -0.136 |
verting | -0.134 |
Token | s |
Token ID | 82 |
Feature activation | -8.02e-01 |
Pos logit contributions | |
Honour | +1.918 |
emin | +1.831 |
MENT | +1.754 |
OPS | +1.712 |
ODY | +1.700 |
Neg logit contributions | |
�� | -2.933 |
ゼ | -2.803 |
eeper | -2.746 |
dos | -2.738 |
verting | -2.693 |
Token | + |
Token ID | 10 |
Feature activation | -4.34e-02 |
Pos logit contributions | |
ゼ | +2.337 |
�� | +2.297 |
dos | +2.265 |
verting | +2.110 |
eeper | +1.999 |
Neg logit contributions | |
Honour | -8.377 |
emin | -7.980 |
acceptance | -7.819 |
MENT | -7.761 |
ODY | -7.695 |
Token | "( |
Token ID | 18109 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
�� | +0.274 |
ゼ | +0.264 |
dos | +0.260 |
eeper | +0.253 |
verting | +0.252 |
Neg logit contributions | |
Honour | -0.331 |
emin | -0.315 |
MENT | -0.303 |
acceptance | -0.302 |
ODY | -0.301 |
Token | lled |
Token ID | 3353 |
Feature activation | -7.77e-01 |
Pos logit contributions | |
�� | +1.246 |
ゼ | +1.190 |
dos | +1.178 |
verting | +1.105 |
eeper | +1.098 |
Neg logit contributions | |
Honour | -4.482 |
emin | -4.289 |
acceptance | -4.202 |
ODY | -4.191 |
MENT | -4.191 |
Token | by |
Token ID | 416 |
Feature activation | -5.03e-01 |
Pos logit contributions | |
�� | +4.631 |
ゼ | +4.606 |
dos | +4.526 |
eeper | +4.434 |
verting | +4.406 |
Neg logit contributions | |
Honour | -5.696 |
emin | -5.407 |
MENT | -5.213 |
ODY | -5.169 |
OPS | -5.156 |
Token | its |
Token ID | 663 |
Feature activation | +5.78e-02 |
Pos logit contributions | |
�� | +3.759 |
ゼ | +3.690 |
dos | +3.689 |
eeper | +3.577 |
verting | +3.560 |
Neg logit contributions | |
Honour | -3.050 |
emin | -2.925 |
MENT | -2.790 |
ODY | -2.742 |
acceptance | -2.723 |
Token | rulers |
Token ID | 24925 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
Honour | +0.420 |
emin | +0.390 |
acceptance | +0.381 |
MENT | +0.373 |
ODY | +0.370 |
Neg logit contributions | |
�� | -0.390 |
ゼ | -0.381 |
dos | -0.373 |
verting | -0.362 |
eeper | -0.360 |
Token | , |
Token ID | 11 |
Feature activation | -1.63e-01 |
Pos logit contributions | |
Honour | +0.838 |
emin | +0.782 |
acceptance | +0.749 |
MENT | +0.742 |
ODY | +0.734 |
Neg logit contributions | |
�� | -1.101 |
ゼ | -1.065 |
dos | -1.050 |
eeper | -1.029 |
verting | -1.029 |
Token | Gal |
Token ID | 5027 |
Feature activation | -9.31e-01 |
Pos logit contributions | |
�� | +1.251 |
ゼ | +1.220 |
dos | +1.207 |
eeper | +1.179 |
verting | +1.175 |
Neg logit contributions | |
Honour | -1.016 |
emin | -0.952 |
MENT | -0.905 |
acceptance | -0.905 |
ODY | -0.896 |
Token | ad |
Token ID | 324 |
Feature activation | -5.80e-01 |
Pos logit contributions | |
dos | +4.699 |
�� | +4.649 |
eeper | +4.441 |
verting | +4.361 |
ゼ | +4.341 |
Neg logit contributions | |
Honour | -7.926 |
MENT | -7.442 |
emin | -7.363 |
ODY | -7.352 |
acceptance | -7.321 |
Token | riel |
Token ID | 11719 |
Feature activation | -2.14e-01 |
Pos logit contributions | |
�� | +2.404 |
ゼ | +2.292 |
dos | +2.291 |
verting | +2.171 |
eeper | +2.145 |
Neg logit contributions | |
Honour | -5.555 |
emin | -5.353 |
MENT | -5.197 |
acceptance | -5.184 |
ODY | -5.157 |
Token | and |
Token ID | 290 |
Feature activation | -3.00e-01 |
Pos logit contributions | |
�� | +1.567 |
ゼ | +1.526 |
dos | +1.510 |
eeper | +1.471 |
verting | +1.467 |
Neg logit contributions | |
Honour | -1.408 |
emin | -1.323 |
acceptance | -1.262 |
MENT | -1.261 |
ODY | -1.250 |
Token | Cele |
Token ID | 18909 |
Feature activation | -7.38e-01 |
Pos logit contributions | |
�� | +2.303 |
ゼ | +2.249 |
dos | +2.232 |
eeper | +2.171 |
verting | +2.167 |
Neg logit contributions | |
Honour | -1.841 |
emin | -1.735 |
MENT | -1.650 |
acceptance | -1.638 |
ODY | -1.636 |
Token | born |
Token ID | 6286 |
Feature activation | -2.29e-01 |
Pos logit contributions | |
dos | +4.080 |
�� | +3.979 |
ゼ | +3.924 |
verting | +3.722 |
eeper | +3.675 |
Neg logit contributions | |
Honour | -5.988 |
emin | -5.760 |
MENT | -5.612 |
acceptance | -5.558 |
ODY | -5.522 |
Token | Bad |
Token ID | 7772 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
�� | +0.827 |
ゼ | +0.805 |
dos | +0.795 |
eeper | +0.776 |
verting | +0.773 |
Neg logit contributions | |
Honour | -0.720 |
emin | -0.676 |
acceptance | -0.644 |
MENT | -0.643 |
ODY | -0.638 |
Token | ane |
Token ID | 1531 |
Feature activation | -7.08e-02 |
Pos logit contributions | |
Honour | +0.997 |
emin | +0.950 |
acceptance | +0.891 |
MENT | +0.888 |
ODY | +0.876 |
Neg logit contributions | |
�� | -1.022 |
ゼ | -0.985 |
dos | -0.952 |
verting | -0.935 |
eeper | -0.930 |
Token | but |
Token ID | 475 |
Feature activation | +8.63e-02 |
Pos logit contributions | |
�� | +0.530 |
ゼ | +0.515 |
dos | +0.509 |
eeper | +0.495 |
verting | +0.494 |
Neg logit contributions | |
Honour | -0.458 |
emin | -0.429 |
MENT | -0.409 |
acceptance | -0.409 |
ODY | -0.404 |
Token | no |
Token ID | 645 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
Honour | +0.518 |
emin | +0.479 |
acceptance | +0.462 |
MENT | +0.457 |
ODY | +0.450 |
Neg logit contributions | |
�� | -0.690 |
ゼ | -0.672 |
dos | -0.660 |
eeper | -0.645 |
verting | -0.644 |
Token | action |
Token ID | 2223 |
Feature activation | -3.08e-01 |
Pos logit contributions | |
�� | +0.774 |
ゼ | +0.756 |
dos | +0.749 |
eeper | +0.730 |
verting | +0.728 |
Neg logit contributions | |
Honour | -0.689 |
emin | -0.649 |
MENT | -0.619 |
acceptance | -0.615 |
ODY | -0.613 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
�� | +2.235 |
ゼ | +2.202 |
dos | +2.176 |
verting | +2.129 |
eeper | +2.116 |
Neg logit contributions | |
Honour | -1.978 |
emin | -1.872 |
MENT | -1.780 |
ODY | -1.773 |
acceptance | -1.764 |
Token | taken |
Token ID | 2077 |
Feature activation | -4.87e-01 |
Pos logit contributions | |
�� | +5.752 |
dos | +5.712 |
verting | +5.593 |
ゼ | +5.509 |
eeper | +5.475 |
Neg logit contributions | |
Honour | -7.029 |
emin | -6.748 |
afety | -6.678 |
ODY | -6.606 |
MENT | -6.561 |
Token | against |
Token ID | 1028 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
�� | +3.285 |
ゼ | +3.255 |
dos | +3.212 |
eeper | +3.125 |
verting | +3.121 |
Neg logit contributions | |
Honour | -3.339 |
emin | -3.149 |
MENT | -3.016 |
ODY | -3.006 |
acceptance | -2.998 |
Token | the |
Token ID | 262 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
Honour | +1.207 |
emin | +1.112 |
acceptance | +1.082 |
MENT | +1.071 |
ODY | +1.055 |
Neg logit contributions | |
�� | -1.308 |
ゼ | -1.266 |
dos | -1.236 |
eeper | -1.205 |
verting | -1.195 |
Token | accused |
Token ID | 5371 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
Honour | +0.878 |
emin | +0.809 |
acceptance | +0.785 |
MENT | +0.777 |
ODY | +0.770 |
Neg logit contributions | |
�� | -0.948 |
ゼ | -0.914 |
dos | -0.897 |
eeper | -0.881 |
verting | -0.873 |
Token | for |
Token ID | 329 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
Honour | +1.134 |
emin | +1.049 |
acceptance | +1.010 |
MENT | +1.005 |
ODY | +0.987 |
Neg logit contributions | |
�� | -1.399 |
ゼ | -1.343 |
dos | -1.327 |
eeper | -1.291 |
verting | -1.288 |