Token | scrap |
Token ID | 15881 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
Supplement | +1.068 |
appendix | +1.063 |
defences | +1.001 |
strang | +0.960 |
gard | +0.929 |
Neg logit contributions | |
practiced | -1.360 |
ounge | -1.353 |
thus | -1.287 |
UA | -1.286 |
ildo | -1.264 |
Token | . |
Token ID | 13 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
appendix | +0.895 |
Supplement | +0.894 |
defences | +0.844 |
strang | +0.807 |
gard | +0.783 |
Neg logit contributions | |
ounge | -1.046 |
practiced | -1.042 |
thus | -0.991 |
UA | -0.984 |
ildo | -0.968 |
Token |
|
Token ID | 198 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
Supplement | +0.571 |
appendix | +0.566 |
defences | +0.535 |
strang | +0.516 |
gard | +0.501 |
Neg logit contributions | |
practiced | -0.609 |
ounge | -0.606 |
thus | -0.572 |
UA | -0.571 |
ildo | -0.562 |
Token |
|
Token ID | 198 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
Supplement | +0.525 |
appendix | +0.510 |
defences | +0.463 |
strang | +0.446 |
gard | +0.434 |
Neg logit contributions | |
practiced | -0.753 |
ounge | -0.752 |
UA | -0.703 |
anguage | -0.700 |
ildo | -0.698 |
Token | Article |
Token ID | 14906 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
Supplement | +1.062 |
appendix | +1.048 |
defences | +0.994 |
strang | +0.957 |
gard | +0.933 |
Neg logit contributions | |
practiced | -1.017 |
ounge | -1.010 |
thus | -0.949 |
UA | -0.946 |
ildo | -0.936 |
Token | Continued |
Token ID | 22168 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
appendix | +0.597 |
Supplement | +0.591 |
defences | +0.506 |
strang | +0.451 |
gard | +0.414 |
Neg logit contributions | |
ounge | -2.498 |
practiced | -2.496 |
thus | -2.419 |
UA | -2.410 |
ildo | -2.384 |
Token | Below |
Token ID | 10383 |
Feature activation | +8.30e-01 |
Pos logit contributions | |
Supplement | +5.858 |
appendix | +5.584 |
Moy | +4.513 |
weekend | +4.252 |
tier | +4.224 |
Neg logit contributions | |
anguage | -13.495 |
ounge | -13.474 |
practiced | -13.412 |
�� | -12.847 |
aimon | -12.620 |
Token |
|
Token ID | 198 |
Feature activation | +2.80e-01 |
Pos logit contributions | |
Supplement | +3.086 |
appendix | +2.836 |
defences | +2.418 |
Imm | +2.331 |
strang | +2.276 |
Neg logit contributions | |
practiced | -5.831 |
ounge | -5.744 |
anguage | -5.505 |
�� | -5.454 |
ildo | -5.312 |
Token |
|
Token ID | 198 |
Feature activation | +3.41e-02 |
Pos logit contributions | |
Supplement | +1.196 |
appendix | +1.138 |
defences | +1.021 |
strang | +0.983 |
gard | +0.960 |
Neg logit contributions | |
practiced | -1.839 |
ounge | -1.837 |
anguage | -1.730 |
UA | -1.703 |
ildo | -1.695 |
Token | The |
Token ID | 464 |
Feature activation | -2.88e-02 |
Pos logit contributions | |
Supplement | +0.178 |
appendix | +0.177 |
defences | +0.168 |
strang | +0.162 |
gard | +0.157 |
Neg logit contributions | |
practiced | -0.184 |
ounge | -0.183 |
thus | -0.173 |
UA | -0.173 |
ildo | -0.170 |
Token | T |
Token ID | 309 |
Feature activation | +3.24e-01 |
Pos logit contributions | |
practiced | +0.167 |
ounge | +0.166 |
thus | +0.158 |
UA | +0.158 |
ildo | +0.155 |
Neg logit contributions | |
Supplement | -0.139 |
appendix | -0.138 |
defences | -0.131 |
strang | -0.125 |
gard | -0.122 |
Token | last |
Token ID | 938 |
Feature activation | -4.43e-01 |
Pos logit contributions | |
appendix | +2.931 |
Supplement | +2.805 |
strang | +2.650 |
defences | +2.647 |
gard | +2.517 |
Neg logit contributions | |
ounge | -4.573 |
practiced | -4.454 |
UA | -4.351 |
thus | -4.341 |
ildo | -4.314 |
Token | . |
Token ID | 13 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
practiced | +2.527 |
ounge | +2.482 |
UA | +2.370 |
thus | +2.352 |
ildo | +2.301 |
Neg logit contributions | |
Supplement | -2.193 |
appendix | -2.178 |
defences | -2.065 |
strang | -1.975 |
gard | -1.908 |
Token |
|
Token ID | 198 |
Feature activation | +8.44e-02 |
Pos logit contributions | |
Supplement | +1.458 |
appendix | +1.438 |
defences | +1.344 |
strang | +1.307 |
gard | +1.277 |
Neg logit contributions | |
practiced | -1.595 |
ounge | -1.594 |
thus | -1.489 |
UA | -1.482 |
ildo | -1.463 |
Token |
|
Token ID | 198 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
Supplement | +0.379 |
appendix | +0.368 |
defences | +0.336 |
strang | +0.323 |
gard | +0.315 |
Neg logit contributions | |
practiced | -0.531 |
ounge | -0.530 |
UA | -0.495 |
thus | -0.493 |
ildo | -0.493 |
Token | Article |
Token ID | 14906 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
Supplement | +0.875 |
appendix | +0.873 |
defences | +0.830 |
strang | +0.800 |
gard | +0.778 |
Neg logit contributions | |
practiced | -0.839 |
ounge | -0.836 |
thus | -0.790 |
UA | -0.789 |
ildo | -0.773 |
Token | Continued |
Token ID | 22168 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
practiced | +3.345 |
ounge | +3.303 |
thus | +3.179 |
UA | +3.175 |
ildo | +3.138 |
Neg logit contributions | |
Supplement | -1.309 |
appendix | -1.283 |
defences | -1.210 |
strang | -1.123 |
gard | -1.045 |
Token | Below |
Token ID | 10383 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
Supplement | +5.811 |
appendix | +5.687 |
Moy | +4.434 |
weekend | +4.333 |
tier | +4.227 |
Neg logit contributions | |
practiced | -13.223 |
ounge | -13.207 |
anguage | -13.063 |
�� | -12.610 |
aimon | -12.465 |
Token |
|
Token ID | 198 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
Supplement | +3.565 |
appendix | +3.230 |
defences | +2.675 |
Imm | +2.653 |
Moy | +2.580 |
Neg logit contributions | |
practiced | -7.185 |
ounge | -7.085 |
�� | -6.856 |
anguage | -6.838 |
ildo | -6.543 |
Token |
|
Token ID | 198 |
Feature activation | +5.59e-02 |
Pos logit contributions | |
Supplement | +1.808 |
appendix | +1.704 |
defences | +1.499 |
strang | +1.450 |
gard | +1.420 |
Neg logit contributions | |
ounge | -2.965 |
practiced | -2.961 |
anguage | -2.829 |
�� | -2.763 |
UA | -2.732 |
Token | T |
Token ID | 51 |
Feature activation | +6.75e-01 |
Pos logit contributions | |
Supplement | +0.286 |
appendix | +0.285 |
defences | +0.270 |
strang | +0.260 |
gard | +0.252 |
Neg logit contributions | |
practiced | -0.308 |
ounge | -0.307 |
thus | -0.291 |
UA | -0.290 |
ildo | -0.285 |
Token | od |
Token ID | 375 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
Supplement | +3.868 |
appendix | +3.840 |
defences | +3.646 |
strang | +3.557 |
gard | +3.461 |
Neg logit contributions | |
practiced | -3.270 |
ounge | -3.217 |
thus | -3.037 |
UA | -2.999 |
ildo | -2.941 |
Token | him |
Token ID | 683 |
Feature activation | +7.19e-01 |
Pos logit contributions | |
Supplement | +0.439 |
appendix | +0.435 |
defences | +0.411 |
strang | +0.396 |
gard | +0.384 |
Neg logit contributions | |
practiced | -0.460 |
ounge | -0.454 |
thus | -0.433 |
UA | -0.432 |
ildo | -0.423 |
Token | as |
Token ID | 355 |
Feature activation | +6.45e-01 |
Pos logit contributions | |
appendix | +3.226 |
Supplement | +3.170 |
defences | +3.010 |
strang | +2.920 |
gard | +2.777 |
Neg logit contributions | |
ounge | -4.343 |
practiced | -4.248 |
UA | -4.126 |
thus | -4.066 |
ildo | -4.045 |
Token | one |
Token ID | 530 |
Feature activation | +6.97e-01 |
Pos logit contributions | |
appendix | +2.830 |
Supplement | +2.790 |
defences | +2.617 |
strang | +2.545 |
gard | +2.425 |
Neg logit contributions | |
ounge | -4.005 |
practiced | -3.942 |
UA | -3.809 |
thus | -3.790 |
ildo | -3.743 |
Token | of |
Token ID | 286 |
Feature activation | +6.20e-01 |
Pos logit contributions | |
Supplement | +3.062 |
appendix | +3.031 |
defences | +2.851 |
strang | +2.709 |
gard | +2.621 |
Neg logit contributions | |
practiced | -4.389 |
ounge | -4.357 |
UA | -4.154 |
thus | -4.154 |
ildo | -4.085 |
Token | the |
Token ID | 262 |
Feature activation | +8.15e-01 |
Pos logit contributions | |
appendix | +2.710 |
Supplement | +2.696 |
defences | +2.541 |
strang | +2.446 |
gard | +2.337 |
Neg logit contributions | |
ounge | -3.847 |
practiced | -3.832 |
UA | -3.656 |
thus | -3.646 |
ildo | -3.591 |
Token | NL |
Token ID | 22879 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
appendix | +3.445 |
Supplement | +3.347 |
defences | +3.214 |
strang | +3.162 |
gard | +2.934 |
Neg logit contributions | |
ounge | -5.166 |
practiced | -5.097 |
UA | -4.946 |
thus | -4.931 |
ildo | -4.863 |
Token | � |
Token ID | 447 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
appendix | +6.453 |
defences | +6.416 |
strang | +6.152 |
Supplement | +6.055 |
tier | +5.680 |
Neg logit contributions | |
ounge | -10.734 |
practiced | -10.647 |
thus | -10.546 |
ildo | -10.307 |
UA | -10.179 |
Token | � |
Token ID | 247 |
Feature activation | +3.76e-01 |
Pos logit contributions | |
practiced | +0.683 |
ounge | +0.675 |
thus | +0.638 |
UA | +0.635 |
ildo | +0.611 |
Neg logit contributions | |
Supplement | -0.938 |
appendix | -0.935 |
defences | -0.898 |
strang | -0.869 |
gard | -0.846 |
Token | s |
Token ID | 82 |
Feature activation | +7.34e-01 |
Pos logit contributions | |
Supplement | +1.629 |
appendix | +1.621 |
defences | +1.519 |
strang | +1.453 |
gard | +1.400 |
Neg logit contributions | |
practiced | -2.362 |
ounge | -2.354 |
thus | -2.245 |
UA | -2.244 |
ildo | -2.208 |
Token | very |
Token ID | 845 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
appendix | +3.130 |
Supplement | +3.056 |
defences | +2.943 |
strang | +2.872 |
gard | +2.691 |
Neg logit contributions | |
ounge | -4.624 |
practiced | -4.539 |
thus | -4.384 |
UA | -4.376 |
ildo | -4.320 |
Token | best |
Token ID | 1266 |
Feature activation | +6.73e-01 |
Pos logit contributions | |
Supplement | +0.456 |
appendix | +0.453 |
defences | +0.424 |
strang | +0.403 |
gard | +0.390 |
Neg logit contributions | |
practiced | -0.667 |
ounge | -0.662 |
thus | -0.632 |
UA | -0.631 |
ildo | -0.621 |
Token | mess |
Token ID | 2085 |
Feature activation | -2.73e-03 |
Pos logit contributions | |
practiced | +4.236 |
ounge | +4.176 |
UA | +3.966 |
thus | +3.957 |
ildo | +3.837 |
Neg logit contributions | |
Supplement | -3.557 |
appendix | -3.535 |
defences | -3.308 |
strang | -3.218 |
gard | -3.122 |
Token | seriously |
Token ID | 6411 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
practiced | +0.015 |
ounge | +0.015 |
thus | +0.014 |
UA | +0.014 |
ildo | +0.014 |
Neg logit contributions | |
Supplement | -0.014 |
appendix | -0.014 |
defences | -0.013 |
strang | -0.013 |
gard | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | +2.98e-01 |
Pos logit contributions | |
practiced | +0.909 |
ounge | +0.904 |
UA | +0.862 |
thus | +0.856 |
ildo | +0.840 |
Neg logit contributions | |
Supplement | -0.870 |
appendix | -0.866 |
defences | -0.821 |
strang | -0.795 |
gard | -0.766 |
Token |
|
Token ID | 198 |
Feature activation | +2.73e-01 |
Pos logit contributions | |
Supplement | +1.284 |
appendix | +1.222 |
defences | +1.099 |
strang | +1.054 |
gard | +1.025 |
Neg logit contributions | |
ounge | -1.937 |
practiced | -1.934 |
anguage | -1.827 |
UA | -1.798 |
ildo | -1.798 |
Token | Article |
Token ID | 14906 |
Feature activation | +3.46e-01 |
Pos logit contributions | |
Supplement | +1.771 |
appendix | +1.737 |
defences | +1.660 |
strang | +1.605 |
gard | +1.578 |
Neg logit contributions | |
practiced | -1.158 |
ounge | -1.143 |
thus | -1.055 |
ildo | -1.040 |
UA | -1.037 |
Token | Continued |
Token ID | 22168 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
appendix | +0.602 |
Supplement | +0.570 |
defences | +0.487 |
strang | +0.412 |
gard | +0.361 |
Neg logit contributions | |
ounge | -3.079 |
practiced | -3.078 |
thus | -2.999 |
UA | -2.974 |
ildo | -2.950 |
Token | Below |
Token ID | 10383 |
Feature activation | +7.47e-01 |
Pos logit contributions | |
Supplement | +5.685 |
appendix | +5.387 |
Moy | +4.310 |
Supplement | +4.071 |
tier | +4.007 |
Neg logit contributions | |
practiced | -12.367 |
ounge | -12.317 |
anguage | -12.291 |
�� | -11.852 |
aimon | -11.457 |
Token |
|
Token ID | 198 |
Feature activation | +5.65e-02 |
Pos logit contributions | |
Supplement | +2.830 |
appendix | +2.635 |
defences | +2.280 |
Imm | +2.161 |
gard | +2.149 |
Neg logit contributions | |
practiced | -5.193 |
ounge | -5.110 |
anguage | -4.878 |
�� | -4.805 |
ildo | -4.738 |
Token |
|
Token ID | 198 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
Supplement | +0.252 |
appendix | +0.244 |
defences | +0.223 |
strang | +0.215 |
gard | +0.209 |
Neg logit contributions | |
practiced | -0.357 |
ounge | -0.356 |
UA | -0.332 |
thus | -0.332 |
ildo | -0.330 |
Token | � |
Token ID | 447 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
practiced | +0.787 |
ounge | +0.786 |
UA | +0.750 |
thus | +0.746 |
ildo | +0.726 |
Neg logit contributions | |
appendix | -0.828 |
Supplement | -0.823 |
defences | -0.788 |
strang | -0.761 |
gard | -0.738 |
Token | � |
Token ID | 250 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
Supplement | +1.844 |
appendix | +1.833 |
defences | +1.746 |
strang | +1.688 |
gard | +1.647 |
Neg logit contributions | |
ounge | -1.597 |
practiced | -1.595 |
thus | -1.498 |
UA | -1.490 |
ildo | -1.472 |
Token | , |
Token ID | 11 |
Feature activation | -2.88e-01 |
Pos logit contributions | |
Supplement | +1.328 |
appendix | +1.324 |
defences | +1.253 |
strang | +1.206 |
gard | +1.168 |
Neg logit contributions | |
practiced | -1.483 |
ounge | -1.480 |
UA | -1.403 |
thus | -1.402 |
ildo | -1.377 |
Token | we |
Token ID | 356 |
Feature activation | -4.51e-01 |
Pos logit contributions | |
practiced | +1.720 |
ounge | +1.687 |
thus | +1.616 |
UA | +1.604 |
ildo | +1.574 |
Neg logit contributions | |
Supplement | -1.354 |
appendix | -1.334 |
defences | -1.250 |
strang | -1.198 |
gard | -1.164 |
Token | will |
Token ID | 481 |
Feature activation | -7.44e-02 |
Pos logit contributions | |
practiced | +2.697 |
ounge | +2.607 |
thus | +2.510 |
UA | +2.469 |
ildo | +2.424 |
Neg logit contributions | |
Supplement | -2.117 |
appendix | -2.076 |
defences | -1.969 |
strang | -1.876 |
gard | -1.822 |
Token | not |
Token ID | 407 |
Feature activation | +5.93e-03 |
Pos logit contributions | |
practiced | +0.438 |
ounge | +0.436 |
thus | +0.415 |
UA | +0.414 |
ildo | +0.407 |
Neg logit contributions | |
Supplement | -0.352 |
appendix | -0.350 |
defences | -0.331 |
strang | -0.317 |
gard | -0.307 |
Token | question |
Token ID | 1808 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
Supplement | +0.028 |
appendix | +0.028 |
defences | +0.027 |
strang | +0.026 |
gard | +0.025 |
Neg logit contributions | |
practiced | -0.035 |
ounge | -0.034 |
thus | -0.033 |
UA | -0.032 |
ildo | -0.032 |
Token | its |
Token ID | 663 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
Supplement | +0.758 |
appendix | +0.755 |
defences | +0.713 |
strang | +0.685 |
gard | +0.663 |
Neg logit contributions | |
practiced | -0.900 |
ounge | -0.898 |
thus | -0.853 |
UA | -0.852 |
ildo | -0.837 |
Token | source |
Token ID | 2723 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
appendix | +6.420 |
defences | +6.166 |
strang | +5.911 |
Supplement | +5.767 |
abilities | +5.453 |
Neg logit contributions | |
ounge | -11.200 |
ildo | -10.636 |
thus | -10.630 |
UA | -10.593 |
anguage | -10.536 |
Token | or |
Token ID | 393 |
Feature activation | +9.86e-01 |
Pos logit contributions | |
Supplement | +1.159 |
appendix | +1.154 |
defences | +1.092 |
strang | +1.050 |
gard | +1.018 |
Neg logit contributions | |
practiced | -1.307 |
ounge | -1.303 |
thus | -1.236 |
UA | -1.235 |
ildo | -1.213 |
Token | the |
Token ID | 262 |
Feature activation | +6.43e-01 |
Pos logit contributions | |
appendix | +4.375 |
Supplement | +4.231 |
defences | +4.196 |
strang | +3.984 |
gard | +3.792 |
Neg logit contributions | |
ounge | -5.944 |
practiced | -5.799 |
UA | -5.665 |
thus | -5.604 |
ildo | -5.561 |
Token | means |
Token ID | 1724 |
Feature activation | -1.99e-01 |
Pos logit contributions | |
appendix | +2.785 |
Supplement | +2.686 |
defences | +2.646 |
strang | +2.526 |
gard | +2.425 |
Neg logit contributions | |
ounge | -4.053 |
practiced | -3.944 |
thus | -3.858 |
UA | -3.849 |
ildo | -3.805 |
Token | by |
Token ID | 416 |
Feature activation | -6.79e-01 |
Pos logit contributions | |
practiced | +1.155 |
ounge | +1.134 |
thus | +1.085 |
UA | +1.080 |
ildo | +1.061 |
Neg logit contributions | |
Supplement | -0.971 |
appendix | -0.966 |
defences | -0.906 |
strang | -0.873 |
gard | -0.844 |
Token | us |
Token ID | 385 |
Feature activation | +6.05e-01 |
Pos logit contributions | |
ounge | +2.060 |
practiced | +2.053 |
thus | +1.944 |
UA | +1.889 |
ildo | +1.844 |
Neg logit contributions | |
Supplement | -4.030 |
appendix | -3.982 |
defences | -3.917 |
strang | -3.715 |
gard | -3.642 |
Token | monkeys |
Token ID | 26697 |
Feature activation | +4.20e-01 |
Pos logit contributions | |
appendix | +2.341 |
Supplement | +2.321 |
defences | +2.160 |
strang | +2.087 |
gard | +2.004 |
Neg logit contributions | |
ounge | -4.038 |
practiced | -4.009 |
ildo | -3.840 |
UA | -3.833 |
thus | -3.825 |
Token | ( |
Token ID | 357 |
Feature activation | +4.06e-01 |
Pos logit contributions | |
Supplement | +1.844 |
appendix | +1.838 |
defences | +1.707 |
strang | +1.634 |
gard | +1.595 |
Neg logit contributions | |
ounge | -2.605 |
practiced | -2.522 |
thus | -2.485 |
UA | -2.475 |
ildo | -2.462 |
Token | Mac |
Token ID | 14155 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
Supplement | +2.238 |
appendix | +2.199 |
defences | +2.060 |
strang | +2.001 |
gard | +1.950 |
Neg logit contributions | |
ounge | -2.102 |
practiced | -2.101 |
thus | -1.968 |
ildo | -1.949 |
UA | -1.948 |
Token | aca |
Token ID | 22260 |
Feature activation | +7.04e-01 |
Pos logit contributions | |
appendix | +3.288 |
Supplement | +3.279 |
defences | +3.137 |
strang | +3.076 |
gard | +3.011 |
Neg logit contributions | |
ounge | -1.901 |
practiced | -1.872 |
UA | -1.694 |
thus | -1.693 |
ildo | -1.688 |
Token | mul |
Token ID | 35971 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
appendix | +1.988 |
Supplement | +1.955 |
defences | +1.751 |
strang | +1.674 |
gard | +1.594 |
Neg logit contributions | |
ounge | -5.477 |
practiced | -5.400 |
UA | -5.256 |
thus | -5.180 |
ildo | -5.180 |
Token | atta |
Token ID | 25014 |
Feature activation | +8.26e-01 |
Pos logit contributions | |
appendix | +4.882 |
Supplement | +4.867 |
strang | +3.947 |
tier | +3.840 |
gard | +3.806 |
Neg logit contributions | |
ounge | -11.966 |
practiced | -11.929 |
�� | -11.380 |
soType | -11.284 |
UA | -11.011 |
Token | ) |
Token ID | 8 |
Feature activation | +7.35e-01 |
Pos logit contributions | |
appendix | +3.767 |
Supplement | +3.711 |
defences | +3.484 |
strang | +3.401 |
gard | +3.308 |
Neg logit contributions | |
ounge | -4.913 |
practiced | -4.788 |
ildo | -4.620 |
thus | -4.580 |
UA | -4.571 |
Token | were |
Token ID | 547 |
Feature activation | +7.99e-01 |
Pos logit contributions | |
Supplement | +2.969 |
appendix | +2.943 |
defences | +2.712 |
strang | +2.595 |
gard | +2.522 |
Neg logit contributions | |
ounge | -4.758 |
thus | -4.560 |
ildo | -4.559 |
practiced | -4.544 |
UA | -4.538 |
Token | housed |
Token ID | 23707 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
Supplement | +4.376 |
appendix | +4.359 |
defences | +4.098 |
strang | +4.069 |
gard | +3.951 |
Neg logit contributions | |
ounge | -4.033 |
thus | -3.824 |
UA | -3.779 |
ildo | -3.771 |
practiced | -3.757 |
Token | under |
Token ID | 739 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
appendix | +4.191 |
Supplement | +4.166 |
defences | +3.781 |
strang | +3.680 |
gard | +3.501 |
Neg logit contributions | |
ounge | -7.406 |
practiced | -7.181 |
ildo | -7.138 |
UA | -7.125 |
thus | -7.046 |
Token | Glen |
Token ID | 20716 |
Feature activation | -8.54e-01 |
Pos logit contributions | |
practiced | +3.953 |
ounge | +3.855 |
UA | +3.742 |
thus | +3.730 |
ildo | +3.656 |
Neg logit contributions | |
Supplement | -3.916 |
appendix | -3.835 |
defences | -3.686 |
strang | -3.546 |
gard | -3.352 |
Token | Gab |
Token ID | 12300 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
ounge | +4.275 |
practiced | +4.215 |
thus | +4.082 |
UA | +4.079 |
ildo | +4.046 |
Neg logit contributions | |
Supplement | -4.586 |
appendix | -4.559 |
defences | -4.415 |
strang | -4.114 |
gard | -3.989 |
Token | ert |
Token ID | 861 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
ounge | +2.614 |
practiced | +2.613 |
thus | +2.511 |
ildo | +2.446 |
UA | +2.422 |
Neg logit contributions | |
Supplement | -2.876 |
appendix | -2.854 |
defences | -2.742 |
strang | -2.626 |
gard | -2.540 |
Token | was |
Token ID | 373 |
Feature activation | +8.02e-01 |
Pos logit contributions | |
Supplement | +0.645 |
appendix | +0.643 |
defences | +0.605 |
strang | +0.583 |
gard | +0.566 |
Neg logit contributions | |
practiced | -0.755 |
ounge | -0.753 |
thus | -0.714 |
UA | -0.714 |
ildo | -0.702 |
Token | not |
Token ID | 407 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
appendix | +3.828 |
Supplement | +3.780 |
strang | +3.433 |
defences | +3.417 |
gard | +3.310 |
Neg logit contributions | |
ounge | -4.668 |
ildo | -4.466 |
practiced | -4.463 |
UA | -4.422 |
thus | -4.399 |
Token | returned |
Token ID | 4504 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
appendix | +4.040 |
Supplement | +4.005 |
defences | +3.620 |
strang | +3.533 |
gard | +3.483 |
Neg logit contributions | |
ounge | -8.510 |
UA | -8.215 |
thus | -8.147 |
ildo | -8.068 |
practiced | -8.067 |
Token | . |
Token ID | 13 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
appendix | +6.695 |
Supplement | +6.554 |
gard | +6.145 |
defences | +6.077 |
strang | +5.873 |
Neg logit contributions | |
ounge | -9.570 |
practiced | -9.226 |
ildo | -9.030 |
thus | -8.942 |
UA | -8.856 |
Token | Hudson |
Token ID | 19995 |
Feature activation | +9.28e-02 |
Pos logit contributions | |
Supplement | +1.338 |
appendix | +1.330 |
defences | +1.235 |
strang | +1.193 |
gard | +1.174 |
Neg logit contributions | |
practiced | -1.616 |
ounge | -1.609 |
thus | -1.525 |
UA | -1.515 |
ildo | -1.505 |
Token | County |
Token ID | 3418 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
Supplement | +0.531 |
appendix | +0.529 |
defences | +0.503 |
strang | +0.484 |
gard | +0.467 |
Neg logit contributions | |
practiced | -0.460 |
ounge | -0.453 |
UA | -0.431 |
thus | -0.427 |
ildo | -0.417 |
Token | Executive |
Token ID | 10390 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
practiced | +0.750 |
ounge | +0.747 |
thus | +0.711 |
UA | +0.710 |
ildo | +0.697 |
Neg logit contributions | |
Supplement | -0.587 |
appendix | -0.584 |
defences | -0.550 |
strang | -0.527 |
gard | -0.510 |
Token | Tom |
Token ID | 4186 |
Feature activation | -2.66e-01 |
Pos logit contributions | |
practiced | +1.732 |
ounge | +1.724 |
UA | +1.641 |
thus | +1.635 |
ildo | +1.610 |
Neg logit contributions | |
Supplement | -1.587 |
appendix | -1.577 |
defences | -1.496 |
strang | -1.437 |
gard | -1.384 |
Token | economic |
Token ID | 3034 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
practiced | +4.304 |
ounge | +4.198 |
thus | +4.026 |
UA | +3.967 |
ildo | +3.915 |
Neg logit contributions | |
Supplement | -2.992 |
appendix | -2.886 |
defences | -2.697 |
strang | -2.575 |
erald | -2.488 |
Token | affairs |
Token ID | 9674 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
appendix | +1.085 |
Supplement | +1.085 |
defences | +1.027 |
strang | +0.987 |
gard | +0.953 |
Neg logit contributions | |
practiced | -1.293 |
ounge | -1.292 |
thus | -1.227 |
UA | -1.227 |
ildo | -1.203 |
Token | , |
Token ID | 11 |
Feature activation | -2.52e-01 |
Pos logit contributions | |
Supplement | +0.062 |
appendix | +0.061 |
defences | +0.058 |
strang | +0.056 |
gard | +0.054 |
Neg logit contributions | |
practiced | -0.068 |
ounge | -0.067 |
thus | -0.064 |
UA | -0.064 |
ildo | -0.063 |
Token | Rafael |
Token ID | 31918 |
Feature activation | -2.92e-01 |
Pos logit contributions | |
practiced | +1.405 |
ounge | +1.382 |
thus | +1.329 |
UA | +1.313 |
ildo | +1.291 |
Neg logit contributions | |
Supplement | -1.283 |
appendix | -1.264 |
defences | -1.201 |
strang | -1.146 |
gard | -1.108 |
Token | Ram |
Token ID | 7431 |
Feature activation | +6.49e-02 |
Pos logit contributions | |
practiced | +1.489 |
ounge | +1.476 |
ildo | +1.441 |
thus | +1.419 |
UA | +1.412 |
Neg logit contributions | |
Supplement | -1.591 |
appendix | -1.561 |
defences | -1.488 |
strang | -1.447 |
gard | -1.404 |
Token | í |
Token ID | 8836 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
Supplement | +0.425 |
appendix | +0.424 |
defences | +0.406 |
strang | +0.396 |
gard | +0.384 |
Neg logit contributions | |
practiced | -0.264 |
ounge | -0.263 |
thus | -0.247 |
UA | -0.244 |
ildo | -0.242 |
Token | rez |
Token ID | 21107 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
Supplement | +1.381 |
appendix | +1.230 |
defences | +0.961 |
strang | +0.932 |
Moy | +0.632 |
Neg logit contributions | |
ounge | -14.921 |
practiced | -14.666 |
�� | -14.229 |
aimon | -14.098 |
thus | -13.961 |
Token | , |
Token ID | 11 |
Feature activation | -9.83e-01 |
Pos logit contributions | |
Supplement | +0.907 |
appendix | +0.902 |
defences | +0.855 |
strang | +0.822 |
gard | +0.797 |
Neg logit contributions | |
practiced | -0.959 |
ounge | -0.950 |
thus | -0.904 |
UA | -0.903 |
ildo | -0.889 |
Token | with |
Token ID | 351 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
practiced | +5.106 |
ounge | +4.772 |
thus | +4.678 |
UA | +4.562 |
ildo | +4.450 |
Neg logit contributions | |
Supplement | -5.255 |
appendix | -5.061 |
defences | -4.882 |
strang | -4.677 |
gard | -4.465 |
Token | an |
Token ID | 281 |
Feature activation | -4.33e-02 |
Pos logit contributions | |
practiced | +1.626 |
ounge | +1.596 |
thus | +1.530 |
UA | +1.515 |
ildo | +1.498 |
Neg logit contributions | |
Supplement | -1.396 |
appendix | -1.371 |
defences | -1.292 |
strang | -1.235 |
gard | -1.186 |
Token | army |
Token ID | 5428 |
Feature activation | +1.76e-01 |
Pos logit contributions | |
practiced | +0.272 |
ounge | +0.271 |
thus | +0.258 |
UA | +0.258 |
ildo | +0.254 |
Neg logit contributions | |
Supplement | -0.188 |
appendix | -0.186 |
defences | -0.176 |
strang | -0.167 |
gard | -0.161 |
Token | cus |
Token ID | 9042 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
appendix | +4.133 |
Supplement | +4.106 |
defences | +3.947 |
strang | +3.878 |
gard | +3.806 |
Neg logit contributions | |
ounge | -1.893 |
practiced | -1.854 |
UA | -1.679 |
ildo | -1.658 |
thus | -1.621 |
Token | , |
Token ID | 11 |
Feature activation | +3.14e-01 |
Pos logit contributions | |
appendix | +3.110 |
Supplement | +3.088 |
defences | +2.914 |
strang | +2.795 |
gard | +2.706 |
Neg logit contributions | |
ounge | -3.862 |
practiced | -3.794 |
UA | -3.622 |
thus | -3.597 |
ildo | -3.595 |
Token | Gard |
Token ID | 12790 |
Feature activation | +4.15e-01 |
Pos logit contributions | |
appendix | +1.546 |
Supplement | +1.532 |
defences | +1.447 |
strang | +1.396 |
gard | +1.352 |
Neg logit contributions | |
ounge | -1.799 |
practiced | -1.785 |
UA | -1.691 |
thus | -1.682 |
ildo | -1.666 |
Token | n |
Token ID | 77 |
Feature activation | -4.20e-01 |
Pos logit contributions | |
appendix | +2.228 |
Supplement | +2.203 |
defences | +2.130 |
strang | +2.033 |
gard | +1.967 |
Neg logit contributions | |
practiced | -2.149 |
ounge | -2.124 |
UA | -2.016 |
thus | -1.970 |
ildo | -1.960 |
Token | erella |
Token ID | 36648 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
ounge | +2.300 |
practiced | +2.269 |
thus | +2.185 |
ildo | +2.146 |
UA | +2.134 |
Neg logit contributions | |
Supplement | -2.171 |
appendix | -2.148 |
defences | -2.035 |
strang | -1.939 |
gard | -1.901 |
Token | vaginal |
Token ID | 30131 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
appendix | +2.841 |
Supplement | +2.783 |
defences | +2.644 |
strang | +2.542 |
gard | +2.470 |
Neg logit contributions | |
ounge | -3.583 |
practiced | -3.513 |
UA | -3.364 |
ildo | -3.339 |
thus | -3.312 |
Token | is |
Token ID | 271 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
appendix | +7.474 |
Supplement | +7.329 |
defences | +7.173 |
strang | +7.090 |
gard | +6.579 |
Neg logit contributions | |
ounge | -8.574 |
practiced | -8.265 |
UA | -8.129 |
anguage | -7.832 |
ildo | -7.804 |
Token | , |
Token ID | 11 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
appendix | +1.688 |
Supplement | +1.688 |
defences | +1.591 |
strang | +1.528 |
gard | +1.481 |
Neg logit contributions | |
ounge | -2.003 |
practiced | -1.999 |
UA | -1.896 |
thus | -1.890 |
ildo | -1.865 |
Token | Mobil |
Token ID | 45951 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
appendix | +1.609 |
Supplement | +1.598 |
defences | +1.511 |
strang | +1.457 |
gard | +1.415 |
Neg logit contributions | |
ounge | -1.811 |
practiced | -1.797 |
UA | -1.703 |
thus | -1.696 |
ildo | -1.676 |
Token | un |
Token ID | 403 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
Supplement | +0.908 |
appendix | +0.907 |
defences | +0.864 |
strang | +0.838 |
gard | +0.818 |
Neg logit contributions | |
practiced | -0.665 |
ounge | -0.661 |
UA | -0.616 |
thus | -0.614 |
ildo | -0.601 |
Token | cus |
Token ID | 9042 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
Supplement | +1.011 |
appendix | +1.008 |
defences | +0.964 |
strang | +0.935 |
gard | +0.913 |
Neg logit contributions | |
practiced | -0.701 |
ounge | -0.697 |
UA | -0.650 |
thus | -0.650 |
ildo | -0.634 |
Token | 20 |
Token ID | 1160 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
Supplement | +0.314 |
appendix | +0.313 |
defences | +0.293 |
strang | +0.285 |
gard | +0.276 |
Neg logit contributions | |
ounge | -0.295 |
practiced | -0.295 |
UA | -0.273 |
thus | -0.273 |
ildo | -0.271 |
Token | 2013 |
Token ID | 2211 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
Supplement | +0.811 |
appendix | +0.807 |
defences | +0.751 |
strang | +0.717 |
gard | +0.687 |
Neg logit contributions | |
practiced | -1.397 |
ounge | -1.394 |
UA | -1.333 |
thus | -1.332 |
ildo | -1.313 |
Token | 07 |
Token ID | 8753 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
appendix | +1.278 |
Supplement | +1.277 |
defences | +1.195 |
strang | +1.167 |
gard | +1.140 |
Neg logit contributions | |
ounge | -1.267 |
practiced | -1.257 |
UA | -1.184 |
thus | -1.177 |
ildo | -1.168 |
Token | : |
Token ID | 25 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
Supplement | +0.808 |
appendix | +0.783 |
defences | +0.723 |
strang | +0.697 |
gard | +0.680 |
Neg logit contributions | |
ounge | -1.175 |
practiced | -1.169 |
thus | -1.101 |
UA | -1.097 |
anguage | -1.092 |
Token | 50 |
Token ID | 1120 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
Supplement | +1.588 |
appendix | +1.507 |
defences | +1.364 |
strang | +1.334 |
gard | +1.303 |
Neg logit contributions | |
practiced | -1.914 |
ounge | -1.898 |
anguage | -1.775 |
ildo | -1.753 |
UA | -1.740 |
Token | pur |
Token ID | 1308 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
appendix | +2.973 |
Supplement | +2.969 |
defences | +2.823 |
strang | +2.714 |
gard | +2.643 |
Neg logit contributions | |
ounge | -3.532 |
practiced | -3.527 |
UA | -3.366 |
thus | -3.349 |
ildo | -3.306 |
Token | ak |
Token ID | 461 |
Feature activation | -9.71e-02 |
Pos logit contributions | |
Supplement | +6.132 |
appendix | +5.616 |
defences | +4.761 |
erald | +4.754 |
gard | +4.677 |
Neg logit contributions | |
practiced | -10.218 |
�� | -10.095 |
ounge | -9.703 |
UA | -9.223 |
thus | -9.128 |
Token | ushi |
Token ID | 17731 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
practiced | +0.463 |
ounge | +0.453 |
thus | +0.432 |
UA | +0.431 |
ildo | +0.415 |
Neg logit contributions | |
Supplement | -0.573 |
appendix | -0.561 |
defences | -0.531 |
strang | -0.512 |
gard | -0.500 |
Token | wrote |
Token ID | 2630 |
Feature activation | +3.60e-01 |
Pos logit contributions | |
appendix | +1.481 |
Supplement | +1.473 |
defences | +1.415 |
strang | +1.346 |
gard | +1.312 |
Neg logit contributions | |
practiced | -1.582 |
ounge | -1.565 |
UA | -1.486 |
thus | -1.471 |
ildo | -1.442 |
Token | : |
Token ID | 25 |
Feature activation | +3.05e-01 |
Pos logit contributions | |
Supplement | +1.438 |
appendix | +1.392 |
defences | +1.266 |
strang | +1.215 |
gard | +1.184 |
Neg logit contributions | |
ounge | -2.408 |
practiced | -2.405 |
anguage | -2.292 |
UA | -2.248 |
ildo | -2.246 |
Token |
|
Token ID | 198 |
Feature activation | +5.31e-03 |
Pos logit contributions | |
Supplement | +1.307 |
appendix | +1.241 |
defences | +1.128 |
strang | +1.091 |
gard | +1.060 |
Neg logit contributions | |
ounge | -1.978 |
practiced | -1.970 |
anguage | -1.844 |
ildo | -1.843 |
UA | -1.836 |
Token | 2 |
Token ID | 17 |
Feature activation | -5.11e-01 |
Pos logit contributions | |
Supplement | +3.607 |
appendix | +3.522 |
defences | +3.261 |
strang | +3.129 |
gard | +3.011 |
Neg logit contributions | |
practiced | -5.752 |
ounge | -5.692 |
thus | -5.481 |
UA | -5.415 |
ildo | -5.381 |
Token | [ |
Token ID | 58 |
Feature activation | -8.37e-01 |
Pos logit contributions | |
ounge | +3.400 |
practiced | +3.393 |
thus | +3.272 |
UA | +3.260 |
ildo | +3.200 |
Neg logit contributions | |
appendix | -1.993 |
Supplement | -1.977 |
defences | -1.883 |
strang | -1.785 |
gard | -1.707 |
Token | 0 |
Token ID | 15 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
ounge | +3.673 |
UA | +3.601 |
practiced | +3.495 |
thus | +3.465 |
artist | +3.350 |
Neg logit contributions | |
appendix | -5.002 |
defences | -4.754 |
strang | -4.725 |
Supplement | -4.701 |
gard | -4.540 |
Token | ], |
Token ID | 4357 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
practiced | +0.727 |
ounge | +0.724 |
UA | +0.691 |
thus | +0.691 |
ildo | +0.681 |
Neg logit contributions | |
Supplement | -0.399 |
appendix | -0.395 |
defences | -0.363 |
strang | -0.345 |
gard | -0.329 |
Token | $ |
Token ID | 3 |
Feature activation | +6.05e-01 |
Pos logit contributions | |
Supplement | +2.056 |
appendix | +1.508 |
defences | +1.067 |
Imm | +0.973 |
gard | +0.845 |
Neg logit contributions | |
practiced | -9.229 |
ounge | -9.089 |
�� | -8.880 |
anguage | -8.723 |
ildo | -8.544 |
Token | FC |
Token ID | 4851 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
Supplement | +2.958 |
appendix | +2.787 |
defences | +2.576 |
strang | +2.423 |
gard | +2.412 |
Neg logit contributions | |
practiced | -3.624 |
ounge | -3.559 |
thus | -3.302 |
ildo | -3.296 |
anguage | -3.273 |
Token | 2 |
Token ID | 17 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
Supplement | +4.590 |
appendix | +3.390 |
Imm | +2.820 |
Pac | +2.720 |
gard | +2.504 |
Neg logit contributions | |
practiced | -12.135 |
�� | -12.134 |
anguage | -11.967 |
ounge | -11.700 |
aimon | -11.343 |
Token | [ |
Token ID | 58 |
Feature activation | -5.95e-01 |
Pos logit contributions | |
practiced | +1.433 |
ounge | +1.425 |
thus | +1.358 |
UA | +1.357 |
ildo | +1.344 |
Neg logit contributions | |
Supplement | -0.723 |
appendix | -0.707 |
defences | -0.643 |
strang | -0.606 |
gard | -0.584 |
Token | 1 |
Token ID | 16 |
Feature activation | -8.34e-02 |
Pos logit contributions | |
ounge | +3.203 |
practiced | +3.163 |
thus | +3.094 |
UA | +3.087 |
ildo | +2.964 |
Neg logit contributions | |
appendix | -3.050 |
defences | -2.952 |
Supplement | -2.931 |
strang | -2.842 |
gard | -2.741 |
Token | ], |
Token ID | 4357 |
Feature activation | +7.97e-01 |
Pos logit contributions | |
practiced | +0.579 |
ounge | +0.578 |
UA | +0.551 |
thus | +0.551 |
ildo | +0.544 |
Neg logit contributions | |
Supplement | -0.311 |
appendix | -0.307 |
defences | -0.280 |
strang | -0.267 |
gard | -0.253 |
Token | $ |
Token ID | 3 |
Feature activation | +3.02e-01 |
Pos logit contributions | |
Supplement | +1.619 |
appendix | +1.234 |
defences | +0.899 |
Imm | +0.777 |
strang | +0.728 |
Neg logit contributions | |
practiced | -7.132 |
ounge | -7.033 |
�� | -6.846 |
anguage | -6.756 |
ildo | -6.620 |
Token | statement |
Token ID | 2643 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
practiced | +0.114 |
ounge | +0.113 |
UA | +0.107 |
thus | +0.107 |
ildo | +0.105 |
Neg logit contributions | |
Supplement | -0.107 |
appendix | -0.106 |
defences | -0.100 |
strang | -0.097 |
gard | -0.094 |
Token | . |
Token ID | 13 |
Feature activation | -5.00e-02 |
Pos logit contributions | |
Supplement | +1.624 |
appendix | +1.620 |
defences | +1.532 |
strang | +1.473 |
gard | +1.434 |
Neg logit contributions | |
practiced | -1.723 |
ounge | -1.722 |
UA | -1.629 |
thus | -1.629 |
ildo | -1.601 |
Token |
|
Token ID | 198 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
practiced | +0.265 |
ounge | +0.264 |
thus | +0.249 |
UA | +0.249 |
ildo | +0.244 |
Neg logit contributions | |
Supplement | -0.266 |
appendix | -0.265 |
defences | -0.251 |
strang | -0.242 |
gard | -0.235 |
Token |
|
Token ID | 198 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
Supplement | +0.471 |
appendix | +0.458 |
defences | +0.419 |
strang | +0.402 |
gard | +0.392 |
Neg logit contributions | |
practiced | -0.669 |
ounge | -0.668 |
UA | -0.625 |
thus | -0.621 |
anguage | -0.620 |
Token | Story |
Token ID | 11605 |
Feature activation | +9.91e-01 |
Pos logit contributions | |
Supplement | +1.460 |
appendix | +1.437 |
defences | +1.368 |
strang | +1.320 |
gard | +1.293 |
Neg logit contributions | |
practiced | -1.141 |
ounge | -1.129 |
thus | -1.052 |
UA | -1.044 |
ildo | -1.037 |
Token | continues |
Token ID | 4477 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
appendix | +3.429 |
Supplement | +3.168 |
defences | +2.984 |
gard | +2.744 |
strang | +2.738 |
Neg logit contributions | |
ounge | -6.911 |
practiced | -6.770 |
anguage | -6.686 |
�� | -6.636 |
ildo | -6.614 |
Token | below |
Token ID | 2174 |
Feature activation | +7.72e-01 |
Pos logit contributions | |
appendix | +5.191 |
Supplement | +4.434 |
defences | +4.271 |
tier | +4.228 |
gard | +4.178 |
Neg logit contributions | |
ounge | -11.065 |
�� | -10.804 |
ildo | -10.696 |
anguage | -10.655 |
practiced | -10.494 |
Token | advertisement |
Token ID | 15422 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
appendix | +2.395 |
Supplement | +2.092 |
defences | +2.072 |
strang | +1.957 |
gard | +1.820 |
Neg logit contributions | |
ounge | -5.924 |
practiced | -5.767 |
thus | -5.642 |
UA | -5.575 |
ildo | -5.571 |
Token |
|
Token ID | 198 |
Feature activation | +5.21e-01 |
Pos logit contributions | |
Supplement | +3.968 |
appendix | +3.545 |
defences | +2.786 |
Imm | +2.766 |
gard | +2.761 |
Neg logit contributions | |
practiced | -8.417 |
ounge | -8.397 |
�� | -8.289 |
anguage | -8.244 |
ildo | -7.738 |
Token |
|
Token ID | 198 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
Supplement | +2.107 |
appendix | +1.967 |
defences | +1.723 |
strang | +1.653 |
gard | +1.616 |
Neg logit contributions | |
practiced | -3.546 |
ounge | -3.540 |
anguage | -3.394 |
�� | -3.341 |
ildo | -3.270 |
Token | It |
Token ID | 1026 |
Feature activation | -3.37e-01 |
Pos logit contributions | |
Supplement | +3.184 |
appendix | +3.036 |
defences | +2.849 |
strang | +2.713 |
gard | +2.676 |
Neg logit contributions | |
practiced | -3.083 |
ounge | -3.020 |
ildo | -2.802 |
thus | -2.793 |
UA | -2.737 |
Token | positions |
Token ID | 6116 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
practiced | +1.950 |
ounge | +1.929 |
thus | +1.831 |
UA | +1.821 |
ildo | +1.782 |
Neg logit contributions | |
Supplement | -1.522 |
appendix | -1.494 |
defences | -1.395 |
strang | -1.355 |
gard | -1.275 |
Token | are |
Token ID | 389 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
Supplement | +0.453 |
appendix | +0.451 |
defences | +0.421 |
strang | +0.401 |
gard | +0.387 |
Neg logit contributions | |
practiced | -0.710 |
ounge | -0.709 |
UA | -0.678 |
thus | -0.677 |
ildo | -0.667 |
Token | currently |
Token ID | 3058 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
appendix | +1.466 |
Supplement | +1.464 |
defences | +1.378 |
strang | +1.316 |
gard | +1.289 |
Neg logit contributions | |
ounge | -1.903 |
practiced | -1.892 |
thus | -1.824 |
UA | -1.817 |
ildo | -1.796 |
Token | held |
Token ID | 2714 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
Supplement | +0.838 |
appendix | +0.837 |
defences | +0.788 |
strang | +0.754 |
gard | +0.736 |
Neg logit contributions | |
ounge | -1.051 |
practiced | -1.046 |
thus | -1.002 |
UA | -1.000 |
ildo | -0.986 |
Token | by |
Token ID | 416 |
Feature activation | +4.52e-01 |
Pos logit contributions | |
Supplement | +1.034 |
appendix | +1.027 |
defences | +0.970 |
strang | +0.931 |
gard | +0.896 |
Neg logit contributions | |
practiced | -1.285 |
ounge | -1.280 |
thus | -1.215 |
UA | -1.213 |
ildo | -1.188 |
Token | bilingual |
Token ID | 48116 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
appendix | +2.001 |
Supplement | +1.971 |
defences | +1.870 |
strang | +1.782 |
gard | +1.763 |
Neg logit contributions | |
ounge | -2.786 |
practiced | -2.769 |
thus | -2.670 |
UA | -2.661 |
ildo | -2.630 |
Token | public |
Token ID | 1171 |
Feature activation | +2.44e-01 |
Pos logit contributions | |
appendix | +6.633 |
defences | +6.181 |
Supplement | +6.089 |
gard | +6.024 |
strang | +5.787 |
Neg logit contributions | |
ounge | -9.083 |
practiced | -8.943 |
UA | -8.892 |
thus | -8.752 |
ildo | -8.645 |
Token | servants |
Token ID | 17523 |
Feature activation | +4.55e-01 |
Pos logit contributions | |
Supplement | +1.089 |
appendix | +1.072 |
defences | +0.994 |
strang | +0.954 |
gard | +0.913 |
Neg logit contributions | |
practiced | -1.520 |
ounge | -1.507 |
UA | -1.432 |
thus | -1.431 |
ildo | -1.413 |
Token | . |
Token ID | 13 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
Supplement | +2.221 |
appendix | +2.219 |
defences | +2.089 |
strang | +2.010 |
gard | +1.969 |
Neg logit contributions | |
ounge | -2.572 |
practiced | -2.552 |
UA | -2.446 |
thus | -2.434 |
ildo | -2.411 |
Token |
|
Token ID | 198 |
Feature activation | -3.97e-02 |
Pos logit contributions | |
Supplement | +2.083 |
appendix | +2.073 |
defences | +1.947 |
strang | +1.874 |
gard | +1.832 |
Neg logit contributions | |
practiced | -2.367 |
ounge | -2.357 |
thus | -2.232 |
UA | -2.228 |
ildo | -2.186 |
Token |
|
Token ID | 198 |
Feature activation | +2.59e-01 |
Pos logit contributions | |
practiced | +0.243 |
ounge | +0.243 |
UA | +0.228 |
thus | +0.228 |
ildo | +0.226 |
Neg logit contributions | |
Supplement | -0.183 |
appendix | -0.180 |
defences | -0.166 |
strang | -0.160 |
gard | -0.155 |
Token | , |
Token ID | 11 |
Feature activation | +4.55e-02 |
Pos logit contributions | |
practiced | +3.596 |
ounge | +3.531 |
thus | +3.396 |
UA | +3.385 |
ildo | +3.247 |
Neg logit contributions | |
appendix | -3.246 |
Supplement | -3.242 |
defences | -3.129 |
strang | -2.939 |
gard | -2.842 |
Token | did |
Token ID | 750 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
Supplement | +0.195 |
appendix | +0.194 |
defences | +0.182 |
strang | +0.174 |
gard | +0.168 |
Neg logit contributions | |
practiced | -0.288 |
ounge | -0.287 |
thus | -0.274 |
UA | -0.274 |
ildo | -0.269 |
Token | not |
Token ID | 407 |
Feature activation | +5.90e-01 |
Pos logit contributions | |
Supplement | +1.337 |
appendix | +1.331 |
defences | +1.271 |
strang | +1.222 |
gard | +1.185 |
Neg logit contributions | |
practiced | -1.231 |
ounge | -1.222 |
thus | -1.155 |
UA | -1.153 |
ildo | -1.121 |
Token | respond |
Token ID | 3031 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
appendix | +2.301 |
Supplement | +2.289 |
defences | +2.087 |
strang | +2.024 |
gard | +1.976 |
Neg logit contributions | |
ounge | -3.955 |
practiced | -3.892 |
UA | -3.800 |
thus | -3.769 |
ildo | -3.707 |
Token | when |
Token ID | 618 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
appendix | +5.074 |
Supplement | +5.047 |
defences | +4.764 |
strang | +4.567 |
gard | +4.528 |
Neg logit contributions | |
practiced | -6.365 |
ounge | -6.342 |
thus | -6.094 |
UA | -6.051 |
ildo | -5.966 |
Token | contacted |
Token ID | 11237 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
appendix | +4.572 |
Supplement | +4.362 |
defences | +4.197 |
gard | +4.151 |
strang | +4.126 |
Neg logit contributions | |
ounge | -7.434 |
practiced | -7.200 |
thus | -7.195 |
ildo | -7.016 |
UA | -6.919 |
Token | via |
Token ID | 2884 |
Feature activation | +9.10e-01 |
Pos logit contributions | |
appendix | +6.241 |
Supplement | +6.151 |
gard | +5.657 |
defences | +5.592 |
strang | +5.361 |
Neg logit contributions | |
ounge | -9.671 |
practiced | -9.532 |
thus | -9.207 |
UA | -9.188 |
ildo | -9.057 |
Token | the |
Token ID | 262 |
Feature activation | +7.98e-01 |
Pos logit contributions | |
appendix | +4.353 |
Supplement | +4.276 |
defences | +4.122 |
strang | +4.024 |
gard | +3.948 |
Neg logit contributions | |
ounge | -5.141 |
practiced | -5.053 |
thus | -4.897 |
ildo | -4.827 |
UA | -4.807 |
Token | social |
Token ID | 1919 |
Feature activation | -6.25e-01 |
Pos logit contributions | |
appendix | +3.885 |
Supplement | +3.850 |
defences | +3.651 |
strang | +3.602 |
gard | +3.493 |
Neg logit contributions | |
ounge | -4.428 |
practiced | -4.393 |
thus | -4.194 |
ildo | -4.162 |
UA | -4.151 |
Token | networking |
Token ID | 19140 |
Feature activation | -6.80e-01 |
Pos logit contributions | |
practiced | +3.163 |
ounge | +3.117 |
UA | +2.974 |
thus | +2.870 |
ildo | +2.824 |
Neg logit contributions | |
Supplement | -3.432 |
appendix | -3.348 |
defences | -3.178 |
strang | -3.038 |
erald | -2.956 |
Token | website |
Token ID | 3052 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
practiced | +3.148 |
ounge | +3.063 |
UA | +2.892 |
thus | +2.845 |
ildo | +2.756 |
Neg logit contributions | |
Supplement | -4.069 |
appendix | -3.935 |
defences | -3.771 |
strang | -3.663 |
erald | -3.559 |
Token |
|
Token ID | 198 |
Feature activation | -1.76e-01 |
Pos logit contributions | |
practiced | +1.024 |
ounge | +1.022 |
UA | +0.977 |
thus | +0.975 |
ildo | +0.951 |
Neg logit contributions | |
appendix | -0.997 |
Supplement | -0.992 |
defences | -0.954 |
strang | -0.915 |
gard | -0.885 |
Token |
|
Token ID | 198 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
practiced | +1.055 |
ounge | +1.050 |
thus | +0.991 |
UA | +0.987 |
ildo | +0.978 |
Neg logit contributions | |
Supplement | -0.834 |
appendix | -0.820 |
defences | -0.765 |
strang | -0.734 |
gard | -0.712 |
Token | But |
Token ID | 1537 |
Feature activation | +2.69e-01 |
Pos logit contributions | |
practiced | +0.541 |
ounge | +0.541 |
UA | +0.517 |
thus | +0.515 |
ildo | +0.500 |
Neg logit contributions | |
appendix | -0.559 |
Supplement | -0.553 |
defences | -0.534 |
strang | -0.515 |
gard | -0.499 |
Token | as |
Token ID | 355 |
Feature activation | +9.76e-02 |
Pos logit contributions | |
appendix | +1.230 |
Supplement | +1.227 |
defences | +1.157 |
strang | +1.115 |
gard | +1.077 |
Neg logit contributions | |
ounge | -1.615 |
practiced | -1.615 |
UA | -1.535 |
thus | -1.535 |
ildo | -1.514 |
Token | The |
Token ID | 383 |
Feature activation | +9.34e-02 |
Pos logit contributions | |
Supplement | +0.457 |
appendix | +0.454 |
defences | +0.427 |
strang | +0.410 |
gard | +0.396 |
Neg logit contributions | |
practiced | -0.582 |
ounge | -0.578 |
thus | -0.550 |
UA | -0.550 |
ildo | -0.540 |
Token | Guardian |
Token ID | 8283 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
Supplement | +0.471 |
appendix | +0.468 |
defences | +0.442 |
strang | +0.426 |
gard | +0.414 |
Neg logit contributions | |
practiced | -0.521 |
ounge | -0.519 |
thus | -0.491 |
UA | -0.490 |
ildo | -0.484 |
Token | reported |
Token ID | 2098 |
Feature activation | +7.40e-02 |
Pos logit contributions | |
appendix | +6.525 |
Supplement | +6.170 |
defences | +6.001 |
gard | +5.894 |
strang | +5.618 |
Neg logit contributions | |
ounge | -9.279 |
practiced | -8.953 |
UA | -8.896 |
thus | -8.747 |
ildo | -8.714 |
Token | Sunday |
Token ID | 3502 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
Supplement | +0.338 |
appendix | +0.336 |
defences | +0.316 |
strang | +0.303 |
gard | +0.292 |
Neg logit contributions | |
practiced | -0.450 |
ounge | -0.446 |
thus | -0.427 |
UA | -0.425 |
ildo | -0.417 |
Token | , |
Token ID | 11 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
Supplement | +1.392 |
appendix | +1.386 |
defences | +1.309 |
strang | +1.258 |
gard | +1.219 |
Neg logit contributions | |
practiced | -1.634 |
ounge | -1.628 |
thus | -1.546 |
UA | -1.545 |
ildo | -1.517 |
Token | other |
Token ID | 584 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
Supplement | +0.837 |
appendix | +0.833 |
defences | +0.784 |
strang | +0.751 |
gard | +0.727 |
Neg logit contributions | |
practiced | -1.105 |
ounge | -1.102 |
thus | -1.049 |
UA | -1.048 |
ildo | -1.031 |
Token | public |
Token ID | 1171 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
practiced | +0.791 |
ounge | +0.786 |
thus | +0.748 |
UA | +0.747 |
ildo | +0.735 |
Neg logit contributions | |
Supplement | -0.599 |
appendix | -0.593 |
defences | -0.557 |
strang | -0.533 |
gard | -0.514 |
Token | " |
Token ID | 366 |
Feature activation | +9.81e-02 |
Pos logit contributions | |
appendix | +0.779 |
Supplement | +0.778 |
defences | +0.735 |
strang | +0.706 |
gard | +0.682 |
Neg logit contributions | |
ounge | -0.957 |
practiced | -0.956 |
UA | -0.910 |
thus | -0.908 |
ildo | -0.895 |
Token | people |
Token ID | 15332 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
Supplement | +0.563 |
appendix | +0.559 |
defences | +0.533 |
strang | +0.515 |
gard | +0.502 |
Neg logit contributions | |
practiced | -0.480 |
ounge | -0.478 |
UA | -0.448 |
thus | -0.447 |
ildo | -0.440 |
Token | don |
Token ID | 836 |
Feature activation | +3.55e-01 |
Pos logit contributions | |
Supplement | +0.774 |
appendix | +0.771 |
defences | +0.721 |
strang | +0.688 |
gard | +0.663 |
Neg logit contributions | |
practiced | -1.184 |
ounge | -1.181 |
thus | -1.128 |
UA | -1.127 |
ildo | -1.109 |
Token | 't |
Token ID | 470 |
Feature activation | +4.94e-01 |
Pos logit contributions | |
Supplement | +1.775 |
appendix | +1.700 |
defences | +1.553 |
strang | +1.503 |
gard | +1.487 |
Neg logit contributions | |
practiced | -2.053 |
ounge | -2.035 |
anguage | -1.898 |
UA | -1.888 |
ildo | -1.864 |
Token | know |
Token ID | 760 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
appendix | +1.574 |
Supplement | +1.556 |
defences | +1.432 |
strang | +1.347 |
gard | +1.296 |
Neg logit contributions | |
ounge | -3.655 |
practiced | -3.620 |
UA | -3.533 |
thus | -3.507 |
ildo | -3.476 |
Token | who |
Token ID | 508 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
appendix | +4.217 |
Supplement | +4.155 |
defences | +3.905 |
strang | +3.822 |
gard | +3.646 |
Neg logit contributions | |
ounge | -6.898 |
practiced | -6.828 |
thus | -6.529 |
UA | -6.524 |
ildo | -6.460 |
Token | the |
Token ID | 262 |
Feature activation | +7.68e-01 |
Pos logit contributions | |
appendix | +6.079 |
Supplement | +5.980 |
defences | +5.669 |
strang | +5.576 |
gard | +5.259 |
Neg logit contributions | |
ounge | -9.581 |
practiced | -9.382 |
UA | -9.038 |
thus | -8.998 |
ildo | -8.850 |
Token | Koch |
Token ID | 17009 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
appendix | +3.524 |
Supplement | +3.503 |
defences | +3.311 |
strang | +3.220 |
gard | +3.075 |
Neg logit contributions | |
ounge | -4.534 |
practiced | -4.531 |
UA | -4.312 |
thus | -4.308 |
ildo | -4.235 |
Token | brothers |
Token ID | 9397 |
Feature activation | -3.17e-02 |
Pos logit contributions | |
Supplement | +0.882 |
appendix | +0.866 |
defences | +0.829 |
strang | +0.790 |
gard | +0.776 |
Neg logit contributions | |
practiced | -0.877 |
ounge | -0.863 |
UA | -0.820 |
thus | -0.812 |
ildo | -0.799 |
Token | are |
Token ID | 389 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
practiced | +0.209 |
ounge | +0.202 |
UA | +0.192 |
thus | +0.191 |
ildo | +0.190 |
Neg logit contributions | |
Supplement | -0.137 |
appendix | -0.133 |
defences | -0.125 |
strang | -0.117 |
gard | -0.116 |
Token | ." |
Token ID | 526 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
practiced | +0.630 |
ounge | +0.620 |
thus | +0.593 |
UA | +0.586 |
ildo | +0.575 |
Neg logit contributions | |
Supplement | -0.569 |
appendix | -0.564 |
defences | -0.534 |
strang | -0.513 |
gard | -0.497 |
Token | primary |
Token ID | 4165 |
Feature activation | +5.81e-02 |
Pos logit contributions | |
practiced | +0.274 |
ounge | +0.273 |
thus | +0.259 |
UA | +0.258 |
ildo | +0.254 |
Neg logit contributions | |
Supplement | -0.252 |
appendix | -0.249 |
defences | -0.237 |
strang | -0.228 |
gard | -0.221 |
Token | . |
Token ID | 13 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
Supplement | +0.301 |
appendix | +0.299 |
defences | +0.284 |
strang | +0.273 |
gard | +0.265 |
Neg logit contributions | |
practiced | -0.317 |
ounge | -0.314 |
thus | -0.298 |
UA | -0.298 |
ildo | -0.292 |
Token | And |
Token ID | 843 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
Supplement | +0.062 |
appendix | +0.061 |
defences | +0.058 |
strang | +0.056 |
gard | +0.054 |
Neg logit contributions | |
practiced | -0.063 |
ounge | -0.063 |
thus | -0.059 |
UA | -0.059 |
ildo | -0.058 |
Token | as |
Token ID | 355 |
Feature activation | +1.32e-02 |
Pos logit contributions | |
Supplement | +0.925 |
appendix | +0.920 |
defences | +0.869 |
strang | +0.839 |
gard | +0.809 |
Neg logit contributions | |
ounge | -1.159 |
practiced | -1.156 |
UA | -1.101 |
thus | -1.092 |
ildo | -1.087 |
Token | The |
Token ID | 383 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
Supplement | +0.064 |
appendix | +0.064 |
defences | +0.060 |
strang | +0.058 |
gard | +0.056 |
Neg logit contributions | |
practiced | -0.076 |
ounge | -0.076 |
thus | -0.072 |
UA | -0.072 |
ildo | -0.071 |
Token | Intercept |
Token ID | 37127 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
Supplement | +0.798 |
appendix | +0.794 |
defences | +0.752 |
strang | +0.728 |
gard | +0.707 |
Neg logit contributions | |
practiced | -0.765 |
ounge | -0.763 |
thus | -0.719 |
UA | -0.717 |
ildo | -0.708 |
Token | � |
Token ID | 447 |
Feature activation | +5.39e-01 |
Pos logit contributions | |
appendix | +6.480 |
Supplement | +6.227 |
defences | +5.686 |
gard | +5.640 |
strang | +5.403 |
Neg logit contributions | |
ounge | -9.210 |
thus | -8.785 |
UA | -8.743 |
practiced | -8.735 |
ildo | -8.579 |
Token | � |
Token ID | 247 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
Supplement | +2.806 |
appendix | +2.794 |
defences | +2.553 |
gard | +2.493 |
strang | +2.491 |
Neg logit contributions | |
ounge | -2.889 |
practiced | -2.782 |
UA | -2.648 |
ildo | -2.640 |
thus | -2.582 |
Token | s |
Token ID | 82 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
Supplement | +1.326 |
appendix | +1.321 |
defences | +1.205 |
strang | +1.144 |
gard | +1.099 |
Neg logit contributions | |
practiced | -2.633 |
ounge | -2.628 |
UA | -2.526 |
thus | -2.520 |
ildo | -2.492 |
Token | Z |
Token ID | 1168 |
Feature activation | -2.41e-02 |
Pos logit contributions | |
appendix | +3.150 |
Supplement | +3.117 |
defences | +2.958 |
strang | +2.839 |
gard | +2.786 |
Neg logit contributions | |
ounge | -3.390 |
practiced | -3.344 |
thus | -3.198 |
UA | -3.188 |
ildo | -3.142 |
Token | aid |
Token ID | 1698 |
Feature activation | +4.47e-01 |
Pos logit contributions | |
practiced | +0.107 |
ounge | +0.106 |
thus | +0.099 |
UA | +0.099 |
ildo | +0.097 |
Neg logit contributions | |
Supplement | -0.149 |
appendix | -0.149 |
defences | -0.142 |
strang | -0.138 |
gard | -0.135 |
Token | financial |
Token ID | 3176 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
Supplement | +0.709 |
appendix | +0.708 |
defences | +0.664 |
strang | +0.636 |
gard | +0.615 |
Neg logit contributions | |
practiced | -0.987 |
ounge | -0.985 |
thus | -0.939 |
UA | -0.937 |
ildo | -0.922 |
Token | crisis |
Token ID | 4902 |
Feature activation | +4.61e-01 |
Pos logit contributions | |
appendix | +2.227 |
Supplement | +2.195 |
defences | +2.085 |
strang | +2.004 |
gard | +1.912 |
Neg logit contributions | |
ounge | -3.841 |
practiced | -3.836 |
thus | -3.651 |
UA | -3.645 |
ildo | -3.621 |
Token | . |
Token ID | 13 |
Feature activation | -1.56e-01 |
Pos logit contributions | |
appendix | +2.234 |
Supplement | +2.230 |
defences | +2.119 |
strang | +2.030 |
gard | +1.966 |
Neg logit contributions | |
ounge | -2.649 |
practiced | -2.633 |
UA | -2.510 |
thus | -2.498 |
ildo | -2.461 |
Token |
|
Token ID | 198 |
Feature activation | -2.12e-01 |
Pos logit contributions | |
practiced | +0.816 |
ounge | +0.816 |
UA | +0.784 |
thus | +0.780 |
ildo | +0.754 |
Neg logit contributions | |
appendix | -0.830 |
Supplement | -0.819 |
defences | -0.798 |
strang | -0.763 |
gard | -0.730 |
Token |
|
Token ID | 198 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
practiced | +1.259 |
ounge | +1.255 |
thus | +1.185 |
UA | +1.185 |
ildo | +1.169 |
Neg logit contributions | |
Supplement | -1.000 |
appendix | -0.988 |
defences | -0.926 |
strang | -0.889 |
gard | -0.862 |
Token | Hug |
Token ID | 48098 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
ounge | +0.700 |
practiced | +0.699 |
UA | +0.670 |
thus | +0.667 |
ildo | +0.645 |
Neg logit contributions | |
appendix | -0.738 |
Supplement | -0.729 |
defences | -0.704 |
strang | -0.679 |
gard | -0.657 |
Token | hes |
Token ID | 956 |
Feature activation | +4.85e-02 |
Pos logit contributions | |
appendix | +3.276 |
Supplement | +3.118 |
defences | +2.479 |
strang | +2.411 |
quirks | +2.380 |
Neg logit contributions | |
ounge | -12.071 |
practiced | -11.930 |
anguage | -11.775 |
�� | -11.700 |
soType | -11.565 |
Token | said |
Token ID | 531 |
Feature activation | +7.50e-02 |
Pos logit contributions | |
Supplement | +0.229 |
appendix | +0.228 |
defences | +0.215 |
strang | +0.206 |
gard | +0.199 |
Neg logit contributions | |
practiced | -0.287 |
ounge | -0.285 |
thus | -0.272 |
UA | -0.271 |
ildo | -0.266 |
Token | the |
Token ID | 262 |
Feature activation | -2.31e-01 |
Pos logit contributions | |
Supplement | +0.358 |
appendix | +0.356 |
defences | +0.336 |
strang | +0.322 |
gard | +0.312 |
Neg logit contributions | |
practiced | -0.439 |
ounge | -0.436 |
thus | -0.415 |
UA | -0.415 |
ildo | -0.407 |
Token | � |
Token ID | 564 |
Feature activation | -3.80e-01 |
Pos logit contributions | |
practiced | +1.427 |
ounge | +1.402 |
UA | +1.346 |
thus | +1.344 |
ildo | +1.310 |
Neg logit contributions | |
Supplement | -1.032 |
appendix | -1.002 |
defences | -0.951 |
strang | -0.901 |
gard | -0.869 |
Token | � |
Token ID | 250 |
Feature activation | +2.43e-02 |
Pos logit contributions | |
practiced | +1.646 |
ounge | +1.601 |
thus | +1.535 |
UA | +1.510 |
ildo | +1.458 |
Neg logit contributions | |
appendix | -2.381 |
Supplement | -2.373 |
defences | -2.287 |
strang | -2.216 |
gard | -2.150 |
Token | of |
Token ID | 286 |
Feature activation | -3.33e-01 |
Pos logit contributions | |
practiced | +1.188 |
ounge | +1.172 |
UA | +1.131 |
thus | +1.109 |
ildo | +1.093 |
Neg logit contributions | |
Supplement | -0.959 |
appendix | -0.955 |
defences | -0.913 |
strang | -0.885 |
gard | -0.824 |
Token | the |
Token ID | 262 |
Feature activation | -1.44e-01 |
Pos logit contributions | |
practiced | +1.883 |
ounge | +1.851 |
thus | +1.768 |
UA | +1.765 |
ildo | +1.724 |
Neg logit contributions | |
Supplement | -1.630 |
appendix | -1.618 |
defences | -1.550 |
strang | -1.486 |
gard | -1.423 |
Token | Coalition |
Token ID | 15135 |
Feature activation | +3.64e-01 |
Pos logit contributions | |
practiced | +0.832 |
ounge | +0.825 |
thus | +0.785 |
UA | +0.784 |
ildo | +0.767 |
Neg logit contributions | |
Supplement | -0.695 |
appendix | -0.690 |
defences | -0.657 |
strang | -0.628 |
gard | -0.606 |
Token | for |
Token ID | 329 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
Supplement | +1.751 |
appendix | +1.742 |
defences | +1.640 |
strang | +1.574 |
gard | +1.533 |
Neg logit contributions | |
ounge | -2.118 |
practiced | -2.113 |
thus | -2.012 |
UA | -1.998 |
ildo | -1.969 |
Token | the |
Token ID | 262 |
Feature activation | +5.31e-01 |
Pos logit contributions | |
Supplement | +1.523 |
appendix | +1.510 |
defences | +1.416 |
strang | +1.367 |
gard | +1.324 |
Neg logit contributions | |
practiced | -1.851 |
ounge | -1.849 |
UA | -1.762 |
thus | -1.754 |
ildo | -1.724 |
Token | Homeless |
Token ID | 47706 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
Supplement | +1.779 |
appendix | +1.755 |
defences | +1.596 |
strang | +1.517 |
gard | +1.458 |
Neg logit contributions | |
ounge | -3.868 |
practiced | -3.843 |
UA | -3.710 |
thus | -3.668 |
ildo | -3.652 |
Token | , |
Token ID | 11 |
Feature activation | -7.31e-01 |
Pos logit contributions | |
appendix | +6.557 |
Supplement | +6.540 |
defences | +5.838 |
strang | +5.615 |
gard | +5.560 |
Neg logit contributions | |
ounge | -9.043 |
practiced | -8.802 |
UA | -8.491 |
thus | -8.459 |
ildo | -8.436 |
Token | � |
Token ID | 1587 |
Feature activation | -3.74e-02 |
Pos logit contributions | |
practiced | +4.214 |
ounge | +4.059 |
thus | +3.950 |
UA | +3.936 |
ildo | +3.826 |
Neg logit contributions | |
Supplement | -3.433 |
appendix | -3.382 |
defences | -3.279 |
strang | -3.082 |
gard | -2.945 |
Token | � |
Token ID | 241 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
practiced | +0.170 |
ounge | +0.169 |
thus | +0.159 |
UA | +0.158 |
ildo | +0.155 |
Neg logit contributions | |
Supplement | -0.227 |
appendix | -0.227 |
defences | -0.216 |
strang | -0.210 |
gard | -0.205 |
Token | the |
Token ID | 1169 |
Feature activation | -3.71e-02 |
Pos logit contributions | |
Supplement | +0.623 |
appendix | +0.619 |
defences | +0.590 |
strang | +0.571 |
gard | +0.557 |
Neg logit contributions | |
practiced | -0.517 |
ounge | -0.517 |
UA | -0.483 |
thus | -0.482 |
ildo | -0.474 |
Token | city |
Token ID | 1748 |
Feature activation | +3.76e-01 |
Pos logit contributions | |
practiced | +0.216 |
ounge | +0.215 |
thus | +0.204 |
UA | +0.204 |
ildo | +0.200 |
Neg logit contributions | |
Supplement | -0.178 |
appendix | -0.177 |
defences | -0.167 |
strang | -0.160 |
gard | -0.155 |
Token | authorized |
Token ID | 10435 |
Feature activation | +7.12e-01 |
Pos logit contributions | |
Supplement | +3.475 |
appendix | +3.444 |
defences | +3.259 |
strang | +3.153 |
gard | +3.104 |
Neg logit contributions | |
ounge | -3.771 |
practiced | -3.717 |
thus | -3.556 |
UA | -3.552 |
ildo | -3.493 |
Token | to |
Token ID | 284 |
Feature activation | +8.77e-01 |
Pos logit contributions | |
Supplement | +3.536 |
appendix | +3.530 |
defences | +3.330 |
strang | +3.200 |
gard | +3.115 |
Neg logit contributions | |
practiced | -4.012 |
ounge | -3.996 |
thus | -3.801 |
UA | -3.786 |
ildo | -3.714 |
Token | speak |
Token ID | 2740 |
Feature activation | +8.42e-01 |
Pos logit contributions | |
appendix | +4.139 |
Supplement | +4.093 |
defences | +3.784 |
strang | +3.704 |
gard | +3.631 |
Neg logit contributions | |
ounge | -5.025 |
practiced | -4.945 |
UA | -4.853 |
thus | -4.775 |
ildo | -4.608 |
Token | to |
Token ID | 284 |
Feature activation | +9.47e-01 |
Pos logit contributions | |
appendix | +3.870 |
Supplement | +3.862 |
defences | +3.637 |
strang | +3.468 |
gard | +3.421 |
Neg logit contributions | |
ounge | -4.966 |
practiced | -4.932 |
UA | -4.726 |
thus | -4.693 |
ildo | -4.636 |
Token | the |
Token ID | 262 |
Feature activation | +4.23e-01 |
Pos logit contributions | |
appendix | +4.208 |
Supplement | +4.147 |
defences | +3.972 |
gard | +3.770 |
strang | +3.749 |
Neg logit contributions | |
ounge | -5.642 |
practiced | -5.611 |
thus | -5.363 |
UA | -5.340 |
ildo | -5.220 |
Token | media |
Token ID | 2056 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
appendix | +2.048 |
Supplement | +2.046 |
defences | +1.929 |
strang | +1.855 |
gard | +1.817 |
Neg logit contributions | |
ounge | -2.414 |
practiced | -2.403 |
thus | -2.288 |
UA | -2.287 |
ildo | -2.249 |
Token | about |
Token ID | 546 |
Feature activation | +7.15e-01 |
Pos logit contributions | |
appendix | +6.240 |
Supplement | +6.047 |
defences | +5.686 |
gard | +5.466 |
strang | +5.312 |
Neg logit contributions | |
ounge | -9.267 |
practiced | -8.995 |
UA | -8.838 |
ildo | -8.697 |
thus | -8.587 |
Token | the |
Token ID | 262 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
appendix | +3.147 |
Supplement | +3.130 |
defences | +2.932 |
strang | +2.808 |
gard | +2.731 |
Neg logit contributions | |
practiced | -4.404 |
ounge | -4.395 |
thus | -4.206 |
UA | -4.192 |
ildo | -4.137 |
Token | diplomatic |
Token ID | 13093 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
appendix | +1.766 |
Supplement | +1.755 |
defences | +1.664 |
strang | +1.618 |
gard | +1.572 |
Neg logit contributions | |
ounge | -1.773 |
practiced | -1.772 |
thus | -1.678 |
UA | -1.671 |
ildo | -1.647 |
Token | talks |
Token ID | 6130 |
Feature activation | -7.42e-02 |
Pos logit contributions | |
appendix | +1.915 |
Supplement | +1.889 |
defences | +1.803 |
strang | +1.749 |
gard | +1.693 |
Neg logit contributions | |
ounge | -2.016 |
practiced | -2.010 |
thus | -1.905 |
UA | -1.896 |
ildo | -1.863 |
Token | , |
Token ID | 11 |
Feature activation | +5.29e-01 |
Pos logit contributions | |
practiced | +0.402 |
ounge | +0.392 |
thus | +0.377 |
UA | +0.373 |
ildo | +0.364 |
Neg logit contributions | |
Supplement | -0.393 |
appendix | -0.389 |
defences | -0.374 |
strang | -0.358 |
gard | -0.345 |
Token | was |
Token ID | 373 |
Feature activation | -4.32e-01 |
Pos logit contributions | |
Supplement | +0.202 |
appendix | +0.201 |
defences | +0.189 |
strang | +0.181 |
gard | +0.175 |
Neg logit contributions | |
practiced | -0.271 |
ounge | -0.269 |
thus | -0.257 |
UA | -0.256 |
ildo | -0.251 |
Token | still |
Token ID | 991 |
Feature activation | -4.02e-01 |
Pos logit contributions | |
practiced | +2.385 |
ounge | +2.327 |
thus | +2.225 |
UA | +2.208 |
ildo | +2.174 |
Neg logit contributions | |
Supplement | -2.214 |
appendix | -2.187 |
defences | -2.073 |
strang | -1.996 |
gard | -1.945 |
Token | plenty |
Token ID | 6088 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
practiced | +2.280 |
ounge | +2.241 |
thus | +2.131 |
UA | +2.124 |
ildo | +2.083 |
Neg logit contributions | |
Supplement | -2.005 |
appendix | -1.973 |
defences | -1.857 |
strang | -1.793 |
gard | -1.749 |
Token | of |
Token ID | 286 |
Feature activation | -8.49e-01 |
Pos logit contributions | |
practiced | +5.879 |
ounge | +5.381 |
UA | +5.281 |
thus | +4.987 |
ildo | +4.974 |
Neg logit contributions | |
Supplement | -6.245 |
appendix | -6.142 |
defences | -5.660 |
erald | -5.566 |
strang | -5.563 |
Token | work |
Token ID | 670 |
Feature activation | -9.39e-01 |
Pos logit contributions | |
practiced | +4.465 |
ounge | +4.246 |
UA | +4.007 |
thus | +4.005 |
ildo | +3.894 |
Neg logit contributions | |
Supplement | -4.572 |
appendix | -4.356 |
defences | -4.053 |
strang | -3.948 |
erald | -3.937 |
Token | to |
Token ID | 284 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
practiced | +4.586 |
ounge | +4.248 |
thus | +4.137 |
UA | +4.083 |
ildo | +3.909 |
Neg logit contributions | |
appendix | -5.245 |
Supplement | -5.221 |
strang | -4.905 |
defences | -4.882 |
erald | -4.679 |
Token | do |
Token ID | 466 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
practiced | +7.266 |
ounge | +6.171 |
thus | +5.936 |
ildo | +5.884 |
UA | +5.666 |
Neg logit contributions | |
appendix | -11.548 |
Supplement | -11.464 |
andestine | -11.001 |
strang | -10.869 |
defences | -10.712 |
Token | if |
Token ID | 611 |
Feature activation | -5.77e-01 |
Pos logit contributions | |
practiced | +5.940 |
ounge | +5.619 |
thus | +5.517 |
UA | +5.353 |
ildo | +5.164 |
Neg logit contributions | |
Supplement | -5.944 |
appendix | -5.891 |
strang | -5.474 |
defences | -5.428 |
gard | -5.209 |
Token | the |
Token ID | 262 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
practiced | +3.837 |
ounge | +3.759 |
thus | +3.649 |
UA | +3.614 |
ildo | +3.517 |
Neg logit contributions | |
Supplement | -2.293 |
appendix | -2.245 |
defences | -2.058 |
strang | -1.987 |
gard | -1.916 |
Token | season |
Token ID | 1622 |
Feature activation | +4.77e-03 |
Pos logit contributions | |
practiced | +0.069 |
ounge | +0.069 |
thus | +0.066 |
UA | +0.065 |
ildo | +0.064 |
Neg logit contributions | |
Supplement | -0.063 |
appendix | -0.063 |
defences | -0.059 |
strang | -0.057 |
gard | -0.056 |
Token | was |
Token ID | 373 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
Supplement | +0.021 |
appendix | +0.021 |
defences | +0.020 |
strang | +0.019 |
gard | +0.018 |
Neg logit contributions | |
practiced | -0.030 |
ounge | -0.029 |
thus | -0.028 |
UA | -0.028 |
ildo | -0.027 |
Token | still |
Token ID | 991 |
Feature activation | -2.50e-01 |
Pos logit contributions | |
practiced | +0.588 |
ounge | +0.584 |
thus | +0.556 |
UA | +0.556 |
ildo | +0.545 |
Neg logit contributions | |
Supplement | -0.477 |
appendix | -0.474 |
defences | -0.447 |
strang | -0.429 |
gard | -0.416 |
Token | has |
Token ID | 468 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
practiced | +1.567 |
ounge | +1.537 |
thus | +1.470 |
UA | +1.463 |
ildo | +1.436 |
Neg logit contributions | |
Supplement | -1.110 |
appendix | -1.091 |
defences | -1.029 |
strang | -0.981 |
gard | -0.945 |
Token | a |
Token ID | 257 |
Feature activation | -3.87e-01 |
Pos logit contributions | |
practiced | +1.755 |
ounge | +1.731 |
thus | +1.644 |
UA | +1.644 |
ildo | +1.603 |
Neg logit contributions | |
Supplement | -1.417 |
appendix | -1.395 |
defences | -1.305 |
strang | -1.258 |
gard | -1.222 |
Token | long |
Token ID | 890 |
Feature activation | -8.56e-01 |
Pos logit contributions | |
practiced | +2.271 |
ounge | +2.226 |
thus | +2.115 |
UA | +2.098 |
ildo | +2.067 |
Neg logit contributions | |
Supplement | -1.862 |
appendix | -1.827 |
defences | -1.732 |
strang | -1.654 |
gard | -1.604 |
Token | way |
Token ID | 835 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
practiced | +5.045 |
ounge | +4.968 |
thus | +4.713 |
UA | +4.692 |
ildo | +4.580 |
Neg logit contributions | |
Supplement | -3.925 |
appendix | -3.842 |
defences | -3.599 |
strang | -3.463 |
gard | -3.370 |
Token | to |
Token ID | 284 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
practiced | +4.332 |
ounge | +4.087 |
thus | +3.810 |
UA | +3.662 |
ildo | +3.544 |
Neg logit contributions | |
Supplement | -6.240 |
appendix | -6.225 |
defences | -5.797 |
strang | -5.757 |
erald | -5.659 |
Token | go |
Token ID | 467 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
practiced | +7.900 |
ounge | +7.211 |
thus | +7.079 |
fray | +6.892 |
ildo | +6.746 |
Neg logit contributions | |
Supplement | -10.840 |
appendix | -10.326 |
defences | -10.084 |
andestine | -9.849 |
strang | -9.484 |
Token | with |
Token ID | 351 |
Feature activation | -8.96e-01 |
Pos logit contributions | |
practiced | +5.385 |
ounge | +5.229 |
thus | +4.990 |
UA | +4.895 |
ildo | +4.739 |
Neg logit contributions | |
Supplement | -6.004 |
appendix | -5.965 |
defences | -5.539 |
strang | -5.488 |
gard | -5.292 |
Token | mobile |
Token ID | 5175 |
Feature activation | -5.55e-01 |
Pos logit contributions | |
practiced | +4.721 |
ounge | +4.625 |
UA | +4.368 |
thus | +4.354 |
ildo | +4.227 |
Neg logit contributions | |
Supplement | -4.699 |
appendix | -4.558 |
defences | -4.263 |
strang | -4.134 |
gard | -4.086 |
Token | users |
Token ID | 2985 |
Feature activation | -3.54e-01 |
Pos logit contributions | |
practiced | +3.027 |
ounge | +3.002 |
UA | +2.878 |
thus | +2.796 |
ildo | +2.735 |
Neg logit contributions | |
Supplement | -2.860 |
appendix | -2.804 |
defences | -2.602 |
strang | -2.550 |
gard | -2.504 |
Token | , |
Token ID | 11 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
practiced | +1.907 |
ounge | +1.886 |
thus | +1.775 |
UA | +1.760 |
ildo | +1.725 |
Neg logit contributions | |
Supplement | -1.878 |
appendix | -1.863 |
defences | -1.763 |
strang | -1.706 |
gard | -1.654 |
Token | 's |
Token ID | 338 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
practiced | +2.378 |
ounge | +2.322 |
thus | +2.226 |
UA | +2.180 |
ildo | +2.140 |
Neg logit contributions | |
Supplement | -1.815 |
appendix | -1.783 |
defences | -1.681 |
strang | -1.606 |
gard | -1.541 |
Token | still |
Token ID | 991 |
Feature activation | -4.89e-01 |
Pos logit contributions | |
practiced | +2.381 |
ounge | +2.276 |
thus | +2.171 |
UA | +2.137 |
ildo | +2.099 |
Neg logit contributions | |
Supplement | -2.173 |
appendix | -2.129 |
defences | -2.007 |
strang | -1.919 |
gard | -1.882 |
Token | a |
Token ID | 257 |
Feature activation | -5.35e-01 |
Pos logit contributions | |
practiced | +2.813 |
ounge | +2.712 |
thus | +2.596 |
UA | +2.560 |
ildo | +2.501 |
Neg logit contributions | |
Supplement | -2.413 |
appendix | -2.361 |
defences | -2.226 |
strang | -2.121 |
gard | -2.083 |
Token | long |
Token ID | 890 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
practiced | +2.852 |
ounge | +2.745 |
thus | +2.617 |
UA | +2.567 |
ildo | +2.526 |
Neg logit contributions | |
Supplement | -2.829 |
appendix | -2.775 |
defences | -2.650 |
strang | -2.514 |
gard | -2.466 |
Token | way |
Token ID | 835 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
practiced | +6.547 |
ounge | +6.344 |
thus | +6.126 |
UA | +5.964 |
fray | +5.811 |
Neg logit contributions | |
Supplement | -5.596 |
appendix | -5.387 |
defences | -5.217 |
strang | -4.867 |
gard | -4.857 |
Token | to |
Token ID | 284 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
practiced | +4.484 |
ounge | +4.175 |
thus | +4.025 |
UA | +3.901 |
fray | +3.714 |
Neg logit contributions | |
Supplement | -6.332 |
appendix | -6.329 |
defences | -5.922 |
erald | -5.764 |
strang | -5.721 |
Token | go |
Token ID | 467 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
practiced | +7.439 |
ounge | +6.690 |
thus | +6.473 |
fray | +6.363 |
ildo | +6.135 |
Neg logit contributions | |
Supplement | -11.002 |
appendix | -10.603 |
defences | -10.490 |
andestine | -10.254 |
erald | -9.855 |
Token | to |
Token ID | 284 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
practiced | +5.396 |
thus | +4.989 |
ounge | +4.979 |
UA | +4.786 |
ildo | +4.544 |
Neg logit contributions | |
appendix | -7.097 |
Supplement | -7.060 |
defences | -6.644 |
strang | -6.500 |
erald | -6.313 |
Token | prove |
Token ID | 5879 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
practiced | +6.634 |
ounge | +6.345 |
fray | +6.113 |
thus | +6.075 |
ildo | +6.039 |
Neg logit contributions | |
Supplement | -5.294 |
appendix | -5.079 |
defences | -4.748 |
andestine | -4.610 |
erald | -4.471 |
Token | whether |
Token ID | 1771 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
Supplement | +0.833 |
appendix | +0.830 |
defences | +0.788 |
strang | +0.761 |
gard | +0.740 |
Neg logit contributions | |
practiced | -0.787 |
ounge | -0.784 |
thus | -0.740 |
UA | -0.739 |
ildo | -0.724 |
Token | or |
Token ID | 393 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
appendix | +1.279 |
Supplement | +1.278 |
defences | +1.201 |
strang | +1.155 |
gard | +1.113 |
Neg logit contributions | |
ounge | -1.690 |
practiced | -1.677 |
UA | -1.602 |
thus | -1.600 |
ildo | -1.575 |
Token | it |
Token ID | 340 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
practiced | +1.893 |
ounge | +1.849 |
thus | +1.770 |
UA | +1.769 |
ildo | +1.723 |
Neg logit contributions | |
Supplement | -1.813 |
appendix | -1.784 |
defences | -1.686 |
strang | -1.611 |
gard | -1.579 |
Token | has |
Token ID | 468 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
Supplement | +0.520 |
appendix | +0.518 |
defences | +0.490 |
strang | +0.471 |
gard | +0.457 |
Neg logit contributions | |
practiced | -0.592 |
ounge | -0.591 |
thus | -0.560 |
UA | -0.560 |
ildo | -0.550 |
Token | a |
Token ID | 257 |
Feature activation | -5.41e-01 |
Pos logit contributions | |
practiced | +0.822 |
ounge | +0.807 |
thus | +0.768 |
UA | +0.765 |
ildo | +0.751 |
Neg logit contributions | |
Supplement | -0.680 |
appendix | -0.672 |
defences | -0.631 |
strang | -0.606 |
gard | -0.588 |
Token | long |
Token ID | 890 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
practiced | +3.266 |
ounge | +3.166 |
thus | +3.025 |
UA | +2.981 |
ildo | +2.971 |
Neg logit contributions | |
Supplement | -2.512 |
appendix | -2.451 |
defences | -2.326 |
strang | -2.186 |
gard | -2.138 |
Token | way |
Token ID | 835 |
Feature activation | -9.42e-01 |
Pos logit contributions | |
practiced | +5.625 |
ounge | +5.398 |
thus | +5.182 |
UA | +4.966 |
ildo | +4.947 |
Neg logit contributions | |
Supplement | -5.722 |
appendix | -5.529 |
defences | -5.319 |
strang | -5.033 |
gard | -5.028 |
Token | to |
Token ID | 284 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
practiced | +4.185 |
ounge | +3.894 |
thus | +3.716 |
UA | +3.557 |
ildo | +3.519 |
Neg logit contributions | |
Supplement | -5.634 |
appendix | -5.555 |
defences | -5.233 |
erald | -5.144 |
strang | -5.103 |
Token | go |
Token ID | 467 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
practiced | +7.550 |
ounge | +6.921 |
thus | +6.873 |
ildo | +6.539 |
fray | +6.490 |
Neg logit contributions | |
Supplement | -10.662 |
defences | -10.122 |
appendix | -10.088 |
andestine | -9.767 |
erald | -9.494 |
Token | in |
Token ID | 287 |
Feature activation | -7.48e-01 |
Pos logit contributions | |
practiced | +5.642 |
ounge | +5.392 |
thus | +5.315 |
UA | +5.142 |
ildo | +5.067 |
Neg logit contributions | |
Supplement | -6.294 |
appendix | -6.288 |
defences | -5.892 |
strang | -5.774 |
gard | -5.601 |
Token | reporting |
Token ID | 6447 |
Feature activation | -5.23e-01 |
Pos logit contributions | |
practiced | +3.942 |
ounge | +3.852 |
thus | +3.652 |
ildo | +3.602 |
UA | +3.594 |
Neg logit contributions | |
Supplement | -3.951 |
appendix | -3.848 |
defences | -3.638 |
strang | -3.465 |
gard | -3.441 |
Token | on |
Token ID | 319 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
practiced | +3.213 |
ounge | +3.129 |
thus | +3.020 |
UA | +2.992 |
ildo | +2.936 |
Neg logit contributions | |
Supplement | -2.370 |
appendix | -2.312 |
defences | -2.179 |
strang | -2.065 |
gard | -2.005 |
Token | communities |
Token ID | 5348 |
Feature activation | -2.59e-02 |
Pos logit contributions | |
practiced | +1.388 |
ounge | +1.372 |
thus | +1.310 |
UA | +1.306 |
ildo | +1.283 |
Neg logit contributions | |
Supplement | -1.125 |
appendix | -1.113 |
defences | -1.050 |
strang | -1.004 |
gard | -0.976 |
Token | that |
Token ID | 326 |
Feature activation | -5.56e-01 |
Pos logit contributions | |
practiced | +4.118 |
ounge | +3.920 |
UA | +3.837 |
thus | +3.774 |
ildo | +3.710 |
Neg logit contributions | |
Supplement | -4.417 |
appendix | -4.390 |
defences | -4.233 |
strang | -4.078 |
gard | -3.927 |
Token | there |
Token ID | 612 |
Feature activation | -4.16e-01 |
Pos logit contributions | |
practiced | +3.232 |
ounge | +3.144 |
thus | +3.036 |
UA | +3.031 |
ildo | +2.949 |
Neg logit contributions | |
Supplement | -2.635 |
appendix | -2.612 |
defences | -2.482 |
strang | -2.386 |
gard | -2.293 |
Token | is |
Token ID | 318 |
Feature activation | -9.11e-01 |
Pos logit contributions | |
practiced | +2.586 |
ounge | +2.545 |
thus | +2.434 |
UA | +2.421 |
ildo | +2.384 |
Neg logit contributions | |
Supplement | -1.830 |
appendix | -1.817 |
defences | -1.704 |
strang | -1.646 |
gard | -1.563 |
Token | still |
Token ID | 991 |
Feature activation | -8.57e-01 |
Pos logit contributions | |
practiced | +5.173 |
ounge | +4.915 |
thus | +4.728 |
UA | +4.669 |
ildo | +4.647 |
Neg logit contributions | |
Supplement | -4.429 |
appendix | -4.374 |
defences | -4.151 |
strang | -3.938 |
gard | -3.824 |
Token | work |
Token ID | 670 |
Feature activation | -9.59e-01 |
Pos logit contributions | |
practiced | +4.740 |
ounge | +4.555 |
thus | +4.352 |
UA | +4.327 |
ildo | +4.262 |
Neg logit contributions | |
Supplement | -4.284 |
appendix | -4.221 |
defences | -4.006 |
strang | -3.837 |
gard | -3.752 |
Token | to |
Token ID | 284 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
practiced | +4.614 |
ounge | +4.334 |
thus | +4.199 |
UA | +4.148 |
ildo | +3.990 |
Neg logit contributions | |
Supplement | -5.344 |
appendix | -5.318 |
defences | -5.067 |
strang | -4.925 |
erald | -4.738 |
Token | do |
Token ID | 466 |
Feature activation | -9.60e-01 |
Pos logit contributions | |
practiced | +6.603 |
ounge | +5.733 |
ildo | +5.601 |
thus | +5.533 |
UA | +5.195 |
Neg logit contributions | |
appendix | -10.897 |
Supplement | -10.861 |
defences | -10.573 |
strang | -10.291 |
andestine | -10.146 |
Token | , |
Token ID | 11 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
practiced | +4.647 |
ounge | +4.395 |
thus | +4.340 |
UA | +4.210 |
ildo | +4.054 |
Neg logit contributions | |
Supplement | -5.291 |
appendix | -5.269 |
defences | -5.089 |
strang | -4.924 |
gard | -4.717 |
Token | we |
Token ID | 356 |
Feature activation | -8.28e-01 |
Pos logit contributions | |
practiced | +0.822 |
ounge | +0.809 |
thus | +0.777 |
UA | +0.773 |
ildo | +0.751 |
Neg logit contributions | |
Supplement | -0.764 |
appendix | -0.761 |
defences | -0.729 |
strang | -0.703 |
gard | -0.678 |
Token | are |
Token ID | 389 |
Feature activation | -6.79e-01 |
Pos logit contributions | |
practiced | +4.945 |
ounge | +4.552 |
thus | +4.526 |
UA | +4.395 |
ildo | +4.338 |
Neg logit contributions | |
Supplement | -3.793 |
appendix | -3.759 |
defences | -3.659 |
strang | -3.519 |
gard | -3.330 |
Token | proud |
Token ID | 6613 |
Feature activation | +5.49e-01 |
Pos logit contributions | |
practiced | +3.625 |
ounge | +3.370 |
thus | +3.331 |
UA | +3.191 |
ildo | +3.116 |
Neg logit contributions | |
Supplement | -3.598 |
appendix | -3.597 |
defences | -3.460 |
strang | -3.313 |
erald | -3.179 |
Token | a |
Token ID | 257 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
practiced | +1.490 |
ounge | +1.465 |
UA | +1.394 |
thus | +1.394 |
ildo | +1.360 |
Neg logit contributions | |
Supplement | -1.115 |
appendix | -1.107 |
defences | -1.040 |
strang | -0.996 |
gard | -0.960 |
Token | link |
Token ID | 2792 |
Feature activation | -1.91e-01 |
Pos logit contributions | |
practiced | +1.690 |
ounge | +1.674 |
thus | +1.600 |
UA | +1.596 |
ildo | +1.567 |
Neg logit contributions | |
Supplement | -1.226 |
appendix | -1.214 |
defences | -1.148 |
strang | -1.086 |
gard | -1.052 |
Token | back |
Token ID | 736 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
practiced | +1.063 |
ounge | +1.056 |
thus | +1.003 |
UA | +0.997 |
ildo | +0.980 |
Neg logit contributions | |
Supplement | -0.962 |
appendix | -0.957 |
defences | -0.911 |
strang | -0.873 |
gard | -0.847 |
Token | to |
Token ID | 284 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
practiced | +1.013 |
ounge | +1.009 |
thus | +0.958 |
UA | +0.954 |
ildo | +0.934 |
Neg logit contributions | |
Supplement | -0.944 |
appendix | -0.939 |
defences | -0.893 |
strang | -0.857 |
gard | -0.832 |
Token | your |
Token ID | 534 |
Feature activation | -6.72e-01 |
Pos logit contributions | |
practiced | +1.589 |
ounge | +1.580 |
UA | +1.501 |
thus | +1.489 |
ildo | +1.460 |
Neg logit contributions | |
Supplement | -1.389 |
appendix | -1.373 |
defences | -1.320 |
strang | -1.248 |
gard | -1.211 |
Token | Instagram |
Token ID | 10767 |
Feature activation | -1.76e+00 |
Pos logit contributions | |
practiced | +3.738 |
ounge | +3.703 |
UA | +3.558 |
thus | +3.498 |
ildo | +3.384 |
Neg logit contributions | |
Supplement | -3.300 |
appendix | -3.225 |
defences | -3.134 |
strang | -2.933 |
erald | -2.903 |
Token | , |
Token ID | 11 |
Feature activation | -9.12e-01 |
Pos logit contributions | |
ounge | +8.112 |
practiced | +7.783 |
UA | +7.617 |
thus | +7.572 |
artist | +7.241 |
Neg logit contributions | |
appendix | -8.915 |
Supplement | -8.830 |
defences | -8.494 |
strang | -8.219 |
erald | -8.120 |
Token | Fac |
Token ID | 13585 |
Feature activation | -4.67e-01 |
Pos logit contributions | |
practiced | +4.739 |
ounge | +4.712 |
thus | +4.500 |
UA | +4.468 |
ildo | +4.401 |
Neg logit contributions | |
Supplement | -4.707 |
appendix | -4.649 |
defences | -4.463 |
strang | -4.186 |
gard | -4.106 |
Token | be |
Token ID | 1350 |
Feature activation | -7.34e-01 |
Pos logit contributions | |
practiced | +1.910 |
ounge | +1.902 |
thus | +1.808 |
UA | +1.769 |
ildo | +1.750 |
Neg logit contributions | |
appendix | -3.030 |
Supplement | -3.015 |
defences | -2.892 |
strang | -2.809 |
gard | -2.751 |
Token | ook |
Token ID | 566 |
Feature activation | -3.10e-01 |
Pos logit contributions | |
ounge | +3.742 |
practiced | +3.674 |
thus | +3.510 |
UA | +3.488 |
ildo | +3.419 |
Neg logit contributions | |
appendix | -4.032 |
Supplement | -3.981 |
defences | -3.810 |
strang | -3.635 |
gard | -3.538 |
Token | Page |
Token ID | 7873 |
Feature activation | -5.91e-01 |
Pos logit contributions | |
ounge | +1.730 |
practiced | +1.715 |
thus | +1.636 |
UA | +1.634 |
ildo | +1.593 |
Neg logit contributions | |
appendix | -1.561 |
Supplement | -1.556 |
defences | -1.484 |
strang | -1.418 |
gard | -1.377 |
Token | Had |
Token ID | 25383 |
Feature activation | -2.69e-01 |
Pos logit contributions | |
Supplement | +0.720 |
appendix | +0.699 |
defences | +0.660 |
strang | +0.641 |
gard | +0.627 |
Neg logit contributions | |
ounge | -0.581 |
practiced | -0.565 |
thus | -0.532 |
ildo | -0.527 |
UA | -0.523 |
Token | Enough |
Token ID | 47323 |
Feature activation | -2.75e-01 |
Pos logit contributions | |
ounge | +1.394 |
practiced | +1.394 |
thus | +1.305 |
UA | +1.296 |
ildo | +1.285 |
Neg logit contributions | |
Supplement | -1.484 |
appendix | -1.458 |
defences | -1.388 |
strang | -1.335 |
gard | -1.298 |
Token | . |
Token ID | 13 |
Feature activation | +3.37e-02 |
Pos logit contributions | |
practiced | +1.440 |
ounge | +1.407 |
thus | +1.351 |
UA | +1.349 |
ildo | +1.303 |
Neg logit contributions | |
Supplement | -1.470 |
appendix | -1.470 |
defences | -1.392 |
strang | -1.335 |
gard | -1.296 |
Token | In |
Token ID | 554 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
Supplement | +0.170 |
appendix | +0.169 |
defences | +0.159 |
strang | +0.154 |
gard | +0.149 |
Neg logit contributions | |
practiced | -0.188 |
ounge | -0.188 |
thus | -0.177 |
UA | -0.176 |
ildo | -0.173 |
Token | the |
Token ID | 262 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
practiced | +1.793 |
ounge | +1.771 |
thus | +1.689 |
UA | +1.674 |
ildo | +1.646 |
Neg logit contributions | |
Supplement | -1.534 |
appendix | -1.516 |
defences | -1.431 |
strang | -1.372 |
gard | -1.335 |
Token | Kal |
Token ID | 12612 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
practiced | +2.945 |
ounge | +2.913 |
thus | +2.767 |
UA | +2.750 |
ildo | +2.705 |
Neg logit contributions | |
Supplement | -2.301 |
appendix | -2.235 |
defences | -2.125 |
strang | -1.988 |
gard | -1.960 |
Token | uga |
Token ID | 30302 |
Feature activation | -2.84e-01 |
Pos logit contributions | |
ounge | +2.519 |
thus | +2.235 |
practiced | +2.188 |
ining | +2.129 |
ildo | +1.916 |
Neg logit contributions | |
defences | -14.511 |
appendix | -14.374 |
Supplement | -14.214 |
strang | -13.955 |
gard | -13.805 |
Token | region |
Token ID | 3814 |
Feature activation | -3.98e-02 |
Pos logit contributions | |
practiced | +1.569 |
ounge | +1.563 |
UA | +1.484 |
thus | +1.482 |
ildo | +1.453 |
Neg logit contributions | |
Supplement | -1.450 |
appendix | -1.437 |
defences | -1.362 |
strang | -1.308 |
gard | -1.274 |
Token | , |
Token ID | 11 |
Feature activation | -2.95e-02 |
Pos logit contributions | |
practiced | +0.229 |
ounge | +0.225 |
UA | +0.214 |
thus | +0.212 |
ildo | +0.209 |
Neg logit contributions | |
Supplement | -0.198 |
appendix | -0.196 |
defences | -0.185 |
strang | -0.177 |
gard | -0.171 |
Token | the |
Token ID | 262 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
practiced | +0.170 |
ounge | +0.170 |
thus | +0.161 |
UA | +0.161 |
ildo | +0.158 |
Neg logit contributions | |
Supplement | -0.143 |
appendix | -0.142 |
defences | -0.134 |
strang | -0.129 |
gard | -0.125 |
Token | regional |
Token ID | 7915 |
Feature activation | -7.30e-02 |
Pos logit contributions | |
practiced | +0.798 |
ounge | +0.793 |
thus | +0.754 |
UA | +0.753 |
ildo | +0.739 |
Neg logit contributions | |
Supplement | -0.640 |
appendix | -0.634 |
defences | -0.597 |
strang | -0.571 |
gard | -0.554 |
Token | becoming |
Token ID | 5033 |
Feature activation | +2.35e-02 |
Pos logit contributions | |
practiced | +2.128 |
ounge | +2.072 |
thus | +1.987 |
UA | +1.943 |
ildo | +1.919 |
Neg logit contributions | |
Supplement | -1.622 |
appendix | -1.610 |
defences | -1.508 |
strang | -1.422 |
gard | -1.377 |
Token | grace |
Token ID | 11542 |
Feature activation | -5.24e-01 |
Pos logit contributions | |
Supplement | +0.110 |
appendix | +0.109 |
defences | +0.103 |
strang | +0.098 |
gard | +0.095 |
Neg logit contributions | |
practiced | -0.140 |
ounge | -0.138 |
thus | -0.133 |
UA | -0.131 |
ildo | -0.129 |
Token | ; |
Token ID | 26 |
Feature activation | -8.99e-01 |
Pos logit contributions | |
practiced | +2.776 |
ounge | +2.684 |
thus | +2.606 |
UA | +2.542 |
ildo | +2.494 |
Neg logit contributions | |
appendix | -2.783 |
Supplement | -2.779 |
defences | -2.636 |
strang | -2.515 |
gard | -2.446 |
Token | and |
Token ID | 290 |
Feature activation | -4.97e-01 |
Pos logit contributions | |
practiced | +5.250 |
ounge | +5.043 |
thus | +4.965 |
UA | +4.739 |
ildo | +4.683 |
Neg logit contributions | |
Supplement | -4.232 |
appendix | -4.170 |
defences | -3.907 |
strang | -3.675 |
gard | -3.572 |
Token | , |
Token ID | 11 |
Feature activation | -3.09e-01 |
Pos logit contributions | |
practiced | +2.949 |
ounge | +2.888 |
thus | +2.784 |
UA | +2.727 |
ildo | +2.687 |
Neg logit contributions | |
Supplement | -2.353 |
appendix | -2.315 |
defences | -2.180 |
strang | -2.065 |
gard | -2.006 |
Token | if |
Token ID | 611 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
practiced | +1.881 |
ounge | +1.866 |
thus | +1.786 |
UA | +1.772 |
ildo | +1.744 |
Neg logit contributions | |
Supplement | -1.408 |
appendix | -1.399 |
defences | -1.315 |
strang | -1.253 |
gard | -1.212 |
Token | you |
Token ID | 345 |
Feature activation | -6.30e-01 |
Pos logit contributions | |
practiced | +9.341 |
thus | +8.592 |
ounge | +8.448 |
UA | +7.910 |
fray | +7.910 |
Neg logit contributions | |
Supplement | -8.173 |
appendix | -7.756 |
defences | -7.107 |
erald | -6.787 |
andestine | -6.653 |
Token | perceive |
Token ID | 19973 |
Feature activation | -7.71e-01 |
Pos logit contributions | |
practiced | +3.743 |
ounge | +3.604 |
thus | +3.518 |
UA | +3.383 |
ildo | +3.361 |
Neg logit contributions | |
Supplement | -2.981 |
appendix | -2.907 |
defences | -2.759 |
strang | -2.587 |
erald | -2.521 |
Token | her |
Token ID | 607 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
practiced | +4.112 |
ounge | +3.906 |
thus | +3.818 |
UA | +3.658 |
ildo | +3.617 |
Neg logit contributions | |
Supplement | -4.073 |
appendix | -3.964 |
defences | -3.686 |
erald | -3.487 |
strang | -3.477 |
Token | afterwards |
Token ID | 12979 |
Feature activation | -4.58e-01 |
Pos logit contributions | |
practiced | +0.749 |
ounge | +0.739 |
thus | +0.704 |
UA | +0.696 |
ildo | +0.683 |
Neg logit contributions | |
Supplement | -0.680 |
appendix | -0.673 |
defences | -0.636 |
strang | -0.609 |
gard | -0.592 |
Token | dancing |
Token ID | 15360 |
Feature activation | -9.56e-01 |
Pos logit contributions | |
practiced | +2.523 |
ounge | +2.467 |
thus | +2.364 |
UA | +2.292 |
ildo | +2.284 |
Neg logit contributions | |
Supplement | -2.368 |
appendix | -2.345 |
defences | -2.210 |
strang | -2.096 |
gard | -2.042 |
Token | cigarette |
Token ID | 17779 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
practiced | +0.558 |
ounge | +0.555 |
thus | +0.528 |
UA | +0.525 |
ildo | +0.516 |
Neg logit contributions | |
Supplement | -0.478 |
appendix | -0.474 |
defences | -0.447 |
strang | -0.428 |
gard | -0.416 |
Token | brands |
Token ID | 11394 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
practiced | +0.972 |
ounge | +0.969 |
thus | +0.915 |
UA | +0.913 |
ildo | +0.898 |
Neg logit contributions | |
Supplement | -0.854 |
appendix | -0.841 |
defences | -0.796 |
strang | -0.760 |
gard | -0.748 |
Token | , |
Token ID | 11 |
Feature activation | -5.93e-01 |
Pos logit contributions | |
practiced | +1.230 |
ounge | +1.207 |
thus | +1.151 |
UA | +1.136 |
ildo | +1.108 |
Neg logit contributions | |
Supplement | -1.134 |
appendix | -1.116 |
defences | -1.064 |
strang | -1.021 |
gard | -0.996 |
Token | saw |
Token ID | 2497 |
Feature activation | -9.78e-01 |
Pos logit contributions | |
practiced | +3.105 |
ounge | +2.982 |
thus | +2.864 |
UA | +2.851 |
ildo | +2.759 |
Neg logit contributions | |
Supplement | -3.217 |
appendix | -3.154 |
defences | -3.022 |
strang | -2.867 |
gard | -2.802 |
Token | its |
Token ID | 663 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
practiced | +4.747 |
ounge | +4.599 |
UA | +4.407 |
thus | +4.328 |
ildo | +4.247 |
Neg logit contributions | |
Supplement | -5.476 |
appendix | -5.261 |
defences | -4.995 |
erald | -4.836 |
gard | -4.768 |
Token | stock |
Token ID | 4283 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
practiced | +4.439 |
ounge | +4.406 |
UA | +4.251 |
thus | +4.183 |
ildo | +4.081 |
Neg logit contributions | |
Supplement | -2.906 |
appendix | -2.809 |
defences | -2.632 |
strang | -2.468 |
gard | -2.449 |
Token | decline |
Token ID | 7794 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
practiced | +8.364 |
ounge | +8.184 |
fray | +7.988 |
thus | +7.908 |
UA | +7.752 |
Neg logit contributions | |
Supplement | -7.807 |
appendix | -7.435 |
defences | -7.128 |
andestine | -6.985 |
erald | -6.977 |
Token | more |
Token ID | 517 |
Feature activation | -3.07e-01 |
Pos logit contributions | |
practiced | +1.109 |
ounge | +1.105 |
thus | +1.047 |
UA | +1.046 |
ildo | +1.026 |
Neg logit contributions | |
Supplement | -1.034 |
appendix | -1.030 |
defences | -0.976 |
strang | -0.939 |
gard | -0.912 |
Token | than |
Token ID | 621 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
practiced | +1.596 |
ounge | +1.588 |
thus | +1.501 |
UA | +1.499 |
ildo | +1.468 |
Neg logit contributions | |
Supplement | -1.667 |
appendix | -1.659 |
defences | -1.577 |
strang | -1.521 |
gard | -1.479 |
Token | 4 |
Token ID | 604 |
Feature activation | +6.56e-02 |
Pos logit contributions | |
practiced | +1.917 |
ounge | +1.902 |
thus | +1.793 |
UA | +1.789 |
ildo | +1.751 |
Neg logit contributions | |
Supplement | -2.190 |
appendix | -2.171 |
defences | -2.069 |
strang | -1.998 |
gard | -1.945 |
Token | percent |
Token ID | 1411 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
Supplement | +0.292 |
appendix | +0.287 |
defences | +0.273 |
strang | +0.257 |
gard | +0.247 |
Neg logit contributions | |
practiced | -0.408 |
ounge | -0.406 |
thus | -0.388 |
UA | -0.387 |
ildo | -0.375 |
Token | 93 |
Token ID | 10261 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
practiced | +3.669 |
ounge | +3.591 |
thus | +3.396 |
UA | +3.395 |
ildo | +3.313 |
Neg logit contributions | |
Supplement | -3.174 |
appendix | -3.093 |
defences | -2.961 |
strang | -2.827 |
erald | -2.781 |
Token | . |
Token ID | 13 |
Feature activation | +6.36e-01 |
Pos logit contributions | |
Supplement | +0.893 |
appendix | +0.875 |
defences | +0.840 |
strang | +0.794 |
gard | +0.756 |
Neg logit contributions | |
practiced | -1.216 |
ounge | -1.201 |
thus | -1.150 |
UA | -1.145 |
ildo | -1.118 |
Token | 8 |
Token ID | 23 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
Supplement | +2.726 |
appendix | +2.687 |
defences | +2.478 |
strang | +2.388 |
gard | +2.316 |
Neg logit contributions | |
practiced | -4.021 |
ounge | -4.005 |
thus | -3.803 |
UA | -3.795 |
ildo | -3.751 |
Token | percent |
Token ID | 1411 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
Supplement | +0.730 |
appendix | +0.709 |
defences | +0.688 |
strang | +0.649 |
gard | +0.615 |
Neg logit contributions | |
practiced | -1.049 |
ounge | -1.032 |
thus | -0.993 |
UA | -0.987 |
ildo | -0.967 |
Token | as |
Token ID | 355 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
practiced | +1.133 |
ounge | +1.102 |
thus | +1.060 |
UA | +1.048 |
ildo | +1.022 |
Neg logit contributions | |
Supplement | -1.088 |
appendix | -1.078 |
defences | -1.032 |
strang | -0.991 |
gard | -0.957 |
Token | originally |
Token ID | 6198 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
practiced | +5.917 |
ounge | +5.516 |
UA | +5.297 |
thus | +5.244 |
ildo | +5.145 |
Neg logit contributions | |
Supplement | -5.257 |
appendix | -5.057 |
defences | -4.681 |
strang | -4.562 |
erald | -4.432 |
Token | estimated |
Token ID | 6108 |
Feature activation | -9.02e-01 |
Pos logit contributions | |
practiced | +7.566 |
ounge | +6.285 |
thus | +6.204 |
UA | +6.201 |
ildo | +5.985 |
Neg logit contributions | |
Supplement | -9.284 |
appendix | -8.880 |
defences | -8.473 |
erald | -8.276 |
strang | -8.176 |
Token | , |
Token ID | 11 |
Feature activation | -3.00e-02 |
Pos logit contributions | |
practiced | +4.439 |
ounge | +4.194 |
thus | +4.140 |
UA | +4.030 |
ildo | +3.923 |
Neg logit contributions | |
Supplement | -4.835 |
appendix | -4.752 |
defences | -4.519 |
strang | -4.469 |
erald | -4.258 |
Token | raising |
Token ID | 8620 |
Feature activation | +4.21e-01 |
Pos logit contributions | |
practiced | +0.170 |
ounge | +0.169 |
thus | +0.161 |
UA | +0.161 |
ildo | +0.157 |
Neg logit contributions | |
Supplement | -0.148 |
appendix | -0.147 |
defences | -0.140 |
strang | -0.134 |
gard | -0.130 |
Token | issues |
Token ID | 2428 |
Feature activation | +2.15e-01 |
Pos logit contributions | |
appendix | +1.698 |
Supplement | +1.686 |
defences | +1.602 |
strang | +1.515 |
gard | +1.468 |
Neg logit contributions | |
ounge | -2.760 |
practiced | -2.748 |
thus | -2.638 |
UA | -2.631 |
ildo | -2.592 |
Token | over |
Token ID | 625 |
Feature activation | +7.00e-01 |
Pos logit contributions | |
Supplement | +0.952 |
appendix | +0.948 |
defences | +0.890 |
strang | +0.851 |
gard | +0.822 |
Neg logit contributions | |
practiced | -1.325 |
ounge | -1.322 |
thus | -1.260 |
UA | -1.259 |
ildo | -1.238 |
Token | Moscow |
Token ID | 9070 |
Feature activation | -3.65e-01 |
Pos logit contributions | |
practiced | +0.102 |
ounge | +0.101 |
thus | +0.096 |
UA | +0.096 |
ildo | +0.094 |
Neg logit contributions | |
Supplement | -0.084 |
appendix | -0.083 |
defences | -0.078 |
strang | -0.075 |
gard | -0.073 |
Token | had |
Token ID | 550 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
practiced | +2.157 |
ounge | +2.070 |
thus | +1.987 |
UA | +1.969 |
ildo | +1.925 |
Neg logit contributions | |
Supplement | -1.752 |
appendix | -1.735 |
defences | -1.609 |
strang | -1.568 |
gard | -1.501 |
Token | a |
Token ID | 257 |
Feature activation | +3.23e-02 |
Pos logit contributions | |
practiced | +1.025 |
ounge | +0.984 |
thus | +0.933 |
UA | +0.927 |
ildo | +0.905 |
Neg logit contributions | |
Supplement | -0.911 |
appendix | -0.895 |
defences | -0.836 |
strang | -0.812 |
erald | -0.790 |
Token | long |
Token ID | 890 |
Feature activation | -6.18e-01 |
Pos logit contributions | |
Supplement | +0.145 |
appendix | +0.144 |
defences | +0.135 |
strang | +0.130 |
gard | +0.125 |
Neg logit contributions | |
practiced | -0.199 |
ounge | -0.197 |
thus | -0.188 |
UA | -0.187 |
ildo | -0.185 |
Token | way |
Token ID | 835 |
Feature activation | -6.28e-01 |
Pos logit contributions | |
practiced | +3.612 |
ounge | +3.520 |
thus | +3.337 |
UA | +3.292 |
ildo | +3.237 |
Neg logit contributions | |
Supplement | -2.927 |
appendix | -2.855 |
defences | -2.676 |
strang | -2.584 |
gard | -2.513 |
Token | to |
Token ID | 284 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
practiced | +2.831 |
ounge | +2.698 |
thus | +2.562 |
UA | +2.473 |
ildo | +2.392 |
Neg logit contributions | |
Supplement | -3.740 |
appendix | -3.726 |
strang | -3.432 |
defences | -3.431 |
erald | -3.389 |
Token | go |
Token ID | 467 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
practiced | +7.016 |
ounge | +6.405 |
thus | +6.399 |
ildo | +5.959 |
fray | +5.944 |
Neg logit contributions | |
Supplement | -9.374 |
appendix | -8.957 |
defences | -8.687 |
andestine | -8.481 |
strang | -8.271 |
Token | to |
Token ID | 284 |
Feature activation | -6.67e-01 |
Pos logit contributions | |
practiced | +4.979 |
ounge | +4.744 |
thus | +4.652 |
UA | +4.479 |
ildo | +4.365 |
Neg logit contributions | |
Supplement | -5.969 |
appendix | -5.917 |
strang | -5.473 |
defences | -5.470 |
erald | -5.238 |
Token | prove |
Token ID | 5879 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
practiced | +4.048 |
ounge | +3.949 |
thus | +3.767 |
ildo | +3.716 |
UA | +3.700 |
Neg logit contributions | |
Supplement | -2.971 |
appendix | -2.884 |
defences | -2.684 |
strang | -2.536 |
gard | -2.474 |
Token | its |
Token ID | 663 |
Feature activation | +8.82e-01 |
Pos logit contributions | |
Supplement | +0.695 |
appendix | +0.692 |
defences | +0.657 |
strang | +0.636 |
gard | +0.618 |
Neg logit contributions | |
practiced | -0.629 |
ounge | -0.624 |
thus | -0.589 |
UA | -0.587 |
ildo | -0.575 |
Token | intentions |
Token ID | 14953 |
Feature activation | -5.80e-02 |
Pos logit contributions | |
appendix | +3.772 |
Supplement | +3.756 |
defences | +3.647 |
strang | +3.441 |
gard | +3.270 |
Neg logit contributions | |
ounge | -5.458 |
practiced | -5.379 |
thus | -5.230 |
UA | -5.206 |
ildo | -5.184 |
Token | on |
Token ID | 319 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
practiced | +3.261 |
ounge | +3.175 |
UA | +3.046 |
thus | +3.042 |
ildo | +2.936 |
Neg logit contributions | |
Supplement | -2.847 |
appendix | -2.842 |
defences | -2.667 |
strang | -2.565 |
gard | -2.483 |
Token | the |
Token ID | 262 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
practiced | +2.449 |
ounge | +2.385 |
thus | +2.279 |
UA | +2.278 |
ildo | +2.194 |
Neg logit contributions | |
Supplement | -2.538 |
appendix | -2.524 |
defences | -2.390 |
strang | -2.299 |
gard | -2.246 |
Token | Warriors |
Token ID | 12090 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
practiced | +1.012 |
ounge | +1.006 |
thus | +0.955 |
UA | +0.954 |
ildo | +0.935 |
Neg logit contributions | |
Supplement | -0.884 |
appendix | -0.879 |
defences | -0.831 |
strang | -0.798 |
gard | -0.774 |
Token | ' |
Token ID | 6 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
Supplement | +0.795 |
appendix | +0.790 |
defences | +0.748 |
strang | +0.721 |
gard | +0.699 |
Neg logit contributions | |
ounge | -0.859 |
practiced | -0.858 |
thus | -0.813 |
UA | -0.809 |
ildo | -0.802 |
Token | official |
Token ID | 1743 |
Feature activation | -4.18e-01 |
Pos logit contributions | |
Supplement | +1.214 |
appendix | +1.213 |
defences | +1.153 |
strang | +1.116 |
gard | +1.075 |
Neg logit contributions | |
ounge | -1.357 |
practiced | -1.337 |
thus | -1.281 |
UA | -1.279 |
ildo | -1.277 |
Token | Facebook |
Token ID | 3203 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
practiced | +1.890 |
ounge | +1.865 |
thus | +1.755 |
UA | +1.751 |
ildo | +1.693 |
Neg logit contributions | |
Supplement | -2.547 |
appendix | -2.540 |
defences | -2.420 |
strang | -2.339 |
gard | -2.286 |
Token | page |
Token ID | 2443 |
Feature activation | -5.96e-01 |
Pos logit contributions | |
practiced | +6.870 |
ounge | +6.694 |
UA | +6.475 |
thus | +6.402 |
fray | +5.929 |
Neg logit contributions | |
appendix | -9.247 |
Supplement | -9.150 |
defences | -8.765 |
strang | -8.419 |
erald | -8.315 |
Token | . |
Token ID | 13 |
Feature activation | -5.50e-01 |
Pos logit contributions | |
practiced | +3.226 |
ounge | +3.175 |
thus | +3.054 |
UA | +3.010 |
ildo | +2.914 |
Neg logit contributions | |
Supplement | -3.074 |
appendix | -3.069 |
defences | -2.924 |
strang | -2.819 |
gard | -2.714 |
Token | The |
Token ID | 383 |
Feature activation | -6.31e-01 |
Pos logit contributions | |
practiced | +2.736 |
ounge | +2.729 |
thus | +2.615 |
UA | +2.596 |
ildo | +2.521 |
Neg logit contributions | |
appendix | -3.048 |
Supplement | -3.030 |
defences | -2.940 |
strang | -2.814 |
gard | -2.735 |
Token | program |
Token ID | 1430 |
Feature activation | -4.33e-01 |
Pos logit contributions | |
practiced | +3.313 |
ounge | +3.263 |
thus | +3.095 |
UA | +3.063 |
ildo | +2.975 |
Neg logit contributions | |
Supplement | -3.374 |
appendix | -3.327 |
defences | -3.170 |
strang | -3.021 |
gard | -2.965 |
Token | will |
Token ID | 481 |
Feature activation | -3.82e-01 |
Pos logit contributions | |
practiced | +2.527 |
ounge | +2.507 |
thus | +2.389 |
UA | +2.358 |
ildo | +2.298 |
Neg logit contributions | |
Supplement | -2.080 |
appendix | -2.044 |
defences | -1.960 |
strang | -1.872 |
gard | -1.808 |
Token | still |
Token ID | 991 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
Supplement | +0.309 |
appendix | +0.308 |
defences | +0.289 |
strang | +0.277 |
gard | +0.268 |
Neg logit contributions | |
practiced | -0.416 |
ounge | -0.414 |
thus | -0.395 |
UA | -0.394 |
ildo | -0.388 |
Token | have |
Token ID | 423 |
Feature activation | -3.40e-01 |
Pos logit contributions | |
practiced | +1.493 |
ounge | +1.464 |
thus | +1.402 |
UA | +1.394 |
ildo | +1.368 |
Neg logit contributions | |
Supplement | -1.051 |
appendix | -1.039 |
defences | -0.986 |
strang | -0.938 |
gard | -0.902 |
Token | a |
Token ID | 257 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
practiced | +2.018 |
ounge | +1.979 |
UA | +1.888 |
thus | +1.884 |
ildo | +1.837 |
Neg logit contributions | |
Supplement | -1.613 |
appendix | -1.587 |
defences | -1.499 |
strang | -1.434 |
gard | -1.393 |
Token | lot |
Token ID | 1256 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
practiced | +2.134 |
ounge | +2.084 |
thus | +1.985 |
UA | +1.979 |
ildo | +1.940 |
Neg logit contributions | |
Supplement | -1.970 |
appendix | -1.945 |
defences | -1.857 |
strang | -1.770 |
gard | -1.721 |
Token | more |
Token ID | 517 |
Feature activation | -7.74e-01 |
Pos logit contributions | |
practiced | +5.450 |
ounge | +5.053 |
UA | +4.994 |
thus | +4.688 |
ildo | +4.594 |
Neg logit contributions | |
Supplement | -5.331 |
appendix | -5.205 |
defences | -4.967 |
gard | -4.768 |
strang | -4.764 |
Token | to |
Token ID | 284 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
practiced | +3.929 |
ounge | +3.743 |
UA | +3.598 |
thus | +3.538 |
ildo | +3.423 |
Neg logit contributions | |
Supplement | -4.303 |
appendix | -4.188 |
defences | -3.951 |
strang | -3.831 |
gard | -3.754 |
Token | learn |
Token ID | 2193 |
Feature activation | -6.54e-01 |
Pos logit contributions | |
practiced | +7.478 |
ounge | +7.016 |
thus | +6.538 |
ildo | +6.483 |
UA | +6.467 |
Neg logit contributions | |
Supplement | -8.572 |
appendix | -8.328 |
defences | -8.244 |
andestine | -7.947 |
strang | -7.819 |
Token | ! |
Token ID | 0 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
practiced | +3.461 |
ounge | +3.356 |
thus | +3.226 |
UA | +3.203 |
ildo | +3.125 |
Neg logit contributions | |
Supplement | -3.435 |
appendix | -3.398 |
defences | -3.237 |
strang | -3.125 |
gard | -3.026 |
Token | I |
Token ID | 314 |
Feature activation | -7.56e-02 |
Pos logit contributions | |
practiced | +0.996 |
ounge | +0.992 |
thus | +0.941 |
UA | +0.940 |
ildo | +0.922 |
Neg logit contributions | |
Supplement | -0.932 |
appendix | -0.929 |
defences | -0.880 |
strang | -0.847 |
gard | -0.823 |
Token | hope |
Token ID | 2911 |
Feature activation | +2.94e-01 |
Pos logit contributions | |
practiced | +0.448 |
ounge | +0.444 |
thus | +0.423 |
UA | +0.422 |
ildo | +0.414 |
Neg logit contributions | |
Supplement | -0.357 |
appendix | -0.356 |
defences | -0.336 |
strang | -0.322 |
gard | -0.311 |
Token | to |
Token ID | 284 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
appendix | +1.440 |
Supplement | +1.438 |
defences | +1.352 |
strang | +1.305 |
gard | +1.266 |
Neg logit contributions | |
ounge | -1.676 |
practiced | -1.673 |
thus | -1.586 |
UA | -1.585 |
ildo | -1.557 |
Token | it |
Token ID | 340 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
practiced | +1.325 |
ounge | +1.317 |
UA | +1.251 |
thus | +1.251 |
ildo | +1.222 |
Neg logit contributions | |
Supplement | -1.165 |
appendix | -1.157 |
defences | -1.091 |
strang | -1.051 |
gard | -1.016 |
Token | look |
Token ID | 804 |
Feature activation | +5.30e-02 |
Pos logit contributions | |
practiced | +1.372 |
ounge | +1.362 |
thus | +1.299 |
UA | +1.292 |
ildo | +1.267 |
Neg logit contributions | |
Supplement | -1.168 |
appendix | -1.159 |
defences | -1.098 |
strang | -1.052 |
gard | -1.018 |
Token | the |
Token ID | 262 |
Feature activation | -8.64e-02 |
Pos logit contributions | |
Supplement | +0.231 |
appendix | +0.230 |
defences | +0.216 |
strang | +0.206 |
gard | +0.199 |
Neg logit contributions | |
practiced | -0.331 |
ounge | -0.331 |
thus | -0.315 |
UA | -0.315 |
ildo | -0.310 |
Token | best |
Token ID | 1266 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
practiced | +0.556 |
ounge | +0.551 |
thus | +0.528 |
UA | +0.525 |
ildo | +0.518 |
Neg logit contributions | |
Supplement | -0.366 |
appendix | -0.359 |
defences | -0.337 |
strang | -0.316 |
gard | -0.306 |
Token | it |
Token ID | 340 |
Feature activation | -9.89e-01 |
Pos logit contributions | |
appendix | +1.369 |
Supplement | +1.366 |
defences | +1.289 |
strang | +1.239 |
gard | +1.208 |
Neg logit contributions | |
ounge | -1.711 |
practiced | -1.699 |
thus | -1.619 |
UA | -1.617 |
ildo | -1.591 |
Token | can |
Token ID | 460 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
practiced | +6.259 |
ounge | +6.010 |
thus | +5.872 |
ildo | +5.698 |
UA | +5.670 |
Neg logit contributions | |
Supplement | -4.234 |
appendix | -4.120 |
defences | -3.726 |
strang | -3.592 |
erald | -3.383 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
practiced | +7.254 |
ounge | +7.229 |
thus | +7.106 |
ildo | +6.707 |
UA | +6.593 |
Neg logit contributions | |
Supplement | -8.660 |
appendix | -8.612 |
defences | -8.163 |
strang | -7.889 |
erald | -7.606 |
Token | This |
Token ID | 770 |
Feature activation | -9.72e-02 |
Pos logit contributions | |
practiced | +2.266 |
ounge | +2.264 |
UA | +2.175 |
thus | +2.172 |
ildo | +2.111 |
Neg logit contributions | |
appendix | -2.201 |
Supplement | -2.190 |
defences | -2.105 |
strang | -2.016 |
gard | -1.957 |
Token | is |
Token ID | 318 |
Feature activation | +2.08e-02 |
Pos logit contributions | |
practiced | +0.569 |
ounge | +0.565 |
thus | +0.539 |
UA | +0.539 |
ildo | +0.529 |
Neg logit contributions | |
Supplement | -0.465 |
appendix | -0.460 |
defences | -0.435 |
strang | -0.416 |
gard | -0.403 |
Token | one |
Token ID | 530 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
Supplement | +0.096 |
appendix | +0.096 |
defences | +0.090 |
strang | +0.087 |
gard | +0.084 |
Neg logit contributions | |
practiced | -0.125 |
ounge | -0.125 |
thus | -0.119 |
UA | -0.118 |
ildo | -0.116 |
Token | of |
Token ID | 286 |
Feature activation | -7.60e-03 |
Pos logit contributions | |
practiced | +0.210 |
ounge | +0.209 |
UA | +0.200 |
thus | +0.199 |
ildo | +0.196 |
Neg logit contributions | |
Supplement | -0.158 |
appendix | -0.156 |
defences | -0.148 |
strang | -0.141 |
gard | -0.136 |
Token | also |
Token ID | 635 |
Feature activation | -2.05e-01 |
Pos logit contributions | |
practiced | +2.120 |
ounge | +2.039 |
thus | +1.940 |
UA | +1.930 |
ildo | +1.882 |
Neg logit contributions | |
Supplement | -1.999 |
appendix | -1.976 |
defences | -1.859 |
strang | -1.787 |
gard | -1.735 |
Token | been |
Token ID | 587 |
Feature activation | -4.67e-01 |
Pos logit contributions | |
practiced | +1.222 |
ounge | +1.198 |
thus | +1.140 |
UA | +1.136 |
ildo | +1.115 |
Neg logit contributions | |
Supplement | -0.968 |
appendix | -0.961 |
defences | -0.903 |
strang | -0.864 |
gard | -0.836 |
Token | guilty |
Token ID | 6717 |
Feature activation | -3.28e-01 |
Pos logit contributions | |
practiced | +2.572 |
ounge | +2.483 |
thus | +2.354 |
UA | +2.349 |
ildo | +2.276 |
Neg logit contributions | |
Supplement | -2.436 |
appendix | -2.414 |
defences | -2.270 |
strang | -2.171 |
gard | -2.117 |
Token | of |
Token ID | 286 |
Feature activation | -4.33e-01 |
Pos logit contributions | |
practiced | +1.895 |
ounge | +1.869 |
UA | +1.769 |
thus | +1.762 |
ildo | +1.739 |
Neg logit contributions | |
Supplement | -1.592 |
appendix | -1.567 |
defences | -1.484 |
strang | -1.390 |
erald | -1.365 |
Token | sharing |
Token ID | 7373 |
Feature activation | -9.44e-01 |
Pos logit contributions | |
practiced | +2.385 |
ounge | +2.352 |
thus | +2.233 |
UA | +2.220 |
ildo | +2.183 |
Neg logit contributions | |
Supplement | -2.212 |
appendix | -2.195 |
defences | -2.068 |
strang | -1.968 |
gard | -1.924 |
Token | fake |
Token ID | 8390 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
practiced | +5.038 |
ounge | +4.811 |
thus | +4.562 |
UA | +4.546 |
ildo | +4.398 |
Neg logit contributions | |
Supplement | -4.812 |
appendix | -4.736 |
defences | -4.387 |
erald | -4.200 |
strang | -4.185 |
Token | news |
Token ID | 1705 |
Feature activation | -5.26e-01 |
Pos logit contributions | |
practiced | +5.363 |
ounge | +5.297 |
UA | +4.867 |
thus | +4.785 |
ildo | +4.693 |
Neg logit contributions | |
Supplement | -10.318 |
appendix | -9.865 |
defences | -9.366 |
erald | -8.931 |
strang | -8.913 |
Token | on |
Token ID | 319 |
Feature activation | -4.71e-01 |
Pos logit contributions | |
practiced | +3.042 |
ounge | +2.978 |
thus | +2.860 |
UA | +2.834 |
ildo | +2.784 |
Neg logit contributions | |
Supplement | -2.530 |
appendix | -2.487 |
defences | -2.329 |
strang | -2.214 |
gard | -2.168 |
Token | his |
Token ID | 465 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
practiced | +2.236 |
ounge | +2.196 |
thus | +2.071 |
UA | +2.054 |
ildo | +2.001 |
Neg logit contributions | |
Supplement | -2.758 |
appendix | -2.748 |
defences | -2.592 |
strang | -2.510 |
gard | -2.450 |
Token | Twitter |
Token ID | 3009 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
practiced | +1.460 |
ounge | +1.441 |
thus | +1.376 |
UA | +1.373 |
ildo | +1.334 |
Neg logit contributions | |
Supplement | -1.317 |
appendix | -1.304 |
defences | -1.226 |
strang | -1.180 |
gard | -1.139 |
Token | page |
Token ID | 2443 |
Feature activation | -6.68e-01 |
Pos logit contributions | |
practiced | +6.091 |
ounge | +6.014 |
thus | +5.619 |
UA | +5.604 |
ildo | +5.254 |
Neg logit contributions | |
appendix | -7.977 |
Supplement | -7.955 |
strang | -7.437 |
defences | -7.326 |
erald | -7.249 |
Token | it |
Token ID | 340 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
practiced | +4.828 |
ounge | +4.661 |
UA | +4.463 |
thus | +4.412 |
ildo | +4.349 |
Neg logit contributions | |
Supplement | -3.987 |
appendix | -3.885 |
defences | -3.526 |
erald | -3.429 |
strang | -3.413 |
Token | accused |
Token ID | 5371 |
Feature activation | +2.76e-01 |
Pos logit contributions | |
practiced | +0.930 |
ounge | +0.908 |
thus | +0.869 |
UA | +0.861 |
ildo | +0.851 |
Neg logit contributions | |
Supplement | -0.774 |
appendix | -0.767 |
defences | -0.721 |
strang | -0.691 |
gard | -0.667 |
Token | Kiev |
Token ID | 22761 |
Feature activation | -3.49e-02 |
Pos logit contributions | |
Supplement | +1.162 |
appendix | +1.157 |
defences | +1.085 |
strang | +1.035 |
gard | +0.997 |
Neg logit contributions | |
practiced | -1.761 |
ounge | -1.757 |
thus | -1.679 |
UA | -1.676 |
ildo | -1.649 |
Token | of |
Token ID | 286 |
Feature activation | +2.60e-02 |
Pos logit contributions | |
practiced | +0.206 |
ounge | +0.202 |
UA | +0.193 |
ildo | +0.189 |
thus | +0.189 |
Neg logit contributions | |
Supplement | -0.168 |
appendix | -0.167 |
defences | -0.153 |
strang | -0.148 |
erald | -0.145 |
Token | stealing |
Token ID | 16568 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
Supplement | +0.132 |
appendix | +0.132 |
defences | +0.124 |
strang | +0.119 |
gard | +0.116 |
Neg logit contributions | |
practiced | -0.145 |
ounge | -0.143 |
thus | -0.136 |
UA | -0.136 |
ildo | -0.134 |
Token | gas |
Token ID | 3623 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
practiced | +2.049 |
ounge | +1.995 |
UA | +1.895 |
thus | +1.892 |
ildo | +1.842 |
Neg logit contributions | |
Supplement | -2.152 |
appendix | -2.147 |
defences | -2.003 |
strang | -1.941 |
gard | -1.896 |
Token | meant |
Token ID | 4001 |
Feature activation | +3.02e-01 |
Pos logit contributions | |
practiced | +8.097 |
ounge | +7.505 |
thus | +7.235 |
UA | +7.199 |
ildo | +7.191 |
Neg logit contributions | |
appendix | -7.744 |
Supplement | -7.526 |
defences | -6.952 |
strang | -6.774 |
erald | -6.661 |
Token | for |
Token ID | 329 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
Supplement | +1.371 |
appendix | +1.348 |
defences | +1.277 |
strang | +1.194 |
gard | +1.172 |
Neg logit contributions | |
ounge | -1.854 |
practiced | -1.834 |
UA | -1.774 |
thus | -1.754 |
ildo | -1.711 |
Token | other |
Token ID | 584 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
Supplement | +1.993 |
appendix | +1.986 |
defences | +1.886 |
strang | +1.818 |
gard | +1.765 |
Neg logit contributions | |
practiced | -2.035 |
ounge | -2.028 |
thus | -1.921 |
UA | -1.921 |
ildo | -1.881 |
Token | European |
Token ID | 3427 |
Feature activation | +6.03e-02 |
Pos logit contributions | |
practiced | +1.423 |
ounge | +1.412 |
thus | +1.345 |
UA | +1.338 |
ildo | +1.322 |
Neg logit contributions | |
Supplement | -1.085 |
appendix | -1.063 |
defences | -0.987 |
strang | -0.943 |
gard | -0.921 |
Token | customers |
Token ID | 4297 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
Supplement | +0.273 |
appendix | +0.270 |
defences | +0.252 |
strang | +0.241 |
gard | +0.234 |
Neg logit contributions | |
practiced | -0.369 |
ounge | -0.368 |
thus | -0.351 |
UA | -0.350 |
ildo | -0.344 |
Token | 't |
Token ID | 470 |
Feature activation | -5.99e-01 |
Pos logit contributions | |
practiced | +3.822 |
ounge | +3.721 |
thus | +3.551 |
ildo | +3.440 |
UA | +3.385 |
Neg logit contributions | |
Supplement | -4.217 |
appendix | -4.151 |
defences | -4.020 |
strang | -3.791 |
gard | -3.676 |
Token | imagine |
Token ID | 5967 |
Feature activation | -6.44e-01 |
Pos logit contributions | |
practiced | +3.727 |
ounge | +3.661 |
thus | +3.514 |
UA | +3.438 |
ildo | +3.438 |
Neg logit contributions | |
Supplement | -2.649 |
appendix | -2.573 |
defences | -2.455 |
strang | -2.306 |
gard | -2.224 |
Token | how |
Token ID | 703 |
Feature activation | -4.53e-01 |
Pos logit contributions | |
practiced | +3.592 |
ounge | +3.505 |
thus | +3.368 |
UA | +3.292 |
ildo | +3.245 |
Neg logit contributions | |
Supplement | -3.243 |
appendix | -3.141 |
defences | -2.994 |
strang | -2.811 |
gard | -2.734 |
Token | hurt |
Token ID | 5938 |
Feature activation | -2.84e-01 |
Pos logit contributions | |
practiced | +2.674 |
ounge | +2.603 |
thus | +2.496 |
UA | +2.463 |
ildo | +2.434 |
Neg logit contributions | |
Supplement | -2.176 |
appendix | -2.119 |
defences | -1.992 |
strang | -1.880 |
gard | -1.829 |
Token | Barbara |
Token ID | 16685 |
Feature activation | -6.55e-01 |
Pos logit contributions | |
practiced | +1.616 |
ounge | +1.585 |
thus | +1.531 |
UA | +1.508 |
ildo | +1.491 |
Neg logit contributions | |
Supplement | -1.406 |
appendix | -1.383 |
defences | -1.312 |
strang | -1.260 |
gard | -1.221 |
Token | must |
Token ID | 1276 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
practiced | +3.746 |
ounge | +3.622 |
UA | +3.450 |
thus | +3.449 |
ildo | +3.338 |
Neg logit contributions | |
Supplement | -3.238 |
appendix | -3.145 |
defences | -2.989 |
strang | -2.856 |
gard | -2.765 |
Token | be |
Token ID | 307 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
practiced | +6.697 |
ounge | +6.532 |
tone | +5.945 |
thus | +5.877 |
fray | +5.862 |
Neg logit contributions | |
Supplement | -8.951 |
appendix | -8.568 |
defences | -8.332 |
strang | -7.833 |
andestine | -7.807 |
Token | to |
Token ID | 284 |
Feature activation | -2.03e-01 |
Pos logit contributions | |
practiced | +6.972 |
ounge | +6.531 |
thus | +6.377 |
apologizing | +6.112 |
UA | +6.095 |
Neg logit contributions | |
Supplement | -6.807 |
appendix | -6.721 |
defences | -6.326 |
strang | -6.000 |
erald | -5.932 |
Token | find |
Token ID | 1064 |
Feature activation | -3.80e-01 |
Pos logit contributions | |
practiced | +1.258 |
ounge | +1.252 |
thus | +1.195 |
UA | +1.193 |
ildo | +1.173 |
Neg logit contributions | |
Supplement | -0.897 |
appendix | -0.891 |
defences | -0.837 |
strang | -0.799 |
gard | -0.771 |
Token | that |
Token ID | 326 |
Feature activation | -4.75e-01 |
Pos logit contributions | |
practiced | +2.436 |
ounge | +2.391 |
thus | +2.315 |
UA | +2.288 |
ildo | +2.243 |
Neg logit contributions | |
Supplement | -1.614 |
appendix | -1.562 |
defences | -1.473 |
strang | -1.397 |
gard | -1.335 |
Token | out |
Token ID | 503 |
Feature activation | -4.63e-03 |
Pos logit contributions | |
practiced | +3.019 |
ounge | +2.938 |
thus | +2.839 |
UA | +2.798 |
ildo | +2.761 |
Neg logit contributions | |
Supplement | -2.053 |
appendix | -1.950 |
defences | -1.879 |
strang | -1.748 |
gard | -1.692 |
Token | , |
Token ID | 11 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
practiced | +0.901 |
ounge | +0.877 |
thus | +0.854 |
UA | +0.840 |
ildo | +0.814 |
Neg logit contributions | |
Supplement | -0.966 |
appendix | -0.959 |
defences | -0.914 |
strang | -0.874 |
gard | -0.845 |
Token | 2009 |
Token ID | 3717 |
Feature activation | -6.33e-01 |
Pos logit contributions | |
practiced | +0.177 |
ounge | +0.176 |
thus | +0.169 |
UA | +0.168 |
ildo | +0.166 |
Neg logit contributions | |
Supplement | -0.114 |
appendix | -0.114 |
defences | -0.106 |
strang | -0.101 |
gard | -0.098 |
Token | in |
Token ID | 287 |
Feature activation | -8.55e-02 |
Pos logit contributions | |
practiced | +3.207 |
ounge | +3.032 |
UA | +2.967 |
thus | +2.937 |
ildo | +2.811 |
Neg logit contributions | |
Supplement | -3.498 |
appendix | -3.452 |
defences | -3.292 |
strang | -3.187 |
quirks | -3.036 |
Token | Antioch |
Token ID | 46590 |
Feature activation | -9.12e-01 |
Pos logit contributions | |
practiced | +0.445 |
ounge | +0.441 |
thus | +0.418 |
UA | +0.415 |
ildo | +0.405 |
Neg logit contributions | |
Supplement | -0.466 |
appendix | -0.461 |
defences | -0.439 |
strang | -0.424 |
gard | -0.411 |
Token | , |
Token ID | 11 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
practiced | +4.371 |
ounge | +4.267 |
UA | +4.121 |
thus | +4.112 |
ildo | +3.927 |
Neg logit contributions | |
Supplement | -5.152 |
appendix | -5.130 |
defences | -4.927 |
strang | -4.750 |
gard | -4.506 |
Token | Calif |
Token ID | 3192 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
practiced | +1.629 |
ounge | +1.581 |
UA | +1.516 |
thus | +1.503 |
ildo | +1.459 |
Neg logit contributions | |
Supplement | -1.885 |
appendix | -1.871 |
defences | -1.789 |
strang | -1.726 |
gard | -1.678 |
Token | . |
Token ID | 13 |
Feature activation | -4.84e-01 |
Pos logit contributions | |
practiced | +5.628 |
UA | +5.515 |
ounge | +5.428 |
thus | +4.927 |
ildo | +4.770 |
Neg logit contributions | |
appendix | -9.651 |
Supplement | -9.624 |
defences | -9.131 |
strang | -8.852 |
quirks | -8.683 |
Token | Photo |
Token ID | 5555 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
practiced | +2.535 |
ounge | +2.493 |
UA | +2.395 |
thus | +2.379 |
ildo | +2.306 |
Neg logit contributions | |
appendix | -2.568 |
Supplement | -2.567 |
defences | -2.442 |
strang | -2.353 |
gard | -2.259 |
Token | : |
Token ID | 25 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
Supplement | +0.532 |
appendix | +0.530 |
defences | +0.502 |
strang | +0.481 |
gard | +0.464 |
Neg logit contributions | |
practiced | -0.629 |
ounge | -0.622 |
thus | -0.596 |
UA | -0.593 |
ildo | -0.581 |
Token | Justin |
Token ID | 10799 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
Supplement | +1.827 |
appendix | +1.820 |
defences | +1.711 |
strang | +1.653 |
gard | +1.607 |
Neg logit contributions | |
ounge | -2.079 |
practiced | -2.075 |
thus | -1.959 |
UA | -1.955 |
ildo | -1.926 |
Token | Sullivan |
Token ID | 18501 |
Feature activation | +6.62e-01 |
Pos logit contributions | |
practiced | +1.452 |
ounge | +1.442 |
thus | +1.369 |
UA | +1.365 |
ildo | +1.334 |
Neg logit contributions | |
Supplement | -1.448 |
appendix | -1.438 |
defences | -1.364 |
strang | -1.315 |
gard | -1.269 |
Token | his |
Token ID | 465 |
Feature activation | +9.22e-02 |
Pos logit contributions | |
practiced | +3.848 |
ounge | +3.698 |
UA | +3.579 |
thus | +3.576 |
ildo | +3.440 |
Neg logit contributions | |
Supplement | -3.653 |
appendix | -3.628 |
defences | -3.375 |
strang | -3.261 |
gard | -3.119 |
Token | dad |
Token ID | 9955 |
Feature activation | -3.08e-01 |
Pos logit contributions | |
Supplement | +0.399 |
appendix | +0.397 |
defences | +0.372 |
strang | +0.356 |
gard | +0.343 |
Neg logit contributions | |
practiced | -0.580 |
ounge | -0.579 |
thus | -0.552 |
UA | -0.551 |
ildo | -0.543 |
Token | � |
Token ID | 447 |
Feature activation | -3.32e-01 |
Pos logit contributions | |
practiced | +1.715 |
ounge | +1.680 |
UA | +1.634 |
thus | +1.613 |
ildo | +1.541 |
Neg logit contributions | |
appendix | -1.553 |
Supplement | -1.540 |
defences | -1.447 |
strang | -1.392 |
gard | -1.327 |
Token | � |
Token ID | 247 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
practiced | +1.785 |
ounge | +1.782 |
UA | +1.677 |
thus | +1.674 |
ildo | +1.655 |
Neg logit contributions | |
Supplement | -1.753 |
appendix | -1.738 |
defences | -1.651 |
strang | -1.586 |
gard | -1.541 |
Token | s |
Token ID | 82 |
Feature activation | -4.05e-01 |
Pos logit contributions | |
practiced | +1.431 |
ounge | +1.425 |
thus | +1.370 |
UA | +1.362 |
ildo | +1.326 |
Neg logit contributions | |
appendix | -1.149 |
Supplement | -1.141 |
defences | -1.080 |
strang | -1.030 |
gard | -0.992 |
Token | Twitter |
Token ID | 3009 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
practiced | +2.196 |
ounge | +2.133 |
UA | +2.065 |
thus | +2.044 |
ildo | +1.967 |
Neg logit contributions | |
Supplement | -2.119 |
appendix | -2.093 |
defences | -1.959 |
strang | -1.890 |
gard | -1.824 |
Token | page |
Token ID | 2443 |
Feature activation | -5.48e-01 |
Pos logit contributions | |
practiced | +6.945 |
ounge | +6.612 |
UA | +6.339 |
thus | +6.274 |
ildo | +5.987 |
Neg logit contributions | |
Supplement | -8.308 |
appendix | -8.303 |
strang | -7.674 |
defences | -7.671 |
erald | -7.479 |
Token | . |
Token ID | 13 |
Feature activation | -3.34e-01 |
Pos logit contributions | |
practiced | +2.795 |
ounge | +2.755 |
thus | +2.633 |
UA | +2.604 |
ildo | +2.510 |
Neg logit contributions | |
appendix | -2.987 |
Supplement | -2.966 |
defences | -2.830 |
strang | -2.744 |
gard | -2.625 |
Token |
|
Token ID | 198 |
Feature activation | -3.09e-01 |
Pos logit contributions | |
practiced | +1.769 |
ounge | +1.762 |
UA | +1.700 |
thus | +1.687 |
ildo | +1.643 |
Neg logit contributions | |
appendix | -1.759 |
Supplement | -1.734 |
defences | -1.684 |
strang | -1.607 |
gard | -1.539 |
Token |
|
Token ID | 198 |
Feature activation | -2.25e-01 |
Pos logit contributions | |
practiced | +1.801 |
ounge | +1.794 |
thus | +1.704 |
UA | +1.702 |
ildo | +1.673 |
Neg logit contributions | |
Supplement | -1.482 |
appendix | -1.474 |
defences | -1.388 |
strang | -1.333 |
gard | -1.292 |
Token | In |
Token ID | 818 |
Feature activation | -3.90e-01 |
Pos logit contributions | |
ounge | +1.148 |
practiced | +1.147 |
UA | +1.103 |
thus | +1.098 |
ildo | +1.060 |
Neg logit contributions | |
appendix | -1.230 |
Supplement | -1.208 |
defences | -1.175 |
strang | -1.132 |
gard | -1.093 |
Token | S |
Token ID | 50 |
Feature activation | +5.55e-02 |
Pos logit contributions | |
Supplement | +2.171 |
appendix | +2.000 |
defences | +1.786 |
strang | +1.762 |
Imm | +1.717 |
Neg logit contributions | |
practiced | -3.015 |
ounge | -2.981 |
anguage | -2.839 |
ildo | -2.778 |
thus | -2.745 |
Token | . |
Token ID | 13 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
Supplement | +0.318 |
appendix | +0.317 |
defences | +0.302 |
strang | +0.290 |
gard | +0.283 |
Neg logit contributions | |
practiced | -0.277 |
ounge | -0.273 |
UA | -0.259 |
thus | -0.252 |
ildo | -0.249 |
Token | government |
Token ID | 1230 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
Supplement | +0.674 |
appendix | +0.671 |
defences | +0.630 |
strang | +0.602 |
gard | +0.581 |
Neg logit contributions | |
practiced | -0.956 |
ounge | -0.953 |
thus | -0.909 |
UA | -0.908 |
ildo | -0.893 |
Token | worked |
Token ID | 3111 |
Feature activation | +4.06e-01 |
Pos logit contributions | |
Supplement | +0.466 |
appendix | +0.464 |
defences | +0.436 |
strang | +0.418 |
gard | +0.404 |
Neg logit contributions | |
practiced | -0.610 |
ounge | -0.606 |
thus | -0.577 |
UA | -0.576 |
ildo | -0.566 |
Token | with |
Token ID | 351 |
Feature activation | -3.42e-01 |
Pos logit contributions | |
Supplement | +1.999 |
appendix | +1.996 |
defences | +1.885 |
strang | +1.813 |
gard | +1.758 |
Neg logit contributions | |
ounge | -2.302 |
practiced | -2.298 |
UA | -2.183 |
thus | -2.180 |
ildo | -2.147 |
Token | Exxon |
Token ID | 27879 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
practiced | +1.866 |
ounge | +1.819 |
thus | +1.743 |
UA | +1.741 |
ildo | +1.695 |
Neg logit contributions | |
Supplement | -1.779 |
appendix | -1.763 |
defences | -1.671 |
strang | -1.596 |
gard | -1.552 |
Token | Mobil |
Token ID | 47100 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
practiced | +6.819 |
ounge | +6.413 |
thus | +6.282 |
UA | +6.201 |
ildo | +6.089 |
Neg logit contributions | |
appendix | -8.739 |
Supplement | -8.655 |
defences | -8.189 |
strang | -7.767 |
erald | -7.710 |
Token | and |
Token ID | 290 |
Feature activation | -1.61e-01 |
Pos logit contributions | |
practiced | +2.545 |
ounge | +2.514 |
UA | +2.394 |
thus | +2.392 |
ildo | +2.323 |
Neg logit contributions | |
appendix | -2.434 |
Supplement | -2.427 |
defences | -2.291 |
strang | -2.185 |
gard | -2.144 |
Token | Chevron |
Token ID | 50083 |
Feature activation | -9.25e-01 |
Pos logit contributions | |
practiced | +0.873 |
ounge | +0.864 |
UA | +0.821 |
thus | +0.821 |
ildo | +0.802 |
Neg logit contributions | |
Supplement | -0.845 |
appendix | -0.840 |
defences | -0.797 |
strang | -0.767 |
gard | -0.744 |
Token | , |
Token ID | 11 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
practiced | +4.740 |
ounge | +4.595 |
UA | +4.458 |
thus | +4.398 |
ildo | +4.229 |
Neg logit contributions | |
appendix | -4.999 |
Supplement | -4.866 |
defences | -4.690 |
strang | -4.458 |
gard | -4.401 |
Token | the |
Token ID | 262 |
Feature activation | -6.07e-02 |
Pos logit contributions | |
practiced | +1.167 |
ounge | +1.153 |
thus | +1.100 |
UA | +1.097 |
ildo | +1.071 |
Neg logit contributions | |
Supplement | -1.010 |
appendix | -1.006 |
defences | -0.952 |
strang | -0.906 |
gard | -0.882 |
Token | ans |
Token ID | 504 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
practiced | +1.223 |
ounge | +1.221 |
thus | +1.172 |
UA | +1.168 |
ildo | +1.151 |
Neg logit contributions | |
Supplement | -0.657 |
appendix | -0.653 |
defences | -0.605 |
strang | -0.574 |
gard | -0.550 |
Token | were |
Token ID | 547 |
Feature activation | +5.44e-01 |
Pos logit contributions | |
Supplement | +1.279 |
appendix | +1.276 |
defences | +1.196 |
strang | +1.145 |
gard | +1.105 |
Neg logit contributions | |
ounge | -1.766 |
practiced | -1.755 |
UA | -1.684 |
thus | -1.676 |
ildo | -1.653 |
Token | gradually |
Token ID | 11835 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
appendix | +2.608 |
Supplement | +2.584 |
defences | +2.463 |
strang | +2.379 |
gard | +2.293 |
Neg logit contributions | |
ounge | -3.132 |
practiced | -3.070 |
UA | -2.982 |
thus | -2.964 |
ildo | -2.946 |
Token | merged |
Token ID | 23791 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
Supplement | +1.807 |
appendix | +1.802 |
defences | +1.722 |
strang | +1.670 |
gard | +1.630 |
Neg logit contributions | |
practiced | -1.333 |
ounge | -1.333 |
thus | -1.247 |
UA | -1.247 |
ildo | -1.217 |
Token | into |
Token ID | 656 |
Feature activation | +5.21e-01 |
Pos logit contributions | |
Supplement | +0.660 |
appendix | +0.654 |
defences | +0.622 |
strang | +0.597 |
gard | +0.582 |
Neg logit contributions | |
practiced | -0.629 |
ounge | -0.626 |
thus | -0.596 |
UA | -0.588 |
ildo | -0.578 |
Token | an |
Token ID | 281 |
Feature activation | +9.66e-01 |
Pos logit contributions | |
Supplement | +2.404 |
appendix | +2.383 |
defences | +2.242 |
strang | +2.151 |
gard | +2.077 |
Neg logit contributions | |
practiced | -3.147 |
ounge | -3.126 |
thus | -2.982 |
UA | -2.972 |
ildo | -2.922 |
Token | all |
Token ID | 477 |
Feature activation | +4.38e-01 |
Pos logit contributions | |
appendix | +4.590 |
Supplement | +4.373 |
defences | +4.141 |
strang | +4.018 |
gard | +3.838 |
Neg logit contributions | |
ounge | -5.581 |
practiced | -5.555 |
UA | -5.422 |
thus | -5.313 |
ildo | -5.232 |
Token | - |
Token ID | 12 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
Supplement | +1.696 |
appendix | +1.692 |
defences | +1.554 |
strang | +1.479 |
gard | +1.432 |
Neg logit contributions | |
ounge | -2.947 |
practiced | -2.916 |
UA | -2.794 |
thus | -2.763 |
ildo | -2.736 |
Token | en |
Token ID | 268 |
Feature activation | +4.92e-01 |
Pos logit contributions | |
Supplement | +0.698 |
appendix | +0.682 |
defences | +0.611 |
strang | +0.570 |
gard | +0.550 |
Neg logit contributions | |
practiced | -1.404 |
ounge | -1.392 |
UA | -1.340 |
ildo | -1.323 |
thus | -1.304 |
Token | comp |
Token ID | 5589 |
Feature activation | -6.61e-01 |
Pos logit contributions | |
Supplement | +2.022 |
appendix | +1.965 |
defences | +1.710 |
gard | +1.691 |
strang | +1.620 |
Neg logit contributions | |
practiced | -3.240 |
ounge | -3.214 |
UA | -3.173 |
ildo | -3.002 |
anguage | -2.955 |
Token | assing |
Token ID | 19696 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
practiced | +2.813 |
ounge | +2.793 |
thus | +2.656 |
UA | +2.575 |
ildo | +2.559 |
Neg logit contributions | |
Supplement | -4.136 |
appendix | -4.116 |
defences | -4.020 |
strang | -3.875 |
gard | -3.782 |
Token | : |
Token ID | 25 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
appendix | +3.667 |
Supplement | +3.666 |
defences | +3.444 |
strang | +3.334 |
gard | +3.239 |
Neg logit contributions | |
ounge | -5.364 |
practiced | -5.281 |
ildo | -5.105 |
thus | -5.095 |
UA | -5.063 |
Token | What |
Token ID | 1867 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
appendix | +2.033 |
Supplement | +2.026 |
defences | +1.929 |
strang | +1.871 |
gard | +1.830 |
Neg logit contributions | |
ounge | -1.856 |
practiced | -1.838 |
UA | -1.751 |
thus | -1.734 |
ildo | -1.719 |
Token | really |
Token ID | 1107 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
appendix | +4.688 |
Supplement | +4.469 |
defences | +4.359 |
strang | +4.158 |
gard | +4.088 |
Neg logit contributions | |
ounge | -7.374 |
practiced | -6.986 |
UA | -6.943 |
ildo | -6.907 |
thus | -6.906 |
Token | plays |
Token ID | 5341 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
Supplement | +0.629 |
appendix | +0.624 |
defences | +0.587 |
strang | +0.563 |
gard | +0.544 |
Neg logit contributions | |
practiced | -0.817 |
ounge | -0.812 |
thus | -0.774 |
UA | -0.772 |
ildo | -0.759 |
Token | is |
Token ID | 318 |
Feature activation | +5.84e-01 |
Pos logit contributions | |
practiced | +0.977 |
ounge | +0.947 |
thus | +0.913 |
UA | +0.903 |
ildo | +0.889 |
Neg logit contributions | |
Supplement | -0.801 |
appendix | -0.781 |
defences | -0.732 |
strang | -0.701 |
gard | -0.678 |
Token | what |
Token ID | 644 |
Feature activation | +9.98e-01 |
Pos logit contributions | |
appendix | +2.716 |
Supplement | +2.676 |
defences | +2.551 |
strang | +2.466 |
gard | +2.384 |
Neg logit contributions | |
ounge | -3.454 |
practiced | -3.393 |
UA | -3.301 |
thus | -3.267 |
ildo | -3.265 |
Token | one |
Token ID | 530 |
Feature activation | +5.46e-01 |
Pos logit contributions | |
appendix | +4.212 |
Supplement | +4.069 |
defences | +3.939 |
strang | +3.791 |
gard | +3.703 |
Neg logit contributions | |
ounge | -6.251 |
practiced | -5.958 |
ildo | -5.927 |
UA | -5.870 |
thus | -5.866 |
Token | Mont |
Token ID | 5575 |
Feature activation | +9.45e-02 |
Pos logit contributions | |
appendix | +2.465 |
Supplement | +2.406 |
defences | +2.267 |
strang | +2.194 |
gard | +2.163 |
Neg logit contributions | |
ounge | -3.333 |
practiced | -3.284 |
thus | -3.177 |
UA | -3.172 |
ildo | -3.143 |
Token | anan |
Token ID | 27870 |
Feature activation | +3.62e-01 |
Pos logit contributions | |
Supplement | +0.548 |
appendix | +0.546 |
defences | +0.520 |
strang | +0.503 |
gard | +0.491 |
Neg logit contributions | |
practiced | -0.455 |
ounge | -0.453 |
thus | -0.426 |
UA | -0.425 |
ildo | -0.416 |
Token | says |
Token ID | 1139 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
appendix | +1.583 |
Supplement | +1.571 |
defences | +1.463 |
strang | +1.409 |
gard | +1.387 |
Neg logit contributions | |
ounge | -2.234 |
practiced | -2.227 |
UA | -2.136 |
thus | -2.120 |
ildo | -2.100 |
Token | to |
Token ID | 284 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
practiced | +1.646 |
ounge | +1.611 |
thus | +1.543 |
UA | +1.535 |
ildo | +1.492 |
Neg logit contributions | |
Supplement | -1.420 |
appendix | -1.385 |
defences | -1.310 |
strang | -1.248 |
gard | -1.203 |
Token | slowly |
Token ID | 6364 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
practiced | +3.646 |
ounge | +3.420 |
thus | +3.291 |
UA | +3.204 |
ildo | +3.049 |
Neg logit contributions | |
Supplement | -5.017 |
appendix | -4.926 |
defences | -4.710 |
strang | -4.431 |
erald | -4.394 |
Token | . |
Token ID | 13 |
Feature activation | -4.65e-02 |
Pos logit contributions | |
Supplement | +0.860 |
appendix | +0.856 |
defences | +0.811 |
strang | +0.782 |
gard | +0.756 |
Neg logit contributions | |
ounge | -0.986 |
practiced | -0.984 |
UA | -0.937 |
thus | -0.932 |
ildo | -0.920 |
Token | ( |
Token ID | 357 |
Feature activation | -8.93e-01 |
Pos logit contributions | |
practiced | +0.250 |
ounge | +0.249 |
UA | +0.235 |
thus | +0.235 |
ildo | +0.231 |
Neg logit contributions | |
Supplement | -0.245 |
appendix | -0.243 |
defences | -0.230 |
strang | -0.223 |
gard | -0.216 |
Token | At |
Token ID | 2953 |
Feature activation | -2.50e-01 |
Pos logit contributions | |
practiced | +4.140 |
ounge | +4.100 |
thus | +4.092 |
UA | +4.019 |
ildo | +3.734 |
Neg logit contributions | |
appendix | -5.094 |
defences | -4.965 |
Supplement | -4.849 |
strang | -4.750 |
gard | -4.647 |
Token | this |
Token ID | 428 |
Feature activation | +6.70e-01 |
Pos logit contributions | |
practiced | +1.374 |
ounge | +1.360 |
thus | +1.299 |
UA | +1.284 |
ildo | +1.257 |
Neg logit contributions | |
Supplement | -1.279 |
appendix | -1.263 |
defences | -1.204 |
strang | -1.146 |
gard | -1.119 |
Token | point |
Token ID | 966 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
appendix | +2.625 |
Supplement | +2.585 |
defences | +2.417 |
strang | +2.348 |
gard | +2.237 |
Neg logit contributions | |
ounge | -4.466 |
practiced | -4.430 |
UA | -4.288 |
thus | -4.260 |
ildo | -4.239 |
Token | Anders |
Token ID | 25519 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
appendix | +4.468 |
Supplement | +4.367 |
defences | +4.184 |
strang | +4.094 |
gard | +3.963 |
Neg logit contributions | |
ounge | -6.425 |
practiced | -6.232 |
UA | -6.156 |
ildo | -6.078 |
thus | -5.974 |
Token | recommends |
Token ID | 20829 |
Feature activation | -4.48e-01 |
Pos logit contributions | |
Supplement | +0.582 |
appendix | +0.580 |
defences | +0.544 |
strang | +0.521 |
gard | +0.503 |
Neg logit contributions | |
practiced | -0.806 |
ounge | -0.804 |
thus | -0.766 |
UA | -0.766 |
ildo | -0.753 |
Token | celebrating |
Token ID | 17499 |
Feature activation | +3.72e-01 |
Pos logit contributions | |
practiced | +2.513 |
ounge | +2.441 |
thus | +2.335 |
UA | +2.288 |
ildo | +2.241 |
Neg logit contributions | |
Supplement | -2.240 |
appendix | -2.201 |
defences | -2.094 |
strang | -1.989 |
erald | -1.945 |
Token | with |
Token ID | 351 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
appendix | +1.737 |
Supplement | +1.731 |
defences | +1.634 |
strang | +1.575 |
gard | +1.527 |
Neg logit contributions | |
ounge | -2.206 |
practiced | -2.194 |
UA | -2.088 |
thus | -2.082 |
ildo | -2.063 |
Token | a |
Token ID | 257 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
appendix | +1.203 |
Supplement | +1.202 |
defences | +1.131 |
strang | +1.088 |
gard | +1.053 |
Neg logit contributions | |
ounge | -1.556 |
practiced | -1.550 |
UA | -1.478 |
thus | -1.476 |
ildo | -1.453 |
Token | Ent |
Token ID | 14539 |
Feature activation | +6.80e-01 |
Pos logit contributions | |
Supplement | +1.693 |
appendix | +1.683 |
defences | +1.585 |
strang | +1.526 |
gard | +1.480 |
Neg logit contributions | |
practiced | -1.879 |
ounge | -1.853 |
thus | -1.766 |
UA | -1.744 |
ildo | -1.727 |
Token | rem |
Token ID | 2787 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
Supplement | +3.746 |
appendix | +3.730 |
defences | +3.480 |
strang | +3.427 |
gard | +3.384 |
Neg logit contributions | |
practiced | -3.431 |
ounge | -3.288 |
UA | -3.150 |
thus | -3.101 |
ildo | -2.995 |
Token | ont |
Token ID | 756 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
practiced | +0.125 |
ounge | +0.125 |
UA | +0.116 |
thus | +0.116 |
ildo | +0.113 |
Neg logit contributions | |
Supplement | -0.205 |
appendix | -0.204 |
defences | -0.196 |
strang | -0.190 |
gard | -0.186 |
Token | calls |
Token ID | 3848 |
Feature activation | -3.76e-01 |
Pos logit contributions | |
appendix | +2.479 |
Supplement | +2.461 |
defences | +2.319 |
strang | +2.218 |
gard | +2.197 |
Neg logit contributions | |
ounge | -3.062 |
practiced | -3.042 |
thus | -2.894 |
UA | -2.885 |
ildo | -2.828 |
Token | for |
Token ID | 329 |
Feature activation | -5.39e-01 |
Pos logit contributions | |
practiced | +2.079 |
ounge | +2.051 |
UA | +1.960 |
thus | +1.923 |
ildo | +1.917 |
Neg logit contributions | |
Supplement | -1.882 |
appendix | -1.853 |
defences | -1.766 |
strang | -1.721 |
gard | -1.620 |
Token | bilingual |
Token ID | 48116 |
Feature activation | +9.33e-01 |
Pos logit contributions | |
practiced | +3.268 |
ounge | +3.190 |
UA | +3.048 |
thus | +3.014 |
ildo | +2.968 |
Neg logit contributions | |
Supplement | -2.410 |
appendix | -2.373 |
defences | -2.216 |
strang | -2.173 |
gard | -2.028 |
Token | ism |
Token ID | 1042 |
Feature activation | +2.80e-01 |
Pos logit contributions | |
appendix | +4.038 |
Supplement | +3.937 |
defences | +3.864 |
gard | +3.575 |
strang | +3.570 |
Neg logit contributions | |
ounge | -5.685 |
practiced | -5.611 |
UA | -5.477 |
thus | -5.464 |
ildo | -5.389 |
Token | to |
Token ID | 284 |
Feature activation | -4.15e-01 |
Pos logit contributions | |
appendix | +1.293 |
Supplement | +1.293 |
defences | +1.226 |
strang | +1.154 |
gard | +1.136 |
Neg logit contributions | |
ounge | -1.681 |
practiced | -1.652 |
thus | -1.595 |
UA | -1.591 |
ildo | -1.573 |
Token | be |
Token ID | 307 |
Feature activation | +7.42e-02 |
Pos logit contributions | |
practiced | +2.158 |
ounge | +2.121 |
thus | +2.007 |
UA | +1.995 |
ildo | +1.966 |
Neg logit contributions | |
Supplement | -2.234 |
appendix | -2.214 |
defences | -2.099 |
strang | -2.035 |
gard | -1.957 |
Token | a |
Token ID | 257 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
Supplement | +0.326 |
appendix | +0.324 |
defences | +0.304 |
strang | +0.290 |
gard | +0.281 |
Neg logit contributions | |
practiced | -0.461 |
ounge | -0.461 |
thus | -0.440 |
UA | -0.439 |
ildo | -0.432 |
Token | requirement |
Token ID | 9079 |
Feature activation | -3.52e-01 |
Pos logit contributions | |
appendix | +0.955 |
Supplement | +0.945 |
defences | +0.882 |
strang | +0.834 |
gard | +0.815 |
Neg logit contributions | |
ounge | -1.652 |
practiced | -1.633 |
thus | -1.581 |
UA | -1.580 |
ildo | -1.554 |
Token | of |
Token ID | 286 |
Feature activation | +7.91e-02 |
Pos logit contributions | |
appendix | +2.978 |
Supplement | +2.914 |
defences | +2.785 |
strang | +2.678 |
gard | +2.620 |
Neg logit contributions | |
ounge | -4.884 |
practiced | -4.814 |
thus | -4.674 |
UA | -4.571 |
ildo | -4.567 |
Token | us |
Token ID | 514 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
Supplement | +0.369 |
appendix | +0.368 |
defences | +0.347 |
strang | +0.333 |
gard | +0.323 |
Neg logit contributions | |
practiced | -0.470 |
ounge | -0.470 |
thus | -0.447 |
UA | -0.445 |
ildo | -0.438 |
Token | , |
Token ID | 11 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
Supplement | +1.084 |
appendix | +1.081 |
defences | +1.022 |
strang | +0.985 |
gard | +0.959 |
Neg logit contributions | |
ounge | -1.243 |
practiced | -1.236 |
UA | -1.174 |
thus | -1.173 |
ildo | -1.155 |
Token | � |
Token ID | 447 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
Supplement | +1.127 |
appendix | +1.126 |
defences | +1.056 |
strang | +1.021 |
gard | +0.989 |
Neg logit contributions | |
ounge | -1.523 |
practiced | -1.515 |
thus | -1.449 |
UA | -1.447 |
ildo | -1.426 |
Token | � |
Token ID | 251 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
practiced | +0.517 |
ounge | +0.511 |
thus | +0.478 |
UA | +0.476 |
ildo | +0.462 |
Neg logit contributions | |
Supplement | -0.826 |
appendix | -0.824 |
defences | -0.791 |
strang | -0.767 |
gard | -0.749 |
Token | C |
Token ID | 327 |
Feature activation | +9.34e-01 |
Pos logit contributions | |
Supplement | +1.367 |
appendix | +1.361 |
defences | +1.288 |
strang | +1.242 |
gard | +1.207 |
Neg logit contributions | |
practiced | -1.452 |
ounge | -1.449 |
thus | -1.370 |
UA | -1.369 |
ildo | -1.345 |
Token | ray |
Token ID | 2433 |
Feature activation | -7.41e-02 |
Pos logit contributions | |
Supplement | +5.216 |
appendix | +4.923 |
erald | +4.765 |
defences | +4.609 |
gard | +4.544 |
Neg logit contributions | |
practiced | -4.377 |
ounge | -4.312 |
�� | -4.138 |
UA | -4.015 |
ildo | -4.001 |
Token | said |
Token ID | 531 |
Feature activation | -4.17e-03 |
Pos logit contributions | |
practiced | +0.439 |
ounge | +0.429 |
thus | +0.414 |
UA | +0.412 |
ildo | +0.402 |
Neg logit contributions | |
Supplement | -0.352 |
appendix | -0.352 |
defences | -0.336 |
strang | -0.317 |
gard | -0.305 |
Token | . |
Token ID | 13 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
practiced | +0.022 |
ounge | +0.021 |
thus | +0.020 |
UA | +0.020 |
ildo | +0.020 |
Neg logit contributions | |
Supplement | -0.023 |
appendix | -0.023 |
defences | -0.022 |
strang | -0.021 |
gard | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | +1.32e-02 |
Pos logit contributions | |
practiced | +1.548 |
ounge | +1.539 |
thus | +1.476 |
UA | +1.473 |
ildo | +1.432 |
Neg logit contributions | |
appendix | -1.507 |
Supplement | -1.496 |
defences | -1.453 |
strang | -1.381 |
gard | -1.327 |
Token |
|
Token ID | 198 |
Feature activation | +6.00e-02 |
Pos logit contributions | |
Supplement | +0.060 |
appendix | +0.059 |
defences | +0.054 |
strang | +0.052 |
gard | +0.051 |
Neg logit contributions | |
practiced | -0.081 |
ounge | -0.081 |
UA | -0.076 |
thus | -0.076 |
ildo | -0.076 |
Token | never |
Token ID | 1239 |
Feature activation | -4.01e-01 |
Pos logit contributions | |
Supplement | +0.086 |
appendix | +0.086 |
defences | +0.081 |
strang | +0.078 |
gard | +0.076 |
Neg logit contributions | |
practiced | -0.106 |
ounge | -0.105 |
thus | -0.100 |
UA | -0.100 |
ildo | -0.098 |
Token | heard |
Token ID | 2982 |
Feature activation | -6.08e-01 |
Pos logit contributions | |
practiced | +2.256 |
ounge | +2.168 |
thus | +2.060 |
UA | +2.042 |
ildo | +1.998 |
Neg logit contributions | |
Supplement | -2.069 |
appendix | -2.037 |
defences | -1.956 |
strang | -1.863 |
erald | -1.798 |
Token | of |
Token ID | 286 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
practiced | +3.490 |
ounge | +3.425 |
UA | +3.264 |
ildo | +3.185 |
thus | +3.173 |
Neg logit contributions | |
Supplement | -2.956 |
appendix | -2.865 |
defences | -2.760 |
strang | -2.629 |
erald | -2.569 |
Token | the |
Token ID | 262 |
Feature activation | -5.19e-02 |
Pos logit contributions | |
practiced | +1.091 |
ounge | +1.082 |
thus | +1.017 |
UA | +1.016 |
ildo | +0.991 |
Neg logit contributions | |
Supplement | -1.321 |
appendix | -1.312 |
defences | -1.255 |
strang | -1.212 |
gard | -1.178 |
Token | book |
Token ID | 1492 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
practiced | +0.305 |
ounge | +0.304 |
thus | +0.289 |
UA | +0.289 |
ildo | +0.284 |
Neg logit contributions | |
Supplement | -0.245 |
appendix | -0.245 |
defences | -0.230 |
strang | -0.221 |
gard | -0.214 |
Token | or |
Token ID | 393 |
Feature activation | +7.29e-01 |
Pos logit contributions | |
Supplement | +0.982 |
appendix | +0.980 |
defences | +0.925 |
strang | +0.890 |
gard | +0.865 |
Neg logit contributions | |
practiced | -1.098 |
ounge | -1.096 |
thus | -1.040 |
UA | -1.039 |
ildo | -1.020 |
Token | author |
Token ID | 1772 |
Feature activation | +5.29e-01 |
Pos logit contributions | |
appendix | +3.539 |
Supplement | +3.440 |
defences | +3.207 |
gard | +3.143 |
strang | +3.127 |
Neg logit contributions | |
ounge | -4.117 |
thus | -3.940 |
UA | -3.930 |
ildo | -3.924 |
practiced | -3.916 |
Token | . |
Token ID | 13 |
Feature activation | +4.89e-01 |
Pos logit contributions | |
appendix | +2.578 |
Supplement | +2.576 |
defences | +2.419 |
strang | +2.326 |
gard | +2.274 |
Neg logit contributions | |
ounge | -2.994 |
practiced | -2.984 |
thus | -2.848 |
UA | -2.836 |
ildo | -2.804 |
Token |
|
Token ID | 198 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
Supplement | +2.485 |
appendix | +2.441 |
defences | +2.259 |
strang | +2.219 |
gard | +2.163 |
Neg logit contributions | |
practiced | -2.709 |
ounge | -2.697 |
UA | -2.512 |
thus | -2.511 |
ildo | -2.486 |
Token |
|
Token ID | 198 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
Supplement | +0.606 |
appendix | +0.585 |
defences | +0.533 |
strang | +0.513 |
gard | +0.498 |
Neg logit contributions | |
practiced | -0.869 |
ounge | -0.868 |
UA | -0.809 |
anguage | -0.808 |
ildo | -0.807 |
Token | Those |
Token ID | 9627 |
Feature activation | -3.40e-01 |
Pos logit contributions | |
Supplement | +0.603 |
appendix | +0.588 |
defences | +0.552 |
strang | +0.532 |
gard | +0.518 |
Neg logit contributions | |
practiced | -0.653 |
ounge | -0.647 |
thus | -0.608 |
UA | -0.605 |
ildo | -0.602 |
Token | the |
Token ID | 262 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
practiced | +0.524 |
ounge | +0.519 |
thus | +0.495 |
UA | +0.495 |
ildo | +0.485 |
Neg logit contributions | |
Supplement | -0.420 |
appendix | -0.418 |
defences | -0.393 |
strang | -0.376 |
gard | -0.365 |
Token | prison |
Token ID | 3770 |
Feature activation | -7.46e-01 |
Pos logit contributions | |
practiced | +3.199 |
ounge | +3.119 |
thus | +2.992 |
UA | +2.969 |
ildo | +2.914 |
Neg logit contributions | |
Supplement | -2.838 |
appendix | -2.767 |
defences | -2.609 |
strang | -2.501 |
gard | -2.431 |
Token | closed |
Token ID | 4838 |
Feature activation | +1.92e-02 |
Pos logit contributions | |
practiced | +4.363 |
ounge | +4.176 |
thus | +3.984 |
UA | +3.943 |
ildo | +3.921 |
Neg logit contributions | |
Supplement | -3.610 |
appendix | -3.526 |
defences | -3.294 |
strang | -3.158 |
gard | -3.069 |
Token | . |
Token ID | 13 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
Supplement | +0.098 |
appendix | +0.097 |
defences | +0.092 |
strang | +0.089 |
gard | +0.086 |
Neg logit contributions | |
practiced | -0.106 |
ounge | -0.106 |
thus | -0.101 |
UA | -0.101 |
ildo | -0.099 |
Token | His |
Token ID | 2399 |
Feature activation | -4.82e-01 |
Pos logit contributions | |
practiced | +0.721 |
ounge | +0.716 |
thus | +0.682 |
UA | +0.681 |
ildo | +0.667 |
Neg logit contributions | |
Supplement | -0.670 |
appendix | -0.669 |
defences | -0.637 |
strang | -0.610 |
gard | -0.591 |
Token | son |
Token ID | 3367 |
Feature activation | -9.84e-03 |
Pos logit contributions | |
practiced | +2.618 |
ounge | +2.540 |
UA | +2.445 |
thus | +2.442 |
ildo | +2.362 |
Neg logit contributions | |
Supplement | -2.505 |
appendix | -2.424 |
defences | -2.340 |
strang | -2.222 |
gard | -2.157 |
Token | , |
Token ID | 11 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
ounge | +0.055 |
practiced | +0.055 |
thus | +0.052 |
UA | +0.052 |
ildo | +0.051 |
Neg logit contributions | |
Supplement | -0.049 |
appendix | -0.049 |
defences | -0.046 |
strang | -0.045 |
gard | -0.043 |
Token | Dev |
Token ID | 6245 |
Feature activation | +5.83e-01 |
Pos logit contributions | |
appendix | +0.814 |
Supplement | +0.813 |
defences | +0.768 |
strang | +0.742 |
gard | +0.723 |
Neg logit contributions | |
ounge | -0.896 |
practiced | -0.894 |
UA | -0.847 |
thus | -0.847 |
ildo | -0.833 |
Token | ik |
Token ID | 1134 |
Feature activation | +3.66e-02 |
Pos logit contributions | |
Supplement | +3.575 |
appendix | +3.558 |
defences | +3.397 |
strang | +3.298 |
gard | +3.245 |
Neg logit contributions | |
ounge | -2.535 |
practiced | -2.529 |
UA | -2.394 |
thus | -2.359 |
ildo | -2.284 |
Token | , |
Token ID | 11 |
Feature activation | -3.55e-01 |
Pos logit contributions | |
Supplement | +0.192 |
appendix | +0.191 |
defences | +0.181 |
strang | +0.174 |
gard | +0.169 |
Neg logit contributions | |
practiced | -0.197 |
ounge | -0.196 |
thus | -0.186 |
UA | -0.186 |
ildo | -0.182 |
Token | red |
Token ID | 2266 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
practiced | +2.049 |
ounge | +1.995 |
UA | +1.908 |
thus | +1.907 |
ildo | +1.859 |
Neg logit contributions | |
Supplement | -1.749 |
appendix | -1.727 |
defences | -1.643 |
strang | -1.568 |
gard | -1.504 |
Token | so |
Token ID | 523 |
Feature activation | +8.55e-02 |
Pos logit contributions | |
Supplement | +0.817 |
appendix | +0.815 |
defences | +0.768 |
strang | +0.735 |
gard | +0.714 |
Neg logit contributions | |
ounge | -0.986 |
practiced | -0.985 |
UA | -0.936 |
thus | -0.933 |
ildo | -0.921 |
Token | we |
Token ID | 356 |
Feature activation | +4.25e-01 |
Pos logit contributions | |
Supplement | +0.453 |
appendix | +0.453 |
defences | +0.429 |
strang | +0.414 |
gard | +0.404 |
Neg logit contributions | |
ounge | -0.455 |
practiced | -0.453 |
thus | -0.430 |
UA | -0.428 |
ildo | -0.420 |
Token | can |
Token ID | 460 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
appendix | +1.417 |
Supplement | +1.414 |
defences | +1.303 |
strang | +1.215 |
gard | +1.176 |
Neg logit contributions | |
ounge | -3.090 |
practiced | -3.058 |
UA | -2.955 |
thus | -2.951 |
ildo | -2.920 |
Token | ensure |
Token ID | 4155 |
Feature activation | +5.07e-01 |
Pos logit contributions | |
Supplement | +0.663 |
appendix | +0.662 |
defences | +0.620 |
strang | +0.593 |
gard | +0.573 |
Neg logit contributions | |
practiced | -0.958 |
ounge | -0.958 |
UA | -0.914 |
thus | -0.913 |
ildo | -0.897 |
Token | that |
Token ID | 326 |
Feature activation | +3.46e-01 |
Pos logit contributions | |
appendix | +2.551 |
Supplement | +2.521 |
defences | +2.398 |
strang | +2.312 |
gard | +2.281 |
Neg logit contributions | |
ounge | -2.851 |
practiced | -2.758 |
thus | -2.677 |
UA | -2.672 |
ildo | -2.616 |
Token | it |
Token ID | 340 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
appendix | +1.670 |
Supplement | +1.641 |
defences | +1.573 |
strang | +1.515 |
gard | +1.482 |
Neg logit contributions | |
ounge | -2.017 |
practiced | -1.957 |
UA | -1.899 |
thus | -1.896 |
ildo | -1.863 |
Token | doesn |
Token ID | 1595 |
Feature activation | -3.29e-01 |
Pos logit contributions | |
Supplement | +0.566 |
appendix | +0.565 |
defences | +0.531 |
strang | +0.508 |
gard | +0.492 |
Neg logit contributions | |
practiced | -0.753 |
ounge | -0.752 |
UA | -0.715 |
thus | -0.715 |
ildo | -0.703 |
Token | � |
Token ID | 447 |
Feature activation | +5.68e-02 |
Pos logit contributions | |
practiced | +1.675 |
ounge | +1.667 |
thus | +1.564 |
UA | +1.563 |
ildo | +1.534 |
Neg logit contributions | |
Supplement | -1.832 |
appendix | -1.816 |
defences | -1.721 |
strang | -1.663 |
gard | -1.621 |
Token | � |
Token ID | 247 |
Feature activation | -7.19e-02 |
Pos logit contributions | |
Supplement | +0.327 |
appendix | +0.326 |
defences | +0.309 |
strang | +0.299 |
gard | +0.292 |
Neg logit contributions | |
practiced | -0.275 |
ounge | -0.275 |
UA | -0.259 |
thus | -0.258 |
ildo | -0.253 |
Token | t |
Token ID | 83 |
Feature activation | -2.70e-02 |
Pos logit contributions | |
practiced | +0.380 |
ounge | +0.378 |
thus | +0.358 |
UA | +0.357 |
ildo | +0.350 |
Neg logit contributions | |
Supplement | -0.383 |
appendix | -0.383 |
defences | -0.364 |
strang | -0.350 |
gard | -0.340 |
Token | violate |
Token ID | 16967 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
practiced | +0.153 |
ounge | +0.152 |
thus | +0.145 |
UA | +0.144 |
ildo | +0.142 |
Neg logit contributions | |
Supplement | -0.134 |
appendix | -0.133 |
defences | -0.127 |
strang | -0.121 |
gard | -0.117 |
Token | network |
Token ID | 3127 |
Feature activation | -4.47e-02 |
Pos logit contributions | |
appendix | +0.834 |
Supplement | +0.827 |
defences | +0.781 |
strang | +0.752 |
gard | +0.727 |
Neg logit contributions | |
ounge | -1.132 |
practiced | -1.125 |
thus | -1.076 |
UA | -1.075 |
ildo | -1.053 |
Token | of |
Token ID | 286 |
Feature activation | -8.26e-02 |
Pos logit contributions | |
practiced | +0.262 |
ounge | +0.257 |
thus | +0.245 |
UA | +0.244 |
ildo | +0.241 |
Neg logit contributions | |
Supplement | -0.216 |
appendix | -0.212 |
defences | -0.201 |
strang | -0.193 |
gard | -0.186 |
Token | operatives |
Token ID | 27269 |
Feature activation | -2.08e-02 |
Pos logit contributions | |
practiced | +0.524 |
ounge | +0.515 |
thus | +0.495 |
UA | +0.492 |
ildo | +0.488 |
Neg logit contributions | |
Supplement | -0.360 |
appendix | -0.352 |
defences | -0.327 |
strang | -0.313 |
gard | -0.302 |
Token | who |
Token ID | 508 |
Feature activation | +4.07e-01 |
Pos logit contributions | |
practiced | +0.115 |
ounge | +0.114 |
thus | +0.109 |
UA | +0.108 |
ildo | +0.106 |
Neg logit contributions | |
Supplement | -0.106 |
appendix | -0.105 |
defences | -0.100 |
strang | -0.096 |
gard | -0.093 |
Token | want |
Token ID | 765 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
appendix | +1.693 |
Supplement | +1.686 |
defences | +1.574 |
strang | +1.510 |
gard | +1.455 |
Neg logit contributions | |
ounge | -2.615 |
practiced | -2.593 |
UA | -2.505 |
thus | -2.494 |
ildo | -2.448 |
Token | to |
Token ID | 284 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
Supplement | +1.331 |
appendix | +1.320 |
defences | +1.245 |
strang | +1.197 |
gard | +1.164 |
Neg logit contributions | |
practiced | -1.438 |
ounge | -1.421 |
thus | -1.353 |
UA | -1.348 |
ildo | -1.329 |
Token | blow |
Token ID | 6611 |
Feature activation | +3.64e-01 |
Pos logit contributions | |
appendix | +1.511 |
Supplement | +1.500 |
defences | +1.415 |
strang | +1.372 |
gard | +1.321 |
Neg logit contributions | |
ounge | -2.102 |
practiced | -2.082 |
UA | -2.013 |
thus | -2.001 |
ildo | -1.948 |
Token | up |
Token ID | 510 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
appendix | +1.346 |
Supplement | +1.340 |
defences | +1.257 |
strang | +1.187 |
gard | +1.132 |
Neg logit contributions | |
ounge | -2.504 |
practiced | -2.497 |
thus | -2.398 |
UA | -2.396 |
ildo | -2.353 |
Token | the |
Token ID | 262 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
appendix | +1.489 |
Supplement | +1.474 |
defences | +1.414 |
strang | +1.344 |
gard | +1.302 |
Neg logit contributions | |
ounge | -2.037 |
practiced | -2.012 |
thus | -1.933 |
UA | -1.927 |
ildo | -1.885 |
Token | World |
Token ID | 2159 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
appendix | +1.772 |
Supplement | +1.750 |
defences | +1.691 |
strang | +1.615 |
gard | +1.560 |
Neg logit contributions | |
ounge | -2.213 |
practiced | -2.184 |
thus | -2.092 |
UA | -2.089 |
ildo | -2.050 |
Token | Trade |
Token ID | 9601 |
Feature activation | +7.38e-02 |
Pos logit contributions | |
Supplement | +0.455 |
appendix | +0.452 |
defences | +0.414 |
strang | +0.388 |
gard | +0.373 |
Neg logit contributions | |
practiced | -1.012 |
ounge | -1.010 |
thus | -0.964 |
UA | -0.962 |
ildo | -0.954 |
Token | get |
Token ID | 651 |
Feature activation | -2.29e-01 |
Pos logit contributions | |
practiced | +0.415 |
ounge | +0.408 |
thus | +0.392 |
UA | +0.388 |
ildo | +0.381 |
Neg logit contributions | |
Supplement | -0.294 |
appendix | -0.290 |
defences | -0.274 |
strang | -0.259 |
gard | -0.252 |
Token | this |
Token ID | 428 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
practiced | +1.304 |
ounge | +1.273 |
thus | +1.222 |
UA | +1.212 |
ildo | +1.177 |
Neg logit contributions | |
Supplement | -1.141 |
appendix | -1.120 |
defences | -1.060 |
strang | -1.002 |
gard | -0.990 |
Token | : |
Token ID | 25 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
Supplement | +0.890 |
appendix | +0.883 |
defences | +0.836 |
strang | +0.800 |
gard | +0.778 |
Neg logit contributions | |
practiced | -1.038 |
ounge | -1.032 |
thus | -0.981 |
UA | -0.980 |
ildo | -0.961 |
Token |
|
Token ID | 198 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
Supplement | +1.971 |
appendix | +1.954 |
defences | +1.866 |
strang | +1.777 |
gard | +1.732 |
Neg logit contributions | |
practiced | -2.182 |
ounge | -2.168 |
thus | -2.062 |
UA | -2.052 |
ildo | -2.006 |
Token |
|
Token ID | 198 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
Supplement | +0.615 |
appendix | +0.596 |
defences | +0.541 |
strang | +0.522 |
gard | +0.507 |
Neg logit contributions | |
practiced | -0.886 |
ounge | -0.886 |
UA | -0.826 |
ildo | -0.824 |
anguage | -0.824 |
Token | + |
Token ID | 10 |
Feature activation | +8.47e-01 |
Pos logit contributions | |
Supplement | +0.770 |
appendix | +0.768 |
defences | +0.721 |
strang | +0.690 |
gard | +0.666 |
Neg logit contributions | |
practiced | -1.084 |
ounge | -1.081 |
thus | -1.032 |
UA | -1.031 |
ildo | -1.013 |
Token | -------------------- |
Token ID | 19351 |
Feature activation | +4.48e-01 |
Pos logit contributions | |
Supplement | +3.598 |
appendix | +3.435 |
defences | +3.013 |
Imm | +2.919 |
erald | +2.872 |
Neg logit contributions | |
practiced | -5.444 |
ounge | -5.366 |
anguage | -5.044 |
ildo | -5.024 |
UA | -4.939 |
Token | --+ |
Token ID | 44785 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
Supplement | +2.582 |
appendix | +2.577 |
defences | +2.338 |
strang | +2.260 |
gard | +2.257 |
Neg logit contributions | |
practiced | -2.209 |
ounge | -2.191 |
thus | -1.995 |
ildo | -1.993 |
UA | -1.992 |
Token | | |
Token ID | 930 |
Feature activation | -2.94e-01 |
Pos logit contributions | |
appendix | +0.734 |
Supplement | +0.732 |
defences | +0.678 |
strang | +0.662 |
gard | +0.640 |
Neg logit contributions | |
ounge | -0.839 |
practiced | -0.834 |
thus | -0.786 |
UA | -0.786 |
ildo | -0.773 |
Token | ... |
Token ID | 2644 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
practiced | +1.252 |
ounge | +1.231 |
thus | +1.136 |
UA | +1.132 |
ildo | +1.115 |
Neg logit contributions | |
Supplement | -1.865 |
appendix | -1.810 |
defences | -1.778 |
strang | -1.704 |
gard | -1.664 |
Token | | |
Token ID | 930 |
Feature activation | +6.14e-01 |
Pos logit contributions | |
practiced | +0.682 |
ounge | +0.681 |
thus | +0.641 |
UA | +0.640 |
ildo | +0.630 |
Neg logit contributions | |
Supplement | -0.631 |
appendix | -0.627 |
defences | -0.588 |
strang | -0.569 |
gard | -0.552 |
Token | writer |
Token ID | 6260 |
Feature activation | +4.11e-01 |
Pos logit contributions | |
practiced | +0.916 |
ounge | +0.909 |
UA | +0.867 |
thus | +0.862 |
ildo | +0.843 |
Neg logit contributions | |
Supplement | -0.807 |
appendix | -0.800 |
defences | -0.756 |
strang | -0.719 |
gard | -0.697 |
Token | Tom |
Token ID | 4186 |
Feature activation | -6.33e-02 |
Pos logit contributions | |
Supplement | +1.872 |
appendix | +1.867 |
defences | +1.759 |
strang | +1.700 |
gard | +1.639 |
Neg logit contributions | |
practiced | -2.471 |
ounge | -2.469 |
thus | -2.348 |
UA | -2.337 |
ildo | -2.307 |
Token | King |
Token ID | 2677 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
practiced | +0.367 |
ounge | +0.365 |
thus | +0.347 |
UA | +0.347 |
ildo | +0.341 |
Neg logit contributions | |
Supplement | -0.306 |
appendix | -0.305 |
defences | -0.288 |
strang | -0.276 |
gard | -0.267 |
Token | and |
Token ID | 290 |
Feature activation | -3.54e-01 |
Pos logit contributions | |
Supplement | +0.136 |
appendix | +0.136 |
defences | +0.129 |
strang | +0.122 |
gard | +0.119 |
Neg logit contributions | |
practiced | -0.162 |
ounge | -0.160 |
thus | -0.153 |
UA | -0.153 |
ildo | -0.150 |
Token | artist |
Token ID | 6802 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
practiced | +1.878 |
ounge | +1.852 |
thus | +1.757 |
UA | +1.755 |
ildo | +1.716 |
Neg logit contributions | |
Supplement | -1.895 |
appendix | -1.870 |
defences | -1.781 |
strang | -1.685 |
gard | -1.642 |
Token | Mitch |
Token ID | 20472 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
Supplement | +0.651 |
appendix | +0.649 |
defences | +0.613 |
strang | +0.590 |
gard | +0.572 |
Neg logit contributions | |
practiced | -0.764 |
ounge | -0.762 |
thus | -0.722 |
UA | -0.722 |
ildo | -0.709 |
Token | Ger |
Token ID | 13573 |
Feature activation | -7.22e-01 |
Pos logit contributions | |
practiced | +2.910 |
ounge | +2.908 |
UA | +2.761 |
thus | +2.748 |
ildo | +2.724 |
Neg logit contributions | |
Supplement | -3.072 |
appendix | -3.031 |
defences | -2.901 |
strang | -2.747 |
gard | -2.673 |
Token | ads |
Token ID | 5643 |
Feature activation | +2.03e-02 |
Pos logit contributions | |
ounge | +3.468 |
practiced | +3.407 |
thus | +3.394 |
ildo | +3.241 |
UA | +3.233 |
Neg logit contributions | |
appendix | -4.110 |
Supplement | -4.090 |
defences | -3.979 |
strang | -3.761 |
gard | -3.641 |
Token | , |
Token ID | 11 |
Feature activation | -6.42e-01 |
Pos logit contributions | |
Supplement | +0.101 |
appendix | +0.101 |
defences | +0.095 |
strang | +0.092 |
gard | +0.089 |
Neg logit contributions | |
practiced | -0.115 |
ounge | -0.114 |
thus | -0.108 |
UA | -0.108 |
ildo | -0.106 |
Token | following |
Token ID | 1708 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
practiced | +3.649 |
ounge | +3.569 |
thus | +3.445 |
UA | +3.391 |
ildo | +3.283 |
Neg logit contributions | |
Supplement | -3.174 |
appendix | -3.114 |
defences | -2.993 |
strang | -2.780 |
gard | -2.734 |
Token | their |
Token ID | 511 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
practiced | +1.542 |
ounge | +1.532 |
UA | +1.466 |
thus | +1.458 |
ildo | +1.426 |
Neg logit contributions | |
Supplement | -1.266 |
appendix | -1.247 |
defences | -1.179 |
strang | -1.116 |
gard | -1.090 |
Token |
|
Token ID | 198 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
Supplement | +0.493 |
appendix | +0.472 |
defences | +0.431 |
strang | +0.413 |
gard | +0.401 |
Neg logit contributions | |
practiced | -0.692 |
ounge | -0.688 |
anguage | -0.641 |
ildo | -0.640 |
thus | -0.639 |
Token | Looking |
Token ID | 15784 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
Supplement | +0.821 |
appendix | +0.804 |
defences | +0.755 |
strang | +0.730 |
gard | +0.708 |
Neg logit contributions | |
practiced | -0.835 |
ounge | -0.826 |
thus | -0.774 |
UA | -0.770 |
ildo | -0.768 |
Token | back |
Token ID | 736 |
Feature activation | -3.25e-01 |
Pos logit contributions | |
Supplement | +0.079 |
appendix | +0.079 |
defences | +0.075 |
strang | +0.072 |
gard | +0.069 |
Neg logit contributions | |
practiced | -0.095 |
ounge | -0.095 |
thus | -0.090 |
UA | -0.090 |
ildo | -0.089 |
Token | at |
Token ID | 379 |
Feature activation | -5.37e-01 |
Pos logit contributions | |
practiced | +1.760 |
ounge | +1.739 |
thus | +1.657 |
UA | +1.635 |
ildo | +1.591 |
Neg logit contributions | |
Supplement | -1.700 |
appendix | -1.684 |
defences | -1.604 |
strang | -1.529 |
gard | -1.481 |
Token | the |
Token ID | 262 |
Feature activation | -3.40e-01 |
Pos logit contributions | |
practiced | +3.070 |
ounge | +3.021 |
thus | +2.873 |
UA | +2.861 |
ildo | +2.783 |
Neg logit contributions | |
Supplement | -2.621 |
appendix | -2.553 |
defences | -2.450 |
strang | -2.317 |
gard | -2.289 |
Token | list |
Token ID | 1351 |
Feature activation | -3.10e-01 |
Pos logit contributions | |
practiced | +1.933 |
ounge | +1.911 |
thus | +1.816 |
UA | +1.802 |
ildo | +1.765 |
Neg logit contributions | |
Supplement | -1.695 |
appendix | -1.651 |
defences | -1.575 |
strang | -1.490 |
gard | -1.470 |
Token | today |
Token ID | 1909 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
practiced | +1.759 |
ounge | +1.741 |
thus | +1.655 |
UA | +1.645 |
ildo | +1.603 |
Neg logit contributions | |
Supplement | -1.548 |
appendix | -1.513 |
defences | -1.454 |
strang | -1.377 |
gard | -1.355 |
Token | , |
Token ID | 11 |
Feature activation | -2.92e-01 |
Pos logit contributions | |
practiced | +0.747 |
ounge | +0.738 |
thus | +0.698 |
UA | +0.698 |
ildo | +0.679 |
Neg logit contributions | |
Supplement | -0.756 |
appendix | -0.746 |
defences | -0.713 |
strang | -0.683 |
gard | -0.663 |
Token | there |
Token ID | 612 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
practiced | +1.698 |
ounge | +1.684 |
thus | +1.602 |
UA | +1.591 |
ildo | +1.558 |
Neg logit contributions | |
Supplement | -1.411 |
appendix | -1.388 |
defences | -1.321 |
strang | -1.253 |
gard | -1.226 |
Token | may |
Token ID | 743 |
Feature activation | -5.10e-01 |
Pos logit contributions | |
practiced | +1.123 |
ounge | +1.109 |
thus | +1.060 |
UA | +1.050 |
ildo | +1.034 |
Neg logit contributions | |
Supplement | -0.754 |
appendix | -0.741 |
defences | -0.695 |
strang | -0.661 |
gard | -0.632 |
Token | be |
Token ID | 307 |
Feature activation | -5.23e-01 |
Pos logit contributions | |
practiced | +2.710 |
ounge | +2.699 |
thus | +2.523 |
ildo | +2.483 |
UA | +2.407 |
Neg logit contributions | |
Supplement | -2.700 |
appendix | -2.643 |
defences | -2.529 |
strang | -2.358 |
gard | -2.284 |
Token | investigation |
Token ID | 3645 |
Feature activation | -7.58e-02 |
Pos logit contributions | |
appendix | +1.507 |
Supplement | +1.505 |
defences | +1.405 |
strang | +1.350 |
gard | +1.306 |
Neg logit contributions | |
ounge | -1.991 |
practiced | -1.975 |
UA | -1.883 |
thus | -1.883 |
ildo | -1.861 |
Token | , |
Token ID | 11 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
practiced | +0.441 |
ounge | +0.436 |
thus | +0.416 |
UA | +0.415 |
ildo | +0.407 |
Neg logit contributions | |
Supplement | -0.366 |
appendix | -0.361 |
defences | -0.343 |
strang | -0.330 |
gard | -0.319 |
Token | but |
Token ID | 475 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
practiced | +1.083 |
ounge | +1.065 |
thus | +1.030 |
UA | +1.022 |
ildo | +1.002 |
Neg logit contributions | |
Supplement | -0.663 |
appendix | -0.655 |
defences | -0.617 |
strang | -0.582 |
gard | -0.559 |
Token | also |
Token ID | 635 |
Feature activation | +5.61e-01 |
Pos logit contributions | |
appendix | +1.335 |
Supplement | +1.334 |
defences | +1.264 |
strang | +1.227 |
gard | +1.193 |
Neg logit contributions | |
ounge | -1.217 |
practiced | -1.206 |
UA | -1.144 |
thus | -1.136 |
ildo | -1.121 |
Token | ordered |
Token ID | 6149 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
appendix | +2.658 |
Supplement | +2.638 |
defences | +2.473 |
strang | +2.409 |
gard | +2.334 |
Neg logit contributions | |
ounge | -3.304 |
practiced | -3.210 |
UA | -3.131 |
thus | -3.081 |
ildo | -3.075 |
Token | the |
Token ID | 262 |
Feature activation | -1.61e-01 |
Pos logit contributions | |
practiced | +0.960 |
ounge | +0.941 |
UA | +0.899 |
thus | +0.896 |
ildo | +0.880 |
Neg logit contributions | |
Supplement | -0.809 |
appendix | -0.802 |
defences | -0.752 |
strang | -0.725 |
gard | -0.699 |
Token | destruction |
Token ID | 8166 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
practiced | +0.950 |
ounge | +0.933 |
thus | +0.893 |
UA | +0.891 |
ildo | +0.872 |
Neg logit contributions | |
Supplement | -0.764 |
appendix | -0.749 |
defences | -0.711 |
strang | -0.676 |
gard | -0.656 |
Token | of |
Token ID | 286 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
Supplement | +0.666 |
appendix | +0.652 |
defences | +0.620 |
strang | +0.597 |
gard | +0.574 |
Neg logit contributions | |
practiced | -0.863 |
ounge | -0.844 |
thus | -0.809 |
UA | -0.809 |
ildo | -0.794 |
Token | all |
Token ID | 477 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
appendix | +0.883 |
Supplement | +0.882 |
defences | +0.829 |
strang | +0.792 |
gard | +0.767 |
Neg logit contributions | |
ounge | -1.182 |
practiced | -1.178 |
thus | -1.124 |
UA | -1.123 |
ildo | -1.107 |
Token | documents |
Token ID | 4963 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
Supplement | +0.788 |
appendix | +0.785 |
defences | +0.738 |
strang | +0.707 |
gard | +0.684 |
Neg logit contributions | |
practiced | -1.041 |
ounge | -1.037 |
thus | -0.988 |
UA | -0.987 |
ildo | -0.970 |
Token | in |
Token ID | 287 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
Supplement | +0.057 |
appendix | +0.057 |
defences | +0.054 |
strang | +0.051 |
gard | +0.050 |
Neg logit contributions | |
practiced | -0.073 |
ounge | -0.072 |
thus | -0.069 |
UA | -0.069 |
ildo | -0.067 |
Token | how |
Token ID | 703 |
Feature activation | +7.10e-01 |
Pos logit contributions | |
Supplement | +1.488 |
appendix | +1.486 |
defences | +1.402 |
strang | +1.341 |
gard | +1.297 |
Neg logit contributions | |
practiced | -1.963 |
ounge | -1.961 |
thus | -1.867 |
UA | -1.866 |
ildo | -1.837 |
Token | cognitive |
Token ID | 10870 |
Feature activation | +9.22e-01 |
Pos logit contributions | |
appendix | +3.225 |
Supplement | +3.136 |
defences | +3.106 |
strang | +2.940 |
gard | +2.842 |
Neg logit contributions | |
ounge | -4.290 |
practiced | -4.180 |
UA | -4.088 |
ildo | -4.053 |
thus | -4.044 |
Token | capacities |
Token ID | 32484 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
defences | +4.019 |
appendix | +4.000 |
Supplement | +3.859 |
strang | +3.733 |
gard | +3.654 |
Neg logit contributions | |
ounge | -5.689 |
UA | -5.393 |
practiced | -5.393 |
thus | -5.354 |
ildo | -5.265 |
Token | for |
Token ID | 329 |
Feature activation | +8.96e-02 |
Pos logit contributions | |
appendix | +3.141 |
Supplement | +3.088 |
defences | +2.959 |
strang | +2.850 |
gard | +2.752 |
Neg logit contributions | |
ounge | -3.800 |
practiced | -3.670 |
UA | -3.645 |
thus | -3.590 |
ildo | -3.556 |
Token | viewing |
Token ID | 11681 |
Feature activation | -3.35e-01 |
Pos logit contributions | |
Supplement | +0.456 |
appendix | +0.454 |
defences | +0.431 |
strang | +0.414 |
gard | +0.402 |
Neg logit contributions | |
practiced | -0.494 |
ounge | -0.494 |
thus | -0.468 |
UA | -0.468 |
ildo | -0.460 |
Token | complex |
Token ID | 3716 |
Feature activation | -6.09e-01 |
Pos logit contributions | |
practiced | +1.904 |
ounge | +1.848 |
thus | +1.770 |
UA | +1.751 |
ildo | +1.698 |
Neg logit contributions | |
Supplement | -1.687 |
appendix | -1.639 |
defences | -1.529 |
strang | -1.459 |
gard | -1.437 |
Token | images |
Token ID | 4263 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
practiced | +3.290 |
ounge | +3.168 |
thus | +3.048 |
UA | +3.014 |
ildo | +2.898 |
Neg logit contributions | |
Supplement | -3.196 |
appendix | -3.098 |
defences | -2.825 |
strang | -2.757 |
gard | -2.702 |
Token | evolved |
Token ID | 12572 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
practiced | +1.638 |
ounge | +1.607 |
thus | +1.542 |
UA | +1.514 |
ildo | +1.500 |
Neg logit contributions | |
Supplement | -1.211 |
appendix | -1.198 |
defences | -1.127 |
strang | -1.076 |
gard | -1.041 |
Token | in |
Token ID | 287 |
Feature activation | +9.13e-02 |
Pos logit contributions | |
practiced | +0.951 |
ounge | +0.935 |
thus | +0.896 |
UA | +0.886 |
ildo | +0.870 |
Neg logit contributions | |
Supplement | -0.877 |
appendix | -0.869 |
defences | -0.822 |
strang | -0.794 |
gard | -0.767 |
Token | brains |
Token ID | 14290 |
Feature activation | +5.28e-01 |
Pos logit contributions | |
Supplement | +0.430 |
appendix | +0.424 |
defences | +0.398 |
strang | +0.383 |
gard | +0.371 |
Neg logit contributions | |
practiced | -0.545 |
ounge | -0.538 |
thus | -0.513 |
UA | -0.510 |
ildo | -0.500 |
Token | . |
Token ID | 13 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
appendix | +2.571 |
Supplement | +2.571 |
defences | +2.436 |
strang | +2.331 |
gard | +2.268 |
Neg logit contributions | |
ounge | -3.016 |
practiced | -2.950 |
UA | -2.859 |
thus | -2.841 |
ildo | -2.800 |
Token | must |
Token ID | 1276 |
Feature activation | -4.87e-01 |
Pos logit contributions | |
appendix | +0.952 |
Supplement | +0.947 |
defences | +0.886 |
strang | +0.852 |
gard | +0.819 |
Neg logit contributions | |
ounge | -1.457 |
practiced | -1.444 |
UA | -1.388 |
thus | -1.385 |
ildo | -1.365 |
Token | - |
Token ID | 12 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
practiced | +2.758 |
ounge | +2.702 |
thus | +2.623 |
UA | +2.609 |
ildo | +2.523 |
Neg logit contributions | |
Supplement | -2.355 |
appendix | -2.321 |
defences | -2.229 |
strang | -2.151 |
gard | -2.058 |
Token | read |
Token ID | 961 |
Feature activation | -6.03e-02 |
Pos logit contributions | |
practiced | +1.692 |
ounge | +1.685 |
thus | +1.637 |
UA | +1.600 |
ildo | +1.572 |
Neg logit contributions | |
appendix | -1.467 |
Supplement | -1.464 |
defences | -1.417 |
strang | -1.366 |
gard | -1.310 |
Token | for |
Token ID | 329 |
Feature activation | -2.24e-01 |
Pos logit contributions | |
practiced | +0.346 |
ounge | +0.344 |
thus | +0.327 |
UA | +0.326 |
ildo | +0.320 |
Neg logit contributions | |
Supplement | -0.294 |
appendix | -0.291 |
defences | -0.277 |
strang | -0.266 |
gard | -0.258 |
Token | the |
Token ID | 262 |
Feature activation | +8.85e-02 |
Pos logit contributions | |
practiced | +1.312 |
ounge | +1.290 |
thus | +1.236 |
UA | +1.222 |
ildo | +1.202 |
Neg logit contributions | |
Supplement | -1.070 |
appendix | -1.049 |
defences | -0.991 |
strang | -0.955 |
gard | -0.927 |
Token | basic |
Token ID | 4096 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
Supplement | +0.415 |
appendix | +0.414 |
defences | +0.389 |
strang | +0.374 |
gard | +0.362 |
Neg logit contributions | |
practiced | -0.524 |
ounge | -0.523 |
thus | -0.498 |
UA | -0.497 |
ildo | -0.489 |
Token | intuition |
Token ID | 31563 |
Feature activation | +3.07e-01 |
Pos logit contributions | |
practiced | +0.900 |
ounge | +0.892 |
thus | +0.851 |
UA | +0.847 |
ildo | +0.833 |
Neg logit contributions | |
Supplement | -0.707 |
appendix | -0.694 |
defences | -0.655 |
strang | -0.628 |
gard | -0.608 |
Token | about |
Token ID | 546 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
appendix | +1.480 |
Supplement | +1.478 |
defences | +1.396 |
strang | +1.338 |
gard | +1.302 |
Neg logit contributions | |
ounge | -1.771 |
practiced | -1.757 |
thus | -1.678 |
UA | -1.672 |
ildo | -1.645 |
Token | how |
Token ID | 703 |
Feature activation | +5.58e-01 |
Pos logit contributions | |
appendix | +0.844 |
Supplement | +0.843 |
defences | +0.794 |
strang | +0.763 |
gard | +0.736 |
Neg logit contributions | |
ounge | -1.076 |
practiced | -1.073 |
UA | -1.021 |
thus | -1.020 |
ildo | -1.005 |
Token | transaction |
Token ID | 8611 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
appendix | +2.658 |
Supplement | +2.604 |
defences | +2.504 |
strang | +2.418 |
gard | +2.303 |
Neg logit contributions | |
ounge | -3.289 |
practiced | -3.202 |
UA | -3.101 |
thus | -3.068 |
ildo | -3.043 |
Token | capacity |
Token ID | 5339 |
Feature activation | +7.08e-01 |
Pos logit contributions | |
practiced | +1.337 |
ounge | +1.304 |
thus | +1.250 |
UA | +1.244 |
ildo | +1.228 |
Neg logit contributions | |
Supplement | -1.033 |
appendix | -1.008 |
defences | -0.951 |
strang | -0.904 |
gard | -0.877 |
Token | collapsing |
Token ID | 30792 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
practiced | +2.480 |
ounge | +2.412 |
thus | +2.309 |
UA | +2.290 |
ildo | +2.249 |
Neg logit contributions | |
Supplement | -2.021 |
appendix | -1.967 |
defences | -1.824 |
strang | -1.751 |
gard | -1.702 |
Token | monster |
Token ID | 9234 |
Feature activation | -8.85e-01 |
Pos logit contributions | |
practiced | +5.883 |
ounge | +5.588 |
UA | +5.417 |
thus | +5.414 |
fray | +5.350 |
Neg logit contributions | |
Supplement | -5.191 |
appendix | -4.775 |
defences | -4.322 |
strang | -4.303 |
erald | -4.295 |
Token | . |
Token ID | 13 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
practiced | +4.351 |
ounge | +4.203 |
UA | +4.024 |
thus | +4.001 |
ildo | +3.902 |
Neg logit contributions | |
Supplement | -4.878 |
appendix | -4.831 |
defences | -4.457 |
strang | -4.383 |
erald | -4.266 |
Token | After |
Token ID | 2293 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
practiced | +2.135 |
ounge | +2.130 |
thus | +2.051 |
UA | +2.040 |
ildo | +1.991 |
Neg logit contributions | |
appendix | -2.162 |
Supplement | -2.132 |
defences | -2.066 |
strang | -1.968 |
gard | -1.913 |
Token | centuries |
Token ID | 10675 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
practiced | +5.602 |
ounge | +5.310 |
thus | +5.270 |
UA | +5.055 |
ildo | +4.956 |
Neg logit contributions | |
Supplement | -4.999 |
appendix | -4.889 |
defences | -4.652 |
strang | -4.334 |
gard | -4.239 |
Token | of |
Token ID | 286 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
practiced | +5.853 |
ounge | +5.318 |
thus | +5.187 |
UA | +5.091 |
ildo | +4.973 |
Neg logit contributions | |
Supplement | -5.480 |
appendix | -5.387 |
defences | -4.994 |
erald | -4.818 |
strang | -4.765 |
Token | oppression |
Token ID | 18345 |
Feature activation | -4.20e-01 |
Pos logit contributions | |
practiced | +6.092 |
ounge | +5.652 |
thus | +5.444 |
UA | +5.316 |
ildo | +5.283 |
Neg logit contributions | |
Supplement | -4.775 |
appendix | -4.536 |
defences | -4.221 |
erald | -3.955 |
gard | -3.943 |
Token | , |
Token ID | 11 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
practiced | +2.331 |
ounge | +2.228 |
thus | +2.124 |
UA | +2.108 |
ildo | +2.086 |
Neg logit contributions | |
Supplement | -2.190 |
appendix | -2.173 |
defences | -2.024 |
strang | -1.951 |
gard | -1.899 |
Token | humanity |
Token ID | 9265 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
Supplement | +1.506 |
appendix | +1.504 |
defences | +1.423 |
strang | +1.371 |
gard | +1.322 |
Neg logit contributions | |
ounge | -1.858 |
practiced | -1.850 |
UA | -1.766 |
thus | -1.763 |
ildo | -1.730 |
Token | was |
Token ID | 373 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
practiced | +1.714 |
ounge | +1.646 |
thus | +1.583 |
UA | +1.552 |
ildo | +1.535 |
Neg logit contributions | |
Supplement | -1.324 |
appendix | -1.308 |
defences | -1.213 |
strang | -1.166 |
gard | -1.123 |
Token | at |
Token ID | 379 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
practiced | +0.090 |
ounge | +0.089 |
thus | +0.085 |
UA | +0.084 |
ildo | +0.083 |
Neg logit contributions | |
Supplement | -0.056 |
appendix | -0.055 |
defences | -0.052 |
strang | -0.049 |
gard | -0.047 |
Token | news |
Token ID | 1705 |
Feature activation | -6.17e-02 |
Pos logit contributions | |
appendix | +1.294 |
Supplement | +1.286 |
defences | +1.216 |
strang | +1.177 |
gard | +1.136 |
Neg logit contributions | |
practiced | -1.473 |
ounge | -1.471 |
thus | -1.398 |
UA | -1.397 |
ildo | -1.374 |
Token | that |
Token ID | 326 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
practiced | +0.340 |
ounge | +0.338 |
thus | +0.320 |
UA | +0.320 |
ildo | +0.314 |
Neg logit contributions | |
Supplement | -0.315 |
appendix | -0.313 |
defences | -0.298 |
strang | -0.285 |
gard | -0.277 |
Token | Oculus |
Token ID | 22334 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
Supplement | +1.079 |
appendix | +1.078 |
defences | +1.018 |
strang | +0.981 |
gard | +0.953 |
Neg logit contributions | |
practiced | -1.206 |
ounge | -1.205 |
thus | -1.141 |
UA | -1.140 |
ildo | -1.119 |
Token | Jo |
Token ID | 5302 |
Feature activation | +4.80e-01 |
Pos logit contributions | |
practiced | +1.127 |
ounge | +1.117 |
thus | +1.064 |
UA | +1.061 |
ildo | +1.043 |
Neg logit contributions | |
Supplement | -0.947 |
appendix | -0.942 |
defences | -0.886 |
strang | -0.851 |
gard | -0.825 |
Token | ins |
Token ID | 1040 |
Feature activation | -8.68e-01 |
Pos logit contributions | |
Supplement | +2.767 |
appendix | +2.743 |
defences | +2.644 |
strang | +2.544 |
gard | +2.468 |
Neg logit contributions | |
ounge | -2.284 |
practiced | -2.280 |
thus | -2.147 |
UA | -2.141 |
ildo | -2.088 |
Token | Facebook |
Token ID | 3203 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
practiced | +4.416 |
ounge | +4.396 |
UA | +4.207 |
thus | +4.203 |
ildo | +4.059 |
Neg logit contributions | |
Supplement | -4.626 |
appendix | -4.559 |
defences | -4.302 |
strang | -4.161 |
gard | -4.096 |
Token | . |
Token ID | 13 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
practiced | +6.674 |
ounge | +6.567 |
UA | +6.344 |
thus | +6.283 |
fray | +6.147 |
Neg logit contributions | |
Supplement | -6.439 |
appendix | -6.399 |
defences | -6.060 |
gard | -5.787 |
strang | -5.756 |
Token | The |
Token ID | 383 |
Feature activation | -4.74e-01 |
Pos logit contributions | |
practiced | +1.520 |
ounge | +1.518 |
thus | +1.444 |
UA | +1.440 |
ildo | +1.409 |
Neg logit contributions | |
Supplement | -1.496 |
appendix | -1.493 |
defences | -1.421 |
strang | -1.365 |
gard | -1.329 |
Token | news |
Token ID | 1705 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
practiced | +2.685 |
ounge | +2.667 |
thus | +2.531 |
UA | +2.519 |
ildo | +2.466 |
Neg logit contributions | |
Supplement | -2.355 |
appendix | -2.308 |
defences | -2.184 |
strang | -2.067 |
gard | -2.030 |
Token | that |
Token ID | 326 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
practiced | +0.929 |
ounge | +0.921 |
thus | +0.879 |
UA | +0.877 |
ildo | +0.861 |
Neg logit contributions | |
Supplement | -0.710 |
appendix | -0.704 |
defences | -0.666 |
strang | -0.633 |
gard | -0.614 |
Token | Facebook |
Token ID | 3203 |
Feature activation | -9.15e-01 |
Pos logit contributions | |
Supplement | +0.641 |
appendix | +0.640 |
defences | +0.608 |
strang | +0.587 |
gard | +0.571 |
Neg logit contributions | |
practiced | -0.617 |
ounge | -0.616 |
UA | -0.582 |
thus | -0.581 |
ildo | -0.570 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +4.12e-01 |
Pos logit contributions | |
practiced | +1.398 |
ounge | +1.394 |
thus | +1.327 |
UA | +1.325 |
ildo | +1.297 |
Neg logit contributions | |
Supplement | -1.295 |
appendix | -1.293 |
defences | -1.229 |
strang | -1.180 |
gard | -1.145 |
Token | Christian |
Token ID | 20298 |
Feature activation | -5.51e-01 |
Pos logit contributions | |
Supplement | +2.290 |
appendix | +2.216 |
defences | +2.095 |
strang | +2.018 |
gard | +1.973 |
Neg logit contributions | |
practiced | -2.133 |
ounge | -2.112 |
thus | -1.957 |
ildo | -1.948 |
UA | -1.943 |
Token | philosopher |
Token ID | 23723 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
practiced | +2.981 |
ounge | +2.851 |
thus | +2.792 |
UA | +2.748 |
ildo | +2.744 |
Neg logit contributions | |
Supplement | -2.865 |
appendix | -2.833 |
defences | -2.648 |
strang | -2.557 |
erald | -2.463 |
Token | and |
Token ID | 290 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
practiced | +0.553 |
ounge | +0.545 |
thus | +0.518 |
UA | +0.518 |
ildo | +0.508 |
Neg logit contributions | |
Supplement | -0.528 |
appendix | -0.521 |
defences | -0.493 |
strang | -0.475 |
gard | -0.459 |
Token | blogger |
Token ID | 23530 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
practiced | +1.464 |
ounge | +1.432 |
thus | +1.368 |
UA | +1.361 |
ildo | +1.341 |
Neg logit contributions | |
Supplement | -1.305 |
appendix | -1.277 |
defences | -1.211 |
strang | -1.153 |
gard | -1.113 |
Token | Dr |
Token ID | 1583 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
Supplement | +0.654 |
appendix | +0.651 |
defences | +0.617 |
strang | +0.594 |
gard | +0.577 |
Neg logit contributions | |
practiced | -0.692 |
ounge | -0.690 |
thus | -0.654 |
UA | -0.653 |
ildo | -0.640 |
Token | Glenn |
Token ID | 17551 |
Feature activation | -6.99e-01 |
Pos logit contributions | |
ounge | +4.915 |
practiced | +4.865 |
ildo | +4.665 |
thus | +4.552 |
UA | +4.513 |
Neg logit contributions | |
Supplement | -6.125 |
appendix | -6.091 |
defences | -5.832 |
strang | -5.535 |
gard | -5.362 |
Token | Peoples |
Token ID | 41770 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
ounge | +3.600 |
practiced | +3.591 |
ildo | +3.438 |
thus | +3.407 |
UA | +3.389 |
Neg logit contributions | |
Supplement | -3.736 |
appendix | -3.702 |
defences | -3.476 |
strang | -3.297 |
gard | -3.201 |
Token | is |
Token ID | 318 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
practiced | +0.662 |
ounge | +0.652 |
thus | +0.624 |
UA | +0.623 |
ildo | +0.612 |
Neg logit contributions | |
Supplement | -0.480 |
appendix | -0.475 |
defences | -0.444 |
strang | -0.426 |
gard | -0.409 |
Token | coming |
Token ID | 2406 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
practiced | +2.012 |
ounge | +1.958 |
thus | +1.861 |
UA | +1.842 |
ildo | +1.812 |
Neg logit contributions | |
Supplement | -1.883 |
appendix | -1.849 |
defences | -1.749 |
strang | -1.674 |
gard | -1.626 |
Token | to |
Token ID | 284 |
Feature activation | -7.27e-01 |
Pos logit contributions | |
practiced | +1.100 |
ounge | +1.085 |
thus | +1.042 |
UA | +1.034 |
ildo | +1.015 |
Neg logit contributions | |
Supplement | -0.863 |
appendix | -0.850 |
defences | -0.798 |
strang | -0.765 |
gard | -0.737 |
Token | im |
Token ID | 320 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
practiced | +1.068 |
ounge | +1.060 |
thus | +1.012 |
UA | +0.999 |
ildo | +0.985 |
Neg logit contributions | |
Supplement | -1.077 |
appendix | -1.075 |
defences | -1.026 |
strang | -0.985 |
gard | -0.958 |
Token | arer |
Token ID | 11258 |
Feature activation | -1.48e-01 |
Pos logit contributions | |
Supplement | +0.834 |
appendix | +0.829 |
defences | +0.788 |
strang | +0.758 |
gard | +0.736 |
Neg logit contributions | |
practiced | -0.849 |
ounge | -0.844 |
thus | -0.801 |
UA | -0.799 |
ildo | -0.784 |
Token | Rep |
Token ID | 1432 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
practiced | +0.831 |
ounge | +0.828 |
thus | +0.792 |
UA | +0.788 |
ildo | +0.772 |
Neg logit contributions | |
Supplement | -0.740 |
appendix | -0.733 |
defences | -0.701 |
strang | -0.665 |
gard | -0.646 |
Token | ub |
Token ID | 549 |
Feature activation | +3.06e-02 |
Pos logit contributions | |
ounge | +0.548 |
practiced | +0.546 |
thus | +0.505 |
UA | +0.494 |
ildo | +0.490 |
Neg logit contributions | |
Supplement | -1.188 |
appendix | -1.186 |
defences | -1.150 |
strang | -1.110 |
gard | -1.085 |
Token | lik |
Token ID | 46965 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
Supplement | +0.171 |
appendix | +0.171 |
defences | +0.162 |
strang | +0.157 |
gard | +0.153 |
Neg logit contributions | |
practiced | -0.153 |
ounge | -0.152 |
thus | -0.144 |
UA | -0.144 |
ildo | -0.140 |
Token | ," |
Token ID | 553 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
practiced | +1.463 |
ounge | +1.451 |
thus | +1.387 |
UA | +1.372 |
ildo | +1.352 |
Neg logit contributions | |
Supplement | -1.486 |
appendix | -1.470 |
defences | -1.413 |
strang | -1.343 |
gard | -1.307 |
Token | was |
Token ID | 373 |
Feature activation | -4.97e-01 |
Pos logit contributions | |
practiced | +5.779 |
ounge | +5.244 |
thus | +5.151 |
UA | +4.992 |
ildo | +4.960 |
Neg logit contributions | |
Supplement | -4.843 |
appendix | -4.755 |
defences | -4.580 |
strang | -4.301 |
erald | -4.216 |
Token | put |
Token ID | 1234 |
Feature activation | -5.97e-02 |
Pos logit contributions | |
practiced | +2.837 |
ounge | +2.670 |
thus | +2.553 |
UA | +2.522 |
ildo | +2.458 |
Neg logit contributions | |
Supplement | -2.526 |
appendix | -2.480 |
defences | -2.346 |
strang | -2.220 |
erald | -2.204 |
Token | under |
Token ID | 739 |
Feature activation | +2.41e-02 |
Pos logit contributions | |
practiced | +0.350 |
ounge | +0.347 |
thus | +0.332 |
UA | +0.329 |
ildo | +0.324 |
Neg logit contributions | |
Supplement | -0.285 |
appendix | -0.282 |
defences | -0.266 |
strang | -0.255 |
gard | -0.248 |
Token | fatal |
Token ID | 10800 |
Feature activation | +5.11e-03 |
Pos logit contributions | |
Supplement | +0.110 |
appendix | +0.109 |
defences | +0.102 |
strang | +0.098 |
gard | +0.094 |
Neg logit contributions | |
practiced | -0.147 |
ounge | -0.145 |
thus | -0.139 |
UA | -0.138 |
ildo | -0.135 |
Token | pressure |
Token ID | 3833 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
Supplement | +0.024 |
appendix | +0.024 |
defences | +0.022 |
strang | +0.021 |
gard | +0.021 |
Neg logit contributions | |
practiced | -0.030 |
ounge | -0.030 |
thus | -0.029 |
UA | -0.028 |
ildo | -0.028 |
Token | way |
Token ID | 835 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
practiced | +3.351 |
ounge | +3.224 |
thus | +3.073 |
UA | +3.065 |
ildo | +3.039 |
Neg logit contributions | |
Supplement | -2.396 |
appendix | -2.330 |
defences | -2.196 |
strang | -2.078 |
erald | -1.995 |
Token | to |
Token ID | 284 |
Feature activation | -5.22e-01 |
Pos logit contributions | |
practiced | +1.570 |
ounge | +1.532 |
thus | +1.460 |
UA | +1.454 |
ildo | +1.437 |
Neg logit contributions | |
Supplement | -1.463 |
appendix | -1.452 |
defences | -1.374 |
strang | -1.322 |
gard | -1.278 |
Token | share |
Token ID | 2648 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
practiced | +3.239 |
ounge | +3.161 |
thus | +3.017 |
ildo | +2.990 |
UA | +2.980 |
Neg logit contributions | |
Supplement | -2.311 |
appendix | -2.250 |
defences | -2.122 |
strang | -2.005 |
gard | -1.926 |
Token | sacred |
Token ID | 13626 |
Feature activation | -3.79e-01 |
Pos logit contributions | |
practiced | +7.137 |
ounge | +6.642 |
thus | +6.479 |
UA | +6.369 |
ildo | +6.347 |
Neg logit contributions | |
Supplement | -5.990 |
appendix | -5.667 |
defences | -5.235 |
andestine | -5.102 |
strang | -5.099 |
Token | space |
Token ID | 2272 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
practiced | +2.128 |
ounge | +2.067 |
thus | +1.982 |
UA | +1.977 |
ildo | +1.926 |
Neg logit contributions | |
Supplement | -1.928 |
appendix | -1.884 |
defences | -1.756 |
strang | -1.694 |
gard | -1.644 |
Token | without |
Token ID | 1231 |
Feature activation | -9.90e-01 |
Pos logit contributions | |
practiced | +3.194 |
ounge | +3.098 |
thus | +2.989 |
UA | +2.933 |
ildo | +2.880 |
Neg logit contributions | |
Supplement | -3.169 |
appendix | -3.151 |
defences | -2.975 |
strang | -2.892 |
gard | -2.788 |
Token | trying |
Token ID | 2111 |
Feature activation | +2.13e-02 |
Pos logit contributions | |
practiced | +5.416 |
ounge | +5.158 |
fray | +4.836 |
thus | +4.808 |
ildo | +4.795 |
Neg logit contributions | |
Supplement | -5.049 |
appendix | -4.782 |
defences | -4.423 |
erald | -4.301 |
andestine | -4.241 |
Token | to |
Token ID | 284 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
Supplement | +0.112 |
appendix | +0.111 |
defences | +0.105 |
strang | +0.101 |
gard | +0.098 |
Neg logit contributions | |
practiced | -0.115 |
ounge | -0.114 |
thus | -0.107 |
UA | -0.107 |
ildo | -0.105 |
Token | convert |
Token ID | 10385 |
Feature activation | -7.76e-01 |
Pos logit contributions | |
Supplement | +0.121 |
appendix | +0.120 |
defences | +0.113 |
strang | +0.108 |
gard | +0.105 |
Neg logit contributions | |
practiced | -0.157 |
ounge | -0.156 |
thus | -0.149 |
UA | -0.148 |
ildo | -0.146 |
Token | one |
Token ID | 530 |
Feature activation | -5.83e-01 |
Pos logit contributions | |
practiced | +4.461 |
ounge | +4.255 |
UA | +4.047 |
thus | +4.043 |
ildo | +4.030 |
Neg logit contributions | |
Supplement | -3.871 |
appendix | -3.745 |
defences | -3.488 |
strang | -3.364 |
gard | -3.228 |
Token | another |
Token ID | 1194 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
practiced | +3.397 |
ounge | +3.261 |
UA | +3.109 |
thus | +3.083 |
ildo | +3.079 |
Neg logit contributions | |
Supplement | -2.836 |
appendix | -2.742 |
defences | -2.624 |
strang | -2.493 |
gard | -2.376 |