Token | that |
Token ID | 326 |
Feature activation | +9.28e-02 |
Pos logit contributions | |
ricks | +3.080 |
idth | +2.893 |
--------------- | +2.804 |
abama | +2.793 |
akespeare | +2.715 |
Neg logit contributions | |
ULAR | -2.836 |
eur | -2.815 |
Versus | -2.795 |
aido | -2.721 |
INESS | -2.696 |
Token | toxic |
Token ID | 11422 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
eur | +0.465 |
ULAR | +0.455 |
Versus | +0.450 |
atively | +0.436 |
aido | +0.433 |
Neg logit contributions | |
ricks | -0.586 |
idth | -0.561 |
abama | -0.537 |
--------------- | -0.529 |
akespeare | -0.523 |
Token | waste |
Token ID | 7030 |
Feature activation | +4.52e-01 |
Pos logit contributions | |
ricks | +0.714 |
idth | +0.674 |
--------------- | +0.643 |
abama | +0.640 |
akespeare | +0.626 |
Neg logit contributions | |
eur | -0.650 |
ULAR | -0.645 |
Versus | -0.640 |
aido | -0.623 |
atively | -0.617 |
Token | from |
Token ID | 422 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
eur | +2.113 |
Versus | +2.063 |
ULAR | +2.040 |
survival | +1.968 |
INESS | +1.963 |
Neg logit contributions | |
ricks | -2.979 |
idth | -2.822 |
abama | -2.758 |
--------------- | -2.680 |
akespeare | -2.641 |
Token | Rob |
Token ID | 3851 |
Feature activation | +8.37e-02 |
Pos logit contributions | |
eur | +1.377 |
Versus | +1.375 |
ULAR | +1.347 |
atively | +1.287 |
aido | +1.281 |
Neg logit contributions | |
ricks | -1.689 |
idth | -1.643 |
abama | -1.555 |
--------------- | -1.539 |
raught | -1.489 |
Token | oc |
Token ID | 420 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
Versus | +0.417 |
eur | +0.411 |
ULAR | +0.403 |
opa | +0.397 |
aido | +0.397 |
Neg logit contributions | |
ricks | -0.515 |
idth | -0.502 |
abama | -0.486 |
xual | -0.485 |
--------------- | -0.475 |
Token | op |
Token ID | 404 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
aido | +8.787 |
opa | +8.701 |
atively | +7.813 |
eur | +7.730 |
here | +7.487 |
Neg logit contributions | |
--------------- | -16.462 |
enriched | -16.123 |
�� | -15.761 |
�� | -15.325 |
enrich | -15.282 |
Token | . |
Token ID | 13 |
Feature activation | +6.86e-01 |
Pos logit contributions | |
eur | +0.862 |
Versus | +0.860 |
ULAR | +0.828 |
aido | +0.809 |
INESS | +0.808 |
Neg logit contributions | |
ricks | -1.074 |
idth | -1.058 |
abama | -1.020 |
--------------- | -0.992 |
raught | -0.976 |
Token | Continue |
Token ID | 10054 |
Feature activation | -2.96e-01 |
Pos logit contributions | |
Versus | +3.298 |
eur | +3.273 |
ULAR | +3.170 |
opa | +2.988 |
INESS | +2.978 |
Neg logit contributions | |
ricks | -4.404 |
idth | -4.190 |
abama | -4.082 |
enriched | -4.049 |
akespeare | -3.960 |
Token | Reading |
Token ID | 11725 |
Feature activation | -3.47e-01 |
Pos logit contributions | |
ricks | +1.450 |
idth | +1.322 |
abama | +1.283 |
--------------- | +1.261 |
enriched | +1.245 |
Neg logit contributions | |
Versus | -1.928 |
ULAR | -1.926 |
eur | -1.898 |
aido | -1.838 |
INESS | -1.830 |
Token | Below |
Token ID | 10383 |
Feature activation | -9.19e-01 |
Pos logit contributions | |
ricks | +2.334 |
idth | +2.181 |
abama | +2.128 |
--------------- | +2.105 |
enriched | +2.086 |
Neg logit contributions | |
ULAR | -1.630 |
Versus | -1.627 |
eur | -1.604 |
aido | -1.542 |
INESS | -1.539 |
Token | of |
Token ID | 286 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
eur | +1.084 |
ULAR | +1.053 |
Versus | +1.029 |
aido | +0.999 |
atively | +0.990 |
Neg logit contributions | |
ricks | -1.578 |
idth | -1.494 |
abama | -1.437 |
raught | -1.430 |
akespeare | -1.421 |
Token | the |
Token ID | 262 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
ULAR | +1.422 |
eur | +1.407 |
Versus | +1.404 |
atively | +1.386 |
opa | +1.360 |
Neg logit contributions | |
ricks | -1.636 |
--------------- | -1.482 |
idth | -1.480 |
abama | -1.466 |
xual | -1.459 |
Token | federal |
Token ID | 2717 |
Feature activation | -7.60e-01 |
Pos logit contributions | |
eur | +0.531 |
ULAR | +0.528 |
Versus | +0.525 |
opa | +0.512 |
INESS | +0.508 |
Neg logit contributions | |
ricks | -0.645 |
idth | -0.598 |
--------------- | -0.588 |
abama | -0.584 |
akespeare | -0.576 |
Token | government |
Token ID | 1230 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
ricks | +4.379 |
idth | +4.037 |
--------------- | +3.984 |
abama | +3.942 |
enriched | +3.840 |
Neg logit contributions | |
ULAR | -4.215 |
eur | -4.169 |
Versus | -4.142 |
aido | -4.070 |
INESS | -4.038 |
Token | , |
Token ID | 11 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
ricks | +0.718 |
idth | +0.672 |
--------------- | +0.659 |
abama | +0.653 |
akespeare | +0.639 |
Neg logit contributions | |
eur | -0.578 |
ULAR | -0.571 |
Versus | -0.565 |
aido | -0.554 |
INESS | -0.552 |
Token | even |
Token ID | 772 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
Versus | +2.592 |
eur | +2.574 |
ULAR | +2.512 |
atively | +2.488 |
aido | +2.486 |
Neg logit contributions | |
ricks | -2.953 |
abama | -2.771 |
idth | -2.760 |
xual | -2.677 |
akespeare | -2.625 |
Token | if |
Token ID | 611 |
Feature activation | +5.35e-01 |
Pos logit contributions | |
rudimentary | +7.581 |
moderately | +7.495 |
outside | +7.445 |
vaguely | +7.441 |
provisional | +7.436 |
Neg logit contributions | |
ricks | -16.099 |
idth | -15.616 |
abama | -15.097 |
xual | -15.041 |
raught | -14.919 |
Token | the |
Token ID | 262 |
Feature activation | +2.54e-01 |
Pos logit contributions | |
Versus | +2.644 |
atively | +2.636 |
eur | +2.635 |
ULAR | +2.611 |
interim | +2.535 |
Neg logit contributions | |
ricks | -3.316 |
abama | -3.057 |
--------------- | -3.031 |
idth | -3.020 |
xual | -2.994 |
Token | Obama |
Token ID | 2486 |
Feature activation | -7.44e-01 |
Pos logit contributions | |
eur | +1.274 |
Versus | +1.273 |
ULAR | +1.262 |
atively | +1.233 |
INESS | +1.227 |
Neg logit contributions | |
ricks | -1.572 |
idth | -1.481 |
--------------- | -1.444 |
abama | -1.430 |
xual | -1.417 |
Token | administration |
Token ID | 3662 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
ricks | +4.182 |
idth | +3.835 |
--------------- | +3.788 |
abama | +3.742 |
enriched | +3.655 |
Neg logit contributions | |
ULAR | -4.225 |
eur | -4.174 |
Versus | -4.148 |
aido | -4.088 |
INESS | -4.054 |
Token | is |
Token ID | 318 |
Feature activation | -3.52e-01 |
Pos logit contributions | |
ricks | +0.998 |
idth | +0.966 |
abama | +0.935 |
--------------- | +0.926 |
xual | +0.898 |
Neg logit contributions | |
eur | -0.729 |
Versus | -0.709 |
ULAR | -0.705 |
aido | -0.681 |
atively | -0.679 |
Token | plus |
Token ID | 5556 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
eur | +1.483 |
Versus | +1.462 |
ULAR | +1.421 |
INESS | +1.385 |
ré | +1.379 |
Neg logit contributions | |
ricks | -1.645 |
idth | -1.542 |
--------------- | -1.479 |
abama | -1.475 |
akespeare | -1.420 |
Token | bas |
Token ID | 1615 |
Feature activation | +4.67e-01 |
Pos logit contributions | |
eur | +0.872 |
Versus | +0.848 |
ULAR | +0.840 |
aido | +0.817 |
INESS | +0.815 |
Neg logit contributions | |
ricks | -1.019 |
idth | -0.958 |
abama | -0.941 |
--------------- | -0.917 |
akespeare | -0.904 |
Token | iques |
Token ID | 6368 |
Feature activation | +5.22e-01 |
Pos logit contributions | |
eur | +2.349 |
Versus | +2.246 |
ULAR | +2.226 |
INESS | +2.199 |
aido | +2.194 |
Neg logit contributions | |
ricks | -2.877 |
idth | -2.802 |
abama | -2.697 |
--------------- | -2.643 |
raught | -2.602 |
Token | . |
Token ID | 13 |
Feature activation | +6.53e-01 |
Pos logit contributions | |
eur | +2.625 |
Versus | +2.573 |
ULAR | +2.503 |
ré | +2.457 |
INESS | +2.403 |
Neg logit contributions | |
ricks | -3.278 |
idth | -3.116 |
abama | -2.983 |
--------------- | -2.923 |
akespeare | -2.897 |
Token | Il |
Token ID | 13778 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
eur | +3.185 |
ULAR | +3.182 |
Versus | +3.127 |
INESS | +2.983 |
ré | +2.851 |
Neg logit contributions | |
ricks | -4.261 |
idth | -4.011 |
abama | -3.834 |
enriched | -3.796 |
xual | -3.789 |
Token | app |
Token ID | 598 |
Feature activation | +2.42e+00 |
Pos logit contributions | |
Versus | +5.677 |
eur | +5.658 |
ré | +5.621 |
interim | +5.350 |
survival | +5.333 |
Neg logit contributions | |
ricks | -6.915 |
idth | -6.374 |
abama | -6.091 |
--------------- | -6.089 |
@#& | -5.986 |
Token | ara |
Token ID | 3301 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
eur | +13.547 |
ilot | +11.883 |
oser | +11.867 |
opa | +11.688 |
omew | +11.619 |
Neg logit contributions | |
�� | -9.530 |
enriched | -9.357 |
xual | -9.316 |
ricks | -9.298 |
--------------- | -9.289 |
Token | î |
Token ID | 34803 |
Feature activation | +6.48e-01 |
Pos logit contributions | |
eur | +4.832 |
Versus | +4.405 |
opa | +4.379 |
INESS | +4.277 |
ULAR | +4.218 |
Neg logit contributions | |
ricks | -7.385 |
abama | -6.921 |
idth | -6.757 |
xual | -6.713 |
--------------- | -6.643 |
Token | t |
Token ID | 83 |
Feature activation | +5.35e-01 |
Pos logit contributions | |
eur | +3.345 |
ULAR | +3.175 |
Versus | +3.173 |
atively | +3.024 |
ré | +2.994 |
Neg logit contributions | |
ricks | -3.868 |
idth | -3.744 |
abama | -3.636 |
--------------- | -3.595 |
xual | -3.503 |
Token | c |
Token ID | 269 |
Feature activation | +1.78e+00 |
Pos logit contributions | |
eur | +2.711 |
Versus | +2.607 |
ULAR | +2.560 |
ré | +2.490 |
atively | +2.454 |
Neg logit contributions | |
ricks | -3.318 |
idth | -3.205 |
abama | -3.114 |
--------------- | -3.041 |
xual | -2.993 |
Token | epend |
Token ID | 2690 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
eur | +7.819 |
opa | +7.013 |
ULAR | +6.797 |
aido | +6.755 |
here | +6.578 |
Neg logit contributions | |
ricks | -10.205 |
enriched | -10.144 |
idth | -9.841 |
@#& | -9.735 |
--------------- | -9.709 |
Token | pressure |
Token ID | 3833 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
eur | +0.193 |
ULAR | +0.189 |
Versus | +0.188 |
atively | +0.182 |
aido | +0.180 |
Neg logit contributions | |
ricks | -0.241 |
idth | -0.236 |
abama | -0.226 |
--------------- | -0.220 |
akespeare | -0.219 |
Token | on |
Token ID | 319 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
eur | +1.975 |
Versus | +1.948 |
ULAR | +1.932 |
aido | +1.864 |
atively | +1.841 |
Neg logit contributions | |
ricks | -2.155 |
idth | -2.068 |
abama | -1.992 |
--------------- | -1.942 |
akespeare | -1.918 |
Token | his |
Token ID | 465 |
Feature activation | +4.72e-01 |
Pos logit contributions | |
Versus | +0.823 |
ULAR | +0.818 |
eur | +0.807 |
atively | +0.785 |
aido | +0.783 |
Neg logit contributions | |
ricks | -0.865 |
idth | -0.811 |
abama | -0.785 |
--------------- | -0.780 |
akespeare | -0.774 |
Token | job |
Token ID | 1693 |
Feature activation | +3.92e-01 |
Pos logit contributions | |
ULAR | +2.008 |
Versus | +1.999 |
survival | +1.965 |
ré | +1.948 |
rudimentary | +1.930 |
Neg logit contributions | |
ricks | -3.214 |
idth | -3.124 |
abama | -3.025 |
akespeare | -3.003 |
xual | -2.967 |
Token | , |
Token ID | 11 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
eur | +1.919 |
Versus | +1.881 |
INESS | +1.867 |
ULAR | +1.861 |
survival | +1.849 |
Neg logit contributions | |
ricks | -2.489 |
idth | -2.318 |
akespeare | -2.277 |
abama | -2.257 |
--------------- | -2.239 |
Token | even |
Token ID | 772 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
Versus | +0.526 |
ULAR | +0.511 |
eur | +0.506 |
aido | +0.494 |
atively | +0.487 |
Neg logit contributions | |
ricks | -0.617 |
idth | -0.592 |
abama | -0.569 |
--------------- | -0.557 |
akespeare | -0.554 |
Token | though |
Token ID | 996 |
Feature activation | +5.83e-01 |
Pos logit contributions | |
moderately | +8.621 |
Versus | +8.483 |
mildly | +8.279 |
interim | +8.237 |
internally | +8.218 |
Neg logit contributions | |
idth | -14.544 |
ricks | -14.282 |
abama | -13.319 |
akespeare | -13.215 |
raught | -13.196 |
Token | he |
Token ID | 339 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
Versus | +3.000 |
eur | +2.943 |
interim | +2.922 |
ULAR | +2.918 |
atively | +2.865 |
Neg logit contributions | |
ricks | -3.461 |
idth | -3.289 |
abama | -3.214 |
akespeare | -3.155 |
--------------- | -3.147 |
Token | was |
Token ID | 373 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
ricks | +1.103 |
idth | +1.058 |
abama | +1.021 |
--------------- | +1.020 |
xual | +0.986 |
Neg logit contributions | |
eur | -0.810 |
Versus | -0.797 |
ULAR | -0.791 |
aido | -0.772 |
atively | -0.762 |
Token | pretty |
Token ID | 2495 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
Versus | +1.466 |
ULAR | +1.464 |
eur | +1.454 |
interim | +1.439 |
atively | +1.405 |
Neg logit contributions | |
ricks | -2.110 |
idth | -2.084 |
abama | -1.971 |
akespeare | -1.947 |
xual | -1.929 |
Token | much |
Token ID | 881 |
Feature activation | +7.09e-01 |
Pos logit contributions | |
eur | +1.777 |
Versus | +1.770 |
ULAR | +1.764 |
rudimentary | +1.754 |
interim | +1.722 |
Neg logit contributions | |
ricks | -2.439 |
idth | -2.399 |
abama | -2.278 |
akespeare | -2.266 |
xual | -2.233 |
Token | Giant |
Token ID | 17384 |
Feature activation | +6.28e-01 |
Pos logit contributions | |
ricks | +1.336 |
idth | +1.242 |
--------------- | +1.218 |
abama | +1.213 |
enriched | +1.186 |
Neg logit contributions | |
Versus | -1.193 |
ULAR | -1.186 |
eur | -1.180 |
aido | -1.144 |
INESS | -1.122 |
Token | Cherry |
Token ID | 23165 |
Feature activation | -6.13e-01 |
Pos logit contributions | |
Versus | +2.724 |
ULAR | +2.653 |
eur | +2.612 |
opa | +2.513 |
aido | +2.510 |
Neg logit contributions | |
ricks | -4.256 |
idth | -3.998 |
--------------- | -3.967 |
abama | -3.928 |
enriched | -3.890 |
Token | ) |
Token ID | 8 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
ricks | +3.818 |
idth | +3.545 |
--------------- | +3.507 |
abama | +3.469 |
enriched | +3.387 |
Neg logit contributions | |
ULAR | -3.119 |
eur | -3.090 |
Versus | -3.074 |
aido | -3.009 |
INESS | -2.980 |
Token | was |
Token ID | 373 |
Feature activation | +7.26e-01 |
Pos logit contributions | |
Versus | +1.638 |
eur | +1.614 |
ULAR | +1.569 |
aido | +1.539 |
atively | +1.521 |
Neg logit contributions | |
ricks | -2.180 |
idth | -2.130 |
abama | -2.069 |
--------------- | -2.008 |
xual | -1.963 |
Token | only |
Token ID | 691 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
Versus | +3.071 |
atively | +3.001 |
eur | +2.989 |
rudimentary | +2.979 |
moderately | +2.963 |
Neg logit contributions | |
idth | -4.829 |
ricks | -4.811 |
abama | -4.625 |
xual | -4.503 |
--------------- | -4.440 |
Token | a |
Token ID | 257 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
moderately | +7.520 |
rudimentary | +7.109 |
survival | +7.006 |
mildly | +6.938 |
vaguely | +6.895 |
Neg logit contributions | |
idth | -10.363 |
ricks | -9.972 |
abama | -9.641 |
xual | -9.580 |
raught | -9.393 |
Token | moderate |
Token ID | 10768 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
rudimentary | +10.930 |
moderately | +10.752 |
survival | +10.722 |
provisional | +10.321 |
interim | +10.184 |
Neg logit contributions | |
ricks | -12.755 |
idth | -12.440 |
xual | -12.314 |
nces | -12.278 |
abama | -11.906 |
Token | success |
Token ID | 1943 |
Feature activation | +4.90e-01 |
Pos logit contributions | |
survival | +4.431 |
eur | +4.220 |
interim | +4.212 |
Versus | +4.193 |
rudimentary | +4.135 |
Neg logit contributions | |
ricks | -6.925 |
idth | -6.557 |
--------------- | -6.248 |
abama | -6.219 |
xual | -6.158 |
Token | . |
Token ID | 13 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
eur | +2.230 |
Versus | +2.227 |
ULAR | +2.162 |
atively | +2.139 |
INESS | +2.128 |
Neg logit contributions | |
ricks | -3.189 |
idth | -3.109 |
abama | -2.980 |
--------------- | -2.946 |
akespeare | -2.876 |
Token | His |
Token ID | 2399 |
Feature activation | -6.58e-02 |
Pos logit contributions | |
Versus | +1.935 |
ULAR | +1.846 |
eur | +1.814 |
INESS | +1.704 |
atively | +1.700 |
Neg logit contributions | |
ricks | -2.443 |
idth | -2.359 |
abama | -2.252 |
xual | -2.249 |
enriched | -2.214 |
Token | least |
Token ID | 1551 |
Feature activation | +3.38e-01 |
Pos logit contributions | |
ricks | +0.450 |
idth | +0.423 |
--------------- | +0.413 |
abama | +0.412 |
xual | +0.405 |
Neg logit contributions | |
ULAR | -0.295 |
Versus | -0.294 |
eur | -0.291 |
aido | -0.281 |
survival | -0.276 |
Token | a |
Token ID | 257 |
Feature activation | +7.43e-01 |
Pos logit contributions | |
eur | +2.694 |
Versus | +2.675 |
ULAR | +2.640 |
atively | +2.612 |
survival | +2.581 |
Neg logit contributions | |
ricks | -2.901 |
idth | -2.785 |
abama | -2.709 |
--------------- | -2.695 |
xual | -2.604 |
Token | very |
Token ID | 845 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
Versus | +3.338 |
ULAR | +3.293 |
eur | +3.229 |
survival | +3.221 |
rudimentary | +3.158 |
Neg logit contributions | |
ricks | -4.863 |
idth | -4.693 |
abama | -4.492 |
--------------- | -4.438 |
akespeare | -4.353 |
Token | vulnerable |
Token ID | 8826 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
ULAR | +0.889 |
eur | +0.883 |
Versus | +0.864 |
rudimentary | +0.850 |
survival | +0.838 |
Neg logit contributions | |
ricks | -1.131 |
idth | -1.087 |
--------------- | -1.025 |
abama | -1.024 |
akespeare | -0.996 |
Token | way |
Token ID | 835 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
Versus | +1.484 |
eur | +1.477 |
ULAR | +1.466 |
atively | +1.402 |
survival | +1.393 |
Neg logit contributions | |
ricks | -2.493 |
idth | -2.346 |
--------------- | -2.281 |
abama | -2.277 |
akespeare | -2.217 |
Token | , |
Token ID | 11 |
Feature activation | +3.05e-01 |
Pos logit contributions | |
ricks | +1.055 |
idth | +0.979 |
abama | +0.968 |
--------------- | +0.957 |
akespeare | +0.932 |
Neg logit contributions | |
eur | -0.877 |
Versus | -0.872 |
ULAR | -0.871 |
aido | -0.841 |
INESS | -0.837 |
Token | even |
Token ID | 772 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
Versus | +1.650 |
eur | +1.615 |
ULAR | +1.585 |
aido | +1.554 |
atively | +1.537 |
Neg logit contributions | |
ricks | -1.782 |
idth | -1.694 |
abama | -1.655 |
--------------- | -1.622 |
akespeare | -1.594 |
Token | to |
Token ID | 284 |
Feature activation | +7.62e-01 |
Pos logit contributions | |
Versus | +8.574 |
moderately | +8.214 |
vaguely | +8.213 |
survival | +8.142 |
mildly | +8.128 |
Neg logit contributions | |
ricks | -14.371 |
idth | -13.865 |
abama | -13.154 |
akespeare | -12.662 |
uliffe | -12.610 |
Token | herself |
Token ID | 5223 |
Feature activation | +9.46e-01 |
Pos logit contributions | |
Versus | +3.933 |
ULAR | +3.792 |
survival | +3.772 |
eur | +3.754 |
atively | +3.749 |
Neg logit contributions | |
ricks | -4.504 |
idth | -4.200 |
abama | -4.158 |
--------------- | -3.989 |
uliffe | -3.928 |
Token | , |
Token ID | 11 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
eur | +4.006 |
Versus | +3.981 |
atively | +3.885 |
ULAR | +3.809 |
aido | +3.740 |
Neg logit contributions | |
ricks | -6.379 |
idth | -5.962 |
abama | -5.957 |
--------------- | -5.794 |
akespeare | -5.682 |
Token | that |
Token ID | 326 |
Feature activation | -2.55e-01 |
Pos logit contributions | |
Versus | +0.063 |
eur | +0.062 |
ULAR | +0.061 |
aido | +0.059 |
atively | +0.059 |
Neg logit contributions | |
ricks | -0.072 |
idth | -0.067 |
abama | -0.066 |
--------------- | -0.065 |
akespeare | -0.064 |
Token | she |
Token ID | 673 |
Feature activation | -3.80e-01 |
Pos logit contributions | |
ricks | +1.270 |
idth | +1.155 |
abama | +1.127 |
--------------- | +1.124 |
akespeare | +1.087 |
Neg logit contributions | |
eur | -1.630 |
ULAR | -1.622 |
Versus | -1.619 |
aido | -1.571 |
INESS | -1.569 |
Token | to |
Token ID | 284 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
eur | +2.461 |
Versus | +2.456 |
ULAR | +2.439 |
aido | +2.393 |
atively | +2.383 |
Neg logit contributions | |
ricks | -2.250 |
idth | -2.073 |
abama | -2.048 |
--------------- | -1.999 |
akespeare | -1.953 |
Token | just |
Token ID | 655 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
Versus | +1.205 |
eur | +1.198 |
ULAR | +1.176 |
aido | +1.167 |
survival | +1.134 |
Neg logit contributions | |
ricks | -1.900 |
idth | -1.832 |
abama | -1.805 |
--------------- | -1.727 |
xual | -1.716 |
Token | postpone |
Token ID | 47328 |
Feature activation | +8.40e-01 |
Pos logit contributions | |
Versus | +4.511 |
survival | +4.475 |
aido | +4.418 |
eur | +4.403 |
ULAR | +4.395 |
Neg logit contributions | |
ricks | -7.496 |
idth | -7.403 |
abama | -7.230 |
uliffe | -6.969 |
raught | -6.965 |
Token | a |
Token ID | 257 |
Feature activation | +6.50e-01 |
Pos logit contributions | |
survival | +3.941 |
eur | +3.923 |
Versus | +3.884 |
atively | +3.788 |
ULAR | +3.741 |
Neg logit contributions | |
ricks | -5.353 |
idth | -5.014 |
abama | -4.938 |
akespeare | -4.817 |
uliffe | -4.797 |
Token | situation |
Token ID | 3074 |
Feature activation | +5.92e-01 |
Pos logit contributions | |
Versus | +2.981 |
survival | +2.958 |
eur | +2.915 |
ULAR | +2.855 |
aido | +2.792 |
Neg logit contributions | |
ricks | -4.183 |
abama | -3.946 |
idth | -3.933 |
xual | -3.870 |
akespeare | -3.792 |
Token | even |
Token ID | 772 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
eur | +3.009 |
Versus | +2.913 |
atively | +2.836 |
INESS | +2.826 |
ULAR | +2.814 |
Neg logit contributions | |
ricks | -3.674 |
idth | -3.450 |
abama | -3.377 |
akespeare | -3.242 |
raught | -3.229 |
Token | if |
Token ID | 611 |
Feature activation | +6.06e-01 |
Pos logit contributions | |
moderately | +7.446 |
Versus | +7.231 |
vaguely | +7.224 |
mildly | +7.175 |
eur | +7.127 |
Neg logit contributions | |
ricks | -15.296 |
idth | -15.117 |
raught | -14.557 |
xual | -14.497 |
abama | -14.409 |
Token | I |
Token ID | 314 |
Feature activation | +7.67e-01 |
Pos logit contributions | |
eur | +2.717 |
Versus | +2.681 |
survival | +2.615 |
ULAR | +2.604 |
atively | +2.598 |
Neg logit contributions | |
ricks | -4.032 |
abama | -3.757 |
idth | -3.721 |
akespeare | -3.623 |
--------------- | -3.599 |
Token | � |
Token ID | 447 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
eur | +2.801 |
aido | +2.772 |
Versus | +2.715 |
ULAR | +2.629 |
opa | +2.616 |
Neg logit contributions | |
ricks | -5.570 |
idth | -5.378 |
abama | -5.345 |
xual | -5.185 |
akespeare | -5.143 |
Token | � |
Token ID | 247 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
ULAR | +0.960 |
eur | +0.955 |
atively | +0.914 |
Versus | +0.910 |
opa | +0.902 |
Neg logit contributions | |
ricks | -1.095 |
idth | -1.033 |
abama | -0.985 |
enriched | -0.979 |
--------------- | -0.978 |
Token | m |
Token ID | 76 |
Feature activation | +9.62e-01 |
Pos logit contributions | |
eur | +1.967 |
atively | +1.894 |
Versus | +1.878 |
ULAR | +1.862 |
aido | +1.857 |
Neg logit contributions | |
ricks | -1.552 |
idth | -1.469 |
abama | -1.412 |
--------------- | -1.398 |
enriched | -1.379 |
Token | heard |
Token ID | 2982 |
Feature activation | +9.48e-01 |
Pos logit contributions | |
eur | +2.890 |
Versus | +2.844 |
moderately | +2.686 |
vaguely | +2.683 |
atively | +2.679 |
Neg logit contributions | |
ricks | -6.726 |
idth | -6.684 |
xual | -6.520 |
--------------- | -6.434 |
abama | -6.389 |
Token | of |
Token ID | 286 |
Feature activation | +7.94e-01 |
Pos logit contributions | |
eur | +3.696 |
ULAR | +3.533 |
Versus | +3.525 |
atively | +3.414 |
aido | +3.402 |
Neg logit contributions | |
idth | -6.661 |
ricks | -6.657 |
raught | -6.432 |
xual | -6.325 |
abama | -6.309 |
Token | the |
Token ID | 262 |
Feature activation | +6.49e-01 |
Pos logit contributions | |
eur | +3.866 |
Versus | +3.832 |
ULAR | +3.767 |
atively | +3.693 |
aido | +3.601 |
Neg logit contributions | |
ricks | -4.864 |
idth | -4.716 |
xual | -4.493 |
abama | -4.477 |
--------------- | -4.471 |
Token | Wisconsin |
Token ID | 9279 |
Feature activation | -7.88e-01 |
Pos logit contributions | |
ULAR | +3.005 |
eur | +2.998 |
Versus | +2.960 |
interim | +2.934 |
survival | +2.897 |
Neg logit contributions | |
ricks | -4.160 |
idth | -4.011 |
abama | -3.834 |
xual | -3.824 |
--------------- | -3.789 |
Token | Republican |
Token ID | 3415 |
Feature activation | -7.54e-02 |
Pos logit contributions | |
ricks | +5.381 |
idth | +5.018 |
--------------- | +4.973 |
abama | +4.921 |
enriched | +4.829 |
Neg logit contributions | |
ULAR | -3.515 |
eur | -3.448 |
Versus | -3.422 |
aido | -3.371 |
INESS | -3.335 |
Token | even |
Token ID | 772 |
Feature activation | +2.36e+00 |
Pos logit contributions | |
ricks | +0.491 |
idth | +0.473 |
--------------- | +0.455 |
abama | +0.452 |
akespeare | +0.442 |
Neg logit contributions | |
eur | -0.359 |
ULAR | -0.357 |
Versus | -0.356 |
aido | -0.347 |
INESS | -0.341 |
Token | though |
Token ID | 996 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
vaguely | +6.806 |
moderately | +6.744 |
mildly | +6.289 |
rudimentary | +6.167 |
outside | +6.013 |
Neg logit contributions | |
idth | -16.709 |
ricks | -16.187 |
raught | -15.815 |
xual | -15.322 |
abama | -15.182 |
Token | Democrats |
Token ID | 4956 |
Feature activation | +4.23e-02 |
Pos logit contributions | |
Versus | +1.477 |
eur | +1.461 |
ULAR | +1.442 |
atively | +1.418 |
aido | +1.405 |
Neg logit contributions | |
ricks | -1.680 |
idth | -1.584 |
abama | -1.551 |
--------------- | -1.538 |
xual | -1.498 |
Token | had |
Token ID | 550 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
Versus | +0.201 |
eur | +0.199 |
ULAR | +0.198 |
aido | +0.194 |
INESS | +0.187 |
Neg logit contributions | |
ricks | -0.281 |
idth | -0.267 |
abama | -0.257 |
--------------- | -0.256 |
xual | -0.252 |
Token | been |
Token ID | 587 |
Feature activation | -5.14e-01 |
Pos logit contributions | |
eur | +0.725 |
Versus | +0.715 |
ULAR | +0.711 |
atively | +0.683 |
aido | +0.681 |
Neg logit contributions | |
ricks | -1.002 |
idth | -0.971 |
abama | -0.933 |
--------------- | -0.927 |
xual | -0.914 |
Token | running |
Token ID | 2491 |
Feature activation | +4.88e-01 |
Pos logit contributions | |
ricks | +3.395 |
idth | +3.191 |
--------------- | +3.121 |
abama | +3.108 |
xual | +3.030 |
Neg logit contributions | |
ULAR | -2.449 |
eur | -2.420 |
Versus | -2.404 |
aido | -2.346 |
INESS | -2.321 |
Token | Once |
Token ID | 4874 |
Feature activation | +6.64e-01 |
Pos logit contributions | |
Versus | +2.187 |
ULAR | +2.099 |
eur | +2.087 |
opa | +1.953 |
aido | +1.934 |
Neg logit contributions | |
ricks | -2.595 |
idth | -2.500 |
abama | -2.430 |
xual | -2.404 |
akespeare | -2.369 |
Token | Node |
Token ID | 19081 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
Versus | +2.749 |
ULAR | +2.730 |
eur | +2.685 |
opa | +2.591 |
atively | +2.591 |
Neg logit contributions | |
ricks | -4.615 |
abama | -4.424 |
idth | -4.404 |
xual | -4.337 |
akespeare | -4.176 |
Token | . |
Token ID | 13 |
Feature activation | +7.65e-01 |
Pos logit contributions | |
ULAR | +4.537 |
Versus | +4.361 |
eur | +4.315 |
atively | +4.279 |
ilot | +4.085 |
Neg logit contributions | |
ricks | -7.700 |
idth | -7.560 |
abama | -7.353 |
xual | -7.348 |
raught | -7.189 |
Token | js |
Token ID | 8457 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
eur | +2.907 |
ULAR | +2.787 |
opa | +2.758 |
Versus | +2.741 |
atively | +2.716 |
Neg logit contributions | |
ricks | -5.429 |
idth | -5.327 |
raught | -5.246 |
enriched | -5.131 |
xual | -5.125 |
Token | and |
Token ID | 290 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
Versus | +5.840 |
ULAR | +5.607 |
eur | +5.575 |
interim | +5.345 |
atively | +5.336 |
Neg logit contributions | |
ricks | -8.509 |
abama | -8.490 |
idth | -8.240 |
xual | -8.181 |
raught | -7.803 |
Token | npm |
Token ID | 30599 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
ULAR | +1.724 |
Versus | +1.706 |
eur | +1.696 |
aido | +1.624 |
atively | +1.610 |
Neg logit contributions | |
ricks | -2.029 |
idth | -1.919 |
abama | -1.891 |
xual | -1.849 |
--------------- | -1.847 |
Token | is |
Token ID | 318 |
Feature activation | +7.77e-01 |
Pos logit contributions | |
ULAR | +7.242 |
Versus | +7.148 |
interim | +6.805 |
atively | +6.727 |
eur | +6.611 |
Neg logit contributions | |
abama | -14.888 |
xual | -14.802 |
idth | -14.631 |
ricks | -14.385 |
�� | -13.763 |
Token | installed |
Token ID | 6589 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
Versus | +1.843 |
ULAR | +1.770 |
eur | +1.742 |
atively | +1.693 |
moderately | +1.674 |
Neg logit contributions | |
idth | -6.667 |
ricks | -6.625 |
abama | -6.444 |
xual | -6.319 |
akespeare | -6.170 |
Token | , |
Token ID | 11 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
ricks | +1.786 |
idth | +1.670 |
abama | +1.636 |
--------------- | +1.628 |
enriched | +1.581 |
Neg logit contributions | |
ULAR | -1.536 |
eur | -1.519 |
Versus | -1.514 |
aido | -1.473 |
INESS | -1.467 |
Token | you |
Token ID | 345 |
Feature activation | -9.57e-03 |
Pos logit contributions | |
Versus | +0.475 |
ULAR | +0.472 |
eur | +0.463 |
INESS | +0.444 |
aido | +0.442 |
Neg logit contributions | |
ricks | -0.739 |
idth | -0.711 |
abama | -0.708 |
--------------- | -0.681 |
xual | -0.680 |
Token | can |
Token ID | 460 |
Feature activation | -2.17e-02 |
Pos logit contributions | |
ricks | +0.071 |
idth | +0.069 |
abama | +0.068 |
xual | +0.066 |
--------------- | +0.065 |
Neg logit contributions | |
Versus | -0.037 |
ULAR | -0.037 |
eur | -0.036 |
aido | -0.034 |
atively | -0.034 |
Token | 69 |
Token ID | 3388 |
Feature activation | +5.26e-01 |
Pos logit contributions | |
ULAR | +3.258 |
eur | +3.237 |
Versus | +3.183 |
INESS | +3.109 |
opa | +3.081 |
Neg logit contributions | |
ricks | -3.850 |
--------------- | -3.480 |
idth | -3.468 |
abama | -3.456 |
xual | -3.346 |
Token | Bra |
Token ID | 9718 |
Feature activation | -8.51e-01 |
Pos logit contributions | |
Versus | +2.217 |
eur | +2.120 |
ULAR | +2.117 |
atively | +1.996 |
ilot | +1.965 |
Neg logit contributions | |
ricks | -3.729 |
idth | -3.486 |
--------------- | -3.405 |
abama | -3.403 |
xual | -3.332 |
Token | ille |
Token ID | 8270 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
ricks | +3.883 |
idth | +3.442 |
--------------- | +3.427 |
abama | +3.375 |
dy | +3.305 |
Neg logit contributions | |
ULAR | -5.703 |
Versus | -5.605 |
eur | -5.561 |
INESS | -5.507 |
aido | -5.478 |
Token | was |
Token ID | 373 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
ricks | +1.269 |
idth | +1.191 |
abama | +1.159 |
--------------- | +1.154 |
akespeare | +1.120 |
Neg logit contributions | |
Versus | -1.027 |
ULAR | -1.014 |
eur | -1.014 |
aido | -0.970 |
atively | -0.962 |
Token | only |
Token ID | 691 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
Versus | +1.640 |
ULAR | +1.599 |
eur | +1.589 |
atively | +1.567 |
rudimentary | +1.566 |
Neg logit contributions | |
ricks | -2.275 |
idth | -2.200 |
abama | -2.122 |
xual | -2.086 |
--------------- | -2.071 |
Token | a |
Token ID | 257 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
moderately | +7.177 |
rudimentary | +6.823 |
interim | +6.743 |
Versus | +6.609 |
mildly | +6.561 |
Neg logit contributions | |
ricks | -10.266 |
idth | -10.201 |
xual | -9.612 |
abama | -9.571 |
akespeare | -9.489 |
Token | partial |
Token ID | 13027 |
Feature activation | +3.03e-01 |
Pos logit contributions | |
rudimentary | +10.454 |
moderately | +10.061 |
provisional | +9.840 |
interim | +9.824 |
survival | +9.735 |
Neg logit contributions | |
ricks | -13.075 |
xual | -12.878 |
idth | -12.649 |
nces | -12.302 |
akespeare | -12.274 |
Token | success |
Token ID | 1943 |
Feature activation | +8.80e-02 |
Pos logit contributions | |
eur | +1.356 |
Versus | +1.333 |
survival | +1.332 |
ULAR | +1.328 |
interim | +1.295 |
Neg logit contributions | |
ricks | -2.078 |
idth | -1.978 |
--------------- | -1.906 |
xual | -1.902 |
abama | -1.893 |
Token | . |
Token ID | 13 |
Feature activation | +3.22e-02 |
Pos logit contributions | |
Versus | +0.422 |
ULAR | +0.418 |
eur | +0.418 |
ilot | +0.401 |
INESS | +0.401 |
Neg logit contributions | |
ricks | -0.573 |
idth | -0.541 |
--------------- | -0.523 |
abama | -0.522 |
akespeare | -0.516 |
Token | Deep |
Token ID | 10766 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
Versus | +0.170 |
ULAR | +0.169 |
eur | +0.163 |
INESS | +0.156 |
opa | +0.153 |
Neg logit contributions | |
ricks | -0.203 |
idth | -0.191 |
abama | -0.183 |
xual | -0.182 |
akespeare | -0.182 |
Token | Space |
Token ID | 4687 |
Feature activation | +3.90e-02 |
Pos logit contributions | |
ricks | +1.017 |
idth | +0.926 |
--------------- | +0.915 |
abama | +0.904 |
enriched | +0.881 |
Neg logit contributions | |
ULAR | -1.261 |
eur | -1.249 |
Versus | -1.237 |
aido | -1.229 |
INESS | -1.220 |
Token | trade |
Token ID | 3292 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
ricks | +0.379 |
idth | +0.359 |
abama | +0.350 |
--------------- | +0.344 |
xual | +0.342 |
Neg logit contributions | |
ULAR | -0.278 |
eur | -0.275 |
Versus | -0.273 |
aido | -0.268 |
atively | -0.255 |
Token | for |
Token ID | 329 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
ULAR | +4.848 |
eur | +4.795 |
aido | +4.731 |
survival | +4.671 |
interim | +4.667 |
Neg logit contributions | |
ricks | -6.794 |
abama | -6.635 |
akespeare | -6.359 |
xual | -6.343 |
idth | -6.320 |
Token | a |
Token ID | 257 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
ULAR | +1.215 |
eur | +1.201 |
Versus | +1.175 |
aido | +1.171 |
survival | +1.145 |
Neg logit contributions | |
ricks | -1.622 |
abama | -1.527 |
idth | -1.512 |
xual | -1.508 |
akespeare | -1.485 |
Token | closer |
Token ID | 5699 |
Feature activation | -2.29e-01 |
Pos logit contributions | |
ULAR | +1.369 |
eur | +1.333 |
aido | +1.310 |
Versus | +1.301 |
survival | +1.288 |
Neg logit contributions | |
ricks | -2.022 |
abama | -1.931 |
idth | -1.910 |
xual | -1.860 |
akespeare | -1.844 |
Token | , |
Token ID | 11 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
ricks | +1.442 |
idth | +1.342 |
--------------- | +1.318 |
abama | +1.316 |
akespeare | +1.286 |
Neg logit contributions | |
eur | -1.154 |
ULAR | -1.148 |
Versus | -1.134 |
aido | -1.110 |
atively | -1.091 |
Token | even |
Token ID | 772 |
Feature activation | +2.34e+00 |
Pos logit contributions | |
ricks | +1.571 |
idth | +1.461 |
abama | +1.422 |
--------------- | +1.409 |
xual | +1.382 |
Neg logit contributions | |
ULAR | -1.532 |
Versus | -1.531 |
eur | -1.516 |
aido | -1.498 |
INESS | -1.460 |
Token | if |
Token ID | 611 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
moderately | +7.481 |
mildly | +7.180 |
Versus | +7.145 |
interim | +7.100 |
rudimentary | +7.066 |
Neg logit contributions | |
idth | -15.081 |
ricks | -15.062 |
xual | -14.678 |
abama | -14.579 |
akespeare | -14.049 |
Token | that |
Token ID | 326 |
Feature activation | +5.30e-01 |
Pos logit contributions | |
eur | +1.363 |
ULAR | +1.357 |
Versus | +1.348 |
aido | +1.319 |
atively | +1.301 |
Neg logit contributions | |
ricks | -1.467 |
abama | -1.361 |
idth | -1.353 |
xual | -1.318 |
--------------- | -1.316 |
Token | closer |
Token ID | 5699 |
Feature activation | +4.01e-02 |
Pos logit contributions | |
eur | +2.536 |
ULAR | +2.473 |
aido | +2.460 |
Versus | +2.412 |
survival | +2.357 |
Neg logit contributions | |
ricks | -3.446 |
idth | -3.260 |
abama | -3.186 |
xual | -3.108 |
akespeare | -3.098 |
Token | was |
Token ID | 373 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
eur | +0.201 |
ULAR | +0.200 |
Versus | +0.197 |
aido | +0.190 |
INESS | +0.190 |
Neg logit contributions | |
ricks | -0.255 |
idth | -0.236 |
abama | -0.234 |
--------------- | -0.232 |
akespeare | -0.227 |
Token | Craig |
Token ID | 13854 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
eur | +1.225 |
ULAR | +1.220 |
Versus | +1.202 |
aido | +1.187 |
atively | +1.160 |
Neg logit contributions | |
ricks | -1.829 |
idth | -1.755 |
abama | -1.720 |
xual | -1.687 |
akespeare | -1.677 |
Token | ' |
Token ID | 6 |
Feature activation | +6.85e-01 |
Pos logit contributions | |
eur | +3.519 |
Versus | +3.168 |
INESS | +3.084 |
ULAR | +3.072 |
opa | +3.040 |
Neg logit contributions | |
ricks | -5.434 |
idth | -5.005 |
xual | -4.971 |
--------------- | -4.951 |
enriched | -4.937 |
Token | O |
Token ID | 46 |
Feature activation | -5.10e-01 |
Pos logit contributions | |
eur | +3.482 |
aido | +3.225 |
ULAR | +3.195 |
opa | +3.166 |
ilot | +3.125 |
Neg logit contributions | |
ricks | -4.278 |
idth | -3.996 |
xual | -3.965 |
enriched | -3.844 |
--------------- | -3.835 |
Token | mb |
Token ID | 2022 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
ricks | +2.974 |
idth | +2.744 |
--------------- | +2.707 |
abama | +2.679 |
enriched | +2.614 |
Neg logit contributions | |
ULAR | -2.791 |
eur | -2.762 |
Versus | -2.741 |
aido | -2.697 |
INESS | -2.676 |
Token | re |
Token ID | 260 |
Feature activation | -4.48e-01 |
Pos logit contributions | |
eur | +1.446 |
ULAR | +1.412 |
Versus | +1.379 |
aido | +1.364 |
opa | +1.360 |
Neg logit contributions | |
ricks | -1.396 |
idth | -1.327 |
--------------- | -1.324 |
enriched | -1.281 |
abama | -1.259 |
Token | . |
Token ID | 13 |
Feature activation | +6.15e-01 |
Pos logit contributions | |
ricks | +2.788 |
idth | +2.589 |
--------------- | +2.548 |
abama | +2.529 |
enriched | +2.462 |
Neg logit contributions | |
ULAR | -2.283 |
eur | -2.270 |
Versus | -2.252 |
aido | -2.203 |
INESS | -2.183 |
Token | N |
Token ID | 45 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
ULAR | +2.954 |
eur | +2.950 |
Versus | +2.947 |
INESS | +2.759 |
ré | +2.676 |
Neg logit contributions | |
ricks | -4.044 |
idth | -3.799 |
abama | -3.676 |
xual | -3.586 |
enriched | -3.584 |
Token | os |
Token ID | 418 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
eur | +9.471 |
atively | +8.316 |
opa | +8.161 |
omew | +8.145 |
aido | +7.900 |
Neg logit contributions | |
ricks | -13.748 |
idth | -13.153 |
xual | -13.070 |
�� | -12.956 |
��� | -12.653 |
Token | relations |
Token ID | 2316 |
Feature activation | +6.46e-01 |
Pos logit contributions | |
eur | +6.357 |
ré | +6.246 |
Versus | +6.131 |
opa | +5.912 |
INESS | +5.866 |
Neg logit contributions | |
ricks | -6.816 |
idth | -6.547 |
abama | -6.320 |
--------------- | -6.067 |
akespeare | -5.915 |
Token | diplomat |
Token ID | 28278 |
Feature activation | +6.91e-01 |
Pos logit contributions | |
eur | +3.344 |
Versus | +3.176 |
ULAR | +3.097 |
ré | +3.072 |
aido | +2.960 |
Neg logit contributions | |
ricks | -4.027 |
idth | -3.827 |
abama | -3.671 |
--------------- | -3.595 |
raught | -3.535 |
Token | iques |
Token ID | 6368 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
eur | +3.311 |
ULAR | +3.038 |
Versus | +3.009 |
aido | +2.937 |
atively | +2.927 |
Neg logit contributions | |
ricks | -4.380 |
idth | -4.320 |
abama | -4.210 |
--------------- | -4.194 |
xual | -4.153 |
Token | a |
Token ID | 257 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
eur | +1.578 |
Versus | +1.552 |
ULAR | +1.518 |
ré | +1.454 |
INESS | +1.442 |
Neg logit contributions | |
ricks | -2.055 |
idth | -1.935 |
abama | -1.874 |
--------------- | -1.829 |
akespeare | -1.811 |
Token | lured |
Token ID | 41546 |
Feature activation | -4.13e-01 |
Pos logit contributions | |
ULAR | +0.828 |
Versus | +0.820 |
eur | +0.815 |
aido | +0.785 |
atively | +0.785 |
Neg logit contributions | |
ricks | -1.293 |
idth | -1.232 |
--------------- | -1.205 |
akespeare | -1.196 |
abama | -1.194 |
Token | out |
Token ID | 503 |
Feature activation | -7.97e-01 |
Pos logit contributions | |
ricks | +2.471 |
idth | +2.300 |
--------------- | +2.249 |
abama | +2.230 |
akespeare | +2.180 |
Neg logit contributions | |
ULAR | -2.226 |
eur | -2.213 |
Versus | -2.187 |
aido | -2.156 |
INESS | -2.130 |
Token | of |
Token ID | 286 |
Feature activation | -2.20e-01 |
Pos logit contributions | |
ricks | +4.606 |
idth | +4.225 |
--------------- | +4.184 |
abama | +4.132 |
enriched | +4.056 |
Neg logit contributions | |
ULAR | -4.375 |
eur | -4.313 |
Versus | -4.287 |
aido | -4.211 |
INESS | -4.185 |
Token | province |
Token ID | 8473 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
ricks | +1.356 |
idth | +1.251 |
--------------- | +1.238 |
abama | +1.222 |
akespeare | +1.205 |
Neg logit contributions | |
ULAR | -1.151 |
Versus | -1.137 |
eur | -1.135 |
aido | -1.100 |
INESS | -1.099 |
Token | by |
Token ID | 416 |
Feature activation | -9.40e-03 |
Pos logit contributions | |
ricks | +3.812 |
idth | +3.542 |
--------------- | +3.489 |
abama | +3.459 |
akespeare | +3.375 |
Neg logit contributions | |
ULAR | -3.186 |
eur | -3.158 |
Versus | -3.135 |
aido | -3.075 |
INESS | -3.041 |
Token | even |
Token ID | 772 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
ricks | +0.058 |
idth | +0.055 |
--------------- | +0.054 |
abama | +0.053 |
akespeare | +0.053 |
Neg logit contributions | |
ULAR | -0.048 |
Versus | -0.048 |
eur | -0.047 |
aido | -0.045 |
interim | -0.045 |
Token | better |
Token ID | 1365 |
Feature activation | +6.34e-01 |
Pos logit contributions | |
moderately | +10.396 |
rudimentary | +10.104 |
survival | +9.613 |
mildly | +9.556 |
vaguely | +9.509 |
Neg logit contributions | |
idth | -12.192 |
raught | -12.078 |
ricks | -12.050 |
xual | -11.831 |
akespeare | -11.730 |
Token | wages |
Token ID | 9400 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
Versus | +2.604 |
survival | +2.573 |
eur | +2.534 |
ULAR | +2.491 |
interim | +2.484 |
Neg logit contributions | |
ricks | -4.487 |
idth | -4.265 |
xual | -4.204 |
abama | -4.179 |
--------------- | -4.135 |
Token | , |
Token ID | 11 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
Versus | +0.088 |
eur | +0.088 |
ULAR | +0.088 |
aido | +0.086 |
INESS | +0.085 |
Neg logit contributions | |
ricks | -0.110 |
idth | -0.105 |
--------------- | -0.102 |
abama | -0.102 |
akespeare | -0.099 |
Token | Vel |
Token ID | 17378 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
Versus | +1.318 |
eur | +1.314 |
ULAR | +1.285 |
interim | +1.234 |
survival | +1.232 |
Neg logit contributions | |
ricks | -1.666 |
abama | -1.563 |
idth | -1.561 |
--------------- | -1.527 |
akespeare | -1.506 |
Token | ie |
Token ID | 494 |
Feature activation | -2.64e-01 |
Pos logit contributions | |
eur | +2.556 |
atively | +1.928 |
omew | +1.896 |
opa | +1.894 |
aido | +1.867 |
Neg logit contributions | |
��� | -9.282 |
ricks | -9.043 |
�� | -8.984 |
raught | -8.801 |
enriched | -8.778 |
Token | Paul |
Token ID | 12041 |
Feature activation | -6.81e-02 |
Pos logit contributions | |
ricks | +0.932 |
idth | +0.885 |
abama | +0.860 |
--------------- | +0.846 |
enriched | +0.838 |
Neg logit contributions | |
eur | -0.868 |
ULAR | -0.865 |
Versus | -0.840 |
aido | -0.827 |
INESS | -0.827 |
Token | Popular |
Token ID | 22623 |
Feature activation | +4.97e-01 |
Pos logit contributions | |
ricks | +0.419 |
idth | +0.401 |
--------------- | +0.392 |
abama | +0.391 |
akespeare | +0.385 |
Neg logit contributions | |
eur | -0.346 |
Versus | -0.346 |
ULAR | -0.341 |
aido | -0.329 |
INESS | -0.325 |
Token | Front |
Token ID | 8880 |
Feature activation | +7.85e-01 |
Pos logit contributions | |
Versus | +2.403 |
eur | +2.284 |
ULAR | +2.281 |
atively | +2.198 |
aido | +2.120 |
Neg logit contributions | |
ricks | -3.236 |
idth | -3.056 |
abama | -3.008 |
--------------- | -2.995 |
xual | -2.965 |
Token | is |
Token ID | 318 |
Feature activation | +4.29e-01 |
Pos logit contributions | |
Versus | +3.856 |
eur | +3.855 |
ULAR | +3.728 |
atively | +3.519 |
aido | +3.433 |
Neg logit contributions | |
ricks | -4.850 |
idth | -4.622 |
abama | -4.547 |
--------------- | -4.505 |
akespeare | -4.461 |
Token | only |
Token ID | 691 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
Versus | +1.990 |
ULAR | +1.982 |
eur | +1.959 |
atively | +1.876 |
aido | +1.873 |
Neg logit contributions | |
ricks | -2.823 |
idth | -2.715 |
abama | -2.609 |
--------------- | -2.562 |
akespeare | -2.528 |
Token | just |
Token ID | 655 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
moderately | +4.624 |
ULAR | +4.566 |
eur | +4.484 |
Versus | +4.460 |
survival | +4.454 |
Neg logit contributions | |
ricks | -6.792 |
idth | -6.667 |
abama | -6.249 |
raught | -6.202 |
xual | -6.147 |
Token | beginning |
Token ID | 3726 |
Feature activation | +6.58e-01 |
Pos logit contributions | |
survival | +8.354 |
barely | +8.321 |
eur | +8.299 |
moderately | +8.051 |
interim | +7.973 |
Neg logit contributions | |
idth | -14.443 |
ricks | -13.882 |
xual | -13.403 |
akespeare | -12.948 |
raught | -12.712 |
Token | to |
Token ID | 284 |
Feature activation | +6.22e-01 |
Pos logit contributions | |
Versus | +3.507 |
eur | +3.442 |
ULAR | +3.412 |
survival | +3.318 |
INESS | +3.314 |
Neg logit contributions | |
ricks | -3.823 |
idth | -3.575 |
abama | -3.437 |
akespeare | -3.417 |
xual | -3.373 |
Token | rev |
Token ID | 2710 |
Feature activation | +6.07e-01 |
Pos logit contributions | |
eur | +2.734 |
Versus | +2.652 |
ULAR | +2.633 |
survival | +2.617 |
moderately | +2.591 |
Neg logit contributions | |
ricks | -4.147 |
idth | -4.005 |
--------------- | -3.821 |
abama | -3.820 |
xual | -3.778 |
Token | up |
Token ID | 510 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
eur | +2.472 |
ULAR | +2.425 |
aido | +2.407 |
Versus | +2.406 |
atively | +2.367 |
Neg logit contributions | |
ricks | -4.250 |
idth | -4.006 |
xual | -3.955 |
--------------- | -3.947 |
abama | -3.930 |
Token | its |
Token ID | 663 |
Feature activation | +3.77e-01 |
Pos logit contributions | |
Versus | +0.706 |
ULAR | +0.706 |
eur | +0.702 |
aido | +0.665 |
INESS | +0.659 |
Neg logit contributions | |
ricks | -1.088 |
idth | -1.023 |
abama | -1.005 |
akespeare | -0.991 |
--------------- | -0.991 |
Token | section |
Token ID | 2665 |
Feature activation | +5.97e-01 |
Pos logit contributions | |
ricks | +0.099 |
idth | +0.093 |
abama | +0.090 |
--------------- | +0.089 |
akespeare | +0.088 |
Neg logit contributions | |
eur | -0.063 |
Versus | -0.063 |
ULAR | -0.062 |
atively | -0.061 |
aido | -0.059 |
Token | of |
Token ID | 286 |
Feature activation | -9.10e-02 |
Pos logit contributions | |
ULAR | +2.763 |
eur | +2.738 |
Versus | +2.680 |
atively | +2.634 |
aido | +2.576 |
Neg logit contributions | |
ricks | -3.927 |
idth | -3.853 |
abama | -3.695 |
--------------- | -3.608 |
raught | -3.530 |
Token | DOM |
Token ID | 24121 |
Feature activation | +2.69e-01 |
Pos logit contributions | |
ricks | +0.498 |
idth | +0.463 |
--------------- | +0.448 |
abama | +0.445 |
akespeare | +0.429 |
Neg logit contributions | |
ULAR | -0.537 |
Versus | -0.534 |
eur | -0.533 |
aido | -0.514 |
atively | -0.509 |
Token | A |
Token ID | 32 |
Feature activation | +3.31e-01 |
Pos logit contributions | |
ULAR | +1.290 |
eur | +1.276 |
Versus | +1.233 |
INESS | +1.224 |
aido | +1.214 |
Neg logit contributions | |
ricks | -1.790 |
idth | -1.702 |
abama | -1.618 |
enriched | -1.614 |
xual | -1.613 |
Token | unconstitutional |
Token ID | 20727 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
eur | +1.607 |
ULAR | +1.601 |
Versus | +1.590 |
survival | +1.522 |
atively | +1.519 |
Neg logit contributions | |
ricks | -2.129 |
idth | -2.043 |
abama | -1.985 |
--------------- | -1.916 |
raught | -1.885 |
Token | even |
Token ID | 772 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
ricks | +0.113 |
idth | +0.107 |
abama | +0.103 |
--------------- | +0.103 |
raught | +0.100 |
Neg logit contributions | |
Versus | -0.089 |
eur | -0.089 |
ULAR | -0.089 |
aido | -0.086 |
atively | -0.085 |
Token | though |
Token ID | 996 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
Versus | +6.863 |
eur | +6.492 |
moderately | +6.470 |
vaguely | +6.449 |
rudimentary | +6.414 |
Neg logit contributions | |
ricks | -15.801 |
idth | -15.372 |
raught | -14.464 |
abama | -14.395 |
xual | -14.199 |
Token | Obama |
Token ID | 2486 |
Feature activation | -2.66e-01 |
Pos logit contributions | |
Versus | +0.139 |
ULAR | +0.138 |
eur | +0.138 |
atively | +0.134 |
aido | +0.133 |
Neg logit contributions | |
ricks | -0.158 |
idth | -0.146 |
abama | -0.144 |
--------------- | -0.142 |
raught | -0.138 |
Token | refused |
Token ID | 6520 |
Feature activation | -5.89e-02 |
Pos logit contributions | |
ricks | +1.706 |
idth | +1.619 |
abama | +1.576 |
--------------- | +1.556 |
akespeare | +1.511 |
Neg logit contributions | |
Versus | -1.319 |
ULAR | -1.314 |
eur | -1.313 |
aido | -1.259 |
atively | -1.242 |
Token | to |
Token ID | 284 |
Feature activation | -4.65e-01 |
Pos logit contributions | |
ricks | +0.258 |
idth | +0.230 |
--------------- | +0.228 |
abama | +0.224 |
enriched | +0.218 |
Neg logit contributions | |
ULAR | -0.406 |
eur | -0.403 |
Versus | -0.400 |
aido | -0.396 |
INESS | -0.392 |
Token | defend |
Token ID | 4404 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
ricks | +3.333 |
idth | +3.147 |
--------------- | +3.082 |
abama | +3.075 |
enriched | +2.992 |
Neg logit contributions | |
ULAR | -1.942 |
eur | -1.921 |
Versus | -1.915 |
aido | -1.862 |
INESS | -1.817 |
Token | around |
Token ID | 1088 |
Feature activation | +4.80e-01 |
Pos logit contributions | |
Versus | +0.465 |
ULAR | +0.461 |
eur | +0.458 |
aido | +0.449 |
INESS | +0.442 |
Neg logit contributions | |
ricks | -0.631 |
idth | -0.608 |
--------------- | -0.576 |
abama | -0.573 |
xual | -0.573 |
Token | him |
Token ID | 683 |
Feature activation | -8.02e-01 |
Pos logit contributions | |
Versus | +2.062 |
eur | +2.017 |
ULAR | +1.996 |
aido | +1.948 |
atively | +1.932 |
Neg logit contributions | |
ricks | -3.309 |
idth | -3.126 |
xual | -3.052 |
abama | -3.038 |
--------------- | -3.007 |
Token | say |
Token ID | 910 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
ricks | +5.110 |
idth | +4.750 |
--------------- | +4.718 |
abama | +4.648 |
enriched | +4.582 |
Neg logit contributions | |
ULAR | -3.923 |
eur | -3.840 |
Versus | -3.813 |
aido | -3.732 |
INESS | -3.727 |
Token | that |
Token ID | 326 |
Feature activation | +3.91e-02 |
Pos logit contributions | |
ricks | +1.782 |
idth | +1.657 |
abama | +1.633 |
--------------- | +1.610 |
xual | +1.568 |
Neg logit contributions | |
eur | -1.744 |
ULAR | -1.742 |
Versus | -1.735 |
aido | -1.692 |
INESS | -1.691 |
Token | , |
Token ID | 11 |
Feature activation | +6.06e-01 |
Pos logit contributions | |
Versus | +0.206 |
eur | +0.205 |
ULAR | +0.202 |
atively | +0.200 |
aido | +0.198 |
Neg logit contributions | |
ricks | -0.236 |
idth | -0.222 |
abama | -0.216 |
--------------- | -0.213 |
xual | -0.209 |
Token | even |
Token ID | 772 |
Feature activation | +2.28e+00 |
Pos logit contributions | |
Versus | +2.715 |
eur | +2.696 |
ULAR | +2.615 |
moderately | +2.610 |
survival | +2.601 |
Neg logit contributions | |
ricks | -3.942 |
idth | -3.895 |
abama | -3.645 |
--------------- | -3.608 |
xual | -3.596 |
Token | with |
Token ID | 351 |
Feature activation | -4.54e-01 |
Pos logit contributions | |
moderately | +8.021 |
mildly | +7.658 |
outside | +7.624 |
Versus | +7.598 |
eur | +7.519 |
Neg logit contributions | |
ricks | -14.374 |
idth | -14.131 |
xual | -13.712 |
abama | -13.259 |
--------------- | -12.949 |
Token | the |
Token ID | 262 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
ricks | +2.656 |
idth | +2.461 |
--------------- | +2.417 |
abama | +2.402 |
xual | +2.328 |
Neg logit contributions | |
ULAR | -2.491 |
eur | -2.468 |
Versus | -2.463 |
aido | -2.409 |
INESS | -2.392 |
Token | shit |
Token ID | 7510 |
Feature activation | +7.82e-01 |
Pos logit contributions | |
ricks | +0.657 |
idth | +0.623 |
abama | +0.598 |
xual | +0.598 |
--------------- | +0.595 |
Neg logit contributions | |
Versus | -0.521 |
eur | -0.520 |
ULAR | -0.520 |
aido | -0.499 |
INESS | -0.496 |
Token | storm |
Token ID | 12135 |
Feature activation | +7.74e-01 |
Pos logit contributions | |
Versus | +3.973 |
ULAR | +3.919 |
eur | +3.853 |
INESS | +3.782 |
atively | +3.705 |
Neg logit contributions | |
ricks | -4.450 |
idth | -4.387 |
xual | -4.319 |
abama | -4.288 |
--------------- | -4.053 |
Token | his |
Token ID | 465 |
Feature activation | +3.39e-01 |
Pos logit contributions | |
eur | +3.730 |
Versus | +3.644 |
ULAR | +3.601 |
aido | +3.499 |
atively | +3.477 |
Neg logit contributions | |
ricks | -4.768 |
idth | -4.671 |
abama | -4.627 |
xual | -4.415 |
--------------- | -4.366 |
Token | as |
Token ID | 355 |
Feature activation | +1.65e-01 |
Pos logit contributions | |
Versus | +2.549 |
ULAR | +2.523 |
eur | +2.523 |
moderately | +2.477 |
atively | +2.464 |
Neg logit contributions | |
ricks | -3.873 |
idth | -3.758 |
abama | -3.674 |
xual | -3.581 |
--------------- | -3.579 |
Token | a |
Token ID | 257 |
Feature activation | +4.20e-01 |
Pos logit contributions | |
ULAR | +0.757 |
eur | +0.748 |
Versus | +0.740 |
atively | +0.722 |
INESS | +0.721 |
Neg logit contributions | |
ricks | -1.118 |
idth | -1.045 |
abama | -1.036 |
--------------- | -1.014 |
akespeare | -1.007 |
Token | financial |
Token ID | 3176 |
Feature activation | -9.12e-01 |
Pos logit contributions | |
Versus | +1.981 |
ULAR | +1.942 |
eur | +1.936 |
survival | +1.928 |
INESS | +1.892 |
Neg logit contributions | |
ricks | -2.764 |
idth | -2.601 |
abama | -2.596 |
akespeare | -2.512 |
xual | -2.497 |
Token | institution |
Token ID | 9901 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
ricks | +5.955 |
idth | +5.519 |
--------------- | +5.489 |
abama | +5.406 |
enriched | +5.342 |
Neg logit contributions | |
ULAR | -4.268 |
eur | -4.191 |
Versus | -4.174 |
aido | -4.122 |
INESS | -4.063 |
Token | . |
Token ID | 13 |
Feature activation | +6.60e-01 |
Pos logit contributions | |
eur | +0.528 |
Versus | +0.524 |
ULAR | +0.519 |
INESS | +0.505 |
atively | +0.504 |
Neg logit contributions | |
ricks | -0.703 |
idth | -0.672 |
--------------- | -0.651 |
abama | -0.650 |
akespeare | -0.635 |
Token | Even |
Token ID | 3412 |
Feature activation | +2.28e+00 |
Pos logit contributions | |
Versus | +3.317 |
eur | +3.035 |
ULAR | +3.013 |
INESS | +2.889 |
opa | +2.776 |
Neg logit contributions | |
ricks | -4.418 |
idth | -4.236 |
enriched | -4.096 |
abama | -4.066 |
akespeare | -4.045 |
Token | then |
Token ID | 788 |
Feature activation | +9.74e-01 |
Pos logit contributions | |
Versus | +8.816 |
moderately | +8.557 |
interim | +8.503 |
rudimentary | +8.473 |
internally | +8.425 |
Neg logit contributions | |
abama | -13.742 |
idth | -13.562 |
ricks | -13.421 |
raught | -12.706 |
xual | -12.558 |
Token | we |
Token ID | 356 |
Feature activation | +5.92e-01 |
Pos logit contributions | |
Versus | +4.197 |
eur | +4.190 |
ULAR | +4.093 |
atively | +4.053 |
INESS | +4.017 |
Neg logit contributions | |
ricks | -6.454 |
abama | -6.180 |
idth | -6.030 |
--------------- | -6.010 |
akespeare | -5.882 |
Token | were |
Token ID | 547 |
Feature activation | +4.54e-01 |
Pos logit contributions | |
Versus | +2.663 |
eur | +2.653 |
ULAR | +2.552 |
aido | +2.506 |
opa | +2.503 |
Neg logit contributions | |
ricks | -3.876 |
idth | -3.873 |
abama | -3.753 |
--------------- | -3.587 |
xual | -3.553 |
Token | storing |
Token ID | 23069 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
Versus | +1.995 |
ULAR | +1.957 |
eur | +1.929 |
rudimentary | +1.888 |
moderately | +1.881 |
Neg logit contributions | |
ricks | -3.091 |
idth | -3.069 |
abama | -2.957 |
--------------- | -2.893 |
akespeare | -2.865 |
Token | tens |
Token ID | 11192 |
Feature activation | +7.01e-01 |
Pos logit contributions | |
eur | +0.649 |
ULAR | +0.645 |
Versus | +0.643 |
INESS | +0.619 |
aido | +0.618 |
Neg logit contributions | |
ricks | -0.776 |
idth | -0.731 |
abama | -0.724 |
--------------- | -0.711 |
akespeare | -0.689 |
Token | for |
Token ID | 329 |
Feature activation | +5.22e-01 |
Pos logit contributions | |
ricks | +1.677 |
idth | +1.565 |
--------------- | +1.551 |
abama | +1.521 |
akespeare | +1.495 |
Neg logit contributions | |
ULAR | -1.273 |
eur | -1.269 |
Versus | -1.260 |
aido | -1.238 |
INESS | -1.228 |
Token | the |
Token ID | 262 |
Feature activation | +6.63e-01 |
Pos logit contributions | |
Versus | +1.944 |
eur | +1.905 |
ULAR | +1.897 |
atively | +1.833 |
survival | +1.824 |
Neg logit contributions | |
ricks | -3.914 |
idth | -3.706 |
--------------- | -3.692 |
abama | -3.681 |
xual | -3.645 |
Token | individual |
Token ID | 1981 |
Feature activation | -7.02e-01 |
Pos logit contributions | |
eur | +2.879 |
Versus | +2.866 |
ULAR | +2.810 |
atively | +2.796 |
survival | +2.783 |
Neg logit contributions | |
ricks | -4.408 |
idth | -4.186 |
abama | -4.147 |
--------------- | -4.122 |
xual | -4.039 |
Token | market |
Token ID | 1910 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
ricks | +4.766 |
idth | +4.446 |
--------------- | +4.395 |
abama | +4.355 |
enriched | +4.271 |
Neg logit contributions | |
ULAR | -3.164 |
eur | -3.119 |
Versus | -3.092 |
aido | -3.036 |
INESS | -3.007 |
Token | , |
Token ID | 11 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
eur | +1.279 |
Versus | +1.274 |
ULAR | +1.267 |
INESS | +1.240 |
aido | +1.236 |
Neg logit contributions | |
ricks | -1.360 |
idth | -1.274 |
abama | -1.253 |
--------------- | -1.252 |
akespeare | -1.226 |
Token | even |
Token ID | 772 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
Versus | +0.732 |
ULAR | +0.726 |
eur | +0.721 |
aido | +0.707 |
INESS | +0.695 |
Neg logit contributions | |
ricks | -0.887 |
idth | -0.833 |
--------------- | -0.819 |
abama | -0.813 |
akespeare | -0.793 |
Token | members |
Token ID | 1866 |
Feature activation | -5.01e-02 |
Pos logit contributions | |
moderately | +9.273 |
rudimentary | +8.993 |
atively | +8.789 |
survival | +8.786 |
provisional | +8.740 |
Neg logit contributions | |
ricks | -13.124 |
--------------- | -12.515 |
idth | -12.451 |
xual | -12.279 |
akespeare | -12.195 |
Token | of |
Token ID | 286 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
ricks | +0.287 |
idth | +0.263 |
--------------- | +0.261 |
abama | +0.259 |
enriched | +0.256 |
Neg logit contributions | |
ULAR | -0.278 |
eur | -0.273 |
Versus | -0.273 |
aido | -0.268 |
INESS | -0.267 |
Token | Congress |
Token ID | 3162 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
ricks | +2.039 |
idth | +1.878 |
--------------- | +1.856 |
abama | +1.825 |
akespeare | +1.775 |
Neg logit contributions | |
ULAR | -2.039 |
eur | -2.011 |
Versus | -2.002 |
aido | -1.958 |
INESS | -1.951 |
Token | , |
Token ID | 11 |
Feature activation | +7.79e-02 |
Pos logit contributions | |
eur | +0.738 |
ULAR | +0.731 |
Versus | +0.723 |
aido | +0.713 |
INESS | +0.706 |
Neg logit contributions | |
ricks | -0.852 |
idth | -0.799 |
--------------- | -0.781 |
abama | -0.771 |
akespeare | -0.751 |
Token | to |
Token ID | 284 |
Feature activation | +7.16e-01 |
Pos logit contributions | |
ULAR | +0.492 |
eur | +0.489 |
Versus | +0.486 |
aido | +0.480 |
INESS | +0.475 |
Neg logit contributions | |
ricks | -0.388 |
idth | -0.354 |
--------------- | -0.347 |
abama | -0.342 |
akespeare | -0.330 |
Token | the |
Token ID | 262 |
Feature activation | -1.95e-02 |
Pos logit contributions | |
ULAR | +0.233 |
Versus | +0.231 |
eur | +0.231 |
atively | +0.222 |
aido | +0.222 |
Neg logit contributions | |
ricks | -0.288 |
idth | -0.270 |
--------------- | -0.260 |
abama | -0.259 |
xual | -0.251 |
Token | house |
Token ID | 2156 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
ricks | +0.115 |
idth | +0.108 |
--------------- | +0.104 |
abama | +0.103 |
raught | +0.100 |
Neg logit contributions | |
eur | -0.106 |
ULAR | -0.106 |
Versus | -0.105 |
INESS | -0.102 |
aido | -0.102 |
Token | and |
Token ID | 290 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
ricks | +6.239 |
--------------- | +5.745 |
idth | +5.672 |
abama | +5.597 |
enriched | +5.568 |
Neg logit contributions | |
ULAR | -6.204 |
eur | -6.018 |
Versus | -6.001 |
aido | -5.927 |
INESS | -5.843 |
Token | has |
Token ID | 468 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
ricks | +1.394 |
idth | +1.321 |
abama | +1.278 |
--------------- | +1.270 |
akespeare | +1.242 |
Neg logit contributions | |
eur | -0.888 |
Versus | -0.883 |
ULAR | -0.878 |
aido | -0.841 |
atively | -0.836 |
Token | killed |
Token ID | 2923 |
Feature activation | +6.83e-01 |
Pos logit contributions | |
ricks | +0.814 |
idth | +0.765 |
abama | +0.737 |
--------------- | +0.735 |
akespeare | +0.724 |
Neg logit contributions | |
eur | -0.688 |
ULAR | -0.682 |
Versus | -0.679 |
aido | -0.657 |
INESS | -0.650 |
Token | even |
Token ID | 772 |
Feature activation | +2.26e+00 |
Pos logit contributions | |
Versus | +3.012 |
eur | +2.988 |
atively | +2.936 |
ULAR | +2.933 |
survival | +2.919 |
Neg logit contributions | |
ricks | -4.548 |
idth | -4.349 |
abama | -4.159 |
--------------- | -4.061 |
raught | -4.060 |
Token | one |
Token ID | 530 |
Feature activation | +7.15e-01 |
Pos logit contributions | |
moderately | +9.160 |
rudimentary | +8.800 |
mildly | +8.754 |
survival | +8.518 |
eur | +8.378 |
Neg logit contributions | |
ricks | -13.103 |
idth | -12.999 |
raught | -12.616 |
xual | -12.285 |
abama | -12.133 |
Token | animal |
Token ID | 5044 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
eur | +3.124 |
Versus | +3.023 |
ULAR | +2.986 |
survival | +2.921 |
moderately | +2.906 |
Neg logit contributions | |
ricks | -4.989 |
idth | -4.705 |
abama | -4.481 |
--------------- | -4.472 |
akespeare | -4.446 |
Token | , |
Token ID | 11 |
Feature activation | -4.68e-01 |
Pos logit contributions | |
eur | +1.341 |
Versus | +1.308 |
ULAR | +1.293 |
INESS | +1.262 |
aido | +1.257 |
Neg logit contributions | |
ricks | -1.845 |
idth | -1.746 |
abama | -1.682 |
--------------- | -1.661 |
akespeare | -1.640 |
Token | please |
Token ID | 3387 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
ricks | +2.982 |
idth | +2.810 |
abama | +2.739 |
--------------- | +2.724 |
enriched | +2.630 |
Neg logit contributions | |
ULAR | -2.322 |
Versus | -2.306 |
eur | -2.305 |
aido | -2.230 |
INESS | -2.214 |
Token | do |
Token ID | 466 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
ricks | +2.316 |
idth | +2.202 |
abama | +2.146 |
--------------- | +2.129 |
akespeare | +2.072 |
Neg logit contributions | |
ULAR | -1.520 |
eur | -1.517 |
Versus | -1.513 |
aido | -1.458 |
INESS | -1.430 |
Token | raised |
Token ID | 4376 |
Feature activation | -7.52e-01 |
Pos logit contributions | |
ricks | +3.619 |
idth | +3.382 |
--------------- | +3.319 |
abama | +3.300 |
akespeare | +3.217 |
Neg logit contributions | |
ULAR | -2.823 |
eur | -2.800 |
Versus | -2.779 |
aido | -2.710 |
INESS | -2.684 |
Token | concerns |
Token ID | 4786 |
Feature activation | +6.60e-02 |
Pos logit contributions | |
ricks | +4.180 |
idth | +3.836 |
--------------- | +3.786 |
abama | +3.740 |
enriched | +3.652 |
Neg logit contributions | |
ULAR | -4.314 |
eur | -4.268 |
Versus | -4.241 |
aido | -4.178 |
INESS | -4.144 |
Token | related |
Token ID | 3519 |
Feature activation | -9.33e-01 |
Pos logit contributions | |
eur | +0.281 |
ULAR | +0.279 |
Versus | +0.275 |
atively | +0.266 |
aido | +0.264 |
Neg logit contributions | |
ricks | -0.470 |
idth | -0.452 |
abama | -0.439 |
--------------- | -0.433 |
raught | -0.425 |
Token | to |
Token ID | 284 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
ricks | +3.855 |
--------------- | +3.406 |
idth | +3.399 |
abama | +3.265 |
enriched | +3.221 |
Neg logit contributions | |
ULAR | -6.565 |
eur | -6.460 |
Versus | -6.454 |
aido | -6.417 |
INESS | -6.370 |
Token | restrictions |
Token ID | 8733 |
Feature activation | +8.84e-01 |
Pos logit contributions | |
eur | +1.373 |
Versus | +1.361 |
ULAR | +1.344 |
atively | +1.310 |
INESS | +1.296 |
Neg logit contributions | |
ricks | -1.751 |
idth | -1.643 |
abama | -1.619 |
--------------- | -1.572 |
akespeare | -1.568 |
Token | Google |
Token ID | 3012 |
Feature activation | +2.25e+00 |
Pos logit contributions | |
eur | +3.399 |
ULAR | +3.221 |
Versus | +3.198 |
atively | +3.130 |
opa | +3.056 |
Neg logit contributions | |
ricks | -6.510 |
abama | -6.344 |
idth | -6.242 |
--------------- | -6.054 |
akespeare | -5.959 |
Token | places |
Token ID | 4113 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
Versus | +8.478 |
eur | +8.131 |
atively | +8.125 |
interim | +8.113 |
affiliates | +7.784 |
Neg logit contributions | |
abama | -14.152 |
ricks | -13.987 |
idth | -13.956 |
xual | -13.100 |
raught | -13.057 |
Token | on |
Token ID | 319 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
atively | +3.373 |
eur | +3.191 |
ULAR | +3.171 |
Versus | +2.969 |
interim | +2.903 |
Neg logit contributions | |
ricks | -8.401 |
idth | -8.002 |
abama | -7.969 |
--------------- | -7.832 |
akespeare | -7.678 |
Token | use |
Token ID | 779 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
Versus | +2.720 |
eur | +2.711 |
ULAR | +2.663 |
atively | +2.630 |
survival | +2.584 |
Neg logit contributions | |
ricks | -4.206 |
idth | -4.010 |
abama | -4.008 |
akespeare | -3.832 |
--------------- | -3.822 |
Token | of |
Token ID | 286 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
eur | +2.794 |
ULAR | +2.783 |
Versus | +2.721 |
INESS | +2.641 |
atively | +2.618 |
Neg logit contributions | |
ricks | -3.662 |
idth | -3.399 |
abama | -3.375 |
--------------- | -3.359 |
akespeare | -3.282 |
Token | its |
Token ID | 663 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
ULAR | +0.613 |
eur | +0.606 |
Versus | +0.604 |
atively | +0.573 |
opa | +0.566 |
Neg logit contributions | |
ricks | -1.045 |
idth | -0.998 |
abama | -0.993 |
--------------- | -0.971 |
xual | -0.954 |
Token | :: |
Token ID | 3712 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
ricks | +4.430 |
--------------- | +4.094 |
idth | +3.950 |
abama | +3.840 |
enriched | +3.796 |
Neg logit contributions | |
aido | -6.659 |
ULAR | -6.620 |
Versus | -6.593 |
eur | -6.511 |
INESS | -6.452 |
Token | All |
Token ID | 3237 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
ricks | +1.718 |
idth | +1.603 |
abama | +1.574 |
--------------- | +1.560 |
enriched | +1.557 |
Neg logit contributions | |
ULAR | -1.253 |
eur | -1.232 |
Versus | -1.209 |
INESS | -1.180 |
aido | -1.179 |
Token | Sc |
Token ID | 3351 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
ricks | +6.059 |
idth | +5.576 |
--------------- | +5.530 |
abama | +5.410 |
enriched | +5.265 |
Neg logit contributions | |
ULAR | -5.788 |
Versus | -5.751 |
eur | -5.747 |
aido | -5.710 |
INESS | -5.572 |
Token | reens |
Token ID | 5681 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
ricks | +1.004 |
--------------- | +0.959 |
idth | +0.952 |
abama | +0.952 |
xual | +0.935 |
Neg logit contributions | |
eur | -0.474 |
ULAR | -0.472 |
Versus | -0.454 |
aido | -0.453 |
opa | -0.440 |
Token | | |
Token ID | 930 |
Feature activation | -9.11e-01 |
Pos logit contributions | |
ricks | +2.378 |
idth | +2.173 |
--------------- | +2.149 |
abama | +2.137 |
enriched | +2.078 |
Neg logit contributions | |
ULAR | -2.436 |
eur | -2.415 |
Versus | -2.400 |
aido | -2.354 |
INESS | -2.340 |
Token | Where |
Token ID | 6350 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
ricks | +5.590 |
idth | +5.195 |
--------------- | +5.159 |
abama | +5.100 |
enriched | +4.982 |
Neg logit contributions | |
ULAR | -4.592 |
eur | -4.520 |
Versus | -4.470 |
aido | -4.466 |
INESS | -4.446 |
Token | Primary |
Token ID | 21087 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
idth | +11.015 |
--------------- | +10.872 |
ricks | +10.189 |
dup | +10.073 |
abama | +10.040 |
Neg logit contributions | |
aido | -12.250 |
eur | -11.793 |
INESS | -11.723 |
accompan | -11.590 |
ULAR | -11.428 |
Token | | |
Token ID | 930 |
Feature activation | -7.76e-01 |
Pos logit contributions | |
ricks | +11.089 |
--------------- | +10.823 |
idth | +10.674 |
abama | +10.228 |
dy | +9.965 |
Neg logit contributions | |
aido | -10.333 |
ULAR | -9.955 |
opa | -9.921 |
eur | -9.778 |
accompan | -9.707 |
Token | Select |
Token ID | 9683 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
ricks | +4.633 |
idth | +4.294 |
--------------- | +4.244 |
abama | +4.194 |
enriched | +4.092 |
Neg logit contributions | |
ULAR | -4.103 |
eur | -4.053 |
Versus | -4.015 |
aido | -3.973 |
INESS | -3.939 |
Token | - |
Token ID | 532 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
ricks | +5.038 |
idth | +4.704 |
--------------- | +4.648 |
abama | +4.577 |
enriched | +4.484 |
Neg logit contributions | |
ULAR | -4.147 |
eur | -4.092 |
Versus | -4.050 |
aido | -4.007 |
INESS | -3.991 |
Token | Exp |
Token ID | 16870 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
ricks | +5.893 |
idth | +5.468 |
--------------- | +5.405 |
abama | +5.325 |
enriched | +5.162 |
Neg logit contributions | |
ULAR | -5.573 |
eur | -5.471 |
Versus | -5.446 |
aido | -5.426 |
INESS | -5.425 |
Token | Select |
Token ID | 9683 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
ricks | +4.633 |
idth | +4.294 |
--------------- | +4.244 |
abama | +4.194 |
enriched | +4.092 |
Neg logit contributions | |
ULAR | -4.103 |
eur | -4.053 |
Versus | -4.015 |
aido | -3.973 |
INESS | -3.939 |
Token | - |
Token ID | 532 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
ricks | +5.038 |
idth | +4.704 |
--------------- | +4.648 |
abama | +4.577 |
enriched | +4.484 |
Neg logit contributions | |
ULAR | -4.147 |
eur | -4.092 |
Versus | -4.050 |
aido | -4.007 |
INESS | -3.991 |
Token | Exp |
Token ID | 16870 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
ricks | +5.893 |
idth | +5.468 |
--------------- | +5.405 |
abama | +5.325 |
enriched | +5.162 |
Neg logit contributions | |
ULAR | -5.573 |
eur | -5.471 |
Versus | -5.446 |
aido | -5.426 |
INESS | -5.425 |
Token | and |
Token ID | 392 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
ricks | +6.594 |
--------------- | +6.259 |
idth | +6.128 |
abama | +5.758 |
dy | +5.723 |
Neg logit contributions | |
ULAR | -10.614 |
aido | -10.487 |
eur | -10.425 |
INESS | -10.375 |
Versus | -10.205 |
Token | Property |
Token ID | 21746 |
Feature activation | -9.11e-01 |
Pos logit contributions | |
ricks | +3.330 |
idth | +3.068 |
--------------- | +3.024 |
abama | +2.999 |
enriched | +2.924 |
Neg logit contributions | |
ULAR | -3.174 |
eur | -3.140 |
Versus | -3.120 |
aido | -3.062 |
INESS | -3.042 |
Token | B |
Token ID | 347 |
Feature activation | -2.32e+00 |
Pos logit contributions | |
ricks | +5.382 |
idth | +4.994 |
--------------- | +4.955 |
abama | +4.867 |
enriched | +4.770 |
Neg logit contributions | |
ULAR | -4.808 |
eur | -4.729 |
Versus | -4.700 |
aido | -4.664 |
INESS | -4.620 |
Token | ounds |
Token ID | 3733 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
ricks | +13.412 |
idth | +11.403 |
--------------- | +11.325 |
dy | +11.005 |
enriched | +10.790 |
Neg logit contributions | |
INESS | -10.855 |
Versus | -10.827 |
eur | -10.714 |
ULAR | -10.638 |
aido | -10.408 |
Token | | |
Token ID | 930 |
Feature activation | -9.31e-01 |
Pos logit contributions | |
ricks | +7.130 |
idth | +6.789 |
--------------- | +6.709 |
abama | +6.440 |
dup | +6.280 |
Neg logit contributions | |
ULAR | -7.267 |
eur | -7.181 |
aido | -7.179 |
Versus | -7.173 |
opa | -6.963 |
Token | Select |
Token ID | 9683 |
Feature activation | -7.49e-01 |
Pos logit contributions | |
ricks | +5.510 |
idth | +5.115 |
--------------- | +5.060 |
abama | +4.988 |
enriched | +4.869 |
Neg logit contributions | |
ULAR | -4.913 |
eur | -4.839 |
Versus | -4.779 |
aido | -4.772 |
INESS | -4.745 |
Token | Width |
Token ID | 38807 |
Feature activation | -5.29e-01 |
Pos logit contributions | |
ricks | +4.442 |
idth | +4.123 |
--------------- | +4.071 |
abama | +4.014 |
enriched | +3.923 |
Neg logit contributions | |
ULAR | -3.987 |
eur | -3.938 |
Versus | -3.904 |
aido | -3.854 |
INESS | -3.825 |
Token | , |
Token ID | 11 |
Feature activation | +9.09e-01 |
Pos logit contributions | |
ricks | +3.042 |
idth | +2.798 |
--------------- | +2.760 |
abama | +2.735 |
enriched | +2.668 |
Neg logit contributions | |
ULAR | -2.945 |
eur | -2.915 |
Versus | -2.896 |
aido | -2.845 |
INESS | -2.825 |
Token | Williams |
Token ID | 6484 |
Feature activation | +7.16e-01 |
Pos logit contributions | |
Versus | +0.254 |
eur | +0.252 |
ULAR | +0.250 |
atively | +0.249 |
INESS | +0.245 |
Neg logit contributions | |
ricks | -0.274 |
idth | -0.258 |
abama | -0.249 |
--------------- | -0.249 |
xual | -0.249 |
Token | . |
Token ID | 13 |
Feature activation | -3.50e-01 |
Pos logit contributions | |
Versus | +3.282 |
INESS | +3.255 |
eur | +3.249 |
atively | +3.115 |
ULAR | +3.087 |
Neg logit contributions | |
ricks | -4.576 |
idth | -4.538 |
abama | -4.277 |
--------------- | -4.205 |
raught | -4.197 |
Token | The |
Token ID | 383 |
Feature activation | -7.02e-01 |
Pos logit contributions | |
ricks | +2.007 |
idth | +1.891 |
abama | +1.801 |
enriched | +1.795 |
akespeare | +1.777 |
Neg logit contributions | |
Versus | -2.030 |
ULAR | -2.006 |
eur | -1.973 |
INESS | -1.923 |
atively | -1.877 |
Token | evidence |
Token ID | 2370 |
Feature activation | -6.44e-01 |
Pos logit contributions | |
ricks | +4.106 |
idth | +3.806 |
--------------- | +3.732 |
abama | +3.702 |
akespeare | +3.599 |
Neg logit contributions | |
ULAR | -3.844 |
eur | -3.809 |
Versus | -3.797 |
aido | -3.702 |
INESS | -3.694 |
Token | at |
Token ID | 379 |
Feature activation | -9.12e-01 |
Pos logit contributions | |
ricks | +4.094 |
idth | +3.803 |
--------------- | +3.755 |
abama | +3.721 |
enriched | +3.635 |
Neg logit contributions | |
ULAR | -3.192 |
eur | -3.153 |
Versus | -3.132 |
aido | -3.073 |
INESS | -3.045 |
Token | trial |
Token ID | 4473 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
ricks | +5.150 |
idth | +4.730 |
--------------- | +4.687 |
abama | +4.633 |
enriched | +4.518 |
Neg logit contributions | |
ULAR | -5.122 |
eur | -5.074 |
Versus | -4.996 |
aido | -4.969 |
INESS | -4.916 |
Token | did |
Token ID | 750 |
Feature activation | -6.41e-01 |
Pos logit contributions | |
ricks | +11.610 |
enriched | +11.326 |
--------------- | +10.968 |
dy | +10.765 |
dup | +10.675 |
Neg logit contributions | |
ULAR | -11.890 |
INESS | -11.069 |
aido | -11.054 |
eur | -10.834 |
opa | -10.662 |
Token | not |
Token ID | 407 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
ricks | +3.991 |
idth | +3.703 |
--------------- | +3.654 |
abama | +3.622 |
enriched | +3.534 |
Neg logit contributions | |
ULAR | -3.256 |
eur | -3.219 |
Versus | -3.197 |
aido | -3.138 |
INESS | -3.109 |
Token | establish |
Token ID | 4474 |
Feature activation | -9.04e-01 |
Pos logit contributions | |
ricks | +7.860 |
--------------- | +7.127 |
idth | +7.100 |
enrich | +7.065 |
enriched | +7.042 |
Neg logit contributions | |
ULAR | -7.287 |
INESS | -7.069 |
eur | -6.932 |
aido | -6.837 |
Versus | -6.833 |
Token | that |
Token ID | 326 |
Feature activation | -6.84e-01 |
Pos logit contributions | |
ricks | +5.174 |
idth | +4.726 |
--------------- | +4.712 |
abama | +4.628 |
enriched | +4.581 |
Neg logit contributions | |
ULAR | -4.992 |
eur | -4.871 |
Versus | -4.863 |
aido | -4.847 |
INESS | -4.754 |
Token | the |
Token ID | 262 |
Feature activation | -6.56e-01 |
Pos logit contributions | |
ricks | +3.402 |
idth | +3.110 |
--------------- | +3.041 |
abama | +3.017 |
akespeare | +2.907 |
Neg logit contributions | |
ULAR | -4.341 |
eur | -4.309 |
Versus | -4.285 |
aido | -4.207 |
INESS | -4.190 |
Token | , |
Token ID | 11 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
ricks | +4.232 |
idth | +3.922 |
--------------- | +3.810 |
abama | +3.776 |
dy | +3.619 |
Neg logit contributions | |
aido | -5.187 |
ULAR | -5.186 |
eur | -5.161 |
Versus | -5.130 |
INESS | -5.020 |
Token | c |
Token ID | 269 |
Feature activation | -7.31e-02 |
Pos logit contributions | |
ricks | +6.925 |
idth | +6.478 |
--------------- | +6.401 |
enriched | +6.246 |
abama | +6.221 |
Neg logit contributions | |
ULAR | -6.045 |
eur | -5.984 |
aido | -5.919 |
Versus | -5.911 |
INESS | -5.876 |
Token | v |
Token ID | 85 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
ricks | +0.346 |
idth | +0.304 |
--------------- | +0.301 |
enriched | +0.300 |
abama | +0.296 |
Neg logit contributions | |
eur | -0.489 |
ULAR | -0.483 |
Versus | -0.476 |
aido | -0.463 |
INESS | -0.461 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
ricks | +1.745 |
idth | +1.605 |
--------------- | +1.589 |
abama | +1.580 |
enriched | +1.560 |
Neg logit contributions | |
ULAR | -1.362 |
eur | -1.335 |
Versus | -1.293 |
INESS | -1.261 |
atively | -1.259 |
Token | . |
Token ID | 13 |
Feature activation | -5.07e-01 |
Pos logit contributions | |
ricks | +5.710 |
idth | +5.226 |
--------------- | +5.201 |
abama | +5.140 |
dy | +5.053 |
Neg logit contributions | |
Versus | -5.851 |
ULAR | -5.823 |
eur | -5.770 |
aido | -5.764 |
INESS | -5.614 |
Token | COLOR |
Token ID | 46786 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
ricks | +2.861 |
idth | +2.638 |
--------------- | +2.594 |
abama | +2.576 |
enriched | +2.518 |
Neg logit contributions | |
ULAR | -2.896 |
eur | -2.861 |
Versus | -2.822 |
aido | -2.779 |
INESS | -2.771 |
Token | _ |
Token ID | 62 |
Feature activation | -8.66e-01 |
Pos logit contributions | |
ricks | +8.872 |
idth | +8.415 |
--------------- | +8.232 |
abama | +7.683 |
enrich | +7.628 |
Neg logit contributions | |
aido | -14.099 |
eur | -14.074 |
accompan | -13.970 |
Versus | -13.814 |
opa | -13.766 |
Token | B |
Token ID | 33 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
ricks | +4.925 |
--------------- | +4.547 |
idth | +4.517 |
abama | +4.426 |
dy | +4.319 |
Neg logit contributions | |
eur | -4.713 |
Versus | -4.707 |
ULAR | -4.703 |
aido | -4.665 |
INESS | -4.528 |
Token | GR |
Token ID | 10761 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
ricks | +12.995 |
--------------- | +11.312 |
idth | +10.907 |
dy | +10.723 |
orate | +10.711 |
Neg logit contributions | |
accompan | -11.049 |
aido | -10.993 |
opa | -10.754 |
eur | -10.719 |
Versus | -10.674 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
ricks | +7.518 |
idth | +7.246 |
--------------- | +7.039 |
dy | +6.878 |
abama | +6.773 |
Neg logit contributions | |
eur | -7.914 |
aido | -7.643 |
Versus | -7.531 |
ULAR | -7.342 |
opa | -7.315 |
Token | G |
Token ID | 38 |
Feature activation | -8.56e-01 |
Pos logit contributions | |
ricks | +6.449 |
idth | +5.975 |
--------------- | +5.883 |
abama | +5.766 |
dy | +5.701 |
Neg logit contributions | |
eur | -6.449 |
Versus | -6.417 |
aido | -6.411 |
ULAR | -6.364 |
opa | -6.199 |
Token | Allen |
Token ID | 9659 |
Feature activation | -9.46e-01 |
Pos logit contributions | |
ricks | +4.569 |
idth | +4.207 |
--------------- | +4.162 |
abama | +4.097 |
enriched | +4.021 |
Neg logit contributions | |
ULAR | -4.368 |
eur | -4.302 |
Versus | -4.282 |
aido | -4.223 |
INESS | -4.196 |
Token | will |
Token ID | 481 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
ricks | +5.918 |
idth | +5.468 |
--------------- | +5.460 |
abama | +5.321 |
enriched | +5.299 |
Neg logit contributions | |
ULAR | -4.689 |
eur | -4.567 |
Versus | -4.548 |
INESS | -4.489 |
aido | -4.484 |
Token | tread |
Token ID | 23153 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
ricks | +7.918 |
idth | +7.288 |
--------------- | +7.235 |
enriched | +7.028 |
abama | +7.020 |
Neg logit contributions | |
ULAR | -7.182 |
INESS | -7.078 |
Versus | -6.963 |
eur | -6.888 |
aido | -6.862 |
Token | down |
Token ID | 866 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
ricks | +2.571 |
idth | +2.430 |
abama | +2.374 |
--------------- | +2.373 |
akespeare | +2.310 |
Neg logit contributions | |
eur | -1.626 |
ULAR | -1.623 |
Versus | -1.596 |
INESS | -1.547 |
aido | -1.543 |
Token | this |
Token ID | 428 |
Feature activation | -9.40e-01 |
Pos logit contributions | |
ricks | +9.192 |
--------------- | +8.277 |
idth | +8.220 |
enriched | +8.161 |
akespeare | +8.125 |
Neg logit contributions | |
ULAR | -9.398 |
aido | -9.195 |
INESS | -9.095 |
Versus | -9.066 |
eur | -8.984 |
Token | cinematic |
Token ID | 29932 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
ricks | +5.078 |
idth | +4.630 |
--------------- | +4.593 |
abama | +4.510 |
enriched | +4.458 |
Neg logit contributions | |
ULAR | -5.487 |
eur | -5.384 |
Versus | -5.374 |
aido | -5.321 |
INESS | -5.293 |
Token | path |
Token ID | 3108 |
Feature activation | -8.07e-01 |
Pos logit contributions | |
ricks | +14.084 |
enriched | +13.150 |
enrich | +12.916 |
shaft | +12.825 |
dy | +12.787 |
Neg logit contributions | |
INESS | -9.359 |
aido | -9.142 |
ULAR | -8.895 |
Versus | -8.528 |
eur | -8.271 |
Token | again |
Token ID | 757 |
Feature activation | -8.42e-01 |
Pos logit contributions | |
ricks | +4.671 |
idth | +4.300 |
--------------- | +4.248 |
abama | +4.197 |
enriched | +4.104 |
Neg logit contributions | |
ULAR | -4.445 |
eur | -4.383 |
Versus | -4.363 |
aido | -4.291 |
INESS | -4.256 |
Token | , |
Token ID | 11 |
Feature activation | -3.57e-01 |
Pos logit contributions | |
ricks | +4.924 |
idth | +4.545 |
--------------- | +4.512 |
abama | +4.424 |
enriched | +4.366 |
Neg logit contributions | |
ULAR | -4.540 |
Versus | -4.437 |
eur | -4.431 |
aido | -4.369 |
INESS | -4.340 |
Token | it |
Token ID | 340 |
Feature activation | -2.44e-01 |
Pos logit contributions | |
ricks | +2.089 |
idth | +1.950 |
abama | +1.938 |
--------------- | +1.904 |
xual | +1.830 |
Neg logit contributions | |
eur | -1.955 |
Versus | -1.942 |
ULAR | -1.940 |
aido | -1.889 |
atively | -1.859 |
Token | would |
Token ID | 561 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
ricks | +1.606 |
idth | +1.514 |
abama | +1.490 |
--------------- | +1.487 |
akespeare | +1.428 |
Neg logit contributions | |
eur | -1.155 |
ULAR | -1.134 |
Versus | -1.125 |
aido | -1.104 |
INESS | -1.084 |
Token | v |
Token ID | 85 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
ricks | +0.346 |
idth | +0.304 |
--------------- | +0.301 |
enriched | +0.300 |
abama | +0.296 |
Neg logit contributions | |
eur | -0.489 |
ULAR | -0.483 |
Versus | -0.476 |
aido | -0.463 |
INESS | -0.461 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
ricks | +1.745 |
idth | +1.605 |
--------------- | +1.589 |
abama | +1.580 |
enriched | +1.560 |
Neg logit contributions | |
ULAR | -1.362 |
eur | -1.335 |
Versus | -1.293 |
INESS | -1.261 |
atively | -1.259 |
Token | . |
Token ID | 13 |
Feature activation | -5.07e-01 |
Pos logit contributions | |
ricks | +5.710 |
idth | +5.226 |
--------------- | +5.201 |
abama | +5.140 |
dy | +5.053 |
Neg logit contributions | |
Versus | -5.851 |
ULAR | -5.823 |
eur | -5.770 |
aido | -5.764 |
INESS | -5.614 |
Token | COLOR |
Token ID | 46786 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
ricks | +2.861 |
idth | +2.638 |
--------------- | +2.594 |
abama | +2.576 |
enriched | +2.518 |
Neg logit contributions | |
ULAR | -2.896 |
eur | -2.861 |
Versus | -2.822 |
aido | -2.779 |
INESS | -2.771 |
Token | _ |
Token ID | 62 |
Feature activation | -8.66e-01 |
Pos logit contributions | |
ricks | +8.872 |
idth | +8.415 |
--------------- | +8.232 |
abama | +7.683 |
enrich | +7.628 |
Neg logit contributions | |
aido | -14.099 |
eur | -14.074 |
accompan | -13.970 |
Versus | -13.814 |
opa | -13.766 |
Token | B |
Token ID | 33 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
ricks | +4.925 |
--------------- | +4.547 |
idth | +4.517 |
abama | +4.426 |
dy | +4.319 |
Neg logit contributions | |
eur | -4.713 |
Versus | -4.707 |
ULAR | -4.703 |
aido | -4.665 |
INESS | -4.528 |
Token | GR |
Token ID | 10761 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
ricks | +12.995 |
--------------- | +11.312 |
idth | +10.907 |
dy | +10.723 |
orate | +10.711 |
Neg logit contributions | |
accompan | -11.049 |
aido | -10.993 |
opa | -10.754 |
eur | -10.719 |
Versus | -10.674 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
ricks | +7.518 |
idth | +7.246 |
--------------- | +7.039 |
dy | +6.878 |
abama | +6.773 |
Neg logit contributions | |
eur | -7.914 |
aido | -7.643 |
Versus | -7.531 |
ULAR | -7.342 |
opa | -7.315 |
Token | G |
Token ID | 38 |
Feature activation | -8.56e-01 |
Pos logit contributions | |
ricks | +6.449 |
idth | +5.975 |
--------------- | +5.883 |
abama | +5.766 |
dy | +5.701 |
Neg logit contributions | |
eur | -6.449 |
Versus | -6.417 |
aido | -6.411 |
ULAR | -6.364 |
opa | -6.199 |
Token | RAY |
Token ID | 30631 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
ricks | +4.483 |
idth | +4.099 |
--------------- | +4.036 |
abama | +3.977 |
enriched | +3.874 |
Neg logit contributions | |
ULAR | -5.166 |
eur | -5.129 |
Versus | -5.100 |
aido | -5.028 |
INESS | -4.977 |
Token | ) |
Token ID | 8 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
ricks | +9.327 |
idth | +8.742 |
--------------- | +8.700 |
dy | +8.511 |
abama | +8.387 |
Neg logit contributions | |
aido | -11.088 |
Versus | -10.925 |
accompan | -10.764 |
eur | -10.622 |
opa | -10.617 |
Token | turns |
Token ID | 4962 |
Feature activation | -5.76e-02 |
Pos logit contributions | |
ricks | +1.257 |
idth | +1.210 |
abama | +1.190 |
--------------- | +1.178 |
xual | +1.137 |
Neg logit contributions | |
eur | -0.947 |
Versus | -0.935 |
ULAR | -0.931 |
aido | -0.903 |
atively | -0.892 |
Token | out |
Token ID | 503 |
Feature activation | -7.81e-01 |
Pos logit contributions | |
ricks | +0.467 |
idth | +0.444 |
abama | +0.430 |
--------------- | +0.430 |
akespeare | +0.425 |
Neg logit contributions | |
eur | -0.189 |
ULAR | -0.188 |
Versus | -0.186 |
aido | -0.177 |
atively | -0.175 |
Token | that |
Token ID | 326 |
Feature activation | -7.31e-03 |
Pos logit contributions | |
ricks | +4.536 |
idth | +4.185 |
--------------- | +4.129 |
abama | +4.073 |
enriched | +3.987 |
Neg logit contributions | |
ULAR | -4.271 |
eur | -4.215 |
Versus | -4.175 |
aido | -4.122 |
INESS | -4.095 |
Token | things |
Token ID | 1243 |
Feature activation | -5.71e-02 |
Pos logit contributions | |
ricks | +0.045 |
idth | +0.042 |
abama | +0.041 |
--------------- | +0.041 |
raught | +0.040 |
Neg logit contributions | |
Versus | -0.038 |
eur | -0.038 |
ULAR | -0.037 |
aido | -0.037 |
atively | -0.036 |
Token | could |
Token ID | 714 |
Feature activation | -5.72e-01 |
Pos logit contributions | |
ricks | +0.377 |
idth | +0.363 |
abama | +0.351 |
--------------- | +0.348 |
xual | +0.340 |
Neg logit contributions | |
Versus | -0.265 |
ULAR | -0.265 |
eur | -0.264 |
aido | -0.258 |
INESS | -0.252 |
Token | go |
Token ID | 467 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
ricks | +3.514 |
idth | +3.272 |
--------------- | +3.221 |
abama | +3.213 |
enriched | +3.122 |
Neg logit contributions | |
ULAR | -2.966 |
eur | -2.927 |
Versus | -2.905 |
aido | -2.860 |
INESS | -2.819 |
Token | wrong |
Token ID | 2642 |
Feature activation | -7.48e-01 |
Pos logit contributions | |
ricks | +12.266 |
--------------- | +11.160 |
dy | +11.107 |
enriched | +10.938 |
dup | +10.786 |
Neg logit contributions | |
aido | -10.704 |
ULAR | -10.608 |
INESS | -10.558 |
eur | -10.393 |
accompan | -10.265 |
Token | . |
Token ID | 13 |
Feature activation | -3.44e-02 |
Pos logit contributions | |
ricks | +4.592 |
idth | +4.241 |
--------------- | +4.199 |
abama | +4.150 |
enriched | +4.066 |
Neg logit contributions | |
ULAR | -3.848 |
eur | -3.788 |
Versus | -3.766 |
aido | -3.707 |
INESS | -3.672 |
Token | Ter |
Token ID | 3813 |
Feature activation | -4.11e-01 |
Pos logit contributions | |
ricks | +0.220 |
idth | +0.207 |
abama | +0.201 |
enriched | +0.199 |
xual | +0.197 |
Neg logit contributions | |
Versus | -0.180 |
ULAR | -0.175 |
eur | -0.172 |
INESS | -0.164 |
aido | -0.162 |
Token | ribly |
Token ID | 16358 |
Feature activation | -3.53e-01 |
Pos logit contributions | |
ricks | +1.776 |
idth | +1.608 |
--------------- | +1.580 |
abama | +1.570 |
enriched | +1.526 |
Neg logit contributions | |
eur | -2.850 |
ULAR | -2.831 |
Versus | -2.819 |
aido | -2.793 |
atively | -2.751 |
Token | , |
Token ID | 11 |
Feature activation | +2.05e-01 |
Pos logit contributions | |
ricks | +1.986 |
idth | +1.855 |
abama | +1.803 |
--------------- | +1.782 |
xual | +1.745 |
Neg logit contributions | |
eur | -2.008 |
ULAR | -2.005 |
Versus | -2.003 |
INESS | -1.943 |
aido | -1.938 |
Token |
|
Token ID | 198 |
Feature activation | -7.00e-01 |
Pos logit contributions | |
ricks | +2.942 |
--------------- | +2.659 |
idth | +2.653 |
abama | +2.600 |
dy | +2.507 |
Neg logit contributions | |
ULAR | -3.738 |
Versus | -3.686 |
eur | -3.684 |
aido | -3.647 |
INESS | -3.613 |
Token | At |
Token ID | 2953 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
ricks | +4.062 |
idth | +3.758 |
--------------- | +3.683 |
abama | +3.661 |
enriched | +3.581 |
Neg logit contributions | |
ULAR | -3.863 |
eur | -3.824 |
Versus | -3.786 |
aido | -3.727 |
INESS | -3.702 |
Token | this |
Token ID | 428 |
Feature activation | -6.14e-01 |
Pos logit contributions | |
ricks | +8.906 |
--------------- | +8.209 |
idth | +8.038 |
dy | +7.904 |
abama | +7.869 |
Neg logit contributions | |
ULAR | -9.286 |
eur | -9.027 |
INESS | -9.001 |
aido | -8.905 |
Versus | -8.824 |
Token | pre |
Token ID | 662 |
Feature activation | -9.16e-01 |
Pos logit contributions | |
ricks | +3.378 |
idth | +3.097 |
--------------- | +3.042 |
abama | +3.017 |
enriched | +2.924 |
Neg logit contributions | |
ULAR | -3.585 |
eur | -3.554 |
Versus | -3.537 |
aido | -3.468 |
INESS | -3.444 |
Token | - |
Token ID | 12 |
Feature activation | -7.82e-01 |
Pos logit contributions | |
ricks | +5.610 |
--------------- | +5.242 |
idth | +5.182 |
abama | +5.147 |
dy | +5.023 |
Neg logit contributions | |
ULAR | -4.583 |
Versus | -4.466 |
eur | -4.438 |
INESS | -4.424 |
aido | -4.417 |
Token | trial |
Token ID | 45994 |
Feature activation | -2.21e+00 |
Pos logit contributions | |
ricks | +3.462 |
idth | +3.105 |
--------------- | +3.054 |
abama | +3.006 |
enriched | +2.900 |
Neg logit contributions | |
ULAR | -5.367 |
eur | -5.315 |
Versus | -5.298 |
aido | -5.223 |
INESS | -5.193 |
Token | hearing |
Token ID | 4854 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
ricks | +11.069 |
--------------- | +10.747 |
dy | +10.385 |
idth | +10.359 |
enriched | +10.071 |
Neg logit contributions | |
ULAR | -11.090 |
aido | -11.004 |
Versus | -10.554 |
eur | -10.522 |
INESS | -10.310 |
Token | on |
Token ID | 319 |
Feature activation | -8.02e-01 |
Pos logit contributions | |
ricks | +7.693 |
--------------- | +7.165 |
idth | +6.983 |
dy | +6.938 |
abama | +6.876 |
Neg logit contributions | |
ULAR | -6.898 |
eur | -6.596 |
aido | -6.557 |
Versus | -6.497 |
INESS | -6.481 |
Token | Thursday |
Token ID | 3635 |
Feature activation | -9.65e-01 |
Pos logit contributions | |
ricks | +5.220 |
idth | +4.848 |
--------------- | +4.810 |
abama | +4.745 |
enriched | +4.657 |
Neg logit contributions | |
ULAR | -3.843 |
eur | -3.774 |
Versus | -3.741 |
aido | -3.691 |
INESS | -3.665 |
Token | , |
Token ID | 11 |
Feature activation | -5.80e-01 |
Pos logit contributions | |
ricks | +5.549 |
idth | +5.093 |
--------------- | +5.086 |
abama | +4.960 |
enriched | +4.887 |
Neg logit contributions | |
ULAR | -5.315 |
eur | -5.165 |
Versus | -5.121 |
aido | -5.100 |
INESS | -5.072 |
Token | Mel |
Token ID | 5616 |
Feature activation | -6.98e-01 |
Pos logit contributions | |
ricks | +3.543 |
idth | +3.297 |
abama | +3.227 |
--------------- | +3.222 |
enriched | +3.120 |
Neg logit contributions | |
eur | -3.012 |
ULAR | -3.009 |
Versus | -3.004 |
aido | -2.929 |
INESS | -2.888 |
Token | :: |
Token ID | 3712 |
Feature activation | -9.55e-01 |
Pos logit contributions | |
ricks | +4.996 |
--------------- | +4.559 |
idth | +4.557 |
abama | +4.395 |
enriched | +4.341 |
Neg logit contributions | |
ULAR | -6.787 |
aido | -6.769 |
Versus | -6.722 |
eur | -6.720 |
INESS | -6.599 |
Token | From |
Token ID | 4863 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
ricks | +5.521 |
idth | +5.111 |
--------------- | +5.105 |
abama | +4.977 |
dy | +4.885 |
Neg logit contributions | |
Versus | -5.080 |
ULAR | -5.072 |
eur | -5.038 |
aido | -5.002 |
INESS | -4.914 |
Token | Ar |
Token ID | 3163 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
ricks | +6.512 |
--------------- | +6.217 |
idth | +6.114 |
abama | +5.906 |
dy | +5.860 |
Neg logit contributions | |
aido | -7.364 |
Versus | -7.234 |
eur | -7.120 |
opa | -6.954 |
accompan | -6.943 |
Token | gb |
Token ID | 22296 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
ricks | +6.996 |
idth | +6.350 |
dy | +6.322 |
abama | +6.041 |
--------------- | +5.710 |
Neg logit contributions | |
ULAR | -13.499 |
闘 | -13.478 |
accompan | -13.449 |
INESS | -13.277 |
Versus | -13.191 |
Token | ($ |
Token ID | 16763 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
ricks | +9.321 |
idth | +9.217 |
--------------- | +8.691 |
dy | +8.617 |
abama | +8.508 |
Neg logit contributions | |
eur | -10.253 |
aido | -10.187 |
accompan | -10.107 |
Versus | -10.067 |
opa | -9.954 |
Token | BG |
Token ID | 40469 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
ricks | +6.947 |
idth | +6.514 |
abama | +6.381 |
dy | +6.377 |
--------------- | +6.355 |
Neg logit contributions | |
Versus | -6.596 |
ULAR | -6.423 |
aido | -6.357 |
eur | -6.233 |
INESS | -6.182 |
Token | [ |
Token ID | 58 |
Feature activation | -3.42e-01 |
Pos logit contributions | |
ricks | +11.638 |
idth | +10.981 |
--------------- | +10.431 |
dy | +10.341 |
abama | +10.233 |
Neg logit contributions | |
Versus | -10.841 |
eur | -10.622 |
aido | -10.593 |
accompan | -10.433 |
atively | -10.233 |
Token | 0 |
Token ID | 15 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
ricks | +2.309 |
idth | +2.146 |
--------------- | +2.113 |
abama | +2.112 |
enriched | +2.076 |
Neg logit contributions | |
ULAR | -1.592 |
eur | -1.563 |
Versus | -1.530 |
INESS | -1.506 |
aido | -1.486 |
Token | ], |
Token ID | 4357 |
Feature activation | -5.11e-01 |
Pos logit contributions | |
ricks | +8.955 |
idth | +8.423 |
--------------- | +8.393 |
abama | +8.232 |
dy | +8.193 |
Neg logit contributions | |
aido | -7.539 |
ULAR | -7.431 |
Versus | -7.367 |
eur | -7.316 |
accompan | -7.174 |
Token | $ |
Token ID | 3 |
Feature activation | -7.96e-01 |
Pos logit contributions | |
ricks | +2.905 |
idth | +2.666 |
--------------- | +2.627 |
abama | +2.603 |
enriched | +2.539 |
Neg logit contributions | |
ULAR | -2.898 |
eur | -2.859 |
Versus | -2.841 |
aido | -2.789 |
INESS | -2.778 |
Token | BG |
Token ID | 40469 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
ricks | +4.989 |
idth | +4.631 |
--------------- | +4.583 |
abama | +4.538 |
dy | +4.436 |
Neg logit contributions | |
Versus | -3.904 |
ULAR | -3.897 |
eur | -3.853 |
aido | -3.805 |
INESS | -3.737 |
Token |
|
Token ID | 198 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
ricks | +0.109 |
idth | +0.103 |
abama | +0.098 |
enriched | +0.098 |
xual | +0.098 |
Neg logit contributions | |
eur | -0.106 |
ULAR | -0.105 |
Versus | -0.103 |
INESS | -0.100 |
aido | -0.099 |
Token | The |
Token ID | 464 |
Feature activation | -4.33e-01 |
Pos logit contributions | |
ULAR | +0.687 |
eur | +0.681 |
INESS | +0.658 |
Versus | +0.653 |
atively | +0.634 |
Neg logit contributions | |
ricks | -0.820 |
idth | -0.798 |
xual | -0.772 |
abama | -0.771 |
enriched | -0.771 |
Token | Dram |
Token ID | 36736 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
ricks | +2.756 |
idth | +2.586 |
abama | +2.531 |
--------------- | +2.525 |
akespeare | +2.441 |
Neg logit contributions | |
ULAR | -2.150 |
Versus | -2.141 |
eur | -2.131 |
INESS | -2.059 |
aido | -2.045 |
Token | atically |
Token ID | 4142 |
Feature activation | -8.64e-01 |
Pos logit contributions | |
ricks | +1.075 |
idth | +1.017 |
--------------- | +1.014 |
abama | +1.003 |
enriched | +0.990 |
Neg logit contributions | |
eur | -0.394 |
Versus | -0.384 |
ULAR | -0.380 |
aido | -0.369 |
atively | -0.369 |
Token | Different |
Token ID | 20615 |
Feature activation | -3.23e-02 |
Pos logit contributions | |
ricks | +5.037 |
idth | +4.639 |
--------------- | +4.593 |
abama | +4.527 |
enriched | +4.446 |
Neg logit contributions | |
ULAR | -4.703 |
eur | -4.646 |
Versus | -4.593 |
aido | -4.555 |
INESS | -4.513 |
Token | Attention |
Token ID | 47406 |
Feature activation | -2.16e+00 |
Pos logit contributions | |
ricks | +0.214 |
idth | +0.202 |
abama | +0.198 |
--------------- | +0.197 |
enriched | +0.194 |
Neg logit contributions | |
Versus | -0.156 |
eur | -0.152 |
ULAR | -0.150 |
INESS | -0.144 |
atively | -0.142 |
Token | Economy |
Token ID | 18493 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
ricks | +13.047 |
idth | +12.303 |
--------------- | +11.851 |
enriched | +11.721 |
dy | +11.657 |
Neg logit contributions | |
ULAR | -9.347 |
aido | -8.870 |
eur | -8.859 |
INESS | -8.817 |
atively | -8.564 |
Token | Of |
Token ID | 3226 |
Feature activation | -4.56e-01 |
Pos logit contributions | |
ricks | +0.810 |
idth | +0.758 |
abama | +0.746 |
--------------- | +0.733 |
akespeare | +0.718 |
Neg logit contributions | |
Versus | -0.725 |
eur | -0.698 |
ULAR | -0.693 |
INESS | -0.670 |
atively | -0.658 |
Token | The |
Token ID | 383 |
Feature activation | -4.85e-01 |
Pos logit contributions | |
ricks | +2.999 |
idth | +2.795 |
--------------- | +2.748 |
abama | +2.741 |
enriched | +2.675 |
Neg logit contributions | |
ULAR | -2.171 |
Versus | -2.166 |
eur | -2.153 |
aido | -2.076 |
INESS | -2.064 |
Token | Future |
Token ID | 10898 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
ricks | +3.233 |
idth | +3.016 |
--------------- | +2.961 |
abama | +2.952 |
enriched | +2.886 |
Neg logit contributions | |
ULAR | -2.278 |
Versus | -2.265 |
eur | -2.263 |
aido | -2.174 |
INESS | -2.168 |
Token |
|
Token ID | 198 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
ricks | +1.051 |
idth | +0.967 |
abama | +0.953 |
--------------- | +0.947 |
akespeare | +0.925 |
Neg logit contributions | |
Versus | -1.023 |
ULAR | -0.999 |
eur | -0.998 |
INESS | -0.966 |
aido | -0.959 |
Token | degree |
Token ID | 4922 |
Feature activation | -7.64e-03 |
Pos logit contributions | |
eur | +2.992 |
ULAR | +2.933 |
Versus | +2.933 |
semblance | +2.932 |
survival | +2.911 |
Neg logit contributions | |
ricks | -3.868 |
idth | -3.734 |
akespeare | -3.517 |
abama | -3.496 |
--------------- | -3.478 |
Token | of |
Token ID | 286 |
Feature activation | -3.33e-03 |
Pos logit contributions | |
ricks | +0.050 |
idth | +0.047 |
abama | +0.045 |
--------------- | +0.045 |
raught | +0.044 |
Neg logit contributions | |
eur | -0.038 |
ULAR | -0.038 |
Versus | -0.037 |
aido | -0.036 |
atively | -0.035 |
Token | cooperation |
Token ID | 11113 |
Feature activation | +2.64e-01 |
Pos logit contributions | |
ricks | +0.021 |
idth | +0.020 |
--------------- | +0.019 |
abama | +0.019 |
akespeare | +0.019 |
Neg logit contributions | |
eur | -0.017 |
ULAR | -0.017 |
Versus | -0.016 |
survival | -0.016 |
atively | -0.016 |
Token | from |
Token ID | 422 |
Feature activation | -7.38e-02 |
Pos logit contributions | |
eur | +1.112 |
atively | +1.064 |
Versus | +1.062 |
ULAR | +1.052 |
aido | +1.020 |
Neg logit contributions | |
ricks | -1.889 |
idth | -1.810 |
--------------- | -1.756 |
abama | -1.745 |
akespeare | -1.706 |
Token | the |
Token ID | 262 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
ricks | +0.431 |
idth | +0.403 |
--------------- | +0.386 |
abama | +0.385 |
akespeare | +0.380 |
Neg logit contributions | |
Versus | -0.410 |
ULAR | -0.410 |
eur | -0.406 |
atively | -0.395 |
aido | -0.389 |
Token | B |
Token ID | 347 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
Versus | +0.058 |
ULAR | +0.058 |
eur | +0.057 |
atively | +0.056 |
interim | +0.055 |
Neg logit contributions | |
ricks | -0.079 |
idth | -0.074 |
abama | -0.072 |
--------------- | -0.071 |
akespeare | -0.071 |
Token | CS |
Token ID | 7902 |
Feature activation | -1.56e-01 |
Pos logit contributions | |
ricks | +9.687 |
--------------- | +8.132 |
dy | +7.889 |
idth | +7.834 |
abama | +7.682 |
Neg logit contributions | |
accompan | -12.920 |
Versus | -12.757 |
eur | -12.605 |
aido | -12.397 |
ULAR | -12.386 |
Token | . |
Token ID | 13 |
Feature activation | -4.19e-02 |
Pos logit contributions | |
ricks | +1.023 |
idth | +0.953 |
--------------- | +0.931 |
abama | +0.922 |
akespeare | +0.911 |
Neg logit contributions | |
ULAR | -0.762 |
eur | -0.758 |
Versus | -0.750 |
INESS | -0.738 |
aido | -0.727 |
Token |
|
Token ID | 198 |
Feature activation | +2.59e-01 |
Pos logit contributions | |
ricks | +0.263 |
idth | +0.248 |
enriched | +0.238 |
akespeare | +0.235 |
xual | +0.232 |
Neg logit contributions | |
Versus | -0.225 |
ULAR | -0.218 |
eur | -0.218 |
INESS | -0.208 |
atively | -0.204 |
Token |
|
Token ID | 198 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
eur | +1.375 |
ULAR | +1.349 |
Versus | +1.312 |
opa | +1.265 |
INESS | +1.263 |
Neg logit contributions | |
ricks | -1.588 |
idth | -1.536 |
enriched | -1.468 |
xual | -1.464 |
akespeare | -1.453 |
Token | At |
Token ID | 2953 |
Feature activation | -9.09e-01 |
Pos logit contributions | |
ULAR | +0.576 |
eur | +0.568 |
INESS | +0.545 |
Versus | +0.537 |
atively | +0.529 |
Neg logit contributions | |
ricks | -0.648 |
idth | -0.631 |
enriched | -0.614 |
xual | -0.611 |
akespeare | -0.593 |
Token | . |
Token ID | 13 |
Feature activation | -4.21e-01 |
Pos logit contributions | |
ricks | +5.735 |
--------------- | +5.488 |
dy | +5.169 |
abama | +5.057 |
idth | +4.977 |
Neg logit contributions | |
accompan | -7.301 |
aido | -7.216 |
Versus | -7.136 |
ULAR | -7.091 |
eur | -7.005 |
Token | Color |
Token ID | 10258 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
ricks | +1.953 |
idth | +1.765 |
--------------- | +1.725 |
abama | +1.717 |
enriched | +1.668 |
Neg logit contributions | |
ULAR | -2.822 |
eur | -2.788 |
Versus | -2.765 |
aido | -2.724 |
INESS | -2.715 |
Token | ] |
Token ID | 60 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
ricks | +7.371 |
idth | +6.957 |
--------------- | +6.672 |
dy | +6.663 |
dup | +6.433 |
Neg logit contributions | |
aido | -11.992 |
eur | -11.899 |
INESS | -11.840 |
Versus | -11.824 |
opa | -11.590 |
Token | :: |
Token ID | 3712 |
Feature activation | -4.61e-01 |
Pos logit contributions | |
ricks | +5.009 |
--------------- | +4.702 |
idth | +4.421 |
abama | +4.407 |
dy | +4.350 |
Neg logit contributions | |
aido | -7.223 |
ULAR | -7.195 |
Versus | -7.109 |
eur | -7.069 |
INESS | -6.971 |
Token | From |
Token ID | 4863 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
ricks | +2.731 |
idth | +2.523 |
--------------- | +2.497 |
abama | +2.464 |
enriched | +2.400 |
Neg logit contributions | |
ULAR | -2.470 |
eur | -2.446 |
Versus | -2.431 |
aido | -2.395 |
INESS | -2.369 |
Token | Ar |
Token ID | 3163 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
ricks | +5.106 |
--------------- | +4.814 |
idth | +4.793 |
abama | +4.633 |
dy | +4.508 |
Neg logit contributions | |
Versus | -6.695 |
aido | -6.677 |
eur | -6.540 |
ULAR | -6.483 |
INESS | -6.447 |
Token | gb |
Token ID | 22296 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
ricks | +5.411 |
abama | +4.779 |
dy | +4.699 |
idth | +4.663 |
--------------- | +4.188 |
Neg logit contributions | |
accompan | -16.866 |
INESS | -16.408 |
闘 | -16.404 |
Versus | -16.371 |
ULAR | -16.268 |
Token | ($ |
Token ID | 16763 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
ricks | +4.379 |
idth | +4.000 |
dy | +3.856 |
abama | +3.693 |
--------------- | +3.682 |
Neg logit contributions | |
Versus | -10.184 |
aido | -10.099 |
eur | -9.994 |
ULAR | -9.802 |
atively | -9.775 |
Token | FC |
Token ID | 4851 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
ricks | +6.642 |
idth | +6.131 |
--------------- | +6.108 |
abama | +6.000 |
dy | +5.940 |
Neg logit contributions | |
Versus | -5.612 |
ULAR | -5.514 |
eur | -5.479 |
aido | -5.466 |
INESS | -5.312 |
Token | 1 |
Token ID | 16 |
Feature activation | -9.37e-01 |
Pos logit contributions | |
ricks | +5.916 |
idth | +5.439 |
--------------- | +5.349 |
abama | +5.280 |
dy | +5.170 |
Neg logit contributions | |
Versus | -5.559 |
ULAR | -5.545 |
eur | -5.482 |
aido | -5.462 |
INESS | -5.351 |
Token | [ |
Token ID | 58 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
ricks | +5.284 |
idth | +4.853 |
--------------- | +4.803 |
abama | +4.768 |
dy | +4.654 |
Neg logit contributions | |
ULAR | -5.104 |
Versus | -5.062 |
eur | -5.050 |
aido | -5.033 |
INESS | -4.900 |
Token | All |
Token ID | 3237 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
ricks | +1.718 |
idth | +1.603 |
abama | +1.574 |
--------------- | +1.560 |
enriched | +1.557 |
Neg logit contributions | |
ULAR | -1.253 |
eur | -1.232 |
Versus | -1.209 |
INESS | -1.180 |
aido | -1.179 |
Token | Sc |
Token ID | 3351 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
ricks | +6.059 |
idth | +5.576 |
--------------- | +5.530 |
abama | +5.410 |
enriched | +5.265 |
Neg logit contributions | |
ULAR | -5.788 |
Versus | -5.751 |
eur | -5.747 |
aido | -5.710 |
INESS | -5.572 |
Token | reens |
Token ID | 5681 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
ricks | +1.004 |
--------------- | +0.959 |
idth | +0.952 |
abama | +0.952 |
xual | +0.935 |
Neg logit contributions | |
eur | -0.474 |
ULAR | -0.472 |
Versus | -0.454 |
aido | -0.453 |
opa | -0.440 |
Token | | |
Token ID | 930 |
Feature activation | -9.11e-01 |
Pos logit contributions | |
ricks | +2.378 |
idth | +2.173 |
--------------- | +2.149 |
abama | +2.137 |
enriched | +2.078 |
Neg logit contributions | |
ULAR | -2.436 |
eur | -2.415 |
Versus | -2.400 |
aido | -2.354 |
INESS | -2.340 |
Token | Where |
Token ID | 6350 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
ricks | +5.590 |
idth | +5.195 |
--------------- | +5.159 |
abama | +5.100 |
enriched | +4.982 |
Neg logit contributions | |
ULAR | -4.592 |
eur | -4.520 |
Versus | -4.470 |
aido | -4.466 |
INESS | -4.446 |
Token | Primary |
Token ID | 21087 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
idth | +11.015 |
--------------- | +10.872 |
ricks | +10.189 |
dup | +10.073 |
abama | +10.040 |
Neg logit contributions | |
aido | -12.250 |
eur | -11.793 |
INESS | -11.723 |
accompan | -11.590 |
ULAR | -11.428 |
Token | | |
Token ID | 930 |
Feature activation | -7.76e-01 |
Pos logit contributions | |
ricks | +11.089 |
--------------- | +10.823 |
idth | +10.674 |
abama | +10.228 |
dy | +9.965 |
Neg logit contributions | |
aido | -10.333 |
ULAR | -9.955 |
opa | -9.921 |
eur | -9.778 |
accompan | -9.707 |
Token | Select |
Token ID | 9683 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
ricks | +4.633 |
idth | +4.294 |
--------------- | +4.244 |
abama | +4.194 |
enriched | +4.092 |
Neg logit contributions | |
ULAR | -4.103 |
eur | -4.053 |
Versus | -4.015 |
aido | -3.973 |
INESS | -3.939 |
Token | - |
Token ID | 532 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
ricks | +5.038 |
idth | +4.704 |
--------------- | +4.648 |
abama | +4.577 |
enriched | +4.484 |
Neg logit contributions | |
ULAR | -4.147 |
eur | -4.092 |
Versus | -4.050 |
aido | -4.007 |
INESS | -3.991 |
Token | Exp |
Token ID | 16870 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
ricks | +5.893 |
idth | +5.468 |
--------------- | +5.405 |
abama | +5.325 |
enriched | +5.162 |
Neg logit contributions | |
ULAR | -5.573 |
eur | -5.471 |
Versus | -5.446 |
aido | -5.426 |
INESS | -5.425 |
Token | and |
Token ID | 392 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
ricks | +6.594 |
--------------- | +6.259 |
idth | +6.128 |
abama | +5.758 |
dy | +5.723 |
Neg logit contributions | |
ULAR | -10.614 |
aido | -10.487 |
eur | -10.425 |
INESS | -10.375 |
Versus | -10.205 |
Token | I |
Token ID | 314 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
Versus | +8.078 |
moderately | +7.885 |
rudimentary | +7.557 |
mildly | +7.548 |
outside | +7.529 |
Neg logit contributions | |
ricks | -12.957 |
idth | -12.457 |
abama | -12.300 |
raught | -11.996 |
xual | -11.943 |
Token | can |
Token ID | 460 |
Feature activation | +5.09e-01 |
Pos logit contributions | |
eur | +3.947 |
aido | +3.861 |
Versus | +3.860 |
moderately | +3.794 |
vaguely | +3.699 |
Neg logit contributions | |
ricks | -7.121 |
idth | -6.964 |
abama | -6.693 |
--------------- | -6.467 |
xual | -6.340 |
Token | 't |
Token ID | 470 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
eur | +1.942 |
Versus | +1.909 |
moderately | +1.840 |
aido | +1.806 |
vaguely | +1.806 |
Neg logit contributions | |
ricks | -3.688 |
idth | -3.515 |
abama | -3.471 |
--------------- | -3.467 |
uliffe | -3.384 |
Token | deny |
Token ID | 10129 |
Feature activation | +9.21e-02 |
Pos logit contributions | |
Versus | +1.966 |
eur | +1.912 |
moderately | +1.865 |
ULAR | +1.830 |
aido | +1.827 |
Neg logit contributions | |
ricks | -2.644 |
idth | -2.494 |
abama | -2.463 |
uliffe | -2.463 |
--------------- | -2.416 |
Token | how |
Token ID | 703 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
eur | +0.482 |
Versus | +0.481 |
ULAR | +0.477 |
atively | +0.466 |
aido | +0.457 |
Neg logit contributions | |
ricks | -0.560 |
idth | -0.520 |
abama | -0.517 |
--------------- | -0.513 |
akespeare | -0.502 |
Token | visually |
Token ID | 22632 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
ricks | +6.931 |
--------------- | +6.344 |
idth | +6.322 |
enriched | +6.211 |
abama | +6.169 |
Neg logit contributions | |
ULAR | -6.190 |
Versus | -6.103 |
eur | -6.073 |
aido | -6.030 |
INESS | -5.984 |
Token | stunning |
Token ID | 13393 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
ricks | +11.305 |
enriched | +10.732 |
enrich | +10.565 |
--------------- | +10.416 |
dy | +10.270 |
Neg logit contributions | |
Versus | -10.537 |
ULAR | -10.534 |
INESS | -10.460 |
aido | -10.387 |
eur | -10.076 |
Token | and |
Token ID | 290 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
ricks | +1.291 |
abama | +1.176 |
idth | +1.169 |
--------------- | +1.154 |
akespeare | +1.131 |
Neg logit contributions | |
Versus | -1.422 |
ULAR | -1.421 |
eur | -1.405 |
aido | -1.364 |
INESS | -1.353 |
Token | colorful |
Token ID | 20239 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
ricks | +2.049 |
idth | +1.940 |
abama | +1.886 |
--------------- | +1.869 |
akespeare | +1.814 |
Neg logit contributions | |
eur | -1.551 |
ULAR | -1.548 |
Versus | -1.515 |
aido | -1.476 |
atively | -1.465 |
Token | Marvel |
Token ID | 9923 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
ricks | +1.457 |
idth | +1.326 |
abama | +1.320 |
--------------- | +1.307 |
akespeare | +1.267 |
Neg logit contributions | |
ULAR | -1.660 |
Versus | -1.646 |
eur | -1.633 |
aido | -1.587 |
INESS | -1.576 |
Token | 's |
Token ID | 338 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
ricks | +0.675 |
abama | +0.633 |
idth | +0.628 |
--------------- | +0.623 |
akespeare | +0.610 |
Neg logit contributions | |
ULAR | -0.530 |
Versus | -0.524 |
eur | -0.512 |
INESS | -0.504 |
aido | -0.494 |
Token | and |
Token ID | 290 |
Feature activation | +2.05e-01 |
Pos logit contributions | |
ricks | +1.986 |
idth | +1.875 |
abama | +1.824 |
--------------- | +1.821 |
xual | +1.766 |
Neg logit contributions | |
ULAR | -1.677 |
Versus | -1.670 |
eur | -1.669 |
aido | -1.617 |
opa | -1.593 |
Token | it |
Token ID | 340 |
Feature activation | -5.28e-01 |
Pos logit contributions | |
eur | +1.054 |
ULAR | +1.037 |
Versus | +1.033 |
atively | +1.010 |
aido | +1.003 |
Neg logit contributions | |
ricks | -1.256 |
idth | -1.197 |
--------------- | -1.149 |
abama | -1.147 |
xual | -1.119 |
Token | will |
Token ID | 481 |
Feature activation | -5.27e-01 |
Pos logit contributions | |
ricks | +3.163 |
idth | +2.950 |
--------------- | +2.892 |
abama | +2.877 |
enriched | +2.776 |
Neg logit contributions | |
eur | -2.820 |
ULAR | -2.803 |
Versus | -2.766 |
aido | -2.709 |
INESS | -2.687 |
Token | turn |
Token ID | 1210 |
Feature activation | -5.19e-01 |
Pos logit contributions | |
ricks | +3.402 |
idth | +3.197 |
--------------- | +3.143 |
abama | +3.131 |
xual | +3.016 |
Neg logit contributions | |
eur | -2.576 |
ULAR | -2.570 |
Versus | -2.517 |
aido | -2.474 |
opa | -2.423 |
Token | a |
Token ID | 257 |
Feature activation | -7.81e-01 |
Pos logit contributions | |
ricks | +3.426 |
idth | +3.198 |
--------------- | +3.154 |
abama | +3.122 |
enriched | +3.046 |
Neg logit contributions | |
ULAR | -2.459 |
eur | -2.428 |
Versus | -2.413 |
aido | -2.353 |
INESS | -2.322 |
Token | spotlight |
Token ID | 17838 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
ricks | +4.673 |
idth | +4.321 |
--------------- | +4.263 |
abama | +4.221 |
enriched | +4.119 |
Neg logit contributions | |
ULAR | -4.156 |
eur | -4.108 |
Versus | -4.080 |
aido | -4.011 |
INESS | -3.977 |
Token | on |
Token ID | 319 |
Feature activation | -6.89e-01 |
Pos logit contributions | |
ricks | +10.016 |
enriched | +9.756 |
dy | +9.708 |
wards | +9.593 |
idth | +9.357 |
Neg logit contributions | |
INESS | -10.377 |
aido | -10.193 |
eur | -10.013 |
ULAR | -9.987 |
Versus | -9.973 |
Token | the |
Token ID | 262 |
Feature activation | -3.33e-01 |
Pos logit contributions | |
ricks | +3.945 |
idth | +3.637 |
--------------- | +3.583 |
abama | +3.544 |
enriched | +3.452 |
Neg logit contributions | |
ULAR | -3.851 |
eur | -3.811 |
Versus | -3.787 |
aido | -3.721 |
INESS | -3.691 |
Token | pivotal |
Token ID | 28992 |
Feature activation | -8.95e-01 |
Pos logit contributions | |
ricks | +2.041 |
idth | +1.898 |
--------------- | +1.854 |
abama | +1.826 |
xual | +1.797 |
Neg logit contributions | |
ULAR | -1.752 |
eur | -1.748 |
Versus | -1.743 |
atively | -1.660 |
aido | -1.659 |
Token | role |
Token ID | 2597 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
ricks | +4.671 |
idth | +4.272 |
--------------- | +4.207 |
abama | +4.167 |
enriched | +4.066 |
Neg logit contributions | |
ULAR | -5.407 |
eur | -5.340 |
Versus | -5.296 |
aido | -5.272 |
INESS | -5.220 |
Token | that |
Token ID | 326 |
Feature activation | -4.27e-01 |
Pos logit contributions | |
ricks | +6.013 |
enriched | +5.437 |
idth | +5.410 |
--------------- | +5.371 |
abama | +5.353 |
Neg logit contributions | |
ULAR | -6.860 |
INESS | -6.830 |
aido | -6.757 |
Versus | -6.744 |
eur | -6.743 |
Token | . |
Token ID | 13 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
ricks | +5.205 |
--------------- | +4.970 |
dy | +4.677 |
abama | +4.631 |
idth | +4.556 |
Neg logit contributions | |
aido | -6.313 |
accompan | -6.308 |
Versus | -6.285 |
ULAR | -6.243 |
eur | -6.155 |
Token | Font |
Token ID | 23252 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
ricks | +0.547 |
idth | +0.487 |
--------------- | +0.476 |
abama | +0.472 |
enriched | +0.456 |
Neg logit contributions | |
ULAR | -0.947 |
eur | -0.938 |
Versus | -0.931 |
aido | -0.920 |
INESS | -0.916 |
Token | Style |
Token ID | 21466 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
ricks | +4.077 |
--------------- | +3.560 |
idth | +3.539 |
dy | +3.403 |
abama | +3.195 |
Neg logit contributions | |
Versus | -8.659 |
aido | -8.642 |
ULAR | -8.593 |
eur | -8.554 |
opa | -8.444 |
Token | ] |
Token ID | 60 |
Feature activation | -6.56e-01 |
Pos logit contributions | |
ricks | +6.716 |
--------------- | +6.377 |
idth | +6.026 |
dy | +5.927 |
abama | +5.898 |
Neg logit contributions | |
aido | -8.985 |
Versus | -8.952 |
accompan | -8.915 |
ULAR | -8.845 |
eur | -8.843 |
Token | :: |
Token ID | 3712 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
ricks | +3.273 |
--------------- | +2.991 |
idth | +2.945 |
abama | +2.894 |
dy | +2.810 |
Neg logit contributions | |
ULAR | -4.095 |
Versus | -4.046 |
eur | -4.032 |
aido | -4.015 |
INESS | -3.953 |
Token | B |
Token ID | 33 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
ULAR | +1.214 |
eur | +1.156 |
Versus | +1.110 |
INESS | +1.107 |
aido | +1.094 |
Neg logit contributions | |
ricks | -1.653 |
idth | -1.557 |
xual | -1.524 |
abama | -1.521 |
enriched | -1.506 |
Token | old |
Token ID | 727 |
Feature activation | -7.62e-01 |
Pos logit contributions | |
ricks | +7.443 |
dy | +6.327 |
idth | +6.201 |
--------------- | +6.078 |
orate | +5.775 |
Neg logit contributions | |
Versus | -14.580 |
INESS | -14.412 |
accompan | -14.374 |
闘 | -14.102 |
semblance | -13.938 |
Token | ) |
Token ID | 8 |
Feature activation | -5.26e-01 |
Pos logit contributions | |
ricks | +3.554 |
idth | +3.301 |
--------------- | +3.237 |
abama | +3.210 |
enriched | +3.131 |
Neg logit contributions | |
Versus | -4.740 |
ULAR | -4.721 |
aido | -4.687 |
eur | -4.659 |
INESS | -4.609 |
Token | $ |
Token ID | 720 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
ricks | +2.356 |
idth | +2.151 |
--------------- | +2.124 |
abama | +2.056 |
dup | +2.028 |
Neg logit contributions | |
ULAR | -3.519 |
aido | -3.473 |
eur | -3.461 |
Versus | -3.453 |
INESS | -3.420 |
Token | Br |
Token ID | 9414 |
Feature activation | -7.85e-01 |
Pos logit contributions | |
ricks | +5.418 |
idth | +4.806 |
--------------- | +4.759 |
dy | +4.628 |
abama | +4.577 |
Neg logit contributions | |
Versus | -7.668 |
ULAR | -7.584 |
INESS | -7.429 |
aido | -7.424 |
eur | -7.369 |
Token | ush |
Token ID | 1530 |
Feature activation | -6.85e-01 |
Pos logit contributions | |
ricks | +4.314 |
idth | +3.876 |
--------------- | +3.858 |
abama | +3.795 |
akespeare | +3.664 |
Neg logit contributions | |
ULAR | -4.562 |
Versus | -4.518 |
eur | -4.456 |
INESS | -4.403 |
aido | -4.343 |
Token | you |
Token ID | 345 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
ricks | +3.276 |
idth | +3.072 |
abama | +3.024 |
--------------- | +2.997 |
akespeare | +2.920 |
Neg logit contributions | |
Versus | -2.461 |
ULAR | -2.457 |
eur | -2.436 |
aido | -2.375 |
INESS | -2.338 |
Token | will |
Token ID | 481 |
Feature activation | -6.89e-01 |
Pos logit contributions | |
ricks | +1.727 |
idth | +1.637 |
abama | +1.606 |
--------------- | +1.562 |
xual | +1.548 |
Neg logit contributions | |
Versus | -1.271 |
eur | -1.255 |
ULAR | -1.255 |
aido | -1.214 |
opa | -1.191 |
Token | see |
Token ID | 766 |
Feature activation | -3.90e-01 |
Pos logit contributions | |
ricks | +4.455 |
idth | +4.152 |
abama | +4.078 |
--------------- | +4.075 |
akespeare | +3.953 |
Neg logit contributions | |
ULAR | -3.358 |
eur | -3.326 |
Versus | -3.305 |
aido | -3.233 |
INESS | -3.175 |
Token | all |
Token ID | 477 |
Feature activation | -7.44e-01 |
Pos logit contributions | |
ricks | +2.416 |
idth | +2.251 |
abama | +2.216 |
--------------- | +2.205 |
akespeare | +2.144 |
Neg logit contributions | |
ULAR | -2.008 |
eur | -2.004 |
Versus | -2.003 |
aido | -1.928 |
INESS | -1.914 |
Token | available |
Token ID | 1695 |
Feature activation | -8.79e-01 |
Pos logit contributions | |
ricks | +4.339 |
idth | +3.999 |
--------------- | +3.949 |
abama | +3.906 |
enriched | +3.817 |
Neg logit contributions | |
ULAR | -4.066 |
eur | -4.020 |
Versus | -3.992 |
aido | -3.931 |
INESS | -3.900 |
Token | B |
Token ID | 347 |
Feature activation | -2.05e+00 |
Pos logit contributions | |
ricks | +4.693 |
idth | +4.270 |
--------------- | +4.227 |
abama | +4.172 |
enriched | +4.119 |
Neg logit contributions | |
ULAR | -5.172 |
eur | -5.113 |
Versus | -5.045 |
aido | -5.041 |
INESS | -4.998 |
Token | isc |
Token ID | 2304 |
Feature activation | +6.45e-01 |
Pos logit contributions | |
ricks | +9.891 |
idth | +8.271 |
--------------- | +8.034 |
abama | +7.766 |
akespeare | +7.744 |
Neg logit contributions | |
eur | -12.018 |
ULAR | -11.900 |
Versus | -11.738 |
INESS | -11.668 |
aido | -11.455 |
Token | uit |
Token ID | 5013 |
Feature activation | -6.37e-01 |
Pos logit contributions | |
ULAR | +2.296 |
eur | +2.231 |
opa | +2.200 |
Versus | +2.186 |
aido | +2.181 |
Neg logit contributions | |
ricks | -4.737 |
--------------- | -4.572 |
idth | -4.520 |
abama | -4.463 |
xual | -4.452 |
Token | pets |
Token ID | 17252 |
Feature activation | +7.65e-02 |
Pos logit contributions | |
ricks | +3.353 |
idth | +3.073 |
--------------- | +3.022 |
abama | +2.989 |
enriched | +2.900 |
Neg logit contributions | |
ULAR | -3.852 |
eur | -3.815 |
Versus | -3.796 |
aido | -3.732 |
INESS | -3.706 |
Token | . |
Token ID | 13 |
Feature activation | -3.48e-01 |
Pos logit contributions | |
Versus | +0.369 |
ULAR | +0.363 |
eur | +0.362 |
aido | +0.350 |
atively | +0.348 |
Neg logit contributions | |
ricks | -0.493 |
idth | -0.469 |
abama | -0.452 |
--------------- | -0.450 |
akespeare | -0.444 |
Token | Similarly |
Token ID | 15298 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
ricks | +2.108 |
idth | +1.977 |
abama | +1.921 |
--------------- | +1.886 |
enriched | +1.880 |
Neg logit contributions | |
Versus | -1.864 |
ULAR | -1.845 |
eur | -1.833 |
aido | -1.758 |
INESS | -1.749 |
Token | System |
Token ID | 11964 |
Feature activation | -5.83e-01 |
Pos logit contributions | |
ricks | +0.124 |
idth | +0.114 |
abama | +0.111 |
--------------- | +0.110 |
enriched | +0.110 |
Neg logit contributions | |
ULAR | -0.120 |
eur | -0.117 |
Versus | -0.115 |
INESS | -0.114 |
aido | -0.112 |
Token | . |
Token ID | 13 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
ricks | +3.094 |
idth | +2.862 |
--------------- | +2.853 |
abama | +2.820 |
dy | +2.750 |
Neg logit contributions | |
ULAR | -3.324 |
Versus | -3.317 |
eur | -3.288 |
aido | -3.262 |
INESS | -3.216 |
Token | Draw |
Token ID | 25302 |
Feature activation | -6.07e-01 |
Pos logit contributions | |
ricks | +2.137 |
idth | +1.977 |
--------------- | +1.938 |
abama | +1.926 |
enriched | +1.892 |
Neg logit contributions | |
ULAR | -1.943 |
eur | -1.917 |
Versus | -1.890 |
aido | -1.859 |
INESS | -1.850 |
Token | ing |
Token ID | 278 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
ricks | +3.876 |
idth | +3.592 |
--------------- | +3.560 |
abama | +3.517 |
enriched | +3.426 |
Neg logit contributions | |
ULAR | -2.971 |
Versus | -2.916 |
eur | -2.914 |
aido | -2.860 |
INESS | -2.837 |
Token | . |
Token ID | 13 |
Feature activation | -5.85e-01 |
Pos logit contributions | |
ricks | +5.934 |
--------------- | +5.397 |
idth | +5.373 |
\\ | +5.204 |
abama | +5.176 |
Neg logit contributions | |
aido | -8.703 |
Versus | -8.588 |
accompan | -8.569 |
opa | -8.565 |
eur | -8.522 |
Token | Color |
Token ID | 10258 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
ricks | +4.143 |
idth | +3.880 |
--------------- | +3.836 |
abama | +3.806 |
enriched | +3.732 |
Neg logit contributions | |
ULAR | -2.471 |
eur | -2.433 |
Versus | -2.411 |
aido | -2.359 |
INESS | -2.336 |
Token | ] |
Token ID | 60 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
ricks | +10.176 |
idth | +9.381 |
--------------- | +9.247 |
dy | +9.002 |
abama | +8.859 |
Neg logit contributions | |
eur | -10.934 |
aido | -10.813 |
INESS | -10.717 |
opa | -10.677 |
Versus | -10.569 |
Token | :: |
Token ID | 3712 |
Feature activation | -9.55e-01 |
Pos logit contributions | |
ricks | +4.996 |
--------------- | +4.559 |
idth | +4.557 |
abama | +4.395 |
enriched | +4.341 |
Neg logit contributions | |
ULAR | -6.787 |
aido | -6.769 |
Versus | -6.722 |
eur | -6.720 |
INESS | -6.599 |
Token | From |
Token ID | 4863 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
ricks | +5.521 |
idth | +5.111 |
--------------- | +5.105 |
abama | +4.977 |
dy | +4.885 |
Neg logit contributions | |
Versus | -5.080 |
ULAR | -5.072 |
eur | -5.038 |
aido | -5.002 |
INESS | -4.914 |
Token | Ar |
Token ID | 3163 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
ricks | +6.512 |
--------------- | +6.217 |
idth | +6.114 |
abama | +5.906 |
dy | +5.860 |
Neg logit contributions | |
aido | -7.364 |
Versus | -7.234 |
eur | -7.120 |
opa | -6.954 |
accompan | -6.943 |
Token | gb |
Token ID | 22296 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
ricks | +6.996 |
idth | +6.350 |
dy | +6.322 |
abama | +6.041 |
--------------- | +5.710 |
Neg logit contributions | |
ULAR | -13.499 |
闘 | -13.478 |
accompan | -13.449 |
INESS | -13.277 |
Versus | -13.191 |
Token | other |
Token ID | 584 |
Feature activation | +5.00e-02 |
Pos logit contributions | |
Versus | +1.618 |
eur | +1.603 |
ULAR | +1.593 |
moderately | +1.540 |
rudimentary | +1.528 |
Neg logit contributions | |
ricks | -2.159 |
idth | -2.031 |
abama | -2.024 |
--------------- | -1.956 |
raught | -1.938 |
Token | than |
Token ID | 621 |
Feature activation | +9.67e-01 |
Pos logit contributions | |
ULAR | +0.237 |
Versus | +0.234 |
eur | +0.233 |
atively | +0.228 |
aido | +0.224 |
Neg logit contributions | |
ricks | -0.334 |
idth | -0.313 |
abama | -0.308 |
--------------- | -0.299 |
raught | -0.298 |
Token | 8 |
Token ID | 807 |
Feature activation | +4.78e-02 |
Pos logit contributions | |
Versus | +4.610 |
rudimentary | +4.559 |
ULAR | +4.540 |
moderately | +4.470 |
survival | +4.448 |
Neg logit contributions | |
ricks | -5.831 |
abama | -5.654 |
idth | -5.571 |
akespeare | -5.402 |
--------------- | -5.376 |
Token | - |
Token ID | 12 |
Feature activation | -6.04e-01 |
Pos logit contributions | |
ULAR | +0.170 |
eur | +0.168 |
Versus | +0.166 |
aido | +0.160 |
INESS | +0.157 |
Neg logit contributions | |
ricks | -0.369 |
idth | -0.347 |
abama | -0.345 |
--------------- | -0.345 |
akespeare | -0.337 |
Token | bit |
Token ID | 2545 |
Feature activation | -6.25e-01 |
Pos logit contributions | |
ricks | +3.189 |
idth | +2.926 |
--------------- | +2.873 |
abama | +2.849 |
enriched | +2.769 |
Neg logit contributions | |
ULAR | -3.645 |
eur | -3.607 |
Versus | -3.585 |
aido | -3.539 |
INESS | -3.505 |
Token | A |
Token ID | 317 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
ricks | +3.860 |
idth | +3.586 |
--------------- | +3.528 |
abama | +3.516 |
akespeare | +3.411 |
Neg logit contributions | |
ULAR | -3.222 |
eur | -3.175 |
Versus | -3.165 |
aido | -3.102 |
INESS | -3.065 |
Token | VR |
Token ID | 13024 |
Feature activation | -8.78e-01 |
Pos logit contributions | |
ricks | +10.503 |
--------------- | +9.734 |
dy | +8.958 |
enriched | +8.830 |
idth | +8.793 |
Neg logit contributions | |
ULAR | -11.090 |
eur | -10.879 |
Versus | -10.782 |
INESS | -10.749 |
aido | -10.529 |
Token | is |
Token ID | 318 |
Feature activation | +8.38e-01 |
Pos logit contributions | |
ricks | +5.259 |
idth | +4.850 |
--------------- | +4.792 |
abama | +4.703 |
enriched | +4.644 |
Neg logit contributions | |
ULAR | -4.614 |
eur | -4.571 |
Versus | -4.524 |
aido | -4.460 |
INESS | -4.427 |
Token | far |
Token ID | 1290 |
Feature activation | +7.04e-01 |
Pos logit contributions | |
Versus | +3.689 |
eur | +3.683 |
rudimentary | +3.577 |
moderately | +3.543 |
ULAR | +3.513 |
Neg logit contributions | |
idth | -5.477 |
ricks | -5.449 |
abama | -5.213 |
xual | -5.140 |
akespeare | -5.034 |
Token | more |
Token ID | 517 |
Feature activation | +3.45e-02 |
Pos logit contributions | |
eur | +3.070 |
Versus | +2.829 |
rudimentary | +2.653 |
survival | +2.617 |
aido | +2.589 |
Neg logit contributions | |
idth | -4.866 |
ricks | -4.851 |
xual | -4.611 |
abama | -4.526 |
akespeare | -4.438 |
Token | challenging |
Token ID | 9389 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
eur | +0.179 |
ULAR | +0.177 |
Versus | +0.176 |
aido | +0.169 |
atively | +0.169 |
Neg logit contributions | |
ricks | -0.212 |
idth | -0.205 |
abama | -0.200 |
xual | -0.190 |
--------------- | -0.189 |
Token | mp |
Token ID | 3149 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
ricks | +3.205 |
idth | +2.157 |
dy | +2.071 |
--------------- | +2.059 |
abama | +2.030 |
Neg logit contributions | |
Versus | -13.236 |
ULAR | -13.089 |
INESS | -12.939 |
aido | -12.626 |
accompan | -12.615 |
Token | ) |
Token ID | 8 |
Feature activation | -8.32e-01 |
Pos logit contributions | |
ricks | +4.988 |
idth | +4.665 |
abama | +4.570 |
--------------- | +4.530 |
dy | +4.432 |
Neg logit contributions | |
Versus | -8.399 |
INESS | -8.113 |
aido | -8.111 |
ULAR | -8.106 |
eur | -7.928 |
Token | $ |
Token ID | 720 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
ricks | +4.634 |
idth | +4.342 |
--------------- | +4.298 |
abama | +4.190 |
dup | +4.168 |
Neg logit contributions | |
ULAR | -4.580 |
eur | -4.473 |
Versus | -4.467 |
aido | -4.464 |
INESS | -4.425 |
Token | image |
Token ID | 9060 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
ricks | +7.417 |
idth | +6.871 |
--------------- | +6.757 |
dy | +6.670 |
abama | +6.618 |
Neg logit contributions | |
Versus | -6.430 |
ULAR | -6.339 |
INESS | -6.105 |
aido | -6.079 |
eur | -6.067 |
Token | . |
Token ID | 13 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
ricks | +5.832 |
--------------- | +5.393 |
idth | +5.388 |
abama | +5.193 |
dy | +5.093 |
Neg logit contributions | |
ULAR | -6.084 |
aido | -6.059 |
Versus | -6.053 |
INESS | -5.984 |
eur | -5.964 |
Token | Fill |
Token ID | 33762 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
ricks | +3.549 |
idth | +3.281 |
--------------- | +3.231 |
abama | +3.205 |
enriched | +3.130 |
Neg logit contributions | |
ULAR | -3.247 |
eur | -3.212 |
Versus | -3.182 |
aido | -3.134 |
INESS | -3.104 |
Token | Rect |
Token ID | 45474 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
ricks | +10.159 |
idth | +9.844 |
--------------- | +9.840 |
dy | +9.306 |
dup | +9.228 |
Neg logit contributions | |
aido | -10.266 |
Versus | -10.141 |
eur | -10.083 |
accompan | -9.964 |
ULAR | -9.854 |
Token | angle |
Token ID | 9248 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
ricks | +6.886 |
idth | +6.382 |
--------------- | +6.209 |
dup | +6.078 |
dy | +6.052 |
Neg logit contributions | |
Versus | -8.211 |
ULAR | -8.184 |
aido | -8.168 |
eur | -8.075 |
INESS | -8.040 |
Token | ( |
Token ID | 7 |
Feature activation | -2.03e-01 |
Pos logit contributions | |
ricks | +7.897 |
idth | +7.482 |
--------------- | +7.465 |
dy | +7.059 |
dup | +7.024 |
Neg logit contributions | |
aido | -9.999 |
eur | -9.885 |
Versus | -9.850 |
ULAR | -9.789 |
accompan | -9.663 |
Token | ( |
Token ID | 357 |
Feature activation | -5.97e-02 |
Pos logit contributions | |
ricks | +1.305 |
idth | +1.195 |
abama | +1.189 |
--------------- | +1.179 |
enriched | +1.167 |
Neg logit contributions | |
ULAR | -1.014 |
eur | -0.999 |
Versus | -0.974 |
INESS | -0.957 |
aido | -0.957 |
Token | New |
Token ID | 3791 |
Feature activation | +5.54e-02 |
Pos logit contributions | |
ricks | +0.379 |
idth | +0.341 |
abama | +0.339 |
--------------- | +0.338 |
akespeare | +0.336 |
Neg logit contributions | |
ULAR | -0.308 |
eur | -0.301 |
Versus | -0.296 |
INESS | -0.289 |
aido | -0.285 |
Token | other |
Token ID | 584 |
Feature activation | +2.23e-01 |
Pos logit contributions | |
Versus | +1.787 |
ULAR | +1.748 |
eur | +1.745 |
INESS | +1.652 |
atively | +1.648 |
Neg logit contributions | |
ricks | -2.588 |
idth | -2.463 |
abama | -2.429 |
akespeare | -2.410 |
xual | -2.384 |
Token | options |
Token ID | 3689 |
Feature activation | +4.23e-01 |
Pos logit contributions | |
Versus | +1.051 |
ULAR | +1.027 |
eur | +1.021 |
survival | +0.969 |
INESS | +0.961 |
Neg logit contributions | |
ricks | -1.473 |
idth | -1.421 |
abama | -1.400 |
xual | -1.376 |
akespeare | -1.372 |
Token | to |
Token ID | 284 |
Feature activation | -9.34e-02 |
Pos logit contributions | |
Versus | +2.023 |
eur | +1.982 |
ULAR | +1.945 |
atively | +1.879 |
aido | +1.861 |
Neg logit contributions | |
ricks | -2.760 |
idth | -2.633 |
abama | -2.580 |
--------------- | -2.522 |
akespeare | -2.509 |
Token | buy |
Token ID | 2822 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
ricks | +0.643 |
idth | +0.613 |
abama | +0.603 |
--------------- | +0.594 |
akespeare | +0.587 |
Neg logit contributions | |
Versus | -0.421 |
ULAR | -0.417 |
eur | -0.411 |
aido | -0.396 |
atively | -0.388 |
Token | the |
Token ID | 262 |
Feature activation | +5.30e-01 |
Pos logit contributions | |
ricks | +0.725 |
idth | +0.684 |
abama | +0.677 |
--------------- | +0.666 |
akespeare | +0.660 |
Neg logit contributions | |
Versus | -0.603 |
ULAR | -0.595 |
eur | -0.591 |
aido | -0.569 |
INESS | -0.569 |
Token | Nexus |
Token ID | 16756 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
Versus | +2.174 |
ULAR | +2.099 |
eur | +2.071 |
INESS | +1.989 |
interim | +1.954 |
Neg logit contributions | |
ricks | -3.728 |
abama | -3.597 |
idth | -3.596 |
akespeare | -3.544 |
xual | -3.534 |
Token | 6 |
Token ID | 718 |
Feature activation | +7.82e-01 |
Pos logit contributions | |
Versus | +5.289 |
ULAR | +4.847 |
eur | +4.829 |
INESS | +4.795 |
opa | +4.576 |
Neg logit contributions | |
ricks | -11.814 |
idth | -11.495 |
abama | -11.423 |
akespeare | -11.156 |
dy | -10.984 |
Token | . |
Token ID | 13 |
Feature activation | -4.51e-02 |
Pos logit contributions | |
Versus | +3.620 |
ULAR | +3.595 |
eur | +3.456 |
INESS | +3.419 |
survival | +3.282 |
Neg logit contributions | |
ricks | -4.995 |
idth | -4.886 |
abama | -4.848 |
akespeare | -4.798 |
--------------- | -4.655 |
Token | No |
Token ID | 1400 |
Feature activation | -5.54e-01 |
Pos logit contributions | |
ricks | +0.287 |
idth | +0.269 |
abama | +0.261 |
akespeare | +0.258 |
enriched | +0.257 |
Neg logit contributions | |
Versus | -0.235 |
ULAR | -0.228 |
eur | -0.227 |
INESS | -0.218 |
aido | -0.214 |
Token | word |
Token ID | 1573 |
Feature activation | +7.15e-01 |
Pos logit contributions | |
ricks | +3.541 |
idth | +3.289 |
--------------- | +3.240 |
abama | +3.224 |
akespeare | +3.145 |
Neg logit contributions | |
ULAR | -2.743 |
eur | -2.721 |
Versus | -2.707 |
aido | -2.632 |
INESS | -2.619 |
Token | on |
Token ID | 319 |
Feature activation | +5.11e-01 |
Pos logit contributions | |
eur | +2.835 |
Versus | +2.812 |
ULAR | +2.760 |
atively | +2.716 |
aido | +2.586 |
Neg logit contributions | |
ricks | -5.079 |
idth | -4.918 |
abama | -4.779 |
akespeare | -4.746 |
raught | -4.674 |
Token | IS |
Token ID | 1797 |
Feature activation | +6.25e-01 |
Pos logit contributions | |
ULAR | +1.703 |
INESS | +1.567 |
eur | +1.514 |
Versus | +1.462 |
aido | +1.401 |
Neg logit contributions | |
ricks | -2.990 |
idth | -2.862 |
enriched | -2.848 |
enrich | -2.801 |
raught | -2.774 |
Token | CO |
Token ID | 8220 |
Feature activation | +2.49e-01 |
Pos logit contributions | |
ULAR | +1.325 |
INESS | +1.127 |
aido | +1.098 |
Versus | +1.098 |
eur | +1.083 |
Neg logit contributions | |
ricks | -5.869 |
idth | -5.786 |
abama | -5.600 |
xual | -5.573 |
enriched | -5.551 |
Token | - |
Token ID | 532 |
Feature activation | -7.39e-02 |
Pos logit contributions | |
ULAR | +1.048 |
Versus | +1.036 |
eur | +1.013 |
INESS | +0.985 |
aido | +0.966 |
Neg logit contributions | |
ricks | -1.785 |
idth | -1.691 |
abama | -1.644 |
--------------- | -1.615 |
akespeare | -1.613 |
Token | Reddit |
Token ID | 10750 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
ricks | +0.474 |
idth | +0.443 |
abama | +0.429 |
enriched | +0.426 |
--------------- | +0.423 |
Neg logit contributions | |
ULAR | -0.374 |
Versus | -0.372 |
eur | -0.367 |
INESS | -0.357 |
aido | -0.351 |
Token | and |
Token ID | 290 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
Versus | +6.869 |
ULAR | +6.851 |
interim | +6.730 |
eur | +6.724 |
opa | +6.490 |
Neg logit contributions | |
idth | -9.677 |
ricks | -9.656 |
abama | -9.578 |
raught | -9.176 |
akespeare | -9.016 |
Token | Google |
Token ID | 3012 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
Versus | +1.891 |
ULAR | +1.840 |
eur | +1.829 |
atively | +1.740 |
aido | +1.735 |
Neg logit contributions | |
ricks | -2.866 |
idth | -2.723 |
abama | -2.699 |
--------------- | -2.674 |
raught | -2.607 |
Token | are |
Token ID | 389 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
ULAR | +6.050 |
Versus | +6.036 |
interim | +5.743 |
eur | +5.670 |
survival | +5.652 |
Neg logit contributions | |
ricks | -8.814 |
idth | -8.612 |
abama | -8.413 |
xual | -8.122 |
raught | -8.085 |
Token | taking |
Token ID | 2263 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
ricks | +0.183 |
idth | +0.177 |
--------------- | +0.169 |
abama | +0.169 |
xual | +0.166 |
Neg logit contributions | |
Versus | -0.123 |
ULAR | -0.121 |
eur | -0.119 |
aido | -0.115 |
atively | -0.114 |
Token | a |
Token ID | 257 |
Feature activation | -5.27e-01 |
Pos logit contributions | |
Versus | +1.563 |
ULAR | +1.550 |
eur | +1.537 |
atively | +1.493 |
interim | +1.475 |
Neg logit contributions | |
ricks | -2.254 |
idth | -2.086 |
abama | -2.080 |
--------------- | -2.069 |
akespeare | -2.029 |
Token | tougher |
Token ID | 20516 |
Feature activation | -4.93e-01 |
Pos logit contributions | |
ricks | +3.259 |
idth | +3.024 |
--------------- | +2.979 |
abama | +2.952 |
enriched | +2.873 |
Neg logit contributions | |
ULAR | -2.719 |
eur | -2.683 |
Versus | -2.671 |
aido | -2.610 |
INESS | -2.596 |
Token | stance |
Token ID | 12046 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
ricks | +3.369 |
idth | +3.148 |
--------------- | +3.109 |
abama | +3.084 |
enriched | +3.017 |
Neg logit contributions | |
ULAR | -2.213 |
eur | -2.185 |
Versus | -2.170 |
aido | -2.117 |
INESS | -2.101 |
Token | Roe |
Token ID | 34904 |
Feature activation | +7.32e-01 |
Pos logit contributions | |
Versus | +3.618 |
eur | +3.569 |
aido | +3.250 |
ULAR | +3.193 |
INESS | +3.193 |
Neg logit contributions | |
ricks | -5.961 |
idth | -5.740 |
abama | -5.683 |
--------------- | -5.594 |
akespeare | -5.475 |
Token | " |
Token ID | 1 |
Feature activation | +4.49e-02 |
Pos logit contributions | |
Versus | +3.762 |
eur | +3.722 |
opa | +3.354 |
atively | +3.352 |
aido | +3.338 |
Neg logit contributions | |
ricks | -4.360 |
idth | -4.130 |
--------------- | -4.114 |
abama | -4.076 |
akespeare | -3.996 |
Token | through |
Token ID | 832 |
Feature activation | -6.09e-01 |
Pos logit contributions | |
Versus | +0.217 |
eur | +0.217 |
ULAR | +0.209 |
aido | +0.208 |
atively | +0.206 |
Neg logit contributions | |
ricks | -0.292 |
idth | -0.281 |
abama | -0.271 |
--------------- | -0.269 |
akespeare | -0.259 |
Token | a |
Token ID | 257 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
ricks | +4.017 |
idth | +3.749 |
--------------- | +3.699 |
abama | +3.664 |
enriched | +3.578 |
Neg logit contributions | |
ULAR | -2.882 |
eur | -2.852 |
Versus | -2.833 |
aido | -2.768 |
INESS | -2.738 |
Token | dating |
Token ID | 10691 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
Versus | +0.046 |
eur | +0.046 |
ULAR | +0.046 |
aido | +0.043 |
rudimentary | +0.043 |
Neg logit contributions | |
ricks | -0.070 |
idth | -0.066 |
--------------- | -0.064 |
abama | -0.064 |
akespeare | -0.061 |
Token | app |
Token ID | 598 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
ricks | +1.026 |
idth | +0.984 |
--------------- | +0.954 |
abama | +0.951 |
akespeare | +0.931 |
Neg logit contributions | |
eur | -0.428 |
ULAR | -0.420 |
Versus | -0.415 |
aido | -0.390 |
INESS | -0.381 |
Token | . |
Token ID | 13 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
Versus | +7.630 |
eur | +7.585 |
ULAR | +7.241 |
interim | +7.143 |
atively | +6.899 |
Neg logit contributions | |
idth | -11.053 |
ricks | -11.024 |
abama | -10.864 |
--------------- | -10.280 |
akespeare | -9.974 |
Token |
|
Token ID | 198 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
ricks | +0.946 |
idth | +0.882 |
--------------- | +0.846 |
enriched | +0.841 |
abama | +0.839 |
Neg logit contributions | |
Versus | -0.967 |
eur | -0.962 |
ULAR | -0.961 |
INESS | -0.917 |
aido | -0.915 |
Token |
|
Token ID | 198 |
Feature activation | -5.37e-01 |
Pos logit contributions | |
ricks | +1.139 |
idth | +1.065 |
abama | +1.021 |
--------------- | +1.010 |
enriched | +1.007 |
Neg logit contributions | |
ULAR | -1.211 |
eur | -1.210 |
Versus | -1.187 |
aido | -1.159 |
INESS | -1.156 |
Token | The |
Token ID | 464 |
Feature activation | -4.05e-01 |
Pos logit contributions | |
ricks | +3.020 |
idth | +2.801 |
--------------- | +2.721 |
abama | +2.719 |
enriched | +2.674 |
Neg logit contributions | |
ULAR | -3.073 |
eur | -3.047 |
Versus | -2.989 |
aido | -2.946 |
INESS | -2.942 |
Token | court |
Token ID | 2184 |
Feature activation | -8.62e-02 |
Pos logit contributions | |
ricks | +2.400 |
idth | +2.223 |
--------------- | +2.179 |
abama | +2.151 |
akespeare | +2.097 |
Neg logit contributions | |
eur | -2.212 |
ULAR | -2.210 |
Versus | -2.194 |
aido | -2.125 |
INESS | -2.109 |
Token | like |
Token ID | 588 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
ricks | +3.400 |
idth | +3.180 |
--------------- | +3.124 |
abama | +3.116 |
akespeare | +3.016 |
Neg logit contributions | |
ULAR | -2.545 |
eur | -2.518 |
Versus | -2.505 |
aido | -2.447 |
INESS | -2.420 |
Token | digital |
Token ID | 4875 |
Feature activation | -9.54e-01 |
Pos logit contributions | |
ricks | +1.742 |
abama | +1.605 |
idth | +1.603 |
--------------- | +1.568 |
akespeare | +1.557 |
Neg logit contributions | |
ULAR | -1.459 |
Versus | -1.452 |
eur | -1.438 |
aido | -1.403 |
INESS | -1.389 |
Token | Write |
Token ID | 16594 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
ricks | +5.846 |
idth | +5.428 |
--------------- | +5.368 |
abama | +5.258 |
enriched | +5.192 |
Neg logit contributions | |
ULAR | -4.843 |
eur | -4.810 |
Versus | -4.744 |
aido | -4.692 |
INESS | -4.651 |
Token | () |
Token ID | 3419 |
Feature activation | -5.89e-01 |
Pos logit contributions | |
ricks | +6.217 |
--------------- | +5.684 |
idth | +5.676 |
enriched | +5.448 |
abama | +5.437 |
Neg logit contributions | |
ULAR | -6.248 |
eur | -6.178 |
aido | -6.147 |
Versus | -6.121 |
INESS | -5.990 |
Token | is |
Token ID | 318 |
Feature activation | +8.18e-01 |
Pos logit contributions | |
ricks | +3.601 |
idth | +3.344 |
--------------- | +3.287 |
abama | +3.279 |
enriched | +3.173 |
Neg logit contributions | |
ULAR | -3.073 |
eur | -3.045 |
Versus | -3.029 |
aido | -2.959 |
INESS | -2.941 |
Token | only |
Token ID | 691 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
Versus | +3.649 |
rudimentary | +3.614 |
eur | +3.584 |
moderately | +3.556 |
ULAR | +3.473 |
Neg logit contributions | |
idth | -5.381 |
ricks | -5.276 |
abama | -5.104 |
xual | -5.051 |
akespeare | -4.864 |
Token | the |
Token ID | 262 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
moderately | +7.118 |
rudimentary | +6.887 |
mildly | +6.558 |
vaguely | +6.509 |
marginally | +6.383 |
Neg logit contributions | |
idth | -10.903 |
ricks | -10.461 |
xual | -10.250 |
abama | -10.222 |
raught | -9.852 |
Token | beginning |
Token ID | 3726 |
Feature activation | +6.79e-01 |
Pos logit contributions | |
rudimentary | +5.268 |
survival | +5.188 |
moderately | +5.148 |
interim | +5.144 |
ré | +4.933 |
Neg logit contributions | |
idth | -11.090 |
ricks | -10.854 |
xual | -10.677 |
abama | -10.432 |
raught | -10.226 |
Token | . |
Token ID | 13 |
Feature activation | +1.90e-01 |
Pos logit contributions | |
Versus | +3.109 |
eur | +3.079 |
ULAR | +3.028 |
INESS | +2.947 |
atively | +2.899 |
Neg logit contributions | |
ricks | -4.417 |
idth | -4.192 |
abama | -4.090 |
akespeare | -4.070 |
--------------- | -3.967 |
Token | For |
Token ID | 1114 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
Versus | +0.950 |
ULAR | +0.911 |
eur | +0.900 |
INESS | +0.849 |
aido | +0.846 |
Neg logit contributions | |
ricks | -1.241 |
idth | -1.175 |
abama | -1.148 |
akespeare | -1.119 |
enriched | -1.111 |
Token | example |
Token ID | 1672 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
ricks | +1.649 |
idth | +1.537 |
abama | +1.519 |
--------------- | +1.504 |
akespeare | +1.469 |
Neg logit contributions | |
ULAR | -1.419 |
eur | -1.412 |
Versus | -1.401 |
aido | -1.360 |
atively | -1.346 |
Token | best |
Token ID | 1266 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
ricks | +2.822 |
idth | +2.639 |
abama | +2.593 |
--------------- | +2.586 |
akespeare | +2.512 |
Neg logit contributions | |
ULAR | -2.023 |
eur | -2.016 |
Versus | -2.010 |
aido | -1.946 |
INESS | -1.921 |
Token | results |
Token ID | 2482 |
Feature activation | -4.21e-01 |
Pos logit contributions | |
ricks | +0.910 |
idth | +0.850 |
abama | +0.833 |
--------------- | +0.827 |
akespeare | +0.814 |
Neg logit contributions | |
ULAR | -0.617 |
eur | -0.616 |
Versus | -0.614 |
aido | -0.594 |
INESS | -0.582 |
Token | . |
Token ID | 13 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
ricks | +2.585 |
idth | +2.398 |
--------------- | +2.359 |
abama | +2.345 |
akespeare | +2.276 |
Neg logit contributions | |
ULAR | -2.181 |
eur | -2.161 |
Versus | -2.147 |
aido | -2.104 |
INESS | -2.085 |
Token | Still |
Token ID | 7831 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
Versus | +5.172 |
ULAR | +4.749 |
eur | +4.586 |
opa | +4.347 |
atively | +4.230 |
Neg logit contributions | |
ricks | -8.260 |
idth | -8.014 |
abama | -7.878 |
akespeare | -7.808 |
raught | -7.757 |
Token | , |
Token ID | 11 |
Feature activation | +6.70e-01 |
Pos logit contributions | |
eur | +4.717 |
ULAR | +4.668 |
Versus | +4.643 |
aido | +4.519 |
INESS | +4.476 |
Neg logit contributions | |
ricks | -6.547 |
idth | -6.242 |
abama | -6.238 |
akespeare | -6.036 |
--------------- | -5.934 |
Token | even |
Token ID | 772 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
Versus | +3.360 |
eur | +3.234 |
ULAR | +3.106 |
survival | +3.051 |
rudimentary | +3.035 |
Neg logit contributions | |
ricks | -4.163 |
abama | -4.094 |
idth | -3.960 |
--------------- | -3.922 |
raught | -3.837 |
Token | with |
Token ID | 351 |
Feature activation | +2.25e-03 |
Pos logit contributions | |
Versus | +8.850 |
rudimentary | +8.533 |
moderately | +8.420 |
eur | +7.951 |
ULAR | +7.875 |
Neg logit contributions | |
abama | -11.488 |
ricks | -11.381 |
idth | -11.020 |
raught | -10.871 |
akespeare | -10.752 |
Token | just |
Token ID | 655 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
Versus | +0.012 |
ULAR | +0.012 |
eur | +0.012 |
aido | +0.011 |
atively | +0.011 |
Neg logit contributions | |
ricks | -0.014 |
abama | -0.013 |
idth | -0.013 |
--------------- | -0.013 |
akespeare | -0.012 |
Token | your |
Token ID | 534 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
Versus | +6.251 |
rudimentary | +5.990 |
ULAR | +5.865 |
moderately | +5.722 |
eur | +5.683 |
Neg logit contributions | |
ricks | -7.633 |
abama | -7.459 |
idth | -7.282 |
raught | -7.205 |
akespeare | -7.164 |
Token | basic |
Token ID | 4096 |
Feature activation | +5.89e-01 |
Pos logit contributions | |
Versus | +4.749 |
ULAR | +4.587 |
rudimentary | +4.563 |
eur | +4.559 |
moderately | +4.373 |
Neg logit contributions | |
ricks | -7.258 |
abama | -6.905 |
xual | -6.760 |
akespeare | -6.663 |
idth | -6.603 |
Token | smartphone |
Token ID | 11745 |
Feature activation | +7.27e-01 |
Pos logit contributions | |
Versus | +2.974 |
ULAR | +2.882 |
eur | +2.850 |
rudimentary | +2.786 |
survival | +2.759 |
Neg logit contributions | |
ricks | -3.668 |
abama | -3.479 |
idth | -3.384 |
xual | -3.373 |
akespeare | -3.364 |
Token | story |
Token ID | 1621 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
ULAR | +2.167 |
Versus | +2.124 |
eur | +2.080 |
survival | +2.018 |
aido | +1.978 |
Neg logit contributions | |
ricks | -3.366 |
idth | -3.272 |
abama | -3.192 |
xual | -3.119 |
orate | -3.033 |
Token | : |
Token ID | 25 |
Feature activation | +2.54e-01 |
Pos logit contributions | |
ricks | +1.102 |
idth | +1.018 |
abama | +0.996 |
--------------- | +0.971 |
akespeare | +0.969 |
Neg logit contributions | |
ULAR | -1.018 |
eur | -1.007 |
Versus | -1.006 |
INESS | -0.967 |
aido | -0.964 |
Token | http |
Token ID | 2638 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
Versus | +1.341 |
ULAR | +1.339 |
eur | +1.329 |
aido | +1.295 |
INESS | +1.282 |
Neg logit contributions | |
ricks | -1.497 |
abama | -1.394 |
idth | -1.392 |
xual | -1.377 |
--------------- | -1.358 |
Token | :// |
Token ID | 1378 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
ricks | +1.495 |
idth | +1.371 |
abama | +1.326 |
--------------- | +1.318 |
enriched | +1.311 |
Neg logit contributions | |
ULAR | -1.686 |
eur | -1.679 |
Versus | -1.652 |
INESS | -1.629 |
aido | -1.617 |
Token | on |
Token ID | 261 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
eur | +0.851 |
ULAR | +0.798 |
aido | +0.798 |
opa | +0.794 |
atively | +0.771 |
Neg logit contributions | |
ricks | -1.278 |
--------------- | -1.216 |
idth | -1.197 |
abama | -1.194 |
enriched | -1.180 |
Token | . |
Token ID | 13 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
ricks | +0.730 |
idth | +0.686 |
--------------- | +0.678 |
abama | +0.675 |
enriched | +0.668 |
Neg logit contributions | |
eur | -0.579 |
ULAR | -0.563 |
aido | -0.561 |
Versus | -0.548 |
opa | -0.545 |
Token | c |
Token ID | 66 |
Feature activation | +7.58e-01 |
Pos logit contributions | |
eur | +1.654 |
aido | +1.591 |
ULAR | +1.583 |
opa | +1.570 |
atively | +1.557 |
Neg logit contributions | |
ricks | -1.866 |
--------------- | -1.750 |
idth | -1.747 |
enriched | -1.706 |
abama | -1.689 |
Token | ps |
Token ID | 862 |
Feature activation | -2.25e-01 |
Pos logit contributions | |
eur | +2.587 |
opa | +2.474 |
atively | +2.414 |
ULAR | +2.413 |
ilot | +2.374 |
Neg logit contributions | |
ricks | -5.610 |
�� | -5.519 |
enriched | -5.477 |
--------------- | -5.390 |
�� | -5.325 |
Token | j |
Token ID | 73 |
Feature activation | -2.47e-01 |
Pos logit contributions | |
ricks | +1.339 |
idth | +1.238 |
--------------- | +1.220 |
abama | +1.208 |
enriched | +1.179 |
Neg logit contributions | |
ULAR | -1.204 |
eur | -1.188 |
Versus | -1.183 |
aido | -1.162 |
INESS | -1.152 |
Token | . |
Token ID | 13 |
Feature activation | -1.86e-02 |
Pos logit contributions | |
ricks | +1.495 |
idth | +1.389 |
--------------- | +1.367 |
abama | +1.358 |
enriched | +1.332 |
Neg logit contributions | |
ULAR | -1.295 |
eur | -1.292 |
Versus | -1.270 |
aido | -1.255 |
INESS | -1.236 |
Token | com |
Token ID | 785 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
ricks | +0.143 |
idth | +0.136 |
--------------- | +0.134 |
abama | +0.132 |
enriched | +0.132 |
Neg logit contributions | |
eur | -0.068 |
ULAR | -0.066 |
aido | -0.065 |
Versus | -0.064 |
opa | -0.062 |
Token | evolution |
Token ID | 6954 |
Feature activation | +9.10e-02 |
Pos logit contributions | |
ricks | +0.791 |
idth | +0.744 |
xual | +0.728 |
abama | +0.721 |
--------------- | +0.706 |
Neg logit contributions | |
eur | -0.668 |
ULAR | -0.660 |
Versus | -0.652 |
interim | -0.638 |
INESS | -0.636 |
Token | in |
Token ID | 287 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
Versus | +0.403 |
eur | +0.402 |
ULAR | +0.400 |
atively | +0.388 |
INESS | +0.378 |
Neg logit contributions | |
ricks | -0.628 |
idth | -0.592 |
--------------- | -0.578 |
abama | -0.565 |
akespeare | -0.560 |
Token | the |
Token ID | 262 |
Feature activation | -3.34e-02 |
Pos logit contributions | |
Versus | +0.107 |
eur | +0.106 |
ULAR | +0.105 |
atively | +0.102 |
INESS | +0.102 |
Neg logit contributions | |
ricks | -0.123 |
idth | -0.114 |
--------------- | -0.110 |
abama | -0.108 |
xual | -0.108 |
Token | [ |
Token ID | 685 |
Feature activation | +4.89e-01 |
Pos logit contributions | |
ricks | +0.220 |
idth | +0.205 |
xual | +0.196 |
abama | +0.195 |
--------------- | +0.195 |
Neg logit contributions | |
Versus | -0.165 |
eur | -0.164 |
ULAR | -0.161 |
survival | -0.156 |
INESS | -0.156 |
Token | F |
Token ID | 37 |
Feature activation | -7.53e-01 |
Pos logit contributions | |
eur | +2.644 |
ULAR | +2.536 |
INESS | +2.498 |
opa | +2.453 |
aido | +2.435 |
Neg logit contributions | |
ricks | -2.847 |
idth | -2.715 |
xual | -2.685 |
enriched | -2.650 |
abama | -2.635 |
Token | DA |
Token ID | 5631 |
Feature activation | +6.02e-01 |
Pos logit contributions | |
ricks | +4.170 |
idth | +3.825 |
--------------- | +3.772 |
abama | +3.723 |
enriched | +3.611 |
Neg logit contributions | |
ULAR | -4.340 |
eur | -4.281 |
Versus | -4.275 |
aido | -4.191 |
INESS | -4.171 |
Token | 's |
Token ID | 338 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
ULAR | +2.968 |
eur | +2.960 |
Versus | +2.955 |
INESS | +2.849 |
aido | +2.820 |
Neg logit contributions | |
ricks | -3.799 |
idth | -3.534 |
--------------- | -3.467 |
abama | -3.427 |
enriched | -3.368 |
Token | ] |
Token ID | 60 |
Feature activation | -9.67e-02 |
Pos logit contributions | |
ULAR | +0.687 |
Versus | +0.682 |
eur | +0.682 |
aido | +0.655 |
INESS | +0.653 |
Neg logit contributions | |
ricks | -0.856 |
idth | -0.781 |
--------------- | -0.767 |
abama | -0.762 |
xual | -0.749 |
Token | approach |
Token ID | 3164 |
Feature activation | -6.23e-01 |
Pos logit contributions | |
ricks | +0.687 |
idth | +0.644 |
--------------- | +0.622 |
abama | +0.621 |
akespeare | +0.614 |
Neg logit contributions | |
Versus | -0.420 |
ULAR | -0.416 |
eur | -0.415 |
INESS | -0.397 |
aido | -0.394 |
Token | to |
Token ID | 284 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
ricks | +3.342 |
idth | +3.061 |
--------------- | +3.018 |
abama | +2.980 |
enriched | +2.884 |
Neg logit contributions | |
ULAR | -3.702 |
eur | -3.680 |
Versus | -3.662 |
aido | -3.593 |
INESS | -3.570 |
Token | regulating |
Token ID | 26379 |
Feature activation | +2.55e-01 |
Pos logit contributions | |
ricks | +0.731 |
idth | +0.675 |
abama | +0.649 |
--------------- | +0.645 |
akespeare | +0.637 |
Neg logit contributions | |
Versus | -0.702 |
eur | -0.697 |
ULAR | -0.690 |
INESS | -0.680 |
atively | -0.673 |
Token |
|
Token ID | 198 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
ricks | +0.635 |
idth | +0.592 |
abama | +0.564 |
--------------- | +0.562 |
enriched | +0.562 |
Neg logit contributions | |
Versus | -0.637 |
ULAR | -0.635 |
eur | -0.630 |
INESS | -0.601 |
aido | -0.601 |
Token |
|
Token ID | 198 |
Feature activation | -6.14e-01 |
Pos logit contributions | |
ricks | +1.613 |
idth | +1.493 |
abama | +1.440 |
--------------- | +1.437 |
enriched | +1.412 |
Neg logit contributions | |
ULAR | -1.807 |
eur | -1.800 |
Versus | -1.775 |
aido | -1.740 |
INESS | -1.732 |
Token | " |
Token ID | 1 |
Feature activation | -1.77e-01 |
Pos logit contributions | |
ricks | +3.353 |
idth | +3.079 |
--------------- | +3.028 |
abama | +2.998 |
enriched | +2.921 |
Neg logit contributions | |
ULAR | -3.593 |
eur | -3.555 |
Versus | -3.530 |
aido | -3.475 |
INESS | -3.452 |
Token | The |
Token ID | 464 |
Feature activation | -5.36e-02 |
Pos logit contributions | |
ricks | +1.067 |
idth | +1.010 |
abama | +0.974 |
enriched | +0.973 |
xual | +0.956 |
Neg logit contributions | |
ULAR | -0.960 |
eur | -0.949 |
Versus | -0.926 |
INESS | -0.916 |
aido | -0.896 |
Token | Finnish |
Token ID | 26838 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
ricks | +0.347 |
idth | +0.325 |
abama | +0.317 |
--------------- | +0.316 |
akespeare | +0.309 |
Neg logit contributions | |
eur | -0.261 |
ULAR | -0.260 |
Versus | -0.260 |
INESS | -0.247 |
aido | -0.244 |
Token | constitution |
Token ID | 11784 |
Feature activation | +7.05e-01 |
Pos logit contributions | |
ricks | +1.023 |
idth | +0.973 |
abama | +0.943 |
--------------- | +0.941 |
akespeare | +0.922 |
Neg logit contributions | |
Versus | -0.781 |
eur | -0.779 |
ULAR | -0.778 |
INESS | -0.740 |
aido | -0.735 |
Token | guarantees |
Token ID | 19026 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
eur | +3.059 |
atively | +2.935 |
Versus | +2.848 |
vaguely | +2.733 |
interim | +2.705 |
Neg logit contributions | |
ricks | -4.817 |
idth | -4.800 |
abama | -4.562 |
--------------- | -4.462 |
raught | -4.402 |
Token | everyone |
Token ID | 2506 |
Feature activation | +4.69e-01 |
Pos logit contributions | |
eur | +1.442 |
atively | +1.402 |
ULAR | +1.393 |
Versus | +1.389 |
survival | +1.368 |
Neg logit contributions | |
ricks | -1.827 |
idth | -1.682 |
abama | -1.678 |
--------------- | -1.637 |
akespeare | -1.603 |
Token | the |
Token ID | 262 |
Feature activation | +2.54e-01 |
Pos logit contributions | |
eur | +2.383 |
Versus | +2.252 |
ULAR | +2.251 |
atively | +2.233 |
survival | +2.233 |
Neg logit contributions | |
ricks | -2.914 |
abama | -2.731 |
idth | -2.727 |
akespeare | -2.639 |
xual | -2.630 |
Token | right |
Token ID | 826 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
eur | +1.115 |
ULAR | +1.087 |
survival | +1.058 |
Versus | +1.051 |
rudimentary | +1.031 |
Neg logit contributions | |
ricks | -1.774 |
idth | -1.655 |
abama | -1.652 |
--------------- | -1.593 |
akespeare | -1.591 |
Token | to |
Token ID | 284 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
ULAR | +1.246 |
eur | +1.235 |
Versus | +1.228 |
aido | +1.212 |
INESS | +1.204 |
Neg logit contributions | |
ricks | -0.842 |
idth | -0.759 |
--------------- | -0.745 |
abama | -0.735 |
enriched | -0.711 |
Token | seem |
Token ID | 1283 |
Feature activation | -3.42e-01 |
Pos logit contributions | |
ricks | +0.607 |
idth | +0.568 |
abama | +0.562 |
--------------- | +0.554 |
akespeare | +0.539 |
Neg logit contributions | |
ULAR | -0.463 |
Versus | -0.462 |
eur | -0.460 |
aido | -0.449 |
opa | -0.436 |
Token | to |
Token ID | 284 |
Feature activation | -3.98e-01 |
Pos logit contributions | |
ricks | +1.653 |
idth | +1.501 |
--------------- | +1.472 |
abama | +1.457 |
enriched | +1.407 |
Neg logit contributions | |
ULAR | -2.214 |
eur | -2.194 |
Versus | -2.181 |
aido | -2.152 |
INESS | -2.136 |
Token | be |
Token ID | 307 |
Feature activation | -4.60e-02 |
Pos logit contributions | |
ricks | +2.436 |
idth | +2.258 |
abama | +2.211 |
--------------- | +2.204 |
akespeare | +2.137 |
Neg logit contributions | |
ULAR | -2.084 |
eur | -2.070 |
Versus | -2.059 |
aido | -2.029 |
INESS | -1.985 |
Token | in |
Token ID | 287 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
ricks | +0.323 |
idth | +0.308 |
abama | +0.300 |
--------------- | +0.296 |
akespeare | +0.293 |
Neg logit contributions | |
Versus | -0.199 |
ULAR | -0.199 |
eur | -0.194 |
aido | -0.191 |
atively | -0.185 |
Token | the |
Token ID | 262 |
Feature activation | +2.57e-01 |
Pos logit contributions | |
ricks | +0.730 |
idth | +0.678 |
--------------- | +0.665 |
abama | +0.662 |
akespeare | +0.647 |
Neg logit contributions | |
ULAR | -0.550 |
eur | -0.546 |
Versus | -0.542 |
aido | -0.534 |
atively | -0.524 |
Token | very |
Token ID | 845 |
Feature activation | +4.47e-01 |
Pos logit contributions | |
ULAR | +1.263 |
Versus | +1.260 |
eur | +1.241 |
aido | +1.219 |
survival | +1.212 |
Neg logit contributions | |
ricks | -1.643 |
idth | -1.519 |
abama | -1.487 |
--------------- | -1.483 |
xual | -1.464 |
Token | last |
Token ID | 938 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
eur | +2.005 |
ULAR | +1.980 |
survival | +1.973 |
Versus | +1.971 |
interim | +1.919 |
Neg logit contributions | |
ricks | -2.976 |
idth | -2.805 |
--------------- | -2.726 |
xual | -2.724 |
abama | -2.717 |
Token | stage |
Token ID | 3800 |
Feature activation | +5.05e-01 |
Pos logit contributions | |
eur | +5.568 |
survival | +5.552 |
Versus | +5.447 |
ULAR | +5.371 |
possession | +5.325 |
Neg logit contributions | |
ricks | -6.858 |
idth | -6.381 |
abama | -6.261 |
akespeare | -6.244 |
xual | -6.193 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e-01 |
Pos logit contributions | |
eur | +2.343 |
Versus | +2.315 |
ULAR | +2.281 |
aido | +2.258 |
INESS | +2.201 |
Neg logit contributions | |
ricks | -3.318 |
idth | -3.094 |
abama | -3.044 |
--------------- | -2.992 |
akespeare | -2.953 |
Token | I |
Token ID | 314 |
Feature activation | +7.33e-01 |
Pos logit contributions | |
Versus | +2.735 |
eur | +2.692 |
ULAR | +2.664 |
survival | +2.658 |
aido | +2.642 |
Neg logit contributions | |
ricks | -3.401 |
idth | -3.126 |
abama | -3.117 |
akespeare | -3.019 |
--------------- | -2.977 |
Token | do |
Token ID | 466 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
aido | +2.876 |
eur | +2.872 |
Versus | +2.797 |
ULAR | +2.692 |
ilot | +2.631 |
Neg logit contributions | |
ricks | -5.171 |
idth | -4.969 |
abama | -4.929 |
akespeare | -4.729 |
--------------- | -4.712 |
Token | the |
Token ID | 262 |
Feature activation | +9.84e-02 |
Pos logit contributions | |
ricks | +1.022 |
idth | +0.955 |
abama | +0.937 |
--------------- | +0.932 |
xual | +0.914 |
Neg logit contributions | |
Versus | -0.808 |
ULAR | -0.797 |
eur | -0.791 |
INESS | -0.766 |
aido | -0.765 |
Token | newly |
Token ID | 8308 |
Feature activation | +5.14e-01 |
Pos logit contributions | |
Versus | +0.484 |
ULAR | +0.470 |
eur | +0.465 |
INESS | +0.450 |
aido | +0.447 |
Neg logit contributions | |
ricks | -0.648 |
idth | -0.603 |
abama | -0.589 |
xual | -0.588 |
--------------- | -0.583 |
Token | launched |
Token ID | 5611 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
eur | +2.124 |
Versus | +2.096 |
ULAR | +2.053 |
atively | +2.012 |
interim | +1.976 |
Neg logit contributions | |
ricks | -3.596 |
idth | -3.454 |
abama | -3.389 |
xual | -3.331 |
--------------- | -3.292 |
Token | Fol |
Token ID | 30938 |
Feature activation | +8.91e-02 |
Pos logit contributions | |
ricks | +0.798 |
idth | +0.747 |
abama | +0.730 |
--------------- | +0.727 |
xual | +0.712 |
Neg logit contributions | |
Versus | -0.637 |
ULAR | -0.630 |
eur | -0.625 |
INESS | -0.600 |
aido | -0.599 |
Token | lett |
Token ID | 15503 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
ULAR | +0.401 |
eur | +0.399 |
INESS | +0.392 |
Versus | +0.392 |
aido | +0.390 |
Neg logit contributions | |
ricks | -0.579 |
--------------- | -0.558 |
idth | -0.554 |
abama | -0.541 |
enriched | -0.541 |
Token | Knowledge |
Token ID | 20414 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
ricks | +1.752 |
idth | +1.638 |
--------------- | +1.606 |
abama | +1.597 |
xual | +1.559 |
Neg logit contributions | |
Versus | -1.419 |
ULAR | -1.413 |
eur | -1.401 |
aido | -1.355 |
INESS | -1.355 |
Token | Fund |
Token ID | 7557 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
Versus | +1.184 |
ULAR | +1.135 |
eur | +1.133 |
INESS | +1.121 |
aido | +1.111 |
Neg logit contributions | |
ricks | -1.561 |
idth | -1.457 |
abama | -1.441 |
--------------- | -1.439 |
xual | -1.422 |
Token | , |
Token ID | 11 |
Feature activation | +1.79e-01 |
Pos logit contributions | |
Versus | +1.998 |
eur | +1.974 |
ULAR | +1.940 |
INESS | +1.908 |
atively | +1.876 |
Neg logit contributions | |
ricks | -2.643 |
idth | -2.505 |
abama | -2.483 |
--------------- | -2.450 |
raught | -2.350 |
Token | a |
Token ID | 257 |
Feature activation | +7.10e-02 |
Pos logit contributions | |
Versus | +0.861 |
eur | +0.833 |
ULAR | +0.828 |
aido | +0.798 |
opa | +0.797 |
Neg logit contributions | |
ricks | -1.169 |
idth | -1.118 |
abama | -1.112 |
--------------- | -1.080 |
xual | -1.066 |
Token | venture |
Token ID | 13189 |
Feature activation | +4.98e-01 |
Pos logit contributions | |
Versus | +0.336 |
ULAR | +0.328 |
eur | +0.327 |
INESS | +0.317 |
atively | +0.315 |
Neg logit contributions | |
ricks | -0.469 |
idth | -0.446 |
abama | -0.434 |
--------------- | -0.430 |
xual | -0.424 |
Token | capital |
Token ID | 3139 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
Versus | +2.298 |
atively | +2.238 |
ULAR | +2.231 |
eur | +2.229 |
opa | +2.103 |
Neg logit contributions | |
ricks | -3.289 |
--------------- | -3.067 |
idth | -3.056 |
abama | -3.044 |
akespeare | -2.990 |
Token | where |
Token ID | 810 |
Feature activation | +6.66e-02 |
Pos logit contributions | |
Versus | +2.647 |
eur | +2.585 |
ULAR | +2.577 |
aido | +2.561 |
INESS | +2.528 |
Neg logit contributions | |
ricks | -2.986 |
idth | -2.937 |
xual | -2.803 |
abama | -2.799 |
akespeare | -2.730 |
Token | he |
Token ID | 339 |
Feature activation | -4.22e-02 |
Pos logit contributions | |
eur | +0.359 |
ULAR | +0.358 |
Versus | +0.358 |
aido | +0.349 |
INESS | +0.349 |
Neg logit contributions | |
ricks | -0.387 |
idth | -0.362 |
abama | -0.356 |
--------------- | -0.350 |
akespeare | -0.348 |
Token | pan |
Token ID | 3425 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
ricks | +0.277 |
idth | +0.259 |
abama | +0.255 |
--------------- | +0.253 |
xual | +0.248 |
Neg logit contributions | |
eur | -0.203 |
ULAR | -0.198 |
Versus | -0.198 |
aido | -0.194 |
atively | -0.187 |
Token | hand |
Token ID | 4993 |
Feature activation | +6.52e-01 |
Pos logit contributions | |
opa | +7.113 |
eur | +7.042 |
atively | +6.950 |
ULAR | +6.754 |
aido | +6.753 |
Neg logit contributions | |
idth | -7.451 |
xual | -7.367 |
enrich | -7.296 |
abama | -7.244 |
akespeare | -7.198 |
Token | les |
Token ID | 829 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
eur | +3.206 |
atively | +2.987 |
ULAR | +2.978 |
aido | +2.946 |
opa | +2.938 |
Neg logit contributions | |
idth | -4.032 |
ricks | -3.883 |
abama | -3.860 |
enrich | -3.752 |
akespeare | -3.741 |
Token | with |
Token ID | 351 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
Versus | +1.873 |
eur | +1.857 |
ULAR | +1.849 |
survival | +1.830 |
atively | +1.817 |
Neg logit contributions | |
ricks | -2.395 |
idth | -2.326 |
abama | -2.282 |
--------------- | -2.223 |
xual | -2.216 |
Token | his |
Token ID | 465 |
Feature activation | +4.02e-01 |
Pos logit contributions | |
eur | +0.617 |
ULAR | +0.617 |
Versus | +0.614 |
aido | +0.593 |
atively | +0.586 |
Neg logit contributions | |
ricks | -0.804 |
idth | -0.755 |
abama | -0.752 |
--------------- | -0.739 |
akespeare | -0.736 |
Token | friends |
Token ID | 2460 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
eur | +1.695 |
Versus | +1.675 |
ULAR | +1.670 |
survival | +1.612 |
aido | +1.602 |
Neg logit contributions | |
ricks | -2.800 |
abama | -2.646 |
idth | -2.637 |
akespeare | -2.596 |
--------------- | -2.576 |
Token | , |
Token ID | 11 |
Feature activation | +9.80e-02 |
Pos logit contributions | |
eur | +0.923 |
Versus | +0.919 |
aido | +0.911 |
ULAR | +0.911 |
INESS | +0.895 |
Neg logit contributions | |
ricks | -1.042 |
idth | -0.980 |
abama | -0.959 |
--------------- | -0.953 |
akespeare | -0.936 |
Token | holding |
Token ID | 4769 |
Feature activation | +6.10e-01 |
Pos logit contributions | |
Versus | +0.479 |
ULAR | +0.475 |
eur | +0.475 |
aido | +0.467 |
INESS | +0.454 |
Neg logit contributions | |
ricks | -0.619 |
idth | -0.585 |
abama | -0.578 |
--------------- | -0.567 |
akespeare | -0.558 |
Token | signs |
Token ID | 5895 |
Feature activation | +5.87e-01 |
Pos logit contributions | |
ULAR | +2.862 |
Versus | +2.840 |
eur | +2.829 |
rudimentary | +2.804 |
atively | +2.784 |
Neg logit contributions | |
ricks | -3.779 |
abama | -3.714 |
idth | -3.680 |
xual | -3.634 |
--------------- | -3.543 |
Token | . |
Token ID | 13 |
Feature activation | +5.05e-01 |
Pos logit contributions | |
Versus | +0.496 |
eur | +0.496 |
aido | +0.490 |
ULAR | +0.488 |
INESS | +0.484 |
Neg logit contributions | |
ricks | -0.673 |
idth | -0.619 |
abama | -0.617 |
--------------- | -0.608 |
akespeare | -0.602 |
Token | Don |
Token ID | 2094 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
Versus | +2.605 |
ULAR | +2.451 |
eur | +2.436 |
INESS | +2.271 |
opa | +2.267 |
Neg logit contributions | |
ricks | -3.210 |
idth | -3.001 |
abama | -2.918 |
enriched | -2.916 |
akespeare | -2.907 |
Token | 't |
Token ID | 470 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
eur | +0.566 |
ULAR | +0.548 |
Versus | +0.539 |
atively | +0.526 |
aido | +0.526 |
Neg logit contributions | |
ricks | -0.945 |
idth | -0.906 |
abama | -0.885 |
enriched | -0.882 |
xual | -0.874 |
Token | actually |
Token ID | 1682 |
Feature activation | -4.88e-02 |
Pos logit contributions | |
ricks | +1.667 |
idth | +1.569 |
abama | +1.552 |
--------------- | +1.535 |
akespeare | +1.510 |
Neg logit contributions | |
Versus | -1.066 |
eur | -1.064 |
ULAR | -1.051 |
aido | -1.029 |
opa | -1.003 |
Token | have |
Token ID | 423 |
Feature activation | -7.39e-02 |
Pos logit contributions | |
ricks | +0.336 |
idth | +0.319 |
abama | +0.313 |
--------------- | +0.312 |
akespeare | +0.305 |
Neg logit contributions | |
Versus | -0.215 |
eur | -0.213 |
ULAR | -0.212 |
aido | -0.209 |
opa | -0.201 |
Token | a |
Token ID | 257 |
Feature activation | -6.55e-02 |
Pos logit contributions | |
ricks | +0.444 |
idth | +0.409 |
--------------- | +0.403 |
abama | +0.400 |
akespeare | +0.395 |
Neg logit contributions | |
Versus | -0.403 |
eur | -0.398 |
ULAR | -0.388 |
aido | -0.380 |
atively | -0.375 |
Token | full |
Token ID | 1336 |
Feature activation | -4.55e-01 |
Pos logit contributions | |
ricks | +0.419 |
idth | +0.392 |
--------------- | +0.386 |
abama | +0.383 |
akespeare | +0.377 |
Neg logit contributions | |
Versus | -0.329 |
eur | -0.321 |
ULAR | -0.321 |
aido | -0.308 |
survival | -0.307 |
Token | 100 |
Token ID | 1802 |
Feature activation | +2.09e-01 |
Pos logit contributions | |
ricks | +2.949 |
idth | +2.743 |
--------------- | +2.702 |
abama | +2.677 |
xual | +2.613 |
Neg logit contributions | |
ULAR | -2.229 |
eur | -2.207 |
Versus | -2.205 |
aido | -2.132 |
INESS | -2.096 |
Token | % |
Token ID | 4 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
Versus | +1.153 |
ULAR | +1.139 |
eur | +1.136 |
aido | +1.104 |
atively | +1.076 |
Neg logit contributions | |
ricks | -1.205 |
idth | -1.109 |
abama | -1.104 |
akespeare | -1.099 |
--------------- | -1.081 |
Token | run |
Token ID | 1057 |
Feature activation | +9.63e-02 |
Pos logit contributions | |
Versus | +0.085 |
eur | +0.084 |
ULAR | +0.084 |
aido | +0.081 |
survival | +0.080 |
Neg logit contributions | |
ricks | -0.123 |
idth | -0.116 |
abama | -0.114 |
--------------- | -0.113 |
akespeare | -0.111 |
Token | recorded |
Token ID | 6264 |
Feature activation | -5.46e-01 |
Pos logit contributions | |
eur | +0.469 |
Versus | +0.464 |
ULAR | +0.462 |
aido | +0.447 |
atively | +0.442 |
Neg logit contributions | |
ricks | -0.614 |
idth | -0.574 |
abama | -0.574 |
akespeare | -0.559 |
--------------- | -0.558 |
Token | who |
Token ID | 508 |
Feature activation | +3.33e-01 |
Pos logit contributions | |
eur | +3.042 |
Versus | +2.955 |
ULAR | +2.947 |
survival | +2.925 |
moderately | +2.897 |
Neg logit contributions | |
ricks | -4.682 |
idth | -4.519 |
abama | -4.403 |
--------------- | -4.370 |
akespeare | -4.201 |
Token | know |
Token ID | 760 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
eur | +1.456 |
Versus | +1.443 |
ULAR | +1.380 |
aido | +1.372 |
survival | +1.350 |
Neg logit contributions | |
ricks | -2.327 |
idth | -2.182 |
--------------- | -2.133 |
abama | -2.126 |
raught | -2.058 |
Token | how |
Token ID | 703 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
eur | +0.822 |
ULAR | +0.820 |
Versus | +0.806 |
survival | +0.783 |
rudimentary | +0.778 |
Neg logit contributions | |
ricks | -1.105 |
abama | -1.057 |
idth | -1.055 |
--------------- | -1.028 |
raught | -1.013 |
Token | – |
Token ID | 784 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
ricks | +3.514 |
idth | +3.152 |
--------------- | +3.098 |
abama | +3.013 |
enriched | +2.985 |
Neg logit contributions | |
ULAR | -5.086 |
eur | -5.034 |
Versus | -5.008 |
aido | -4.970 |
INESS | -4.935 |
Token | in |
Token ID | 287 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
ricks | +1.191 |
idth | +1.121 |
abama | +1.107 |
--------------- | +1.096 |
raught | +1.052 |
Neg logit contributions | |
ULAR | -1.092 |
Versus | -1.091 |
eur | -1.088 |
aido | -1.059 |
atively | -1.040 |
Token | Hollywood |
Token ID | 8502 |
Feature activation | -4.11e-01 |
Pos logit contributions | |
Versus | +0.778 |
ULAR | +0.774 |
eur | +0.767 |
atively | +0.739 |
survival | +0.737 |
Neg logit contributions | |
ricks | -0.846 |
idth | -0.798 |
abama | -0.784 |
--------------- | -0.777 |
xual | -0.759 |
Token | , |
Token ID | 11 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
ricks | +2.542 |
idth | +2.374 |
--------------- | +2.336 |
abama | +2.328 |
akespeare | +2.243 |
Neg logit contributions | |
ULAR | -2.117 |
eur | -2.103 |
Versus | -2.096 |
aido | -2.025 |
INESS | -2.022 |
Token | France |
Token ID | 4881 |
Feature activation | +5.77e-02 |
Pos logit contributions | |
Versus | +0.886 |
ULAR | +0.881 |
eur | +0.877 |
survival | +0.857 |
aido | +0.836 |
Neg logit contributions | |
ricks | -1.082 |
idth | -1.033 |
abama | -1.022 |
--------------- | -1.013 |
raught | -0.973 |
Token | , |
Token ID | 11 |
Feature activation | +2.28e-02 |
Pos logit contributions | |
eur | +0.305 |
Versus | +0.303 |
ULAR | +0.300 |
aido | +0.289 |
INESS | +0.286 |
Neg logit contributions | |
ricks | -0.350 |
idth | -0.329 |
--------------- | -0.323 |
abama | -0.323 |
raught | -0.310 |
Token | even |
Token ID | 772 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
Versus | +0.119 |
ULAR | +0.117 |
eur | +0.117 |
aido | +0.113 |
survival | +0.111 |
Neg logit contributions | |
ricks | -0.138 |
idth | -0.132 |
--------------- | -0.129 |
abama | -0.128 |
raught | -0.126 |
Token | Iran |
Token ID | 4068 |
Feature activation | +6.02e-01 |
Pos logit contributions | |
Versus | +5.885 |
ULAR | +5.739 |
rudimentary | +5.714 |
eur | +5.712 |
survival | +5.698 |
Neg logit contributions | |
ricks | -7.737 |
idth | -7.445 |
raught | -7.309 |
abama | -7.251 |
--------------- | -7.246 |
Token | way |
Token ID | 1014 |
Feature activation | -3.07e-01 |
Pos logit contributions | |
ricks | +4.616 |
idth | +4.277 |
--------------- | +4.178 |
abama | +4.148 |
enriched | +4.060 |
Neg logit contributions | |
ULAR | -4.840 |
eur | -4.805 |
Versus | -4.764 |
aido | -4.666 |
INESS | -4.628 |
Token | book |
Token ID | 1492 |
Feature activation | -7.11e-02 |
Pos logit contributions | |
ricks | +2.072 |
idth | +1.950 |
--------------- | +1.911 |
abama | +1.904 |
raught | +1.846 |
Neg logit contributions | |
Versus | -1.416 |
ULAR | -1.396 |
eur | -1.392 |
aido | -1.350 |
INESS | -1.320 |
Token | to |
Token ID | 284 |
Feature activation | -7.11e-01 |
Pos logit contributions | |
ricks | +0.428 |
idth | +0.394 |
abama | +0.390 |
--------------- | +0.386 |
akespeare | +0.376 |
Neg logit contributions | |
Versus | -0.384 |
ULAR | -0.377 |
eur | -0.375 |
aido | -0.367 |
INESS | -0.363 |
Token | get |
Token ID | 651 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
ricks | +4.332 |
idth | +4.015 |
--------------- | +3.951 |
abama | +3.916 |
enriched | +3.818 |
Neg logit contributions | |
ULAR | -3.715 |
eur | -3.679 |
Versus | -3.661 |
aido | -3.587 |
INESS | -3.545 |
Token | it |
Token ID | 340 |
Feature activation | -5.52e-01 |
Pos logit contributions | |
ricks | +1.149 |
idth | +1.078 |
abama | +1.053 |
--------------- | +1.047 |
akespeare | +1.024 |
Neg logit contributions | |
eur | -0.908 |
Versus | -0.905 |
ULAR | -0.896 |
atively | -0.872 |
aido | -0.860 |
Token | started |
Token ID | 2067 |
Feature activation | -3.73e-01 |
Pos logit contributions | |
ricks | +3.596 |
idth | +3.372 |
--------------- | +3.297 |
abama | +3.285 |
akespeare | +3.190 |
Neg logit contributions | |
eur | -2.649 |
ULAR | -2.646 |
Versus | -2.644 |
aido | -2.541 |
atively | -2.530 |
Token | what |
Token ID | 644 |
Feature activation | -2.06e-01 |
Pos logit contributions | |
ricks | +2.355 |
idth | +2.207 |
abama | +2.157 |
--------------- | +2.138 |
akespeare | +2.085 |
Neg logit contributions | |
ULAR | -1.872 |
Versus | -1.867 |
eur | -1.866 |
aido | -1.811 |
INESS | -1.795 |
Token | a |
Token ID | 257 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
ricks | +1.290 |
idth | +1.182 |
abama | +1.170 |
--------------- | +1.163 |
xual | +1.132 |
Neg logit contributions | |
eur | -1.048 |
Versus | -1.040 |
ULAR | -1.034 |
aido | -1.011 |
atively | -1.007 |
Token | lifes |
Token ID | 25622 |
Feature activation | +7.22e-01 |
Pos logit contributions | |
ricks | +1.671 |
idth | +1.590 |
abama | +1.540 |
--------------- | +1.527 |
xual | +1.473 |
Neg logit contributions | |
ULAR | -1.401 |
eur | -1.400 |
Versus | -1.391 |
aido | -1.356 |
atively | -1.331 |
Token | aver |
Token ID | 8770 |
Feature activation | +2.09e-02 |
Pos logit contributions | |
Versus | +3.087 |
eur | +2.877 |
INESS | +2.858 |
survival | +2.826 |
ilot | +2.823 |
Neg logit contributions | |
ricks | -5.011 |
idth | -4.639 |
xual | -4.571 |
abama | -4.563 |
--------------- | -4.463 |
Token | . |
Token ID | 13 |
Feature activation | -1.77e-01 |
Pos logit contributions | |
Versus | +0.107 |
eur | +0.106 |
ULAR | +0.105 |
atively | +0.102 |
survival | +0.102 |
Neg logit contributions | |
ricks | -0.131 |
idth | -0.122 |
abama | -0.119 |
--------------- | -0.117 |
xual | -0.116 |
Token | to |
Token ID | 284 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
ricks | +2.411 |
idth | +2.174 |
--------------- | +2.151 |
abama | +2.104 |
enriched | +2.070 |
Neg logit contributions | |
ULAR | -3.421 |
eur | -3.369 |
Versus | -3.332 |
aido | -3.304 |
INESS | -3.265 |
Token | be |
Token ID | 307 |
Feature activation | -5.23e-02 |
Pos logit contributions | |
ricks | +3.262 |
idth | +3.053 |
--------------- | +3.005 |
abama | +2.991 |
enriched | +2.909 |
Neg logit contributions | |
ULAR | -2.329 |
eur | -2.306 |
Versus | -2.286 |
aido | -2.245 |
INESS | -2.199 |
Token | dark |
Token ID | 3223 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
ricks | +0.334 |
idth | +0.321 |
abama | +0.312 |
--------------- | +0.306 |
xual | +0.299 |
Neg logit contributions | |
ULAR | -0.256 |
eur | -0.254 |
Versus | -0.248 |
atively | -0.244 |
aido | -0.241 |
Token | , |
Token ID | 11 |
Feature activation | -3.91e-01 |
Pos logit contributions | |
ricks | +0.979 |
idth | +0.906 |
--------------- | +0.886 |
abama | +0.885 |
enriched | +0.852 |
Neg logit contributions | |
ULAR | -0.965 |
eur | -0.959 |
Versus | -0.948 |
aido | -0.933 |
INESS | -0.928 |
Token | s |
Token ID | 264 |
Feature activation | +6.30e-01 |
Pos logit contributions | |
ricks | +2.293 |
idth | +2.163 |
abama | +2.110 |
--------------- | +2.089 |
akespeare | +2.007 |
Neg logit contributions | |
ULAR | -2.127 |
eur | -2.125 |
Versus | -2.092 |
aido | -2.063 |
INESS | -2.020 |
Token | ard |
Token ID | 446 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
eur | +2.936 |
atively | +2.931 |
opa | +2.911 |
aido | +2.901 |
omew | +2.881 |
Neg logit contributions | |
ricks | -4.034 |
idth | -3.613 |
abama | -3.601 |
enriched | -3.599 |
--------------- | -3.560 |
Token | onic |
Token ID | 9229 |
Feature activation | +1.92e-02 |
Pos logit contributions | |
ricks | +0.905 |
idth | +0.852 |
--------------- | +0.848 |
abama | +0.840 |
enriched | +0.836 |
Neg logit contributions | |
eur | -0.307 |
ULAR | -0.300 |
Versus | -0.286 |
atively | -0.284 |
aido | -0.281 |
Token | , |
Token ID | 11 |
Feature activation | -3.18e-01 |
Pos logit contributions | |
ULAR | +0.099 |
eur | +0.099 |
Versus | +0.098 |
aido | +0.096 |
INESS | +0.094 |
Neg logit contributions | |
ricks | -0.117 |
idth | -0.109 |
--------------- | -0.107 |
abama | -0.106 |
enriched | -0.103 |
Token | overtly |
Token ID | 45118 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
ricks | +1.873 |
idth | +1.760 |
abama | +1.712 |
--------------- | +1.703 |
xual | +1.633 |
Neg logit contributions | |
eur | -1.728 |
ULAR | -1.724 |
Versus | -1.699 |
aido | -1.670 |
INESS | -1.634 |
Token | mean |
Token ID | 1612 |
Feature activation | +6.16e-01 |
Pos logit contributions | |
ricks | +7.148 |
--------------- | +6.535 |
idth | +6.486 |
enriched | +6.426 |
abama | +6.361 |
Neg logit contributions | |
ULAR | -6.232 |
Versus | -6.147 |
eur | -6.088 |
INESS | -6.087 |
aido | -6.082 |
Token | , |
Token ID | 11 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
eur | +3.034 |
Versus | +3.002 |
ULAR | +2.962 |
INESS | +2.957 |
aido | +2.957 |
Neg logit contributions | |
ricks | -3.749 |
idth | -3.536 |
abama | -3.494 |
--------------- | -3.396 |
enriched | -3.369 |
Token | search |
Token ID | 2989 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
ricks | +2.035 |
idth | +1.890 |
abama | +1.852 |
--------------- | +1.848 |
xual | +1.788 |
Neg logit contributions | |
ULAR | -1.577 |
Versus | -1.577 |
eur | -1.555 |
aido | -1.517 |
INESS | -1.482 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
ricks | +1.838 |
idth | +1.692 |
--------------- | +1.671 |
abama | +1.665 |
xual | +1.624 |
Neg logit contributions | |
ULAR | -1.424 |
eur | -1.410 |
Versus | -1.395 |
aido | -1.348 |
INESS | -1.347 |
Token |
|
Token ID | 198 |
Feature activation | -3.14e-02 |
Pos logit contributions | |
ricks | +2.585 |
idth | +2.400 |
abama | +2.332 |
--------------- | +2.318 |
enriched | +2.286 |
Neg logit contributions | |
Versus | -2.239 |
ULAR | -2.236 |
eur | -2.222 |
aido | -2.159 |
opa | -2.117 |
Token |
|
Token ID | 198 |
Feature activation | -4.59e-01 |
Pos logit contributions | |
ricks | +0.181 |
idth | +0.171 |
abama | +0.162 |
enriched | +0.162 |
xual | +0.162 |
Neg logit contributions | |
eur | -0.177 |
ULAR | -0.176 |
Versus | -0.172 |
INESS | -0.167 |
aido | -0.166 |
Token | The |
Token ID | 464 |
Feature activation | -8.36e-01 |
Pos logit contributions | |
ricks | +2.735 |
idth | +2.543 |
abama | +2.479 |
--------------- | +2.462 |
enriched | +2.437 |
Neg logit contributions | |
ULAR | -2.467 |
eur | -2.452 |
Versus | -2.397 |
aido | -2.372 |
INESS | -2.351 |
Token | blue |
Token ID | 4171 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
ricks | +5.337 |
idth | +4.962 |
--------------- | +4.904 |
abama | +4.853 |
enriched | +4.753 |
Neg logit contributions | |
ULAR | -4.096 |
eur | -4.043 |
Versus | -4.011 |
aido | -3.943 |
INESS | -3.909 |
Token | tiles |
Token ID | 19867 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
ricks | +9.465 |
idth | +8.984 |
--------------- | +8.785 |
enriched | +8.585 |
abama | +8.528 |
Neg logit contributions | |
ULAR | -7.928 |
aido | -7.747 |
eur | -7.705 |
INESS | -7.699 |
Versus | -7.641 |
Token | are |
Token ID | 389 |
Feature activation | -4.83e-01 |
Pos logit contributions | |
ricks | +1.485 |
idth | +1.382 |
abama | +1.362 |
--------------- | +1.357 |
xual | +1.316 |
Neg logit contributions | |
ULAR | -1.164 |
Versus | -1.161 |
eur | -1.160 |
aido | -1.135 |
INESS | -1.113 |
Token | those |
Token ID | 883 |
Feature activation | +2.84e-02 |
Pos logit contributions | |
ricks | +2.996 |
idth | +2.791 |
--------------- | +2.730 |
abama | +2.728 |
akespeare | +2.655 |
Neg logit contributions | |
ULAR | -2.479 |
Versus | -2.447 |
eur | -2.442 |
aido | -2.374 |
INESS | -2.352 |
Token | which |
Token ID | 543 |
Feature activation | -7.17e-02 |
Pos logit contributions | |
ULAR | +0.143 |
Versus | +0.141 |
eur | +0.141 |
aido | +0.135 |
atively | +0.135 |
Neg logit contributions | |
ricks | -0.179 |
idth | -0.168 |
abama | -0.165 |
--------------- | -0.162 |
akespeare | -0.159 |
Token | have |
Token ID | 423 |
Feature activation | -8.08e-02 |
Pos logit contributions | |
ricks | +0.462 |
idth | +0.429 |
abama | +0.420 |
--------------- | +0.413 |
xual | +0.409 |
Neg logit contributions | |
Versus | -0.356 |
ULAR | -0.352 |
eur | -0.349 |
aido | -0.343 |
atively | -0.333 |
Token | , |
Token ID | 11 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
ricks | +1.186 |
idth | +1.099 |
abama | +1.087 |
--------------- | +1.074 |
akespeare | +1.045 |
Neg logit contributions | |
ULAR | -0.902 |
Versus | -0.900 |
eur | -0.887 |
INESS | -0.860 |
aido | -0.857 |
Token | comprised |
Token ID | 19869 |
Feature activation | +2.82e-02 |
Pos logit contributions | |
ricks | +0.746 |
idth | +0.695 |
abama | +0.687 |
--------------- | +0.674 |
xual | +0.660 |
Neg logit contributions | |
Versus | -0.593 |
ULAR | -0.592 |
eur | -0.575 |
INESS | -0.561 |
aido | -0.561 |
Token | of |
Token ID | 286 |
Feature activation | -4.91e-01 |
Pos logit contributions | |
ULAR | +0.154 |
eur | +0.153 |
Versus | +0.152 |
aido | +0.150 |
INESS | +0.148 |
Neg logit contributions | |
ricks | -0.164 |
idth | -0.151 |
--------------- | -0.150 |
abama | -0.148 |
enriched | -0.145 |
Token | over |
Token ID | 625 |
Feature activation | -6.73e-01 |
Pos logit contributions | |
ricks | +3.154 |
idth | +2.911 |
--------------- | +2.878 |
abama | +2.870 |
enriched | +2.786 |
Neg logit contributions | |
ULAR | -2.421 |
Versus | -2.393 |
eur | -2.388 |
aido | -2.324 |
INESS | -2.312 |
Token | 200 |
Token ID | 939 |
Feature activation | -8.29e-01 |
Pos logit contributions | |
ricks | +4.339 |
idth | +4.032 |
--------------- | +3.982 |
abama | +3.950 |
enriched | +3.855 |
Neg logit contributions | |
ULAR | -3.289 |
eur | -3.249 |
Versus | -3.227 |
aido | -3.165 |
INESS | -3.132 |
Token | professional |
Token ID | 4708 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
ricks | +4.941 |
idth | +4.679 |
--------------- | +4.583 |
abama | +4.486 |
enriched | +4.427 |
Neg logit contributions | |
ULAR | -4.288 |
eur | -4.253 |
Versus | -4.187 |
aido | -4.168 |
INESS | -4.099 |
Token | TV |
Token ID | 3195 |
Feature activation | -7.89e-01 |
Pos logit contributions | |
ricks | +7.825 |
idth | +7.468 |
--------------- | +7.348 |
enriched | +7.061 |
akespeare | +7.026 |
Neg logit contributions | |
ULAR | -7.332 |
aido | -7.139 |
eur | -7.099 |
INESS | -7.017 |
opa | -6.908 |
Token | critics |
Token ID | 9188 |
Feature activation | -2.58e-02 |
Pos logit contributions | |
ricks | +5.053 |
idth | +4.703 |
--------------- | +4.646 |
abama | +4.589 |
enriched | +4.499 |
Neg logit contributions | |
ULAR | -3.858 |
eur | -3.801 |
Versus | -3.771 |
aido | -3.711 |
INESS | -3.670 |
Token | and |
Token ID | 290 |
Feature activation | -7.63e-02 |
Pos logit contributions | |
ricks | +0.160 |
idth | +0.149 |
abama | +0.146 |
--------------- | +0.144 |
xual | +0.141 |
Neg logit contributions | |
eur | -0.131 |
ULAR | -0.130 |
Versus | -0.130 |
aido | -0.128 |
INESS | -0.126 |
Token | print |
Token ID | 3601 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
ricks | +0.504 |
abama | +0.462 |
idth | +0.459 |
--------------- | +0.454 |
raught | +0.447 |
Neg logit contributions | |
Versus | -0.371 |
ULAR | -0.367 |
eur | -0.361 |
INESS | -0.353 |
aido | -0.352 |
Token | journalists |
Token ID | 9046 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
ricks | +2.107 |
abama | +1.949 |
idth | +1.936 |
--------------- | +1.930 |
xual | +1.879 |
Neg logit contributions | |
ULAR | -1.647 |
Versus | -1.634 |
eur | -1.615 |
INESS | -1.583 |
atively | -1.575 |
Token | inter |
Token ID | 987 |
Feature activation | -9.58e-01 |
Pos logit contributions | |
ricks | +1.435 |
idth | +1.342 |
--------------- | +1.329 |
abama | +1.314 |
xual | +1.259 |
Neg logit contributions | |
eur | -1.312 |
Versus | -1.290 |
ULAR | -1.288 |
aido | -1.246 |
atively | -1.236 |
Token | sp |
Token ID | 2777 |
Feature activation | +2.21e-01 |
Pos logit contributions | |
ricks | +4.801 |
idth | +4.319 |
--------------- | +4.247 |
abama | +4.189 |
dy | +4.106 |
Neg logit contributions | |
ULAR | -6.027 |
Versus | -5.873 |
eur | -5.841 |
INESS | -5.837 |
aido | -5.764 |
Token | ersed |
Token ID | 20204 |
Feature activation | -2.92e-01 |
Pos logit contributions | |
eur | +0.585 |
Versus | +0.574 |
ULAR | +0.550 |
opa | +0.542 |
atively | +0.541 |
Neg logit contributions | |
ricks | -1.856 |
idth | -1.787 |
abama | -1.785 |
--------------- | -1.776 |
enriched | -1.734 |
Token | with |
Token ID | 351 |
Feature activation | -6.33e-01 |
Pos logit contributions | |
ricks | +1.596 |
idth | +1.459 |
--------------- | +1.440 |
abama | +1.424 |
enriched | +1.409 |
Neg logit contributions | |
ULAR | -1.699 |
Versus | -1.674 |
eur | -1.671 |
aido | -1.648 |
INESS | -1.637 |
Token | red |
Token ID | 2266 |
Feature activation | -9.12e-01 |
Pos logit contributions | |
ricks | +3.745 |
idth | +3.460 |
--------------- | +3.413 |
abama | +3.378 |
enriched | +3.295 |
Neg logit contributions | |
ULAR | -3.413 |
eur | -3.374 |
Versus | -3.352 |
aido | -3.295 |
INESS | -3.268 |
Token | - |
Token ID | 12 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
ricks | +4.880 |
idth | +4.431 |
--------------- | +4.366 |
abama | +4.305 |
enriched | +4.232 |
Neg logit contributions | |
ULAR | -5.412 |
eur | -5.317 |
Versus | -5.317 |
aido | -5.252 |
INESS | -5.229 |
Token | painted |
Token ID | 47351 |
Feature activation | -8.86e-01 |
Pos logit contributions | |
ricks | +6.713 |
idth | +5.993 |
--------------- | +5.899 |
dy | +5.857 |
abama | +5.796 |
Neg logit contributions | |
ULAR | -7.168 |
Versus | -6.988 |
INESS | -6.905 |
eur | -6.834 |
aido | -6.806 |
Token | wood |
Token ID | 4898 |
Feature activation | -4.52e-01 |
Pos logit contributions | |
ricks | +5.032 |
idth | +4.535 |
--------------- | +4.513 |
abama | +4.427 |
enriched | +4.419 |
Neg logit contributions | |
ULAR | -4.929 |
Versus | -4.822 |
eur | -4.821 |
aido | -4.818 |
INESS | -4.790 |
Token | stripes |
Token ID | 28806 |
Feature activation | -3.53e-01 |
Pos logit contributions | |
ricks | +2.682 |
idth | +2.507 |
--------------- | +2.484 |
abama | +2.465 |
akespeare | +2.372 |
Neg logit contributions | |
ULAR | -2.409 |
eur | -2.403 |
Versus | -2.382 |
aido | -2.342 |
INESS | -2.308 |
Token | ( |
Token ID | 357 |
Feature activation | -6.07e-02 |
Pos logit contributions | |
ricks | +2.149 |
idth | +2.001 |
--------------- | +1.975 |
abama | +1.961 |
akespeare | +1.886 |
Neg logit contributions | |
eur | -1.847 |
ULAR | -1.839 |
Versus | -1.824 |
aido | -1.779 |
INESS | -1.754 |
Token | from |
Token ID | 6738 |
Feature activation | +1.79e-01 |
Pos logit contributions | |
ricks | +0.367 |
idth | +0.349 |
abama | +0.345 |
--------------- | +0.341 |
xual | +0.337 |
Neg logit contributions | |
eur | -0.317 |
ULAR | -0.310 |
Versus | -0.303 |
aido | -0.302 |
atively | -0.296 |
Token | List |
Token ID | 8053 |
Feature activation | -9.78e-02 |
Pos logit contributions | |
ricks | +4.568 |
idth | +4.176 |
--------------- | +4.175 |
abama | +4.013 |
enriched | +4.003 |
Neg logit contributions | |
ULAR | -4.369 |
Versus | -4.336 |
eur | -4.329 |
aido | -4.318 |
INESS | -4.307 |
Token | $ |
Token ID | 720 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
ricks | +0.520 |
idth | +0.476 |
abama | +0.467 |
--------------- | +0.464 |
akespeare | +0.448 |
Neg logit contributions | |
ULAR | -0.589 |
eur | -0.583 |
Versus | -0.582 |
INESS | -0.565 |
aido | -0.563 |
Token | w |
Token ID | 86 |
Feature activation | -3.29e-01 |
Pos logit contributions | |
ricks | +7.444 |
--------------- | +6.872 |
idth | +6.826 |
abama | +6.636 |
dy | +6.597 |
Neg logit contributions | |
Versus | -6.821 |
ULAR | -6.775 |
aido | -6.571 |
INESS | -6.566 |
eur | -6.552 |
Token | path |
Token ID | 6978 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
ricks | +1.205 |
idth | +1.045 |
--------------- | +1.041 |
abama | +1.022 |
enriched | +0.987 |
Neg logit contributions | |
ULAR | -2.518 |
eur | -2.515 |
Versus | -2.480 |
aido | -2.454 |
INESS | -2.440 |
Token | $ |
Token ID | 720 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
ricks | +6.846 |
idth | +6.322 |
--------------- | +6.311 |
abama | +6.122 |
dup | +6.082 |
Neg logit contributions | |
ULAR | -8.066 |
aido | -7.987 |
eur | -7.918 |
INESS | -7.872 |
Versus | -7.858 |
Token | image |
Token ID | 9060 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
ricks | +6.397 |
idth | +5.871 |
--------------- | +5.824 |
abama | +5.701 |
dy | +5.623 |
Neg logit contributions | |
ULAR | -6.256 |
Versus | -6.232 |
INESS | -6.045 |
eur | -6.028 |
aido | -6.013 |
Token | = |
Token ID | 796 |
Feature activation | -3.12e-01 |
Pos logit contributions | |
ricks | +6.509 |
idth | +6.054 |
--------------- | +5.969 |
abama | +5.801 |
dy | +5.669 |
Neg logit contributions | |
ULAR | -6.726 |
Versus | -6.671 |
aido | -6.600 |
eur | -6.592 |
INESS | -6.524 |
Token | [ |
Token ID | 685 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
ricks | +1.974 |
idth | +1.826 |
--------------- | +1.790 |
abama | +1.783 |
xual | +1.746 |
Neg logit contributions | |
ULAR | -1.588 |
eur | -1.570 |
Versus | -1.565 |
aido | -1.511 |
INESS | -1.493 |
Token | System |
Token ID | 11964 |
Feature activation | -3.43e-01 |
Pos logit contributions | |
ricks | +1.054 |
idth | +0.970 |
abama | +0.950 |
--------------- | +0.943 |
enriched | +0.926 |
Neg logit contributions | |
ULAR | -1.057 |
eur | -1.041 |
Versus | -1.027 |
aido | -1.002 |
INESS | -1.001 |
Token | . |
Token ID | 13 |
Feature activation | -3.04e-01 |
Pos logit contributions | |
ricks | +2.090 |
idth | +1.932 |
--------------- | +1.900 |
abama | +1.884 |
enriched | +1.838 |
Neg logit contributions | |
ULAR | -1.815 |
eur | -1.789 |
Versus | -1.773 |
aido | -1.740 |
INESS | -1.727 |
Token | Draw |
Token ID | 25302 |
Feature activation | -9.75e-01 |
Pos logit contributions | |
ricks | +1.812 |
idth | +1.686 |
--------------- | +1.643 |
abama | +1.635 |
enriched | +1.604 |
Neg logit contributions | |
ULAR | -1.644 |
eur | -1.624 |
Versus | -1.598 |
aido | -1.582 |
INESS | -1.567 |
Token | izen |
Token ID | 33977 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
ricks | +0.801 |
idth | +0.763 |
abama | +0.750 |
--------------- | +0.746 |
enriched | +0.738 |
Neg logit contributions | |
ULAR | -0.459 |
eur | -0.440 |
Versus | -0.430 |
aido | -0.430 |
INESS | -0.428 |
Token | Kernel |
Token ID | 32169 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
ricks | +1.283 |
idth | +1.200 |
abama | +1.180 |
--------------- | +1.176 |
akespeare | +1.151 |
Neg logit contributions | |
ULAR | -1.115 |
Versus | -1.105 |
eur | -1.101 |
aido | -1.070 |
INESS | -1.053 |
Token | , |
Token ID | 11 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
Versus | +1.370 |
ULAR | +1.344 |
eur | +1.299 |
aido | +1.276 |
atively | +1.271 |
Neg logit contributions | |
ricks | -1.770 |
idth | -1.694 |
abama | -1.674 |
akespeare | -1.628 |
xual | -1.626 |
Token | but |
Token ID | 475 |
Feature activation | +6.15e-01 |
Pos logit contributions | |
ricks | +1.068 |
idth | +1.014 |
abama | +1.009 |
--------------- | +0.983 |
akespeare | +0.967 |
Neg logit contributions | |
Versus | -0.848 |
ULAR | -0.847 |
eur | -0.846 |
aido | -0.818 |
INESS | -0.806 |
Token | * |
Token ID | 1635 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
eur | +2.702 |
Versus | +2.697 |
ULAR | +2.609 |
survival | +2.568 |
interim | +2.551 |
Neg logit contributions | |
ricks | -4.056 |
abama | -3.896 |
idth | -3.884 |
akespeare | -3.799 |
--------------- | -3.754 |
Token | before |
Token ID | 19052 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
ULAR | +0.747 |
eur | +0.745 |
INESS | +0.723 |
Versus | +0.714 |
aido | +0.712 |
Neg logit contributions | |
ricks | -0.896 |
idth | -0.863 |
abama | -0.856 |
akespeare | -0.835 |
enriched | -0.834 |
Token | * |
Token ID | 9 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
ricks | +5.964 |
--------------- | +5.439 |
idth | +5.411 |
abama | +5.267 |
dy | +5.205 |
Neg logit contributions | |
ULAR | -6.342 |
eur | -6.314 |
Versus | -6.256 |
aido | -6.203 |
INESS | -6.117 |
Token | the |
Token ID | 262 |
Feature activation | +6.83e-02 |
Pos logit contributions | |
ULAR | +1.136 |
Versus | +1.113 |
eur | +1.106 |
INESS | +1.076 |
aido | +1.069 |
Neg logit contributions | |
ricks | -1.358 |
idth | -1.282 |
abama | -1.275 |
akespeare | -1.237 |
--------------- | -1.235 |
Token | root |
Token ID | 6808 |
Feature activation | +4.10e-02 |
Pos logit contributions | |
ULAR | +0.363 |
Versus | +0.359 |
eur | +0.358 |
aido | +0.347 |
survival | +0.345 |
Neg logit contributions | |
ricks | -0.409 |
idth | -0.382 |
abama | -0.379 |
--------------- | -0.371 |
akespeare | -0.369 |
Token | fs |
Token ID | 9501 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
ULAR | +0.239 |
eur | +0.238 |
Versus | +0.235 |
INESS | +0.228 |
atively | +0.227 |
Neg logit contributions | |
ricks | -0.225 |
idth | -0.208 |
abama | -0.207 |
--------------- | -0.203 |
akespeare | -0.200 |
Token | , |
Token ID | 11 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
ricks | +0.809 |
idth | +0.758 |
abama | +0.749 |
--------------- | +0.737 |
xual | +0.725 |
Neg logit contributions | |
ULAR | -0.648 |
eur | -0.644 |
Versus | -0.639 |
INESS | -0.623 |
aido | -0.615 |