Token | SR |
Token ID | 12562 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
u | +16.329 |
- | +14.743 |
b | +14.602 |
ire | +14.477 |
id | +14.371 |
Neg logit contributions | |
disparate | -16.654 |
relentless | -15.768 |
hindsight | -15.608 |
newer | -15.589 |
totality | -15.573 |
Token | . |
Token ID | 13 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
. | +30.291 |
u | +28.171 |
- | +27.743 |
ag | +25.631 |
_ | +25.628 |
Neg logit contributions | |
disparate | -18.752 |
proactive | -18.353 |
relentless | -18.294 |
spontaneous | -17.412 |
blatant | -17.388 |
Token | Width |
Token ID | 30916 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
u | +2.546 |
id | +2.133 |
- | +2.098 |
ine | +2.008 |
ab | +1.966 |
Neg logit contributions | |
disparate | -9.145 |
relentless | -8.872 |
totality | -8.839 |
hindsight | -8.793 |
proactive | -8.792 |
Token | ), |
Token ID | 828 |
Feature activation | +3.72e+00 |
Pos logit contributions | |
- | +22.633 |
u | +21.014 |
. | +20.613 |
+ | +19.920 |
/ | +19.152 |
Neg logit contributions | |
disparate | -16.339 |
relentless | -15.791 |
spontaneous | -15.404 |
proactive | -15.269 |
blatant | -15.179 |
Token | ($ |
Token ID | 16763 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
u | +8.332 |
- | +7.985 |
ire | +7.552 |
id | +7.543 |
ab | +7.431 |
Neg logit contributions | |
disparate | -9.798 |
totality | -9.289 |
relentless | -9.184 |
proactive | -9.106 |
academics | -9.069 |
Token | SR |
Token ID | 12562 |
Feature activation | +2.63e+01 |
Pos logit contributions | |
u | +19.480 |
- | +17.721 |
ire | +17.199 |
id | +17.196 |
b | +17.133 |
Neg logit contributions | |
disparate | -21.547 |
totality | -21.197 |
disgruntled | -20.590 |
newer | -20.585 |
venerable | -20.253 |
Token | . |
Token ID | 13 |
Feature activation | +6.06e+00 |
Pos logit contributions | |
. | +32.322 |
- | +27.876 |
u | +24.780 |
_ | +24.695 |
' | +22.692 |
Neg logit contributions | |
tremend | -54.232 |
metic | -48.051 |
mathemat | -46.794 |
eleph | -46.607 |
cumbers | -46.290 |
Token | Height |
Token ID | 23106 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
- | +4.820 |
u | +4.797 |
id | +4.178 |
ab | +4.132 |
ire | +3.623 |
Neg logit contributions | |
disparate | -22.783 |
proactive | -22.530 |
totality | -22.257 |
sporadic | -22.205 |
relentless | -22.029 |
Token | ))) |
Token ID | 22305 |
Feature activation | +3.99e+00 |
Pos logit contributions | |
- | +22.044 |
u | +21.459 |
. | +20.193 |
ire | +19.524 |
ine | +19.474 |
Neg logit contributions | |
disparate | -16.484 |
relentless | -16.435 |
proactive | -16.137 |
spontaneous | -16.014 |
blatant | -15.793 |
Token | ) |
Token ID | 1267 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
u | +9.191 |
- | +9.132 |
ire | +8.638 |
end | +8.605 |
id | +8.543 |
Neg logit contributions | |
disparate | -9.078 |
relentless | -8.768 |
stringent | -8.666 |
disgruntled | -8.605 |
academics | -8.563 |
Token | } |
Token ID | 1782 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
u | +4.621 |
- | +4.521 |
ire | +4.341 |
ine | +4.281 |
end | +4.212 |
Neg logit contributions | |
disparate | -5.533 |
relentless | -5.341 |
stringent | -5.264 |
academics | -5.242 |
blatant | -5.203 |
Token | Line |
Token ID | 13949 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
u | +2.371 |
ab | +2.045 |
ine | +2.038 |
id | +2.001 |
- | +1.998 |
Neg logit contributions | |
disparate | -5.601 |
totality | -5.429 |
relentless | -5.418 |
newer | -5.416 |
myriad | -5.337 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
al | +19.842 |
- | +19.136 |
u | +18.174 |
. | +17.926 |
ab | +17.451 |
Neg logit contributions | |
tremend | -25.767 |
mathemat | -23.867 |
disparate | -23.428 |
disgruntled | -22.821 |
stringent | -22.741 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
u | +21.176 |
id | +21.128 |
ire | +20.767 |
ig | +20.629 |
ag | +20.539 |
Neg logit contributions | |
tremend | -33.610 |
hemor | -31.234 |
metic | -30.939 |
cumbers | -30.516 |
misunder | -29.883 |
Token | = |
Token ID | 796 |
Feature activation | +7.44e+00 |
Pos logit contributions | |
. | +23.254 |
u | +22.229 |
- | +22.090 |
= | +20.706 |
_ | +20.362 |
Neg logit contributions | |
tremend | -35.869 |
mathemat | -32.404 |
hemor | -31.578 |
metic | -30.891 |
cumbers | -29.923 |
Token | [ |
Token ID | 685 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
- | +13.889 |
u | +13.883 |
. | +13.012 |
id | +12.620 |
ong | +12.225 |
Neg logit contributions | |
tremend | -16.427 |
misunder | -14.755 |
mathemat | -14.703 |
disparate | -14.580 |
behavi | -14.541 |
Token | system |
Token ID | 10057 |
Feature activation | +2.49e+01 |
Pos logit contributions | |
u | +19.016 |
- | +17.619 |
id | +17.302 |
ine | +16.756 |
ab | +16.613 |
Neg logit contributions | |
hemor | -26.977 |
behavi | -26.732 |
tremend | -26.528 |
metic | -26.167 |
undermin | -25.980 |
Token | . |
Token ID | 13 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
. | +31.667 |
- | +27.314 |
u | +25.016 |
_ | +23.830 |
' | +22.716 |
Neg logit contributions | |
tremend | -52.691 |
eleph | -47.276 |
cumbers | -46.720 |
metic | -46.443 |
exha | -45.912 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
u | +16.012 |
id | +15.129 |
- | +14.994 |
ab | +14.734 |
end | +14.447 |
Neg logit contributions | |
metic | -31.138 |
tremend | -30.436 |
mathemat | -29.219 |
unnecess | -28.805 |
behavi | -28.465 |
Token | ing |
Token ID | 278 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
ing | +27.886 |
- | +23.755 |
u | +23.129 |
al | +22.324 |
. | +22.215 |
Neg logit contributions | |
tremend | -52.098 |
metic | -47.504 |
eleph | -47.261 |
cumbers | -46.629 |
exha | -46.521 |
Token | . |
Token ID | 13 |
Feature activation | +9.27e+00 |
Pos logit contributions | |
. | +30.560 |
- | +26.039 |
u | +23.048 |
_ | +22.550 |
' | +21.884 |
Neg logit contributions | |
tremend | -52.194 |
eleph | -46.695 |
cumbers | -45.449 |
metic | -45.131 |
mathemat | -44.439 |
Token | String |
Token ID | 10100 |
Feature activation | +1.89e+01 |
Pos logit contributions | |
u | +9.991 |
- | +9.249 |
id | +8.587 |
ine | +8.263 |
. | +8.071 |
Neg logit contributions | |
tremend | -29.700 |
hemor | -28.227 |
mathemat | -28.010 |
eleph | -27.322 |
reluct | -26.957 |
Token | , |
Token ID | 11 |
Feature activation | +3.59e+00 |
Pos logit contributions | |
- | +19.564 |
. | +19.326 |
, | +17.979 |
u | +17.941 |
ia | +16.649 |
Neg logit contributions | |
tremend | -38.946 |
mathemat | -34.734 |
cumbers | -34.580 |
undermin | -34.446 |
behavi | -33.182 |
Token | characterized |
Token ID | 16264 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
u | +8.243 |
- | +7.996 |
ire | +7.859 |
ia | +7.796 |
ine | +7.684 |
Neg logit contributions | |
blatant | -8.419 |
totality | -8.380 |
disparate | -8.376 |
relentless | -8.349 |
newer | -8.210 |
Token | by |
Token ID | 416 |
Feature activation | +9.60e+00 |
Pos logit contributions | |
. | +22.223 |
- | +22.048 |
ine | +18.403 |
u | +18.305 |
ic | +18.269 |
Neg logit contributions | |
tremend | -38.617 |
mathemat | -35.259 |
cumbers | -33.972 |
undermin | -33.400 |
misunder | -33.339 |
Token | multiple |
Token ID | 3294 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
- | +20.465 |
. | +19.242 |
ine | +17.455 |
u | +17.104 |
ia | +16.646 |
Neg logit contributions | |
mathemat | -19.557 |
tremend | -19.277 |
undermin | -17.592 |
misunder | -17.454 |
cumbers | -17.211 |
Token | tiny |
Token ID | 7009 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
- | +21.996 |
. | +20.577 |
u | +18.471 |
y | +18.238 |
ia | +17.933 |
Neg logit contributions | |
mathemat | -17.263 |
Palestin | -16.799 |
tremend | -16.586 |
undermin | -16.499 |
reluct | -16.329 |
Token | ker |
Token ID | 41927 |
Feature activation | +2.47e+01 |
Pos logit contributions | |
- | +27.173 |
. | +25.719 |
u | +23.330 |
er | +23.187 |
ire | +21.998 |
Neg logit contributions | |
tremend | -24.625 |
mathemat | -22.759 |
undermin | -22.597 |
ccording | -22.511 |
Palestin | -21.886 |
Token | at |
Token ID | 265 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
at | +29.020 |
ati | +23.963 |
ac | +23.619 |
ate | +23.188 |
ath | +23.067 |
Neg logit contributions | |
tremend | -44.712 |
reluct | -43.402 |
cumbers | -43.268 |
enthusi | -41.953 |
undermin | -41.912 |
Token | otic |
Token ID | 6210 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
otic | +16.595 |
ic | +15.214 |
os | +14.261 |
ot | +13.478 |
id | +12.958 |
Neg logit contributions | |
behavi | -38.084 |
hemor | -37.678 |
tremend | -37.456 |
reluct | -36.804 |
misunder | -36.762 |
Token | plugs |
Token ID | 37008 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
- | +18.899 |
. | +17.703 |
ig | +15.763 |
u | +14.880 |
s | +14.546 |
Neg logit contributions | |
tremend | -27.574 |
mathemat | -26.685 |
behavi | -25.340 |
metic | -24.819 |
hemor | -24.214 |
Token | , |
Token ID | 11 |
Feature activation | +3.49e+00 |
Pos logit contributions | |
. | +22.535 |
- | +22.422 |
, | +21.534 |
u | +20.040 |
; | +18.631 |
Neg logit contributions | |
tremend | -44.050 |
cumbers | -39.329 |
undermin | -38.594 |
mathemat | -38.069 |
reluct | -37.896 |
Token | mim |
Token ID | 17007 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
- | +8.454 |
u | +7.993 |
. | +7.966 |
ine | +7.916 |
ia | +7.572 |
Neg logit contributions | |
disparate | -7.658 |
totality | -7.426 |
disgruntled | -7.418 |
hindsight | -7.347 |
tremend | -7.344 |
Token | cv |
Token ID | 33967 |
Feature activation | +2.08e+01 |
Pos logit contributions | |
u | +12.045 |
ix | +9.874 |
q | +9.644 |
ire | +9.510 |
ab | +9.368 |
Neg logit contributions | |
disparate | -27.642 |
tremend | -27.622 |
undermin | -27.421 |
mathemat | -27.309 |
totality | -26.984 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
2 | +25.091 |
- | +24.006 |
u | +23.839 |
. | +23.059 |
_ | +21.915 |
Neg logit contributions | |
tremend | -49.329 |
eleph | -44.866 |
exha | -44.831 |
undermin | -44.619 |
metic | -44.493 |
Token | . |
Token ID | 13 |
Feature activation | +9.97e+00 |
Pos logit contributions | |
. | +27.050 |
- | +23.197 |
u | +21.652 |
_ | +20.888 |
' | +19.380 |
Neg logit contributions | |
tremend | -47.260 |
mathemat | -41.399 |
eleph | -41.074 |
cumbers | -41.004 |
metic | -40.906 |
Token | M |
Token ID | 44 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
- | +10.764 |
u | +9.960 |
. | +9.842 |
_ | +9.465 |
M | +9.099 |
Neg logit contributions | |
tremend | -33.763 |
mathemat | -31.138 |
undermin | -30.072 |
hemor | -29.733 |
exha | -29.530 |
Token | OR |
Token ID | 1581 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
- | +20.424 |
. | +19.512 |
OR | +19.209 |
_ | +18.457 |
u | +17.847 |
Neg logit contributions | |
tremend | -41.627 |
mathemat | -38.708 |
metic | -37.972 |
undermin | -37.657 |
behavi | -37.200 |
Token | PH |
Token ID | 11909 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
- | +22.092 |
. | +20.517 |
_ | +19.107 |
PH | +18.637 |
PA | +18.518 |
Neg logit contributions | |
tremend | -41.080 |
mathemat | -36.581 |
metic | -35.309 |
undermin | -34.969 |
streng | -34.561 |
Token | _ |
Token ID | 62 |
Feature activation | +9.47e+00 |
Pos logit contributions | |
_ | +30.714 |
- | +27.240 |
. | +25.375 |
u | +24.220 |
' | +22.235 |
Neg logit contributions | |
tremend | -48.666 |
mathemat | -43.387 |
cumbers | -43.191 |
metic | -42.569 |
hemor | -42.486 |
Token | RECT |
Token ID | 23988 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
- | +10.951 |
u | +10.606 |
. | +9.719 |
X | +9.030 |
_ | +8.885 |
Neg logit contributions | |
tremend | -30.325 |
mathemat | -28.658 |
undermin | -28.560 |
streng | -28.170 |
hemor | -27.889 |
Token | , |
Token ID | 11 |
Feature activation | +6.67e+00 |
Pos logit contributions | |
- | +23.464 |
. | +23.190 |
u | +21.756 |
, | +21.700 |
_ | +21.083 |
Neg logit contributions | |
tremend | -42.764 |
mathemat | -37.772 |
hemor | -37.508 |
cumbers | -37.167 |
undermin | -36.913 |
Token | ( |
Token ID | 357 |
Feature activation | +5.69e+00 |
Pos logit contributions | |
u | +13.648 |
- | +13.197 |
ire | +12.623 |
ine | +12.261 |
ong | +11.941 |
Neg logit contributions | |
disparate | -13.996 |
blatant | -13.331 |
hindsight | -13.329 |
academics | -13.323 |
totality | -13.272 |
Token | 13 |
Token ID | 1485 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
u | +7.775 |
- | +7.357 |
ire | +7.295 |
id | +6.660 |
ab | +6.486 |
Neg logit contributions | |
disparate | -18.746 |
totality | -18.256 |
genuine | -17.895 |
blatant | -17.682 |
relentless | -17.604 |
Token | cv |
Token ID | 33967 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
u | +16.202 |
ix | +13.813 |
q | +13.705 |
- | +13.469 |
ab | +13.449 |
Neg logit contributions | |
tremend | -29.471 |
mathemat | -28.990 |
undermin | -28.836 |
metic | -28.038 |
hemor | -27.514 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
2 | +26.093 |
- | +24.863 |
u | +24.337 |
. | +24.173 |
_ | +22.439 |
Neg logit contributions | |
tremend | -50.813 |
eleph | -46.030 |
exha | -45.978 |
undermin | -45.856 |
metic | -45.454 |
Token | . |
Token ID | 13 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
. | +28.652 |
- | +24.159 |
u | +22.118 |
_ | +21.988 |
' | +20.337 |
Neg logit contributions | |
tremend | -49.111 |
mathemat | -43.465 |
cumbers | -42.854 |
eleph | -42.694 |
metic | -42.532 |
Token | M |
Token ID | 44 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
- | +11.643 |
. | +10.774 |
u | +10.494 |
_ | +10.274 |
M | +9.833 |
Neg logit contributions | |
tremend | -35.212 |
mathemat | -32.065 |
undermin | -31.066 |
hemor | -30.852 |
exha | -30.663 |
Token | OR |
Token ID | 1581 |
Feature activation | +1.95e+01 |
Pos logit contributions | |
- | +20.374 |
. | +19.840 |
OR | +19.382 |
+ | +18.123 |
_ | +18.034 |
Neg logit contributions | |
tremend | -44.262 |
mathemat | -40.057 |
undermin | -39.326 |
metic | -39.148 |
behavi | -38.740 |
Token | PH |
Token ID | 11909 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
- | +20.273 |
. | +19.052 |
PH | +18.485 |
PA | +17.629 |
_ | +17.298 |
Neg logit contributions | |
tremend | -44.645 |
mathemat | -39.432 |
metic | -37.835 |
undermin | -37.547 |
streng | -37.544 |
Token | _ |
Token ID | 62 |
Feature activation | +9.94e+00 |
Pos logit contributions | |
_ | +30.790 |
- | +27.837 |
. | +25.652 |
u | +24.014 |
+ | +22.634 |
Neg logit contributions | |
tremend | -49.142 |
mathemat | -43.799 |
cumbers | -43.515 |
metic | -42.990 |
undermin | -42.602 |
Token | RECT |
Token ID | 23988 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
- | +11.427 |
u | +10.717 |
. | +10.127 |
X | +9.246 |
_ | +9.209 |
Neg logit contributions | |
tremend | -32.704 |
mathemat | -30.867 |
undermin | -30.690 |
hemor | -30.137 |
streng | -29.812 |
Token | , |
Token ID | 11 |
Feature activation | +9.72e+00 |
Pos logit contributions | |
. | +23.723 |
- | +23.675 |
, | +22.251 |
u | +21.904 |
_ | +20.998 |
Neg logit contributions | |
tremend | -43.817 |
mathemat | -39.169 |
hemor | -38.294 |
cumbers | -37.765 |
undermin | -37.675 |
Token | ( |
Token ID | 357 |
Feature activation | +6.66e+00 |
Pos logit contributions | |
- | +15.658 |
u | +14.863 |
. | +14.677 |
id | +13.403 |
ine | +13.313 |
Neg logit contributions | |
tremend | -27.329 |
mathemat | -25.113 |
undermin | -24.526 |
hemor | -23.757 |
cumbers | -23.566 |
Token | 21 |
Token ID | 2481 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
- | +8.269 |
u | +7.850 |
ab | +7.594 |
q | +7.280 |
b | +7.119 |
Neg logit contributions | |
disparate | -21.855 |
totality | -20.845 |
behavi | -20.269 |
relentless | -20.259 |
genuine | -20.178 |
Token | Solid |
Token ID | 46933 |
Feature activation | +1.95e+01 |
Pos logit contributions | |
u | +10.475 |
- | +10.084 |
. | +8.890 |
b | +8.805 |
ine | +8.713 |
Neg logit contributions | |
tremend | -27.872 |
hemor | -26.448 |
mathemat | -26.170 |
undermin | -25.523 |
eleph | -25.420 |
Token | Br |
Token ID | 9414 |
Feature activation | +1.88e+01 |
Pos logit contributions | |
- | +22.417 |
. | +20.979 |
B | +19.993 |
b | +19.607 |
br | +19.071 |
Neg logit contributions | |
tremend | -43.185 |
eleph | -38.591 |
mathemat | -38.235 |
hemor | -38.005 |
metic | -36.840 |
Token | ush |
Token ID | 1530 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
u | +25.625 |
ush | +25.236 |
ite | +23.583 |
ace | +23.517 |
- | +23.265 |
Neg logit contributions | |
tremend | -36.801 |
behavi | -36.161 |
hemor | -35.060 |
mathemat | -34.456 |
cumbers | -34.046 |
Token | ( |
Token ID | 357 |
Feature activation | +8.84e+00 |
Pos logit contributions | |
- | +21.032 |
. | +20.714 |
_ | +19.815 |
u | +19.386 |
ine | +18.541 |
Neg logit contributions | |
tremend | -33.146 |
mathemat | -29.495 |
cumbers | -28.505 |
hemor | -28.422 |
metic | -28.083 |
Token | [ |
Token ID | 685 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
u | +16.710 |
- | +16.096 |
id | +15.538 |
ire | +15.282 |
ong | +14.931 |
Neg logit contributions | |
disparate | -16.294 |
relentless | -15.840 |
stringent | -15.254 |
drastic | -15.230 |
gradual | -15.123 |
Token | System |
Token ID | 11964 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
- | +16.832 |
u | +16.796 |
. | +15.261 |
id | +14.132 |
ine | +14.004 |
Neg logit contributions | |
tremend | -34.628 |
hemor | -33.301 |
metic | -33.056 |
eleph | -32.919 |
mathemat | -32.602 |
Token | . |
Token ID | 13 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
. | +31.399 |
- | +26.930 |
u | +24.152 |
_ | +22.912 |
' | +22.048 |
Neg logit contributions | |
tremend | -52.151 |
eleph | -46.521 |
cumbers | -45.717 |
mathemat | -45.432 |
exha | -45.124 |
Token | Draw |
Token ID | 25302 |
Feature activation | +2.25e+01 |
Pos logit contributions | |
- | +14.358 |
u | +13.869 |
. | +13.120 |
ine | +12.586 |
id | +12.067 |
Neg logit contributions | |
tremend | -34.634 |
metic | -32.384 |
mathemat | -32.090 |
eleph | -30.062 |
unnecess | -29.732 |
Token | ing |
Token ID | 278 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
ing | +27.104 |
- | +23.056 |
u | +22.620 |
. | +21.683 |
al | +21.238 |
Neg logit contributions | |
tremend | -50.065 |
eleph | -45.667 |
metic | -45.163 |
cumbers | -44.851 |
mathemat | -44.700 |
Token | . |
Token ID | 13 |
Feature activation | +8.38e+00 |
Pos logit contributions | |
. | +29.194 |
- | +24.836 |
u | +21.744 |
_ | +21.245 |
' | +20.272 |
Neg logit contributions | |
tremend | -50.289 |
eleph | -44.970 |
cumbers | -42.992 |
metic | -42.932 |
mathemat | -42.827 |
Token | Color |
Token ID | 10258 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
u | +8.795 |
- | +8.681 |
ine | +7.862 |
. | +7.702 |
ag | +7.406 |
Neg logit contributions | |
tremend | -29.514 |
mathemat | -27.302 |
hemor | -26.612 |
totality | -26.412 |
relentless | -26.056 |
Token | Line |
Token ID | 13949 |
Feature activation | +6.63e+00 |
Pos logit contributions | |
u | +0.301 |
id | +0.261 |
ab | +0.261 |
ine | +0.257 |
- | +0.250 |
Neg logit contributions | |
disparate | -0.681 |
relentless | -0.666 |
newer | -0.662 |
totality | -0.656 |
proactive | -0.652 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
u | +14.164 |
- | +13.975 |
id | +13.557 |
ab | +13.522 |
ag | +13.512 |
Neg logit contributions | |
disparate | -13.610 |
disgruntled | -12.954 |
proactive | -12.793 |
relentless | -12.764 |
newer | -12.671 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
u | +18.995 |
ig | +17.954 |
id | +17.686 |
ag | +17.483 |
ine | +17.420 |
Neg logit contributions | |
tremend | -30.580 |
hemor | -28.714 |
misunder | -27.773 |
mathemat | -27.690 |
cumbers | -27.292 |
Token | = |
Token ID | 796 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
. | +21.929 |
u | +21.922 |
- | +20.692 |
ine | +19.998 |
ab | +19.971 |
Neg logit contributions | |
disparate | -19.855 |
disgruntled | -18.746 |
hindsight | -18.486 |
academics | -18.193 |
anecdotal | -18.142 |
Token | [ |
Token ID | 685 |
Feature activation | +6.62e+00 |
Pos logit contributions | |
u | +2.553 |
- | +2.450 |
ine | +2.342 |
ire | +2.341 |
id | +2.334 |
Neg logit contributions | |
disparate | -2.649 |
blatant | -2.536 |
relentless | -2.530 |
academics | -2.494 |
poorer | -2.448 |
Token | system |
Token ID | 10057 |
Feature activation | +2.44e+01 |
Pos logit contributions | |
u | +13.446 |
- | +12.624 |
id | +12.244 |
ine | +12.031 |
ab | +11.930 |
Neg logit contributions | |
disparate | -14.720 |
relentless | -14.252 |
proactive | -14.215 |
drastic | -14.080 |
newer | -14.077 |
Token | . |
Token ID | 13 |
Feature activation | +8.13e+00 |
Pos logit contributions | |
. | +31.248 |
- | +26.619 |
u | +25.064 |
_ | +23.727 |
' | +22.052 |
Neg logit contributions | |
tremend | -51.364 |
eleph | -46.456 |
metic | -45.659 |
cumbers | -45.425 |
exha | -44.896 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.42e+01 |
Pos logit contributions | |
u | +12.177 |
- | +11.249 |
id | +11.145 |
ab | +11.037 |
ine | +10.805 |
Neg logit contributions | |
disparate | -20.656 |
totality | -20.651 |
proactive | -20.599 |
relentless | -20.388 |
stringent | -20.114 |
Token | ing |
Token ID | 278 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
ing | +28.118 |
- | +24.028 |
u | +23.135 |
. | +22.631 |
al | +22.307 |
Neg logit contributions | |
tremend | -51.263 |
eleph | -46.798 |
metic | -46.421 |
cumbers | -45.907 |
exha | -45.873 |
Token | . |
Token ID | 13 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
. | +30.159 |
- | +25.591 |
u | +22.462 |
_ | +22.309 |
' | +21.246 |
Neg logit contributions | |
tremend | -51.383 |
eleph | -46.102 |
cumbers | -44.416 |
metic | -44.197 |
occas | -43.634 |
Token | String |
Token ID | 10100 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
u | +1.848 |
ine | +1.598 |
id | +1.562 |
- | +1.554 |
ab | +1.540 |
Neg logit contributions | |
disparate | -5.015 |
relentless | -4.918 |
newer | -4.896 |
totality | -4.894 |
proactive | -4.850 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
u | +18.995 |
ig | +17.954 |
id | +17.686 |
ag | +17.483 |
ine | +17.420 |
Neg logit contributions | |
tremend | -30.580 |
hemor | -28.714 |
misunder | -27.773 |
mathemat | -27.690 |
cumbers | -27.292 |
Token | = |
Token ID | 796 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
. | +21.929 |
u | +21.922 |
- | +20.692 |
ine | +19.998 |
ab | +19.971 |
Neg logit contributions | |
disparate | -19.855 |
disgruntled | -18.746 |
hindsight | -18.486 |
academics | -18.193 |
anecdotal | -18.142 |
Token | [ |
Token ID | 685 |
Feature activation | +6.62e+00 |
Pos logit contributions | |
u | +2.553 |
- | +2.450 |
ine | +2.342 |
ire | +2.341 |
id | +2.334 |
Neg logit contributions | |
disparate | -2.649 |
blatant | -2.536 |
relentless | -2.530 |
academics | -2.494 |
poorer | -2.448 |
Token | system |
Token ID | 10057 |
Feature activation | +2.44e+01 |
Pos logit contributions | |
u | +13.446 |
- | +12.624 |
id | +12.244 |
ine | +12.031 |
ab | +11.930 |
Neg logit contributions | |
disparate | -14.720 |
relentless | -14.252 |
proactive | -14.215 |
drastic | -14.080 |
newer | -14.077 |
Token | . |
Token ID | 13 |
Feature activation | +8.13e+00 |
Pos logit contributions | |
. | +31.248 |
- | +26.619 |
u | +25.064 |
_ | +23.727 |
' | +22.052 |
Neg logit contributions | |
tremend | -51.364 |
eleph | -46.456 |
metic | -45.659 |
cumbers | -45.425 |
exha | -44.896 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.42e+01 |
Pos logit contributions | |
u | +12.177 |
- | +11.249 |
id | +11.145 |
ab | +11.037 |
ine | +10.805 |
Neg logit contributions | |
disparate | -20.656 |
totality | -20.651 |
proactive | -20.599 |
relentless | -20.388 |
stringent | -20.114 |
Token | ing |
Token ID | 278 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
ing | +28.118 |
- | +24.028 |
u | +23.135 |
. | +22.631 |
al | +22.307 |
Neg logit contributions | |
tremend | -51.263 |
eleph | -46.798 |
metic | -46.421 |
cumbers | -45.907 |
exha | -45.873 |
Token | . |
Token ID | 13 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
. | +30.159 |
- | +25.591 |
u | +22.462 |
_ | +22.309 |
' | +21.246 |
Neg logit contributions | |
tremend | -51.383 |
eleph | -46.102 |
cumbers | -44.416 |
metic | -44.197 |
occas | -43.634 |
Token | String |
Token ID | 10100 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
u | +1.848 |
ine | +1.598 |
id | +1.562 |
- | +1.554 |
ab | +1.540 |
Neg logit contributions | |
disparate | -5.015 |
relentless | -4.918 |
newer | -4.896 |
totality | -4.894 |
proactive | -4.850 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
- | +16.902 |
ine | +16.206 |
u | +16.189 |
. | +15.996 |
ab | +15.592 |
Neg logit contributions | |
disparate | -19.711 |
totality | -19.217 |
hindsight | -19.110 |
relentless | -19.081 |
proactive | -18.981 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
u | +20.123 |
ire | +19.655 |
id | +19.603 |
ig | +19.349 |
ine | +19.235 |
Neg logit contributions | |
tremend | -31.383 |
hemor | -30.394 |
cumbers | -29.146 |
metic | -28.338 |
behavi | -28.034 |
Token | v |
Token ID | 410 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
- | +7.713 |
u | +7.697 |
. | +6.974 |
v | +6.728 |
q | +6.314 |
Neg logit contributions | |
tremend | -14.646 |
mathemat | -14.101 |
undermin | -13.737 |
blatant | -13.574 |
relentless | -13.499 |
Token | ars |
Token ID | 945 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
ar | +20.924 |
- | +20.327 |
u | +20.247 |
ab | +20.101 |
ars | +20.030 |
Neg logit contributions | |
tremend | -35.095 |
undermin | -33.353 |
hemor | -33.346 |
behavi | -33.256 |
metic | -33.219 |
Token | ( |
Token ID | 7 |
Feature activation | +9.23e+00 |
Pos logit contributions | |
- | +20.562 |
. | +20.127 |
( | +19.789 |
u | +19.616 |
_ | +19.490 |
Neg logit contributions | |
tremend | -39.522 |
hemor | -36.549 |
undermin | -36.406 |
metic | -36.103 |
mathemat | -36.058 |
Token | ap |
Token ID | 499 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
ab | +14.628 |
u | +14.460 |
ag | +14.073 |
ac | +13.440 |
ip | +13.185 |
Neg logit contributions | |
tremend | -26.651 |
behavi | -25.795 |
mathemat | -25.593 |
undermin | -25.476 |
metic | -25.192 |
Token | . |
Token ID | 13 |
Feature activation | +9.63e+00 |
Pos logit contributions | |
. | +27.503 |
- | +22.839 |
u | +22.630 |
_ | +21.305 |
' | +19.392 |
Neg logit contributions | |
tremend | -46.906 |
metic | -41.855 |
cumbers | -41.268 |
hemor | -41.162 |
mathemat | -41.015 |
Token | parse |
Token ID | 29572 |
Feature activation | +2.42e+01 |
Pos logit contributions | |
u | +9.019 |
ine | +8.770 |
q | +8.683 |
id | +8.678 |
- | +8.625 |
Neg logit contributions | |
behavi | -30.650 |
hemor | -30.006 |
tremend | -29.949 |
disparate | -29.661 |
undermin | -29.535 |
Token | _ |
Token ID | 62 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
_ | +30.265 |
- | +26.852 |
. | +24.832 |
u | +24.069 |
q | +22.226 |
Neg logit contributions | |
tremend | -49.287 |
metic | -44.854 |
mathemat | -43.985 |
cumbers | -43.510 |
undermin | -43.080 |
Token | args |
Token ID | 22046 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
args | +23.373 |
u | +20.490 |
ag | +19.466 |
- | +18.332 |
b | +18.123 |
Neg logit contributions | |
tremend | -36.672 |
metic | -35.943 |
mathemat | -34.192 |
behavi | -34.018 |
undermin | -33.202 |
Token | ()) |
Token ID | 28955 |
Feature activation | +3.86e+00 |
Pos logit contributions | |
() | +11.092 |
u | +10.462 |
_ | +10.405 |
- | +10.237 |
. | +9.853 |
Neg logit contributions | |
tremend | -36.094 |
mathemat | -35.067 |
metic | -34.614 |
streng | -33.482 |
undermin | -33.369 |
Token | # |
Token ID | 1303 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
u | +7.676 |
- | +7.091 |
ab | +6.785 |
ag | +6.672 |
aga | +6.651 |
Neg logit contributions | |
disparate | -10.487 |
relentless | -10.272 |
tremendous | -10.011 |
newer | -9.938 |
academics | -9.926 |
Token | initialize |
Token ID | 41216 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
- | +5.955 |
ine | +5.907 |
u | +5.592 |
. | +5.239 |
ax | +5.206 |
Neg logit contributions | |
disparate | -10.018 |
blatant | -9.765 |
venerable | -9.732 |
drastic | -9.670 |
relentless | -9.668 |
Token | . |
Token ID | 13 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
. | +27.128 |
- | +22.725 |
u | +21.101 |
_ | +20.248 |
id | +19.492 |
Neg logit contributions | |
tremend | -40.634 |
mathemat | -35.977 |
hemor | -35.172 |
metic | -34.921 |
undermin | -34.173 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
u | +3.337 |
ab | +2.881 |
ine | +2.839 |
id | +2.806 |
- | +2.782 |
Neg logit contributions | |
disparate | -9.107 |
totality | -8.850 |
relentless | -8.833 |
newer | -8.813 |
proactive | -8.739 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
u | +20.894 |
id | +20.349 |
ire | +20.009 |
ig | +19.962 |
ine | +19.611 |
Neg logit contributions | |
tremend | -31.903 |
hemor | -29.932 |
mathemat | -29.842 |
metic | -29.239 |
cumbers | -28.711 |
Token | = |
Token ID | 796 |
Feature activation | +3.71e+00 |
Pos logit contributions | |
. | +25.177 |
u | +22.926 |
- | +22.519 |
id | +21.324 |
_ | +21.230 |
Neg logit contributions | |
disparate | -19.821 |
proactive | -18.586 |
anecdotal | -18.563 |
hindsight | -18.482 |
relentless | -18.436 |
Token | [ |
Token ID | 685 |
Feature activation | +8.25e+00 |
Pos logit contributions | |
u | +8.390 |
- | +8.009 |
id | +7.722 |
ire | +7.669 |
ong | +7.633 |
Neg logit contributions | |
disparate | -8.829 |
relentless | -8.464 |
blatant | -8.399 |
academics | -8.363 |
stringent | -8.269 |
Token | system |
Token ID | 10057 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
u | +15.469 |
- | +14.339 |
id | +14.085 |
ine | +13.734 |
ab | +13.706 |
Neg logit contributions | |
disparate | -17.765 |
proactive | -17.351 |
relentless | -17.160 |
newer | -17.151 |
gradual | -17.113 |
Token | . |
Token ID | 13 |
Feature activation | +9.36e+00 |
Pos logit contributions | |
. | +31.050 |
- | +26.524 |
u | +24.732 |
_ | +23.552 |
' | +22.084 |
Neg logit contributions | |
tremend | -51.473 |
eleph | -46.492 |
metic | -45.760 |
cumbers | -45.576 |
exha | -45.015 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.35e+01 |
Pos logit contributions | |
u | +14.467 |
id | +13.435 |
- | +13.266 |
ab | +13.221 |
ine | +13.016 |
Neg logit contributions | |
tremend | -24.281 |
metic | -24.278 |
mathemat | -23.498 |
behavi | -23.101 |
unnecess | -22.916 |
Token | ing |
Token ID | 278 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
ing | +27.765 |
- | +23.892 |
u | +22.887 |
. | +22.522 |
al | +22.140 |
Neg logit contributions | |
tremend | -50.914 |
eleph | -46.435 |
metic | -45.988 |
cumbers | -45.612 |
exha | -45.402 |
Token | . |
Token ID | 13 |
Feature activation | +3.80e+00 |
Pos logit contributions | |
. | +29.455 |
- | +25.024 |
u | +22.093 |
_ | +21.744 |
' | +20.862 |
Neg logit contributions | |
tremend | -50.666 |
eleph | -45.334 |
metic | -43.867 |
cumbers | -43.742 |
occas | -43.116 |
Token | String |
Token ID | 10100 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
u | +5.014 |
id | +4.290 |
ine | +4.278 |
- | +4.277 |
ab | +4.103 |
Neg logit contributions | |
disparate | -13.820 |
totality | -13.587 |
relentless | -13.578 |
newer | -13.539 |
proactive | -13.519 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
u | +21.176 |
id | +21.128 |
ire | +20.767 |
ig | +20.629 |
ag | +20.539 |
Neg logit contributions | |
tremend | -33.610 |
hemor | -31.234 |
metic | -30.939 |
cumbers | -30.516 |
misunder | -29.883 |
Token | = |
Token ID | 796 |
Feature activation | +7.44e+00 |
Pos logit contributions | |
. | +23.254 |
u | +22.229 |
- | +22.090 |
= | +20.706 |
_ | +20.362 |
Neg logit contributions | |
tremend | -35.869 |
mathemat | -32.404 |
hemor | -31.578 |
metic | -30.891 |
cumbers | -29.923 |
Token | [ |
Token ID | 685 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
- | +13.889 |
u | +13.883 |
. | +13.012 |
id | +12.620 |
ong | +12.225 |
Neg logit contributions | |
tremend | -16.427 |
misunder | -14.755 |
mathemat | -14.703 |
disparate | -14.580 |
behavi | -14.541 |
Token | system |
Token ID | 10057 |
Feature activation | +2.49e+01 |
Pos logit contributions | |
u | +19.016 |
- | +17.619 |
id | +17.302 |
ine | +16.756 |
ab | +16.613 |
Neg logit contributions | |
hemor | -26.977 |
behavi | -26.732 |
tremend | -26.528 |
metic | -26.167 |
undermin | -25.980 |
Token | . |
Token ID | 13 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
. | +31.667 |
- | +27.314 |
u | +25.016 |
_ | +23.830 |
' | +22.716 |
Neg logit contributions | |
tremend | -52.691 |
eleph | -47.276 |
cumbers | -46.720 |
metic | -46.443 |
exha | -45.912 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
u | +16.012 |
id | +15.129 |
- | +14.994 |
ab | +14.734 |
end | +14.447 |
Neg logit contributions | |
metic | -31.138 |
tremend | -30.436 |
mathemat | -29.219 |
unnecess | -28.805 |
behavi | -28.465 |
Token | ing |
Token ID | 278 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
ing | +27.886 |
- | +23.755 |
u | +23.129 |
al | +22.324 |
. | +22.215 |
Neg logit contributions | |
tremend | -52.098 |
metic | -47.504 |
eleph | -47.261 |
cumbers | -46.629 |
exha | -46.521 |
Token | . |
Token ID | 13 |
Feature activation | +9.27e+00 |
Pos logit contributions | |
. | +30.560 |
- | +26.039 |
u | +23.048 |
_ | +22.550 |
' | +21.884 |
Neg logit contributions | |
tremend | -52.194 |
eleph | -46.695 |
cumbers | -45.449 |
metic | -45.131 |
mathemat | -44.439 |
Token | String |
Token ID | 10100 |
Feature activation | +1.89e+01 |
Pos logit contributions | |
u | +9.991 |
- | +9.249 |
id | +8.587 |
ine | +8.263 |
. | +8.071 |
Neg logit contributions | |
tremend | -29.700 |
hemor | -28.227 |
mathemat | -28.010 |
eleph | -27.322 |
reluct | -26.957 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
al | +21.016 |
- | +20.852 |
. | +20.147 |
u | +19.462 |
ab | +18.942 |
Neg logit contributions | |
tremend | -45.994 |
metic | -40.627 |
mathemat | -40.258 |
hemor | -40.215 |
occas | -39.583 |
Token | ignment |
Token ID | 16747 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
u | +21.390 |
ire | +20.820 |
id | +20.577 |
ag | +19.899 |
ig | +19.804 |
Neg logit contributions | |
tremend | -33.015 |
hemor | -31.337 |
cumbers | -30.703 |
metic | -30.450 |
behavi | -29.223 |
Token | image |
Token ID | 2939 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
- | +13.727 |
u | +13.355 |
. | +12.570 |
ine | +12.198 |
ia | +12.016 |
Neg logit contributions | |
tremend | -18.706 |
mathemat | -18.569 |
undermin | -18.389 |
misunder | -18.050 |
cumbers | -17.569 |
Token | Path |
Token ID | 15235 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
Path | +16.350 |
- | +15.529 |
. | +15.469 |
u | +15.457 |
X | +14.124 |
Neg logit contributions | |
tremend | -42.089 |
mathemat | -38.724 |
undermin | -37.179 |
metic | -36.987 |
hemor | -36.673 |
Token | in |
Token ID | 287 |
Feature activation | +6.93e+00 |
Pos logit contributions | |
- | +20.486 |
. | +20.389 |
u | +19.792 |
_ | +18.330 |
ab | +17.887 |
Neg logit contributions | |
tremend | -35.882 |
mathemat | -32.793 |
hemor | -32.164 |
undermin | -31.993 |
metic | -31.465 |
Token | paths |
Token ID | 13532 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
- | +13.146 |
u | +12.372 |
. | +12.018 |
ines | +11.245 |
ong | +11.106 |
Neg logit contributions | |
tremend | -17.938 |
mathemat | -16.622 |
misunder | -16.036 |
undermin | -15.325 |
metic | -15.303 |
Token | . |
Token ID | 13 |
Feature activation | +9.61e+00 |
Pos logit contributions | |
. | +24.870 |
- | +20.955 |
u | +19.430 |
_ | +19.021 |
; | +17.723 |
Neg logit contributions | |
tremend | -34.633 |
mathemat | -30.530 |
cumbers | -30.339 |
undermin | -30.163 |
behavi | -29.971 |
Token | list |
Token ID | 4868 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
u | +12.360 |
id | +11.850 |
ab | +11.634 |
ine | +11.478 |
- | +11.335 |
Neg logit contributions | |
behavi | -30.893 |
tremend | -29.976 |
undermin | -29.015 |
mathemat | -28.732 |
metic | -28.703 |
Token | _ |
Token ID | 62 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
_ | +30.454 |
- | +27.953 |
. | +25.270 |
u | +24.506 |
ine | +22.221 |
Neg logit contributions | |
tremend | -48.959 |
cumbers | -43.722 |
mathemat | -43.406 |
metic | -43.292 |
undermin | -42.929 |
Token | images |
Token ID | 17566 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
u | +17.835 |
ag | +15.551 |
ine | +15.503 |
ines | +15.104 |
ab | +14.792 |
Neg logit contributions | |
tremend | -34.811 |
behavi | -34.745 |
metic | -34.300 |
mathemat | -33.705 |
undermin | -33.699 |
Token | ( |
Token ID | 7 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
- | +20.347 |
_ | +20.067 |
. | +20.047 |
( | +20.045 |
u | +19.531 |
Neg logit contributions | |
tremend | -40.899 |
undermin | -37.793 |
hemor | -37.314 |
mathemat | -37.269 |
metic | -36.472 |
Token | args |
Token ID | 22046 |
Feature activation | +1.59e+01 |
Pos logit contributions | |
args | +17.324 |
u | +15.954 |
ag | +14.984 |
ab | +14.474 |
id | +14.044 |
Neg logit contributions | |
tremend | -29.999 |
behavi | -28.270 |
mathemat | -28.140 |
metic | -27.632 |
undermin | -27.185 |
Token | [" |
Token ID | 14692 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
u | +19.638 |
. | +18.926 |
- | +17.855 |
_ | +16.604 |
ix | +15.591 |
Neg logit contributions | |
tremend | -37.522 |
behavi | -36.097 |
undermin | -34.588 |
mathemat | -34.363 |
cumbers | -33.083 |
Token | , |
Token ID | 11 |
Feature activation | +6.75e+00 |
Pos logit contributions | |
- | +22.625 |
. | +22.129 |
u | +21.706 |
, | +20.032 |
_ | +19.452 |
Neg logit contributions | |
tremend | -35.998 |
mathemat | -31.470 |
hemor | -30.934 |
undermin | -30.593 |
cumbers | -29.916 |
Token | $ |
Token ID | 3 |
Feature activation | +5.64e+00 |
Pos logit contributions | |
u | +12.288 |
- | +12.016 |
id | +11.192 |
ab | +11.095 |
ire | +10.994 |
Neg logit contributions | |
disparate | -16.282 |
totality | -15.884 |
disgruntled | -15.585 |
relentless | -15.579 |
tremend | -15.502 |
Token | FS |
Token ID | 10652 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
u | +7.469 |
ire | +6.789 |
ab | +6.545 |
id | +6.485 |
- | +6.440 |
Neg logit contributions | |
disparate | -18.246 |
totality | -17.751 |
relentless | -17.613 |
proactive | -17.606 |
disgruntled | -17.376 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
- | +22.163 |
2 | +21.506 |
u | +21.281 |
. | +21.168 |
1 | +21.015 |
Neg logit contributions | |
tremend | -38.554 |
mathemat | -35.333 |
metic | -34.145 |
undermin | -33.773 |
hemor | -33.594 |
Token | ,[ |
Token ID | 17414 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
. | +16.623 |
- | +16.463 |
u | +15.170 |
ong | +14.470 |
ire | +14.367 |
Neg logit contributions | |
tremend | -25.377 |
relentless | -23.029 |
disparate | -22.562 |
mathemat | -22.306 |
sophisticated | -22.285 |
Token | System |
Token ID | 11964 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
- | +14.520 |
u | +14.282 |
. | +12.681 |
id | +12.236 |
i | +11.849 |
Neg logit contributions | |
tremend | -26.529 |
metic | -25.870 |
hemor | -25.437 |
mathemat | -25.032 |
eleph | -25.003 |
Token | . |
Token ID | 13 |
Feature activation | +9.74e+00 |
Pos logit contributions | |
. | +30.928 |
- | +26.077 |
u | +24.064 |
_ | +22.444 |
' | +21.751 |
Neg logit contributions | |
tremend | -51.928 |
eleph | -46.017 |
metic | -45.230 |
cumbers | -44.747 |
mathemat | -44.708 |
Token | Draw |
Token ID | 25302 |
Feature activation | +2.19e+01 |
Pos logit contributions | |
- | +11.612 |
u | +11.586 |
. | +10.468 |
ine | +10.097 |
id | +9.947 |
Neg logit contributions | |
tremend | -31.308 |
mathemat | -29.093 |
metic | -29.043 |
unnecess | -27.126 |
eleph | -27.119 |
Token | ing |
Token ID | 278 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
ing | +26.953 |
- | +23.216 |
u | +23.037 |
. | +22.154 |
er | +21.199 |
Neg logit contributions | |
tremend | -49.978 |
eleph | -44.556 |
metic | -44.495 |
mathemat | -44.179 |
cumbers | -44.002 |
Token | . |
Token ID | 13 |
Feature activation | +5.20e+00 |
Pos logit contributions | |
. | +28.220 |
- | +23.578 |
u | +21.112 |
_ | +20.636 |
' | +19.397 |
Neg logit contributions | |
tremend | -48.470 |
eleph | -43.321 |
metic | -41.593 |
mathemat | -41.409 |
occas | -41.089 |
Token | Font |
Token ID | 23252 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
u | +4.376 |
- | +3.640 |
id | +3.478 |
ine | +3.376 |
ab | +3.171 |
Neg logit contributions | |
totality | -19.926 |
disparate | -19.837 |
proactive | -19.688 |
hindsight | -19.533 |
relentless | -19.521 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
u | +20.417 |
2 | +19.060 |
- | +19.059 |
ab | +19.054 |
id | +18.579 |
Neg logit contributions | |
disparate | -20.282 |
proactive | -19.906 |
stringent | -19.779 |
relentless | -19.165 |
totality | -19.141 |
Token | = |
Token ID | 796 |
Feature activation | +7.76e+00 |
Pos logit contributions | |
. | +18.058 |
u | +17.433 |
- | +17.229 |
_ | +15.941 |
= | +15.917 |
Neg logit contributions | |
tremend | -37.038 |
mathemat | -33.862 |
hemor | -33.749 |
metic | -33.307 |
undermin | -33.177 |
Token | New |
Token ID | 968 |
Feature activation | +2.26e+01 |
Pos logit contributions | |
- | +16.423 |
. | +15.714 |
u | +15.467 |
id | +14.295 |
ine | +14.270 |
Neg logit contributions | |
tremend | -20.214 |
undermin | -17.694 |
mathemat | -17.564 |
behavi | -17.488 |
cumbers | -17.191 |
Token | - |
Token ID | 12 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
- | +32.204 |
. | +24.021 |
_ | +22.038 |
u | +21.545 |
+ | +20.984 |
Neg logit contributions | |
tremend | -51.247 |
undermin | -45.641 |
metic | -45.544 |
mathemat | -45.106 |
eleph | -45.039 |
Token | Object |
Token ID | 10267 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
u | +15.611 |
- | +15.277 |
. | +13.945 |
ine | +13.055 |
o | +12.877 |
Neg logit contributions | |
tremend | -43.835 |
metic | -41.578 |
eleph | -40.604 |
mathemat | -40.581 |
reluct | -39.778 |
Token | System |
Token ID | 4482 |
Feature activation | +2.36e+01 |
Pos logit contributions | |
- | +18.248 |
. | +17.630 |
u | +16.681 |
ine | +16.359 |
ia | +15.886 |
Neg logit contributions | |
tremend | -24.594 |
mathemat | -21.774 |
cumbers | -21.772 |
undermin | -21.615 |
unnecess | -21.372 |
Token | . |
Token ID | 13 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
. | +31.015 |
- | +26.729 |
u | +23.835 |
_ | +22.479 |
' | +21.924 |
Neg logit contributions | |
tremend | -52.541 |
eleph | -46.702 |
cumbers | -45.941 |
metic | -45.720 |
mathemat | -45.341 |
Token | Draw |
Token ID | 25302 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
- | +15.022 |
u | +14.077 |
. | +13.778 |
ine | +12.813 |
ab | +12.044 |
Neg logit contributions | |
tremend | -39.885 |
metic | -37.331 |
mathemat | -36.941 |
eleph | -35.009 |
reluct | -34.374 |
Token | ing |
Token ID | 278 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
ing | +26.767 |
- | +23.516 |
u | +22.558 |
. | +22.187 |
ong | +21.060 |
Neg logit contributions | |
tremend | -50.701 |
mathemat | -45.212 |
eleph | -45.186 |
metic | -45.041 |
cumbers | -44.478 |
Token | . |
Token ID | 13 |
Feature activation | +4.45e+00 |
Pos logit contributions | |
. | +27.763 |
- | +23.988 |
u | +20.800 |
_ | +20.011 |
' | +19.273 |
Neg logit contributions | |
tremend | -47.972 |
eleph | -43.165 |
cumbers | -41.656 |
metic | -41.322 |
mathemat | -41.170 |
Token | Rect |
Token ID | 45474 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
u | +3.466 |
- | +3.138 |
ine | +2.445 |
ire | +2.405 |
. | +2.215 |
Neg logit contributions | |
tremend | -18.863 |
mathemat | -18.629 |
relentless | -18.538 |
disparate | -18.404 |
hindsight | -18.331 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
u | +20.943 |
- | +20.408 |
id | +19.905 |
ab | +19.891 |
s | +19.815 |
Neg logit contributions | |
disparate | -18.268 |
proactive | -17.750 |
stringent | -17.341 |
relentless | -17.107 |
totality | -16.878 |
Token | = |
Token ID | 796 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
u | +15.535 |
. | +14.765 |
- | +14.635 |
id | +14.139 |
ab | +13.587 |
Neg logit contributions | |
tremend | -26.734 |
mathemat | -26.218 |
hemor | -25.274 |
behavi | -25.187 |
undermin | -24.692 |
Token | New |
Token ID | 968 |
Feature activation | +2.13e+01 |
Pos logit contributions | |
u | +5.923 |
- | +5.710 |
ire | +5.619 |
ine | +5.565 |
id | +5.552 |
Neg logit contributions | |
disparate | -3.018 |
relentless | -2.879 |
blatant | -2.828 |
proactive | -2.798 |
academics | -2.786 |
Token | - |
Token ID | 12 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
- | +31.369 |
. | +23.300 |
u | +21.648 |
_ | +21.340 |
+ | +20.879 |
Neg logit contributions | |
tremend | -49.187 |
undermin | -43.315 |
mathemat | -43.114 |
metic | -43.085 |
eleph | -43.073 |
Token | Object |
Token ID | 10267 |
Feature activation | +4.91e+00 |
Pos logit contributions | |
- | +15.662 |
u | +15.479 |
. | +13.896 |
ine | +13.251 |
q | +13.033 |
Neg logit contributions | |
tremend | -43.994 |
metic | -41.022 |
eleph | -40.592 |
hemor | -40.186 |
mathemat | -39.966 |
Token | System |
Token ID | 4482 |
Feature activation | +2.36e+01 |
Pos logit contributions | |
- | +9.736 |
u | +9.723 |
ine | +9.101 |
ia | +8.936 |
. | +8.576 |
Neg logit contributions | |
relentless | -11.506 |
totality | -11.489 |
proactive | -11.413 |
disparate | -11.387 |
gradual | -11.312 |
Token | . |
Token ID | 13 |
Feature activation | +9.68e+00 |
Pos logit contributions | |
. | +30.960 |
- | +26.529 |
u | +23.727 |
_ | +22.635 |
' | +21.731 |
Neg logit contributions | |
tremend | -51.735 |
eleph | -46.281 |
metic | -45.083 |
cumbers | -44.870 |
occas | -44.457 |
Token | Draw |
Token ID | 25302 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
u | +12.047 |
- | +11.954 |
. | +10.832 |
ine | +10.653 |
ab | +10.164 |
Neg logit contributions | |
tremend | -30.820 |
mathemat | -28.691 |
metic | -28.250 |
hemor | -26.825 |
eleph | -26.645 |
Token | ing |
Token ID | 278 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
ing | +26.936 |
- | +23.602 |
u | +22.899 |
. | +22.413 |
al | +21.076 |
Neg logit contributions | |
tremend | -50.393 |
eleph | -44.921 |
metic | -44.647 |
mathemat | -44.458 |
cumbers | -44.076 |
Token | . |
Token ID | 13 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
. | +26.372 |
- | +22.722 |
u | +20.336 |
_ | +19.328 |
; | +18.355 |
Neg logit contributions | |
tremend | -44.216 |
eleph | -39.654 |
metic | -37.847 |
mathemat | -37.703 |
hemor | -37.519 |
Token | Font |
Token ID | 23252 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
u | +1.353 |
ine | +1.140 |
- | +1.124 |
ire | +1.124 |
id | +1.089 |
Neg logit contributions | |
disparate | -4.211 |
totality | -4.157 |
relentless | -4.153 |
proactive | -4.136 |
newer | -4.121 |
Token | c |
Token ID | 269 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
- | +17.173 |
. | +16.181 |
u | +15.127 |
c | +14.826 |
ic | +14.638 |
Neg logit contributions | |
tremend | -23.519 |
mathemat | -22.887 |
undermin | -22.188 |
cumbers | -21.558 |
hemor | -21.553 |
Token | v |
Token ID | 85 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
v | +27.245 |
u | +26.920 |
q | +23.734 |
- | +23.258 |
. | +22.691 |
Neg logit contributions | |
tremend | -43.130 |
metic | -42.833 |
cumbers | -41.289 |
exha | -40.738 |
eleph | -39.905 |
Token | 2 |
Token ID | 17 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
2 | +25.703 |
- | +23.759 |
u | +23.165 |
. | +22.739 |
_ | +21.838 |
Neg logit contributions | |
tremend | -51.284 |
exha | -45.867 |
undermin | -45.544 |
eleph | -45.450 |
mathemat | -45.428 |
Token | . |
Token ID | 764 |
Feature activation | +5.90e+00 |
Pos logit contributions | |
. | +27.817 |
- | +24.051 |
_ | +22.403 |
u | +22.291 |
i | +20.101 |
Neg logit contributions | |
tremend | -46.913 |
mathemat | -40.943 |
cumbers | -40.798 |
eleph | -39.881 |
hemor | -39.454 |
Token | MOR |
Token ID | 35208 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
- | +11.507 |
u | +11.381 |
. | +10.403 |
_ | +10.284 |
id | +10.108 |
Neg logit contributions | |
disparate | -12.989 |
relentless | -12.522 |
totality | -12.183 |
proactive | -12.155 |
academics | -12.048 |
Token | PH |
Token ID | 11909 |
Feature activation | +2.35e+01 |
Pos logit contributions | |
- | +19.143 |
_ | +18.075 |
. | +17.849 |
PH | +17.042 |
PA | +16.960 |
Neg logit contributions | |
tremend | -43.983 |
mathemat | -40.069 |
metic | -38.694 |
undermin | -38.523 |
hemor | -37.987 |
Token | _ |
Token ID | 62 |
Feature activation | +9.66e+00 |
Pos logit contributions | |
_ | +30.375 |
- | +26.351 |
. | +24.527 |
u | +23.950 |
i | +22.037 |
Neg logit contributions | |
tremend | -47.079 |
mathemat | -42.041 |
cumbers | -41.875 |
hemor | -41.871 |
undermin | -41.327 |
Token | BL |
Token ID | 9148 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
- | +8.829 |
u | +7.384 |
. | +7.373 |
_ | +6.664 |
ab | +6.503 |
Neg logit contributions | |
tremend | -36.128 |
mathemat | -33.529 |
undermin | -32.004 |
metic | -31.933 |
hemor | -31.918 |
Token | ACK |
Token ID | 8120 |
Feature activation | +1.81e+01 |
Pos logit contributions | |
- | +21.019 |
. | +20.233 |
u | +20.091 |
_ | +18.758 |
ab | +18.200 |
Neg logit contributions | |
tremend | -39.468 |
undermin | -32.884 |
metic | -32.784 |
hemor | -32.553 |
mathemat | -32.264 |
Token | H |
Token ID | 39 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
- | +18.866 |
H | +17.761 |
h | +17.162 |
. | +17.022 |
_ | +16.639 |
Neg logit contributions | |
tremend | -45.285 |
mathemat | -38.776 |
metic | -38.112 |
occas | -37.908 |
undermin | -37.405 |
Token | AT |
Token ID | 1404 |
Feature activation | +1.59e+01 |
Pos logit contributions | |
- | +19.100 |
. | +18.344 |
at | +18.275 |
u | +17.619 |
AT | +17.372 |
Neg logit contributions | |
tremend | -42.906 |
hemor | -37.411 |
mathemat | -36.532 |
eleph | -36.022 |
undermin | -36.018 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
u | +20.894 |
id | +20.349 |
ire | +20.009 |
ig | +19.962 |
ine | +19.611 |
Neg logit contributions | |
tremend | -31.903 |
hemor | -29.932 |
mathemat | -29.842 |
metic | -29.239 |
cumbers | -28.711 |
Token | = |
Token ID | 796 |
Feature activation | +3.71e+00 |
Pos logit contributions | |
. | +25.177 |
u | +22.926 |
- | +22.519 |
id | +21.324 |
_ | +21.230 |
Neg logit contributions | |
disparate | -19.821 |
proactive | -18.586 |
anecdotal | -18.563 |
hindsight | -18.482 |
relentless | -18.436 |
Token | [ |
Token ID | 685 |
Feature activation | +8.25e+00 |
Pos logit contributions | |
u | +8.390 |
- | +8.009 |
id | +7.722 |
ire | +7.669 |
ong | +7.633 |
Neg logit contributions | |
disparate | -8.829 |
relentless | -8.464 |
blatant | -8.399 |
academics | -8.363 |
stringent | -8.269 |
Token | system |
Token ID | 10057 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
u | +15.469 |
- | +14.339 |
id | +14.085 |
ine | +13.734 |
ab | +13.706 |
Neg logit contributions | |
disparate | -17.765 |
proactive | -17.351 |
relentless | -17.160 |
newer | -17.151 |
gradual | -17.113 |
Token | . |
Token ID | 13 |
Feature activation | +9.36e+00 |
Pos logit contributions | |
. | +31.050 |
- | +26.524 |
u | +24.732 |
_ | +23.552 |
' | +22.084 |
Neg logit contributions | |
tremend | -51.473 |
eleph | -46.492 |
metic | -45.760 |
cumbers | -45.576 |
exha | -45.015 |
Token | draw |
Token ID | 19334 |
Feature activation | +2.35e+01 |
Pos logit contributions | |
u | +14.467 |
id | +13.435 |
- | +13.266 |
ab | +13.221 |
ine | +13.016 |
Neg logit contributions | |
tremend | -24.281 |
metic | -24.278 |
mathemat | -23.498 |
behavi | -23.101 |
unnecess | -22.916 |
Token | ing |
Token ID | 278 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
ing | +27.765 |
- | +23.892 |
u | +22.887 |
. | +22.522 |
al | +22.140 |
Neg logit contributions | |
tremend | -50.914 |
eleph | -46.435 |
metic | -45.988 |
cumbers | -45.612 |
exha | -45.402 |
Token | . |
Token ID | 13 |
Feature activation | +3.80e+00 |
Pos logit contributions | |
. | +29.455 |
- | +25.024 |
u | +22.093 |
_ | +21.744 |
' | +20.862 |
Neg logit contributions | |
tremend | -50.666 |
eleph | -45.334 |
metic | -43.867 |
cumbers | -43.742 |
occas | -43.116 |
Token | String |
Token ID | 10100 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
u | +5.014 |
id | +4.290 |
ine | +4.278 |
- | +4.277 |
ab | +4.103 |
Neg logit contributions | |
disparate | -13.820 |
totality | -13.587 |
relentless | -13.578 |
newer | -13.539 |
proactive | -13.519 |
Token | Al |
Token ID | 2348 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
- | +19.392 |
al | +19.102 |
. | +18.750 |
u | +18.141 |
ine | +17.786 |
Neg logit contributions | |
tremend | -24.349 |
disparate | -23.156 |
totality | -22.787 |
hindsight | -22.730 |
relentless | -22.443 |
Token | ignment |
Token ID | 16747 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
u | +20.400 |
id | +19.946 |
ire | +19.841 |
ig | +19.128 |
ine | +19.056 |
Neg logit contributions | |
tremend | -33.461 |
hemor | -31.737 |
cumbers | -31.239 |
metic | -30.317 |
behavi | -29.555 |
Token | s |
Token ID | 82 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
u | +2.414 |
ire | +1.964 |
ab | +1.889 |
id | +1.851 |
ine | +1.808 |
Neg logit contributions | |
disparate | -8.784 |
relentless | -8.608 |
newer | -8.560 |
totality | -8.534 |
proactive | -8.459 |
Token | z |
Token ID | 89 |
Feature activation | +9.04e+00 |
Pos logit contributions | |
z | +22.452 |
u | +20.117 |
q | +19.431 |
ine | +19.232 |
ab | +19.082 |
Neg logit contributions | |
disparate | -21.855 |
totality | -21.252 |
disgruntled | -20.761 |
proactive | -20.521 |
relentless | -20.476 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
u | +17.606 |
ab | +16.462 |
- | +16.418 |
ire | +16.097 |
id | +16.052 |
Neg logit contributions | |
disparate | -17.377 |
relentless | -16.634 |
proactive | -16.570 |
totality | -16.558 |
disgruntled | -16.290 |
Token | = |
Token ID | 796 |
Feature activation | +4.63e+00 |
Pos logit contributions | |
u | +17.727 |
. | +17.397 |
- | +16.821 |
id | +16.025 |
_ | +15.662 |
Neg logit contributions | |
tremend | -29.700 |
mathemat | -27.876 |
hemor | -27.059 |
undermin | -26.768 |
metic | -26.665 |
Token | [ |
Token ID | 685 |
Feature activation | +8.77e+00 |
Pos logit contributions | |
u | +10.077 |
- | +9.616 |
ire | +9.292 |
id | +9.190 |
ong | +9.183 |
Neg logit contributions | |
disparate | -10.548 |
relentless | -10.360 |
blatant | -10.229 |
stringent | -10.131 |
academics | -10.073 |
Token | system |
Token ID | 10057 |
Feature activation | +2.34e+01 |
Pos logit contributions | |
u | +14.438 |
- | +13.304 |
id | +12.618 |
ine | +12.373 |
ab | +12.230 |
Neg logit contributions | |
hemor | -21.692 |
tremend | -21.609 |
behavi | -21.418 |
mathemat | -21.410 |
undermin | -21.290 |
Token | . |
Token ID | 13 |
Feature activation | +5.99e+00 |
Pos logit contributions | |
. | +30.903 |
- | +26.681 |
u | +24.538 |
_ | +23.190 |
s | +22.030 |
Neg logit contributions | |
tremend | -50.283 |
eleph | -45.220 |
cumbers | -44.911 |
metic | -44.340 |
exha | -44.123 |
Token | windows |
Token ID | 28457 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
u | +8.500 |
ab | +7.191 |
- | +7.090 |
ine | +7.060 |
id | +6.903 |
Neg logit contributions | |
totality | -18.886 |
proactive | -18.792 |
disparate | -18.746 |
relentless | -18.700 |
blatant | -18.613 |
Token | . |
Token ID | 13 |
Feature activation | +6.80e+00 |
Pos logit contributions | |
. | +29.802 |
- | +24.975 |
u | +22.134 |
_ | +21.749 |
' | +20.754 |
Neg logit contributions | |
tremend | -47.027 |
eleph | -42.317 |
cumbers | -42.190 |
mathemat | -40.904 |
metic | -40.886 |
Token | forms |
Token ID | 23914 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
u | +9.010 |
id | +8.094 |
ab | +8.025 |
- | +7.775 |
ine | +7.756 |
Neg logit contributions | |
totality | -20.523 |
disparate | -20.376 |
proactive | -20.331 |
relentless | -20.244 |
newer | -20.204 |
Token | . |
Token ID | 13 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
. | +28.386 |
- | +23.915 |
u | +22.740 |
_ | +21.485 |
id | +21.141 |
Neg logit contributions | |
tremend | -42.850 |
metic | -38.627 |
cumbers | -38.271 |
eleph | -38.242 |
hemor | -37.695 |
Token | cv |
Token ID | 33967 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
u | +4.295 |
ab | +3.568 |
ire | +3.515 |
q | +3.416 |
ix | +3.368 |
Neg logit contributions | |
disparate | -11.672 |
relentless | -11.169 |
totality | -11.128 |
newer | -11.121 |
genuine | -11.105 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
u | +24.419 |
2 | +24.292 |
- | +23.802 |
. | +23.027 |
b | +21.814 |
Neg logit contributions | |
tremend | -45.595 |
metic | -42.715 |
exha | -42.437 |
eleph | -42.282 |
hemor | -41.808 |
Token | . |
Token ID | 13 |
Feature activation | +4.31e+00 |
Pos logit contributions | |
. | +27.973 |
- | +23.689 |
u | +22.479 |
_ | +21.396 |
' | +19.900 |
Neg logit contributions | |
tremend | -48.745 |
metic | -43.433 |
eleph | -43.169 |
hemor | -42.515 |
cumbers | -42.481 |
Token | M |
Token ID | 44 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
u | +6.528 |
- | +6.067 |
id | +5.768 |
ab | +5.689 |
ire | +5.559 |
Neg logit contributions | |
disparate | -13.664 |
relentless | -13.217 |
totality | -13.186 |
hindsight | -13.146 |
proactive | -13.112 |
Token | OR |
Token ID | 1581 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
- | +21.252 |
. | +20.303 |
_ | +19.989 |
u | +19.650 |
ong | +18.314 |
Neg logit contributions | |
tremend | -32.562 |
mathemat | -30.391 |
metic | -30.000 |
undermin | -29.900 |
behavi | -29.354 |
Token | PH |
Token ID | 11909 |
Feature activation | +2.34e+01 |
Pos logit contributions | |
- | +23.193 |
. | +21.637 |
_ | +21.021 |
PA | +19.579 |
PH | +19.362 |
Neg logit contributions | |
tremend | -41.533 |
mathemat | -36.847 |
metic | -35.952 |
undermin | -35.760 |
satell | -34.838 |
Token | _ |
Token ID | 62 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
_ | +30.273 |
- | +26.811 |
. | +25.281 |
u | +24.821 |
+ | +22.583 |
Neg logit contributions | |
tremend | -44.837 |
hemor | -40.135 |
cumbers | -39.854 |
mathemat | -39.822 |
metic | -39.610 |
Token | RECT |
Token ID | 23988 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
u | +3.301 |
- | +2.990 |
q | +2.760 |
ab | +2.758 |
ire | +2.666 |
Neg logit contributions | |
disparate | -8.924 |
relentless | -8.694 |
totality | -8.661 |
newer | -8.651 |
proactive | -8.596 |
Token | , |
Token ID | 11 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
- | +25.209 |
u | +25.152 |
_ | +24.082 |
. | +23.277 |
ong | +23.015 |
Neg logit contributions | |
disparate | -17.508 |
relentless | -16.733 |
stringent | -16.724 |
blatant | -16.649 |
totality | -16.377 |
Token | ( |
Token ID | 357 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
u | +4.339 |
- | +4.038 |
ire | +3.914 |
ab | +3.866 |
ine | +3.828 |
Neg logit contributions | |
disparate | -5.909 |
blatant | -5.604 |
relentless | -5.601 |
hindsight | -5.569 |
drastic | -5.515 |
Token | 21 |
Token ID | 2481 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
u | +2.098 |
- | +1.770 |
ire | +1.741 |
ab | +1.706 |
id | +1.671 |
Neg logit contributions | |
disparate | -6.597 |
blatant | -6.335 |
relentless | -6.326 |
genuine | -6.324 |
totality | -6.319 |
Token | is |
Token ID | 318 |
Feature activation | +8.91e+00 |
Pos logit contributions | |
- | +17.507 |
. | +17.046 |
u | +16.730 |
ine | +15.829 |
id | +15.414 |
Neg logit contributions | |
tremend | -27.080 |
mathemat | -25.412 |
undermin | -24.429 |
misunder | -24.218 |
behavi | -24.031 |
Token | an |
Token ID | 281 |
Feature activation | +5.98e+00 |
Pos logit contributions | |
- | +18.433 |
. | +17.702 |
u | +16.224 |
ag | +16.009 |
ic | +16.009 |
Neg logit contributions | |
tremend | -20.023 |
mathemat | -18.744 |
misunder | -17.100 |
cumbers | -16.610 |
unnecess | -16.025 |
Token | autos |
Token ID | 44619 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
- | +12.862 |
. | +12.320 |
u | +12.152 |
ag | +11.289 |
ine | +11.288 |
Neg logit contributions | |
tremend | -12.971 |
mathemat | -12.928 |
misunder | -12.278 |
undermin | -11.933 |
behavi | -11.919 |
Token | omal |
Token ID | 18048 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
u | +23.874 |
ome | +22.515 |
id | +22.273 |
um | +22.085 |
- | +21.477 |
Neg logit contributions | |
tremend | -35.824 |
behavi | -34.364 |
undermin | -34.080 |
cumbers | -33.770 |
mathemat | -33.605 |
Token | dominant |
Token ID | 11410 |
Feature activation | +9.08e+00 |
Pos logit contributions | |
- | +22.055 |
. | +20.351 |
u | +18.431 |
ine | +17.349 |
id | +16.601 |
Neg logit contributions | |
mathemat | -30.292 |
unnecess | -25.754 |
tremend | -25.694 |
Palestin | -25.244 |
cumbers | -25.241 |
Token | ker |
Token ID | 41927 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
- | +17.774 |
. | +17.062 |
u | +16.119 |
ia | +14.982 |
er | +14.747 |
Neg logit contributions | |
tremend | -17.348 |
mathemat | -17.040 |
undermin | -16.699 |
misunder | -15.892 |
disparate | -15.617 |
Token | at |
Token ID | 265 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
at | +28.634 |
ati | +24.487 |
id | +24.155 |
ac | +24.023 |
- | +24.019 |
Neg logit contributions | |
tremend | -44.812 |
eleph | -42.838 |
cumbers | -42.528 |
reluct | -42.465 |
metic | -41.976 |
Token | oder |
Token ID | 12342 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
ode | +22.233 |
oder | +21.441 |
id | +21.080 |
ine | +20.479 |
- | +20.201 |
Neg logit contributions | |
tremend | -34.254 |
behavi | -32.125 |
mathemat | -31.931 |
unnecess | -31.866 |
cumbers | -31.851 |
Token | ma |
Token ID | 2611 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
ia | +23.968 |
ma | +21.486 |
u | +21.472 |
- | +21.227 |
ium | +20.910 |
Neg logit contributions | |
tremend | -33.579 |
undermin | -32.881 |
cumbers | -32.648 |
mathemat | -32.207 |
misunder | -31.708 |
Token | of |
Token ID | 286 |
Feature activation | +6.30e+00 |
Pos logit contributions | |
- | +20.665 |
. | +19.861 |
u | +18.437 |
ine | +17.284 |
ia | +17.164 |
Neg logit contributions | |
tremend | -34.600 |
mathemat | -33.526 |
cumbers | -31.621 |
undermin | -31.466 |
misunder | -30.908 |
Token | late |
Token ID | 2739 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
- | +13.333 |
. | +12.476 |
u | +12.269 |
ine | +11.999 |
ire | +11.430 |
Neg logit contributions | |
tremend | -15.377 |
mathemat | -14.979 |
behavi | -14.100 |
undermin | -13.855 |
DRAG | -13.399 |
Token | . |
Token ID | 13 |
Feature activation | +5.67e+00 |
Pos logit contributions | |
. | +14.352 |
u | +12.536 |
ab | +12.253 |
- | +12.182 |
á | +11.804 |
Neg logit contributions | |
disparate | -18.168 |
meticulous | -17.502 |
newer | -17.292 |
blatant | -17.155 |
totality | -17.148 |
Token | Bush |
Token ID | 5511 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
u | +11.359 |
- | +11.025 |
ab | +10.728 |
ia | +10.568 |
ire | +10.534 |
Neg logit contributions | |
tremend | -13.460 |
disparate | -13.355 |
mathemat | -13.278 |
totality | -13.014 |
misunder | -12.850 |
Token | was |
Token ID | 373 |
Feature activation | -6.99e+00 |
Pos logit contributions | |
u | +2.766 |
- | +2.610 |
ia | +2.552 |
id | +2.513 |
aga | +2.497 |
Neg logit contributions | |
disparate | -2.779 |
newer | -2.641 |
totality | -2.637 |
genuine | -2.619 |
blatant | -2.616 |
Token | president |
Token ID | 1893 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
disparate | +21.697 |
relentless | +21.490 |
newer | +21.406 |
genuine | +21.233 |
various | +21.180 |
Neg logit contributions | |
u | -11.507 |
aga | -11.124 |
ire | -11.061 |
ong | -10.964 |
iev | -10.731 |
Token | -- |
Token ID | 438 |
Feature activation | -5.30e+00 |
Pos logit contributions | |
- | +3.613 |
u | +3.545 |
. | +3.325 |
ine | +3.263 |
ia | +3.260 |
Neg logit contributions | |
disparate | -4.200 |
blatant | -4.064 |
newer | -3.985 |
genuine | -3.968 |
relentless | -3.966 |
Token | and |
Token ID | 290 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
disparate | +19.938 |
newer | +19.555 |
relentless | +19.455 |
various | +19.399 |
genuine | +19.387 |
Neg logit contributions | |
u | -6.469 |
aga | -5.952 |
ire | -5.882 |
ong | -5.635 |
ine | -5.483 |
Token | a |
Token ID | 257 |
Feature activation | -7.61e+00 |
Pos logit contributions | |
those | +35.930 |
many | +35.394 |
various | +34.740 |
modern | +34.540 |
newer | +34.113 |
Neg logit contributions | |
u | -14.309 |
iev | -13.489 |
ong | -13.031 |
igr | -12.875 |
ire | -12.704 |
Token | popular |
Token ID | 2968 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
disparate | +25.214 |
relentless | +24.849 |
genuine | +24.832 |
newer | +24.804 |
blatant | +24.593 |
Neg logit contributions | |
u | -10.104 |
aga | -9.508 |
ire | -9.434 |
iev | -9.190 |
ong | -9.147 |
Token | one |
Token ID | 530 |
Feature activation | -2.38e+00 |
Pos logit contributions | |
disparate | +11.230 |
newer | +10.939 |
blatant | +10.877 |
genuine | +10.861 |
relentless | +10.857 |
Neg logit contributions | |
u | -5.751 |
aga | -5.330 |
ire | -5.204 |
ong | -5.132 |
ine | -5.107 |
Token | -- |
Token ID | 1377 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
disparate | +10.898 |
newer | +10.603 |
blatant | +10.593 |
totality | +10.526 |
relentless | +10.520 |
Neg logit contributions | |
u | -1.949 |
- | -1.585 |
aga | -1.554 |
ire | -1.524 |
ine | -1.468 |
Token | 12 |
Token ID | 1105 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
disparate | +4.245 |
blatant | +4.116 |
genuine | +4.085 |
newer | +4.077 |
relentless | +4.048 |
Neg logit contributions | |
u | -2.803 |
aga | -2.595 |
ine | -2.587 |
ire | -2.538 |
ong | -2.535 |
Token | 's |
Token ID | 338 |
Feature activation | -6.05e+00 |
Pos logit contributions | |
u | +6.059 |
- | +5.791 |
ia | +5.638 |
ine | +5.503 |
ab | +5.443 |
Neg logit contributions | |
disparate | -6.559 |
stringent | -6.387 |
blatant | -6.311 |
newer | -6.257 |
stricter | -6.246 |
Token | a |
Token ID | 257 |
Feature activation | -4.01e+00 |
Pos logit contributions | |
disparate | +20.560 |
newer | +20.119 |
genuine | +19.938 |
relentless | +19.933 |
various | +19.891 |
Neg logit contributions | |
u | -10.355 |
aga | -9.696 |
ire | -9.616 |
ine | -9.306 |
ong | -9.302 |
Token | big |
Token ID | 1263 |
Feature activation | -7.25e-02 |
Pos logit contributions | |
disparate | +14.356 |
newer | +13.990 |
relentless | +13.888 |
various | +13.880 |
genuine | +13.878 |
Neg logit contributions | |
u | -7.104 |
aga | -6.491 |
ire | -6.378 |
ong | -6.252 |
ine | -6.231 |
Token | place |
Token ID | 1295 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
disparate | +0.145 |
genuine | +0.139 |
academics | +0.139 |
blatant | +0.138 |
relentless | +0.137 |
Neg logit contributions | |
u | -0.237 |
- | -0.232 |
ong | -0.222 |
aga | -0.221 |
id | -0.219 |
Token | , |
Token ID | 11 |
Feature activation | -7.64e+00 |
Pos logit contributions | |
u | +4.259 |
- | +4.093 |
. | +4.032 |
ine | +3.804 |
ia | +3.802 |
Neg logit contributions | |
totality | -4.890 |
disparate | -4.889 |
blatant | -4.759 |
relentless | -4.752 |
gradual | -4.743 |
Token | and |
Token ID | 290 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
disparate | +22.717 |
newer | +22.423 |
various | +22.265 |
relentless | +22.196 |
genuine | +22.181 |
Neg logit contributions | |
u | -12.787 |
aga | -12.486 |
ire | -12.393 |
iev | -12.055 |
ong | -11.956 |
Token | we |
Token ID | 356 |
Feature activation | -3.54e+00 |
Pos logit contributions | |
those | +34.997 |
many | +34.989 |
various | +34.608 |
newer | +34.532 |
disparate | +33.944 |
Neg logit contributions | |
aga | -14.961 |
ée | -14.909 |
iev | -14.427 |
u | -14.312 |
union | -14.256 |
Token | 're |
Token ID | 821 |
Feature activation | -4.87e+00 |
Pos logit contributions | |
disparate | +10.398 |
newer | +10.042 |
genuine | +9.953 |
blatant | +9.950 |
relentless | +9.935 |
Neg logit contributions | |
u | -8.335 |
ire | -7.861 |
aga | -7.857 |
ine | -7.664 |
ong | -7.605 |
Token | sure |
Token ID | 1654 |
Feature activation | -5.95e+00 |
Pos logit contributions | |
disparate | +14.088 |
newer | +13.676 |
genuine | +13.528 |
relentless | +13.485 |
blatant | +13.479 |
Neg logit contributions | |
u | -11.444 |
aga | -10.813 |
ire | -10.721 |
ine | -10.510 |
ong | -10.495 |
Token | there |
Token ID | 612 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
disparate | +19.890 |
newer | +19.478 |
genuine | +19.275 |
various | +19.239 |
relentless | +19.223 |
Neg logit contributions | |
u | -10.702 |
aga | -10.037 |
ire | -9.901 |
ong | -9.629 |
ine | -9.626 |
Token | are |
Token ID | 389 |
Feature activation | -7.33e+00 |
Pos logit contributions | |
disparate | +4.966 |
totality | +4.826 |
blatant | +4.794 |
relentless | +4.788 |
newer | +4.764 |
Neg logit contributions | |
u | -1.814 |
ire | -1.575 |
ine | -1.554 |
ab | -1.546 |
- | -1.529 |
Token | reducing |
Token ID | 8868 |
Feature activation | -4.70e+00 |
Pos logit contributions | |
disparate | +22.062 |
newer | +21.614 |
genuine | +21.505 |
relentless | +21.405 |
various | +21.402 |
Neg logit contributions | |
u | -11.587 |
aga | -10.852 |
ire | -10.799 |
ong | -10.500 |
ine | -10.310 |
Token | the |
Token ID | 262 |
Feature activation | -5.86e+00 |
Pos logit contributions | |
disparate | +15.743 |
newer | +15.417 |
relentless | +15.259 |
blatant | +15.206 |
genuine | +15.194 |
Neg logit contributions | |
u | -9.038 |
aga | -8.462 |
ire | -8.394 |
ine | -8.231 |
id | -8.124 |
Token | shelter |
Token ID | 11772 |
Feature activation | +4.33e+00 |
Pos logit contributions | |
disparate | +18.851 |
newer | +18.357 |
genuine | +18.234 |
various | +18.196 |
relentless | +18.187 |
Neg logit contributions | |
u | -11.143 |
aga | -10.469 |
ire | -10.371 |
ong | -10.120 |
ine | -10.040 |
Token | population |
Token ID | 3265 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
- | +12.128 |
ine | +11.030 |
. | +11.023 |
u | +10.922 |
id | +10.810 |
Neg logit contributions | |
hindsight | -7.887 |
disparate | -7.546 |
newer | -7.524 |
blatant | -7.413 |
relentless | -7.387 |
Token | . |
Token ID | 13 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
- | +2.796 |
. | +2.782 |
u | +2.732 |
id | +2.599 |
ong | +2.515 |
Neg logit contributions | |
disparate | -4.487 |
blatant | -4.344 |
newer | -4.288 |
relentless | -4.267 |
genuine | -4.260 |
Token | But |
Token ID | 887 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
those | +25.937 |
various | +25.858 |
newer | +25.798 |
modern | +25.726 |
many | +25.599 |
Neg logit contributions | |
aga | -14.055 |
ire | -13.867 |
u | -13.561 |
iev | -13.559 |
ong | -13.066 |
Token | , |
Token ID | 11 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
those | +35.594 |
many | +35.138 |
various | +34.349 |
disparate | +34.113 |
newer | +33.754 |
Neg logit contributions | |
ire | -14.201 |
aga | -13.976 |
u | -13.907 |
ong | -13.630 |
ée | -13.460 |
Token | of |
Token ID | 286 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
those | +29.987 |
many | +29.831 |
various | +29.653 |
disparate | +29.436 |
newer | +29.165 |
Neg logit contributions | |
ire | -14.459 |
u | -14.266 |
aga | -13.859 |
ée | -13.318 |
ong | -13.269 |
Token | course |
Token ID | 1781 |
Feature activation | +3.97e+00 |
Pos logit contributions | |
u | +0.597 |
- | +0.571 |
aga | +0.566 |
ab | +0.561 |
ire | +0.556 |
Neg logit contributions | |
disparate | -0.571 |
newer | -0.547 |
relentless | -0.544 |
blatant | -0.542 |
venerable | -0.539 |
Token | , |
Token ID | 11 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
u | +7.312 |
- | +7.152 |
ab | +6.535 |
. | +6.533 |
id | +6.500 |
Neg logit contributions | |
disparate | -11.107 |
blatant | -10.558 |
relentless | -10.494 |
venerable | -10.494 |
newer | -10.440 |
Token | there |
Token ID | 612 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
those | +29.418 |
disparate | +29.309 |
many | +29.009 |
various | +28.893 |
newer | +28.750 |
Neg logit contributions | |
u | -13.724 |
aga | -13.368 |
ire | -13.121 |
ong | -12.754 |
ée | -12.692 |
Token | appropriate |
Token ID | 13335 |
Feature activation | +2.67e+00 |
Pos logit contributions | |
disparate | +1.553 |
newer | +1.526 |
relentless | +1.485 |
drastic | +1.479 |
tremendous | +1.475 |
Neg logit contributions | |
u | -1.207 |
- | -1.141 |
ine | -1.115 |
ab | -1.104 |
id | -1.081 |
Token | language |
Token ID | 3303 |
Feature activation | +3.22e+00 |
Pos logit contributions | |
- | +7.406 |
u | +7.392 |
ia | +6.833 |
ine | +6.763 |
aga | +6.761 |
Neg logit contributions | |
disparate | -5.472 |
newer | -5.308 |
poorer | -5.231 |
gradual | -5.231 |
genuine | -5.174 |
Token | � |
Token ID | 447 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
u | +6.465 |
- | +6.238 |
. | +6.171 |
id | +5.849 |
ia | +5.817 |
Neg logit contributions | |
disparate | -8.734 |
totality | -8.644 |
venerable | -8.555 |
newer | -8.542 |
relentless | -8.476 |
Token | � |
Token ID | 247 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
� | +16.764 |
� | +16.556 |
� | +16.240 |
� | +14.788 |
� | +14.296 |
Neg logit contributions | |
blatant | -21.733 |
mathemat | -21.447 |
disparate | -21.307 |
venerable | -21.247 |
totality | -21.079 |
Token | . |
Token ID | 13 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
u | +0.714 |
ine | +0.653 |
- | +0.653 |
id | +0.642 |
ire | +0.641 |
Neg logit contributions | |
disparate | -1.025 |
newer | -1.007 |
totality | -0.997 |
gradual | -0.989 |
genuine | -0.987 |
Token | But |
Token ID | 887 |
Feature activation | -1.47e+01 |
Pos logit contributions | |
those | +23.111 |
many | +22.925 |
modern | +22.893 |
various | +22.693 |
newer | +22.303 |
Neg logit contributions | |
aga | -17.218 |
iev | -16.542 |
ire | -16.067 |
u | -15.910 |
union | -15.819 |
Token | when |
Token ID | 618 |
Feature activation | -9.08e+00 |
Pos logit contributions | |
those | +35.109 |
many | +34.214 |
modern | +33.858 |
genuine | +33.563 |
various | +33.278 |
Neg logit contributions | |
aga | -15.075 |
iev | -15.022 |
ire | -14.766 |
u | -14.538 |
ée | -14.251 |
Token | a |
Token ID | 257 |
Feature activation | -8.96e+00 |
Pos logit contributions | |
disparate | +27.856 |
genuine | +27.467 |
those | +27.417 |
modern | +27.321 |
blatant | +27.302 |
Neg logit contributions | |
u | -12.860 |
aga | -12.553 |
ire | -12.144 |
iev | -11.807 |
ée | -11.782 |
Token | politician |
Token ID | 14971 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
genuine | +26.610 |
disparate | +26.603 |
modern | +26.403 |
blatant | +26.203 |
newer | +26.185 |
Neg logit contributions | |
u | -13.249 |
aga | -12.971 |
iev | -12.550 |
ire | -12.456 |
ong | -12.312 |
Token | tries |
Token ID | 8404 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
disparate | +6.845 |
newer | +6.643 |
totality | +6.599 |
relentless | +6.554 |
blatant | +6.522 |
Neg logit contributions | |
u | -4.797 |
ire | -4.449 |
aga | -4.441 |
- | -4.424 |
ine | -4.382 |
Token | to |
Token ID | 284 |
Feature activation | -6.24e+00 |
Pos logit contributions | |
disparate | +4.929 |
newer | +4.794 |
totality | +4.756 |
relentless | +4.694 |
genuine | +4.674 |
Neg logit contributions | |
u | -3.009 |
aga | -2.780 |
ire | -2.766 |
- | -2.759 |
ong | -2.734 |
Token | on |
Token ID | 319 |
Feature activation | -3.79e+00 |
Pos logit contributions | |
. | +6.444 |
- | +6.372 |
u | +6.282 |
ine | +6.151 |
ong | +5.959 |
Neg logit contributions | |
blatant | -6.224 |
genuine | -6.129 |
venerable | -6.106 |
disparate | -6.096 |
totality | -6.052 |
Token | Fisher |
Token ID | 14388 |
Feature activation | +7.57e+00 |
Pos logit contributions | |
disparate | +11.212 |
blatant | +10.789 |
newer | +10.778 |
genuine | +10.765 |
relentless | +10.661 |
Neg logit contributions | |
u | -9.530 |
ire | -8.925 |
aga | -8.896 |
- | -8.829 |
ine | -8.807 |
Token | s |
Token ID | 82 |
Feature activation | +4.02e+00 |
Pos logit contributions | |
- | +17.546 |
y | +16.381 |
ia | +16.199 |
. | +15.990 |
s | +15.987 |
Neg logit contributions | |
disparate | -13.000 |
blatant | -12.686 |
genuine | -12.515 |
proactive | -12.451 |
tremend | -12.261 |
Token | Island |
Token ID | 5451 |
Feature activation | +3.71e+00 |
Pos logit contributions | |
- | +10.058 |
ia | +9.701 |
u | +9.528 |
. | +9.485 |
ab | +9.480 |
Neg logit contributions | |
disparate | -8.833 |
blatant | -8.078 |
genuine | -8.040 |
totality | -8.015 |
proactive | -7.891 |
Token | -- |
Token ID | 1377 |
Feature activation | -3.96e+00 |
Pos logit contributions | |
. | +9.484 |
u | +9.426 |
- | +9.365 |
ine | +9.154 |
ia | +8.960 |
Neg logit contributions | |
blatant | -7.460 |
disparate | -7.401 |
proactive | -7.293 |
stringent | -7.265 |
genuine | -7.236 |
Token | but |
Token ID | 475 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
disparate | +13.237 |
newer | +12.793 |
blatant | +12.789 |
genuine | +12.757 |
relentless | +12.747 |
Neg logit contributions | |
u | -8.020 |
aga | -7.449 |
ire | -7.314 |
ine | -7.277 |
ong | -7.206 |
Token | early |
Token ID | 1903 |
Feature activation | -4.68e+00 |
Pos logit contributions | |
those | +35.296 |
many | +34.813 |
various | +34.433 |
newer | +34.333 |
disparate | +34.099 |
Neg logit contributions | |
iev | -14.273 |
u | -14.210 |
ire | -14.145 |
aga | -13.915 |
ache | -13.689 |
Token | in |
Token ID | 287 |
Feature activation | -2.56e+00 |
Pos logit contributions | |
disparate | +18.445 |
newer | +18.013 |
relentless | +17.903 |
genuine | +17.893 |
blatant | +17.874 |
Neg logit contributions | |
u | -6.148 |
aga | -5.561 |
ire | -5.489 |
ine | -5.301 |
ong | -5.234 |
Token | 1989 |
Token ID | 11104 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
disparate | +5.105 |
blatant | +4.810 |
relentless | +4.741 |
genuine | +4.721 |
proactive | +4.663 |
Neg logit contributions | |
u | -8.941 |
- | -8.418 |
aga | -8.410 |
ire | -8.408 |
ine | -8.356 |
Token | he |
Token ID | 339 |
Feature activation | -2.36e+00 |
Pos logit contributions | |
- | +2.979 |
u | +2.923 |
ine | +2.854 |
id | +2.794 |
ia | +2.777 |
Neg logit contributions | |
disparate | -2.071 |
relentless | -1.999 |
proactive | -1.998 |
blatant | -1.992 |
totality | -1.982 |
Token | found |
Token ID | 1043 |
Feature activation | -3.18e+00 |
Pos logit contributions | |
disparate | +6.670 |
newer | +6.433 |
totality | +6.433 |
blatant | +6.415 |
relentless | +6.385 |
Neg logit contributions | |
u | -6.005 |
ire | -5.693 |
aga | -5.671 |
ine | -5.620 |
- | -5.548 |
Token | was |
Token ID | 373 |
Feature activation | -7.85e+00 |
Pos logit contributions | |
newer | +29.551 |
various | +29.209 |
disparate | +29.045 |
venerable | +28.819 |
genuine | +28.819 |
Neg logit contributions | |
u | -10.306 |
ire | -10.137 |
aga | -9.986 |
ong | -9.544 |
union | -9.491 |
Token | right |
Token ID | 826 |
Feature activation | -7.96e-01 |
Pos logit contributions | |
disparate | +25.562 |
newer | +25.204 |
various | +25.151 |
genuine | +25.049 |
relentless | +24.928 |
Neg logit contributions | |
u | -11.144 |
ire | -10.626 |
aga | -10.580 |
ong | -10.076 |
ée | -9.968 |
Token | at |
Token ID | 379 |
Feature activation | -3.96e+00 |
Pos logit contributions | |
disparate | +3.132 |
totality | +3.027 |
blatant | +3.015 |
relentless | +2.996 |
genuine | +2.980 |
Neg logit contributions | |
u | -1.186 |
- | -1.082 |
ire | -1.020 |
ab | -0.996 |
ong | -0.983 |
Token | release |
Token ID | 2650 |
Feature activation | +4.79e-01 |
Pos logit contributions | |
disparate | +12.637 |
newer | +12.178 |
relentless | +12.128 |
genuine | +12.055 |
blatant | +12.048 |
Neg logit contributions | |
u | -8.783 |
aga | -8.181 |
ire | -8.127 |
ine | -8.065 |
ong | -7.918 |
Token | time |
Token ID | 640 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
- | +1.035 |
u | +1.007 |
. | +0.956 |
ine | +0.939 |
id | +0.926 |
Neg logit contributions | |
disparate | -1.486 |
blatant | -1.422 |
relentless | -1.421 |
totality | -1.404 |
gradual | -1.397 |
Token | and |
Token ID | 290 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
disparate | +5.383 |
relentless | +5.207 |
blatant | +5.205 |
totality | +5.163 |
genuine | +5.157 |
Neg logit contributions | |
u | -1.259 |
- | -1.123 |
aga | -1.047 |
ine | -1.029 |
ire | -1.009 |
Token | the |
Token ID | 262 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
those | +34.821 |
newer | +34.630 |
many | +34.510 |
various | +34.494 |
modern | +33.501 |
Neg logit contributions | |
u | -14.479 |
union | -13.988 |
ong | -13.932 |
aga | -13.827 |
ée | -13.744 |
Token | resolution |
Token ID | 6323 |
Feature activation | -9.84e-01 |
Pos logit contributions | |
newer | +32.897 |
various | +32.363 |
disparate | +31.992 |
genuine | +31.849 |
modern | +31.789 |
Neg logit contributions | |
u | -13.305 |
aga | -12.716 |
ong | -12.491 |
ée | -12.372 |
ire | -12.158 |
Token | was |
Token ID | 373 |
Feature activation | -9.81e+00 |
Pos logit contributions | |
disparate | +2.950 |
relentless | +2.773 |
blatant | +2.763 |
genuine | +2.733 |
newer | +2.723 |
Neg logit contributions | |
u | -2.371 |
- | -2.326 |
ine | -2.163 |
ab | -2.138 |
ire | -2.137 |
Token | most |
Token ID | 749 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
newer | +28.761 |
disparate | +28.736 |
various | +28.685 |
genuine | +28.677 |
tremendous | +28.590 |
Neg logit contributions | |
u | -12.147 |
aga | -11.846 |
ire | -11.737 |
ong | -11.434 |
union | -11.287 |
Token | impressive |
Token ID | 8036 |
Feature activation | -2.05e+00 |
Pos logit contributions | |
disparate | +10.542 |
newer | +10.218 |
totality | +10.202 |
relentless | +10.144 |
genuine | +10.089 |
Neg logit contributions | |
u | -7.045 |
ire | -6.693 |
aga | -6.633 |
ab | -6.413 |
ine | -6.392 |
Token | all |
Token ID | 477 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
u | +3.901 |
- | +3.811 |
ine | +3.793 |
ab | +3.710 |
ire | +3.705 |
Neg logit contributions | |
disparate | -1.497 |
newer | -1.460 |
totality | -1.389 |
stringent | -1.330 |
relentless | -1.327 |
Token | the |
Token ID | 262 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
disparate | +6.200 |
relentless | +6.077 |
newer | +6.074 |
blatant | +6.042 |
genuine | +5.988 |
Neg logit contributions | |
u | -4.905 |
- | -4.713 |
ire | -4.645 |
ong | -4.545 |
ine | -4.529 |
Token | more |
Token ID | 517 |
Feature activation | -1.76e+00 |
Pos logit contributions | |
disparate | +3.228 |
genuine | +3.004 |
relentless | +2.992 |
newer | +2.992 |
blatant | +2.968 |
Neg logit contributions | |
u | -9.808 |
aga | -9.298 |
ire | -9.296 |
- | -9.216 |
ia | -9.194 |
Token | impressive |
Token ID | 8036 |
Feature activation | +5.55e-01 |
Pos logit contributions | |
disparate | +2.602 |
newer | +2.593 |
totality | +2.579 |
various | +2.397 |
relentless | +2.332 |
Neg logit contributions | |
u | -6.725 |
- | -6.485 |
aga | -6.470 |
ire | -6.466 |
ab | -6.367 |
Token | . |
Token ID | 13 |
Feature activation | -9.29e+00 |
Pos logit contributions | |
u | +0.535 |
. | +0.506 |
- | +0.503 |
ine | +0.445 |
id | +0.438 |
Neg logit contributions | |
disparate | -2.373 |
blatant | -2.293 |
totality | -2.293 |
relentless | -2.290 |
newer | -2.281 |
Token | But |
Token ID | 887 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
modern | +23.587 |
newer | +23.443 |
those | +23.436 |
various | +23.321 |
many | +23.002 |
Neg logit contributions | |
aga | -14.469 |
u | -14.196 |
ire | -13.810 |
iev | -13.758 |
ong | -13.326 |
Token | Louisiana |
Token ID | 13340 |
Feature activation | -2.17e-01 |
Pos logit contributions | |
those | +35.178 |
many | +34.660 |
modern | +34.263 |
newer | +34.220 |
various | +34.019 |
Neg logit contributions | |
u | -14.142 |
iev | -13.458 |
aga | -13.371 |
ire | -13.183 |
illo | -13.038 |
Token | voters |
Token ID | 4446 |
Feature activation | -2.61e+00 |
Pos logit contributions | |
disparate | +0.627 |
blatant | +0.604 |
relentless | +0.603 |
genuine | +0.602 |
newer | +0.601 |
Neg logit contributions | |
u | -0.511 |
- | -0.500 |
aga | -0.483 |
ia | -0.479 |
ab | -0.469 |
Token | have |
Token ID | 423 |
Feature activation | -6.95e+00 |
Pos logit contributions | |
disparate | +8.860 |
newer | +8.612 |
blatant | +8.576 |
relentless | +8.531 |
genuine | +8.519 |
Neg logit contributions | |
u | -5.103 |
aga | -4.746 |
ire | -4.615 |
ong | -4.593 |
- | -4.571 |
Token | never |
Token ID | 1239 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
disparate | +21.862 |
newer | +21.323 |
genuine | +21.275 |
various | +21.232 |
relentless | +21.142 |
Neg logit contributions | |
u | -12.249 |
ire | -11.622 |
aga | -11.434 |
ine | -11.224 |
ong | -11.183 |
Token | supported |
Token ID | 4855 |
Feature activation | -6.79e+00 |
Pos logit contributions | |
disparate | +12.113 |
newer | +11.774 |
genuine | +11.646 |
relentless | +11.627 |
various | +11.593 |
Neg logit contributions | |
u | -10.492 |
aga | -9.970 |
ire | -9.900 |
ine | -9.690 |
ong | -9.684 |
Token | to |
Token ID | 284 |
Feature activation | -4.85e+00 |
Pos logit contributions | |
u | +2.189 |
- | +2.118 |
aga | +2.104 |
ire | +2.089 |
ine | +2.067 |
Neg logit contributions | |
disparate | -2.476 |
newer | -2.458 |
hindsight | -2.428 |
blatant | -2.398 |
venerable | -2.396 |
Token | withdraw |
Token ID | 8399 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
disparate | +14.222 |
newer | +13.848 |
genuine | +13.698 |
relentless | +13.675 |
blatant | +13.641 |
Neg logit contributions | |
u | -11.133 |
aga | -10.524 |
ire | -10.479 |
ine | -10.228 |
ong | -10.219 |
Token | before |
Token ID | 878 |
Feature activation | -7.45e+00 |
Pos logit contributions | |
disparate | +1.912 |
newer | +1.886 |
blatant | +1.860 |
genuine | +1.856 |
relentless | +1.846 |
Neg logit contributions | |
u | -0.838 |
- | -0.754 |
ire | -0.733 |
aga | -0.717 |
id | -0.717 |
Token | him |
Token ID | 683 |
Feature activation | -8.10e-01 |
Pos logit contributions | |
disparate | +24.256 |
newer | +23.804 |
various | +23.713 |
relentless | +23.671 |
genuine | +23.670 |
Neg logit contributions | |
u | -12.068 |
aga | -11.314 |
ire | -11.106 |
ong | -10.961 |
ab | -10.667 |
Token | , |
Token ID | 11 |
Feature activation | -8.00e+00 |
Pos logit contributions | |
disparate | +3.802 |
newer | +3.688 |
genuine | +3.681 |
blatant | +3.679 |
totality | +3.657 |
Neg logit contributions | |
u | -0.538 |
- | -0.437 |
ire | -0.406 |
id | -0.400 |
aga | -0.399 |
Token | and |
Token ID | 290 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
disparate | +23.660 |
various | +23.195 |
newer | +23.091 |
relentless | +23.077 |
genuine | +23.023 |
Neg logit contributions | |
u | -13.050 |
ire | -12.531 |
aga | -12.289 |
ong | -12.149 |
ine | -11.859 |
Token | made |
Token ID | 925 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
those | +34.413 |
many | +34.412 |
various | +34.188 |
disparate | +33.481 |
modern | +33.142 |
Neg logit contributions | |
u | -14.577 |
aga | -13.681 |
ong | -13.455 |
ire | -13.030 |
iev | -12.982 |
Token | his |
Token ID | 465 |
Feature activation | -4.84e+00 |
Pos logit contributions | |
disparate | +11.691 |
newer | +11.483 |
totality | +11.198 |
genuine | +11.127 |
blatant | +11.110 |
Neg logit contributions | |
u | -10.124 |
aga | -9.702 |
ire | -9.558 |
id | -9.450 |
ine | -9.395 |
Token | way |
Token ID | 835 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
disparate | +14.391 |
newer | +14.031 |
genuine | +13.828 |
blatant | +13.777 |
relentless | +13.770 |
Neg logit contributions | |
u | -11.190 |
ire | -10.547 |
aga | -10.532 |
ine | -10.297 |
ong | -10.190 |
Token | to |
Token ID | 284 |
Feature activation | -6.82e+00 |
Pos logit contributions | |
disparate | +0.705 |
totality | +0.685 |
newer | +0.676 |
blatant | +0.675 |
hindsight | +0.674 |
Neg logit contributions | |
u | -0.538 |
- | -0.520 |
ire | -0.502 |
ine | -0.488 |
ia | -0.487 |
Token | York |
Token ID | 1971 |
Feature activation | +4.29e+00 |
Pos logit contributions | |
disparate | +22.511 |
newer | +22.068 |
various | +21.985 |
genuine | +21.819 |
relentless | +21.713 |
Neg logit contributions | |
u | -11.410 |
aga | -10.747 |
ire | -10.512 |
ong | -10.331 |
ine | -10.205 |
Token | to |
Token ID | 284 |
Feature activation | -6.32e+00 |
Pos logit contributions | |
u | +1.043 |
- | +0.999 |
ong | +0.967 |
id | +0.942 |
aga | +0.940 |
Neg logit contributions | |
disparate | -1.768 |
relentless | -1.745 |
totality | -1.727 |
blatant | -1.706 |
genuine | -1.692 |
Token | track |
Token ID | 2610 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
disparate | +18.809 |
newer | +18.516 |
various | +18.395 |
modern | +18.310 |
genuine | +18.274 |
Neg logit contributions | |
u | -12.121 |
aga | -11.537 |
ire | -11.327 |
ong | -10.971 |
ab | -10.873 |
Token | bottleneck |
Token ID | 49936 |
Feature activation | +3.44e+00 |
Pos logit contributions | |
disparate | +10.878 |
newer | +10.564 |
relentless | +10.532 |
blatant | +10.458 |
genuine | +10.401 |
Neg logit contributions | |
u | -7.509 |
aga | -6.997 |
ire | -6.964 |
ine | -6.918 |
ong | -6.850 |
Token | bandwidth |
Token ID | 19484 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
- | +9.777 |
u | +9.183 |
ine | +8.949 |
id | +8.906 |
ab | +8.793 |
Neg logit contributions | |
disparate | -6.657 |
relentless | -6.348 |
blatant | -6.344 |
newer | -6.321 |
disgruntled | -6.286 |
Token | , |
Token ID | 11 |
Feature activation | -9.17e+00 |
Pos logit contributions | |
u | +2.614 |
- | +2.490 |
. | +2.450 |
ine | +2.329 |
ab | +2.314 |
Neg logit contributions | |
disparate | -4.653 |
relentless | -4.518 |
blatant | -4.450 |
genuine | -4.449 |
venerable | -4.427 |
Token | but |
Token ID | 475 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
disparate | +26.169 |
various | +25.870 |
genuine | +25.858 |
newer | +25.716 |
modern | +25.633 |
Neg logit contributions | |
u | -13.161 |
ire | -12.976 |
aga | -12.913 |
ée | -12.134 |
usk | -12.110 |
Token | a |
Token ID | 257 |
Feature activation | -9.02e+00 |
Pos logit contributions | |
those | +34.454 |
various | +34.248 |
many | +34.227 |
newer | +33.801 |
disparate | +33.656 |
Neg logit contributions | |
aga | -14.644 |
union | -13.766 |
u | -13.754 |
ée | -13.272 |
ire | -13.222 |
Token | good |
Token ID | 922 |
Feature activation | -2.97e+00 |
Pos logit contributions | |
disparate | +27.534 |
newer | +27.422 |
genuine | +27.162 |
modern | +27.023 |
relentless | +26.628 |
Neg logit contributions | |
aga | -11.443 |
u | -11.357 |
ire | -10.521 |
iev | -10.483 |
ong | -10.303 |
Token | estimate |
Token ID | 8636 |
Feature activation | +8.91e-01 |
Pos logit contributions | |
disparate | +10.172 |
newer | +9.895 |
relentless | +9.850 |
blatant | +9.840 |
genuine | +9.791 |
Neg logit contributions | |
u | -5.576 |
ire | -5.140 |
aga | -5.063 |
ine | -5.055 |
- | -5.005 |
Token | results |
Token ID | 2482 |
Feature activation | +4.97e-01 |
Pos logit contributions | |
u | +1.486 |
- | +1.417 |
id | +1.298 |
ab | +1.298 |
aga | +1.279 |
Neg logit contributions | |
disparate | -3.139 |
relentless | -3.054 |
blatant | -3.049 |
newer | -3.021 |
totality | -3.003 |
Token | from |
Token ID | 422 |
Feature activation | -8.16e+00 |
Pos logit contributions | |
u | +0.986 |
- | +0.980 |
ine | +0.926 |
. | +0.926 |
ab | +0.913 |
Neg logit contributions | |
disparate | -1.560 |
relentless | -1.552 |
blatant | -1.529 |
newer | -1.514 |
totality | -1.513 |
Token | five |
Token ID | 1936 |
Feature activation | -2.69e+00 |
Pos logit contributions | |
disparate | +22.507 |
newer | +21.984 |
genuine | +21.810 |
various | +21.792 |
relentless | +21.699 |
Neg logit contributions | |
u | -10.934 |
aga | -10.302 |
ire | -10.169 |
ong | -9.846 |
ine | -9.781 |
Token | kids |
Token ID | 3988 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
disparate | +12.152 |
newer | +11.976 |
relentless | +11.963 |
blatant | +11.913 |
totality | +11.890 |
Neg logit contributions | |
u | -2.228 |
- | -1.785 |
aga | -1.740 |
ire | -1.733 |
ine | -1.727 |
Token | on |
Token ID | 319 |
Feature activation | -4.15e+00 |
Pos logit contributions | |
disparate | +6.005 |
blatant | +5.935 |
newer | +5.877 |
relentless | +5.864 |
totality | +5.863 |
Neg logit contributions | |
u | -2.892 |
- | -2.658 |
aga | -2.574 |
ire | -2.562 |
ine | -2.558 |
Token | a |
Token ID | 257 |
Feature activation | -4.79e+00 |
Pos logit contributions | |
disparate | +16.452 |
newer | +16.139 |
blatant | +16.059 |
relentless | +16.026 |
genuine | +16.016 |
Neg logit contributions | |
u | -5.802 |
aga | -5.230 |
ire | -5.105 |
ine | -4.977 |
ong | -4.957 |
Token | ship |
Token ID | 4074 |
Feature activation | +9.31e-01 |
Pos logit contributions | |
disparate | +14.943 |
newer | +14.461 |
blatant | +14.332 |
genuine | +14.291 |
relentless | +14.240 |
Neg logit contributions | |
u | -10.789 |
aga | -10.089 |
ire | -9.966 |
ine | -9.855 |
ong | -9.776 |
Token | and |
Token ID | 290 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
u | +2.056 |
- | +2.031 |
. | +1.970 |
ine | +1.889 |
ab | +1.874 |
Neg logit contributions | |
blatant | -2.627 |
disparate | -2.624 |
stringent | -2.590 |
venerable | -2.572 |
newer | -2.562 |
Token | for |
Token ID | 329 |
Feature activation | -6.24e+00 |
Pos logit contributions | |
those | +33.366 |
various | +32.529 |
many | +32.240 |
everything | +31.874 |
disparate | +31.739 |
Neg logit contributions | |
u | -15.126 |
iev | -14.893 |
ire | -14.783 |
ong | -14.391 |
aga | -14.353 |
Token | some |
Token ID | 617 |
Feature activation | -2.32e+00 |
Pos logit contributions | |
disparate | +19.474 |
various | +19.061 |
newer | +19.025 |
genuine | +18.897 |
relentless | +18.778 |
Neg logit contributions | |
u | -11.595 |
aga | -10.877 |
ire | -10.846 |
ong | -10.598 |
ine | -10.524 |
Token | reason |
Token ID | 1738 |
Feature activation | -5.60e+00 |
Pos logit contributions | |
disparate | +5.572 |
newer | +5.283 |
relentless | +5.268 |
totality | +5.183 |
blatant | +5.177 |
Neg logit contributions | |
u | -6.874 |
ire | -6.623 |
aga | -6.593 |
- | -6.547 |
ine | -6.464 |
Token | they |
Token ID | 484 |
Feature activation | -5.96e+00 |
Pos logit contributions | |
disparate | +19.353 |
newer | +18.932 |
genuine | +18.781 |
various | +18.757 |
relentless | +18.727 |
Neg logit contributions | |
u | -9.260 |
aga | -8.630 |
ire | -8.514 |
ong | -8.272 |
ine | -8.250 |
Token | were |
Token ID | 547 |
Feature activation | -9.13e+00 |
Pos logit contributions | |
disparate | +17.692 |
newer | +17.225 |
various | +17.172 |
genuine | +17.123 |
relentless | +17.084 |
Neg logit contributions | |
u | -11.620 |
aga | -11.106 |
ire | -10.946 |
ong | -10.716 |
ine | -10.691 |
Token | go |
Token ID | 467 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
disparate | +12.945 |
newer | +12.574 |
genuine | +12.438 |
relentless | +12.428 |
blatant | +12.394 |
Neg logit contributions | |
u | -10.550 |
aga | -9.978 |
ire | -9.929 |
ine | -9.710 |
ong | -9.709 |
Token | in |
Token ID | 287 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
disparate | +3.193 |
blatant | +3.070 |
totality | +3.049 |
venerable | +3.024 |
relentless | +3.010 |
Neg logit contributions | |
u | -3.084 |
- | -2.924 |
ine | -2.860 |
ire | -2.843 |
ab | -2.831 |
Token | effect |
Token ID | 1245 |
Feature activation | -8.18e-01 |
Pos logit contributions | |
disparate | +4.789 |
blatant | +4.722 |
venerable | +4.675 |
relentless | +4.639 |
newer | +4.628 |
Neg logit contributions | |
u | -5.060 |
- | -4.966 |
ine | -4.680 |
ire | -4.667 |
ong | -4.618 |
Token | immediately |
Token ID | 3393 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
disparate | +2.528 |
blatant | +2.461 |
relentless | +2.433 |
newer | +2.426 |
tremendous | +2.400 |
Neg logit contributions | |
u | -1.867 |
- | -1.733 |
ire | -1.702 |
ab | -1.698 |
ine | -1.686 |
Token | , |
Token ID | 11 |
Feature activation | -8.97e+00 |
Pos logit contributions | |
disparate | +4.940 |
blatant | +4.867 |
relentless | +4.837 |
newer | +4.784 |
tremendous | +4.778 |
Neg logit contributions | |
u | -1.204 |
- | -1.011 |
ab | -1.000 |
ire | -0.973 |
id | -0.963 |
Token | and |
Token ID | 290 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
disparate | +25.816 |
newer | +25.450 |
various | +25.405 |
genuine | +25.396 |
modern | +25.355 |
Neg logit contributions | |
u | -13.578 |
aga | -13.531 |
ire | -12.917 |
ong | -12.599 |
ine | -12.384 |
Token | proposals |
Token ID | 11628 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
those | +35.191 |
various | +34.676 |
many | +34.655 |
modern | +34.603 |
genuine | +34.529 |
Neg logit contributions | |
aga | -14.257 |
u | -13.721 |
ée | -13.146 |
union | -12.942 |
� | -12.903 |
Token | for |
Token ID | 329 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
disparate | +7.363 |
newer | +7.183 |
totality | +7.103 |
blatant | +7.081 |
genuine | +7.063 |
Neg logit contributions | |
u | -4.908 |
- | -4.521 |
ire | -4.518 |
aga | -4.502 |
ong | -4.493 |
Token | water |
Token ID | 1660 |
Feature activation | +8.07e-01 |
Pos logit contributions | |
various | +30.319 |
newer | +30.163 |
disparate | +30.090 |
modern | +30.007 |
genuine | +29.943 |
Neg logit contributions | |
u | -13.380 |
aga | -12.916 |
iev | -12.642 |
ire | -12.411 |
ée | -12.330 |
Token | transfer |
Token ID | 4351 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
- | +2.653 |
u | +2.587 |
id | +2.484 |
ine | +2.477 |
ab | +2.444 |
Neg logit contributions | |
disparate | -1.520 |
newer | -1.472 |
blatant | -1.470 |
relentless | -1.463 |
venerable | -1.436 |
Token | - |
Token ID | 532 |
Feature activation | -7.80e+00 |
Pos logit contributions | |
disparate | +0.783 |
relentless | +0.759 |
blatant | +0.755 |
newer | +0.754 |
venerable | +0.752 |
Neg logit contributions | |
u | -0.668 |
- | -0.627 |
ine | -0.619 |
ire | -0.617 |
ab | -0.613 |
Token | and |
Token ID | 290 |
Feature activation | -9.26e+00 |
Pos logit contributions | |
u | +15.445 |
ul | +13.960 |
- | +13.940 |
id | +13.542 |
ab | +13.298 |
Neg logit contributions | |
blatant | -10.881 |
disparate | -10.879 |
newer | -10.559 |
proactive | -10.542 |
relentless | -10.529 |
Token | so |
Token ID | 523 |
Feature activation | +4.04e+00 |
Pos logit contributions | |
various | +29.273 |
disparate | +29.042 |
newer | +28.857 |
those | +28.704 |
many | +28.563 |
Neg logit contributions | |
ire | -10.005 |
u | -9.980 |
aga | -9.876 |
iev | -9.455 |
ée | -9.423 |
Token | on |
Token ID | 319 |
Feature activation | +7.79e-01 |
Pos logit contributions | |
u | +9.344 |
- | +9.278 |
ong | +8.657 |
ire | +8.488 |
ab | +8.457 |
Neg logit contributions | |
disparate | -9.388 |
totality | -9.083 |
hindsight | -9.036 |
proactive | -8.924 |
newer | -8.887 |
Token | ). |
Token ID | 737 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
u | +0.777 |
- | +0.663 |
ong | +0.603 |
ab | +0.596 |
aga | +0.589 |
Neg logit contributions | |
disparate | -3.292 |
relentless | -3.239 |
blatant | -3.216 |
proactive | -3.208 |
totality | -3.188 |
Token | However |
Token ID | 2102 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
modern | +27.982 |
various | +27.979 |
those | +27.642 |
newer | +27.610 |
many | +27.474 |
Neg logit contributions | |
aga | -13.673 |
ire | -13.279 |
ée | -13.044 |
iev | -12.823 |
u | -12.704 |
Token | , |
Token ID | 11 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
u | +0.849 |
aga | +0.741 |
ire | +0.732 |
- | +0.722 |
ong | +0.717 |
Neg logit contributions | |
disparate | -2.257 |
relentless | -2.217 |
totality | -2.178 |
newer | -2.177 |
proactive | -2.173 |
Token | names |
Token ID | 3891 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
modern | +34.726 |
many | +34.689 |
various | +34.610 |
newer | +34.368 |
those | +34.306 |
Neg logit contributions | |
ée | -15.135 |
aga | -14.015 |
u | -13.849 |
ire | -13.777 |
union | -13.577 |
Token | of |
Token ID | 286 |
Feature activation | -8.61e+00 |
Pos logit contributions | |
disparate | +3.962 |
relentless | +3.914 |
totality | +3.863 |
blatant | +3.793 |
newer | +3.775 |
Neg logit contributions | |
u | -3.336 |
- | -3.093 |
ong | -3.053 |
ab | -3.025 |
aga | -3.007 |
Token | other |
Token ID | 584 |
Feature activation | -5.96e+00 |
Pos logit contributions | |
disparate | +27.592 |
various | +27.201 |
newer | +27.043 |
genuine | +26.953 |
modern | +26.679 |
Neg logit contributions | |
u | -12.451 |
aga | -11.979 |
ire | -11.785 |
ée | -11.493 |
ong | -11.409 |
Token | foreign |
Token ID | 3215 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
disparate | +19.633 |
newer | +19.130 |
genuine | +18.991 |
various | +18.976 |
blatant | +18.848 |
Neg logit contributions | |
u | -10.721 |
aga | -10.049 |
ire | -9.954 |
ine | -9.684 |
ong | -9.655 |
Token | origin |
Token ID | 8159 |
Feature activation | -5.70e-01 |
Pos logit contributions | |
- | +0.865 |
u | +0.860 |
aga | +0.829 |
ia | +0.829 |
id | +0.829 |
Neg logit contributions | |
relentless | -0.531 |
newer | -0.518 |
disparate | -0.511 |
blatant | -0.505 |
proactive | -0.501 |
Token | end |
Token ID | 886 |
Feature activation | +4.77e+00 |
Pos logit contributions | |
disparate | +18.831 |
newer | +18.386 |
genuine | +18.245 |
relentless | +18.230 |
various | +18.181 |
Neg logit contributions | |
u | -12.339 |
aga | -11.703 |
ire | -11.544 |
ong | -11.252 |
ine | -11.249 |
Token | . |
Token ID | 13 |
Feature activation | -7.79e+00 |
Pos logit contributions | |
u | +11.061 |
- | +10.996 |
. | +10.898 |
ine | +10.082 |
id | +10.034 |
Neg logit contributions | |
disparate | -10.466 |
blatant | -10.078 |
newer | -10.065 |
proactive | -9.980 |
tremendous | -9.933 |
Token |
|
Token ID | 198 |
Feature activation | +7.37e+00 |
Pos logit contributions | |
disparate | +21.198 |
newer | +21.165 |
modern | +21.158 |
various | +21.040 |
genuine | +20.935 |
Neg logit contributions | |
aga | -13.788 |
u | -13.701 |
ire | -13.342 |
ong | -13.034 |
iev | -12.879 |
Token |
|
Token ID | 198 |
Feature activation | -7.32e+00 |
Pos logit contributions | |
- | +10.558 |
u | +9.900 |
. | +9.639 |
id | +8.555 |
ine | +8.453 |
Neg logit contributions | |
tremend | -29.702 |
undermin | -26.938 |
mathemat | -26.911 |
hemor | -26.243 |
cumbers | -25.819 |
Token | However |
Token ID | 4864 |
Feature activation | -5.27e-01 |
Pos logit contributions | |
those | +19.300 |
modern | +19.233 |
genuine | +19.188 |
disparate | +19.181 |
newer | +19.174 |
Neg logit contributions | |
aga | -11.839 |
ire | -11.003 |
u | -10.882 |
iev | -10.782 |
ong | -10.782 |
Token | , |
Token ID | 11 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
disparate | +2.112 |
totality | +2.076 |
newer | +2.069 |
relentless | +2.041 |
tremendous | +2.034 |
Neg logit contributions | |
u | -0.624 |
- | -0.546 |
ine | -0.535 |
ire | -0.530 |
aga | -0.503 |
Token | it |
Token ID | 340 |
Feature activation | -4.48e+00 |
Pos logit contributions | |
those | +34.065 |
modern | +33.807 |
many | +33.730 |
various | +33.452 |
newer | +33.224 |
Neg logit contributions | |
aga | -15.711 |
u | -15.036 |
ire | -15.034 |
iev | -14.879 |
ong | -14.643 |
Token | is |
Token ID | 318 |
Feature activation | -7.32e+00 |
Pos logit contributions | |
disparate | +16.097 |
newer | +15.725 |
genuine | +15.590 |
relentless | +15.576 |
blatant | +15.548 |
Neg logit contributions | |
u | -7.372 |
aga | -6.781 |
ire | -6.713 |
ine | -6.529 |
ong | -6.528 |
Token | utter |
Token ID | 10517 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
disparate | +22.980 |
newer | +22.629 |
genuine | +22.582 |
various | +22.467 |
relentless | +22.406 |
Neg logit contributions | |
u | -12.406 |
aga | -11.899 |
ire | -11.738 |
ong | -11.338 |
ine | -11.069 |
Token | nonsense |
Token ID | 18149 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
u | +5.817 |
- | +5.685 |
ab | +5.558 |
ine | +5.453 |
ong | +5.424 |
Neg logit contributions | |
disparate | -3.356 |
newer | -3.204 |
stricter | -3.167 |
proactive | -3.092 |
stringent | -3.071 |
Token | to |
Token ID | 284 |
Feature activation | -5.03e+00 |
Pos logit contributions | |
u | +0.405 |
- | +0.379 |
. | +0.374 |
ong | +0.364 |
ine | +0.358 |
Neg logit contributions | |
disparate | -0.824 |
totality | -0.805 |
newer | -0.801 |
relentless | -0.799 |
blatant | -0.797 |
Token | teammates |
Token ID | 13107 |
Feature activation | +6.93e-01 |
Pos logit contributions | |
disparate | +23.208 |
relentless | +22.811 |
newer | +22.777 |
various | +22.738 |
genuine | +22.593 |
Neg logit contributions | |
u | -11.250 |
aga | -10.470 |
ire | -10.319 |
ine | -9.908 |
ong | -9.868 |
Token | . |
Token ID | 13 |
Feature activation | -6.10e+00 |
Pos logit contributions | |
u | +1.224 |
- | +1.207 |
. | +1.185 |
ong | +1.173 |
id | +1.117 |
Neg logit contributions | |
disparate | -2.358 |
blatant | -2.246 |
totality | -2.236 |
newer | -2.236 |
venerable | -2.212 |
Token |
|
Token ID | 198 |
Feature activation | +3.94e+00 |
Pos logit contributions | |
disparate | +16.674 |
newer | +16.566 |
various | +16.488 |
genuine | +16.372 |
modern | +16.211 |
Neg logit contributions | |
u | -12.671 |
aga | -12.325 |
ire | -12.068 |
ong | -11.831 |
ine | -11.687 |
Token |
|
Token ID | 198 |
Feature activation | -6.27e+00 |
Pos logit contributions | |
- | +4.705 |
u | +4.580 |
. | +4.025 |
ine | +3.868 |
id | +3.735 |
Neg logit contributions | |
tremend | -18.053 |
mathemat | -16.935 |
undermin | -16.813 |
hemor | -16.427 |
behavi | -16.272 |
Token | However |
Token ID | 4864 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
those | +18.312 |
genuine | +18.241 |
disparate | +18.166 |
newer | +18.152 |
blatant | +18.148 |
Neg logit contributions | |
aga | -9.298 |
u | -8.997 |
ong | -8.704 |
ire | -8.668 |
ée | -8.663 |
Token | , |
Token ID | 11 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
disparate | +11.822 |
newer | +11.539 |
relentless | +11.466 |
genuine | +11.383 |
blatant | +11.365 |
Neg logit contributions | |
u | -3.627 |
ire | -3.187 |
aga | -3.136 |
ine | -3.041 |
- | -2.989 |
Token | life |
Token ID | 1204 |
Feature activation | -4.25e-01 |
Pos logit contributions | |
those | +33.920 |
various | +33.418 |
many | +33.192 |
newer | +32.270 |
genuine | +32.258 |
Neg logit contributions | |
aga | -14.994 |
ée | -14.823 |
u | -14.593 |
ong | -14.461 |
ield | -14.413 |
Token | comes |
Token ID | 2058 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
disparate | +1.322 |
blatant | +1.259 |
genuine | +1.246 |
totality | +1.244 |
newer | +1.240 |
Neg logit contributions | |
u | -0.962 |
- | -0.930 |
aga | -0.855 |
ab | -0.855 |
ine | -0.847 |
Token | at |
Token ID | 379 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
disparate | +3.020 |
blatant | +2.977 |
totality | +2.946 |
venerable | +2.940 |
genuine | +2.914 |
Neg logit contributions | |
u | -2.665 |
- | -2.425 |
ong | -2.336 |
aga | -2.320 |
ire | -2.297 |
Token | you |
Token ID | 345 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
disparate | +1.122 |
newer | +1.068 |
genuine | +1.037 |
blatant | +1.014 |
relentless | +0.994 |
Neg logit contributions | |
u | -3.143 |
- | -3.123 |
aga | -3.059 |
ine | -3.052 |
ia | -3.035 |
Token | fast |
Token ID | 3049 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
disparate | +4.437 |
blatant | +4.303 |
newer | +4.298 |
totality | +4.282 |
genuine | +4.275 |
Neg logit contributions | |
u | -2.128 |
ire | -1.940 |
- | -1.927 |
ine | -1.892 |
aga | -1.886 |
Token | . |
Token ID | 13 |
Feature activation | -8.86e+00 |
Pos logit contributions | |
- | +15.099 |
u | +15.042 |
. | +14.421 |
ia | +14.382 |
aga | +14.215 |
Neg logit contributions | |
disparate | -11.775 |
newer | -10.605 |
totality | -10.601 |
blatant | -10.571 |
gradual | -10.484 |
Token | � |
Token ID | 447 |
Feature activation | +7.47e+00 |
Pos logit contributions | |
those | +22.527 |
various | +22.356 |
modern | +22.333 |
newer | +22.250 |
disparate | +22.013 |
Neg logit contributions | |
aga | -14.146 |
u | -14.077 |
iev | -13.781 |
ire | -13.743 |
ong | -13.348 |
Token | � |
Token ID | 251 |
Feature activation | -6.29e+00 |
Pos logit contributions | |
� | +12.770 |
u | +11.576 |
� | +11.545 |
� | +11.511 |
� | +11.310 |
Neg logit contributions | |
disparate | -18.174 |
blatant | -17.337 |
relentless | -16.882 |
newer | -16.821 |
drastic | -16.771 |
Token |
|
Token ID | 198 |
Feature activation | +5.09e+00 |
Pos logit contributions | |
disparate | +18.649 |
newer | +18.567 |
various | +18.450 |
genuine | +18.317 |
modern | +18.299 |
Neg logit contributions | |
u | -10.646 |
aga | -10.294 |
ire | -10.104 |
ong | -9.854 |
iev | -9.746 |
Token |
|
Token ID | 198 |
Feature activation | -6.86e+00 |
Pos logit contributions | |
- | +5.879 |
u | +5.679 |
. | +5.110 |
ine | +4.682 |
id | +4.598 |
Neg logit contributions | |
tremend | -23.139 |
mathemat | -21.540 |
undermin | -21.382 |
hemor | -20.863 |
behavi | -20.599 |
Token | But |
Token ID | 1537 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
disparate | +19.133 |
those | +19.106 |
newer | +19.036 |
genuine | +19.010 |
modern | +18.944 |
Neg logit contributions | |
aga | -10.460 |
u | -10.188 |
ire | -9.908 |
iev | -9.820 |
ong | -9.716 |
Token | this |
Token ID | 428 |
Feature activation | -6.71e+00 |
Pos logit contributions | |
those | +34.643 |
many | +33.954 |
various | +33.432 |
modern | +33.325 |
newer | +33.170 |
Neg logit contributions | |
u | -13.643 |
iev | -13.399 |
ire | -13.198 |
aga | -13.100 |
illo | -12.853 |
Token | year |
Token ID | 614 |
Feature activation | -9.05e-01 |
Pos logit contributions | |
disparate | +22.636 |
newer | +22.153 |
relentless | +22.010 |
blatant | +21.926 |
genuine | +21.850 |
Neg logit contributions | |
u | -10.670 |
aga | -9.912 |
ire | -9.843 |
ong | -9.501 |
ine | -9.454 |
Token | looks |
Token ID | 3073 |
Feature activation | +6.82e-01 |
Pos logit contributions | |
disparate | +3.701 |
blatant | +3.593 |
newer | +3.583 |
relentless | +3.581 |
genuine | +3.573 |
Neg logit contributions | |
u | -1.079 |
- | -1.023 |
ia | -0.950 |
id | -0.949 |
ine | -0.940 |
Token | different |
Token ID | 1180 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
- | +2.270 |
u | +2.258 |
ire | +2.166 |
id | +2.161 |
ia | +2.150 |
Neg logit contributions | |
totality | -1.078 |
academics | -1.061 |
DRAG | -1.057 |
disparate | -1.041 |
hindsight | -1.036 |
Token | . |
Token ID | 13 |
Feature activation | -9.97e+00 |
Pos logit contributions | |
u | +1.888 |
. | +1.787 |
- | +1.764 |
ab | +1.608 |
id | +1.601 |
Neg logit contributions | |
disparate | -5.107 |
blatant | -4.999 |
newer | -4.970 |
relentless | -4.899 |
genuine | -4.888 |
Token | area |
Token ID | 1989 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
- | +15.238 |
. | +15.027 |
u | +14.330 |
id | +14.293 |
ab | +13.776 |
Neg logit contributions | |
meticulous | -10.624 |
venerable | -10.485 |
disparate | -10.330 |
proactive | -10.259 |
totality | -10.120 |
Token | . |
Token ID | 13 |
Feature activation | -8.38e+00 |
Pos logit contributions | |
- | +4.572 |
. | +4.570 |
u | +4.421 |
id | +4.270 |
ia | +4.244 |
Neg logit contributions | |
disparate | -4.021 |
meticulous | -3.942 |
newer | -3.919 |
blatant | -3.909 |
venerable | -3.909 |
Token |
|
Token ID | 198 |
Feature activation | +5.55e+00 |
Pos logit contributions | |
various | +22.196 |
those | +22.039 |
newer | +21.940 |
disparate | +21.887 |
genuine | +21.809 |
Neg logit contributions | |
aga | -14.012 |
u | -13.653 |
ire | -13.172 |
ong | -13.126 |
iev | -13.011 |
Token |
|
Token ID | 198 |
Feature activation | -7.06e+00 |
Pos logit contributions | |
- | +6.636 |
u | +6.213 |
. | +5.811 |
ine | +5.253 |
id | +5.111 |
Neg logit contributions | |
tremend | -25.254 |
mathemat | -23.294 |
undermin | -23.208 |
hemor | -22.735 |
cumbers | -22.159 |
Token | However |
Token ID | 4864 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
those | +18.530 |
genuine | +18.457 |
disparate | +18.351 |
various | +18.218 |
newer | +18.172 |
Neg logit contributions | |
aga | -11.423 |
u | -10.622 |
ong | -10.603 |
iev | -10.574 |
ée | -10.544 |
Token | , |
Token ID | 11 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
disparate | +14.233 |
newer | +13.924 |
relentless | +13.845 |
blatant | +13.790 |
genuine | +13.694 |
Neg logit contributions | |
u | -4.507 |
ire | -3.953 |
aga | -3.933 |
ine | -3.831 |
- | -3.729 |
Token | to |
Token ID | 284 |
Feature activation | -7.71e+00 |
Pos logit contributions | |
those | +33.877 |
many | +33.604 |
various | +33.518 |
genuine | +32.915 |
modern | +32.600 |
Neg logit contributions | |
aga | -15.235 |
ong | -14.985 |
u | -14.938 |
ée | -14.791 |
iev | -14.644 |
Token | make |
Token ID | 787 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
various | +23.695 |
those | +23.687 |
genuine | +23.593 |
modern | +23.460 |
disparate | +23.458 |
Neg logit contributions | |
u | -11.096 |
aga | -10.850 |
ine | -10.543 |
ire | -10.517 |
ée | -10.431 |
Token | all |
Token ID | 477 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
disparate | +8.323 |
newer | +7.963 |
relentless | +7.894 |
blatant | +7.847 |
venerable | +7.705 |
Neg logit contributions | |
u | -9.987 |
aga | -9.467 |
ire | -9.463 |
- | -9.359 |
id | -9.246 |
Token | this |
Token ID | 428 |
Feature activation | -3.93e+00 |
Pos logit contributions | |
disparate | +10.778 |
newer | +10.505 |
relentless | +10.433 |
blatant | +10.357 |
genuine | +10.319 |
Neg logit contributions | |
u | -7.490 |
ire | -6.941 |
aga | -6.929 |
ine | -6.764 |
ong | -6.761 |
Token | happen |
Token ID | 1645 |
Feature activation | -2.13e-01 |
Pos logit contributions | |
disparate | +12.217 |
newer | +11.910 |
relentless | +11.797 |
blatant | +11.715 |
genuine | +11.692 |
Neg logit contributions | |
u | -8.640 |
ire | -8.100 |
aga | -8.020 |
ong | -7.845 |
ine | -7.832 |
Token | Nor |
Token ID | 5414 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
various | +23.963 |
those | +23.822 |
newer | +23.769 |
modern | +23.522 |
genuine | +23.446 |
Neg logit contributions | |
aga | -14.243 |
u | -14.081 |
ire | -14.001 |
iev | -13.715 |
ong | -13.594 |
Token | the |
Token ID | 262 |
Feature activation | -8.79e+00 |
Pos logit contributions | |
disparate | +5.217 |
relentless | +4.954 |
newer | +4.909 |
totality | +4.879 |
blatant | +4.862 |
Neg logit contributions | |
u | -4.836 |
aga | -4.471 |
ire | -4.461 |
id | -4.449 |
ong | -4.433 |
Token | FG |
Token ID | 25503 |
Feature activation | +4.12e+00 |
Pos logit contributions | |
various | +27.074 |
disparate | +27.071 |
newer | +26.922 |
genuine | +26.714 |
modern | +26.528 |
Neg logit contributions | |
u | -12.988 |
aga | -12.359 |
ire | -12.096 |
ong | -11.971 |
iev | -11.566 |
Token | . |
Token ID | 13 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
u | +9.932 |
- | +9.739 |
. | +9.732 |
id | +9.171 |
ire | +9.017 |
Neg logit contributions | |
disparate | -9.735 |
relentless | -9.097 |
proactive | -8.901 |
blatant | -8.889 |
hindsight | -8.887 |
Token | However |
Token ID | 2102 |
Feature activation | -4.66e+00 |
Pos logit contributions | |
various | +25.012 |
newer | +24.966 |
those | +24.955 |
modern | +24.519 |
genuine | +24.409 |
Neg logit contributions | |
aga | -15.021 |
u | -14.677 |
iev | -14.574 |
ire | -14.515 |
ong | -14.504 |
Token | , |
Token ID | 11 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
disparate | +18.384 |
newer | +17.979 |
relentless | +17.865 |
genuine | +17.836 |
blatant | +17.810 |
Neg logit contributions | |
u | -6.113 |
aga | -5.515 |
ire | -5.463 |
ine | -5.230 |
ong | -5.208 |
Token | if |
Token ID | 611 |
Feature activation | -7.81e+00 |
Pos logit contributions | |
those | +33.121 |
various | +32.971 |
many | +32.517 |
newer | +32.419 |
modern | +31.925 |
Neg logit contributions | |
u | -15.694 |
aga | -15.522 |
iev | -14.827 |
union | -14.769 |
ire | -14.511 |
Token | we |
Token ID | 356 |
Feature activation | -5.35e+00 |
Pos logit contributions | |
disparate | +24.119 |
newer | +23.977 |
various | +23.817 |
genuine | +23.760 |
those | +23.528 |
Neg logit contributions | |
u | -12.961 |
aga | -12.274 |
ire | -11.974 |
ong | -11.873 |
ine | -11.586 |
Token | assume |
Token ID | 7048 |
Feature activation | -5.58e+00 |
Pos logit contributions | |
disparate | +15.334 |
newer | +15.027 |
various | +14.855 |
genuine | +14.844 |
modern | +14.791 |
Neg logit contributions | |
u | -11.493 |
aga | -11.020 |
ire | -10.779 |
ong | -10.648 |
ine | -10.605 |
Token | the |
Token ID | 262 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
disparate | +18.541 |
newer | +18.104 |
genuine | +17.936 |
relentless | +17.919 |
blatant | +17.869 |
Neg logit contributions | |
u | -10.432 |
aga | -9.759 |
ire | -9.669 |
ine | -9.400 |
ong | -9.390 |
Token | hops |
Token ID | 29438 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
various | +29.834 |
newer | +29.828 |
genuine | +29.357 |
disparate | +29.329 |
modern | +29.201 |
Neg logit contributions | |
u | -13.303 |
aga | -13.293 |
ong | -12.698 |
iev | -12.698 |
ire | -12.360 |
Token | � |
Token ID | 447 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
u | +11.799 |
- | +10.990 |
ate | +10.934 |
ine | +10.664 |
ig | +10.570 |
Neg logit contributions | |
disparate | -11.730 |
totality | -11.074 |
hindsight | -10.856 |
newer | -10.758 |
relentless | -10.752 |
Token | � |
Token ID | 247 |
Feature activation | +4.44e+00 |
Pos logit contributions | |
� | +19.198 |
� | +18.767 |
� | +17.764 |
� | +17.763 |
u | +17.193 |
Neg logit contributions | |
mathemat | -23.850 |
disparate | -23.211 |
blatant | -22.949 |
totality | -22.091 |
stringent | -21.827 |
Token | t |
Token ID | 83 |
Feature activation | -2.96e+00 |
Pos logit contributions | |
u | +7.804 |
id | +6.630 |
ire | +6.437 |
- | +6.303 |
ate | +6.201 |
Neg logit contributions | |
disparate | -14.193 |
totality | -13.341 |
newer | -13.226 |
relentless | -13.153 |
blatant | -13.151 |
Token | . |
Token ID | 13 |
Feature activation | -8.42e+00 |
Pos logit contributions | |
disparate | +12.318 |
newer | +12.013 |
relentless | +11.964 |
genuine | +11.943 |
blatant | +11.873 |
Neg logit contributions | |
u | -3.414 |
ire | -3.049 |
aga | -3.013 |
ine | -2.904 |
ong | -2.861 |
Token | However |
Token ID | 2102 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
various | +23.250 |
those | +23.059 |
newer | +23.053 |
modern | +22.920 |
many | +22.898 |
Neg logit contributions | |
aga | -11.917 |
u | -11.744 |
ire | -11.357 |
ong | -11.137 |
iev | -10.907 |
Token | , |
Token ID | 11 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
u | +9.348 |
- | +8.922 |
ire | +8.785 |
ine | +8.709 |
aga | +8.687 |
Neg logit contributions | |
disparate | -8.185 |
newer | -7.745 |
relentless | -7.711 |
totality | -7.687 |
tremendous | -7.493 |
Token | when |
Token ID | 618 |
Feature activation | -7.38e+00 |
Pos logit contributions | |
those | +33.033 |
many | +33.026 |
various | +32.624 |
newer | +31.930 |
most | +31.901 |
Neg logit contributions | |
aga | -15.159 |
u | -14.871 |
ée | -14.200 |
ong | -13.940 |
ire | -13.795 |
Token | it |
Token ID | 340 |
Feature activation | -5.63e-01 |
Pos logit contributions | |
disparate | +23.580 |
newer | +23.075 |
various | +23.072 |
genuine | +22.927 |
blatant | +22.795 |
Neg logit contributions | |
u | -12.127 |
aga | -11.478 |
ire | -11.214 |
ong | -10.993 |
ée | -10.783 |
Token | becomes |
Token ID | 4329 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
disparate | +1.843 |
relentless | +1.760 |
blatant | +1.735 |
totality | +1.735 |
genuine | +1.723 |
Neg logit contributions | |
u | -1.233 |
- | -1.127 |
ire | -1.101 |
ab | -1.083 |
ong | -1.082 |
Token | � |
Token ID | 564 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
disparate | +12.594 |
newer | +12.215 |
relentless | +12.047 |
genuine | +12.003 |
various | +11.991 |
Neg logit contributions | |
u | -11.385 |
ire | -10.709 |
aga | -10.689 |
ine | -10.494 |
ong | -10.406 |
Token | � |
Token ID | 250 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
� | +17.841 |
� | +17.084 |
� | +17.050 |
ine | +16.798 |
� | +16.760 |
Neg logit contributions | |
disparate | -18.065 |
blatant | -17.477 |
newer | -17.103 |
relentless | -17.054 |
venerable | -16.962 |
Token | governments |
Token ID | 6905 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
disparate | +0.173 |
relentless | +0.168 |
blatant | +0.167 |
newer | +0.167 |
meticulous | +0.166 |
Neg logit contributions | |
u | -0.257 |
- | -0.255 |
id | -0.244 |
ia | -0.243 |
ong | -0.243 |
Token | . |
Token ID | 13 |
Feature activation | -8.49e+00 |
Pos logit contributions | |
. | +2.556 |
u | +2.453 |
- | +2.373 |
ong | +2.295 |
id | +2.131 |
Neg logit contributions | |
disparate | -7.026 |
totality | -6.882 |
newer | -6.867 |
gradual | -6.864 |
venerable | -6.858 |
Token |
|
Token ID | 198 |
Feature activation | +5.92e+00 |
Pos logit contributions | |
various | +23.638 |
disparate | +23.427 |
newer | +23.420 |
those | +23.389 |
modern | +23.363 |
Neg logit contributions | |
aga | -12.693 |
u | -11.989 |
ire | -11.977 |
ong | -11.465 |
ine | -11.303 |
Token |
|
Token ID | 198 |
Feature activation | -7.50e+00 |
Pos logit contributions | |
- | +7.277 |
u | +7.050 |
. | +6.588 |
ine | +5.961 |
id | +5.846 |
Neg logit contributions | |
tremend | -25.547 |
mathemat | -23.619 |
undermin | -23.331 |
hemor | -23.014 |
behavi | -22.383 |
Token | However |
Token ID | 4864 |
Feature activation | +3.19e+00 |
Pos logit contributions | |
disparate | +20.829 |
blatant | +20.748 |
genuine | +20.712 |
those | +20.628 |
various | +20.583 |
Neg logit contributions | |
aga | -11.304 |
ire | -10.472 |
u | -10.321 |
ong | -10.085 |
iev | -9.967 |
Token | , |
Token ID | 11 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
u | +6.468 |
- | +6.356 |
. | +5.866 |
ine | +5.720 |
ire | +5.702 |
Neg logit contributions | |
tremend | -8.393 |
mathemat | -8.243 |
disparate | -8.142 |
totality | -8.073 |
venerable | -7.945 |
Token | the |
Token ID | 262 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
those | +34.031 |
various | +33.861 |
many | +33.822 |
genuine | +33.090 |
newer | +33.021 |
Neg logit contributions | |
aga | -15.179 |
u | -14.327 |
ield | -14.298 |
ire | -14.022 |
ab | -13.485 |
Token | United |
Token ID | 1578 |
Feature activation | +8.53e+00 |
Pos logit contributions | |
genuine | +30.379 |
various | +30.344 |
newer | +30.316 |
disparate | +30.306 |
blatant | +29.888 |
Neg logit contributions | |
aga | -13.839 |
u | -13.408 |
ire | -12.924 |
ée | -12.766 |
iev | -12.742 |
Token | States |
Token ID | 1829 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
- | +16.621 |
u | +15.616 |
. | +15.418 |
ia | +15.188 |
ine | +14.904 |
Neg logit contributions | |
tremend | -20.437 |
mathemat | -19.316 |
hemor | -18.228 |
undermin | -17.731 |
misunder | -17.494 |
Token | � |
Token ID | 447 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
disparate | +5.317 |
newer | +5.140 |
relentless | +5.066 |
genuine | +5.052 |
blatant | +5.048 |
Neg logit contributions | |
u | -3.671 |
- | -3.404 |
aga | -3.339 |
ong | -3.320 |
ire | -3.316 |
Token | � |
Token ID | 247 |
Feature activation | +6.32e+00 |
Pos logit contributions | |
� | +21.757 |
� | +20.515 |
� | +19.833 |
� | +19.513 |
� | +19.153 |
Neg logit contributions | |
tremend | -29.824 |
mathemat | -28.706 |
misunder | -27.350 |
behavi | -25.955 |
disparate | -25.950 |
Token | off |
Token ID | 572 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
disparate | +1.277 |
blatant | +1.237 |
genuine | +1.234 |
newer | +1.231 |
totality | +1.220 |
Neg logit contributions | |
u | -0.992 |
- | -0.959 |
ine | -0.907 |
ire | -0.907 |
aga | -0.896 |
Token | winning |
Token ID | 5442 |
Feature activation | +1.14e-01 |
Pos logit contributions | |
disparate | +5.104 |
blatant | +4.861 |
newer | +4.859 |
relentless | +4.832 |
genuine | +4.810 |
Neg logit contributions | |
u | -3.075 |
- | -2.965 |
aga | -2.893 |
ire | -2.768 |
ine | -2.751 |
Token | a |
Token ID | 257 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
u | +0.427 |
- | +0.424 |
ine | +0.413 |
ire | +0.410 |
aga | +0.408 |
Neg logit contributions | |
disparate | -0.179 |
genuine | -0.157 |
newer | -0.156 |
relentless | -0.155 |
blatant | -0.154 |
Token | Stanley |
Token ID | 14167 |
Feature activation | +9.63e+00 |
Pos logit contributions | |
disparate | +8.023 |
newer | +7.620 |
relentless | +7.468 |
genuine | +7.451 |
academics | +7.407 |
Neg logit contributions | |
u | -9.760 |
ire | -9.406 |
aga | -9.266 |
ong | -9.240 |
ine | -9.233 |
Token | Cup |
Token ID | 5454 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
- | +18.159 |
. | +16.856 |
ab | +16.255 |
u | +16.203 |
id | +16.013 |
Neg logit contributions | |
tremend | -20.102 |
behavi | -18.696 |
totality | -18.390 |
disparate | -18.267 |
mathemat | -17.899 |
Token | and |
Token ID | 290 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
- | +4.188 |
u | +4.156 |
. | +4.103 |
ire | +3.958 |
ine | +3.944 |
Neg logit contributions | |
disparate | -4.214 |
blatant | -3.912 |
genuine | -3.896 |
relentless | -3.891 |
newer | -3.879 |
Token | obviously |
Token ID | 6189 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
many | +33.989 |
various | +33.985 |
those | +33.956 |
newer | +33.097 |
most | +32.839 |
Neg logit contributions | |
u | -14.058 |
ong | -13.619 |
aga | -13.534 |
ée | -13.266 |
ire | -13.161 |
Token | enjoying |
Token ID | 13226 |
Feature activation | -4.59e+00 |
Pos logit contributions | |
those | +29.965 |
various | +29.960 |
newer | +29.859 |
disparate | +29.811 |
many | +29.666 |
Neg logit contributions | |
u | -12.664 |
aga | -12.146 |
ée | -11.742 |
ong | -11.717 |
ire | -11.391 |
Token | the |
Token ID | 262 |
Feature activation | -6.96e+00 |
Pos logit contributions | |
disparate | +14.023 |
newer | +13.504 |
blatant | +13.400 |
genuine | +13.332 |
relentless | +13.315 |
Neg logit contributions | |
u | -10.632 |
aga | -10.014 |
ire | -9.934 |
ine | -9.779 |
ong | -9.713 |
Token | hard |
Token ID | 1327 |
Feature activation | +4.18e+00 |
Pos logit contributions | |
disparate | +22.277 |
newer | +21.907 |
various | +21.777 |
relentless | +21.755 |
genuine | +21.702 |
Neg logit contributions | |
u | -12.295 |
aga | -11.659 |
ire | -11.465 |
ong | -11.057 |
ine | -11.043 |
Token | work |
Token ID | 670 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
- | +12.661 |
u | +11.575 |
aga | +11.079 |
ong | +11.070 |
ia | +10.847 |
Neg logit contributions | |
disparate | -7.402 |
blatant | -6.996 |
venerable | -6.691 |
newer | -6.666 |
drastic | -6.592 |
Token | a |
Token ID | 257 |
Feature activation | -6.86e+00 |
Pos logit contributions | |
disparate | +26.698 |
newer | +26.563 |
various | +26.538 |
those | +26.501 |
relentless | +26.384 |
Neg logit contributions | |
u | -12.419 |
aga | -12.043 |
ong | -11.702 |
ire | -11.581 |
ée | -11.280 |
Token | corner |
Token ID | 5228 |
Feature activation | +5.96e+00 |
Pos logit contributions | |
disparate | +22.400 |
genuine | +22.066 |
newer | +22.054 |
relentless | +22.007 |
blatant | +21.911 |
Neg logit contributions | |
u | -10.640 |
aga | -10.281 |
ong | -9.849 |
ire | -9.818 |
ine | -9.509 |
Token | may |
Token ID | 743 |
Feature activation | -4.04e+00 |
Pos logit contributions | |
- | +16.056 |
u | +15.603 |
ab | +15.121 |
ine | +14.990 |
id | +14.931 |
Neg logit contributions | |
disparate | -9.505 |
venerable | -8.348 |
stringent | -8.256 |
totality | -8.211 |
blatant | -8.198 |
Token | think |
Token ID | 892 |
Feature activation | -2.62e+00 |
Pos logit contributions | |
disparate | +11.257 |
newer | +10.854 |
genuine | +10.734 |
relentless | +10.713 |
blatant | +10.707 |
Neg logit contributions | |
u | -10.329 |
ire | -9.737 |
aga | -9.718 |
ine | -9.543 |
ong | -9.506 |
Token | he |
Token ID | 339 |
Feature activation | -7.23e-02 |
Pos logit contributions | |
disparate | +7.510 |
newer | +7.262 |
genuine | +7.138 |
blatant | +7.100 |
relentless | +7.095 |
Neg logit contributions | |
u | -6.625 |
ire | -6.214 |
- | -6.157 |
aga | -6.156 |
ine | -6.130 |
Token | � |
Token ID | 447 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
disparate | +0.234 |
totality | +0.227 |
newer | +0.224 |
genuine | +0.222 |
venerable | +0.221 |
Neg logit contributions | |
u | -0.159 |
- | -0.143 |
id | -0.143 |
ab | -0.141 |
ine | -0.141 |
Token | � |
Token ID | 247 |
Feature activation | +8.47e+00 |
Pos logit contributions | |
� | +22.443 |
� | +19.339 |
� | +18.417 |
� | +18.300 |
� | +18.214 |
Neg logit contributions | |
tremend | -33.769 |
mathemat | -33.756 |
behavi | -31.865 |
misunder | -31.589 |
anwhile | -31.410 |
Token | s |
Token ID | 82 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
s | +15.594 |
u | +15.032 |
id | +14.639 |
ll | +14.205 |
- | +13.561 |
Neg logit contributions | |
disparate | -19.549 |
drastic | -18.570 |
blatant | -18.530 |
totality | -18.192 |
venerable | -18.101 |
Token | running |
Token ID | 2491 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
disparate | +9.772 |
newer | +9.378 |
genuine | +9.210 |
blatant | +9.202 |
various | +9.196 |
Neg logit contributions | |
u | -10.218 |
aga | -9.617 |
ire | -9.563 |
ine | -9.454 |
id | -9.378 |
Token | deep |
Token ID | 2769 |
Feature activation | +9.91e-01 |
Pos logit contributions | |
disparate | +0.410 |
venerable | +0.393 |
newer | +0.391 |
hindsight | +0.376 |
blatant | +0.370 |
Neg logit contributions | |
- | -0.674 |
u | -0.657 |
ine | -0.634 |
ire | -0.633 |
ab | -0.632 |
Token | , |
Token ID | 11 |
Feature activation | -9.49e+00 |
Pos logit contributions | |
- | +2.078 |
u | +2.035 |
ine | +1.918 |
ab | +1.892 |
ire | +1.881 |
Neg logit contributions | |
disparate | -3.016 |
newer | -2.905 |
venerable | -2.892 |
blatant | -2.851 |
stringent | -2.849 |
Token | the |
Token ID | 262 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
u | +4.209 |
- | +4.182 |
ia | +4.030 |
ire | +4.019 |
ine | +4.005 |
Neg logit contributions | |
disparate | -1.885 |
blatant | -1.761 |
relentless | -1.738 |
poorer | -1.732 |
disgruntled | -1.678 |
Token | The |
Token ID | 383 |
Feature activation | +8.52e+00 |
Pos logit contributions | |
disparate | +3.141 |
relentless | +2.991 |
blatant | +2.988 |
hindsight | +2.983 |
genuine | +2.934 |
Neg logit contributions | |
u | -3.514 |
- | -3.262 |
ine | -3.260 |
ire | -3.256 |
ia | -3.219 |
Token | Stan |
Token ID | 32140 |
Feature activation | +1.88e+01 |
Pos logit contributions | |
- | +16.842 |
u | +15.348 |
ine | +15.294 |
. | +15.062 |
aga | +14.955 |
Neg logit contributions | |
disparate | -14.594 |
totality | -13.798 |
proactive | -13.766 |
stringent | -13.598 |
whichever | -13.596 |
Token | ley |
Token ID | 1636 |
Feature activation | +9.16e+00 |
Pos logit contributions | |
ley | +25.197 |
ine | +22.933 |
- | +22.847 |
. | +21.768 |
u | +21.312 |
Neg logit contributions | |
tremend | -33.648 |
cumbers | -32.595 |
hemor | -31.920 |
metic | -31.653 |
undermin | -30.917 |
Token | Par |
Token ID | 10044 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
- | +18.582 |
. | +17.229 |
u | +16.650 |
_ | +16.242 |
ab | +16.212 |
Neg logit contributions | |
disparate | -15.292 |
stricter | -14.489 |
stringent | -14.241 |
relentless | -14.204 |
hindsight | -14.188 |
Token | ad |
Token ID | 324 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
ade | +23.980 |
ab | +23.507 |
ad | +23.414 |
id | +22.883 |
ag | +22.795 |
Neg logit contributions | |
tremend | -34.656 |
metic | -34.135 |
hemor | -32.837 |
cumbers | -32.575 |
behavi | -32.246 |
Token | ox |
Token ID | 1140 |
Feature activation | +6.68e+00 |
Pos logit contributions | |
ox | +23.697 |
ong | +23.036 |
u | +23.007 |
- | +22.292 |
ax | +22.273 |
Neg logit contributions | |
tremend | -31.612 |
hemor | -30.631 |
behavi | -29.707 |
cumbers | -29.293 |
reluct | -29.189 |
Token | . |
Token ID | 13 |
Feature activation | +5.89e+00 |
Pos logit contributions | |
. | +16.386 |
- | +16.240 |
u | +16.216 |
ire | +15.009 |
ia | +14.589 |
Neg logit contributions | |
disparate | -11.696 |
hindsight | -10.961 |
relentless | -10.850 |
totality | -10.665 |
blatant | -10.566 |
Token | rar |
Token ID | 20040 |
Feature activation | +6.38e+00 |
Pos logit contributions | |
u | +13.516 |
id | +12.491 |
ab | +12.376 |
- | +12.126 |
ag | +12.112 |
Neg logit contributions | |
disparate | -12.868 |
hindsight | -12.051 |
academics | -11.889 |
relentless | -11.753 |
totality | -11.739 |
Token | and |
Token ID | 290 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
. | +15.228 |
- | +15.225 |
u | +14.834 |
ine | +14.165 |
ab | +13.847 |
Neg logit contributions | |
disparate | -11.334 |
hindsight | -10.751 |
relentless | -10.735 |
stringent | -10.611 |
blatant | -10.483 |
Token | un |
Token ID | 555 |
Feature activation | +8.71e+00 |
Pos logit contributions | |
disparate | +7.403 |
relentless | +6.895 |
genuine | +6.850 |
blatant | +6.844 |
newer | +6.807 |
Neg logit contributions | |
u | -7.902 |
ire | -7.595 |
ine | -7.476 |
- | -7.411 |
aga | -7.337 |
Token | SR |
Token ID | 12562 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
u | +16.329 |
- | +14.743 |
b | +14.602 |
ire | +14.477 |
id | +14.371 |
Neg logit contributions | |
disparate | -16.654 |
relentless | -15.768 |
hindsight | -15.608 |
newer | -15.589 |
totality | -15.573 |
Token | . |
Token ID | 13 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
. | +30.291 |
u | +28.171 |
- | +27.743 |
ag | +25.631 |
_ | +25.628 |
Neg logit contributions | |
disparate | -18.752 |
proactive | -18.353 |
relentless | -18.294 |
spontaneous | -17.412 |
blatant | -17.388 |
Token | Width |
Token ID | 30916 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
u | +2.546 |
id | +2.133 |
- | +2.098 |
ine | +2.008 |
ab | +1.966 |
Neg logit contributions | |
disparate | -9.145 |
relentless | -8.872 |
totality | -8.839 |
hindsight | -8.793 |
proactive | -8.792 |
Token | ), |
Token ID | 828 |
Feature activation | +3.72e+00 |
Pos logit contributions | |
- | +22.633 |
u | +21.014 |
. | +20.613 |
+ | +19.920 |
/ | +19.152 |
Neg logit contributions | |
disparate | -16.339 |
relentless | -15.791 |
spontaneous | -15.404 |
proactive | -15.269 |
blatant | -15.179 |
Token | ($ |
Token ID | 16763 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
u | +8.332 |
- | +7.985 |
ire | +7.552 |
id | +7.543 |
ab | +7.431 |
Neg logit contributions | |
disparate | -9.798 |
totality | -9.289 |
relentless | -9.184 |
proactive | -9.106 |
academics | -9.069 |
Token | SR |
Token ID | 12562 |
Feature activation | +2.63e+01 |
Pos logit contributions | |
u | +19.480 |
- | +17.721 |
ire | +17.199 |
id | +17.196 |
b | +17.133 |
Neg logit contributions | |
disparate | -21.547 |
totality | -21.197 |
disgruntled | -20.590 |
newer | -20.585 |
venerable | -20.253 |
Token | . |
Token ID | 13 |
Feature activation | +6.06e+00 |
Pos logit contributions | |
. | +32.322 |
- | +27.876 |
u | +24.780 |
_ | +24.695 |
' | +22.692 |
Neg logit contributions | |
tremend | -54.232 |
metic | -48.051 |
mathemat | -46.794 |
eleph | -46.607 |
cumbers | -46.290 |
Token | Height |
Token ID | 23106 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
- | +4.820 |
u | +4.797 |
id | +4.178 |
ab | +4.132 |
ire | +3.623 |
Neg logit contributions | |
disparate | -22.783 |
proactive | -22.530 |
totality | -22.257 |
sporadic | -22.205 |
relentless | -22.029 |
Token | ))) |
Token ID | 22305 |
Feature activation | +3.99e+00 |
Pos logit contributions | |
- | +22.044 |
u | +21.459 |
. | +20.193 |
ire | +19.524 |
ine | +19.474 |
Neg logit contributions | |
disparate | -16.484 |
relentless | -16.435 |
proactive | -16.137 |
spontaneous | -16.014 |
blatant | -15.793 |
Token | ) |
Token ID | 1267 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
u | +9.191 |
- | +9.132 |
ire | +8.638 |
end | +8.605 |
id | +8.543 |
Neg logit contributions | |
disparate | -9.078 |
relentless | -8.768 |
stringent | -8.666 |
disgruntled | -8.605 |
academics | -8.563 |
Token | } |
Token ID | 1782 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
u | +4.621 |
- | +4.521 |
ire | +4.341 |
ine | +4.281 |
end | +4.212 |
Neg logit contributions | |
disparate | -5.533 |
relentless | -5.341 |
stringent | -5.264 |
academics | -5.242 |
blatant | -5.203 |
Token | s |
Token ID | 82 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
s | +23.742 |
u | +22.438 |
- | +20.132 |
id | +19.508 |
q | +19.282 |
Neg logit contributions | |
tremend | -39.749 |
metic | -38.518 |
hemor | -37.796 |
mathemat | -37.108 |
undermin | -36.959 |
Token | 180 |
Token ID | 11546 |
Feature activation | +7.12e+00 |
Pos logit contributions | |
disparate | +9.278 |
newer | +8.992 |
genuine | +8.890 |
relentless | +8.880 |
blatant | +8.847 |
Neg logit contributions | |
u | -9.354 |
aga | -8.917 |
ire | -8.862 |
ine | -8.687 |
ong | -8.680 |
Token | . |
Token ID | 13 |
Feature activation | +6.37e+00 |
Pos logit contributions | |
. | +16.161 |
- | +15.469 |
u | +15.144 |
ig | +14.045 |
ire | +13.729 |
Neg logit contributions | |
disparate | -13.588 |
relentless | -13.184 |
proactive | -13.177 |
blatant | -13.032 |
stringent | -12.559 |
Token | 7 |
Token ID | 22 |
Feature activation | +5.21e+00 |
Pos logit contributions | |
u | +10.177 |
- | +10.071 |
ab | +9.041 |
id | +8.833 |
. | +8.683 |
Neg logit contributions | |
disparate | -18.024 |
tremend | -17.901 |
totality | -17.514 |
undermin | -17.439 |
behavi | -17.431 |
Token | GT |
Token ID | 7963 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
u | +11.286 |
- | +11.142 |
ig | +10.335 |
. | +10.230 |
ire | +10.218 |
Neg logit contributions | |
disparate | -11.647 |
relentless | -11.469 |
proactive | -11.434 |
blatant | -11.314 |
academics | -11.129 |
Token | / |
Token ID | 14 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
/ | +25.224 |
- | +24.294 |
. | +22.385 |
u | +21.161 |
_ | +20.503 |
Neg logit contributions | |
tremend | -39.658 |
undermin | -35.511 |
metic | -35.263 |
mathemat | -35.225 |
reluct | -34.811 |
Token | s |
Token ID | 82 |
Feature activation | -4.72e+00 |
Pos logit contributions | |
s | +24.220 |
u | +22.960 |
- | +21.023 |
b | +20.019 |
q | +19.935 |
Neg logit contributions | |
tremend | -40.857 |
metic | -39.437 |
hemor | -38.740 |
mathemat | -37.840 |
undermin | -37.488 |
Token | 257 |
Token ID | 36100 |
Feature activation | +7.62e+00 |
Pos logit contributions | |
disparate | +13.714 |
newer | +13.400 |
various | +13.302 |
genuine | +13.226 |
relentless | +13.169 |
Neg logit contributions | |
u | -10.215 |
aga | -9.751 |
ire | -9.626 |
ong | -9.407 |
ine | -9.397 |
Token | . |
Token ID | 13 |
Feature activation | +5.65e+00 |
Pos logit contributions | |
. | +17.206 |
- | +16.360 |
u | +15.993 |
ig | +14.837 |
ire | +14.637 |
Neg logit contributions | |
proactive | -13.796 |
relentless | -13.792 |
disparate | -13.729 |
blatant | -13.447 |
stringent | -13.208 |
Token | 1 |
Token ID | 16 |
Feature activation | +3.55e+00 |
Pos logit contributions | |
u | +8.265 |
- | +7.890 |
ab | +7.314 |
id | +6.971 |
q | +6.914 |
Neg logit contributions | |
disparate | -17.631 |
totality | -17.171 |
relentless | -16.933 |
tremend | -16.912 |
proactive | -16.908 |
Token | GT |
Token ID | 7963 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
u | +8.890 |
- | +8.707 |
ig | +8.125 |
ire | +8.109 |
. | +8.077 |
Neg logit contributions | |
disparate | -7.953 |
relentless | -7.789 |
proactive | -7.739 |
blatant | -7.628 |
academics | -7.598 |
Token | HQ |
Token ID | 41275 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
u | +2.766 |
id | +2.395 |
ab | +2.206 |
ag | +2.129 |
ia | +2.113 |
Neg logit contributions | |
disparate | -9.816 |
totality | -9.723 |
relentless | -9.587 |
proactive | -9.570 |
hindsight | -9.542 |
Token | ) |
Token ID | 8 |
Feature activation | +6.02e+00 |
Pos logit contributions | |
- | +26.218 |
u | +25.793 |
. | +24.227 |
) | +23.942 |
ab | +23.397 |
Neg logit contributions | |
disparate | -17.446 |
proactive | -16.709 |
blatant | -16.596 |
stringent | -16.551 |
relentless | -16.521 |
Token | | |
Token ID | 930 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
u | +11.837 |
- | +10.631 |
id | +10.486 |
ire | +10.388 |
ine | +10.278 |
Neg logit contributions | |
disparate | -14.731 |
stringent | -13.908 |
blatant | -13.711 |
gradual | -13.663 |
totality | -13.547 |
Token | RSS |
Token ID | 25012 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
disparate | +3.192 |
totality | +2.992 |
relentless | +2.985 |
genuine | +2.976 |
blatant | +2.973 |
Neg logit contributions | |
u | -5.126 |
- | -4.761 |
ire | -4.740 |
id | -4.738 |
aga | -4.734 |
Token | ( |
Token ID | 357 |
Feature activation | +3.18e+00 |
Pos logit contributions | |
- | +25.258 |
u | +24.883 |
ine | +23.310 |
. | +23.284 |
id | +22.966 |
Neg logit contributions | |
stringent | -16.048 |
disparate | -16.008 |
totality | -15.669 |
meticulous | -15.617 |
relentless | -15.497 |
Token | SD |
Token ID | 10305 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
u | +2.976 |
id | +2.584 |
ia | +2.267 |
ag | +2.181 |
ab | +2.176 |
Neg logit contributions | |
disparate | -12.918 |
totality | -12.819 |
relentless | -12.775 |
proactive | -12.738 |
blatant | -12.713 |
Token | ) |
Token ID | 8 |
Feature activation | +2.87e+00 |
Pos logit contributions | |
- | +24.368 |
) | +22.959 |
u | +22.422 |
. | +22.193 |
+ | +20.610 |
Neg logit contributions | |
tremend | -35.017 |
mathemat | -31.418 |
undermin | -29.783 |
hemor | -29.690 |
metic | -29.494 |
Token |
|
Token ID | 198 |
Feature activation | +6.85e+00 |
Pos logit contributions | |
u | +5.994 |
ire | +5.277 |
- | +5.269 |
ong | +5.177 |
id | +5.172 |
Neg logit contributions | |
disparate | -8.430 |
stringent | -8.036 |
blatant | -7.904 |
gradual | -7.897 |
totality | -7.889 |
Token |
|
Token ID | 198 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
- | +9.444 |
u | +8.937 |
. | +8.597 |
ine | +7.498 |
id | +7.465 |
Neg logit contributions | |
tremend | -29.352 |
mathemat | -26.884 |
undermin | -26.656 |
hemor | -26.062 |
cumbers | -25.554 |
Token | This |
Token ID | 1212 |
Feature activation | -2.31e+00 |
Pos logit contributions | |
disparate | +5.495 |
newer | +5.323 |
totality | +5.282 |
genuine | +5.281 |
relentless | +5.276 |
Neg logit contributions | |
u | -2.542 |
ire | -2.226 |
ine | -2.194 |
ab | -2.174 |
id | -2.173 |
Token | week |
Token ID | 1285 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
disparate | +6.358 |
totality | +5.992 |
genuine | +5.965 |
newer | +5.957 |
relentless | +5.935 |
Neg logit contributions | |
u | -6.397 |
ire | -5.887 |
- | -5.871 |
ine | -5.855 |
ong | -5.840 |
Token | a |
Token ID | 257 |
Feature activation | -3.51e+00 |
Pos logit contributions | |
u | +31.496 |
- | +31.282 |
. | +29.934 |
ine | +29.847 |
id | +29.717 |
Neg logit contributions | |
disparate | -7.811 |
newer | -6.782 |
blatant | -6.738 |
relentless | -6.724 |
totality | -6.693 |
Token | scripted |
Token ID | 37341 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
disparate | +10.057 |
newer | +9.599 |
various | +9.593 |
relentless | +9.535 |
academics | +9.488 |
Neg logit contributions | |
u | -9.633 |
- | -8.961 |
ire | -8.911 |
ine | -8.849 |
id | -8.643 |
Token | TV |
Token ID | 3195 |
Feature activation | +2.34e+00 |
Pos logit contributions | |
disparate | +0.271 |
newer | +0.259 |
relentless | +0.254 |
blatant | +0.251 |
disgruntled | +0.251 |
Neg logit contributions | |
- | -0.365 |
u | -0.355 |
ine | -0.341 |
ong | -0.330 |
ire | -0.328 |
Token | show |
Token ID | 905 |
Feature activation | -7.29e-01 |
Pos logit contributions | |
- | +6.424 |
u | +6.106 |
ine | +5.826 |
. | +5.676 |
ab | +5.548 |
Neg logit contributions | |
disparate | -5.166 |
totality | -4.933 |
relentless | -4.818 |
stringent | -4.791 |
newer | -4.770 |
Token | with |
Token ID | 351 |
Feature activation | -6.43e+00 |
Pos logit contributions | |
disparate | +2.748 |
totality | +2.693 |
relentless | +2.693 |
newer | +2.679 |
blatant | +2.658 |
Neg logit contributions | |
u | -1.151 |
- | -1.077 |
ong | -1.021 |
. | -1.020 |
ire | -0.991 |
Token | Dr |
Token ID | 1583 |
Feature activation | +6.12e+00 |
Pos logit contributions | |
disparate | +24.151 |
newer | +23.655 |
relentless | +23.426 |
genuine | +23.422 |
blatant | +23.360 |
Neg logit contributions | |
u | -9.711 |
aga | -8.874 |
ire | -8.797 |
ine | -8.507 |
ong | -8.465 |
Token | . |
Token ID | 13 |
Feature activation | +2.26e+00 |
Pos logit contributions | |
. | +14.007 |
ab | +13.077 |
aga | +13.030 |
u | +12.882 |
ine | +12.810 |
Neg logit contributions | |
disparate | -12.944 |
totality | -12.903 |
stringent | -12.833 |
proactive | -12.806 |
blatant | -12.376 |
Token | Dre |
Token ID | 30882 |
Feature activation | +2.58e+00 |
Pos logit contributions | |
u | +6.515 |
- | +6.083 |
ine | +6.046 |
ab | +6.017 |
ire | +5.994 |
Neg logit contributions | |
stringent | -4.692 |
disparate | -4.656 |
proactive | -4.575 |
blatant | -4.459 |
totality | -4.397 |
Token | that |
Token ID | 326 |
Feature activation | -8.14e+00 |
Pos logit contributions | |
u | +6.141 |
. | +5.909 |
- | +5.903 |
ong | +5.598 |
ab | +5.536 |
Neg logit contributions | |
disparate | -6.607 |
totality | -6.422 |
genuine | -6.321 |
stringent | -6.268 |
venerable | -6.209 |
Token | could |
Token ID | 714 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
disparate | +28.189 |
newer | +27.679 |
various | +27.589 |
genuine | +27.409 |
relentless | +27.376 |
Neg logit contributions | |
u | -10.909 |
aga | -10.415 |
ire | -10.131 |
ong | -9.787 |
ine | -9.737 |
Token | debut |
Token ID | 8886 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
disparate | +9.702 |
newer | +9.271 |
blatant | +9.239 |
relentless | +9.210 |
totality | +9.182 |
Neg logit contributions | |
u | -8.856 |
ire | -8.308 |
aga | -8.247 |
- | -8.177 |
ong | -8.172 |
Token | communication |
Token ID | 6946 |
Feature activation | +2.56e+00 |
Pos logit contributions | |
- | +0.594 |
u | +0.593 |
ab | +0.570 |
ia | +0.557 |
id | +0.555 |
Neg logit contributions | |
disparate | -0.410 |
genuine | -0.387 |
newer | -0.384 |
relentless | -0.384 |
totality | -0.381 |
Token | to |
Token ID | 284 |
Feature activation | -5.98e+00 |
Pos logit contributions | |
- | +7.143 |
u | +6.738 |
ia | +6.653 |
. | +6.572 |
ag | +6.452 |
Neg logit contributions | |
disparate | -5.431 |
totality | -5.109 |
relentless | -5.093 |
tremendous | -5.072 |
newer | -5.060 |
Token | the |
Token ID | 262 |
Feature activation | -4.91e+00 |
Pos logit contributions | |
disparate | +19.857 |
newer | +19.410 |
various | +19.236 |
genuine | +19.217 |
relentless | +19.176 |
Neg logit contributions | |
u | -10.736 |
aga | -10.135 |
ire | -9.957 |
ine | -9.706 |
ong | -9.698 |
Token | U |
Token ID | 471 |
Feature activation | +9.60e+00 |
Pos logit contributions | |
disparate | +13.205 |
newer | +12.837 |
genuine | +12.714 |
relentless | +12.698 |
blatant | +12.663 |
Neg logit contributions | |
u | -12.601 |
ire | -11.907 |
aga | -11.871 |
ine | -11.644 |
ong | -11.599 |
Token | . |
Token ID | 13 |
Feature activation | +6.86e+00 |
Pos logit contributions | |
. | +17.669 |
- | +16.106 |
u | +15.802 |
ire | +14.236 |
ine | +14.212 |
Neg logit contributions | |
tremend | -27.739 |
mathemat | -25.695 |
undermin | -25.002 |
hemor | -24.811 |
cumbers | -24.095 |
Token | S |
Token ID | 50 |
Feature activation | +6.80e+00 |
Pos logit contributions | |
u | +11.226 |
ire | +10.715 |
ong | +10.279 |
- | +10.055 |
ine | +9.679 |
Neg logit contributions | |
disparate | -17.921 |
totality | -17.537 |
sheer | -17.180 |
meticulous | -17.153 |
blatant | -16.839 |
Token | . |
Token ID | 13 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
. | +14.918 |
u | +14.698 |
- | +14.119 |
ire | +13.704 |
ong | +13.497 |
Neg logit contributions | |
disparate | -14.606 |
hindsight | -14.092 |
genuine | -14.022 |
totality | -13.961 |
meticulous | -13.947 |
Token | government |
Token ID | 1230 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
u | +1.107 |
ire | +1.051 |
- | +1.035 |
ab | +1.023 |
ong | +1.020 |
Neg logit contributions | |
disparate | -0.684 |
newer | -0.664 |
hindsight | -0.658 |
genuine | -0.656 |
totality | -0.647 |
Token | demanding |
Token ID | 11334 |
Feature activation | -4.45e+00 |
Pos logit contributions | |
- | +5.265 |
u | +5.103 |
. | +5.066 |
ia | +4.850 |
ine | +4.764 |
Neg logit contributions | |
disparate | -4.147 |
totality | -4.120 |
newer | -4.039 |
hindsight | -4.024 |
tremendous | -3.986 |
Token | to |
Token ID | 284 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
disparate | +13.940 |
newer | +13.497 |
relentless | +13.343 |
genuine | +13.298 |
blatant | +13.260 |
Neg logit contributions | |
u | -10.004 |
ire | -9.296 |
aga | -9.124 |
ine | -9.005 |
id | -8.991 |
Token | know |
Token ID | 760 |
Feature activation | -8.96e-01 |
Pos logit contributions | |
disparate | +4.566 |
relentless | +4.338 |
newer | +4.329 |
blatant | +4.325 |
genuine | +4.324 |
Neg logit contributions | |
u | -6.175 |
ire | -5.897 |
- | -5.812 |
id | -5.804 |
aga | -5.757 |
Token | $ |
Token ID | 720 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
disparate | +6.973 |
newer | +6.723 |
genuine | +6.652 |
relentless | +6.650 |
blatant | +6.640 |
Neg logit contributions | |
u | -9.725 |
aga | -9.196 |
ire | -9.173 |
ine | -9.151 |
- | -9.077 |
Token | 5 |
Token ID | 20 |
Feature activation | +5.70e+00 |
Pos logit contributions | |
u | +2.598 |
- | +2.282 |
ab | +2.192 |
ine | +2.149 |
ire | +2.128 |
Neg logit contributions | |
disparate | -7.302 |
blatant | -7.086 |
totality | -7.086 |
relentless | -7.079 |
newer | -7.048 |
Token | million |
Token ID | 1510 |
Feature activation | +3.92e+00 |
Pos logit contributions | |
- | +13.070 |
. | +12.995 |
u | +12.460 |
ab | +11.772 |
b | +11.515 |
Neg logit contributions | |
disparate | -11.862 |
blatant | -11.770 |
relentless | -11.768 |
newer | -11.590 |
totality | -11.511 |
Token | and |
Token ID | 290 |
Feature activation | -5.91e-01 |
Pos logit contributions | |
- | +9.054 |
u | +8.505 |
. | +8.014 |
aga | +7.917 |
ire | +7.681 |
Neg logit contributions | |
blatant | -9.350 |
disparate | -9.205 |
relentless | -9.100 |
newer | -8.978 |
venerable | -8.942 |
Token | $ |
Token ID | 720 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
disparate | +1.313 |
blatant | +1.241 |
newer | +1.232 |
relentless | +1.222 |
genuine | +1.219 |
Neg logit contributions | |
u | -1.830 |
- | -1.733 |
ine | -1.722 |
ire | -1.685 |
aga | -1.683 |
Token | 30 |
Token ID | 1270 |
Feature activation | +9.80e+00 |
Pos logit contributions | |
u | +3.111 |
- | +2.720 |
ab | +2.526 |
ine | +2.425 |
id | +2.263 |
Neg logit contributions | |
disparate | -13.120 |
blatant | -12.704 |
totality | -12.701 |
mathemat | -12.695 |
proactive | -12.657 |
Token | million |
Token ID | 1510 |
Feature activation | +8.32e-01 |
Pos logit contributions | |
- | +20.665 |
. | +19.912 |
u | +18.848 |
ire | +17.272 |
ia | +17.200 |
Neg logit contributions | |
disparate | -15.481 |
blatant | -15.074 |
totality | -14.896 |
relentless | -14.760 |
proactive | -14.530 |
Token | a |
Token ID | 257 |
Feature activation | +9.71e-01 |
Pos logit contributions | |
. | +1.618 |
u | +1.612 |
- | +1.604 |
aga | +1.463 |
ire | +1.454 |
Neg logit contributions | |
disparate | -2.577 |
blatant | -2.556 |
relentless | -2.532 |
newer | -2.501 |
proactive | -2.501 |
Token | day |
Token ID | 1110 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
u | +2.770 |
- | +2.759 |
ire | +2.587 |
ine | +2.577 |
aga | +2.572 |
Neg logit contributions | |
disparate | -2.062 |
newer | -2.017 |
genuine | -1.978 |
relentless | -1.970 |
stringent | -1.970 |
Token | . |
Token ID | 13 |
Feature activation | -7.66e+00 |
Pos logit contributions | |
u | +1.392 |
. | +1.391 |
- | +1.320 |
ine | +1.161 |
ong | +1.147 |
Neg logit contributions | |
disparate | -4.349 |
blatant | -4.340 |
genuine | -4.306 |
proactive | -4.286 |
relentless | -4.284 |
Token | But |
Token ID | 887 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
disparate | +21.026 |
newer | +20.864 |
various | +20.833 |
those | +20.792 |
modern | +20.480 |
Neg logit contributions | |
aga | -12.989 |
u | -12.807 |
ire | -12.425 |
ong | -12.187 |
iev | -12.057 |
Token |
|
Token ID | 198 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
- | +10.438 |
u | +9.746 |
. | +9.593 |
id | +8.298 |
ine | +8.295 |
Neg logit contributions | |
tremend | -30.563 |
mathemat | -27.681 |
undermin | -27.563 |
hemor | -26.889 |
cumbers | -26.518 |
Token | G |
Token ID | 38 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
disparate | +16.706 |
newer | +16.435 |
genuine | +16.297 |
various | +16.280 |
relentless | +16.252 |
Neg logit contributions | |
u | -6.861 |
aga | -6.499 |
ire | -6.366 |
ong | -6.178 |
ine | -6.101 |
Token | rim |
Token ID | 3036 |
Feature activation | +5.53e+00 |
Pos logit contributions | |
u | +9.652 |
aga | +9.294 |
id | +9.113 |
ire | +9.040 |
ong | +9.019 |
Neg logit contributions | |
disparate | -12.910 |
totality | -12.692 |
genuine | -12.281 |
relentless | -12.220 |
hindsight | -12.095 |
Token | Lav |
Token ID | 21438 |
Feature activation | +7.13e+00 |
Pos logit contributions | |
u | +14.826 |
- | +14.280 |
aga | +14.167 |
ia | +14.152 |
acy | +14.080 |
Neg logit contributions | |
disparate | -9.527 |
newer | -9.108 |
stringent | -9.056 |
stricter | -8.911 |
genuine | -8.835 |
Token | am |
Token ID | 321 |
Feature activation | +5.29e+00 |
Pos logit contributions | |
u | +17.040 |
ag | +16.255 |
ine | +16.096 |
id | +16.033 |
ab | +15.861 |
Neg logit contributions | |
disparate | -14.315 |
totality | -13.166 |
blatant | -13.123 |
genuine | -13.094 |
behavi | -13.010 |
Token | ancer |
Token ID | 8250 |
Feature activation | +6.49e+00 |
Pos logit contributions | |
u | +10.766 |
id | +10.252 |
aga | +9.935 |
ire | +9.830 |
ag | +9.720 |
Neg logit contributions | |
disparate | -14.024 |
hindsight | -13.658 |
blatant | -13.436 |
proactive | -13.356 |
totality | -13.188 |
Token | vs |
Token ID | 3691 |
Feature activation | -4.25e+00 |
Pos logit contributions | |
u | +14.668 |
- | +14.063 |
ia | +13.433 |
aga | +13.350 |
id | +13.161 |
Neg logit contributions | |
disparate | -13.442 |
blatant | -12.809 |
totality | -12.298 |
genuine | -12.050 |
stringent | -12.035 |
Token | Ragnar |
Token ID | 32797 |
Feature activation | +6.02e+00 |
Pos logit contributions | |
disparate | +12.674 |
newer | +12.255 |
genuine | +12.156 |
relentless | +12.144 |
blatant | +12.117 |
Neg logit contributions | |
u | -10.019 |
aga | -9.430 |
ire | -9.367 |
ine | -9.171 |
ong | -9.138 |
Token |
|
Token ID | 198 |
Feature activation | +7.87e+00 |
Pos logit contributions | |
os | +14.664 |
id | +13.696 |
u | +13.237 |
ag | +13.207 |
- | +13.160 |
Neg logit contributions | |
disparate | -12.071 |
blatant | -11.936 |
distinguishing | -11.902 |
sophisticated | -11.774 |
drastic | -11.723 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+00 |
Pos logit contributions | |
- | +11.204 |
u | +10.449 |
. | +10.375 |
id | +8.933 |
ine | +8.887 |
Neg logit contributions | |
tremend | -32.018 |
mathemat | -28.978 |
undermin | -28.885 |
hemor | -28.146 |
cumbers | -27.841 |
Token | Gen |
Token ID | 13746 |
Feature activation | +5.13e+00 |
Pos logit contributions | |
disparate | +15.223 |
newer | +14.931 |
genuine | +14.811 |
relentless | +14.780 |
various | +14.779 |
Neg logit contributions | |
u | -6.320 |
aga | -5.904 |
ire | -5.804 |
ong | -5.621 |
ine | -5.584 |
Token | � |
Token ID | 447 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
disparate | +15.915 |
newer | +15.547 |
genuine | +15.404 |
relentless | +15.385 |
blatant | +15.348 |
Neg logit contributions | |
u | -8.120 |
aga | -7.556 |
ire | -7.473 |
ine | -7.262 |
ong | -7.252 |
Token | � |
Token ID | 251 |
Feature activation | -5.53e-01 |
Pos logit contributions | |
� | +18.839 |
� | +17.868 |
u | +17.726 |
� | +17.592 |
id | +17.501 |
Neg logit contributions | |
tremend | -18.259 |
disparate | -18.203 |
relentless | -17.382 |
blatant | -17.326 |
newer | -17.057 |
Token | she |
Token ID | 673 |
Feature activation | +2.41e+00 |
Pos logit contributions | |
disparate | +1.410 |
newer | +1.343 |
totality | +1.314 |
relentless | +1.305 |
blatant | +1.304 |
Neg logit contributions | |
u | -1.575 |
aga | -1.507 |
- | -1.484 |
ine | -1.479 |
ab | -1.458 |
Token | said |
Token ID | 531 |
Feature activation | +7.03e-01 |
Pos logit contributions | |
u | +5.974 |
- | +5.739 |
aga | +5.601 |
ab | +5.495 |
ine | +5.478 |
Neg logit contributions | |
disparate | -6.164 |
newer | -5.797 |
totality | -5.766 |
hindsight | -5.741 |
genuine | -5.683 |
Token | . |
Token ID | 13 |
Feature activation | +4.05e-01 |
Pos logit contributions | |
u | +0.445 |
- | +0.306 |
aga | +0.304 |
. | +0.284 |
id | +0.284 |
Neg logit contributions | |
disparate | -3.299 |
newer | -3.189 |
relentless | -3.142 |
totality | -3.140 |
genuine | -3.132 |
Token | � |
Token ID | 447 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
u | +0.711 |
ab | +0.628 |
- | +0.621 |
id | +0.619 |
ine | +0.619 |
Neg logit contributions | |
disparate | -1.467 |
newer | -1.399 |
relentless | -1.399 |
venerable | -1.384 |
totality | -1.383 |
Token | � |
Token ID | 250 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
� | +19.186 |
� | +18.736 |
� | +18.147 |
� | +17.933 |
� | +17.775 |
Neg logit contributions | |
disparate | -21.236 |
tremend | -20.692 |
blatant | -19.752 |
relentless | -19.691 |
venerable | -19.685 |
Token | If |
Token ID | 1532 |
Feature activation | -5.18e+00 |
Pos logit contributions | |
disparate | +7.368 |
newer | +7.169 |
relentless | +7.074 |
genuine | +7.072 |
blatant | +7.039 |
Neg logit contributions | |
u | -3.740 |
ire | -3.372 |
aga | -3.368 |
ine | -3.323 |
id | -3.303 |
Token | he |
Token ID | 339 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
disparate | +16.985 |
newer | +16.573 |
genuine | +16.406 |
relentless | +16.398 |
blatant | +16.346 |
Neg logit contributions | |
u | -10.007 |
aga | -9.361 |
ire | -9.287 |
ine | -9.041 |
ong | -9.026 |
Token | � |
Token ID | 447 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
disparate | +5.416 |
newer | +5.271 |
relentless | +5.219 |
totality | +5.179 |
genuine | +5.161 |
Neg logit contributions | |
u | -3.594 |
ire | -3.259 |
aga | -3.229 |
ine | -3.227 |
ab | -3.208 |
Token | � |
Token ID | 247 |
Feature activation | +6.20e+00 |
Pos logit contributions | |
� | +22.308 |
u | +19.401 |
� | +19.338 |
� | +19.020 |
� | +18.568 |
Neg logit contributions | |
tremend | -30.564 |
mathemat | -30.335 |
behavi | -28.133 |
anwhile | -27.546 |
disparate | -27.539 |
Token | A |
Token ID | 32 |
Feature activation | -4.04e+00 |
Pos logit contributions | |
disparate | +15.333 |
newer | +15.027 |
genuine | +14.985 |
various | +14.962 |
relentless | +14.927 |
Neg logit contributions | |
u | -8.436 |
aga | -8.267 |
ire | -7.943 |
ong | -7.798 |
ée | -7.627 |
Token | little |
Token ID | 1310 |
Feature activation | -2.56e+00 |
Pos logit contributions | |
disparate | +12.963 |
newer | +12.625 |
genuine | +12.513 |
various | +12.481 |
relentless | +12.471 |
Neg logit contributions | |
u | -8.221 |
aga | -7.693 |
ire | -7.662 |
ine | -7.461 |
ong | -7.437 |
Token | later |
Token ID | 1568 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
disparate | +8.879 |
genuine | +8.544 |
newer | +8.524 |
relentless | +8.477 |
blatant | +8.477 |
Neg logit contributions | |
u | -4.881 |
- | -4.652 |
ire | -4.513 |
aga | -4.450 |
ia | -4.366 |
Token | : |
Token ID | 25 |
Feature activation | -6.09e+00 |
Pos logit contributions | |
u | +6.176 |
- | +6.064 |
ire | +5.869 |
id | +5.800 |
ine | +5.797 |
Neg logit contributions | |
disparate | -6.749 |
blatant | -6.332 |
newer | -6.258 |
tremendous | -6.229 |
genuine | -6.184 |
Token | � |
Token ID | 564 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
disparate | +19.549 |
newer | +19.143 |
various | +19.006 |
genuine | +18.956 |
relentless | +18.954 |
Neg logit contributions | |
u | -11.088 |
aga | -10.520 |
ire | -10.310 |
ong | -10.019 |
ine | -10.015 |
Token | � |
Token ID | 250 |
Feature activation | -3.59e+00 |
Pos logit contributions | |
� | +17.448 |
� | +16.769 |
� | +16.708 |
� | +16.462 |
� | +16.436 |
Neg logit contributions | |
disparate | -20.579 |
tremend | -19.846 |
newer | -19.463 |
relentless | -19.358 |
stricter | -19.249 |
Token | There |
Token ID | 1858 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
disparate | +13.015 |
newer | +12.722 |
genuine | +12.611 |
relentless | +12.593 |
various | +12.558 |
Neg logit contributions | |
u | -5.801 |
aga | -5.333 |
ire | -5.295 |
ine | -5.129 |
ong | -5.104 |
Token | � |
Token ID | 447 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
u | +2.054 |
id | +1.925 |
- | +1.925 |
ong | +1.887 |
ine | +1.884 |
Neg logit contributions | |
disparate | -3.282 |
relentless | -3.097 |
gradual | -3.064 |
blatant | -3.064 |
totality | -3.056 |
Token | � |
Token ID | 247 |
Feature activation | +5.78e+00 |
Pos logit contributions | |
� | +18.359 |
� | +16.790 |
� | +16.379 |
� | +16.323 |
� | +15.506 |
Neg logit contributions | |
mathemat | -26.702 |
disparate | -26.146 |
tremend | -25.855 |
blatant | -25.812 |
totality | -25.150 |
Token | s |
Token ID | 82 |
Feature activation | -7.14e-01 |
Pos logit contributions | |
u | +14.604 |
id | +13.872 |
ine | +13.593 |
ia | +13.586 |
ire | +13.414 |
Neg logit contributions | |
disparate | -11.542 |
totality | -10.817 |
drastic | -10.674 |
relentless | -10.605 |
blatant | -10.536 |
Token | no |
Token ID | 645 |
Feature activation | -3.27e+00 |
Pos logit contributions | |
disparate | +1.682 |
relentless | +1.535 |
venerable | +1.528 |
newer | +1.517 |
blatant | +1.502 |
Neg logit contributions | |
u | -2.221 |
- | -2.077 |
ire | -2.075 |
ong | -2.064 |
ine | -2.064 |
Token | C |
Token ID | 34 |
Feature activation | +4.32e+00 |
Pos logit contributions | |
u | +12.132 |
- | +12.052 |
. | +11.521 |
ig | +10.538 |
ire | +10.381 |
Neg logit contributions | |
disparate | -12.439 |
proactive | -12.110 |
venerable | -12.082 |
relentless | -11.982 |
meticulous | -11.979 |
Token | from |
Token ID | 422 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
u | +10.934 |
- | +10.902 |
. | +10.762 |
ag | +10.041 |
ab | +10.010 |
Neg logit contributions | |
disparate | -9.265 |
blatant | -8.646 |
venerable | -8.594 |
meticulous | -8.530 |
myriad | -8.336 |
Token | the |
Token ID | 262 |
Feature activation | -3.03e+00 |
Pos logit contributions | |
disparate | +5.355 |
blatant | +5.084 |
genuine | +4.928 |
relentless | +4.906 |
newer | +4.856 |
Neg logit contributions | |
u | -6.231 |
- | -5.886 |
ire | -5.825 |
ab | -5.640 |
ine | -5.632 |
Token | pre |
Token ID | 662 |
Feature activation | +6.92e+00 |
Pos logit contributions | |
disparate | +6.748 |
blatant | +6.292 |
genuine | +6.187 |
newer | +6.159 |
totality | +6.037 |
Neg logit contributions | |
u | -9.803 |
ire | -9.291 |
ine | -9.169 |
- | -9.159 |
ab | -9.007 |
Token | - |
Token ID | 12 |
Feature activation | +3.72e+00 |
Pos logit contributions | |
- | +16.741 |
u | +14.816 |
ag | +14.032 |
ine | +13.859 |
b | +13.562 |
Neg logit contributions | |
disparate | -14.342 |
blatant | -13.709 |
DRAG | -13.680 |
venerable | -13.510 |
theless | -13.255 |
Token | industrial |
Token ID | 31130 |
Feature activation | +3.76e+00 |
Pos logit contributions | |
u | +5.003 |
ag | +4.623 |
ine | +4.382 |
ab | +4.266 |
- | +4.115 |
Neg logit contributions | |
disparate | -13.825 |
totality | -13.631 |
myriad | -13.465 |
DRAG | -13.458 |
newer | -13.188 |
Token | age |
Token ID | 2479 |
Feature activation | +3.67e+00 |
Pos logit contributions | |
- | +10.203 |
u | +9.585 |
. | +9.265 |
ine | +9.197 |
al | +8.825 |
Neg logit contributions | |
disparate | -7.674 |
blatant | -7.170 |
disgruntled | -6.976 |
newer | -6.912 |
venerable | -6.896 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+00 |
Pos logit contributions | |
. | +8.505 |
- | +8.266 |
u | +8.161 |
ire | +7.394 |
ab | +7.343 |
Neg logit contributions | |
disparate | -9.053 |
blatant | -8.749 |
proactive | -8.697 |
spontaneous | -8.425 |
venerable | -8.424 |
Token |
|
Token ID | 198 |
Feature activation | +5.07e+00 |
Pos logit contributions | |
disparate | +13.674 |
newer | +13.322 |
relentless | +13.197 |
genuine | +13.186 |
blatant | +13.166 |
Neg logit contributions | |
u | -8.594 |
aga | -7.998 |
ire | -7.962 |
ine | -7.775 |
ong | -7.761 |
Token |
|
Token ID | 198 |
Feature activation | -5.46e+00 |
Pos logit contributions | |
- | +6.338 |
u | +6.115 |
. | +5.533 |
id | +5.108 |
ine | +5.005 |
Neg logit contributions | |
tremend | -22.200 |
mathemat | -20.643 |
undermin | -20.468 |
hemor | -19.969 |
behavi | -19.700 |
Token | H |
Token ID | 39 |
Feature activation | +6.66e+00 |
Pos logit contributions | |
disparate | +17.385 |
newer | +17.068 |
genuine | +17.067 |
various | +17.000 |
relentless | +16.971 |
Neg logit contributions | |
u | -8.408 |
aga | -8.327 |
ire | -8.018 |
ong | -7.735 |
ine | -7.586 |
Token | which |
Token ID | 543 |
Feature activation | -7.05e+00 |
Pos logit contributions | |
disparate | +17.621 |
newer | +17.200 |
genuine | +17.038 |
relentless | +17.018 |
various | +16.979 |
Neg logit contributions | |
u | -10.404 |
aga | -9.758 |
ire | -9.671 |
ine | -9.408 |
ong | -9.403 |
Token | followed |
Token ID | 3940 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
disparate | +23.218 |
various | +22.769 |
newer | +22.722 |
genuine | +22.568 |
blatant | +22.470 |
Neg logit contributions | |
u | -11.002 |
aga | -10.345 |
ire | -10.148 |
ong | -10.056 |
ine | -9.884 |
Token | a |
Token ID | 257 |
Feature activation | -4.45e+00 |
Pos logit contributions | |
disparate | +3.376 |
newer | +3.293 |
venerable | +3.171 |
totality | +3.168 |
genuine | +3.140 |
Neg logit contributions | |
u | -5.721 |
aga | -5.482 |
- | -5.477 |
ire | -5.413 |
id | -5.364 |
Token | challenge |
Token ID | 4427 |
Feature activation | +4.73e+00 |
Pos logit contributions | |
disparate | +13.244 |
newer | +12.946 |
various | +12.743 |
genuine | +12.724 |
relentless | +12.688 |
Neg logit contributions | |
u | -10.403 |
aga | -9.817 |
ire | -9.764 |
ine | -9.499 |
ong | -9.432 |
Token | from |
Token ID | 422 |
Feature activation | -4.81e+00 |
Pos logit contributions | |
- | +10.788 |
. | +10.361 |
u | +10.091 |
aga | +9.832 |
ire | +9.657 |
Neg logit contributions | |
disparate | -10.357 |
venerable | -9.799 |
newer | -9.771 |
hindsight | -9.732 |
totality | -9.728 |
Token | central |
Token ID | 4318 |
Feature activation | +4.72e+00 |
Pos logit contributions | |
disparate | +14.733 |
newer | +14.343 |
genuine | +14.202 |
relentless | +14.199 |
blatant | +14.184 |
Neg logit contributions | |
u | -10.796 |
aga | -10.201 |
ire | -10.112 |
ine | -9.866 |
ong | -9.796 |
Token | government |
Token ID | 1230 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
- | +13.816 |
u | +13.051 |
aga | +12.793 |
ia | +12.752 |
ire | +12.648 |
Neg logit contributions | |
disparate | -7.541 |
relentless | -7.405 |
totality | -7.289 |
tremendous | -7.211 |
newer | -7.107 |
Token | . |
Token ID | 13 |
Feature activation | -4.30e+00 |
Pos logit contributions | |
- | +7.916 |
. | +7.758 |
u | +7.540 |
aga | +7.287 |
ia | +7.269 |
Neg logit contributions | |
disparate | -5.726 |
totality | -5.569 |
hindsight | -5.484 |
venerable | -5.379 |
newer | -5.379 |
Token |
|
Token ID | 198 |
Feature activation | +6.55e+00 |
Pos logit contributions | |
disparate | +14.415 |
newer | +14.031 |
relentless | +13.945 |
genuine | +13.907 |
blatant | +13.877 |
Neg logit contributions | |
u | -8.309 |
aga | -7.687 |
ire | -7.627 |
ine | -7.438 |
ong | -7.418 |
Token |
|
Token ID | 198 |
Feature activation | -5.99e+00 |
Pos logit contributions | |
- | +9.092 |
u | +8.575 |
. | +8.192 |
id | +7.288 |
ine | +7.236 |
Neg logit contributions | |
tremend | -27.850 |
mathemat | -25.567 |
undermin | -25.527 |
hemor | -24.921 |
cumbers | -24.226 |
Token | For |
Token ID | 1890 |
Feature activation | +3.74e+00 |
Pos logit contributions | |
disparate | +19.177 |
genuine | +18.907 |
newer | +18.854 |
various | +18.833 |
blatant | +18.770 |
Neg logit contributions | |
aga | -8.161 |
u | -8.043 |
ire | -7.850 |
ong | -7.627 |
iev | -7.452 |
Token | in |
Token ID | 287 |
Feature activation | -4.26e+00 |
Pos logit contributions | |
u | +5.109 |
- | +5.008 |
ine | +4.774 |
ire | +4.756 |
ong | +4.738 |
Neg logit contributions | |
disparate | -4.177 |
blatant | -4.101 |
hindsight | -3.999 |
gradual | -3.969 |
newer | -3.959 |
Token | its |
Token ID | 663 |
Feature activation | -3.17e+00 |
Pos logit contributions | |
disparate | +15.028 |
newer | +14.685 |
relentless | +14.534 |
genuine | +14.510 |
blatant | +14.481 |
Neg logit contributions | |
u | -7.577 |
ire | -6.942 |
aga | -6.895 |
ine | -6.738 |
ong | -6.675 |
Token | thr |
Token ID | 5636 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
disparate | +8.038 |
newer | +7.761 |
blatant | +7.719 |
genuine | +7.681 |
drastic | +7.509 |
Neg logit contributions | |
u | -8.947 |
ire | -8.568 |
ine | -8.469 |
aga | -8.429 |
- | -8.352 |
Token | all |
Token ID | 439 |
Feature activation | +5.07e+00 |
Pos logit contributions | |
ong | +18.718 |
u | +16.617 |
ab | +16.347 |
um | +16.112 |
ag | +15.960 |
Neg logit contributions | |
proactive | -21.004 |
disparate | -20.585 |
deceptive | -20.459 |
blatant | -20.388 |
misleading | -20.243 |
Token | ? |
Token ID | 30 |
Feature activation | -6.54e+00 |
Pos logit contributions | |
- | +11.641 |
u | +11.549 |
. | +11.074 |
id | +10.923 |
ong | +10.719 |
Neg logit contributions | |
disparate | -10.520 |
blatant | -10.354 |
newer | -10.181 |
tremendous | -10.145 |
genuine | -10.133 |
Token |
|
Token ID | 198 |
Feature activation | +5.05e+00 |
Pos logit contributions | |
various | +18.726 |
disparate | +18.692 |
newer | +18.523 |
those | +18.476 |
modern | +18.323 |
Neg logit contributions | |
u | -11.371 |
aga | -11.164 |
ire | -10.946 |
ong | -10.740 |
ine | -10.563 |
Token |
|
Token ID | 198 |
Feature activation | -5.36e+00 |
Pos logit contributions | |
- | +5.951 |
u | +5.691 |
. | +5.270 |
ine | +4.816 |
id | +4.606 |
Neg logit contributions | |
tremend | -22.855 |
mathemat | -21.308 |
undermin | -21.079 |
hemor | -20.592 |
behavi | -20.387 |
Token | And |
Token ID | 1870 |
Feature activation | -9.16e+00 |
Pos logit contributions | |
disparate | +16.171 |
newer | +15.891 |
various | +15.819 |
those | +15.799 |
genuine | +15.789 |
Neg logit contributions | |
u | -8.766 |
aga | -8.730 |
ire | -8.511 |
ong | -8.264 |
iev | -8.107 |
Token | without |
Token ID | 1231 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
those | +27.224 |
various | +26.903 |
disparate | +26.813 |
many | +26.600 |
newer | +26.567 |
Neg logit contributions | |
u | -11.573 |
ire | -11.412 |
aga | -11.173 |
iev | -10.784 |
ée | -10.697 |
Token | going |
Token ID | 1016 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
disparate | +3.710 |
newer | +3.422 |
relentless | +3.314 |
blatant | +3.295 |
genuine | +3.286 |
Neg logit contributions | |
u | -7.384 |
aga | -6.995 |
id | -6.924 |
- | -6.900 |
ab | -6.890 |
Token | into |
Token ID | 656 |
Feature activation | -2.04e+00 |
Pos logit contributions | |
u | +5.088 |
- | +5.065 |
ab | +4.818 |
ine | +4.812 |
ong | +4.715 |
Neg logit contributions | |
disparate | -4.117 |
newer | -3.961 |
venerable | -3.811 |
poorer | -3.706 |
relentless | -3.667 |
Token | elt |
Token ID | 2120 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
elt | +22.134 |
id | +18.371 |
u | +17.513 |
elle | +17.157 |
ire | +17.112 |
Neg logit contributions | |
tremend | -33.661 |
behavi | -32.470 |
hemor | -31.067 |
metic | -30.430 |
misunder | -29.882 |
Token | ine |
Token ID | 500 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
ine | +25.272 |
id | +20.994 |
ines | +20.456 |
u | +20.331 |
ia | +20.256 |
Neg logit contributions | |
tremend | -30.177 |
hemor | -29.238 |
behavi | -28.503 |
cumbers | -28.111 |
mathemat | -27.814 |
Token | 's |
Token ID | 338 |
Feature activation | -4.51e+00 |
Pos logit contributions | |
u | +2.118 |
- | +2.074 |
ire | +1.936 |
aga | +1.910 |
. | +1.887 |
Neg logit contributions | |
disparate | -3.194 |
totality | -3.135 |
newer | -3.072 |
blatant | -3.031 |
spontaneous | -3.003 |
Token | intervention |
Token ID | 9572 |
Feature activation | +3.30e+00 |
Pos logit contributions | |
disparate | +11.935 |
newer | +11.560 |
genuine | +11.375 |
relentless | +11.293 |
blatant | +11.291 |
Neg logit contributions | |
u | -11.942 |
ire | -11.307 |
aga | -11.279 |
ine | -11.092 |
ong | -11.021 |
Token | reminds |
Token ID | 17603 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
- | +8.058 |
u | +7.819 |
ire | +7.519 |
. | +7.507 |
ine | +7.292 |
Neg logit contributions | |
disparate | -7.451 |
totality | -7.386 |
venerable | -7.082 |
newer | -7.046 |
myriad | -6.961 |
Token | us |
Token ID | 514 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
u | +0.356 |
- | +0.351 |
ire | +0.340 |
id | +0.339 |
ine | +0.335 |
Neg logit contributions | |
disparate | -0.214 |
totality | -0.206 |
newer | -0.191 |
relentless | -0.189 |
blatant | -0.189 |
Token | of |
Token ID | 286 |
Feature activation | -5.95e+00 |
Pos logit contributions | |
disparate | +5.547 |
newer | +5.349 |
totality | +5.318 |
genuine | +5.280 |
relentless | +5.276 |
Neg logit contributions | |
u | -3.117 |
- | -2.844 |
ine | -2.840 |
ire | -2.793 |
aga | -2.771 |
Token | the |
Token ID | 262 |
Feature activation | -7.98e+00 |
Pos logit contributions | |
disparate | +18.903 |
newer | +18.441 |
genuine | +18.264 |
relentless | +18.241 |
various | +18.197 |
Neg logit contributions | |
u | -11.972 |
aga | -11.261 |
ire | -11.161 |
ine | -10.870 |
ong | -10.867 |
Token | sort |
Token ID | 3297 |
Feature activation | +5.97e+00 |
Pos logit contributions | |
disparate | +24.699 |
relentless | +24.332 |
various | +24.189 |
newer | +24.130 |
genuine | +24.118 |
Neg logit contributions | |
u | -13.413 |
aga | -12.934 |
ire | -12.442 |
ong | -12.273 |
ée | -12.253 |
Token | of |
Token ID | 286 |
Feature activation | -6.12e+00 |
Pos logit contributions | |
u | +11.751 |
- | +11.442 |
id | +10.546 |
ine | +10.499 |
ire | +10.313 |
Neg logit contributions | |
mathemat | -14.889 |
tremend | -14.692 |
disparate | -14.639 |
hemor | -13.912 |
misunder | -13.905 |
Token | division |
Token ID | 7297 |
Feature activation | -5.53e-02 |
Pos logit contributions | |
disparate | +20.125 |
newer | +19.620 |
relentless | +19.556 |
genuine | +19.543 |
blatant | +19.498 |
Neg logit contributions | |
u | -11.061 |
aga | -10.432 |
ire | -10.252 |
ong | -9.985 |
ine | -9.932 |
Token | of |
Token ID | 286 |
Feature activation | -3.56e+00 |
Pos logit contributions | |
u | +1.598 |
- | +1.508 |
. | +1.499 |
ire | +1.331 |
aga | +1.326 |
Neg logit contributions | |
disparate | -4.431 |
blatant | -4.252 |
relentless | -4.233 |
newer | -4.195 |
genuine | -4.176 |
Token | warm |
Token ID | 5814 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
disparate | +10.249 |
newer | +9.805 |
blatant | +9.740 |
genuine | +9.633 |
relentless | +9.619 |
Neg logit contributions | |
u | -9.186 |
aga | -8.625 |
ine | -8.466 |
- | -8.460 |
ire | -8.453 |
Token | up |
Token ID | 929 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
- | +23.542 |
up | +21.946 |
u | +20.727 |
ong | +20.203 |
aga | +19.620 |
Neg logit contributions | |
disparate | -16.599 |
poorer | -16.550 |
blatant | -15.769 |
stricter | -15.438 |
venerable | -15.276 |
Token | . |
Token ID | 13 |
Feature activation | -8.17e+00 |
Pos logit contributions | |
. | +1.951 |
- | +1.946 |
u | +1.944 |
ine | +1.694 |
aga | +1.683 |
Neg logit contributions | |
disparate | -4.805 |
newer | -4.589 |
blatant | -4.570 |
venerable | -4.565 |
relentless | -4.549 |
Token | There |
Token ID | 1318 |
Feature activation | -6.51e-01 |
Pos logit contributions | |
newer | +21.409 |
various | +21.170 |
modern | +21.133 |
those | +21.015 |
disparate | +20.766 |
Neg logit contributions | |
aga | -13.944 |
u | -13.599 |
ire | -13.328 |
iev | -13.096 |
ong | -13.037 |
Token | are |
Token ID | 389 |
Feature activation | -6.62e+00 |
Pos logit contributions | |
disparate | +2.333 |
totality | +2.225 |
relentless | +2.222 |
blatant | +2.200 |
newer | +2.187 |
Neg logit contributions | |
u | -1.201 |
ine | -1.103 |
- | -1.099 |
ong | -1.091 |
ab | -1.086 |
Token | no |
Token ID | 645 |
Feature activation | -3.94e+00 |
Pos logit contributions | |
disparate | +21.716 |
newer | +21.389 |
various | +21.261 |
genuine | +21.153 |
blatant | +20.996 |
Neg logit contributions | |
u | -11.544 |
aga | -10.942 |
ire | -10.771 |
ong | -10.474 |
ine | -10.443 |
Token | excuses |
Token ID | 25893 |
Feature activation | +2.71e+00 |
Pos logit contributions | |
disparate | +12.717 |
newer | +12.273 |
relentless | +12.258 |
blatant | +12.166 |
genuine | +12.143 |
Neg logit contributions | |
u | -8.374 |
ire | -7.785 |
aga | -7.735 |
ong | -7.597 |
ine | -7.574 |
Token | . |
Token ID | 13 |
Feature activation | -7.18e+00 |
Pos logit contributions | |
. | +5.904 |
- | +5.711 |
u | +5.594 |
ab | +5.187 |
ine | +5.153 |
Neg logit contributions | |
disparate | -7.404 |
totality | -7.344 |
relentless | -7.140 |
venerable | -7.025 |
gradual | -6.960 |
Token |
|
Token ID | 198 |
Feature activation | +6.02e+00 |
Pos logit contributions | |
newer | +19.169 |
various | +18.898 |
disparate | +18.860 |
modern | +18.821 |
genuine | +18.752 |
Neg logit contributions | |
u | -13.582 |
aga | -13.534 |
ire | -13.095 |
ong | -12.783 |
iev | -12.694 |
Token |
|
Token ID | 198 |
Feature activation | -5.23e+00 |
Pos logit contributions | |
- | +7.789 |
u | +7.115 |
. | +6.750 |
ine | +6.067 |
id | +6.003 |
Neg logit contributions | |
tremend | -26.604 |
mathemat | -24.715 |
undermin | -24.471 |
hemor | -24.030 |
cumbers | -23.409 |
Token | a |
Token ID | 257 |
Feature activation | -7.49e+00 |
Pos logit contributions | |
disparate | +25.007 |
genuine | +24.528 |
newer | +24.510 |
various | +24.475 |
relentless | +24.123 |
Neg logit contributions | |
u | -11.695 |
aga | -10.993 |
ire | -10.699 |
ong | -10.629 |
ine | -10.451 |
Token | break |
Token ID | 2270 |
Feature activation | +1.98e+00 |
Pos logit contributions | |
disparate | +24.326 |
genuine | +24.039 |
newer | +24.032 |
relentless | +23.653 |
blatant | +23.596 |
Neg logit contributions | |
u | -11.464 |
aga | -10.893 |
ire | -10.432 |
ong | -10.365 |
iev | -10.257 |
Token | away |
Token ID | 8272 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
- | +4.787 |
u | +4.609 |
ab | +4.258 |
. | +4.157 |
ire | +4.106 |
Neg logit contributions | |
disparate | -5.395 |
blatant | -5.261 |
relentless | -5.256 |
totality | -5.196 |
genuine | -5.125 |
Token | , |
Token ID | 11 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
disparate | +6.821 |
relentless | +6.706 |
blatant | +6.666 |
newer | +6.630 |
totality | +6.612 |
Neg logit contributions | |
u | -3.252 |
ire | -3.048 |
- | -2.995 |
aga | -2.956 |
ine | -2.939 |
Token | but |
Token ID | 475 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
disparate | +28.794 |
newer | +28.718 |
various | +28.375 |
genuine | +28.230 |
those | +28.097 |
Neg logit contributions | |
u | -14.055 |
aga | -13.528 |
ong | -13.291 |
ée | -13.059 |
ire | -12.918 |
Token | with |
Token ID | 351 |
Feature activation | -9.88e+00 |
Pos logit contributions | |
those | +33.959 |
many | +33.209 |
various | +32.973 |
genuine | +32.832 |
newer | +32.688 |
Neg logit contributions | |
u | -15.381 |
aga | -15.284 |
ée | -15.096 |
ong | -14.690 |
usk | -14.275 |
Token | no |
Token ID | 645 |
Feature activation | -7.40e+00 |
Pos logit contributions | |
disparate | +30.791 |
newer | +30.579 |
genuine | +30.437 |
various | +30.347 |
modern | +30.074 |
Neg logit contributions | |
u | -12.489 |
aga | -11.679 |
ée | -11.439 |
ong | -11.428 |
ire | -10.898 |
Token | construct |
Token ID | 5678 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
disparate | +26.278 |
genuine | +26.033 |
newer | +25.983 |
various | +25.546 |
blatant | +25.537 |
Neg logit contributions | |
u | -9.316 |
aga | -8.767 |
ong | -8.192 |
ire | -8.145 |
ée | -8.001 |
Token | ors |
Token ID | 669 |
Feature activation | -9.87e-01 |
Pos logit contributions | |
- | +5.031 |
u | +4.962 |
ion | +4.599 |
iv | +4.564 |
ag | +4.556 |
Neg logit contributions | |
disparate | -13.626 |
totality | -13.540 |
blatant | -13.348 |
proactive | -13.288 |
relentless | -13.277 |
Token | left |
Token ID | 1364 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
disparate | +3.635 |
relentless | +3.530 |
blatant | +3.502 |
totality | +3.477 |
genuine | +3.455 |
Neg logit contributions | |
u | -1.569 |
- | -1.522 |
ire | -1.486 |
ine | -1.450 |
ia | -1.416 |
Token | they |
Token ID | 484 |
Feature activation | -3.76e+00 |
Pos logit contributions | |
disparate | +6.042 |
relentless | +5.893 |
blatant | +5.878 |
totality | +5.850 |
newer | +5.811 |
Neg logit contributions | |
u | -2.526 |
- | -2.347 |
ire | -2.304 |
ine | -2.252 |
ia | -2.217 |
Token | is |
Token ID | 318 |
Feature activation | -4.20e+00 |
Pos logit contributions | |
u | +6.033 |
- | +6.026 |
. | +5.711 |
ia | +5.703 |
id | +5.629 |
Neg logit contributions | |
disparate | -4.541 |
newer | -4.383 |
stringent | -4.320 |
totality | -4.308 |
venerable | -4.306 |
Token | very |
Token ID | 845 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
disparate | +13.611 |
newer | +13.232 |
relentless | +13.085 |
genuine | +13.066 |
various | +13.021 |
Neg logit contributions | |
u | -8.648 |
aga | -8.091 |
ire | -7.997 |
ine | -7.853 |
ong | -7.792 |
Token | paradox |
Token ID | 22226 |
Feature activation | +7.26e+00 |
Pos logit contributions | |
disparate | +3.723 |
newer | +3.605 |
totality | +3.588 |
relentless | +3.585 |
various | +3.453 |
Neg logit contributions | |
u | -5.434 |
ire | -5.112 |
- | -5.099 |
aga | -5.092 |
ab | -5.061 |
Token | ical |
Token ID | 605 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
ic | +13.282 |
- | +12.964 |
u | +12.775 |
al | +12.342 |
ine | +12.220 |
Neg logit contributions | |
disparate | -16.518 |
newer | -15.590 |
disgruntled | -15.500 |
totality | -15.277 |
gradual | -15.212 |
Token | . |
Token ID | 13 |
Feature activation | -8.04e+00 |
Pos logit contributions | |
u | +2.138 |
- | +2.043 |
. | +2.021 |
ong | +1.911 |
ine | +1.905 |
Neg logit contributions | |
disparate | -4.708 |
relentless | -4.614 |
newer | -4.538 |
stringent | -4.506 |
gradual | -4.505 |
Token | What |
Token ID | 1867 |
Feature activation | -5.58e+00 |
Pos logit contributions | |
various | +22.316 |
newer | +22.312 |
disparate | +22.260 |
those | +22.108 |
genuine | +22.064 |
Neg logit contributions | |
aga | -12.923 |
u | -12.702 |
ire | -12.243 |
iev | -12.143 |
ine | -11.811 |
Token | 's |
Token ID | 338 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
disparate | +20.232 |
newer | +19.831 |
genuine | +19.709 |
various | +19.641 |
relentless | +19.607 |
Neg logit contributions | |
u | -8.248 |
aga | -7.672 |
ire | -7.517 |
ine | -7.267 |
ong | -7.266 |
Token | your |
Token ID | 534 |
Feature activation | -3.19e+00 |
Pos logit contributions | |
disparate | +4.509 |
relentless | +4.254 |
totality | +4.238 |
newer | +4.157 |
blatant | +4.101 |
Neg logit contributions | |
u | -7.555 |
ire | -7.129 |
- | -7.044 |
aga | -7.004 |
ine | -6.985 |
Token | point |
Token ID | 966 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
disparate | +7.907 |
newer | +7.605 |
relentless | +7.518 |
genuine | +7.451 |
blatant | +7.406 |
Neg logit contributions | |
u | -9.181 |
ire | -8.626 |
aga | -8.618 |
ong | -8.531 |
ine | -8.519 |
Token | ? |
Token ID | 30 |
Feature activation | -6.75e+00 |
Pos logit contributions | |
- | +8.633 |
u | +8.602 |
. | +8.240 |
ine | +7.778 |
id | +7.757 |
Neg logit contributions | |
disparate | -7.646 |
newer | -7.423 |
totality | -7.405 |
relentless | -7.404 |
gradual | -7.154 |
Token | And |
Token ID | 843 |
Feature activation | -7.88e+00 |
Pos logit contributions | |
disparate | +20.853 |
newer | +20.600 |
various | +20.522 |
genuine | +20.486 |
blatant | +20.351 |
Neg logit contributions | |
u | -10.934 |
aga | -10.724 |
ire | -10.337 |
iev | -9.996 |
ine | -9.979 |
Token | of |
Token ID | 286 |
Feature activation | -6.59e+00 |
Pos logit contributions | |
u | +7.393 |
- | +7.166 |
ab | +6.756 |
ine | +6.595 |
id | +6.572 |
Neg logit contributions | |
disparate | -9.881 |
relentless | -9.672 |
blatant | -9.490 |
newer | -9.359 |
genuine | -9.343 |
Token | conventional |
Token ID | 10224 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
disparate | +22.113 |
newer | +21.769 |
various | +21.533 |
genuine | +21.502 |
modern | +21.364 |
Neg logit contributions | |
u | -11.145 |
aga | -10.481 |
ire | -10.301 |
ong | -10.109 |
ine | -9.955 |
Token | ice |
Token ID | 4771 |
Feature activation | +6.56e+00 |
Pos logit contributions | |
- | +0.528 |
u | +0.517 |
ine | +0.495 |
ia | +0.489 |
ire | +0.487 |
Neg logit contributions | |
disparate | -0.323 |
blatant | -0.312 |
relentless | -0.301 |
totality | -0.299 |
genuine | -0.295 |
Token | breakers |
Token ID | 49295 |
Feature activation | +2.36e+00 |
Pos logit contributions | |
- | +15.257 |
u | +13.759 |
b | +13.342 |
ab | +13.180 |
. | +13.143 |
Neg logit contributions | |
disparate | -12.972 |
blatant | -12.104 |
hindsight | -12.101 |
genuine | -11.940 |
anecdotal | -11.922 |
Token | . |
Token ID | 13 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
. | +5.231 |
- | +5.144 |
u | +5.073 |
ong | +4.833 |
ab | +4.724 |
Neg logit contributions | |
disparate | -6.439 |
blatant | -6.172 |
relentless | -6.162 |
totality | -6.080 |
genuine | -6.046 |
Token | The |
Token ID | 383 |
Feature activation | -9.93e+00 |
Pos logit contributions | |
modern | +28.368 |
various | +28.271 |
newer | +28.152 |
many | +27.753 |
those | +27.670 |
Neg logit contributions | |
aga | -14.233 |
ire | -12.882 |
u | -12.802 |
iev | -12.723 |
ée | -12.487 |
Token | power |
Token ID | 1176 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
various | +29.241 |
newer | +29.209 |
disparate | +28.968 |
modern | +28.916 |
relentless | +28.615 |
Neg logit contributions | |
aga | -12.641 |
u | -12.586 |
ire | -11.795 |
ong | -11.678 |
ée | -11.619 |
Token | levels |
Token ID | 2974 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
u | +0.796 |
- | +0.775 |
ine | +0.725 |
ab | +0.710 |
aga | +0.707 |
Neg logit contributions | |
disparate | -0.885 |
blatant | -0.854 |
relentless | -0.835 |
newer | -0.832 |
genuine | -0.828 |
Token | required |
Token ID | 2672 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
disparate | +3.391 |
blatant | +3.303 |
relentless | +3.270 |
genuine | +3.252 |
newer | +3.245 |
Neg logit contributions | |
u | -2.011 |
- | -1.857 |
ine | -1.830 |
ire | -1.816 |
aga | -1.811 |
Token | for |
Token ID | 329 |
Feature activation | -9.21e+00 |
Pos logit contributions | |
disparate | +4.381 |
blatant | +4.270 |
relentless | +4.232 |
totality | +4.200 |
newer | +4.196 |
Neg logit contributions | |
u | -2.698 |
- | -2.478 |
ong | -2.451 |
ire | -2.448 |
ine | -2.438 |
Token | breaking |
Token ID | 7163 |
Feature activation | +7.38e-01 |
Pos logit contributions | |
various | +28.385 |
newer | +27.966 |
disparate | +27.956 |
modern | +27.949 |
genuine | +27.682 |
Neg logit contributions | |
u | -12.266 |
aga | -11.678 |
ire | -11.672 |
ong | -11.376 |
iev | -11.284 |
Token | been |
Token ID | 587 |
Feature activation | -4.09e+00 |
Pos logit contributions | |
disparate | +8.498 |
newer | +8.238 |
relentless | +8.160 |
genuine | +8.046 |
totality | +8.027 |
Neg logit contributions | |
u | -8.622 |
aga | -8.112 |
ire | -8.112 |
id | -8.007 |
ine | -8.000 |
Token | filed |
Token ID | 5717 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
disparate | +11.753 |
newer | +11.390 |
relentless | +11.202 |
genuine | +11.199 |
blatant | +11.185 |
Neg logit contributions | |
u | -10.205 |
aga | -9.560 |
ire | -9.520 |
ine | -9.395 |
ong | -9.291 |
Token | in |
Token ID | 287 |
Feature activation | -2.97e+00 |
Pos logit contributions | |
u | +2.177 |
- | +2.130 |
. | +2.075 |
ine | +2.028 |
ia | +1.996 |
Neg logit contributions | |
disparate | -2.857 |
venerable | -2.824 |
genuine | -2.787 |
newer | -2.770 |
gradual | -2.763 |
Token | 2006 |
Token ID | 4793 |
Feature activation | +2.59e+00 |
Pos logit contributions | |
disparate | +6.994 |
newer | +6.773 |
genuine | +6.663 |
relentless | +6.592 |
gradual | +6.488 |
Neg logit contributions | |
u | -9.219 |
aga | -8.722 |
- | -8.647 |
ine | -8.625 |
id | -8.578 |
Token | . |
Token ID | 13 |
Feature activation | -5.37e+00 |
Pos logit contributions | |
- | +6.220 |
. | +6.190 |
u | +6.118 |
id | +5.729 |
ia | +5.599 |
Neg logit contributions | |
disparate | -6.341 |
venerable | -6.258 |
gradual | -6.147 |
newer | -6.109 |
genuine | -6.043 |
Token | The |
Token ID | 383 |
Feature activation | -7.44e+00 |
Pos logit contributions | |
disparate | +16.669 |
newer | +16.368 |
various | +16.217 |
genuine | +16.200 |
blatant | +16.116 |
Neg logit contributions | |
u | -10.267 |
aga | -9.840 |
ire | -9.662 |
ong | -9.417 |
ine | -9.387 |
Token | report |
Token ID | 989 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
disparate | +23.718 |
newer | +23.302 |
various | +23.188 |
blatant | +23.084 |
genuine | +23.029 |
Neg logit contributions | |
u | -11.843 |
aga | -11.449 |
ire | -11.106 |
ong | -10.822 |
iev | -10.716 |
Token | showed |
Token ID | 3751 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
u | +4.784 |
- | +4.690 |
id | +4.450 |
ire | +4.418 |
ia | +4.395 |
Neg logit contributions | |
disparate | -4.274 |
newer | -4.123 |
relentless | -3.978 |
venerable | -3.954 |
gradual | -3.935 |
Token | that |
Token ID | 326 |
Feature activation | -8.40e+00 |
Pos logit contributions | |
disparate | +11.739 |
newer | +11.525 |
genuine | +11.300 |
relentless | +11.295 |
totality | +11.184 |
Neg logit contributions | |
u | -8.270 |
ire | -7.607 |
ine | -7.503 |
aga | -7.468 |
- | -7.428 |
Token | when |
Token ID | 618 |
Feature activation | -4.51e+00 |
Pos logit contributions | |
disparate | +28.037 |
various | +27.676 |
newer | +27.518 |
genuine | +27.288 |
blatant | +27.267 |
Neg logit contributions | |
u | -10.890 |
aga | -10.430 |
ire | -10.143 |
ong | -9.938 |
iev | -9.776 |
Token | Josh |
Token ID | 8518 |
Feature activation | +5.24e+00 |
Pos logit contributions | |
disparate | +14.542 |
newer | +14.169 |
relentless | +14.037 |
genuine | +14.012 |
blatant | +13.970 |
Neg logit contributions | |
u | -9.864 |
aga | -9.138 |
ire | -9.128 |
ine | -8.983 |
id | -8.856 |