Token | , |
Token ID | 11 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
uala | +0.966 |
eni | +0.854 |
itton | +0.748 |
atin | +0.721 |
Devi | +0.718 |
Neg logit contributions | |
antioxid | -0.676 |
annoyance | -0.662 |
pleas | -0.655 |
Rate | -0.639 |
± | -0.635 |
Token | and |
Token ID | 290 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
antioxid | +0.506 |
annoyance | +0.493 |
pleas | +0.486 |
Rate | +0.473 |
± | +0.469 |
Neg logit contributions | |
uala | -0.925 |
eni | -0.827 |
itton | -0.735 |
atin | -0.711 |
Devi | -0.708 |
Token | J |
Token ID | 449 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
antioxid | +1.035 |
annoyance | +1.012 |
pleas | +1.000 |
Rate | +0.972 |
± | +0.968 |
Neg logit contributions | |
uala | -1.610 |
eni | -1.428 |
itton | -1.260 |
atin | -1.215 |
Devi | -1.206 |
Token | . |
Token ID | 13 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
antioxid | +1.153 |
annoyance | +1.138 |
pleas | +1.120 |
Rate | +1.102 |
± | +1.097 |
Neg logit contributions | |
uala | -1.581 |
eni | -1.380 |
itton | -1.218 |
Devi | -1.180 |
� | -1.173 |
Token | J |
Token ID | 41 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
Rate | +4.768 |
annoyance | +4.718 |
pleas | +4.659 |
\\\\\\\\ | +4.628 |
± | +4.619 |
Neg logit contributions | |
uala | -10.669 |
eni | -9.261 |
atin | -8.705 |
itton | -8.636 |
ignty | -8.279 |
Token | . |
Token ID | 13 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
antioxid | +2.862 |
± | +2.847 |
annoyance | +2.827 |
pleas | +2.808 |
Rate | +2.770 |
Neg logit contributions | |
uala | -5.353 |
eni | -4.697 |
itton | -4.222 |
� | -4.128 |
Devi | -4.084 |
Token | B |
Token ID | 347 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
Interest | +4.959 |
± | +4.885 |
¯ | +4.760 |
annoyance | +4.698 |
pleas | +4.697 |
Neg logit contributions | |
uala | -11.536 |
eni | -10.217 |
itton | -9.635 |
� | -9.617 |
atin | -9.492 |
Token | area |
Token ID | 20337 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
gery | +3.696 |
Interest | +3.686 |
± | +3.686 |
Rate | +3.592 |
ranks | +3.554 |
Neg logit contributions | |
uala | -8.365 |
� | -7.378 |
Devi | -7.335 |
eni | -7.254 |
subdiv | -6.617 |
Token | . |
Token ID | 13 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
antioxid | +0.718 |
annoyance | +0.701 |
pleas | +0.692 |
Rate | +0.676 |
± | +0.670 |
Neg logit contributions | |
uala | -1.117 |
eni | -0.992 |
itton | -0.874 |
atin | -0.842 |
Devi | -0.839 |
Token | When |
Token ID | 1649 |
Feature activation | +1.93e-02 |
Pos logit contributions | |
antioxid | +0.620 |
annoyance | +0.602 |
pleas | +0.594 |
Rate | +0.578 |
\\\\\\\\ | +0.573 |
Neg logit contributions | |
uala | -0.996 |
eni | -0.887 |
itton | -0.780 |
atin | -0.756 |
Devi | -0.755 |
Token | you |
Token ID | 345 |
Feature activation | -6.19e-01 |
Pos logit contributions | |
antioxid | +0.057 |
annoyance | +0.056 |
pleas | +0.055 |
Rate | +0.054 |
\\\\\\\\ | +0.053 |
Neg logit contributions | |
uala | -0.102 |
eni | -0.092 |
itton | -0.081 |
atin | -0.079 |
Devi | -0.078 |
Token |
|
Token ID | 198 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
uala | +1.040 |
eni | +0.922 |
itton | +0.815 |
atin | +0.789 |
Devi | +0.781 |
Neg logit contributions | |
antioxid | -0.663 |
annoyance | -0.649 |
pleas | -0.640 |
Rate | -0.621 |
gery | -0.616 |
Token |
|
Token ID | 198 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
antioxid | +1.157 |
annoyance | +1.129 |
pleas | +1.115 |
Rate | +1.087 |
± | +1.078 |
Neg logit contributions | |
uala | -1.744 |
eni | -1.546 |
itton | -1.358 |
atin | -1.311 |
Devi | -1.305 |
Token | T |
Token ID | 51 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
uala | +0.791 |
eni | +0.704 |
itton | +0.618 |
atin | +0.601 |
nil | +0.599 |
Neg logit contributions | |
antioxid | -0.486 |
annoyance | -0.472 |
pleas | -0.464 |
gery | -0.444 |
regression | -0.443 |
Token | . |
Token ID | 13 |
Feature activation | +8.63e-01 |
Pos logit contributions | |
uala | +1.007 |
eni | +0.890 |
itton | +0.774 |
atin | +0.746 |
Devi | +0.730 |
Neg logit contributions | |
antioxid | -0.740 |
annoyance | -0.723 |
pleas | -0.717 |
Rate | -0.699 |
---------- | -0.692 |
Token | J |
Token ID | 41 |
Feature activation | +6.58e-01 |
Pos logit contributions | |
antioxid | +2.703 |
annoyance | +2.639 |
pleas | +2.607 |
Rate | +2.589 |
± | +2.557 |
Neg logit contributions | |
uala | -4.379 |
eni | -3.879 |
itton | -3.423 |
atin | -3.297 |
Devi | -3.264 |
Token | . |
Token ID | 13 |
Feature activation | +2.15e+00 |
Pos logit contributions | |
antioxid | +1.876 |
± | +1.815 |
annoyance | +1.806 |
Rate | +1.802 |
pleas | +1.796 |
Neg logit contributions | |
uala | -3.444 |
eni | -3.053 |
itton | -2.684 |
� | -2.641 |
Devi | -2.622 |
Token | Osh |
Token ID | 46614 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
± | +6.034 |
¯ | +5.938 |
Rate | +5.801 |
Interest | +5.671 |
antioxid | +5.655 |
Neg logit contributions | |
uala | -10.744 |
eni | -9.819 |
itton | -8.753 |
ignty | -8.513 |
uesday | -8.436 |
Token | ie |
Token ID | 494 |
Feature activation | +6.91e-01 |
Pos logit contributions | |
antioxid | +4.468 |
annoyance | +4.398 |
± | +4.364 |
pleas | +4.362 |
Rate | +4.357 |
Neg logit contributions | |
uala | -5.146 |
eni | -4.476 |
itton | -3.895 |
Devi | -3.744 |
� | -3.711 |
Token |
|
Token ID | 198 |
Feature activation | -4.75e-02 |
Pos logit contributions | |
antioxid | +2.084 |
annoyance | +2.031 |
pleas | +2.009 |
± | +1.981 |
Rate | +1.966 |
Neg logit contributions | |
uala | -3.589 |
eni | -3.209 |
itton | -2.834 |
Devi | -2.736 |
atin | -2.731 |
Token |
|
Token ID | 198 |
Feature activation | -2.26e-01 |
Pos logit contributions | |
uala | +0.224 |
eni | +0.197 |
itton | +0.169 |
atin | +0.165 |
Devi | +0.165 |
Neg logit contributions | |
antioxid | -0.172 |
annoyance | -0.165 |
pleas | -0.160 |
\\\\\\\\ | -0.159 |
reven | -0.157 |
Token | Nick |
Token ID | 23609 |
Feature activation | -6.50e-01 |
Pos logit contributions | |
uala | +1.153 |
eni | +1.025 |
itton | +0.898 |
atin | +0.876 |
nil | +0.876 |
Neg logit contributions | |
antioxid | -0.721 |
annoyance | -0.699 |
pleas | -0.687 |
gery | -0.657 |
reven | -0.656 |
Token | of |
Token ID | 286 |
Feature activation | +4.84e-01 |
Pos logit contributions | |
uala | +0.919 |
eni | +0.828 |
itton | +0.732 |
atin | +0.721 |
Devi | +0.715 |
Neg logit contributions | |
antioxid | -0.464 |
annoyance | -0.447 |
pleas | -0.439 |
Rate | -0.429 |
gery | -0.423 |
Token | Survivor |
Token ID | 23740 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
antioxid | +1.426 |
annoyance | +1.401 |
pleas | +1.384 |
Rate | +1.345 |
± | +1.338 |
Neg logit contributions | |
uala | -2.558 |
eni | -2.287 |
itton | -2.030 |
atin | -1.957 |
Devi | -1.943 |
Token | San |
Token ID | 2986 |
Feature activation | +5.16e-01 |
Pos logit contributions | |
antioxid | +0.419 |
annoyance | +0.406 |
pleas | +0.399 |
Rate | +0.389 |
± | +0.384 |
Neg logit contributions | |
uala | -0.840 |
eni | -0.754 |
itton | -0.674 |
atin | -0.652 |
Devi | -0.651 |
Token | Juan |
Token ID | 16852 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
antioxid | +1.616 |
annoyance | +1.584 |
pleas | +1.568 |
Rate | +1.530 |
± | +1.523 |
Neg logit contributions | |
uala | -2.631 |
eni | -2.339 |
itton | -2.071 |
atin | -1.990 |
Devi | -1.983 |
Token | Del |
Token ID | 4216 |
Feature activation | +8.91e-01 |
Pos logit contributions | |
antioxid | +1.254 |
annoyance | +1.225 |
pleas | +1.215 |
Rate | +1.182 |
± | +1.177 |
Neg logit contributions | |
uala | -1.928 |
eni | -1.716 |
itton | -1.511 |
atin | -1.452 |
Devi | -1.444 |
Token | Sur |
Token ID | 4198 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
annoyance | +2.517 |
antioxid | +2.515 |
pleas | +2.493 |
Rate | +2.479 |
± | +2.450 |
Neg logit contributions | |
uala | -4.673 |
eni | -4.137 |
itton | -3.708 |
� | -3.641 |
Devi | -3.576 |
Token | featuring |
Token ID | 9593 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
annoyance | +5.528 |
pleas | +5.467 |
Interest | +5.429 |
± | +5.327 |
antioxid | +5.306 |
Neg logit contributions | |
uala | -10.990 |
eni | -9.865 |
itton | -8.969 |
� | -8.827 |
ignty | -8.554 |
Token | Coach |
Token ID | 16393 |
Feature activation | -4.93e-01 |
Pos logit contributions | |
antioxid | +1.081 |
annoyance | +1.057 |
pleas | +1.045 |
Rate | +1.010 |
± | +1.007 |
Neg logit contributions | |
uala | -1.932 |
eni | -1.725 |
itton | -1.532 |
atin | -1.479 |
Devi | -1.470 |
Token | ( |
Token ID | 357 |
Feature activation | -3.66e-01 |
Pos logit contributions | |
uala | +2.487 |
eni | +2.195 |
itton | +1.933 |
Devi | +1.901 |
atin | +1.885 |
Neg logit contributions | |
antioxid | -1.590 |
annoyance | -1.536 |
pleas | -1.519 |
Rate | -1.478 |
---------- | -1.461 |
Token | Surv |
Token ID | 34652 |
Feature activation | -4.17e-01 |
Pos logit contributions | |
uala | +1.802 |
eni | +1.603 |
itton | +1.396 |
atin | +1.369 |
Devi | +1.355 |
Neg logit contributions | |
antioxid | -1.224 |
annoyance | -1.181 |
pleas | -1.174 |
± | -1.125 |
gery | -1.118 |
Token | iv |
Token ID | 452 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
uala | +1.790 |
eni | +1.574 |
itton | +1.362 |
atin | +1.301 |
Devi | +1.282 |
Neg logit contributions | |
antioxid | -1.649 |
annoyance | -1.608 |
pleas | -1.587 |
\\\\\\\\ | -1.557 |
Rate | -1.553 |
Token |
|
Token ID | 198 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
antioxid | +0.007 |
annoyance | +0.007 |
pleas | +0.007 |
Rate | +0.006 |
\\\\\\\\ | +0.006 |
Neg logit contributions | |
uala | -0.010 |
eni | -0.009 |
itton | -0.008 |
Devi | -0.008 |
atin | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -9.71e-02 |
Pos logit contributions | |
uala | +1.464 |
eni | +1.287 |
itton | +1.092 |
Devi | +1.067 |
nil | +1.067 |
Neg logit contributions | |
antioxid | -1.206 |
annoyance | -1.154 |
pleas | -1.107 |
reven | -1.103 |
\\\\\\\\ | -1.100 |
Token | Among |
Token ID | 14311 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
uala | +0.470 |
eni | +0.416 |
itton | +0.360 |
atin | +0.349 |
� | +0.347 |
Neg logit contributions | |
antioxid | -0.337 |
annoyance | -0.327 |
pleas | -0.320 |
regression | -0.312 |
\\\\\\\\ | -0.310 |
Token | those |
Token ID | 883 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
antioxid | +0.782 |
annoyance | +0.759 |
pleas | +0.747 |
Rate | +0.730 |
± | +0.723 |
Neg logit contributions | |
uala | -1.436 |
eni | -1.285 |
itton | -1.141 |
atin | -1.103 |
Devi | -1.100 |
Token | ens |
Token ID | 3140 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
uala | +0.773 |
eni | +0.684 |
itton | +0.593 |
Devi | +0.577 |
atin | +0.575 |
Neg logit contributions | |
antioxid | -0.534 |
annoyance | -0.513 |
\\\\\\\\ | -0.509 |
Rate | -0.504 |
pleas | -0.502 |
Token | n |
Token ID | 77 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
antioxid | +1.225 |
pleas | +1.200 |
annoyance | +1.199 |
Rate | +1.162 |
---------- | +1.155 |
Neg logit contributions | |
uala | -1.756 |
eni | -1.552 |
itton | -1.360 |
Devi | -1.310 |
atin | -1.307 |
Token | ared |
Token ID | 1144 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
± | +5.320 |
pleas | +5.220 |
gery | +5.156 |
hed | +5.065 |
Interest | +4.978 |
Neg logit contributions | |
uala | -10.554 |
eni | -9.403 |
� | -9.116 |
Devi | -8.709 |
subdiv | -8.288 |
Token | by |
Token ID | 416 |
Feature activation | +1.65e-01 |
Pos logit contributions | |
pleas | +3.533 |
antioxid | +3.414 |
annoyance | +3.410 |
± | +3.268 |
gery | +3.222 |
Neg logit contributions | |
uala | -8.182 |
eni | -7.277 |
itton | -6.600 |
atin | -6.466 |
� | -6.404 |
Token | the |
Token ID | 262 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
antioxid | +0.510 |
annoyance | +0.499 |
pleas | +0.493 |
Rate | +0.478 |
± | +0.475 |
Neg logit contributions | |
uala | -0.853 |
eni | -0.760 |
itton | -0.672 |
atin | -0.649 |
Devi | -0.646 |
Token | wide |
Token ID | 3094 |
Feature activation | -6.89e-01 |
Pos logit contributions | |
antioxid | +0.556 |
annoyance | +0.541 |
pleas | +0.534 |
Rate | +0.522 |
± | +0.517 |
Neg logit contributions | |
uala | -0.908 |
eni | -0.808 |
itton | -0.714 |
atin | -0.689 |
Devi | -0.687 |
Token | - |
Token ID | 12 |
Feature activation | -3.65e-01 |
Pos logit contributions | |
uala | +3.300 |
eni | +2.939 |
itton | +2.554 |
atin | +2.463 |
Devi | +2.450 |
Neg logit contributions | |
antioxid | -2.354 |
annoyance | -2.219 |
ONSORED | -2.217 |
pleas | -2.212 |
\\\\\\\\ | -2.212 |
Token | 's |
Token ID | 338 |
Feature activation | +4.71e-01 |
Pos logit contributions | |
antioxid | +1.215 |
annoyance | +1.179 |
pleas | +1.160 |
Rate | +1.130 |
± | +1.118 |
Neg logit contributions | |
uala | -2.366 |
eni | -2.123 |
itton | -1.890 |
atin | -1.833 |
Devi | -1.825 |
Token | recently |
Token ID | 2904 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
antioxid | +1.362 |
annoyance | +1.326 |
pleas | +1.309 |
Rate | +1.272 |
± | +1.261 |
Neg logit contributions | |
uala | -2.529 |
eni | -2.262 |
itton | -2.012 |
atin | -1.947 |
Devi | -1.940 |
Token | reached |
Token ID | 4251 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
antioxid | +0.509 |
annoyance | +0.492 |
pleas | +0.483 |
Rate | +0.476 |
\\\\\\\\ | +0.475 |
Neg logit contributions | |
uala | -0.873 |
eni | -0.782 |
itton | -0.690 |
atin | -0.668 |
Devi | -0.666 |
Token | a |
Token ID | 257 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
antioxid | +3.850 |
annoyance | +3.842 |
pleas | +3.789 |
± | +3.683 |
regression | +3.647 |
Neg logit contributions | |
uala | -7.724 |
eni | -6.954 |
itton | -6.211 |
� | -6.018 |
Devi | -5.970 |
Token | new |
Token ID | 649 |
Feature activation | +9.87e-01 |
Pos logit contributions | |
antioxid | +3.882 |
annoyance | +3.850 |
pleas | +3.848 |
regression | +3.720 |
± | +3.701 |
Neg logit contributions | |
uala | -6.989 |
eni | -6.273 |
itton | -5.572 |
atin | -5.428 |
� | -5.345 |
Token | level |
Token ID | 1241 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
antioxid | +2.778 |
annoyance | +2.724 |
pleas | +2.685 |
Rate | +2.591 |
± | +2.591 |
Neg logit contributions | |
uala | -5.352 |
eni | -4.795 |
itton | -4.289 |
atin | -4.153 |
Devi | -4.117 |
Token | , |
Token ID | 11 |
Feature activation | +5.63e-01 |
Pos logit contributions | |
annoyance | +5.037 |
pleas | +5.036 |
antioxid | +5.000 |
regression | +4.876 |
± | +4.782 |
Neg logit contributions | |
uala | -11.599 |
eni | -10.268 |
itton | -9.461 |
� | -9.149 |
atin | -8.997 |
Token | thanks |
Token ID | 5176 |
Feature activation | +5.17e-01 |
Pos logit contributions | |
antioxid | +1.501 |
annoyance | +1.456 |
pleas | +1.435 |
Rate | +1.394 |
---------- | +1.378 |
Neg logit contributions | |
uala | -3.149 |
eni | -2.831 |
itton | -2.532 |
atin | -2.454 |
Devi | -2.447 |
Token | to |
Token ID | 284 |
Feature activation | +4.41e-02 |
Pos logit contributions | |
antioxid | +1.163 |
annoyance | +1.120 |
pleas | +1.114 |
± | +1.055 |
Rate | +1.054 |
Neg logit contributions | |
uala | -3.112 |
eni | -2.805 |
itton | -2.536 |
atin | -2.468 |
Devi | -2.457 |
Token | the |
Token ID | 262 |
Feature activation | +8.41e-02 |
Pos logit contributions | |
antioxid | +0.135 |
annoyance | +0.131 |
pleas | +0.130 |
Rate | +0.127 |
---------- | +0.126 |
Neg logit contributions | |
uala | -0.229 |
eni | -0.204 |
itton | -0.181 |
atin | -0.175 |
Devi | -0.174 |
Token | health |
Token ID | 1535 |
Feature activation | -3.42e-01 |
Pos logit contributions | |
antioxid | +0.264 |
annoyance | +0.256 |
pleas | +0.252 |
Rate | +0.249 |
\\\\\\\\ | +0.247 |
Neg logit contributions | |
uala | -0.431 |
eni | -0.383 |
itton | -0.338 |
atin | -0.325 |
Devi | -0.325 |
Token | Please |
Token ID | 4222 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
antioxid | +1.640 |
annoyance | +1.591 |
pleas | +1.568 |
Rate | +1.516 |
± | +1.503 |
Neg logit contributions | |
uala | -3.830 |
eni | -3.459 |
itton | -3.107 |
atin | -3.013 |
Devi | -3.002 |
Token | re |
Token ID | 302 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
pleas | +3.773 |
± | +3.651 |
antioxid | +3.574 |
regression | +3.447 |
Rate | +3.446 |
Neg logit contributions | |
uala | -10.867 |
eni | -9.899 |
� | -9.151 |
itton | -8.853 |
ignty | -8.783 |
Token | - |
Token ID | 12 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
pleas | +2.731 |
---------- | +2.706 |
± | +2.703 |
annoyance | +2.686 |
Rate | +2.662 |
Neg logit contributions | |
uala | -5.593 |
eni | -4.943 |
itton | -4.526 |
� | -4.370 |
Devi | -4.299 |
Token | enter |
Token ID | 9255 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
Rate | +4.344 |
pleas | +4.319 |
---------- | +4.309 |
gery | +4.294 |
annoyance | +4.277 |
Neg logit contributions | |
uala | -4.054 |
eni | -3.340 |
itton | -2.982 |
Devi | -2.829 |
� | -2.815 |
Token | . |
Token ID | 13 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
pleas | +4.145 |
± | +4.072 |
---------- | +3.930 |
Rate | +3.898 |
gery | +3.897 |
Neg logit contributions | |
uala | -8.281 |
eni | -7.329 |
itton | -6.753 |
� | -6.498 |
atin | -6.454 |
Token | You |
Token ID | 921 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
antioxid | +2.848 |
pleas | +2.809 |
annoyance | +2.807 |
---------- | +2.779 |
± | +2.770 |
Neg logit contributions | |
uala | -10.148 |
eni | -9.326 |
itton | -8.594 |
atin | -8.241 |
� | -8.156 |
Token | must |
Token ID | 1276 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
pleas | +4.067 |
± | +3.827 |
---------- | +3.821 |
annoyance | +3.802 |
antioxid | +3.729 |
Neg logit contributions | |
uala | -12.527 |
eni | -11.460 |
� | -10.433 |
itton | -10.309 |
atin | -10.114 |
Token | select |
Token ID | 2922 |
Feature activation | +3.40e-01 |
Pos logit contributions | |
pleas | +3.703 |
± | +3.567 |
---------- | +3.529 |
antioxid | +3.508 |
annoyance | +3.505 |
Neg logit contributions | |
uala | -6.333 |
eni | -5.543 |
� | -4.915 |
itton | -4.894 |
atin | -4.787 |
Token | a |
Token ID | 257 |
Feature activation | +9.56e-02 |
Pos logit contributions | |
antioxid | +0.982 |
annoyance | +0.951 |
pleas | +0.931 |
Rate | +0.910 |
\\\\\\\\ | +0.901 |
Neg logit contributions | |
uala | -1.833 |
eni | -1.646 |
itton | -1.460 |
atin | -1.414 |
Devi | -1.413 |
Token | newsletter |
Token ID | 13129 |
Feature activation | +4.94e-01 |
Pos logit contributions | |
antioxid | +0.070 |
annoyance | +0.060 |
pleas | +0.051 |
\\\\\\\\ | +0.049 |
Rate | +0.047 |
Neg logit contributions | |
uala | -0.716 |
eni | -0.668 |
itton | -0.618 |
Devi | -0.604 |
atin | -0.602 |
Token | to |
Token ID | 284 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
antioxid | +1.183 |
annoyance | +1.144 |
pleas | +1.122 |
Rate | +1.087 |
± | +1.071 |
Neg logit contributions | |
uala | -2.906 |
eni | -2.627 |
itton | -2.362 |
atin | -2.295 |
Devi | -2.288 |
Token | library |
Token ID | 5888 |
Feature activation | +5.22e-01 |
Pos logit contributions | |
uala | +0.604 |
eni | +0.542 |
itton | +0.479 |
atin | +0.468 |
Devi | +0.468 |
Neg logit contributions | |
antioxid | -0.340 |
annoyance | -0.333 |
pleas | -0.327 |
\\\\\\\\ | -0.322 |
Rate | -0.319 |
Token | together |
Token ID | 1978 |
Feature activation | +7.65e-01 |
Pos logit contributions | |
antioxid | +1.320 |
annoyance | +1.281 |
pleas | +1.263 |
Rate | +1.222 |
± | +1.212 |
Neg logit contributions | |
uala | -2.991 |
eni | -2.696 |
itton | -2.421 |
atin | -2.345 |
Devi | -2.338 |
Token | : |
Token ID | 25 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
antioxid | +2.098 |
annoyance | +2.052 |
pleas | +2.043 |
± | +1.979 |
Rate | +1.946 |
Neg logit contributions | |
uala | -4.192 |
eni | -3.757 |
itton | -3.368 |
atin | -3.241 |
Devi | -3.235 |
Token |
|
Token ID | 198 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
antioxid | +1.330 |
annoyance | +1.293 |
pleas | +1.282 |
Rate | +1.252 |
± | +1.251 |
Neg logit contributions | |
uala | -2.168 |
eni | -1.934 |
itton | -1.708 |
atin | -1.642 |
Devi | -1.636 |
Token |
|
Token ID | 198 |
Feature activation | +4.80e-01 |
Pos logit contributions | |
antioxid | +1.746 |
annoyance | +1.718 |
pleas | +1.714 |
Rate | +1.670 |
± | +1.668 |
Neg logit contributions | |
uala | -2.831 |
eni | -2.514 |
itton | -2.231 |
atin | -2.143 |
Devi | -2.136 |
Token | pub |
Token ID | 12984 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
antioxid | +1.317 |
annoyance | +1.281 |
pleas | +1.264 |
Rate | +1.232 |
± | +1.217 |
Neg logit contributions | |
uala | -2.649 |
eni | -2.376 |
itton | -2.123 |
atin | -2.053 |
Devi | -2.051 |
Token | struct |
Token ID | 2878 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
antioxid | +3.700 |
pleas | +3.550 |
annoyance | +3.509 |
± | +3.507 |
Rate | +3.448 |
Neg logit contributions | |
uala | -12.539 |
eni | -11.257 |
itton | -10.344 |
Devi | -10.030 |
� | -9.996 |
Token | Atomic |
Token ID | 28976 |
Feature activation | +3.60e-01 |
Pos logit contributions | |
antioxid | +3.465 |
± | +3.357 |
annoyance | +3.348 |
pleas | +3.344 |
Rate | +3.316 |
Neg logit contributions | |
uala | -4.949 |
eni | -4.336 |
itton | -3.886 |
� | -3.655 |
atin | -3.638 |
Token | < |
Token ID | 1279 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
antioxid | +0.800 |
annoyance | +0.772 |
pleas | +0.757 |
Rate | +0.724 |
\\\\\\\\ | +0.716 |
Neg logit contributions | |
uala | -2.177 |
eni | -1.977 |
itton | -1.780 |
atin | -1.734 |
Devi | -1.728 |
Token | T |
Token ID | 309 |
Feature activation | +6.23e-01 |
Pos logit contributions | |
antioxid | +1.567 |
annoyance | +1.532 |
pleas | +1.515 |
Rate | +1.475 |
± | +1.468 |
Neg logit contributions | |
uala | -2.579 |
eni | -2.289 |
itton | -2.028 |
atin | -1.953 |
Devi | -1.945 |
Token | > |
Token ID | 1875 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
antioxid | +0.884 |
annoyance | +0.851 |
pleas | +0.831 |
Rate | +0.793 |
± | +0.790 |
Neg logit contributions | |
uala | -4.239 |
eni | -3.858 |
itton | -3.554 |
atin | -3.447 |
Devi | -3.441 |
Token | party |
Token ID | 2151 |
Feature activation | -6.03e-01 |
Pos logit contributions | |
uala | +3.449 |
eni | +3.162 |
itton | +2.798 |
atin | +2.712 |
Devi | +2.709 |
Neg logit contributions | |
antioxid | -1.772 |
pleas | -1.679 |
Rate | -1.667 |
\\\\\\\\ | -1.662 |
annoyance | -1.661 |
Token | . |
Token ID | 13 |
Feature activation | -3.47e-01 |
Pos logit contributions | |
uala | +2.864 |
eni | +2.555 |
itton | +2.209 |
atin | +2.146 |
Devi | +2.146 |
Neg logit contributions | |
antioxid | -2.089 |
annoyance | -2.012 |
Rate | -1.979 |
pleas | -1.975 |
\\\\\\\\ | -1.946 |
Token |
|
Token ID | 198 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
uala | +1.701 |
eni | +1.512 |
itton | +1.308 |
Devi | +1.296 |
atin | +1.280 |
Neg logit contributions | |
antioxid | -1.177 |
annoyance | -1.140 |
pleas | -1.115 |
\\\\\\\\ | -1.076 |
Rate | -1.068 |
Token |
|
Token ID | 198 |
Feature activation | -4.17e-01 |
Pos logit contributions | |
uala | +1.553 |
eni | +1.368 |
itton | +1.156 |
nil | +1.135 |
atin | +1.129 |
Neg logit contributions | |
antioxid | -1.300 |
annoyance | -1.239 |
\\\\\\\\ | -1.187 |
pleas | -1.186 |
reven | -1.184 |
Token | J |
Token ID | 41 |
Feature activation | +9.65e-02 |
Pos logit contributions | |
uala | +1.997 |
eni | +1.795 |
itton | +1.528 |
nil | +1.523 |
atin | +1.495 |
Neg logit contributions | |
antioxid | -1.474 |
annoyance | -1.419 |
pleas | -1.376 |
regression | -1.341 |
reven | -1.340 |
Token | ou |
Token ID | 280 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
antioxid | +0.385 |
annoyance | +0.378 |
pleas | +0.375 |
Rate | +0.367 |
± | +0.364 |
Neg logit contributions | |
uala | -0.413 |
eni | -0.359 |
itton | -0.307 |
atin | -0.294 |
Devi | -0.291 |
Token | ko |
Token ID | 7204 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
antioxid | +7.659 |
annoyance | +7.572 |
gery | +7.477 |
pleas | +7.473 |
± | +7.417 |
Neg logit contributions | |
uala | -7.964 |
eni | -6.688 |
itton | -6.078 |
� | -5.943 |
Devi | -5.819 |
Token | Ja |
Token ID | 13790 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
antioxid | +0.369 |
annoyance | +0.361 |
pleas | +0.357 |
Rate | +0.349 |
± | +0.346 |
Neg logit contributions | |
uala | -0.504 |
eni | -0.445 |
itton | -0.388 |
atin | -0.374 |
Devi | -0.373 |
Token | as |
Token ID | 292 |
Feature activation | +4.94e-01 |
Pos logit contributions | |
antioxid | +0.855 |
annoyance | +0.838 |
pleas | +0.831 |
Rate | +0.814 |
± | +0.808 |
Neg logit contributions | |
uala | -0.903 |
eni | -0.785 |
itton | -0.671 |
atin | -0.641 |
Devi | -0.637 |
Token | kel |
Token ID | 7750 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
antioxid | +1.852 |
annoyance | +1.815 |
pleas | +1.796 |
Rate | +1.758 |
± | +1.747 |
Neg logit contributions | |
uala | -2.231 |
eni | -1.950 |
itton | -1.689 |
atin | -1.620 |
Devi | -1.613 |
Token | ain |
Token ID | 391 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
uala | +0.723 |
eni | +0.641 |
itton | +0.548 |
atin | +0.536 |
Devi | +0.521 |
Neg logit contributions | |
antioxid | -0.586 |
annoyance | -0.573 |
pleas | -0.569 |
Rate | -0.554 |
\\\\\\\\ | -0.550 |
Token | b |
Token ID | 275 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
uala | +0.760 |
eni | +0.678 |
itton | +0.597 |
Devi | +0.584 |
atin | +0.579 |
Neg logit contributions | |
antioxid | -0.448 |
annoyance | -0.431 |
pleas | -0.426 |
Rate | -0.422 |
\\\\\\\\ | -0.417 |
Token | iz |
Token ID | 528 |
Feature activation | +5.31e-01 |
Pos logit contributions | |
antioxid | +1.630 |
annoyance | +1.590 |
pleas | +1.570 |
Rate | +1.536 |
± | +1.523 |
Neg logit contributions | |
uala | -1.996 |
eni | -1.747 |
itton | -1.515 |
atin | -1.455 |
Devi | -1.444 |
Token | arro |
Token ID | 34852 |
Feature activation | -3.37e-01 |
Pos logit contributions | |
antioxid | +2.048 |
annoyance | +2.010 |
pleas | +1.990 |
Rate | +1.949 |
± | +1.936 |
Neg logit contributions | |
uala | -2.339 |
eni | -2.037 |
itton | -1.757 |
atin | -1.682 |
Devi | -1.675 |
Token | dé |
Token ID | 39073 |
Feature activation | +7.76e-01 |
Pos logit contributions | |
uala | +1.734 |
eni | +1.555 |
itton | +1.371 |
Devi | +1.329 |
atin | +1.327 |
Neg logit contributions | |
antioxid | -1.039 |
annoyance | -0.996 |
pleas | -0.984 |
Rate | -0.976 |
\\\\\\\\ | -0.964 |
Token | j |
Token ID | 73 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
antioxid | +2.783 |
annoyance | +2.759 |
pleas | +2.748 |
Rate | +2.705 |
gery | +2.668 |
Neg logit contributions | |
uala | -3.579 |
eni | -3.109 |
itton | -2.713 |
Devi | -2.624 |
atin | -2.581 |
Token | à |
Token ID | 24247 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
antioxid | +3.806 |
pleas | +3.731 |
annoyance | +3.711 |
± | +3.700 |
Rate | +3.602 |
Neg logit contributions | |
uala | -6.722 |
eni | -5.877 |
itton | -5.203 |
Devi | -5.110 |
� | -5.056 |
Token | v |
Token ID | 410 |
Feature activation | +4.29e-01 |
Pos logit contributions | |
pleas | +4.558 |
antioxid | +4.543 |
annoyance | +4.424 |
± | +4.294 |
gery | +4.289 |
Neg logit contributions | |
uala | -12.022 |
eni | -10.819 |
itton | -9.775 |
atin | -9.570 |
Devi | -9.434 |
Token | u |
Token ID | 84 |
Feature activation | +7.21e-02 |
Pos logit contributions | |
antioxid | +1.527 |
annoyance | +1.501 |
pleas | +1.489 |
Rate | +1.453 |
± | +1.443 |
Neg logit contributions | |
uala | -2.005 |
eni | -1.762 |
itton | -1.535 |
atin | -1.474 |
Devi | -1.473 |
Token | — |
Token ID | 960 |
Feature activation | +4.90e-01 |
Pos logit contributions | |
antioxid | +0.220 |
annoyance | +0.212 |
pleas | +0.210 |
Rate | +0.206 |
± | +0.203 |
Neg logit contributions | |
uala | -0.376 |
eni | -0.336 |
itton | -0.298 |
atin | -0.287 |
Devi | -0.286 |
Token | that |
Token ID | 5562 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
antioxid | +1.777 |
annoyance | +1.748 |
pleas | +1.733 |
Rate | +1.695 |
---------- | +1.682 |
Neg logit contributions | |
uala | -2.257 |
eni | -1.979 |
itton | -1.723 |
atin | -1.649 |
Devi | -1.645 |
Token | rare |
Token ID | 4071 |
Feature activation | -3.71e-01 |
Pos logit contributions | |
uala | +0.621 |
eni | +0.558 |
itton | +0.495 |
Devi | +0.480 |
atin | +0.480 |
Neg logit contributions | |
antioxid | -0.341 |
annoyance | -0.328 |
pleas | -0.325 |
Rate | -0.319 |
\\\\\\\\ | -0.317 |
Token | runs |
Token ID | 4539 |
Feature activation | +6.93e-01 |
Pos logit contributions | |
uala | +2.245 |
eni | +2.020 |
itton | +1.774 |
atin | +1.703 |
Devi | +1.700 |
Neg logit contributions | |
antioxid | -1.410 |
annoyance | -1.354 |
Rate | -1.325 |
\\\\\\\\ | -1.318 |
pleas | -1.316 |
Token | . |
Token ID | 13 |
Feature activation | -9.76e-02 |
Pos logit contributions | |
antioxid | +2.010 |
annoyance | +1.972 |
pleas | +1.959 |
± | +1.887 |
Rate | +1.880 |
Neg logit contributions | |
uala | -3.695 |
eni | -3.295 |
itton | -2.927 |
atin | -2.837 |
Devi | -2.824 |
Token | C |
Token ID | 327 |
Feature activation | +5.39e-01 |
Pos logit contributions | |
uala | +0.490 |
eni | +0.435 |
itton | +0.383 |
Devi | +0.374 |
atin | +0.371 |
Neg logit contributions | |
antioxid | -0.319 |
annoyance | -0.309 |
pleas | -0.304 |
Rate | -0.294 |
gery | -0.293 |
Token | . |
Token ID | 13 |
Feature activation | +9.07e-01 |
Pos logit contributions | |
antioxid | +1.819 |
annoyance | +1.783 |
pleas | +1.760 |
Rate | +1.717 |
± | +1.710 |
Neg logit contributions | |
uala | -2.623 |
eni | -2.317 |
itton | -2.028 |
atin | -1.956 |
Devi | -1.953 |
Token | J |
Token ID | 41 |
Feature activation | +6.99e-01 |
Pos logit contributions | |
antioxid | +2.890 |
annoyance | +2.850 |
pleas | +2.836 |
Rate | +2.787 |
---------- | +2.733 |
Neg logit contributions | |
uala | -4.543 |
eni | -4.045 |
itton | -3.543 |
atin | -3.422 |
Devi | -3.395 |
Token | . |
Token ID | 13 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
antioxid | +2.154 |
pleas | +2.111 |
annoyance | +2.109 |
± | +2.065 |
Rate | +2.061 |
Neg logit contributions | |
uala | -3.571 |
eni | -3.171 |
itton | -2.802 |
atin | -2.707 |
Devi | -2.694 |
Token | Anderson |
Token ID | 9918 |
Feature activation | +6.13e-01 |
Pos logit contributions | |
antioxid | +5.441 |
Interest | +5.309 |
pleas | +5.283 |
± | +5.250 |
Rate | +5.235 |
Neg logit contributions | |
uala | -10.392 |
eni | -9.398 |
itton | -8.414 |
ignty | -8.269 |
atin | -8.232 |
Token | , |
Token ID | 11 |
Feature activation | +6.09e-01 |
Pos logit contributions | |
antioxid | +1.806 |
annoyance | +1.768 |
pleas | +1.757 |
± | +1.697 |
Rate | +1.693 |
Neg logit contributions | |
uala | -3.251 |
eni | -2.896 |
itton | -2.568 |
atin | -2.489 |
Devi | -2.475 |
Token | Ju |
Token ID | 12585 |
Feature activation | +9.42e-01 |
Pos logit contributions | |
antioxid | +1.837 |
annoyance | +1.798 |
pleas | +1.777 |
Rate | +1.719 |
± | +1.711 |
Neg logit contributions | |
uala | -3.195 |
eni | -2.852 |
itton | -2.519 |
atin | -2.437 |
Devi | -2.421 |
Token | wan |
Token ID | 8149 |
Feature activation | +6.53e-01 |
Pos logit contributions | |
antioxid | +3.056 |
annoyance | +3.009 |
Rate | +2.954 |
pleas | +2.952 |
± | +2.917 |
Neg logit contributions | |
uala | -4.617 |
eni | -4.026 |
itton | -3.551 |
Devi | -3.457 |
� | -3.415 |
Token | Thompson |
Token ID | 11654 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
antioxid | +2.228 |
annoyance | +2.184 |
pleas | +2.177 |
Rate | +2.117 |
± | +2.107 |
Neg logit contributions | |
uala | -3.139 |
eni | -2.761 |
itton | -2.435 |
atin | -2.338 |
Devi | -2.330 |
Token | being |
Token ID | 852 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
antioxid | +1.389 |
annoyance | +1.354 |
pleas | +1.336 |
Rate | +1.299 |
± | +1.290 |
Neg logit contributions | |
uala | -2.580 |
eni | -2.309 |
itton | -2.053 |
atin | -1.986 |
Devi | -1.978 |
Token | active |
Token ID | 4075 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
uala | +0.921 |
eni | +0.826 |
itton | +0.730 |
Devi | +0.707 |
atin | +0.704 |
Neg logit contributions | |
antioxid | -0.541 |
annoyance | -0.530 |
pleas | -0.516 |
Rate | -0.512 |
\\\\\\\\ | -0.512 |
Token | : |
Token ID | 25 |
Feature activation | +2.66e-02 |
Pos logit contributions | |
antioxid | +0.960 |
annoyance | +0.937 |
pleas | +0.926 |
Rate | +0.902 |
± | +0.899 |
Neg logit contributions | |
uala | -1.531 |
eni | -1.361 |
itton | -1.201 |
atin | -1.159 |
Devi | -1.153 |
Token |
|
Token ID | 198 |
Feature activation | +3.61e-01 |
Pos logit contributions | |
antioxid | +0.088 |
annoyance | +0.085 |
pleas | +0.084 |
Rate | +0.082 |
± | +0.082 |
Neg logit contributions | |
uala | -0.132 |
eni | -0.117 |
itton | -0.103 |
atin | -0.099 |
Devi | -0.099 |
Token |
|
Token ID | 198 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
antioxid | +1.202 |
annoyance | +1.171 |
pleas | +1.154 |
Rate | +1.126 |
\\\\\\\\ | +1.115 |
Neg logit contributions | |
uala | -1.786 |
eni | -1.583 |
itton | -1.388 |
atin | -1.340 |
Devi | -1.335 |
Token | pub |
Token ID | 12984 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
antioxid | +1.175 |
annoyance | +1.149 |
pleas | +1.136 |
Rate | +1.104 |
± | +1.099 |
Neg logit contributions | |
uala | -1.725 |
eni | -1.528 |
itton | -1.340 |
atin | -1.292 |
Devi | -1.285 |
Token | struct |
Token ID | 2878 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
antioxid | +4.532 |
annoyance | +4.354 |
pleas | +4.329 |
± | +4.227 |
Rate | +4.166 |
Neg logit contributions | |
uala | -11.600 |
eni | -10.347 |
itton | -9.487 |
� | -9.142 |
Devi | -9.135 |
Token | Guard |
Token ID | 4932 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
antioxid | +3.139 |
annoyance | +3.031 |
pleas | +3.002 |
± | +2.956 |
Rate | +2.932 |
Neg logit contributions | |
uala | -5.413 |
eni | -4.829 |
itton | -4.321 |
atin | -4.155 |
� | -4.095 |
Token | { |
Token ID | 1391 |
Feature activation | -8.48e-02 |
Pos logit contributions | |
antioxid | +1.009 |
annoyance | +0.972 |
pleas | +0.955 |
Rate | +0.911 |
± | +0.902 |
Neg logit contributions | |
uala | -2.909 |
eni | -2.641 |
itton | -2.387 |
atin | -2.323 |
Devi | -2.316 |
Token | ... |
Token ID | 2644 |
Feature activation | -3.53e-01 |
Pos logit contributions | |
uala | +0.476 |
eni | +0.428 |
itton | +0.385 |
Devi | +0.373 |
atin | +0.372 |
Neg logit contributions | |
antioxid | -0.221 |
annoyance | -0.214 |
pleas | -0.212 |
\\\\\\\\ | -0.205 |
Rate | -0.204 |
Token | } |
Token ID | 1782 |
Feature activation | -1.56e-01 |
Pos logit contributions | |
uala | +1.857 |
eni | +1.672 |
itton | +1.480 |
Devi | +1.432 |
nil | +1.426 |
Neg logit contributions | |
antioxid | -1.029 |
annoyance | -1.002 |
pleas | -0.990 |
\\\\\\\\ | -0.963 |
Rate | -0.959 |
Token | Please |
Token ID | 4222 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
antioxid | +1.816 |
annoyance | +1.762 |
pleas | +1.741 |
Rate | +1.682 |
± | +1.673 |
Neg logit contributions | |
uala | -4.334 |
eni | -3.923 |
itton | -3.527 |
atin | -3.419 |
Devi | -3.402 |
Token | re |
Token ID | 302 |
Feature activation | +9.35e-01 |
Pos logit contributions | |
pleas | +3.662 |
antioxid | +3.529 |
± | +3.529 |
Rate | +3.376 |
regression | +3.354 |
Neg logit contributions | |
uala | -9.951 |
eni | -9.058 |
� | -8.280 |
itton | -8.101 |
Devi | -8.009 |
Token | - |
Token ID | 12 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
pleas | +2.524 |
---------- | +2.492 |
annoyance | +2.491 |
± | +2.490 |
Rate | +2.459 |
Neg logit contributions | |
uala | -5.057 |
eni | -4.472 |
itton | -4.079 |
� | -3.936 |
Devi | -3.878 |
Token | enter |
Token ID | 9255 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
Rate | +4.235 |
pleas | +4.213 |
---------- | +4.209 |
gery | +4.188 |
annoyance | +4.184 |
Neg logit contributions | |
uala | -3.939 |
eni | -3.253 |
itton | -2.903 |
Devi | -2.750 |
� | -2.730 |
Token | . |
Token ID | 13 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
pleas | +4.046 |
± | +3.967 |
---------- | +3.836 |
annoyance | +3.825 |
Rate | +3.808 |
Neg logit contributions | |
uala | -7.971 |
eni | -7.057 |
itton | -6.489 |
� | -6.241 |
atin | -6.198 |
Token | You |
Token ID | 921 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
antioxid | +2.835 |
annoyance | +2.807 |
pleas | +2.795 |
---------- | +2.759 |
± | +2.751 |
Neg logit contributions | |
uala | -10.003 |
eni | -9.204 |
itton | -8.477 |
atin | -8.131 |
� | -8.052 |
Token | must |
Token ID | 1276 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
pleas | +4.076 |
± | +3.868 |
---------- | +3.837 |
annoyance | +3.832 |
antioxid | +3.742 |
Neg logit contributions | |
uala | -12.163 |
eni | -11.138 |
� | -10.128 |
itton | -10.020 |
atin | -9.823 |
Token | select |
Token ID | 2922 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
pleas | +3.492 |
± | +3.374 |
---------- | +3.328 |
antioxid | +3.327 |
annoyance | +3.319 |
Neg logit contributions | |
uala | -5.880 |
eni | -5.141 |
� | -4.535 |
itton | -4.528 |
atin | -4.442 |
Token | a |
Token ID | 257 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
antioxid | +0.722 |
annoyance | +0.698 |
pleas | +0.680 |
Rate | +0.668 |
\\\\\\\\ | +0.664 |
Neg logit contributions | |
uala | -1.309 |
eni | -1.176 |
itton | -1.039 |
Devi | -1.008 |
atin | -1.007 |
Token | newsletter |
Token ID | 13129 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
uala | +0.086 |
eni | +0.080 |
itton | +0.074 |
Devi | +0.072 |
atin | +0.072 |
Neg logit contributions | |
antioxid | -0.009 |
annoyance | -0.008 |
pleas | -0.007 |
\\\\\\\\ | -0.007 |
Rate | -0.006 |
Token | to |
Token ID | 284 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
antioxid | +1.006 |
annoyance | +0.971 |
pleas | +0.951 |
Rate | +0.924 |
\\\\\\\\ | +0.912 |
Neg logit contributions | |
uala | -2.420 |
eni | -2.187 |
itton | -1.963 |
atin | -1.908 |
Devi | -1.902 |
Token |
|
Token ID | 198 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
antioxid | +2.057 |
pleas | +2.055 |
annoyance | +2.039 |
± | +2.009 |
Rate | +2.003 |
Neg logit contributions | |
uala | -3.533 |
eni | -3.139 |
itton | -2.808 |
atin | -2.695 |
Devi | -2.682 |
Token | Clinton |
Token ID | 16549 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
antioxid | +1.044 |
annoyance | +1.018 |
pleas | +1.004 |
Rate | +0.973 |
± | +0.970 |
Neg logit contributions | |
uala | -1.588 |
eni | -1.409 |
itton | -1.237 |
atin | -1.195 |
Devi | -1.188 |
Token | also |
Token ID | 635 |
Feature activation | +4.77e-01 |
Pos logit contributions | |
uala | +0.637 |
eni | +0.569 |
itton | +0.507 |
Devi | +0.492 |
atin | +0.490 |
Neg logit contributions | |
antioxid | -0.342 |
annoyance | -0.332 |
pleas | -0.323 |
Rate | -0.319 |
gery | -0.315 |
Token | tried |
Token ID | 3088 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
antioxid | +1.334 |
annoyance | +1.297 |
pleas | +1.278 |
Rate | +1.242 |
± | +1.230 |
Neg logit contributions | |
uala | -2.607 |
eni | -2.338 |
itton | -2.084 |
atin | -2.018 |
Devi | -2.011 |
Token | to |
Token ID | 284 |
Feature activation | +5.95e-02 |
Pos logit contributions | |
antioxid | +0.810 |
annoyance | +0.785 |
pleas | +0.774 |
Rate | +0.746 |
± | +0.739 |
Neg logit contributions | |
uala | -1.956 |
eni | -1.766 |
itton | -1.589 |
atin | -1.542 |
Devi | -1.537 |
Token | tri |
Token ID | 1333 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
antioxid | +0.205 |
annoyance | +0.197 |
pleas | +0.194 |
Rate | +0.191 |
\\\\\\\\ | +0.191 |
Neg logit contributions | |
uala | -0.288 |
eni | -0.255 |
itton | -0.225 |
atin | -0.214 |
Devi | -0.214 |
Token | ang |
Token ID | 648 |
Feature activation | +3.71e-01 |
Pos logit contributions | |
pleas | +5.445 |
gery | +5.428 |
annoyance | +5.320 |
ghazi | +5.225 |
± | +5.190 |
Neg logit contributions | |
uala | -10.301 |
eni | -9.022 |
itton | -8.018 |
� | -8.011 |
nil | -7.817 |
Token | ulate |
Token ID | 5039 |
Feature activation | +5.53e-01 |
Pos logit contributions | |
antioxid | +1.468 |
annoyance | +1.442 |
pleas | +1.428 |
Rate | +1.399 |
± | +1.392 |
Neg logit contributions | |
uala | -1.591 |
eni | -1.382 |
itton | -1.187 |
atin | -1.136 |
Devi | -1.131 |
Token | on |
Token ID | 319 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
antioxid | +1.560 |
annoyance | +1.527 |
pleas | +1.510 |
Rate | +1.454 |
± | +1.448 |
Neg logit contributions | |
uala | -3.004 |
eni | -2.695 |
itton | -2.403 |
atin | -2.325 |
Devi | -2.309 |
Token | the |
Token ID | 262 |
Feature activation | +2.59e-01 |
Pos logit contributions | |
uala | +0.062 |
eni | +0.055 |
itton | +0.048 |
Devi | +0.047 |
atin | +0.047 |
Neg logit contributions | |
antioxid | -0.037 |
annoyance | -0.036 |
pleas | -0.035 |
Rate | -0.035 |
\\\\\\\\ | -0.034 |
Token | Planned |
Token ID | 18451 |
Feature activation | +7.10e-01 |
Pos logit contributions | |
antioxid | +0.796 |
annoyance | +0.775 |
pleas | +0.765 |
Rate | +0.746 |
± | +0.739 |
Neg logit contributions | |
uala | -1.349 |
eni | -1.203 |
itton | -1.064 |
atin | -1.028 |
Devi | -1.025 |
Token | the |
Token ID | 262 |
Feature activation | +6.27e-01 |
Pos logit contributions | |
antioxid | +0.684 |
annoyance | +0.662 |
pleas | +0.655 |
Rate | +0.644 |
\\\\\\\\ | +0.640 |
Neg logit contributions | |
uala | -1.132 |
eni | -1.005 |
itton | -0.889 |
atin | -0.862 |
Devi | -0.860 |
Token | Organisation |
Token ID | 30801 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
antioxid | +1.984 |
annoyance | +1.938 |
pleas | +1.917 |
Rate | +1.860 |
± | +1.860 |
Neg logit contributions | |
uala | -3.196 |
eni | -2.837 |
itton | -2.508 |
atin | -2.420 |
Devi | -2.402 |
Token | for |
Token ID | 329 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
uala | +0.589 |
eni | +0.525 |
itton | +0.464 |
Devi | +0.454 |
atin | +0.449 |
Neg logit contributions | |
antioxid | -0.345 |
annoyance | -0.340 |
pleas | -0.332 |
\\\\\\\\ | -0.331 |
gery | -0.325 |
Token | Economic |
Token ID | 11279 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
antioxid | +1.786 |
annoyance | +1.695 |
pleas | +1.660 |
regression | +1.580 |
± | +1.567 |
Neg logit contributions | |
uala | -7.325 |
eni | -6.686 |
itton | -6.232 |
atin | -5.978 |
Devi | -5.953 |
Token | Co |
Token ID | 1766 |
Feature activation | +5.74e-01 |
Pos logit contributions | |
antioxid | +1.334 |
annoyance | +1.291 |
pleas | +1.271 |
Rate | +1.227 |
± | +1.214 |
Neg logit contributions | |
uala | -3.193 |
eni | -2.885 |
itton | -2.591 |
atin | -2.516 |
Devi | -2.509 |
Token | - |
Token ID | 12 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
antioxid | +1.647 |
annoyance | +1.602 |
pleas | +1.589 |
Rate | +1.578 |
± | +1.568 |
Neg logit contributions | |
uala | -3.105 |
eni | -2.731 |
itton | -2.452 |
� | -2.367 |
atin | -2.341 |
Token | operation |
Token ID | 27184 |
Feature activation | +6.67e-01 |
Pos logit contributions | |
Rate | +6.690 |
antioxid | +6.630 |
Interest | +6.460 |
annoyance | +6.430 |
pleas | +6.383 |
Neg logit contributions | |
uala | -9.632 |
eni | -8.061 |
itton | -7.364 |
Devi | -6.809 |
� | -6.786 |
Token | and |
Token ID | 290 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
antioxid | +1.887 |
annoyance | +1.842 |
pleas | +1.810 |
\\\\\\\\ | +1.752 |
Rate | +1.751 |
Neg logit contributions | |
uala | -3.614 |
eni | -3.258 |
itton | -2.883 |
Devi | -2.797 |
atin | -2.796 |
Token | Development |
Token ID | 7712 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
antioxid | +1.640 |
annoyance | +1.587 |
pleas | +1.584 |
\\\\\\\\ | +1.563 |
gery | +1.541 |
Neg logit contributions | |
uala | -1.785 |
eni | -1.566 |
itton | -1.315 |
Devi | -1.281 |
atin | -1.272 |
Token | ( |
Token ID | 357 |
Feature activation | -3.27e-01 |
Pos logit contributions | |
antioxid | +0.610 |
annoyance | +0.593 |
pleas | +0.585 |
Rate | +0.563 |
---------- | +0.560 |
Neg logit contributions | |
uala | -1.245 |
eni | -1.120 |
itton | -0.999 |
atin | -0.969 |
Devi | -0.966 |
Token | O |
Token ID | 46 |
Feature activation | -5.86e-01 |
Pos logit contributions | |
uala | +1.573 |
eni | +1.396 |
itton | +1.203 |
atin | +1.176 |
nil | +1.172 |
Neg logit contributions | |
antioxid | -1.103 |
annoyance | -1.074 |
pleas | -1.066 |
\\\\\\\\ | -1.046 |
reven | -1.039 |
Token | to |
Token ID | 284 |
Feature activation | +5.40e-02 |
Pos logit contributions | |
uala | +2.357 |
eni | +2.122 |
itton | +1.898 |
atin | +1.854 |
Devi | +1.845 |
Neg logit contributions | |
antioxid | -1.017 |
annoyance | -0.985 |
pleas | -0.965 |
Rate | -0.938 |
---------- | -0.927 |
Token | Box |
Token ID | 8315 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
antioxid | +0.155 |
annoyance | +0.151 |
pleas | +0.149 |
Rate | +0.144 |
---------- | +0.143 |
Neg logit contributions | |
uala | -0.291 |
eni | -0.260 |
itton | -0.231 |
atin | -0.225 |
Devi | -0.225 |
Token | : |
Token ID | 1058 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
antioxid | +0.049 |
annoyance | +0.048 |
pleas | +0.047 |
Rate | +0.045 |
\\\\\\\\ | +0.044 |
Neg logit contributions | |
uala | -0.117 |
eni | -0.105 |
itton | -0.095 |
atin | -0.092 |
Devi | -0.092 |
Token |
|
Token ID | 198 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
antioxid | +1.022 |
annoyance | +0.998 |
pleas | +0.987 |
Rate | +0.962 |
± | +0.956 |
Neg logit contributions | |
uala | -1.619 |
eni | -1.439 |
itton | -1.269 |
atin | -1.223 |
Devi | -1.219 |
Token |
|
Token ID | 198 |
Feature activation | +5.78e-01 |
Pos logit contributions | |
antioxid | +2.078 |
pleas | +2.057 |
annoyance | +2.053 |
± | +2.005 |
Rate | +2.002 |
Neg logit contributions | |
uala | -3.474 |
eni | -3.086 |
itton | -2.748 |
atin | -2.635 |
Devi | -2.626 |
Token | pub |
Token ID | 12984 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
antioxid | +1.833 |
annoyance | +1.790 |
pleas | +1.771 |
Rate | +1.739 |
---------- | +1.720 |
Neg logit contributions | |
uala | -2.936 |
eni | -2.606 |
itton | -2.302 |
Devi | -2.218 |
atin | -2.216 |
Token | struct |
Token ID | 2878 |
Feature activation | +8.64e-01 |
Pos logit contributions | |
antioxid | +4.008 |
pleas | +3.851 |
annoyance | +3.817 |
± | +3.761 |
Rate | +3.674 |
Neg logit contributions | |
uala | -11.951 |
eni | -10.663 |
itton | -9.760 |
� | -9.548 |
Devi | -9.446 |
Token | Own |
Token ID | 11744 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
antioxid | +2.525 |
annoyance | +2.434 |
pleas | +2.415 |
± | +2.397 |
Rate | +2.364 |
Neg logit contributions | |
uala | -4.606 |
eni | -4.087 |
itton | -3.666 |
� | -3.502 |
atin | -3.499 |
Token | ed |
Token ID | 276 |
Feature activation | +3.87e-01 |
Pos logit contributions | |
antioxid | +1.633 |
annoyance | +1.599 |
pleas | +1.586 |
Rate | +1.556 |
± | +1.547 |
Neg logit contributions | |
uala | -2.012 |
eni | -1.758 |
itton | -1.531 |
atin | -1.466 |
Devi | -1.460 |
Token | < |
Token ID | 1279 |
Feature activation | +4.82e-01 |
Pos logit contributions | |
antioxid | +0.873 |
annoyance | +0.842 |
pleas | +0.827 |
Rate | +0.793 |
± | +0.784 |
Neg logit contributions | |
uala | -2.331 |
eni | -2.113 |
itton | -1.905 |
atin | -1.853 |
Devi | -1.846 |
Token | T |
Token ID | 309 |
Feature activation | +6.34e-01 |
Pos logit contributions | |
antioxid | +1.489 |
annoyance | +1.456 |
pleas | +1.438 |
Rate | +1.405 |
± | +1.394 |
Neg logit contributions | |
uala | -2.494 |
eni | -2.214 |
itton | -1.965 |
atin | -1.892 |
Devi | -1.885 |
Token | people |
Token ID | 661 |
Feature activation | -5.37e-01 |
Pos logit contributions | |
uala | +0.817 |
eni | +0.740 |
itton | +0.663 |
Devi | +0.644 |
atin | +0.644 |
Neg logit contributions | |
antioxid | -0.344 |
annoyance | -0.328 |
pleas | -0.322 |
Rate | -0.315 |
\\\\\\\\ | -0.310 |
Token | , |
Token ID | 11 |
Feature activation | -7.80e-01 |
Pos logit contributions | |
uala | +2.733 |
eni | +2.444 |
itton | +2.131 |
Devi | +2.077 |
atin | +2.072 |
Neg logit contributions | |
antioxid | -1.700 |
annoyance | -1.629 |
Rate | -1.601 |
pleas | -1.596 |
\\\\\\\\ | -1.578 |
Token | this |
Token ID | 428 |
Feature activation | -2.84e-01 |
Pos logit contributions | |
uala | +3.865 |
eni | +3.391 |
itton | +3.003 |
Devi | +2.964 |
atin | +2.941 |
Neg logit contributions | |
antioxid | -2.525 |
annoyance | -2.372 |
ONSORED | -2.360 |
\\\\\\\\ | -2.353 |
Rate | -2.350 |
Token | dé |
Token ID | 39073 |
Feature activation | +7.65e-01 |
Pos logit contributions | |
uala | +1.508 |
eni | +1.352 |
itton | +1.203 |
Devi | +1.165 |
atin | +1.164 |
Neg logit contributions | |
antioxid | -0.829 |
annoyance | -0.790 |
pleas | -0.780 |
Rate | -0.773 |
\\\\\\\\ | -0.768 |
Token | j |
Token ID | 73 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
antioxid | +2.491 |
pleas | +2.476 |
annoyance | +2.472 |
Rate | +2.409 |
gery | +2.392 |
Neg logit contributions | |
uala | -3.772 |
eni | -3.328 |
itton | -2.897 |
Devi | -2.833 |
� | -2.793 |
Token | à |
Token ID | 24247 |
Feature activation | +1.98e+00 |
Pos logit contributions | |
antioxid | +3.912 |
annoyance | +3.850 |
pleas | +3.829 |
± | +3.813 |
---------- | +3.688 |
Neg logit contributions | |
uala | -7.208 |
eni | -6.327 |
itton | -5.603 |
Devi | -5.525 |
� | -5.458 |
Token | v |
Token ID | 410 |
Feature activation | +5.29e-01 |
Pos logit contributions | |
pleas | +4.327 |
antioxid | +4.305 |
annoyance | +4.164 |
± | +4.066 |
---------- | +4.037 |
Neg logit contributions | |
uala | -11.758 |
eni | -10.634 |
itton | -9.557 |
atin | -9.364 |
� | -9.215 |
Token | u |
Token ID | 84 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
antioxid | +1.804 |
annoyance | +1.784 |
pleas | +1.778 |
Rate | +1.731 |
---------- | +1.721 |
Neg logit contributions | |
uala | -2.519 |
eni | -2.221 |
itton | -1.932 |
Devi | -1.870 |
� | -1.862 |
Token | isn |
Token ID | 2125 |
Feature activation | +3.88e-01 |
Pos logit contributions | |
uala | +1.260 |
eni | +1.127 |
itton | +1.008 |
atin | +0.971 |
Devi | +0.966 |
Neg logit contributions | |
antioxid | -0.705 |
annoyance | -0.669 |
pleas | -0.663 |
Rate | -0.653 |
\\\\\\\\ | -0.647 |
Token | � |
Token ID | 447 |
Feature activation | +6.61e-01 |
Pos logit contributions | |
antioxid | +1.167 |
annoyance | +1.139 |
pleas | +1.130 |
Rate | +1.100 |
± | +1.093 |
Neg logit contributions | |
uala | -2.035 |
eni | -1.815 |
itton | -1.611 |
atin | -1.555 |
Devi | -1.551 |
Token | � |
Token ID | 247 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
antioxid | +1.543 |
annoyance | +1.489 |
pleas | +1.487 |
± | +1.440 |
Rate | +1.430 |
Neg logit contributions | |
uala | -3.880 |
eni | -3.517 |
itton | -3.169 |
atin | -3.092 |
Devi | -3.067 |
Token | burning |
Token ID | 9482 |
Feature activation | +3.11e-01 |
Pos logit contributions | |
antioxid | +1.433 |
annoyance | +1.397 |
pleas | +1.375 |
Rate | +1.343 |
---------- | +1.328 |
Neg logit contributions | |
uala | -2.499 |
eni | -2.229 |
itton | -1.974 |
atin | -1.913 |
Devi | -1.905 |
Token | fat |
Token ID | 3735 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
antioxid | +0.945 |
annoyance | +0.922 |
pleas | +0.909 |
Rate | +0.886 |
---------- | +0.877 |
Neg logit contributions | |
uala | -1.626 |
eni | -1.449 |
itton | -1.283 |
atin | -1.242 |
Devi | -1.237 |
Token | . |
Token ID | 13 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
antioxid | +1.311 |
annoyance | +1.280 |
pleas | +1.265 |
Rate | +1.228 |
± | +1.223 |
Neg logit contributions | |
uala | -2.299 |
eni | -2.051 |
itton | -1.822 |
atin | -1.758 |
Devi | -1.752 |
Token |
|
Token ID | 198 |
Feature activation | +6.09e-01 |
Pos logit contributions | |
uala | +0.579 |
eni | +0.513 |
itton | +0.445 |
Devi | +0.439 |
atin | +0.438 |
Neg logit contributions | |
antioxid | -0.382 |
annoyance | -0.372 |
pleas | -0.364 |
\\\\\\\\ | -0.356 |
gery | -0.355 |
Token |
|
Token ID | 198 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
antioxid | +1.886 |
pleas | +1.861 |
annoyance | +1.860 |
± | +1.815 |
Rate | +1.814 |
Neg logit contributions | |
uala | -3.107 |
eni | -2.759 |
itton | -2.455 |
atin | -2.358 |
Devi | -2.346 |
Token | Met |
Token ID | 9171 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
antioxid | +1.472 |
annoyance | +1.436 |
pleas | +1.423 |
Rate | +1.394 |
---------- | +1.378 |
Neg logit contributions | |
uala | -2.376 |
eni | -2.112 |
itton | -1.870 |
atin | -1.797 |
Devi | -1.795 |
Token | abolic |
Token ID | 29304 |
Feature activation | +6.67e-01 |
Pos logit contributions | |
antioxid | +5.030 |
pleas | +4.951 |
Rate | +4.936 |
gery | +4.933 |
± | +4.858 |
Neg logit contributions | |
uala | -10.108 |
eni | -9.351 |
itton | -8.371 |
� | -8.324 |
Devi | -8.026 |
Token | exercise |
Token ID | 5517 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
antioxid | +1.997 |
annoyance | +1.935 |
pleas | +1.917 |
Rate | +1.875 |
± | +1.859 |
Neg logit contributions | |
uala | -3.518 |
eni | -3.140 |
itton | -2.800 |
� | -2.675 |
Devi | -2.668 |
Token |
|
Token ID | 198 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
antioxid | +3.216 |
annoyance | +3.132 |
pleas | +3.126 |
± | +3.033 |
Rate | +3.032 |
Neg logit contributions | |
uala | -5.524 |
eni | -4.954 |
itton | -4.412 |
atin | -4.197 |
Devi | -4.196 |
Token |
|
Token ID | 198 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
antioxid | +1.094 |
annoyance | +1.065 |
pleas | +1.050 |
Rate | +1.024 |
\\\\\\\\ | +1.014 |
Neg logit contributions | |
uala | -1.626 |
eni | -1.441 |
itton | -1.263 |
atin | -1.220 |
Devi | -1.215 |
Token | The |
Token ID | 464 |
Feature activation | -8.91e-03 |
Pos logit contributions | |
antioxid | +0.382 |
annoyance | +0.373 |
pleas | +0.367 |
\\\\\\\\ | +0.355 |
± | +0.354 |
Neg logit contributions | |
uala | -0.567 |
eni | -0.502 |
itton | -0.437 |
atin | -0.427 |
Devi | -0.422 |
Token | Amin |
Token ID | 39869 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
uala | +0.650 |
eni | +0.553 |
itton | +0.458 |
atin | +0.439 |
nil | +0.436 |
Neg logit contributions | |
antioxid | -0.731 |
annoyance | -0.707 |
Rate | -0.696 |
pleas | -0.695 |
gery | -0.685 |
Token | u |
Token ID | 84 |
Feature activation | -1.99e-01 |
Pos logit contributions | |
antioxid | +0.508 |
annoyance | +0.497 |
pleas | +0.492 |
Rate | +0.481 |
± | +0.478 |
Neg logit contributions | |
uala | -0.647 |
eni | -0.568 |
itton | -0.494 |
atin | -0.474 |
Devi | -0.472 |
Token | , |
Token ID | 11 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
uala | +0.966 |
eni | +0.854 |
itton | +0.748 |
atin | +0.721 |
Devi | +0.718 |
Neg logit contributions | |
antioxid | -0.676 |
annoyance | -0.662 |
pleas | -0.655 |
Rate | -0.639 |
± | -0.635 |
Token | and |
Token ID | 290 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
antioxid | +0.506 |
annoyance | +0.493 |
pleas | +0.486 |
Rate | +0.473 |
± | +0.469 |
Neg logit contributions | |
uala | -0.925 |
eni | -0.827 |
itton | -0.735 |
atin | -0.711 |
Devi | -0.708 |
Token | J |
Token ID | 449 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
antioxid | +1.035 |
annoyance | +1.012 |
pleas | +1.000 |
Rate | +0.972 |
± | +0.968 |
Neg logit contributions | |
uala | -1.610 |
eni | -1.428 |
itton | -1.260 |
atin | -1.215 |
Devi | -1.206 |
Token | . |
Token ID | 13 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
antioxid | +1.153 |
annoyance | +1.138 |
pleas | +1.120 |
Rate | +1.102 |
± | +1.097 |
Neg logit contributions | |
uala | -1.581 |
eni | -1.380 |
itton | -1.218 |
Devi | -1.180 |
� | -1.173 |
Token | J |
Token ID | 41 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
Rate | +4.768 |
annoyance | +4.718 |
pleas | +4.659 |
\\\\\\\\ | +4.628 |
± | +4.619 |
Neg logit contributions | |
uala | -10.669 |
eni | -9.261 |
atin | -8.705 |
itton | -8.636 |
ignty | -8.279 |
Token | . |
Token ID | 13 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
antioxid | +2.862 |
± | +2.847 |
annoyance | +2.827 |
pleas | +2.808 |
Rate | +2.770 |
Neg logit contributions | |
uala | -5.353 |
eni | -4.697 |
itton | -4.222 |
� | -4.128 |
Devi | -4.084 |
Token | B |
Token ID | 347 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
Interest | +4.959 |
± | +4.885 |
¯ | +4.760 |
annoyance | +4.698 |
pleas | +4.697 |
Neg logit contributions | |
uala | -11.536 |
eni | -10.217 |
itton | -9.635 |
� | -9.617 |
atin | -9.492 |
Token | area |
Token ID | 20337 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
gery | +3.696 |
Interest | +3.686 |
± | +3.686 |
Rate | +3.592 |
ranks | +3.554 |
Neg logit contributions | |
uala | -8.365 |
� | -7.378 |
Devi | -7.335 |
eni | -7.254 |
subdiv | -6.617 |
Token | . |
Token ID | 13 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
antioxid | +0.718 |
annoyance | +0.701 |
pleas | +0.692 |
Rate | +0.676 |
± | +0.670 |
Neg logit contributions | |
uala | -1.117 |
eni | -0.992 |
itton | -0.874 |
atin | -0.842 |
Devi | -0.839 |
Token | Please |
Token ID | 4222 |
Feature activation | +1.72e+00 |
Pos logit contributions | |
antioxid | +1.626 |
annoyance | +1.576 |
pleas | +1.551 |
Rate | +1.500 |
± | +1.483 |
Neg logit contributions | |
uala | -3.716 |
eni | -3.347 |
itton | -3.004 |
atin | -2.916 |
Devi | -2.907 |
Token | re |
Token ID | 302 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
pleas | +3.646 |
± | +3.547 |
antioxid | +3.526 |
Rate | +3.393 |
regression | +3.365 |
Neg logit contributions | |
uala | -10.187 |
eni | -9.291 |
� | -8.545 |
itton | -8.330 |
ignty | -8.251 |
Token | - |
Token ID | 12 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
pleas | +2.832 |
---------- | +2.811 |
± | +2.797 |
annoyance | +2.790 |
Rate | +2.755 |
Neg logit contributions | |
uala | -5.802 |
eni | -5.128 |
itton | -4.697 |
� | -4.535 |
Devi | -4.464 |
Token | enter |
Token ID | 9255 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
Rate | +4.418 |
---------- | +4.395 |
pleas | +4.386 |
gery | +4.371 |
annoyance | +4.358 |
Neg logit contributions | |
uala | -4.166 |
eni | -3.428 |
itton | -3.075 |
Devi | -2.931 |
� | -2.899 |
Token | . |
Token ID | 13 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
pleas | +4.089 |
± | +4.004 |
---------- | +3.880 |
annoyance | +3.849 |
gery | +3.844 |
Neg logit contributions | |
uala | -8.153 |
eni | -7.209 |
itton | -6.635 |
� | -6.409 |
atin | -6.355 |
Token | You |
Token ID | 921 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
antioxid | +2.827 |
annoyance | +2.803 |
pleas | +2.782 |
± | +2.763 |
---------- | +2.763 |
Neg logit contributions | |
uala | -10.184 |
eni | -9.344 |
itton | -8.627 |
atin | -8.248 |
� | -8.209 |
Token | must |
Token ID | 1276 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
pleas | +3.961 |
annoyance | +3.777 |
± | +3.772 |
---------- | +3.757 |
antioxid | +3.689 |
Neg logit contributions | |
uala | -11.882 |
eni | -10.814 |
� | -9.808 |
itton | -9.784 |
atin | -9.507 |
Token | select |
Token ID | 2922 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
pleas | +3.381 |
± | +3.254 |
---------- | +3.221 |
annoyance | +3.190 |
antioxid | +3.190 |
Neg logit contributions | |
uala | -5.784 |
eni | -5.061 |
� | -4.472 |
itton | -4.457 |
atin | -4.376 |
Token | a |
Token ID | 257 |
Feature activation | +2.81e-02 |
Pos logit contributions | |
antioxid | +0.692 |
annoyance | +0.668 |
pleas | +0.648 |
Rate | +0.638 |
\\\\\\\\ | +0.636 |
Neg logit contributions | |
uala | -1.231 |
eni | -1.106 |
itton | -0.976 |
Devi | -0.947 |
atin | -0.945 |
Token | newsletter |
Token ID | 13129 |
Feature activation | +4.49e-01 |
Pos logit contributions | |
antioxid | +0.023 |
annoyance | +0.020 |
\\\\\\\\ | +0.016 |
pleas | +0.016 |
Rate | +0.015 |
Neg logit contributions | |
uala | -0.208 |
eni | -0.194 |
itton | -0.180 |
Devi | -0.176 |
atin | -0.175 |
Token | to |
Token ID | 284 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
antioxid | +1.092 |
annoyance | +1.054 |
pleas | +1.031 |
Rate | +1.002 |
\\\\\\\\ | +0.989 |
Neg logit contributions | |
uala | -2.629 |
eni | -2.376 |
itton | -2.133 |
atin | -2.073 |
Devi | -2.066 |
Token | know |
Token ID | 760 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
antioxid | +1.861 |
annoyance | +1.851 |
pleas | +1.827 |
± | +1.787 |
Rate | +1.780 |
Neg logit contributions | |
uala | -3.381 |
eni | -3.010 |
itton | -2.678 |
Devi | -2.581 |
� | -2.576 |
Token | them |
Token ID | 606 |
Feature activation | -2.26e-01 |
Pos logit contributions | |
antioxid | +1.054 |
annoyance | +1.029 |
pleas | +1.019 |
Rate | +0.986 |
± | +0.985 |
Neg logit contributions | |
uala | -1.905 |
eni | -1.699 |
itton | -1.513 |
atin | -1.461 |
Devi | -1.451 |
Token | . |
Token ID | 13 |
Feature activation | +2.19e-02 |
Pos logit contributions | |
uala | +1.116 |
eni | +1.001 |
itton | +0.866 |
atin | +0.840 |
Devi | +0.839 |
Neg logit contributions | |
antioxid | -0.754 |
annoyance | -0.727 |
Rate | -0.712 |
pleas | -0.706 |
\\\\\\\\ | -0.697 |
Token | It |
Token ID | 632 |
Feature activation | +4.00e-01 |
Pos logit contributions | |
antioxid | +0.074 |
annoyance | +0.072 |
pleas | +0.071 |
Rate | +0.068 |
\\\\\\\\ | +0.068 |
Neg logit contributions | |
uala | -0.108 |
eni | -0.095 |
itton | -0.083 |
Devi | -0.082 |
atin | -0.081 |
Token | 's |
Token ID | 338 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
antioxid | +1.130 |
annoyance | +1.105 |
pleas | +1.094 |
Rate | +1.058 |
± | +1.052 |
Neg logit contributions | |
uala | -2.173 |
eni | -1.944 |
itton | -1.735 |
atin | -1.678 |
Devi | -1.669 |
Token | likely |
Token ID | 1884 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
antioxid | +1.641 |
annoyance | +1.600 |
pleas | +1.579 |
Rate | +1.529 |
± | +1.519 |
Neg logit contributions | |
uala | -3.155 |
eni | -2.826 |
itton | -2.518 |
atin | -2.437 |
Devi | -2.427 |
Token | those |
Token ID | 883 |
Feature activation | -9.23e-02 |
Pos logit contributions | |
pleas | +4.624 |
antioxid | +4.616 |
annoyance | +4.587 |
regression | +4.314 |
partisans | +4.305 |
Neg logit contributions | |
uala | -11.144 |
eni | -10.078 |
itton | -9.021 |
atin | -8.809 |
� | -8.733 |
Token | more |
Token ID | 517 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
uala | +0.496 |
eni | +0.448 |
itton | +0.396 |
atin | +0.385 |
Devi | +0.383 |
Neg logit contributions | |
antioxid | -0.263 |
annoyance | -0.251 |
pleas | -0.248 |
Rate | -0.247 |
\\\\\\\\ | -0.247 |
Token | aware |
Token ID | 3910 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
uala | +0.807 |
eni | +0.733 |
itton | +0.653 |
atin | +0.640 |
Devi | +0.636 |
Neg logit contributions | |
antioxid | -0.353 |
annoyance | -0.337 |
\\\\\\\\ | -0.331 |
pleas | -0.331 |
Rate | -0.328 |
Token | of |
Token ID | 286 |
Feature activation | -1.61e-01 |
Pos logit contributions | |
antioxid | +0.707 |
annoyance | +0.684 |
pleas | +0.676 |
Rate | +0.661 |
\\\\\\\\ | +0.657 |
Neg logit contributions | |
uala | -1.194 |
eni | -1.065 |
itton | -0.943 |
atin | -0.909 |
Devi | -0.906 |
Token | the |
Token ID | 262 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
uala | +0.848 |
eni | +0.757 |
itton | +0.672 |
atin | +0.648 |
Devi | +0.646 |
Neg logit contributions | |
antioxid | -0.486 |
annoyance | -0.469 |
pleas | -0.461 |
Rate | -0.455 |
\\\\\\\\ | -0.449 |
Token | from |
Token ID | 422 |
Feature activation | -4.29e-01 |
Pos logit contributions | |
uala | +1.666 |
eni | +1.486 |
itton | +1.309 |
atin | +1.261 |
Devi | +1.256 |
Neg logit contributions | |
antioxid | -1.080 |
annoyance | -1.053 |
pleas | -1.034 |
Rate | -1.017 |
\\\\\\\\ | -1.004 |
Token | the |
Token ID | 262 |
Feature activation | -5.55e-02 |
Pos logit contributions | |
uala | +2.167 |
eni | +1.916 |
itton | +1.689 |
atin | +1.633 |
Devi | +1.630 |
Neg logit contributions | |
antioxid | -1.382 |
annoyance | -1.343 |
pleas | -1.328 |
Rate | -1.313 |
\\\\\\\\ | -1.293 |
Token | Harvard |
Token ID | 11131 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
uala | +0.284 |
eni | +0.253 |
itton | +0.223 |
atin | +0.215 |
Devi | +0.215 |
Neg logit contributions | |
antioxid | -0.174 |
annoyance | -0.170 |
pleas | -0.168 |
Rate | -0.164 |
± | -0.162 |
Token | - |
Token ID | 12 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
uala | +4.981 |
eni | +4.411 |
itton | +3.905 |
Devi | +3.801 |
atin | +3.680 |
Neg logit contributions | |
antioxid | -3.427 |
Rate | -3.326 |
annoyance | -3.258 |
\\\\\\\\ | -3.236 |
pleas | -3.212 |
Token | Smith |
Token ID | 17919 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
uala | +1.288 |
eni | +1.135 |
itton | +1.005 |
atin | +0.962 |
Devi | +0.958 |
Neg logit contributions | |
antioxid | -0.859 |
annoyance | -0.826 |
pleas | -0.817 |
Rate | -0.797 |
\\\\\\\\ | -0.795 |
Token | sonian |
Token ID | 35202 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
uala | +4.122 |
eni | +3.465 |
itton | +2.721 |
nil | +2.697 |
ick | +2.547 |
Neg logit contributions | |
antioxid | -6.941 |
pleas | -6.878 |
Rate | -6.874 |
annoyance | -6.869 |
ghazi | -6.804 |
Token | Center |
Token ID | 3337 |
Feature activation | -8.08e-01 |
Pos logit contributions | |
uala | +8.185 |
eni | +7.231 |
itton | +6.473 |
Devi | +6.068 |
atin | +5.714 |
Neg logit contributions | |
antioxid | -8.373 |
annoyance | -8.122 |
ghazi | -8.076 |
Rate | -8.051 |
akespeare | -7.978 |
Token | for |
Token ID | 329 |
Feature activation | +8.49e-01 |
Pos logit contributions | |
uala | +4.056 |
eni | +3.610 |
itton | +3.203 |
Devi | +3.081 |
atin | +3.076 |
Neg logit contributions | |
antioxid | -2.559 |
annoyance | -2.475 |
pleas | -2.425 |
\\\\\\\\ | -2.421 |
Rate | -2.414 |
Token | Ast |
Token ID | 8304 |
Feature activation | -3.69e-01 |
Pos logit contributions | |
annoyance | +3.202 |
antioxid | +3.196 |
Interest | +3.090 |
± | +3.081 |
pleas | +3.073 |
Neg logit contributions | |
uala | -3.704 |
eni | -3.271 |
itton | -2.759 |
� | -2.700 |
atin | -2.685 |
Token | roph |
Token ID | 10051 |
Feature activation | -8.34e-01 |
Pos logit contributions | |
uala | +2.045 |
eni | +1.866 |
itton | +1.652 |
atin | +1.605 |
etta | +1.584 |
Neg logit contributions | |
antioxid | -1.016 |
annoyance | -0.975 |
pleas | -0.959 |
\\\\\\\\ | -0.949 |
ONSORED | -0.947 |
Token | ysics |
Token ID | 23154 |
Feature activation | -7.61e-01 |
Pos logit contributions | |
uala | +2.636 |
eni | +2.206 |
itton | +1.726 |
etta | +1.607 |
Devi | +1.564 |
Neg logit contributions | |
antioxid | -4.358 |
annoyance | -4.247 |
pleas | -4.169 |
\\\\\\\\ | -4.145 |
Rate | -4.123 |
Token | human |
Token ID | 1692 |
Feature activation | +6.69e-01 |
Pos logit contributions | |
antioxid | +0.883 |
annoyance | +0.857 |
pleas | +0.843 |
Rate | +0.826 |
\\\\\\\\ | +0.819 |
Neg logit contributions | |
uala | -1.592 |
eni | -1.428 |
itton | -1.263 |
atin | -1.227 |
Devi | -1.223 |
Token | - |
Token ID | 12 |
Feature activation | +8.06e-01 |
Pos logit contributions | |
antioxid | +2.019 |
annoyance | +1.999 |
pleas | +1.976 |
± | +1.907 |
Rate | +1.903 |
Neg logit contributions | |
uala | -3.475 |
eni | -3.080 |
itton | -2.749 |
atin | -2.651 |
Devi | -2.628 |
Token | like |
Token ID | 2339 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
antioxid | +2.510 |
annoyance | +2.478 |
pleas | +2.466 |
Rate | +2.404 |
± | +2.375 |
Neg logit contributions | |
uala | -4.098 |
eni | -3.631 |
itton | -3.219 |
Devi | -3.082 |
atin | -3.081 |
Token | with |
Token ID | 351 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
antioxid | +0.449 |
annoyance | +0.435 |
pleas | +0.430 |
Rate | +0.421 |
\\\\\\\\ | +0.416 |
Neg logit contributions | |
uala | -0.721 |
eni | -0.643 |
itton | -0.565 |
atin | -0.546 |
Devi | -0.546 |
Token | each |
Token ID | 1123 |
Feature activation | +4.86e-02 |
Pos logit contributions | |
antioxid | +0.509 |
annoyance | +0.496 |
pleas | +0.489 |
Rate | +0.475 |
± | +0.471 |
Neg logit contributions | |
uala | -0.975 |
eni | -0.873 |
itton | -0.778 |
atin | -0.753 |
Devi | -0.750 |
Token | passing |
Token ID | 6427 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
antioxid | +0.151 |
annoyance | +0.146 |
pleas | +0.145 |
Rate | +0.141 |
---------- | +0.140 |
Neg logit contributions | |
uala | -0.251 |
eni | -0.223 |
itton | -0.197 |
atin | -0.191 |
Devi | -0.190 |
Token | day |
Token ID | 1110 |
Feature activation | +5.71e-02 |
Pos logit contributions | |
uala | +7.686 |
eni | +6.576 |
itton | +5.643 |
Devi | +5.503 |
atin | +5.412 |
Neg logit contributions | |
antioxid | -7.157 |
ONSORED | -7.023 |
\\\\\\\\ | -6.948 |
ULTS | -6.918 |
Rate | -6.917 |
Token | ! |
Token ID | 0 |
Feature activation | +6.95e-02 |
Pos logit contributions | |
antioxid | +0.193 |
annoyance | +0.187 |
pleas | +0.185 |
Rate | +0.181 |
± | +0.180 |
Neg logit contributions | |
uala | -0.280 |
eni | -0.248 |
itton | -0.217 |
atin | -0.209 |
Devi | -0.209 |
Token | Eventually |
Token ID | 16178 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
antioxid | +0.231 |
annoyance | +0.225 |
pleas | +0.223 |
Rate | +0.217 |
\\\\\\\\ | +0.214 |
Neg logit contributions | |
uala | -0.343 |
eni | -0.305 |
itton | -0.266 |
Devi | -0.258 |
atin | -0.258 |
Token | the |
Token ID | 262 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
antioxid | +0.626 |
annoyance | +0.613 |
pleas | +0.606 |
Rate | +0.590 |
± | +0.587 |
Neg logit contributions | |
uala | -0.924 |
eni | -0.817 |
itton | -0.719 |
atin | -0.692 |
Devi | -0.688 |
Token | turtles |
Token ID | 36288 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
uala | +0.807 |
eni | +0.717 |
itton | +0.624 |
atin | +0.607 |
Devi | +0.607 |
Neg logit contributions | |
antioxid | -0.544 |
annoyance | -0.529 |
pleas | -0.521 |
Rate | -0.520 |
\\\\\\\\ | -0.517 |
Token | is |
Token ID | 318 |
Feature activation | +3.61e-01 |
Pos logit contributions | |
antioxid | +0.807 |
annoyance | +0.780 |
pleas | +0.768 |
Rate | +0.754 |
\\\\\\\\ | +0.747 |
Neg logit contributions | |
uala | -1.439 |
eni | -1.289 |
itton | -1.142 |
atin | -1.105 |
Devi | -1.102 |
Token | what |
Token ID | 644 |
Feature activation | -2.28e-01 |
Pos logit contributions | |
antioxid | +1.016 |
annoyance | +0.982 |
pleas | +0.965 |
Rate | +0.948 |
---------- | +0.935 |
Neg logit contributions | |
uala | -1.970 |
eni | -1.765 |
itton | -1.572 |
atin | -1.524 |
Devi | -1.517 |
Token | matters |
Token ID | 6067 |
Feature activation | -8.08e-01 |
Pos logit contributions | |
uala | +1.173 |
eni | +1.048 |
itton | +0.926 |
Devi | +0.901 |
atin | +0.895 |
Neg logit contributions | |
antioxid | -0.700 |
annoyance | -0.671 |
pleas | -0.661 |
Rate | -0.659 |
\\\\\\\\ | -0.654 |
Token | most |
Token ID | 749 |
Feature activation | -6.07e-01 |
Pos logit contributions | |
uala | +4.126 |
eni | +3.742 |
itton | +3.275 |
Devi | +3.181 |
nil | +3.130 |
Neg logit contributions | |
antioxid | -2.494 |
annoyance | -2.341 |
Rate | -2.333 |
\\\\\\\\ | -2.289 |
---------- | -2.262 |
Token | in |
Token ID | 287 |
Feature activation | -5.55e-01 |
Pos logit contributions | |
uala | +3.345 |
eni | +3.032 |
itton | +2.677 |
Devi | +2.614 |
nil | +2.579 |
Neg logit contributions | |
antioxid | -1.664 |
annoyance | -1.561 |
Rate | -1.554 |
\\\\\\\\ | -1.521 |
pleas | -1.500 |
Token | geop |
Token ID | 30324 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
uala | +2.739 |
eni | +2.434 |
itton | +2.140 |
atin | +2.076 |
Devi | +2.060 |
Neg logit contributions | |
antioxid | -1.824 |
annoyance | -1.722 |
Rate | -1.708 |
\\\\\\\\ | -1.702 |
pleas | -1.681 |
Token | olitics |
Token ID | 21704 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
uala | +7.024 |
eni | +6.347 |
etta | +5.088 |
itton | +5.072 |
ick | +4.882 |
Neg logit contributions | |
antioxid | -8.164 |
annoyance | -7.964 |
pleas | -7.808 |
Rate | -7.766 |
ONSORED | -7.645 |
Token | — |
Token ID | 851 |
Feature activation | -4.86e-01 |
Pos logit contributions | |
uala | +6.746 |
eni | +6.071 |
itton | +5.400 |
Devi | +5.244 |
etta | +5.186 |
Neg logit contributions | |
antioxid | -3.512 |
annoyance | -3.310 |
Rate | -3.279 |
pleas | -3.171 |
\\\\\\\\ | -3.149 |
Token | it |
Token ID | 340 |
Feature activation | -5.69e-02 |
Pos logit contributions | |
uala | +2.414 |
eni | +2.154 |
itton | +1.895 |
Devi | +1.839 |
atin | +1.837 |
Neg logit contributions | |
antioxid | -1.571 |
annoyance | -1.498 |
Rate | -1.468 |
pleas | -1.468 |
\\\\\\\\ | -1.462 |
Token | is |
Token ID | 318 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
uala | +0.309 |
eni | +0.277 |
itton | +0.246 |
Devi | +0.238 |
atin | +0.238 |
Neg logit contributions | |
antioxid | -0.164 |
annoyance | -0.157 |
pleas | -0.153 |
Rate | -0.151 |
\\\\\\\\ | -0.149 |
Token | plain |
Token ID | 8631 |
Feature activation | +5.84e-01 |
Pos logit contributions | |
uala | +1.394 |
eni | +1.242 |
itton | +1.095 |
Devi | +1.071 |
atin | +1.062 |
Neg logit contributions | |
antioxid | -0.855 |
annoyance | -0.815 |
Rate | -0.805 |
\\\\\\\\ | -0.803 |
ONSORED | -0.800 |
Token | yu |
Token ID | 24767 |
Feature activation | +9.44e-02 |
Pos logit contributions | |
uala | +2.932 |
eni | +2.575 |
itton | +2.074 |
atin | +2.057 |
Devi | +2.024 |
Neg logit contributions | |
antioxid | -3.378 |
annoyance | -3.262 |
pleas | -3.243 |
\\\\\\\\ | -3.212 |
Rate | -3.157 |
Token | K |
Token ID | 42 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
antioxid | +0.313 |
annoyance | +0.307 |
pleas | +0.303 |
Rate | +0.296 |
± | +0.294 |
Neg logit contributions | |
uala | -0.467 |
eni | -0.413 |
itton | -0.364 |
atin | -0.350 |
Devi | -0.348 |
Token | ong |
Token ID | 506 |
Feature activation | -5.13e-01 |
Pos logit contributions | |
uala | +4.755 |
eni | +4.121 |
itton | +3.521 |
atin | +3.437 |
nil | +3.288 |
Neg logit contributions | |
antioxid | -4.695 |
annoyance | -4.492 |
pleas | -4.449 |
\\\\\\\\ | -4.424 |
---------- | -4.366 |
Token | Ch |
Token ID | 1925 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
uala | +2.420 |
eni | +2.142 |
itton | +1.856 |
atin | +1.814 |
nil | +1.787 |
Neg logit contributions | |
antioxid | -1.808 |
annoyance | -1.760 |
pleas | -1.732 |
Rate | -1.690 |
\\\\\\\\ | -1.685 |
Token | oya |
Token ID | 23790 |
Feature activation | -7.08e-01 |
Pos logit contributions | |
uala | +1.870 |
eni | +1.230 |
itton | +0.604 |
atin | +0.529 |
nil | +0.277 |
Neg logit contributions | |
antioxid | -7.925 |
pleas | -7.749 |
annoyance | -7.726 |
\\\\\\\\ | -7.701 |
regression | -7.638 |
Token | Week |
Token ID | 20916 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
uala | +3.428 |
eni | +3.056 |
itton | +2.664 |
atin | +2.595 |
nil | +2.582 |
Neg logit contributions | |
antioxid | -2.391 |
annoyance | -2.313 |
pleas | -2.289 |
Rate | -2.211 |
± | -2.210 |
Token | end |
Token ID | 437 |
Feature activation | -6.50e-01 |
Pos logit contributions | |
uala | +7.444 |
eni | +6.419 |
itton | +5.469 |
atin | +5.215 |
hurst | +5.196 |
Neg logit contributions | |
antioxid | -8.004 |
\\\\\\\\ | -7.492 |
annoyance | -7.468 |
pleas | -7.379 |
reven | -7.375 |
Token | T |
Token ID | 51 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
uala | +3.158 |
eni | +2.821 |
itton | +2.455 |
atin | +2.395 |
nil | +2.387 |
Neg logit contributions | |
antioxid | -2.171 |
annoyance | -2.104 |
pleas | -2.091 |
± | -2.012 |
Rate | -2.010 |
Token | ear |
Token ID | 451 |
Feature activation | -6.35e-01 |
Pos logit contributions | |
uala | +6.935 |
eni | +6.097 |
itton | +5.330 |
atin | +5.049 |
etta | +4.962 |
Neg logit contributions | |
antioxid | -5.419 |
pleas | -5.197 |
annoyance | -5.190 |
---------- | -5.100 |
Rate | -5.070 |
Token | V |
Token ID | 53 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
uala | +2.969 |
eni | +2.646 |
itton | +2.282 |
atin | +2.233 |
nil | +2.221 |
Neg logit contributions | |
antioxid | -2.226 |
annoyance | -2.177 |
pleas | -2.154 |
Rate | -2.077 |
± | -2.072 |
Token | oid |
Token ID | 1868 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
uala | +5.994 |
eni | +5.224 |
itton | +4.603 |
atin | +4.387 |
nil | +4.354 |
Neg logit contributions | |
antioxid | -6.125 |
pleas | -5.835 |
\\\\\\\\ | -5.812 |
annoyance | -5.739 |
reven | -5.626 |
Token | but |
Token ID | 475 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
pleas | +3.704 |
annoyance | +3.695 |
antioxid | +3.677 |
± | +3.541 |
Rate | +3.490 |
Neg logit contributions | |
uala | -6.340 |
eni | -5.662 |
itton | -4.971 |
� | -4.886 |
atin | -4.809 |
Token | who |
Token ID | 508 |
Feature activation | -5.12e-02 |
Pos logit contributions | |
antioxid | +0.464 |
annoyance | +0.447 |
pleas | +0.439 |
Rate | +0.433 |
\\\\\\\\ | +0.431 |
Neg logit contributions | |
uala | -0.802 |
eni | -0.717 |
itton | -0.637 |
atin | -0.616 |
Devi | -0.615 |
Token | will |
Token ID | 481 |
Feature activation | +8.21e-02 |
Pos logit contributions | |
uala | +0.265 |
eni | +0.236 |
itton | +0.209 |
atin | +0.202 |
Devi | +0.201 |
Neg logit contributions | |
antioxid | -0.159 |
annoyance | -0.154 |
pleas | -0.150 |
Rate | -0.149 |
\\\\\\\\ | -0.147 |
Token | get |
Token ID | 651 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
antioxid | +0.282 |
annoyance | +0.275 |
pleas | +0.271 |
Rate | +0.266 |
\\\\\\\\ | +0.265 |
Neg logit contributions | |
uala | -0.397 |
eni | -0.350 |
itton | -0.308 |
atin | -0.296 |
Devi | -0.295 |
Token | the |
Token ID | 262 |
Feature activation | -7.14e-01 |
Pos logit contributions | |
antioxid | +0.472 |
annoyance | +0.460 |
pleas | +0.454 |
Rate | +0.443 |
± | +0.439 |
Neg logit contributions | |
uala | -0.780 |
eni | -0.695 |
itton | -0.614 |
atin | -0.593 |
Devi | -0.591 |
Token | blame |
Token ID | 8138 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
uala | +3.492 |
eni | +3.088 |
itton | +2.717 |
Devi | +2.634 |
atin | +2.633 |
Neg logit contributions | |
antioxid | -2.344 |
Rate | -2.220 |
\\\\\\\\ | -2.211 |
annoyance | -2.209 |
ONSORED | -2.195 |
Token | ? |
Token ID | 30 |
Feature activation | -2.64e-01 |
Pos logit contributions | |
uala | +8.683 |
eni | +7.705 |
itton | +6.885 |
Devi | +6.658 |
etta | +6.594 |
Neg logit contributions | |
antioxid | -6.171 |
ONSORED | -5.775 |
Rate | -5.752 |
annoyance | -5.737 |
\\\\\\\\ | -5.691 |
Token | | |
Token ID | 930 |
Feature activation | +8.10e-01 |
Pos logit contributions | |
uala | +1.274 |
eni | +1.124 |
itton | +0.987 |
Devi | +0.953 |
atin | +0.952 |
Neg logit contributions | |
antioxid | -0.912 |
annoyance | -0.883 |
pleas | -0.867 |
Rate | -0.849 |
\\\\\\\\ | -0.842 |
Token | Ad |
Token ID | 1215 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
antioxid | +2.463 |
annoyance | +2.443 |
pleas | +2.436 |
± | +2.375 |
---------- | +2.358 |
Neg logit contributions | |
uala | -4.124 |
eni | -3.667 |
itton | -3.257 |
atin | -3.129 |
� | -3.098 |
Token | ity |
Token ID | 414 |
Feature activation | -5.31e-01 |
Pos logit contributions | |
uala | +1.199 |
eni | +1.052 |
itton | +0.908 |
atin | +0.882 |
Devi | +0.871 |
Neg logit contributions | |
antioxid | -0.954 |
annoyance | -0.933 |
pleas | -0.929 |
\\\\\\\\ | -0.897 |
Rate | -0.897 |
Token | a |
Token ID | 64 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
uala | +2.464 |
eni | +2.184 |
itton | +1.850 |
atin | +1.826 |
Devi | +1.809 |
Neg logit contributions | |
antioxid | -1.958 |
annoyance | -1.893 |
pleas | -1.867 |
Rate | -1.830 |
± | -1.794 |
Token | of |
Token ID | 286 |
Feature activation | -5.82e-01 |
Pos logit contributions | |
uala | +5.519 |
eni | +4.991 |
itton | +4.431 |
Devi | +4.348 |
atin | +4.266 |
Neg logit contributions | |
antioxid | -3.061 |
\\\\\\\\ | -2.954 |
annoyance | -2.953 |
pleas | -2.896 |
ONSORED | -2.886 |
Token | the |
Token ID | 262 |
Feature activation | -2.40e-01 |
Pos logit contributions | |
uala | +2.822 |
eni | +2.498 |
itton | +2.166 |
Devi | +2.141 |
atin | +2.136 |
Neg logit contributions | |
antioxid | -1.959 |
annoyance | -1.906 |
pleas | -1.875 |
Rate | -1.870 |
\\\\\\\\ | -1.862 |
Token | limestone |
Token ID | 48520 |
Feature activation | -9.43e-01 |
Pos logit contributions | |
uala | +1.111 |
eni | +0.978 |
itton | +0.846 |
Devi | +0.822 |
atin | +0.821 |
Neg logit contributions | |
antioxid | -0.869 |
annoyance | -0.847 |
pleas | -0.838 |
Rate | -0.829 |
\\\\\\\\ | -0.829 |
Token | surrounding |
Token ID | 7346 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
uala | +4.511 |
eni | +4.031 |
atin | +3.487 |
itton | +3.458 |
Devi | +3.440 |
Neg logit contributions | |
antioxid | -3.194 |
\\\\\\\\ | -3.083 |
annoyance | -3.047 |
Rate | -3.018 |
pleas | -3.011 |
Token | the |
Token ID | 262 |
Feature activation | -3.33e-01 |
Pos logit contributions | |
uala | +4.867 |
eni | +4.231 |
atin | +3.673 |
itton | +3.668 |
Devi | +3.656 |
Neg logit contributions | |
antioxid | -3.442 |
annoyance | -3.346 |
Rate | -3.275 |
pleas | -3.264 |
\\\\\\\\ | -3.242 |
Token | fossils |
Token ID | 34066 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
uala | +1.536 |
eni | +1.342 |
itton | +1.156 |
atin | +1.130 |
Devi | +1.129 |
Neg logit contributions | |
antioxid | -1.211 |
annoyance | -1.182 |
pleas | -1.168 |
\\\\\\\\ | -1.163 |
Rate | -1.162 |
Token | , |
Token ID | 11 |
Feature activation | -4.57e-01 |
Pos logit contributions | |
uala | +7.944 |
eni | +7.038 |
Devi | +5.886 |
atin | +5.862 |
itton | +5.858 |
Neg logit contributions | |
antioxid | -7.027 |
\\\\\\\\ | -6.687 |
annoyance | -6.664 |
Rate | -6.580 |
★★ | -6.514 |
Token | said |
Token ID | 531 |
Feature activation | -2.25e-01 |
Pos logit contributions | |
uala | +2.169 |
eni | +1.925 |
itton | +1.685 |
Devi | +1.628 |
atin | +1.620 |
Neg logit contributions | |
antioxid | -1.599 |
annoyance | -1.539 |
\\\\\\\\ | -1.511 |
Rate | -1.508 |
pleas | -1.503 |
Token | the |
Token ID | 262 |
Feature activation | -8.94e-02 |
Pos logit contributions | |
uala | +1.261 |
eni | +1.136 |
itton | +1.015 |
atin | +0.987 |
Devi | +0.987 |
Neg logit contributions | |
antioxid | -0.592 |
annoyance | -0.574 |
pleas | -0.563 |
Rate | -0.554 |
\\\\\\\\ | -0.550 |
Token | question |
Token ID | 1808 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
uala | +0.465 |
eni | +0.415 |
itton | +0.366 |
atin | +0.355 |
Devi | +0.354 |
Neg logit contributions | |
antioxid | -0.273 |
annoyance | -0.266 |
pleas | -0.262 |
Rate | -0.257 |
\\\\\\\\ | -0.255 |
Token | of |
Token ID | 286 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
antioxid | +0.882 |
annoyance | +0.855 |
pleas | +0.840 |
Rate | +0.815 |
± | +0.806 |
Neg logit contributions | |
uala | -2.030 |
eni | -1.832 |
itton | -1.643 |
atin | -1.595 |
Devi | -1.591 |
Token | heads |
Token ID | 6665 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
uala | +0.902 |
eni | +0.802 |
itton | +0.703 |
Devi | +0.683 |
atin | +0.680 |
Neg logit contributions | |
antioxid | -0.580 |
annoyance | -0.557 |
pleas | -0.549 |
\\\\\\\\ | -0.546 |
Rate | -0.544 |
Token | of |
Token ID | 286 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
uala | +2.340 |
eni | +2.117 |
itton | +1.902 |
atin | +1.854 |
Devi | +1.846 |
Neg logit contributions | |
antioxid | -0.930 |
annoyance | -0.899 |
pleas | -0.885 |
Rate | -0.854 |
± | -0.843 |
Token | the |
Token ID | 262 |
Feature activation | +3.50e-02 |
Pos logit contributions | |
antioxid | +0.789 |
annoyance | +0.771 |
pleas | +0.763 |
Rate | +0.743 |
± | +0.738 |
Neg logit contributions | |
uala | -1.201 |
eni | -1.065 |
itton | -0.937 |
atin | -0.903 |
Devi | -0.899 |
Token | two |
Token ID | 734 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
antioxid | +0.117 |
annoyance | +0.114 |
pleas | +0.113 |
Rate | +0.110 |
\\\\\\\\ | +0.109 |
Neg logit contributions | |
uala | -0.172 |
eni | -0.153 |
itton | -0.134 |
atin | -0.129 |
Devi | -0.129 |
Token | popular |
Token ID | 2968 |
Feature activation | -3.94e-01 |
Pos logit contributions | |
uala | +1.367 |
eni | +1.209 |
itton | +1.054 |
Devi | +1.024 |
atin | +1.021 |
Neg logit contributions | |
antioxid | -0.978 |
annoyance | -0.948 |
pleas | -0.935 |
\\\\\\\\ | -0.926 |
Rate | -0.924 |
Token | Luck |
Token ID | 14546 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
uala | +1.823 |
eni | +1.609 |
itton | +1.388 |
Devi | +1.350 |
atin | +1.346 |
Neg logit contributions | |
antioxid | -1.416 |
annoyance | -1.369 |
pleas | -1.350 |
\\\\\\\\ | -1.349 |
Rate | -1.340 |
Token | now |
Token ID | 2197 |
Feature activation | -7.84e-01 |
Pos logit contributions | |
uala | +5.479 |
eni | +4.504 |
atin | +3.243 |
etta | +3.171 |
Devi | +3.170 |
Neg logit contributions | |
antioxid | -9.958 |
ONSORED | -9.515 |
annoyance | -9.510 |
gery | -9.429 |
reven | -9.386 |
Token | - |
Token ID | 12 |
Feature activation | +3.35e-02 |
Pos logit contributions | |
uala | +3.684 |
eni | +3.276 |
Devi | +2.787 |
itton | +2.770 |
atin | +2.722 |
Neg logit contributions | |
antioxid | -2.763 |
\\\\\\\\ | -2.624 |
annoyance | -2.623 |
pleas | -2.580 |
Rate | -2.559 |
Token | based |
Token ID | 3106 |
Feature activation | -9.53e-01 |
Pos logit contributions | |
antioxid | +0.136 |
annoyance | +0.133 |
pleas | +0.132 |
Rate | +0.130 |
± | +0.129 |
Neg logit contributions | |
uala | -0.141 |
eni | -0.122 |
itton | -0.104 |
atin | -0.099 |
Devi | -0.099 |
Token | hel |
Token ID | 932 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
uala | +4.378 |
eni | +3.872 |
itton | +3.307 |
Devi | +3.302 |
atin | +3.237 |
Neg logit contributions | |
antioxid | -3.380 |
\\\\\\\\ | -3.293 |
annoyance | -3.204 |
ONSORED | -3.182 |
Rate | -3.182 |
Token | pl |
Token ID | 489 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
antioxid | +0.772 |
annoyance | +0.761 |
pleas | +0.755 |
Rate | +0.743 |
± | +0.740 |
Neg logit contributions | |
uala | -0.553 |
eni | -0.463 |
itton | -0.378 |
atin | -0.355 |
Devi | -0.353 |
Token | on |
Token ID | 319 |
Feature activation | -5.47e-01 |
Pos logit contributions | |
antioxid | +0.648 |
annoyance | +0.630 |
pleas | +0.622 |
Rate | +0.606 |
± | +0.600 |
Neg logit contributions | |
uala | -1.152 |
eni | -1.030 |
itton | -0.914 |
atin | -0.883 |
Devi | -0.880 |
Token | Division |
Token ID | 7458 |
Feature activation | -3.29e-01 |
Pos logit contributions | |
uala | +2.760 |
eni | +2.441 |
itton | +2.146 |
Devi | +2.089 |
atin | +2.077 |
Neg logit contributions | |
antioxid | -1.726 |
annoyance | -1.670 |
pleas | -1.646 |
Rate | -1.644 |
\\\\\\\\ | -1.617 |
Token | Street |
Token ID | 3530 |
Feature activation | -7.85e-01 |
Pos logit contributions | |
uala | +1.833 |
eni | +1.653 |
itton | +1.475 |
atin | +1.425 |
Devi | +1.422 |
Neg logit contributions | |
antioxid | -0.891 |
annoyance | -0.858 |
pleas | -0.843 |
Rate | -0.825 |
\\\\\\\\ | -0.816 |
Token | . |
Token ID | 13 |
Feature activation | -4.44e-01 |
Pos logit contributions | |
uala | +3.856 |
eni | +3.482 |
itton | +3.054 |
atin | +2.954 |
Devi | +2.940 |
Neg logit contributions | |
antioxid | -2.525 |
annoyance | -2.446 |
Rate | -2.414 |
pleas | -2.381 |
\\\\\\\\ | -2.362 |
Token | Block |
Token ID | 9726 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
uala | +2.135 |
eni | +1.893 |
itton | +1.619 |
Devi | +1.618 |
atin | +1.594 |
Neg logit contributions | |
antioxid | -1.542 |
annoyance | -1.497 |
pleas | -1.462 |
Rate | -1.430 |
\\\\\\\\ | -1.419 |
Token | after |
Token ID | 706 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
uala | +4.893 |
eni | +4.354 |
itton | +3.686 |
atin | +3.621 |
Devi | +3.565 |
Neg logit contributions | |
antioxid | -4.508 |
annoyance | -4.343 |
pleas | -4.238 |
gery | -4.205 |
---------- | -4.197 |
Token | block |
Token ID | 2512 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
uala | +6.352 |
eni | +5.357 |
itton | +4.497 |
Devi | +4.261 |
atin | +4.139 |
Neg logit contributions | |
antioxid | -8.073 |
Rate | -7.901 |
ULTS | -7.865 |
\\\\\\\\ | -7.714 |
Interest | -7.657 |
Token | is |
Token ID | 318 |
Feature activation | -9.05e-01 |
Pos logit contributions | |
uala | +6.795 |
eni | +6.196 |
itton | +5.387 |
Devi | +5.247 |
atin | +5.212 |
Neg logit contributions | |
antioxid | -4.144 |
Rate | -3.889 |
\\\\\\\\ | -3.889 |
annoyance | -3.872 |
ONSORED | -3.804 |
Token | filled |
Token ID | 5901 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
uala | +4.509 |
eni | +4.045 |
itton | +3.561 |
Devi | +3.444 |
atin | +3.443 |
Neg logit contributions | |
antioxid | -2.846 |
\\\\\\\\ | -2.754 |
Rate | -2.739 |
annoyance | -2.692 |
---------- | -2.627 |
Token | with |
Token ID | 351 |
Feature activation | -5.16e-01 |
Pos logit contributions | |
uala | +2.491 |
eni | +2.258 |
itton | +2.013 |
atin | +1.963 |
Devi | +1.958 |
Neg logit contributions | |
antioxid | -1.054 |
annoyance | -1.002 |
Rate | -0.973 |
\\\\\\\\ | -0.957 |
pleas | -0.956 |
Token | tents |
Token ID | 29804 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
uala | +2.674 |
eni | +2.409 |
itton | +2.113 |
Devi | +2.065 |
atin | +2.053 |
Neg logit contributions | |
antioxid | -1.539 |
annoyance | -1.468 |
\\\\\\\\ | -1.456 |
Rate | -1.451 |
± | -1.427 |
Token |
|
Token ID | 198 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
uala | +2.678 |
eni | +2.357 |
nil | +1.957 |
itton | +1.950 |
Devi | +1.922 |
Neg logit contributions | |
antioxid | -2.495 |
annoyance | -2.345 |
\\\\\\\\ | -2.263 |
reven | -2.259 |
unemploy | -2.243 |
Token | 20 |
Token ID | 1238 |
Feature activation | -8.69e-01 |
Pos logit contributions | |
uala | +0.696 |
eni | +0.598 |
itton | +0.507 |
atin | +0.486 |
Devi | +0.479 |
Neg logit contributions | |
antioxid | -0.709 |
annoyance | -0.697 |
pleas | -0.688 |
Rate | -0.669 |
± | -0.668 |
Token | . |
Token ID | 13 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
uala | +3.694 |
eni | +3.253 |
itton | +2.701 |
Devi | +2.700 |
nil | +2.692 |
Neg logit contributions | |
antioxid | -3.486 |
annoyance | -3.336 |
reven | -3.231 |
unemploy | -3.186 |
pleas | -3.180 |
Token | Chris |
Token ID | 5180 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
uala | +5.117 |
eni | +4.499 |
itton | +3.976 |
Devi | +3.968 |
atin | +3.890 |
Neg logit contributions | |
antioxid | -3.316 |
annoyance | -3.211 |
pleas | -3.146 |
Rate | -3.063 |
---------- | -3.026 |
Token | F |
Token ID | 376 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
antioxid | +0.815 |
annoyance | +0.799 |
pleas | +0.791 |
Rate | +0.771 |
± | +0.769 |
Neg logit contributions | |
uala | -1.209 |
eni | -1.071 |
itton | -0.943 |
atin | -0.907 |
Devi | -0.900 |
Token | us |
Token ID | 385 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
uala | +0.441 |
eni | +0.383 |
itton | +0.330 |
atin | +0.314 |
Devi | +0.308 |
Neg logit contributions | |
antioxid | -0.418 |
annoyance | -0.409 |
pleas | -0.406 |
Rate | -0.396 |
---------- | -0.394 |
Token | aro |
Token ID | 12022 |
Feature activation | -4.98e-02 |
Pos logit contributions | |
uala | +7.949 |
eni | +7.217 |
itton | +6.130 |
atin | +5.963 |
etta | +5.890 |
Neg logit contributions | |
antioxid | -7.402 |
\\\\\\\\ | -7.013 |
ONSORED | -6.931 |
annoyance | -6.838 |
---------- | -6.671 |
Token | ( |
Token ID | 357 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
uala | +0.292 |
eni | +0.264 |
itton | +0.237 |
atin | +0.231 |
Devi | +0.230 |
Neg logit contributions | |
antioxid | -0.119 |
annoyance | -0.115 |
pleas | -0.113 |
Rate | -0.110 |
± | -0.109 |
Token | 117 |
Token ID | 17657 |
Feature activation | -8.14e-02 |
Pos logit contributions | |
uala | +1.752 |
eni | +1.510 |
itton | +1.269 |
nil | +1.252 |
atin | +1.243 |
Neg logit contributions | |
antioxid | -1.793 |
annoyance | -1.723 |
pleas | -1.685 |
regression | -1.650 |
reven | -1.645 |
Token | ) |
Token ID | 8 |
Feature activation | -1.99e-01 |
Pos logit contributions | |
uala | +0.409 |
eni | +0.365 |
itton | +0.319 |
atin | +0.310 |
nil | +0.309 |
Neg logit contributions | |
antioxid | -0.270 |
annoyance | -0.258 |
pleas | -0.250 |
\\\\\\\\ | -0.245 |
Rate | -0.244 |
Token | ( |
Token ID | 357 |
Feature activation | -3.34e-01 |
Pos logit contributions | |
uala | +1.098 |
eni | +0.993 |
itton | +0.879 |
Devi | +0.860 |
atin | +0.858 |
Neg logit contributions | |
antioxid | -0.550 |
annoyance | -0.525 |
pleas | -0.505 |
\\\\\\\\ | -0.493 |
Rate | -0.491 |
Token | if |
Token ID | 611 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
uala | +0.830 |
eni | +0.732 |
itton | +0.638 |
atin | +0.617 |
Devi | +0.616 |
Neg logit contributions | |
antioxid | -0.608 |
annoyance | -0.587 |
pleas | -0.576 |
Rate | -0.570 |
\\\\\\\\ | -0.567 |
Token | he |
Token ID | 339 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
uala | +1.169 |
eni | +1.044 |
itton | +0.922 |
atin | +0.899 |
Devi | +0.894 |
Neg logit contributions | |
antioxid | -0.671 |
annoyance | -0.648 |
pleas | -0.628 |
Rate | -0.621 |
\\\\\\\\ | -0.619 |
Token | receives |
Token ID | 11583 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
uala | +1.515 |
eni | +1.379 |
itton | +1.212 |
atin | +1.182 |
Devi | +1.176 |
Neg logit contributions | |
antioxid | -0.817 |
annoyance | -0.772 |
Rate | -0.739 |
pleas | -0.735 |
\\\\\\\\ | -0.730 |
Token | food |
Token ID | 2057 |
Feature activation | -6.30e-01 |
Pos logit contributions | |
uala | +1.260 |
eni | +1.121 |
itton | +0.985 |
atin | +0.961 |
Devi | +0.954 |
Neg logit contributions | |
antioxid | -0.788 |
annoyance | -0.762 |
pleas | -0.740 |
\\\\\\\\ | -0.740 |
Rate | -0.737 |
Token | and |
Token ID | 290 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
uala | +2.737 |
eni | +2.418 |
itton | +2.082 |
atin | +2.017 |
nil | +1.960 |
Neg logit contributions | |
antioxid | -2.415 |
annoyance | -2.325 |
pleas | -2.294 |
± | -2.284 |
Rate | -2.280 |
Token | shelter |
Token ID | 11772 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
uala | +6.148 |
eni | +5.501 |
itton | +4.668 |
Devi | +4.663 |
atin | +4.639 |
Neg logit contributions | |
antioxid | -4.877 |
\\\\\\\\ | -4.781 |
ULTS | -4.656 |
Rate | -4.653 |
annoyance | -4.640 |
Token | , |
Token ID | 11 |
Feature activation | -5.69e-01 |
Pos logit contributions | |
uala | +8.276 |
eni | +7.395 |
itton | +6.414 |
atin | +6.270 |
nil | +6.167 |
Neg logit contributions | |
antioxid | -6.259 |
annoyance | -5.761 |
\\\\\\\\ | -5.710 |
Rate | -5.704 |
---------- | -5.703 |
Token | or |
Token ID | 393 |
Feature activation | +3.98e-01 |
Pos logit contributions | |
uala | +2.803 |
eni | +2.482 |
itton | +2.169 |
Devi | +2.119 |
atin | +2.112 |
Neg logit contributions | |
antioxid | -1.901 |
annoyance | -1.808 |
\\\\\\\\ | -1.776 |
Rate | -1.769 |
pleas | -1.759 |
Token | if |
Token ID | 611 |
Feature activation | +2.76e-01 |
Pos logit contributions | |
antioxid | +1.205 |
annoyance | +1.183 |
pleas | +1.175 |
Rate | +1.131 |
± | +1.124 |
Neg logit contributions | |
uala | -2.078 |
eni | -1.851 |
itton | -1.645 |
atin | -1.582 |
Devi | -1.577 |
Token | he |
Token ID | 339 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
antioxid | +0.808 |
annoyance | +0.791 |
pleas | +0.785 |
Rate | +0.758 |
± | +0.752 |
Neg logit contributions | |
uala | -1.468 |
eni | -1.311 |
itton | -1.166 |
atin | -1.125 |
Devi | -1.120 |
Token | gets |
Token ID | 3011 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
uala | +0.615 |
eni | +0.554 |
itton | +0.489 |
atin | +0.473 |
Devi | +0.472 |
Neg logit contributions | |
antioxid | -0.356 |
annoyance | -0.342 |
pleas | -0.332 |
Rate | -0.329 |
---------- | -0.324 |
Token | , |
Token ID | 11 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
antioxid | +0.977 |
annoyance | +0.956 |
pleas | +0.947 |
Rate | +0.923 |
± | +0.918 |
Neg logit contributions | |
uala | -1.416 |
eni | -1.252 |
itton | -1.098 |
atin | -1.057 |
Devi | -1.053 |
Token | telecommunications |
Token ID | 27473 |
Feature activation | +5.64e-01 |
Pos logit contributions | |
antioxid | +0.435 |
annoyance | +0.422 |
pleas | +0.413 |
Rate | +0.406 |
\\\\\\\\ | +0.399 |
Neg logit contributions | |
uala | -0.796 |
eni | -0.711 |
itton | -0.633 |
atin | -0.612 |
Devi | -0.611 |
Token | companies |
Token ID | 2706 |
Feature activation | -3.99e-02 |
Pos logit contributions | |
antioxid | +1.242 |
annoyance | +1.198 |
pleas | +1.177 |
Rate | +1.134 |
± | +1.121 |
Neg logit contributions | |
uala | -3.421 |
eni | -3.103 |
itton | -2.803 |
atin | -2.724 |
Devi | -2.715 |
Token | were |
Token ID | 547 |
Feature activation | -4.48e-01 |
Pos logit contributions | |
uala | +0.208 |
eni | +0.186 |
itton | +0.164 |
atin | +0.159 |
Devi | +0.158 |
Neg logit contributions | |
antioxid | -0.124 |
annoyance | -0.117 |
pleas | -0.115 |
Rate | -0.113 |
\\\\\\\\ | -0.113 |
Token | granted |
Token ID | 7520 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
uala | +2.295 |
eni | +2.044 |
itton | +1.818 |
atin | +1.759 |
Devi | +1.729 |
Neg logit contributions | |
antioxid | -1.406 |
annoyance | -1.336 |
\\\\\\\\ | -1.328 |
Rate | -1.315 |
pleas | -1.285 |
Token | retro |
Token ID | 12175 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
uala | +0.775 |
eni | +0.690 |
itton | +0.617 |
atin | +0.593 |
Devi | +0.590 |
Neg logit contributions | |
antioxid | -0.432 |
annoyance | -0.417 |
pleas | -0.409 |
Rate | -0.406 |
\\\\\\\\ | -0.404 |
Token | active |
Token ID | 5275 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
uala | +7.832 |
eni | +7.219 |
itton | +6.299 |
Devi | +5.999 |
atin | +5.934 |
Neg logit contributions | |
antioxid | -6.367 |
\\\\\\\\ | -6.265 |
annoyance | -6.105 |
ULTS | -6.060 |
ONSORED | -6.055 |
Token | immunity |
Token ID | 16989 |
Feature activation | -4.02e-01 |
Pos logit contributions | |
uala | +9.023 |
eni | +8.017 |
itton | +7.152 |
Devi | +6.927 |
atin | +6.891 |
Neg logit contributions | |
antioxid | -4.268 |
ONSORED | -4.179 |
ULTS | -4.177 |
\\\\\\\\ | -4.128 |
Rate | -4.096 |
Token | for |
Token ID | 329 |
Feature activation | +4.67e-03 |
Pos logit contributions | |
uala | +2.019 |
eni | +1.797 |
itton | +1.565 |
atin | +1.525 |
Devi | +1.522 |
Neg logit contributions | |
antioxid | -1.311 |
annoyance | -1.247 |
Rate | -1.222 |
\\\\\\\\ | -1.206 |
pleas | -1.200 |
Token | violating |
Token ID | 18134 |
Feature activation | -1.93e-01 |
Pos logit contributions | |
antioxid | +0.014 |
annoyance | +0.013 |
\\\\\\\\ | +0.013 |
pleas | +0.013 |
Rate | +0.013 |
Neg logit contributions | |
uala | -0.025 |
eni | -0.023 |
itton | -0.020 |
atin | -0.019 |
Devi | -0.019 |
Token | the |
Token ID | 262 |
Feature activation | +9.43e-03 |
Pos logit contributions | |
uala | +1.014 |
eni | +0.900 |
itton | +0.804 |
atin | +0.768 |
Devi | +0.764 |
Neg logit contributions | |
antioxid | -0.573 |
annoyance | -0.557 |
Rate | -0.547 |
pleas | -0.540 |
\\\\\\\\ | -0.537 |
Token | though |
Token ID | 996 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
uala | +4.976 |
eni | +4.459 |
itton | +3.939 |
atin | +3.794 |
nil | +3.772 |
Neg logit contributions | |
antioxid | -3.834 |
\\\\\\\\ | -3.780 |
± | -3.708 |
Rate | -3.654 |
gery | -3.643 |
Token | is |
Token ID | 318 |
Feature activation | -8.99e-01 |
Pos logit contributions | |
uala | +5.170 |
eni | +4.722 |
itton | +4.043 |
nil | +3.993 |
Devi | +3.951 |
Neg logit contributions | |
antioxid | -4.215 |
ONSORED | -3.938 |
\\\\\\\\ | -3.900 |
annoyance | -3.855 |
unemploy | -3.776 |
Token | the |
Token ID | 262 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
uala | +4.044 |
eni | +3.528 |
itton | +2.967 |
nil | +2.962 |
Devi | +2.925 |
Neg logit contributions | |
antioxid | -3.413 |
annoyance | -3.143 |
\\\\\\\\ | -3.095 |
ONSORED | -3.090 |
reven | -3.084 |
Token | one |
Token ID | 530 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
uala | +4.575 |
eni | +4.050 |
itton | +3.470 |
atin | +3.319 |
nil | +3.317 |
Neg logit contributions | |
antioxid | -4.171 |
\\\\\\\\ | -3.965 |
ONSORED | -3.864 |
Rate | -3.835 |
ghazi | -3.823 |
Token | that |
Token ID | 326 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
uala | +1.047 |
eni | +0.938 |
itton | +0.834 |
atin | +0.823 |
Devi | +0.811 |
Neg logit contributions | |
antioxid | -0.524 |
\\\\\\\\ | -0.475 |
annoyance | -0.470 |
ONSORED | -0.468 |
Rate | -0.465 |
Token | I |
Token ID | 314 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
uala | +5.352 |
eni | +4.894 |
Devi | +4.174 |
itton | +4.083 |
nil | +4.041 |
Neg logit contributions | |
antioxid | -4.503 |
\\\\\\\\ | -4.150 |
annoyance | -4.033 |
reven | -4.026 |
ONSORED | -4.024 |
Token | find |
Token ID | 1064 |
Feature activation | -9.03e-01 |
Pos logit contributions | |
uala | +6.170 |
eni | +5.552 |
itton | +4.511 |
atin | +4.331 |
hurst | +4.305 |
Neg logit contributions | |
antioxid | -8.333 |
ONSORED | -7.958 |
\\\\\\\\ | -7.842 |
gery | -7.618 |
annoyance | -7.508 |
Token | the |
Token ID | 262 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
uala | +4.065 |
eni | +3.564 |
nil | +2.966 |
Devi | +2.957 |
itton | +2.949 |
Neg logit contributions | |
antioxid | -3.445 |
annoyance | -3.158 |
reven | -3.112 |
ONSORED | -3.102 |
\\\\\\\\ | -3.102 |
Token | most |
Token ID | 749 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
uala | +4.920 |
eni | +4.345 |
itton | +3.526 |
nil | +3.412 |
hurst | +3.395 |
Neg logit contributions | |
antioxid | -5.637 |
\\\\\\\\ | -5.451 |
ONSORED | -5.207 |
gery | -5.162 |
Rate | -5.157 |
Token | annoying |
Token ID | 15774 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
uala | +7.036 |
eni | +6.511 |
itton | +5.720 |
Devi | +5.603 |
atin | +5.551 |
Neg logit contributions | |
\\\\\\\\ | -3.752 |
antioxid | -3.671 |
Rate | -3.483 |
ULTS | -3.422 |
akespeare | -3.374 |
Token | / |
Token ID | 14 |
Feature activation | -8.99e-01 |
Pos logit contributions | |
uala | +5.509 |
eni | +5.007 |
itton | +4.229 |
Devi | +4.206 |
atin | +4.190 |
Neg logit contributions | |
antioxid | -4.030 |
annoyance | -3.704 |
ONSORED | -3.672 |
unemploy | -3.665 |
reven | -3.660 |
Token | � |
Token ID | 251 |
Feature activation | +2.14e-01 |
Pos logit contributions | |
uala | +1.638 |
eni | +1.454 |
itton | +1.286 |
Devi | +1.246 |
atin | +1.236 |
Neg logit contributions | |
antioxid | -0.984 |
annoyance | -0.967 |
pleas | -0.940 |
Rate | -0.920 |
gery | -0.911 |
Token | . |
Token ID | 13 |
Feature activation | +2.82e-01 |
Pos logit contributions | |
antioxid | +0.596 |
annoyance | +0.577 |
pleas | +0.566 |
Rate | +0.555 |
---------- | +0.545 |
Neg logit contributions | |
uala | -1.178 |
eni | -1.054 |
itton | -0.939 |
atin | -0.912 |
Devi | -0.909 |
Token |
|
Token ID | 198 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
antioxid | +0.912 |
annoyance | +0.891 |
pleas | +0.884 |
Rate | +0.860 |
± | +0.857 |
Neg logit contributions | |
uala | -1.416 |
eni | -1.258 |
itton | -1.110 |
atin | -1.068 |
Devi | -1.061 |
Token |
|
Token ID | 198 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
antioxid | +0.723 |
annoyance | +0.702 |
pleas | +0.689 |
Rate | +0.672 |
\\\\\\\\ | +0.669 |
Neg logit contributions | |
uala | -1.044 |
eni | -0.924 |
itton | -0.807 |
atin | -0.780 |
Devi | -0.778 |
Token | She |
Token ID | 3347 |
Feature activation | +8.00e-02 |
Pos logit contributions | |
uala | +0.676 |
eni | +0.597 |
itton | +0.520 |
atin | +0.505 |
nil | +0.501 |
Neg logit contributions | |
antioxid | -0.472 |
annoyance | -0.460 |
pleas | -0.450 |
regression | -0.437 |
Rate | -0.434 |
Token | appealed |
Token ID | 22280 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
antioxid | +0.248 |
annoyance | +0.239 |
pleas | +0.233 |
Rate | +0.231 |
\\\\\\\\ | +0.229 |
Neg logit contributions | |
uala | -0.417 |
eni | -0.373 |
itton | -0.329 |
atin | -0.317 |
Devi | -0.317 |
Token | once |
Token ID | 1752 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
uala | +9.028 |
eni | +7.857 |
Devi | +6.961 |
itton | +6.939 |
nil | +6.869 |
Neg logit contributions | |
antioxid | -5.548 |
Rate | -5.241 |
annoyance | -5.190 |
---------- | -5.127 |
\\\\\\\\ | -5.096 |
Token | again |
Token ID | 757 |
Feature activation | +5.58e-01 |
Pos logit contributions | |
antioxid | +1.623 |
annoyance | +1.592 |
pleas | +1.588 |
± | +1.508 |
Rate | +1.507 |
Neg logit contributions | |
uala | -3.459 |
eni | -3.116 |
itton | -2.791 |
atin | -2.708 |
� | -2.686 |
Token | to |
Token ID | 284 |
Feature activation | +3.72e-01 |
Pos logit contributions | |
antioxid | +1.422 |
pleas | +1.402 |
annoyance | +1.400 |
± | +1.332 |
Rate | +1.322 |
Neg logit contributions | |
uala | -3.157 |
eni | -2.838 |
itton | -2.552 |
atin | -2.471 |
Devi | -2.455 |
Token | Judge |
Token ID | 8974 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
antioxid | +1.157 |
annoyance | +1.135 |
pleas | +1.125 |
Rate | +1.090 |
± | +1.084 |
Neg logit contributions | |
uala | -1.908 |
eni | -1.703 |
itton | -1.503 |
atin | -1.453 |
Devi | -1.442 |
Token | H |
Token ID | 367 |
Feature activation | -3.78e-01 |
Pos logit contributions | |
uala | +0.582 |
eni | +0.512 |
itton | +0.451 |
Devi | +0.437 |
atin | +0.435 |
Neg logit contributions | |
antioxid | -0.394 |
annoyance | -0.384 |
pleas | -0.377 |
Rate | -0.371 |
---------- | -0.367 |
Token | and |
Token ID | 290 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
antioxid | +1.125 |
annoyance | +1.097 |
pleas | +1.084 |
Rate | +1.052 |
± | +1.046 |
Neg logit contributions | |
uala | -2.014 |
eni | -1.799 |
itton | -1.597 |
atin | -1.544 |
Devi | -1.538 |
Token | owns |
Token ID | 12216 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
antioxid | +0.515 |
annoyance | +0.499 |
pleas | +0.491 |
Rate | +0.479 |
± | +0.474 |
Neg logit contributions | |
uala | -0.976 |
eni | -0.876 |
itton | -0.780 |
atin | -0.757 |
Devi | -0.754 |
Token | the |
Token ID | 262 |
Feature activation | -9.54e-01 |
Pos logit contributions | |
uala | +2.922 |
eni | +2.607 |
itton | +2.317 |
Devi | +2.254 |
atin | +2.248 |
Neg logit contributions | |
antioxid | -1.776 |
annoyance | -1.718 |
pleas | -1.674 |
\\\\\\\\ | -1.660 |
Rate | -1.652 |
Token | fast |
Token ID | 3049 |
Feature activation | -7.97e-01 |
Pos logit contributions | |
uala | +4.799 |
eni | +4.277 |
itton | +3.788 |
Devi | +3.700 |
atin | +3.695 |
Neg logit contributions | |
antioxid | -2.947 |
annoyance | -2.817 |
\\\\\\\\ | -2.779 |
Rate | -2.754 |
pleas | -2.745 |
Token | food |
Token ID | 2057 |
Feature activation | -8.37e-01 |
Pos logit contributions | |
uala | +3.727 |
eni | +3.336 |
itton | +2.927 |
atin | +2.822 |
Devi | +2.768 |
Neg logit contributions | |
antioxid | -2.759 |
annoyance | -2.668 |
pleas | -2.619 |
\\\\\\\\ | -2.613 |
Rate | -2.573 |
Token | chain |
Token ID | 6333 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
uala | +3.987 |
eni | +3.600 |
itton | +3.151 |
atin | +3.015 |
Devi | +2.977 |
Neg logit contributions | |
antioxid | -2.860 |
annoyance | -2.709 |
Rate | -2.682 |
pleas | -2.679 |
\\\\\\\\ | -2.676 |
Token | Fat |
Token ID | 12301 |
Feature activation | -6.10e-01 |
Pos logit contributions | |
uala | +8.214 |
eni | +7.511 |
Devi | +6.491 |
itton | +6.480 |
atin | +6.435 |
Neg logit contributions | |
antioxid | -5.868 |
annoyance | -5.669 |
\\\\\\\\ | -5.641 |
pleas | -5.468 |
Rate | -5.427 |
Token | bur |
Token ID | 6236 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
uala | +3.086 |
eni | +2.760 |
itton | +2.411 |
atin | +2.344 |
Devi | +2.332 |
Neg logit contributions | |
antioxid | -1.961 |
annoyance | -1.898 |
pleas | -1.859 |
\\\\\\\\ | -1.807 |
Rate | -1.789 |
Token | ger |
Token ID | 1362 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
antioxid | +0.484 |
annoyance | +0.472 |
pleas | +0.467 |
Rate | +0.455 |
± | +0.451 |
Neg logit contributions | |
uala | -0.784 |
eni | -0.698 |
itton | -0.616 |
atin | -0.595 |
Devi | -0.592 |
Token | . |
Token ID | 13 |
Feature activation | -6.73e-01 |
Pos logit contributions | |
antioxid | +0.082 |
annoyance | +0.080 |
pleas | +0.079 |
Rate | +0.077 |
± | +0.076 |
Neg logit contributions | |
uala | -0.132 |
eni | -0.117 |
itton | -0.104 |
atin | -0.100 |
Devi | -0.100 |
Token |
|
Token ID | 198 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
uala | +3.267 |
eni | +2.919 |
itton | +2.546 |
Devi | +2.510 |
atin | +2.496 |
Neg logit contributions | |
antioxid | -2.265 |
annoyance | -2.209 |
pleas | -2.131 |
regression | -2.081 |
reven | -2.078 |
Token | preliminary |
Token ID | 15223 |
Feature activation | +1.14e-01 |
Pos logit contributions | |
uala | +1.329 |
eni | +1.172 |
itton | +1.016 |
Devi | +0.982 |
atin | +0.977 |
Neg logit contributions | |
antioxid | -0.993 |
annoyance | -0.955 |
\\\\\\\\ | -0.943 |
Rate | -0.937 |
pleas | -0.935 |
Token | injunction |
Token ID | 27439 |
Feature activation | -9.60e-02 |
Pos logit contributions | |
antioxid | +0.425 |
annoyance | +0.414 |
pleas | +0.409 |
Rate | +0.404 |
\\\\\\\\ | +0.403 |
Neg logit contributions | |
uala | -0.514 |
eni | -0.449 |
itton | -0.388 |
Devi | -0.373 |
atin | -0.373 |
Token | after |
Token ID | 706 |
Feature activation | -3.69e-01 |
Pos logit contributions | |
uala | +0.513 |
eni | +0.458 |
itton | +0.407 |
atin | +0.394 |
Devi | +0.394 |
Neg logit contributions | |
antioxid | -0.280 |
annoyance | -0.270 |
pleas | -0.265 |
Rate | -0.262 |
\\\\\\\\ | -0.262 |
Token | the |
Token ID | 262 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
uala | +1.884 |
eni | +1.671 |
itton | +1.489 |
Devi | +1.442 |
atin | +1.432 |
Neg logit contributions | |
antioxid | -1.159 |
annoyance | -1.113 |
\\\\\\\\ | -1.083 |
Rate | -1.081 |
---------- | -1.075 |
Token | student |
Token ID | 3710 |
Feature activation | -4.04e-02 |
Pos logit contributions | |
antioxid | +0.604 |
annoyance | +0.587 |
pleas | +0.578 |
Rate | +0.565 |
---------- | +0.559 |
Neg logit contributions | |
uala | -1.115 |
eni | -0.999 |
itton | -0.886 |
atin | -0.858 |
Devi | -0.857 |
Token | appealed |
Token ID | 22280 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
uala | +0.203 |
eni | +0.181 |
itton | +0.159 |
atin | +0.154 |
Devi | +0.154 |
Neg logit contributions | |
antioxid | -0.131 |
annoyance | -0.127 |
pleas | -0.125 |
Rate | -0.123 |
\\\\\\\\ | -0.122 |
Token | his |
Token ID | 465 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
uala | +8.284 |
eni | +7.459 |
itton | +6.553 |
Devi | +6.471 |
atin | +6.362 |
Neg logit contributions | |
antioxid | -5.795 |
\\\\\\\\ | -5.633 |
---------- | -5.575 |
Rate | -5.533 |
annoyance | -5.451 |
Token | University |
Token ID | 2059 |
Feature activation | +1.76e-01 |
Pos logit contributions | |
uala | +1.012 |
eni | +0.899 |
itton | +0.792 |
Devi | +0.765 |
atin | +0.764 |
Neg logit contributions | |
antioxid | -0.639 |
annoyance | -0.613 |
pleas | -0.601 |
Rate | -0.601 |
\\\\\\\\ | -0.598 |
Token | of |
Token ID | 286 |
Feature activation | +5.44e-01 |
Pos logit contributions | |
antioxid | +0.403 |
annoyance | +0.391 |
pleas | +0.385 |
Rate | +0.373 |
± | +0.368 |
Neg logit contributions | |
uala | -1.055 |
eni | -0.954 |
itton | -0.859 |
atin | -0.835 |
Devi | -0.832 |
Token | Cincinnati |
Token ID | 16137 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
antioxid | +1.677 |
annoyance | +1.656 |
pleas | +1.647 |
± | +1.609 |
Rate | +1.589 |
Neg logit contributions | |
uala | -2.800 |
eni | -2.491 |
itton | -2.210 |
atin | -2.111 |
� | -2.091 |
Token | suspension |
Token ID | 11461 |
Feature activation | -5.33e-03 |
Pos logit contributions | |
antioxid | +0.381 |
annoyance | +0.373 |
pleas | +0.369 |
Rate | +0.359 |
± | +0.357 |
Neg logit contributions | |
uala | -0.571 |
eni | -0.505 |
itton | -0.445 |
atin | -0.429 |
Devi | -0.427 |
Token | we |
Token ID | 356 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
antioxid | +0.033 |
annoyance | +0.033 |
pleas | +0.032 |
Rate | +0.031 |
± | +0.031 |
Neg logit contributions | |
uala | -0.060 |
eni | -0.053 |
itton | -0.047 |
atin | -0.046 |
Devi | -0.046 |
Token | now |
Token ID | 783 |
Feature activation | -5.04e-01 |
Pos logit contributions | |
uala | +2.079 |
eni | +1.869 |
itton | +1.626 |
atin | +1.573 |
Devi | +1.571 |
Neg logit contributions | |
antioxid | -1.410 |
annoyance | -1.360 |
\\\\\\\\ | -1.330 |
pleas | -1.318 |
Rate | -1.307 |
Token | know |
Token ID | 760 |
Feature activation | -3.03e-02 |
Pos logit contributions | |
uala | +2.431 |
eni | +2.167 |
itton | +1.886 |
atin | +1.824 |
Devi | +1.807 |
Neg logit contributions | |
antioxid | -1.728 |
annoyance | -1.667 |
\\\\\\\\ | -1.634 |
pleas | -1.622 |
Rate | -1.611 |
Token | existed |
Token ID | 11196 |
Feature activation | -3.33e-01 |
Pos logit contributions | |
uala | +0.160 |
eni | +0.143 |
itton | +0.126 |
Devi | +0.123 |
atin | +0.123 |
Neg logit contributions | |
antioxid | -0.090 |
annoyance | -0.087 |
pleas | -0.085 |
Rate | -0.084 |
\\\\\\\\ | -0.084 |
Token | on |
Token ID | 319 |
Feature activation | -5.53e-01 |
Pos logit contributions | |
uala | +1.706 |
eni | +1.531 |
itton | +1.338 |
Devi | +1.310 |
atin | +1.291 |
Neg logit contributions | |
antioxid | -1.029 |
annoyance | -0.997 |
Rate | -0.979 |
pleas | -0.969 |
\\\\\\\\ | -0.969 |
Token | Hispan |
Token ID | 13600 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
uala | +2.615 |
eni | +2.289 |
itton | +1.981 |
Devi | +1.971 |
atin | +1.922 |
Neg logit contributions | |
antioxid | -1.923 |
annoyance | -1.882 |
pleas | -1.847 |
Rate | -1.836 |
\\\\\\\\ | -1.828 |
Token | iola |
Token ID | 30292 |
Feature activation | -5.37e-01 |
Pos logit contributions | |
uala | +5.599 |
eni | +4.554 |
Devi | +3.219 |
atin | +3.206 |
etta | +3.142 |
Neg logit contributions | |
antioxid | -9.276 |
annoyance | -8.984 |
pleas | -8.852 |
\\\\\\\\ | -8.765 |
ONSORED | -8.756 |
Token | relatively |
Token ID | 5365 |
Feature activation | -6.80e-01 |
Pos logit contributions | |
uala | +2.694 |
eni | +2.409 |
itton | +2.077 |
Devi | +2.050 |
atin | +2.016 |
Neg logit contributions | |
antioxid | -1.735 |
annoyance | -1.685 |
Rate | -1.636 |
pleas | -1.628 |
\\\\\\\\ | -1.621 |
Token | unchanged |
Token ID | 21588 |
Feature activation | -4.63e-01 |
Pos logit contributions | |
uala | +3.513 |
eni | +3.166 |
Devi | +2.755 |
itton | +2.745 |
atin | +2.696 |
Neg logit contributions | |
antioxid | -1.991 |
\\\\\\\\ | -1.932 |
annoyance | -1.906 |
Rate | -1.896 |
pleas | -1.837 |
Token | for |
Token ID | 329 |
Feature activation | +4.18e-01 |
Pos logit contributions | |
uala | +2.293 |
eni | +2.063 |
itton | +1.796 |
Devi | +1.754 |
atin | +1.747 |
Neg logit contributions | |
antioxid | -1.492 |
annoyance | -1.442 |
pleas | -1.410 |
Rate | -1.409 |
\\\\\\\\ | -1.408 |
Token | over |
Token ID | 625 |
Feature activation | -2.54e-01 |
Pos logit contributions | |
antioxid | +1.184 |
annoyance | +1.151 |
pleas | +1.135 |
Rate | +1.104 |
---------- | +1.093 |
Neg logit contributions | |
uala | -2.269 |
eni | -2.033 |
itton | -1.810 |
atin | -1.755 |
Devi | -1.749 |
Token | ost |
Token ID | 455 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
uala | +0.460 |
eni | +0.396 |
itton | +0.333 |
atin | +0.317 |
Devi | +0.314 |
Neg logit contributions | |
antioxid | -0.503 |
annoyance | -0.494 |
pleas | -0.489 |
Rate | -0.480 |
---------- | -0.478 |
Token | ach |
Token ID | 620 |
Feature activation | +3.23e-02 |
Pos logit contributions | |
uala | +3.669 |
eni | +3.295 |
atin | +2.642 |
itton | +2.559 |
etta | +2.432 |
Neg logit contributions | |
antioxid | -4.616 |
annoyance | -4.523 |
pleas | -4.449 |
\\\\\\\\ | -4.418 |
reven | -4.402 |
Token | , |
Token ID | 11 |
Feature activation | -4.73e-01 |
Pos logit contributions | |
antioxid | +0.104 |
annoyance | +0.102 |
pleas | +0.101 |
Rate | +0.098 |
± | +0.097 |
Neg logit contributions | |
uala | -0.162 |
eni | -0.144 |
itton | -0.127 |
atin | -0.123 |
Devi | -0.122 |
Token | a |
Token ID | 257 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
uala | +2.478 |
eni | +2.229 |
itton | +1.975 |
atin | +1.944 |
Devi | +1.937 |
Neg logit contributions | |
antioxid | -1.374 |
annoyance | -1.342 |
pleas | -1.320 |
\\\\\\\\ | -1.300 |
Rate | -1.289 |
Token | fuel |
Token ID | 5252 |
Feature activation | -7.78e-01 |
Pos logit contributions | |
uala | +3.160 |
eni | +2.823 |
itton | +2.514 |
Devi | +2.471 |
atin | +2.451 |
Neg logit contributions | |
antioxid | -1.729 |
annoyance | -1.679 |
pleas | -1.653 |
\\\\\\\\ | -1.645 |
Rate | -1.639 |
Token | supplier |
Token ID | 22693 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
uala | +3.608 |
eni | +3.215 |
itton | +2.791 |
atin | +2.704 |
Devi | +2.659 |
Neg logit contributions | |
antioxid | -2.749 |
annoyance | -2.631 |
pleas | -2.629 |
Rate | -2.592 |
---------- | -2.581 |
Token | which |
Token ID | 543 |
Feature activation | -7.58e-01 |
Pos logit contributions | |
uala | +8.371 |
eni | +7.429 |
itton | +6.462 |
Devi | +6.460 |
atin | +6.420 |
Neg logit contributions | |
antioxid | -5.603 |
\\\\\\\\ | -5.417 |
annoyance | -5.402 |
pleas | -5.379 |
Rate | -5.353 |
Token | is |
Token ID | 318 |
Feature activation | -5.26e-01 |
Pos logit contributions | |
uala | +3.801 |
eni | +3.445 |
itton | +2.995 |
Devi | +2.988 |
atin | +2.953 |
Neg logit contributions | |
antioxid | -2.354 |
annoyance | -2.308 |
\\\\\\\\ | -2.217 |
pleas | -2.210 |
---------- | -2.204 |
Token | connected |
Token ID | 5884 |
Feature activation | -6.82e-01 |
Pos logit contributions | |
uala | +2.622 |
eni | +2.353 |
itton | +2.054 |
atin | +2.018 |
Devi | +2.013 |
Neg logit contributions | |
antioxid | -1.682 |
annoyance | -1.640 |
\\\\\\\\ | -1.604 |
pleas | -1.600 |
Rate | -1.594 |
Token | to |
Token ID | 284 |
Feature activation | -5.68e-01 |
Pos logit contributions | |
uala | +3.852 |
eni | +3.475 |
itton | +3.100 |
atin | +3.030 |
Devi | +3.008 |
Neg logit contributions | |
antioxid | -1.727 |
annoyance | -1.677 |
pleas | -1.625 |
Rate | -1.617 |
\\\\\\\\ | -1.602 |
Token | Priv |
Token ID | 9243 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
uala | +2.664 |
eni | +2.349 |
itton | +2.049 |
Devi | +2.000 |
atin | +1.987 |
Neg logit contributions | |
antioxid | -1.987 |
annoyance | -1.950 |
pleas | -1.911 |
\\\\\\\\ | -1.885 |
Rate | -1.881 |
Token | t |
Token ID | 83 |
Feature activation | +4.56e-01 |
Pos logit contributions | |
antioxid | +1.484 |
annoyance | +1.453 |
pleas | +1.439 |
Rate | +1.403 |
± | +1.395 |
Neg logit contributions | |
uala | -2.383 |
eni | -2.116 |
itton | -1.869 |
atin | -1.802 |
Devi | -1.798 |
Token | . |
Token ID | 13 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
antioxid | +1.499 |
annoyance | +1.467 |
pleas | +1.454 |
Rate | +1.418 |
± | +1.412 |
Neg logit contributions | |
uala | -2.269 |
eni | -2.010 |
itton | -1.769 |
atin | -1.704 |
Devi | -1.697 |
Token | F |
Token ID | 376 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
antioxid | +0.611 |
annoyance | +0.595 |
pleas | +0.584 |
± | +0.571 |
Rate | +0.570 |
Neg logit contributions | |
uala | -1.101 |
eni | -0.984 |
itton | -0.873 |
atin | -0.844 |
Devi | -0.833 |
Token | RA |
Token ID | 3861 |
Feature activation | +3.50e-01 |
Pos logit contributions | |
uala | +5.455 |
eni | +4.632 |
itton | +4.046 |
atin | +3.842 |
nil | +3.716 |
Neg logit contributions | |
antioxid | -4.936 |
annoyance | -4.750 |
pleas | -4.745 |
regression | -4.661 |
\\\\\\\\ | -4.659 |
Token | 13 |
Token ID | 1511 |
Feature activation | -6.06e-01 |
Pos logit contributions | |
antioxid | +0.760 |
annoyance | +0.734 |
pleas | +0.723 |
± | +0.700 |
Rate | +0.694 |
Neg logit contributions | |
uala | -2.130 |
eni | -1.930 |
itton | -1.745 |
atin | -1.701 |
Devi | -1.681 |
Token | Rom |
Token ID | 3570 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
uala | +2.927 |
eni | +2.585 |
itton | +2.254 |
Devi | +2.243 |
atin | +2.183 |
Neg logit contributions | |
antioxid | -2.048 |
annoyance | -2.002 |
pleas | -1.979 |
Rate | -1.937 |
\\\\\\\\ | -1.926 |
Token | ain |
Token ID | 391 |
Feature activation | -9.28e-01 |
Pos logit contributions | |
uala | +7.087 |
eni | +5.907 |
itton | +5.011 |
etta | +4.965 |
nil | +4.624 |
Neg logit contributions | |
antioxid | -7.924 |
\\\\\\\\ | -7.579 |
pleas | -7.377 |
ONSORED | -7.334 |
---------- | -7.288 |
Token | Fe |
Token ID | 5452 |
Feature activation | -8.29e-01 |
Pos logit contributions | |
uala | +3.813 |
eni | +3.293 |
itton | +2.722 |
Devi | +2.719 |
atin | +2.636 |
Neg logit contributions | |
antioxid | -3.832 |
annoyance | -3.826 |
pleas | -3.776 |
\\\\\\\\ | -3.700 |
Rate | -3.668 |
Token | ill |
Token ID | 359 |
Feature activation | -4.01e-01 |
Pos logit contributions | |
uala | +3.389 |
eni | +2.972 |
itton | +2.547 |
atin | +2.404 |
Devi | +2.359 |
Neg logit contributions | |
antioxid | -3.582 |
annoyance | -3.473 |
pleas | -3.385 |
Rate | -3.335 |
regression | -3.322 |
Token | u |
Token ID | 84 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
uala | +1.754 |
eni | +1.528 |
itton | +1.282 |
atin | +1.252 |
Devi | +1.236 |
Neg logit contributions | |
antioxid | -1.603 |
pleas | -1.542 |
annoyance | -1.532 |
\\\\\\\\ | -1.512 |
Rate | -1.497 |
Token | ( |
Token ID | 357 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
uala | +5.388 |
eni | +4.844 |
itton | +4.347 |
atin | +4.204 |
nil | +4.132 |
Neg logit contributions | |
antioxid | -3.015 |
annoyance | -2.861 |
pleas | -2.823 |
\\\\\\\\ | -2.808 |
---------- | -2.729 |
Token | ing |
Token ID | 278 |
Feature activation | -9.91e-01 |
Pos logit contributions | |
uala | +4.474 |
eni | +3.928 |
atin | +3.326 |
itton | +3.228 |
nil | +3.137 |
Neg logit contributions | |
antioxid | -4.889 |
\\\\\\\\ | -4.708 |
ONSORED | -4.461 |
★★ | -4.371 |
---------- | -4.370 |
Token | and |
Token ID | 290 |
Feature activation | -6.81e-01 |
Pos logit contributions | |
uala | +4.587 |
eni | +4.186 |
itton | +3.539 |
hurst | +3.473 |
Devi | +3.465 |
Neg logit contributions | |
antioxid | -3.513 |
annoyance | -3.167 |
\\\\\\\\ | -3.158 |
ONSORED | -3.133 |
unemploy | -3.117 |
Token | the |
Token ID | 262 |
Feature activation | -7.91e-01 |
Pos logit contributions | |
uala | +3.198 |
eni | +2.828 |
itton | +2.432 |
nil | +2.369 |
Devi | +2.367 |
Neg logit contributions | |
antioxid | -2.443 |
annoyance | -2.263 |
Rate | -2.216 |
\\\\\\\\ | -2.216 |
pleas | -2.202 |
Token | one |
Token ID | 530 |
Feature activation | -3.68e-01 |
Pos logit contributions | |
uala | +3.517 |
eni | +3.110 |
itton | +2.686 |
atin | +2.591 |
nil | +2.570 |
Neg logit contributions | |
antioxid | -2.993 |
\\\\\\\\ | -2.822 |
ONSORED | -2.773 |
Rate | -2.773 |
annoyance | -2.735 |
Token | that |
Token ID | 326 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
uala | +2.005 |
eni | +1.801 |
itton | +1.586 |
atin | +1.582 |
nil | +1.564 |
Neg logit contributions | |
antioxid | -1.043 |
\\\\\\\\ | -0.939 |
ONSORED | -0.929 |
Rate | -0.925 |
annoyance | -0.924 |
Token | I |
Token ID | 314 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
uala | +5.934 |
eni | +5.405 |
Devi | +4.583 |
itton | +4.508 |
nil | +4.498 |
Neg logit contributions | |
antioxid | -5.336 |
\\\\\\\\ | -4.874 |
ONSORED | -4.769 |
reven | -4.758 |
millenn | -4.745 |
Token | think |
Token ID | 892 |
Feature activation | -8.84e-01 |
Pos logit contributions | |
uala | +5.881 |
eni | +5.350 |
itton | +4.311 |
atin | +4.228 |
nil | +4.027 |
Neg logit contributions | |
antioxid | -8.412 |
ONSORED | -7.901 |
\\\\\\\\ | -7.852 |
gery | -7.694 |
ghazi | -7.647 |
Token | reduces |
Token ID | 12850 |
Feature activation | -6.67e-01 |
Pos logit contributions | |
uala | +3.434 |
eni | +2.973 |
Devi | +2.492 |
atin | +2.315 |
nil | +2.296 |
Neg logit contributions | |
antioxid | -3.740 |
\\\\\\\\ | -3.638 |
annoyance | -3.615 |
★★ | -3.606 |
pleas | -3.602 |
Token | immersion |
Token ID | 36375 |
Feature activation | -6.83e-01 |
Pos logit contributions | |
uala | +3.082 |
eni | +2.769 |
atin | +2.311 |
itton | +2.292 |
Devi | +2.273 |
Neg logit contributions | |
antioxid | -2.370 |
Rate | -2.250 |
\\\\\\\\ | -2.222 |
---------- | -2.216 |
ONSORED | -2.204 |
Token | more |
Token ID | 517 |
Feature activation | -8.99e-01 |
Pos logit contributions | |
uala | +3.270 |
eni | +2.907 |
itton | +2.550 |
atin | +2.436 |
hurst | +2.428 |
Neg logit contributions | |
antioxid | -2.338 |
\\\\\\\\ | -2.199 |
annoyance | -2.141 |
ONSORED | -2.130 |
ghazi | -2.113 |
Token | on |
Token ID | 319 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
uala | +4.178 |
eni | +3.784 |
itton | +3.216 |
nil | +3.137 |
atin | +3.122 |
Neg logit contributions | |
antioxid | -3.228 |
\\\\\\\\ | -2.987 |
annoyance | -2.920 |
ONSORED | -2.901 |
Rate | -2.854 |
Token | optimal |
Token ID | 16586 |
Feature activation | +4.26e-01 |
Pos logit contributions | |
uala | +0.332 |
eni | +0.297 |
itton | +0.264 |
atin | +0.257 |
Devi | +0.254 |
Neg logit contributions | |
antioxid | -0.182 |
annoyance | -0.174 |
Rate | -0.172 |
pleas | -0.169 |
\\\\\\\\ | -0.169 |
Token | considering |
Token ID | 6402 |
Feature activation | -5.77e-01 |
Pos logit contributions | |
antioxid | +1.244 |
annoyance | +1.213 |
pleas | +1.198 |
Rate | +1.162 |
± | +1.155 |
Neg logit contributions | |
uala | -2.276 |
eni | -2.034 |
itton | -1.809 |
atin | -1.750 |
Devi | -1.743 |
Token | the |
Token ID | 262 |
Feature activation | +2.06e-02 |
Pos logit contributions | |
uala | +2.984 |
eni | +2.637 |
itton | +2.338 |
atin | +2.282 |
Devi | +2.274 |
Neg logit contributions | |
antioxid | -1.721 |
annoyance | -1.649 |
pleas | -1.626 |
Rate | -1.625 |
---------- | -1.604 |
Token | all |
Token ID | 477 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
antioxid | +0.062 |
annoyance | +0.060 |
pleas | +0.059 |
Rate | +0.059 |
---------- | +0.058 |
Neg logit contributions | |
uala | -0.107 |
eni | -0.096 |
itton | -0.084 |
Devi | -0.082 |
atin | -0.082 |
Token | - |
Token ID | 12 |
Feature activation | -7.61e-01 |
Pos logit contributions | |
antioxid | +0.613 |
annoyance | +0.596 |
pleas | +0.588 |
Rate | +0.575 |
---------- | +0.569 |
Neg logit contributions | |
uala | -0.984 |
eni | -0.876 |
itton | -0.771 |
atin | -0.745 |
Devi | -0.741 |
Token | em |
Token ID | 368 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
uala | +3.188 |
eni | +2.808 |
itton | +2.320 |
nil | +2.276 |
atin | +2.225 |
Neg logit contributions | |
antioxid | -3.133 |
annoyance | -3.002 |
pleas | -2.982 |
\\\\\\\\ | -2.893 |
regression | -2.887 |
Token | br |
Token ID | 1671 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
uala | +4.242 |
eni | +3.725 |
itton | +2.717 |
nil | +2.418 |
atin | +2.384 |
Neg logit contributions | |
antioxid | -9.913 |
\\\\\\\\ | -9.378 |
gery | -9.345 |
ONSORED | -9.295 |
annoyance | -9.289 |
Token | acing |
Token ID | 4092 |
Feature activation | -7.36e-01 |
Pos logit contributions | |
pleas | +3.117 |
± | +3.099 |
gery | +3.095 |
Rate | +3.070 |
annoyance | +3.058 |
Neg logit contributions | |
uala | -5.576 |
eni | -4.944 |
� | -4.520 |
Devi | -4.464 |
itton | -4.269 |
Token | inter |
Token ID | 987 |
Feature activation | +5.77e-02 |
Pos logit contributions | |
uala | +3.793 |
eni | +3.403 |
itton | +2.960 |
atin | +2.885 |
Devi | +2.880 |
Neg logit contributions | |
antioxid | -2.145 |
Rate | -2.096 |
annoyance | -2.074 |
ONSORED | -2.072 |
ghazi | -2.059 |
Token | p |
Token ID | 279 |
Feature activation | +9.26e-01 |
Pos logit contributions | |
antioxid | +0.203 |
annoyance | +0.197 |
pleas | +0.192 |
Rate | +0.191 |
---------- | +0.188 |
Neg logit contributions | |
uala | -0.272 |
eni | -0.244 |
itton | -0.211 |
atin | -0.206 |
Devi | -0.203 |
Token | ares |
Token ID | 3565 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
antioxid | +3.644 |
annoyance | +3.602 |
pleas | +3.584 |
± | +3.515 |
Rate | +3.506 |
Neg logit contributions | |
uala | -3.886 |
eni | -3.382 |
itton | -2.875 |
Devi | -2.782 |
� | -2.743 |
Token | / |
Token ID | 14 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
antioxid | +0.150 |
annoyance | +0.144 |
pleas | +0.142 |
Rate | +0.138 |
---------- | +0.138 |
Neg logit contributions | |
uala | -0.301 |
eni | -0.271 |
itton | -0.241 |
atin | -0.235 |
Devi | -0.234 |
Token | h |
Token ID | 71 |
Feature activation | +4.60e-01 |
Pos logit contributions | |
antioxid | +1.392 |
annoyance | +1.372 |
pleas | +1.369 |
Rate | +1.341 |
± | +1.335 |
Neg logit contributions | |
uala | -1.678 |
eni | -1.460 |
itton | -1.273 |
Devi | -1.213 |
atin | -1.212 |
Token | ). |
Token ID | 737 |
Feature activation | -3.02e-01 |
Pos logit contributions | |
antioxid | +1.197 |
annoyance | +1.184 |
pleas | +1.168 |
± | +1.143 |
Rate | +1.131 |
Neg logit contributions | |
uala | -2.567 |
eni | -2.315 |
itton | -2.077 |
atin | -2.001 |
Devi | -1.995 |
Token |
|
Token ID | 198 |
Feature activation | +2.34e-03 |
Pos logit contributions | |
uala | +1.471 |
eni | +1.298 |
itton | +1.127 |
Devi | +1.123 |
atin | +1.108 |
Neg logit contributions | |
antioxid | -1.029 |
annoyance | -0.992 |
pleas | -0.981 |
\\\\\\\\ | -0.948 |
reven | -0.946 |
Token |
|
Token ID | 198 |
Feature activation | -8.59e-02 |
Pos logit contributions | |
antioxid | +0.008 |
annoyance | +0.008 |
pleas | +0.008 |
\\\\\\\\ | +0.008 |
Rate | +0.008 |
Neg logit contributions | |
uala | -0.011 |
eni | -0.010 |
itton | -0.009 |
atin | -0.008 |
Devi | -0.008 |
Token | Sun |
Token ID | 16012 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
uala | +0.412 |
eni | +0.364 |
itton | +0.314 |
atin | +0.308 |
nil | +0.304 |
Neg logit contributions | |
antioxid | -0.301 |
annoyance | -0.292 |
pleas | -0.288 |
regression | -0.278 |
reven | -0.277 |
Token | and |
Token ID | 290 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
annoyance | +4.903 |
antioxid | +4.884 |
pleas | +4.798 |
Rate | +4.774 |
± | +4.690 |
Neg logit contributions | |
uala | -6.063 |
eni | -5.314 |
itton | -4.659 |
atin | -4.399 |
Devi | -4.373 |
Token | galaxy |
Token ID | 16161 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
uala | +0.062 |
eni | +0.054 |
itton | +0.047 |
Devi | +0.046 |
atin | +0.046 |
Neg logit contributions | |
antioxid | -0.046 |
annoyance | -0.044 |
pleas | -0.044 |
Rate | -0.043 |
\\\\\\\\ | -0.043 |
Token | move |
Token ID | 1445 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
uala | +0.645 |
eni | +0.573 |
itton | +0.504 |
Devi | +0.487 |
atin | +0.486 |
Neg logit contributions | |
antioxid | -0.433 |
annoyance | -0.418 |
pleas | -0.413 |
\\\\\\\\ | -0.408 |
Rate | -0.403 |
Token | , |
Token ID | 11 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
uala | +0.675 |
eni | +0.607 |
itton | +0.536 |
Devi | +0.523 |
atin | +0.522 |
Neg logit contributions | |
antioxid | -0.361 |
annoyance | -0.348 |
pleas | -0.343 |
\\\\\\\\ | -0.338 |
Rate | -0.335 |
Token | too |
Token ID | 1165 |
Feature activation | +3.60e-01 |
Pos logit contributions | |
antioxid | +0.643 |
annoyance | +0.626 |
pleas | +0.617 |
Rate | +0.599 |
± | +0.594 |
Neg logit contributions | |
uala | -1.275 |
eni | -1.144 |
itton | -1.021 |
atin | -0.988 |
Devi | -0.985 |
Token |
|
Token ID | 198 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
uala | +1.818 |
eni | +1.602 |
itton | +1.392 |
Devi | +1.378 |
atin | +1.361 |
Neg logit contributions | |
antioxid | -1.246 |
annoyance | -1.219 |
pleas | -1.191 |
gery | -1.154 |
Rate | -1.151 |
Token |
|
Token ID | 198 |
Feature activation | -7.71e-02 |
Pos logit contributions | |
uala | +0.687 |
eni | +0.608 |
itton | +0.520 |
Devi | +0.507 |
atin | +0.506 |
Neg logit contributions | |
antioxid | -0.529 |
annoyance | -0.509 |
pleas | -0.491 |
\\\\\\\\ | -0.486 |
reven | -0.482 |
Token | In |
Token ID | 818 |
Feature activation | +6.03e-02 |
Pos logit contributions | |
uala | +0.379 |
eni | +0.335 |
itton | +0.291 |
atin | +0.284 |
nil | +0.282 |
Neg logit contributions | |
antioxid | -0.260 |
annoyance | -0.254 |
pleas | -0.249 |
regression | -0.241 |
± | -0.240 |
Token | the |
Token ID | 262 |
Feature activation | +7.34e-01 |
Pos logit contributions | |
antioxid | +0.184 |
annoyance | +0.177 |
pleas | +0.175 |
Rate | +0.172 |
\\\\\\\\ | +0.170 |
Neg logit contributions | |
uala | -0.316 |
eni | -0.281 |
itton | -0.249 |
Devi | -0.241 |
atin | -0.241 |
Token | present |
Token ID | 1944 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
antioxid | +2.126 |
annoyance | +2.073 |
pleas | +2.049 |
Rate | +1.983 |
± | +1.972 |
Neg logit contributions | |
uala | -3.934 |
eni | -3.522 |
itton | -3.133 |
atin | -3.032 |
Devi | -3.012 |
Token | Motor |
Token ID | 12533 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
antioxid | +0.463 |
annoyance | +0.449 |
pleas | +0.442 |
Rate | +0.432 |
---------- | +0.428 |
Neg logit contributions | |
uala | -0.855 |
eni | -0.764 |
itton | -0.677 |
Devi | -0.657 |
atin | -0.656 |
Token | Vehicle |
Token ID | 21501 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
± | +3.280 |
annoyance | +3.269 |
Interest | +3.264 |
pleas | +3.227 |
gery | +3.219 |
Neg logit contributions | |
uala | -8.630 |
eni | -7.849 |
itton | -7.214 |
� | -6.972 |
atin | -6.858 |
Token | Act |
Token ID | 2191 |
Feature activation | -5.92e-01 |
Pos logit contributions | |
antioxid | +0.842 |
annoyance | +0.819 |
pleas | +0.807 |
Rate | +0.782 |
± | +0.776 |
Neg logit contributions | |
uala | -1.984 |
eni | -1.793 |
itton | -1.614 |
atin | -1.559 |
Devi | -1.550 |
Token | , |
Token ID | 11 |
Feature activation | -4.28e-01 |
Pos logit contributions | |
uala | +2.758 |
eni | +2.416 |
itton | +2.088 |
Devi | +2.061 |
atin | +2.055 |
Neg logit contributions | |
antioxid | -2.078 |
annoyance | -2.028 |
pleas | -2.002 |
Rate | -1.960 |
---------- | -1.941 |
Token | there |
Token ID | 612 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
uala | +2.176 |
eni | +1.941 |
itton | +1.708 |
Devi | +1.685 |
atin | +1.677 |
Neg logit contributions | |
antioxid | -1.343 |
annoyance | -1.274 |
pleas | -1.260 |
Rate | -1.242 |
\\\\\\\\ | -1.239 |
Token | are |
Token ID | 389 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
uala | +1.308 |
eni | +1.158 |
itton | +1.019 |
atin | +0.994 |
Devi | +0.988 |
Neg logit contributions | |
antioxid | -0.837 |
annoyance | -0.813 |
pleas | -0.800 |
Rate | -0.784 |
± | -0.775 |
Token | The |
Token ID | 383 |
Feature activation | +8.29e-01 |
Pos logit contributions | |
antioxid | +0.862 |
annoyance | +0.840 |
pleas | +0.828 |
Rate | +0.804 |
± | +0.798 |
Neg logit contributions | |
uala | -1.709 |
eni | -1.533 |
itton | -1.369 |
atin | -1.324 |
Devi | -1.319 |
Token | New |
Token ID | 968 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
annoyance | +1.920 |
antioxid | +1.908 |
pleas | +1.892 |
Interest | +1.862 |
---------- | +1.858 |
Neg logit contributions | |
uala | -4.846 |
eni | -4.367 |
itton | -3.960 |
atin | -3.810 |
Devi | -3.752 |
Token | York |
Token ID | 1971 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
antioxid | +2.273 |
pleas | +2.247 |
annoyance | +2.245 |
Interest | +2.185 |
± | +2.169 |
Neg logit contributions | |
uala | -6.274 |
eni | -5.674 |
itton | -5.114 |
� | -5.000 |
atin | -4.996 |
Token | Times |
Token ID | 3782 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
antioxid | +2.257 |
annoyance | +2.211 |
pleas | +2.192 |
Rate | +2.145 |
± | +2.131 |
Neg logit contributions | |
uala | -3.322 |
eni | -2.945 |
itton | -2.586 |
atin | -2.492 |
Devi | -2.483 |
Token | . |
Token ID | 13 |
Feature activation | +6.73e-01 |
Pos logit contributions | |
antioxid | +2.906 |
annoyance | +2.905 |
pleas | +2.889 |
± | +2.851 |
Rate | +2.813 |
Neg logit contributions | |
uala | -5.231 |
eni | -4.647 |
itton | -4.101 |
atin | -3.991 |
� | -3.966 |
Token | You |
Token ID | 921 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
antioxid | +1.603 |
annoyance | +1.545 |
pleas | +1.517 |
Rate | +1.464 |
± | +1.446 |
Neg logit contributions | |
uala | -3.972 |
eni | -3.586 |
itton | -3.225 |
atin | -3.134 |
Devi | -3.130 |
Token | may |
Token ID | 743 |
Feature activation | +8.83e-01 |
Pos logit contributions | |
pleas | +2.634 |
annoyance | +2.595 |
antioxid | +2.511 |
---------- | +2.476 |
± | +2.471 |
Neg logit contributions | |
uala | -7.434 |
eni | -6.758 |
� | -6.094 |
itton | -6.090 |
atin | -5.997 |
Token | opt |
Token ID | 2172 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
pleas | +3.403 |
annoyance | +3.384 |
antioxid | +3.356 |
± | +3.302 |
Rate | +3.276 |
Neg logit contributions | |
uala | -3.866 |
eni | -3.322 |
itton | -2.847 |
� | -2.778 |
atin | -2.732 |
Token | - |
Token ID | 12 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
antioxid | +1.718 |
annoyance | +1.673 |
pleas | +1.649 |
Rate | +1.610 |
± | +1.593 |
Neg logit contributions | |
uala | -2.717 |
eni | -2.414 |
itton | -2.128 |
atin | -2.053 |
Devi | -2.047 |
Token | out |
Token ID | 448 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
antioxid | +0.591 |
annoyance | +0.570 |
pleas | +0.559 |
\\\\\\\\ | +0.544 |
Rate | +0.543 |
Neg logit contributions | |
uala | -0.910 |
eni | -0.807 |
itton | -0.709 |
atin | -0.685 |
Devi | -0.680 |
Token | at |
Token ID | 379 |
Feature activation | +9.05e-01 |
Pos logit contributions | |
uala | +0.552 |
eni | +0.497 |
itton | +0.438 |
Devi | +0.431 |
atin | +0.426 |
Neg logit contributions | |
antioxid | -0.324 |
annoyance | -0.305 |
ONSORED | -0.294 |
\\\\\\\\ | -0.293 |
Rate | -0.293 |
Token | happens |
Token ID | 4325 |
Feature activation | +4.31e-01 |
Pos logit contributions | |
annoyance | +1.602 |
pleas | +1.597 |
antioxid | +1.585 |
± | +1.530 |
Rate | +1.529 |
Neg logit contributions | |
uala | -2.637 |
eni | -2.313 |
itton | -2.057 |
atin | -1.985 |
Devi | -1.960 |
Token | in |
Token ID | 287 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
antioxid | +1.367 |
annoyance | +1.336 |
pleas | +1.327 |
Rate | +1.288 |
± | +1.286 |
Neg logit contributions | |
uala | -2.189 |
eni | -1.942 |
itton | -1.714 |
atin | -1.656 |
Devi | -1.641 |
Token | Greater |
Token ID | 18169 |
Feature activation | -4.48e-02 |
Pos logit contributions | |
antioxid | +0.305 |
annoyance | +0.297 |
pleas | +0.293 |
Rate | +0.284 |
± | +0.282 |
Neg logit contributions | |
uala | -0.600 |
eni | -0.539 |
itton | -0.481 |
atin | -0.465 |
Devi | -0.463 |
Token | Cincinnati |
Token ID | 16137 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
uala | +0.239 |
eni | +0.214 |
itton | +0.190 |
atin | +0.183 |
Devi | +0.182 |
Neg logit contributions | |
antioxid | -0.131 |
annoyance | -0.128 |
pleas | -0.127 |
Rate | -0.123 |
± | -0.122 |
Token | . |
Token ID | 13 |
Feature activation | +4.30e-01 |
Pos logit contributions | |
antioxid | +0.058 |
annoyance | +0.057 |
pleas | +0.056 |
Rate | +0.055 |
\\\\\\\\ | +0.054 |
Neg logit contributions | |
uala | -0.098 |
eni | -0.087 |
itton | -0.077 |
atin | -0.074 |
Devi | -0.074 |
Token | Please |
Token ID | 4222 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
antioxid | +1.210 |
annoyance | +1.174 |
pleas | +1.169 |
Rate | +1.129 |
---------- | +1.125 |
Neg logit contributions | |
uala | -2.338 |
eni | -2.109 |
itton | -1.870 |
atin | -1.811 |
Devi | -1.801 |
Token | try |
Token ID | 1949 |
Feature activation | +7.73e-01 |
Pos logit contributions | |
antioxid | +4.288 |
pleas | +4.009 |
± | +3.872 |
Rate | +3.836 |
annoyance | +3.748 |
Neg logit contributions | |
uala | -8.073 |
eni | -7.342 |
ignty | -6.493 |
� | -6.440 |
Devi | -6.338 |
Token | again |
Token ID | 757 |
Feature activation | +6.26e-01 |
Pos logit contributions | |
antioxid | +1.757 |
annoyance | +1.735 |
pleas | +1.717 |
Rate | +1.654 |
± | +1.648 |
Neg logit contributions | |
uala | -4.581 |
eni | -4.125 |
itton | -3.729 |
atin | -3.590 |
Devi | -3.589 |
Token | soon |
Token ID | 2582 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
antioxid | +1.557 |
annoyance | +1.509 |
pleas | +1.482 |
Rate | +1.433 |
\\\\\\\\ | +1.416 |
Neg logit contributions | |
uala | -3.615 |
eni | -3.265 |
itton | -2.931 |
atin | -2.848 |
Devi | -2.834 |
Token | , |
Token ID | 11 |
Feature activation | +6.21e-01 |
Pos logit contributions | |
antioxid | +1.374 |
annoyance | +1.343 |
pleas | +1.332 |
Rate | +1.299 |
± | +1.291 |
Neg logit contributions | |
uala | -2.083 |
eni | -1.846 |
itton | -1.624 |
atin | -1.566 |
Devi | -1.556 |
Token | or |
Token ID | 393 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
antioxid | +1.837 |
pleas | +1.824 |
annoyance | +1.818 |
Rate | +1.762 |
± | +1.739 |
Neg logit contributions | |
uala | -3.231 |
eni | -2.923 |
itton | -2.573 |
� | -2.516 |
atin | -2.501 |
Token | ble |
Token ID | 903 |
Feature activation | +5.11e-01 |
Pos logit contributions | |
antioxid | +0.670 |
annoyance | +0.657 |
pleas | +0.650 |
Rate | +0.642 |
\\\\\\\\ | +0.638 |
Neg logit contributions | |
uala | -0.355 |
eni | -0.286 |
itton | -0.220 |
atin | -0.202 |
Devi | -0.199 |
Token | in |
Token ID | 287 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
antioxid | +1.447 |
annoyance | +1.409 |
pleas | +1.390 |
Rate | +1.350 |
± | +1.339 |
Neg logit contributions | |
uala | -2.774 |
eni | -2.485 |
itton | -2.214 |
atin | -2.143 |
Devi | -2.134 |
Token | approximately |
Token ID | 6702 |
Feature activation | +3.39e-01 |
Pos logit contributions | |
uala | +0.859 |
eni | +0.769 |
itton | +0.683 |
atin | +0.666 |
Devi | +0.666 |
Neg logit contributions | |
antioxid | -0.458 |
annoyance | -0.440 |
pleas | -0.438 |
\\\\\\\\ | -0.422 |
Rate | -0.421 |
Token | 6 |
Token ID | 718 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
antioxid | +0.846 |
annoyance | +0.818 |
pleas | +0.807 |
Rate | +0.779 |
---------- | +0.769 |
Neg logit contributions | |
uala | -1.955 |
eni | -1.762 |
itton | -1.583 |
atin | -1.536 |
Devi | -1.532 |
Token | . |
Token ID | 13 |
Feature activation | +6.50e-02 |
Pos logit contributions | |
antioxid | +1.012 |
annoyance | +0.989 |
pleas | +0.978 |
Rate | +0.952 |
± | +0.947 |
Neg logit contributions | |
uala | -1.626 |
eni | -1.445 |
itton | -1.276 |
atin | -1.231 |
Devi | -1.226 |
Token | 28 |
Token ID | 2078 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
antioxid | +0.252 |
annoyance | +0.245 |
pleas | +0.242 |
Rate | +0.236 |
\\\\\\\\ | +0.235 |
Neg logit contributions | |
uala | -0.287 |
eni | -0.250 |
itton | -0.215 |
Devi | -0.207 |
atin | -0.207 |
Token | seconds |
Token ID | 4201 |
Feature activation | +7.54e-01 |
Pos logit contributions | |
± | +3.917 |
antioxid | +3.888 |
pleas | +3.866 |
annoyance | +3.837 |
regression | +3.703 |
Neg logit contributions | |
uala | -6.383 |
eni | -5.697 |
itton | -5.047 |
atin | -4.793 |
Devi | -4.786 |
Token | . |
Token ID | 13 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
antioxid | +2.346 |
annoyance | +2.305 |
pleas | +2.276 |
± | +2.253 |
Rate | +2.222 |
Neg logit contributions | |
uala | -3.859 |
eni | -3.429 |
itton | -3.027 |
atin | -2.920 |
Devi | -2.907 |
Token | The |
Token ID | 383 |
Feature activation | -5.76e-02 |
Pos logit contributions | |
uala | +0.616 |
eni | +0.544 |
itton | +0.478 |
Devi | +0.469 |
atin | +0.466 |
Neg logit contributions | |
antioxid | -0.410 |
annoyance | -0.399 |
pleas | -0.394 |
\\\\\\\\ | -0.384 |
Rate | -0.381 |
Token | problem |
Token ID | 1917 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
uala | +0.300 |
eni | +0.267 |
itton | +0.238 |
Devi | +0.231 |
atin | +0.230 |
Neg logit contributions | |
antioxid | -0.174 |
annoyance | -0.169 |
pleas | -0.167 |
\\\\\\\\ | -0.164 |
Rate | -0.164 |
Token | now |
Token ID | 783 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
antioxid | +0.459 |
annoyance | +0.441 |
pleas | +0.435 |
Rate | +0.425 |
\\\\\\\\ | +0.422 |
Neg logit contributions | |
uala | -0.869 |
eni | -0.779 |
itton | -0.692 |
atin | -0.673 |
Devi | -0.672 |
Token | in |
Token ID | 287 |
Feature activation | -9.79e-02 |
Pos logit contributions | |
uala | +0.590 |
eni | +0.534 |
itton | +0.467 |
atin | +0.456 |
Devi | +0.453 |
Neg logit contributions | |
antioxid | -0.323 |
annoyance | -0.316 |
Rate | -0.303 |
pleas | -0.302 |
---------- | -0.299 |
Token | the |
Token ID | 262 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
uala | +0.509 |
eni | +0.453 |
itton | +0.397 |
atin | +0.389 |
Devi | +0.385 |
Neg logit contributions | |
antioxid | -0.300 |
annoyance | -0.288 |
pleas | -0.282 |
Rate | -0.281 |
\\\\\\\\ | -0.279 |
Token | natural |
Token ID | 3288 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
antioxid | +0.799 |
annoyance | +0.774 |
pleas | +0.764 |
Rate | +0.751 |
\\\\\\\\ | +0.743 |
Neg logit contributions | |
uala | -1.370 |
eni | -1.224 |
itton | -1.080 |
atin | -1.046 |
Devi | -1.045 |
Token | gas |
Token ID | 3623 |
Feature activation | -2.06e-01 |
Pos logit contributions | |
annoyance | +2.781 |
pleas | +2.746 |
antioxid | +2.742 |
± | +2.625 |
regression | +2.613 |
Neg logit contributions | |
uala | -6.293 |
eni | -5.614 |
itton | -5.066 |
Devi | -4.916 |
atin | -4.887 |
Token | field |
Token ID | 2214 |
Feature activation | -6.73e-01 |
Pos logit contributions | |
uala | +1.107 |
eni | +1.002 |
itton | +0.881 |
atin | +0.861 |
Devi | +0.857 |
Neg logit contributions | |
antioxid | -0.588 |
annoyance | -0.567 |
pleas | -0.557 |
Rate | -0.548 |
± | -0.541 |
Token | – |
Token ID | 784 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
uala | +3.446 |
eni | +3.108 |
itton | +2.711 |
atin | +2.659 |
Devi | +2.631 |
Neg logit contributions | |
antioxid | -2.072 |
annoyance | -1.991 |
pleas | -1.957 |
Rate | -1.923 |
\\\\\\\\ | -1.891 |
Token | with |
Token ID | 351 |
Feature activation | -4.01e-02 |
Pos logit contributions | |
antioxid | +1.001 |
annoyance | +0.973 |
pleas | +0.960 |
Rate | +0.933 |
± | +0.924 |
Neg logit contributions | |
uala | -1.867 |
eni | -1.672 |
itton | -1.486 |
atin | -1.440 |
Devi | -1.434 |
Token | Turkey |
Token ID | 7137 |
Feature activation | -4.34e-02 |
Pos logit contributions | |
uala | +0.204 |
eni | +0.182 |
itton | +0.159 |
atin | +0.155 |
Devi | +0.154 |
Neg logit contributions | |
antioxid | -0.126 |
annoyance | -0.122 |
pleas | -0.120 |
Rate | -0.118 |
\\\\\\\\ | -0.118 |
Token | buying |
Token ID | 7067 |
Feature activation | +1.00e-01 |
Pos logit contributions | |
uala | +0.233 |
eni | +0.209 |
itton | +0.186 |
atin | +0.180 |
Devi | +0.179 |
Neg logit contributions | |
antioxid | -0.126 |
annoyance | -0.121 |
pleas | -0.119 |
Rate | -0.117 |
\\\\\\\\ | -0.116 |
Token | gas |
Token ID | 3623 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
antioxid | +0.306 |
annoyance | +0.299 |
pleas | +0.295 |
Rate | +0.287 |
± | +0.284 |
Neg logit contributions | |
uala | -0.522 |
eni | -0.466 |
itton | -0.412 |
atin | -0.399 |
Devi | -0.397 |
Token | from |
Token ID | 422 |
Feature activation | -4.89e-01 |
Pos logit contributions | |
uala | +1.025 |
eni | +0.924 |
itton | +0.802 |
atin | +0.781 |
Devi | +0.774 |
Neg logit contributions | |
antioxid | -0.695 |
annoyance | -0.673 |
pleas | -0.659 |
Rate | -0.648 |
\\\\\\\\ | -0.646 |
Token | of |
Token ID | 286 |
Feature activation | -2.75e-02 |
Pos logit contributions | |
antioxid | +1.539 |
annoyance | +1.503 |
pleas | +1.483 |
Rate | +1.428 |
± | +1.424 |
Neg logit contributions | |
uala | -2.871 |
eni | -2.555 |
itton | -2.289 |
atin | -2.205 |
Devi | -2.195 |
Token | course |
Token ID | 1781 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
uala | +0.145 |
eni | +0.130 |
itton | +0.115 |
atin | +0.111 |
Devi | +0.111 |
Neg logit contributions | |
antioxid | -0.083 |
annoyance | -0.080 |
pleas | -0.079 |
Rate | -0.077 |
\\\\\\\\ | -0.076 |
Token | the |
Token ID | 262 |
Feature activation | +3.70e-02 |
Pos logit contributions | |
uala | +1.139 |
eni | +1.023 |
itton | +0.895 |
atin | +0.869 |
Devi | +0.869 |
Neg logit contributions | |
antioxid | -0.691 |
annoyance | -0.670 |
pleas | -0.662 |
Rate | -0.656 |
\\\\\\\\ | -0.653 |
Token | work |
Token ID | 670 |
Feature activation | +4.78e-01 |
Pos logit contributions | |
antioxid | +0.112 |
annoyance | +0.109 |
pleas | +0.107 |
Rate | +0.106 |
\\\\\\\\ | +0.105 |
Neg logit contributions | |
uala | -0.193 |
eni | -0.173 |
itton | -0.152 |
atin | -0.148 |
Devi | -0.147 |
Token | of |
Token ID | 286 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
antioxid | +1.186 |
annoyance | +1.149 |
pleas | +1.132 |
Rate | +1.094 |
± | +1.083 |
Neg logit contributions | |
uala | -2.763 |
eni | -2.493 |
itton | -2.240 |
atin | -2.173 |
Devi | -2.166 |
Token | the |
Token ID | 262 |
Feature activation | +3.04e-01 |
Pos logit contributions | |
antioxid | +0.990 |
annoyance | +0.965 |
pleas | +0.954 |
Rate | +0.924 |
± | +0.920 |
Neg logit contributions | |
uala | -1.733 |
eni | -1.544 |
itton | -1.372 |
atin | -1.325 |
Devi | -1.318 |
Token | anarchist |
Token ID | 26177 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
antioxid | +0.958 |
annoyance | +0.935 |
pleas | +0.924 |
Rate | +0.899 |
± | +0.893 |
Neg logit contributions | |
uala | -1.558 |
eni | -1.386 |
itton | -1.224 |
atin | -1.182 |
Devi | -1.177 |
Token | movement |
Token ID | 3356 |
Feature activation | +9.19e-02 |
Pos logit contributions | |
antioxid | +0.624 |
annoyance | +0.610 |
pleas | +0.603 |
Rate | +0.591 |
± | +0.585 |
Neg logit contributions | |
uala | -0.905 |
eni | -0.802 |
itton | -0.702 |
atin | -0.677 |
Devi | -0.675 |
Token | . |
Token ID | 13 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
antioxid | +0.274 |
annoyance | +0.268 |
pleas | +0.263 |
Rate | +0.259 |
\\\\\\\\ | +0.255 |
Neg logit contributions | |
uala | -0.484 |
eni | -0.434 |
itton | -0.382 |
atin | -0.371 |
Devi | -0.371 |
Token |
|
Token ID | 198 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
antioxid | +0.906 |
annoyance | +0.883 |
pleas | +0.875 |
Rate | +0.853 |
± | +0.848 |
Neg logit contributions | |
uala | -1.428 |
eni | -1.266 |
itton | -1.119 |
atin | -1.080 |
Devi | -1.073 |
Token |
|
Token ID | 198 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
antioxid | +1.033 |
annoyance | +1.009 |
pleas | +0.998 |
Rate | +0.974 |
± | +0.966 |
Neg logit contributions | |
uala | -1.579 |
eni | -1.400 |
itton | -1.233 |
atin | -1.189 |
Devi | -1.184 |
Token | there |
Token ID | 612 |
Feature activation | +7.59e-02 |
Pos logit contributions | |
uala | +1.516 |
eni | +1.353 |
itton | +1.201 |
Devi | +1.164 |
atin | +1.160 |
Neg logit contributions | |
antioxid | -0.892 |
annoyance | -0.846 |
pleas | -0.839 |
Rate | -0.839 |
\\\\\\\\ | -0.837 |
Token | have |
Token ID | 423 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
antioxid | +0.236 |
annoyance | +0.229 |
pleas | +0.225 |
Rate | +0.220 |
± | +0.218 |
Neg logit contributions | |
uala | -0.393 |
eni | -0.349 |
itton | -0.309 |
atin | -0.299 |
Devi | -0.298 |
Token | been |
Token ID | 587 |
Feature activation | -6.08e-01 |
Pos logit contributions | |
uala | +1.573 |
eni | +1.416 |
itton | +1.257 |
Devi | +1.225 |
atin | +1.217 |
Neg logit contributions | |
antioxid | -0.809 |
annoyance | -0.783 |
\\\\\\\\ | -0.757 |
pleas | -0.756 |
Rate | -0.756 |
Token | multiple |
Token ID | 3294 |
Feature activation | -6.61e-02 |
Pos logit contributions | |
uala | +3.209 |
eni | +2.885 |
itton | +2.534 |
Devi | +2.477 |
atin | +2.436 |
Neg logit contributions | |
antioxid | -1.747 |
\\\\\\\\ | -1.658 |
annoyance | -1.635 |
Rate | -1.620 |
---------- | -1.617 |
Token | cases |
Token ID | 2663 |
Feature activation | +3.85e-02 |
Pos logit contributions | |
uala | +0.367 |
eni | +0.330 |
itton | +0.294 |
atin | +0.285 |
Devi | +0.284 |
Neg logit contributions | |
antioxid | -0.179 |
annoyance | -0.171 |
pleas | -0.167 |
\\\\\\\\ | -0.165 |
Rate | -0.165 |
Token | where |
Token ID | 810 |
Feature activation | +5.58e-01 |
Pos logit contributions | |
antioxid | +0.109 |
annoyance | +0.105 |
pleas | +0.102 |
Rate | +0.101 |
\\\\\\\\ | +0.100 |
Neg logit contributions | |
uala | -0.211 |
eni | -0.189 |
itton | -0.168 |
atin | -0.163 |
Devi | -0.162 |
Token | passengers |
Token ID | 10405 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
antioxid | +1.687 |
annoyance | +1.659 |
pleas | +1.641 |
Rate | +1.580 |
± | +1.576 |
Neg logit contributions | |
uala | -2.914 |
eni | -2.596 |
itton | -2.299 |
atin | -2.226 |
Devi | -2.215 |
Token | have |
Token ID | 423 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
uala | +1.397 |
eni | +1.247 |
itton | +1.101 |
atin | +1.051 |
Devi | +1.045 |
Neg logit contributions | |
antioxid | -0.939 |
annoyance | -0.883 |
Rate | -0.870 |
\\\\\\\\ | -0.869 |
pleas | -0.869 |
Token | been |
Token ID | 587 |
Feature activation | -7.30e-01 |
Pos logit contributions | |
uala | +0.725 |
eni | +0.652 |
itton | +0.582 |
Devi | +0.560 |
atin | +0.557 |
Neg logit contributions | |
antioxid | -0.382 |
annoyance | -0.362 |
\\\\\\\\ | -0.355 |
Rate | -0.354 |
pleas | -0.353 |
Token | singled |
Token ID | 31958 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
uala | +3.578 |
eni | +3.191 |
itton | +2.811 |
atin | +2.693 |
Devi | +2.670 |
Neg logit contributions | |
antioxid | -2.474 |
\\\\\\\\ | -2.339 |
annoyance | -2.301 |
Rate | -2.295 |
---------- | -2.244 |
Token | out |
Token ID | 503 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
uala | +1.027 |
eni | +0.920 |
itton | +0.815 |
atin | +0.792 |
Devi | +0.788 |
Neg logit contributions | |
antioxid | -0.564 |
annoyance | -0.538 |
pleas | -0.530 |
Rate | -0.526 |
± | -0.512 |
Token | should |
Token ID | 815 |
Feature activation | +2.75e-02 |
Pos logit contributions | |
antioxid | +0.302 |
annoyance | +0.294 |
pleas | +0.289 |
Rate | +0.284 |
\\\\\\\\ | +0.281 |
Neg logit contributions | |
uala | -0.474 |
eni | -0.421 |
itton | -0.371 |
atin | -0.359 |
Devi | -0.358 |
Token | be |
Token ID | 307 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
antioxid | +0.090 |
annoyance | +0.088 |
pleas | +0.087 |
Rate | +0.085 |
± | +0.084 |
Neg logit contributions | |
uala | -0.137 |
eni | -0.121 |
itton | -0.107 |
atin | -0.103 |
Devi | -0.103 |
Token | cast |
Token ID | 3350 |
Feature activation | -9.23e-01 |
Pos logit contributions | |
uala | +0.564 |
eni | +0.504 |
itton | +0.448 |
atin | +0.433 |
Devi | +0.431 |
Neg logit contributions | |
antioxid | -0.322 |
annoyance | -0.313 |
pleas | -0.307 |
Rate | -0.301 |
± | -0.298 |
Token | as |
Token ID | 355 |
Feature activation | -6.31e-01 |
Pos logit contributions | |
uala | +4.656 |
eni | +4.201 |
itton | +3.664 |
atin | +3.629 |
Devi | +3.600 |
Neg logit contributions | |
antioxid | -2.870 |
annoyance | -2.750 |
Rate | -2.637 |
pleas | -2.629 |
\\\\\\\\ | -2.607 |
Token | Christian |
Token ID | 4302 |
Feature activation | -7.79e-01 |
Pos logit contributions | |
uala | +2.851 |
eni | +2.531 |
itton | +2.187 |
atin | +2.113 |
Devi | +2.108 |
Neg logit contributions | |
antioxid | -2.319 |
annoyance | -2.249 |
pleas | -2.208 |
Rate | -2.205 |
\\\\\\\\ | -2.170 |
Token | Grey |
Token ID | 13980 |
Feature activation | +7.12e-02 |
Pos logit contributions | |
uala | +2.970 |
eni | +2.573 |
itton | +2.140 |
Devi | +2.064 |
atin | +2.032 |
Neg logit contributions | |
antioxid | -3.413 |
annoyance | -3.334 |
Rate | -3.298 |
pleas | -3.238 |
gery | -3.214 |
Token | ? |
Token ID | 30 |
Feature activation | -4.42e-01 |
Pos logit contributions | |
antioxid | +0.215 |
annoyance | +0.208 |
pleas | +0.205 |
Rate | +0.201 |
± | +0.197 |
Neg logit contributions | |
uala | -0.375 |
eni | -0.335 |
itton | -0.298 |
atin | -0.287 |
Devi | -0.287 |
Token | Let |
Token ID | 3914 |
Feature activation | +8.96e-02 |
Pos logit contributions | |
uala | +2.128 |
eni | +1.881 |
itton | +1.629 |
Devi | +1.604 |
atin | +1.581 |
Neg logit contributions | |
antioxid | -1.514 |
annoyance | -1.479 |
pleas | -1.442 |
gery | -1.390 |
reven | -1.388 |
Token | us |
Token ID | 514 |
Feature activation | -3.73e-01 |
Pos logit contributions | |
antioxid | +0.230 |
annoyance | +0.223 |
pleas | +0.219 |
Rate | +0.212 |
± | +0.210 |
Neg logit contributions | |
uala | -0.511 |
eni | -0.461 |
itton | -0.413 |
atin | -0.401 |
Devi | -0.399 |
Token | know |
Token ID | 760 |
Feature activation | +8.62e-02 |
Pos logit contributions | |
uala | +1.768 |
eni | +1.579 |
itton | +1.370 |
atin | +1.317 |
Devi | +1.311 |
Neg logit contributions | |
antioxid | -1.303 |
annoyance | -1.253 |
ONSORED | -1.220 |
pleas | -1.217 |
\\\\\\\\ | -1.212 |
Token | in |
Token ID | 287 |
Feature activation | -9.42e-01 |
Pos logit contributions | |
antioxid | +0.251 |
annoyance | +0.243 |
pleas | +0.238 |
Rate | +0.233 |
\\\\\\\\ | +0.230 |
Neg logit contributions | |
uala | -0.461 |
eni | -0.415 |
itton | -0.368 |
atin | -0.356 |
Devi | -0.355 |
Token | found |
Token ID | 1043 |
Feature activation | +5.35e-01 |
Pos logit contributions | |
uala | +1.850 |
eni | +1.659 |
itton | +1.462 |
atin | +1.425 |
Devi | +1.425 |
Neg logit contributions | |
antioxid | -1.054 |
annoyance | -1.001 |
\\\\\\\\ | -0.983 |
Rate | -0.975 |
pleas | -0.975 |
Token | that |
Token ID | 326 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
antioxid | +1.332 |
annoyance | +1.298 |
pleas | +1.279 |
Rate | +1.229 |
± | +1.224 |
Neg logit contributions | |
uala | -3.083 |
eni | -2.782 |
itton | -2.498 |
atin | -2.421 |
Devi | -2.410 |
Token | the |
Token ID | 262 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
antioxid | +0.587 |
annoyance | +0.570 |
pleas | +0.562 |
Rate | +0.550 |
\\\\\\\\ | +0.545 |
Neg logit contributions | |
uala | -1.027 |
eni | -0.917 |
itton | -0.813 |
atin | -0.788 |
Devi | -0.785 |
Token | ability |
Token ID | 2694 |
Feature activation | +6.29e-01 |
Pos logit contributions | |
antioxid | +0.557 |
annoyance | +0.539 |
pleas | +0.532 |
Rate | +0.521 |
---------- | +0.516 |
Neg logit contributions | |
uala | -1.002 |
eni | -0.896 |
itton | -0.794 |
atin | -0.770 |
Devi | -0.768 |
Token | to |
Token ID | 284 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
antioxid | +1.349 |
annoyance | +1.329 |
pleas | +1.310 |
Rate | +1.252 |
± | +1.251 |
Neg logit contributions | |
uala | -3.807 |
eni | -3.447 |
itton | -3.111 |
Devi | -3.020 |
atin | -3.020 |
Token | confront |
Token ID | 7239 |
Feature activation | +4.52e-01 |
Pos logit contributions | |
uala | +0.604 |
eni | +0.533 |
itton | +0.469 |
atin | +0.448 |
Devi | +0.446 |
Neg logit contributions | |
antioxid | -0.435 |
annoyance | -0.420 |
pleas | -0.412 |
\\\\\\\\ | -0.412 |
Rate | -0.407 |
Token | one |
Token ID | 530 |
Feature activation | +5.84e-01 |
Pos logit contributions | |
antioxid | +1.300 |
annoyance | +1.275 |
pleas | +1.259 |
Rate | +1.215 |
± | +1.209 |
Neg logit contributions | |
uala | -2.435 |
eni | -2.177 |
itton | -1.941 |
atin | -1.877 |
Devi | -1.865 |
Token | 's |
Token ID | 338 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
antioxid | +1.522 |
annoyance | +1.506 |
pleas | +1.476 |
Rate | +1.410 |
± | +1.402 |
Neg logit contributions | |
uala | -3.291 |
eni | -2.966 |
itton | -2.669 |
atin | -2.577 |
Devi | -2.552 |
Token | accuser |
Token ID | 43738 |
Feature activation | +3.72e-01 |
Pos logit contributions | |
uala | +0.699 |
eni | +0.617 |
itton | +0.531 |
Devi | +0.515 |
atin | +0.511 |
Neg logit contributions | |
antioxid | -0.563 |
annoyance | -0.539 |
Rate | -0.535 |
\\\\\\\\ | -0.535 |
pleas | -0.534 |
Token | is |
Token ID | 318 |
Feature activation | -3.95e-02 |
Pos logit contributions | |
antioxid | +0.999 |
annoyance | +0.976 |
pleas | +0.965 |
Rate | +0.929 |
± | +0.924 |
Neg logit contributions | |
uala | -2.070 |
eni | -1.858 |
itton | -1.664 |
atin | -1.611 |
Devi | -1.603 |
Token | important |
Token ID | 1593 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
uala | +0.205 |
eni | +0.183 |
itton | +0.162 |
atin | +0.157 |
Devi | +0.156 |
Neg logit contributions | |
antioxid | -0.121 |
annoyance | -0.118 |
pleas | -0.115 |
Rate | -0.114 |
\\\\\\\\ | -0.113 |
Token | � |
Token ID | 251 |
Feature activation | +3.50e-01 |
Pos logit contributions | |
antioxid | +1.980 |
annoyance | +1.918 |
pleas | +1.909 |
± | +1.854 |
---------- | +1.845 |
Neg logit contributions | |
uala | -3.995 |
eni | -3.600 |
itton | -3.217 |
atin | -3.105 |
Devi | -3.075 |
Token | While |
Token ID | 2893 |
Feature activation | +7.02e-01 |
Pos logit contributions | |
antioxid | +1.168 |
annoyance | +1.140 |
pleas | +1.127 |
Rate | +1.100 |
± | +1.090 |
Neg logit contributions | |
uala | -1.726 |
eni | -1.528 |
itton | -1.340 |
atin | -1.293 |
Devi | -1.289 |
Token | she |
Token ID | 673 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
antioxid | +2.232 |
annoyance | +2.188 |
pleas | +2.163 |
Rate | +2.100 |
± | +2.092 |
Neg logit contributions | |
uala | -3.564 |
eni | -3.164 |
itton | -2.798 |
atin | -2.693 |
Devi | -2.675 |
Token | does |
Token ID | 857 |
Feature activation | +7.81e-02 |
Pos logit contributions | |
antioxid | +1.187 |
annoyance | +1.150 |
pleas | +1.132 |
Rate | +1.102 |
± | +1.091 |
Neg logit contributions | |
uala | -2.232 |
eni | -2.000 |
itton | -1.779 |
atin | -1.722 |
Devi | -1.716 |
Token | believe |
Token ID | 1975 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
antioxid | +0.225 |
annoyance | +0.216 |
pleas | +0.214 |
Rate | +0.207 |
\\\\\\\\ | +0.207 |
Neg logit contributions | |
uala | -0.422 |
eni | -0.378 |
itton | -0.337 |
atin | -0.326 |
Devi | -0.325 |
Token | that |
Token ID | 326 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
antioxid | +0.661 |
annoyance | +0.637 |
pleas | +0.625 |
Rate | +0.608 |
---------- | +0.599 |
Neg logit contributions | |
uala | -1.553 |
eni | -1.401 |
itton | -1.258 |
atin | -1.222 |
Devi | -1.220 |
Token | Russia |
Token ID | 3284 |
Feature activation | +5.68e-02 |
Pos logit contributions | |
uala | +0.111 |
eni | +0.099 |
itton | +0.087 |
atin | +0.084 |
Devi | +0.084 |
Neg logit contributions | |
antioxid | -0.068 |
annoyance | -0.065 |
pleas | -0.064 |
Rate | -0.063 |
\\\\\\\\ | -0.063 |
Token | has |
Token ID | 468 |
Feature activation | +3.77e-02 |
Pos logit contributions | |
antioxid | +0.162 |
annoyance | +0.157 |
pleas | +0.154 |
Rate | +0.150 |
\\\\\\\\ | +0.148 |
Neg logit contributions | |
uala | -0.308 |
eni | -0.277 |
itton | -0.245 |
Devi | -0.238 |
atin | -0.238 |
Token | tried |
Token ID | 3088 |
Feature activation | -2.52e-01 |
Pos logit contributions | |
antioxid | +0.112 |
annoyance | +0.109 |
pleas | +0.107 |
Rate | +0.105 |
\\\\\\\\ | +0.104 |
Neg logit contributions | |
uala | -0.200 |
eni | -0.179 |
itton | -0.158 |
Devi | -0.153 |
atin | -0.152 |
Token | to |
Token ID | 284 |
Feature activation | -1.90e-01 |
Pos logit contributions | |
uala | +1.412 |
eni | +1.279 |
itton | +1.138 |
Devi | +1.107 |
atin | +1.102 |
Neg logit contributions | |
antioxid | -0.665 |
annoyance | -0.640 |
pleas | -0.619 |
Rate | -0.613 |
---------- | -0.608 |
Token | influence |
Token ID | 4588 |
Feature activation | -5.12e-01 |
Pos logit contributions | |
uala | +0.908 |
eni | +0.804 |
itton | +0.715 |
Devi | +0.674 |
atin | +0.671 |
Neg logit contributions | |
antioxid | -0.664 |
annoyance | -0.631 |
\\\\\\\\ | -0.625 |
pleas | -0.622 |
Rate | -0.615 |
Token | 's |
Token ID | 338 |
Feature activation | +5.17e-01 |
Pos logit contributions | |
antioxid | +0.077 |
annoyance | +0.075 |
pleas | +0.074 |
Rate | +0.072 |
± | +0.071 |
Neg logit contributions | |
uala | -0.160 |
eni | -0.144 |
itton | -0.129 |
atin | -0.124 |
Devi | -0.124 |
Token | stark |
Token ID | 19278 |
Feature activation | -5.17e-01 |
Pos logit contributions | |
antioxid | +1.307 |
annoyance | +1.273 |
pleas | +1.255 |
Rate | +1.205 |
± | +1.204 |
Neg logit contributions | |
uala | -2.968 |
eni | -2.673 |
itton | -2.404 |
atin | -2.321 |
Devi | -2.317 |
Token | " |
Token ID | 366 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
uala | +2.536 |
eni | +2.260 |
itton | +1.979 |
atin | +1.923 |
nil | +1.880 |
Neg logit contributions | |
antioxid | -1.715 |
annoyance | -1.645 |
pleas | -1.622 |
Rate | -1.621 |
---------- | -1.612 |
Token | inst |
Token ID | 8625 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
antioxid | +1.430 |
annoyance | +1.403 |
pleas | +1.395 |
Rate | +1.371 |
---------- | +1.354 |
Neg logit contributions | |
uala | -1.773 |
eni | -1.551 |
itton | -1.350 |
Devi | -1.296 |
atin | -1.288 |
Token | itution |
Token ID | 2738 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
antioxid | +0.125 |
annoyance | +0.124 |
pleas | +0.123 |
Rate | +0.121 |
± | +0.120 |
Neg logit contributions | |
uala | -0.087 |
eni | -0.073 |
itton | -0.059 |
Devi | -0.055 |
atin | -0.055 |
Token | chic |
Token ID | 47180 |
Feature activation | -1.91e-01 |
Pos logit contributions | |
uala | +2.291 |
eni | +2.030 |
itton | +1.779 |
atin | +1.746 |
Devi | +1.699 |
Neg logit contributions | |
antioxid | -1.530 |
annoyance | -1.464 |
pleas | -1.441 |
Rate | -1.429 |
\\\\\\\\ | -1.419 |
Token | " |
Token ID | 1 |
Feature activation | +3.84e-02 |
Pos logit contributions | |
uala | +0.935 |
eni | +0.828 |
itton | +0.725 |
atin | +0.703 |
Devi | +0.691 |
Neg logit contributions | |
antioxid | -0.649 |
annoyance | -0.632 |
pleas | -0.624 |
Rate | -0.612 |
± | -0.606 |
Token | would |
Token ID | 561 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
antioxid | +0.106 |
annoyance | +0.102 |
pleas | +0.100 |
Rate | +0.099 |
\\\\\\\\ | +0.099 |
Neg logit contributions | |
uala | -0.210 |
eni | -0.189 |
itton | -0.168 |
atin | -0.164 |
Devi | -0.163 |
Token | be |
Token ID | 307 |
Feature activation | +9.91e-02 |
Pos logit contributions | |
antioxid | +0.393 |
annoyance | +0.379 |
pleas | +0.374 |
Rate | +0.367 |
\\\\\\\\ | +0.367 |
Neg logit contributions | |
uala | -0.572 |
eni | -0.508 |
itton | -0.446 |
atin | -0.429 |
Devi | -0.427 |
Token | the |
Token ID | 262 |
Feature activation | -1.99e-01 |
Pos logit contributions | |
antioxid | +0.305 |
annoyance | +0.297 |
pleas | +0.293 |
Rate | +0.287 |
± | +0.283 |
Neg logit contributions | |
uala | -0.514 |
eni | -0.458 |
itton | -0.405 |
atin | -0.392 |
Devi | -0.390 |
Token | winner |
Token ID | 8464 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
uala | +0.980 |
eni | +0.872 |
itton | +0.759 |
atin | +0.737 |
Devi | +0.732 |
Neg logit contributions | |
antioxid | -0.659 |
annoyance | -0.629 |
Rate | -0.624 |
pleas | -0.621 |
\\\\\\\\ | -0.618 |
Token | ," |
Token ID | 553 |
Feature activation | +4.25e-01 |
Pos logit contributions | |
antioxid | +0.177 |
annoyance | +0.171 |
pleas | +0.168 |
Rate | +0.165 |
---------- | +0.164 |
Neg logit contributions | |
uala | -0.279 |
eni | -0.248 |
itton | -0.219 |
atin | -0.212 |
Devi | -0.210 |
Token | according |
Token ID | 1864 |
Feature activation | -1.90e-01 |
Pos logit contributions | |
antioxid | +1.274 |
annoyance | +1.251 |
pleas | +1.238 |
Rate | +1.194 |
± | +1.193 |
Neg logit contributions | |
uala | -2.227 |
eni | -1.990 |
itton | -1.766 |
atin | -1.702 |
Devi | -1.686 |
Token | to |
Token ID | 284 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
uala | +1.073 |
eni | +0.969 |
itton | +0.857 |
Devi | +0.841 |
atin | +0.837 |
Neg logit contributions | |
antioxid | -0.503 |
annoyance | -0.481 |
pleas | -0.462 |
\\\\\\\\ | -0.459 |
Rate | -0.458 |
Token | the |
Token ID | 262 |
Feature activation | +7.64e-03 |
Pos logit contributions | |
uala | +1.269 |
eni | +1.126 |
itton | +0.986 |
Devi | +0.960 |
atin | +0.949 |
Neg logit contributions | |
antioxid | -0.849 |
annoyance | -0.824 |
pleas | -0.816 |
Rate | -0.803 |
---------- | -0.797 |
Token | narrator |
Token ID | 32339 |
Feature activation | +2.93e-01 |
Pos logit contributions | |
antioxid | +0.029 |
annoyance | +0.028 |
pleas | +0.028 |
Rate | +0.028 |
---------- | +0.027 |
Neg logit contributions | |
uala | -0.034 |
eni | -0.030 |
itton | -0.026 |
Devi | -0.025 |
atin | -0.025 |
Token | . |
Token ID | 13 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
antioxid | +0.937 |
annoyance | +0.919 |
pleas | +0.909 |
± | +0.881 |
Rate | +0.876 |
Neg logit contributions | |
uala | -1.484 |
eni | -1.318 |
itton | -1.168 |
atin | -1.124 |
Devi | -1.106 |
Token | Also |
Token ID | 4418 |
Feature activation | +8.90e-01 |
Pos logit contributions | |
uala | +0.533 |
eni | +0.474 |
itton | +0.415 |
Devi | +0.405 |
atin | +0.403 |
Neg logit contributions | |
antioxid | -0.347 |
annoyance | -0.338 |
pleas | -0.334 |
Rate | -0.325 |
\\\\\\\\ | -0.322 |
Token | still |
Token ID | 991 |
Feature activation | +4.27e-01 |
Pos logit contributions | |
antioxid | +2.599 |
pleas | +2.570 |
annoyance | +2.565 |
± | +2.454 |
---------- | +2.406 |
Neg logit contributions | |
uala | -4.672 |
eni | -4.169 |
itton | -3.730 |
atin | -3.578 |
� | -3.568 |
Token | frequently |
Token ID | 6777 |
Feature activation | -3.47e-02 |
Pos logit contributions | |
antioxid | +1.356 |
annoyance | +1.327 |
pleas | +1.317 |
Rate | +1.272 |
± | +1.271 |
Neg logit contributions | |
uala | -2.164 |
eni | -1.922 |
itton | -1.701 |
atin | -1.638 |
Devi | -1.630 |
Token | seen |
Token ID | 1775 |
Feature activation | +6.40e-01 |
Pos logit contributions | |
uala | +0.181 |
eni | +0.162 |
itton | +0.143 |
atin | +0.138 |
Devi | +0.138 |
Neg logit contributions | |
antioxid | -0.106 |
annoyance | -0.103 |
pleas | -0.101 |
Rate | -0.099 |
\\\\\\\\ | -0.098 |
Token | today |
Token ID | 1909 |
Feature activation | -8.81e-02 |
Pos logit contributions | |
antioxid | +1.991 |
annoyance | +1.962 |
pleas | +1.952 |
± | +1.882 |
---------- | +1.870 |
Neg logit contributions | |
uala | -3.283 |
eni | -2.900 |
itton | -2.577 |
atin | -2.486 |
Devi | -2.466 |
Token | is |
Token ID | 318 |
Feature activation | +7.81e-02 |
Pos logit contributions | |
uala | +0.994 |
eni | +0.897 |
itton | +0.796 |
Devi | +0.774 |
atin | +0.768 |
Neg logit contributions | |
antioxid | -0.565 |
annoyance | -0.540 |
pleas | -0.528 |
\\\\\\\\ | -0.521 |
---------- | -0.517 |
Token | a |
Token ID | 257 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
antioxid | +0.234 |
annoyance | +0.226 |
pleas | +0.223 |
Rate | +0.219 |
\\\\\\\\ | +0.218 |
Neg logit contributions | |
uala | -0.412 |
eni | -0.367 |
itton | -0.327 |
atin | -0.317 |
Devi | -0.316 |
Token | credit |
Token ID | 3884 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
antioxid | +0.399 |
annoyance | +0.383 |
pleas | +0.378 |
Rate | +0.373 |
\\\\\\\\ | +0.371 |
Neg logit contributions | |
uala | -0.646 |
eni | -0.574 |
itton | -0.508 |
Devi | -0.492 |
atin | -0.492 |
Token | - |
Token ID | 12 |
Feature activation | -6.58e-02 |
Pos logit contributions | |
uala | +0.798 |
eni | +0.710 |
itton | +0.637 |
atin | +0.610 |
Devi | +0.608 |
Neg logit contributions | |
antioxid | -0.469 |
annoyance | -0.448 |
pleas | -0.442 |
\\\\\\\\ | -0.438 |
Rate | -0.437 |
Token | reporting |
Token ID | 49914 |
Feature activation | -9.35e-01 |
Pos logit contributions | |
uala | +0.322 |
eni | +0.285 |
itton | +0.250 |
atin | +0.241 |
Devi | +0.239 |
Neg logit contributions | |
antioxid | -0.224 |
annoyance | -0.216 |
pleas | -0.214 |
± | -0.208 |
\\\\\\\\ | -0.208 |
Token | agency |
Token ID | 4086 |
Feature activation | -6.62e-01 |
Pos logit contributions | |
uala | +4.873 |
eni | +4.316 |
itton | +3.947 |
Devi | +3.803 |
atin | +3.757 |
Neg logit contributions | |
antioxid | -2.656 |
\\\\\\\\ | -2.520 |
Rate | -2.477 |
---------- | -2.475 |
ULTS | -2.459 |
Token | , |
Token ID | 11 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
uala | +3.168 |
eni | +2.791 |
itton | +2.465 |
atin | +2.377 |
Devi | +2.363 |
Neg logit contributions | |
antioxid | -2.285 |
annoyance | -2.181 |
pleas | -2.164 |
Rate | -2.135 |
\\\\\\\\ | -2.125 |
Token | JPMorgan |
Token ID | 43318 |
Feature activation | -2.29e-01 |
Pos logit contributions | |
uala | +0.555 |
eni | +0.493 |
itton | +0.437 |
atin | +0.426 |
Devi | +0.424 |
Neg logit contributions | |
antioxid | -0.335 |
annoyance | -0.323 |
pleas | -0.319 |
\\\\\\\\ | -0.311 |
Rate | -0.310 |
Token | Chase |
Token ID | 16346 |
Feature activation | +4.10e-01 |
Pos logit contributions | |
uala | +1.074 |
eni | +0.949 |
itton | +0.831 |
atin | +0.800 |
Devi | +0.796 |
Neg logit contributions | |
antioxid | -0.818 |
annoyance | -0.794 |
pleas | -0.785 |
Rate | -0.766 |
---------- | -0.763 |
Token | , |
Token ID | 11 |
Feature activation | +5.91e-01 |
Pos logit contributions | |
antioxid | +1.356 |
annoyance | +1.336 |
pleas | +1.319 |
Rate | +1.294 |
± | +1.289 |
Neg logit contributions | |
uala | -2.022 |
eni | -1.789 |
itton | -1.564 |
atin | -1.505 |
Devi | -1.498 |
Token | and |
Token ID | 290 |
Feature activation | +6.11e-01 |
Pos logit contributions | |
antioxid | +1.766 |
annoyance | +1.736 |
pleas | +1.713 |
Rate | +1.668 |
± | +1.657 |
Neg logit contributions | |
uala | -3.109 |
eni | -2.778 |
itton | -2.460 |
atin | -2.364 |
Devi | -2.356 |
Token | due |
Token ID | 2233 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
uala | +2.243 |
eni | +2.020 |
itton | +1.779 |
atin | +1.708 |
Devi | +1.700 |
Neg logit contributions | |
antioxid | -1.440 |
annoyance | -1.409 |
Rate | -1.399 |
pleas | -1.388 |
\\\\\\\\ | -1.357 |
Token | to |
Token ID | 284 |
Feature activation | -3.36e-01 |
Pos logit contributions | |
antioxid | +0.289 |
annoyance | +0.280 |
pleas | +0.276 |
Rate | +0.264 |
± | +0.263 |
Neg logit contributions | |
uala | -0.732 |
eni | -0.662 |
itton | -0.596 |
atin | -0.578 |
Devi | -0.577 |
Token | an |
Token ID | 281 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
uala | +1.720 |
eni | +1.536 |
itton | +1.358 |
Devi | +1.314 |
atin | +1.311 |
Neg logit contributions | |
antioxid | -1.036 |
annoyance | -0.992 |
Rate | -0.983 |
pleas | -0.977 |
\\\\\\\\ | -0.968 |
Token | omission |
Token ID | 35725 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
uala | +1.360 |
eni | +1.214 |
itton | +1.057 |
atin | +1.020 |
Devi | +1.004 |
Neg logit contributions | |
antioxid | -0.976 |
pleas | -0.948 |
annoyance | -0.940 |
Rate | -0.933 |
---------- | -0.919 |
Token | from |
Token ID | 422 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
uala | +0.820 |
eni | +0.735 |
itton | +0.648 |
atin | +0.627 |
Devi | +0.623 |
Neg logit contributions | |
antioxid | -0.492 |
annoyance | -0.474 |
pleas | -0.468 |
Rate | -0.462 |
\\\\\\\\ | -0.456 |
Token | Team |
Token ID | 4816 |
Feature activation | -5.34e-01 |
Pos logit contributions | |
uala | +0.681 |
eni | +0.607 |
itton | +0.539 |
atin | +0.522 |
Devi | +0.519 |
Neg logit contributions | |
antioxid | -0.387 |
annoyance | -0.377 |
pleas | -0.370 |
Rate | -0.363 |
---------- | -0.358 |
Token | USA |
Token ID | 4916 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
uala | +2.799 |
eni | +2.501 |
itton | +2.217 |
atin | +2.178 |
Devi | +2.145 |
Neg logit contributions | |
antioxid | -1.601 |
annoyance | -1.554 |
pleas | -1.510 |
Rate | -1.480 |
\\\\\\\\ | -1.478 |
Token | � |
Token ID | 447 |
Feature activation | -1.88e-02 |
Pos logit contributions | |
uala | +0.863 |
eni | +0.771 |
itton | +0.684 |
atin | +0.662 |
Devi | +0.655 |
Neg logit contributions | |
antioxid | -0.515 |
annoyance | -0.503 |
pleas | -0.494 |
Rate | -0.488 |
---------- | -0.481 |
Token | � |
Token ID | 247 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
uala | +0.097 |
eni | +0.086 |
itton | +0.076 |
atin | +0.073 |
Devi | +0.073 |
Neg logit contributions | |
antioxid | -0.058 |
annoyance | -0.057 |
pleas | -0.056 |
Rate | -0.054 |
gery | -0.054 |
Token | s |
Token ID | 82 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
uala | +1.111 |
eni | +1.007 |
itton | +0.912 |
atin | +0.893 |
Devi | +0.882 |
Neg logit contributions | |
antioxid | -0.368 |
annoyance | -0.353 |
pleas | -0.344 |
Rate | -0.332 |
± | -0.326 |
Token | roster |
Token ID | 9354 |
Feature activation | -5.72e-01 |
Pos logit contributions | |
uala | +1.282 |
eni | +1.152 |
itton | +1.027 |
atin | +0.999 |
Devi | +0.994 |
Neg logit contributions | |
antioxid | -0.624 |
annoyance | -0.603 |
pleas | -0.592 |
Rate | -0.588 |
\\\\\\\\ | -0.587 |
Token | . |
Token ID | 13 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
uala | +0.126 |
eni | +0.112 |
itton | +0.098 |
Devi | +0.095 |
atin | +0.095 |
Neg logit contributions | |
antioxid | -0.080 |
annoyance | -0.077 |
pleas | -0.076 |
Rate | -0.075 |
---------- | -0.074 |
Token |
|
Token ID | 198 |
Feature activation | -1.61e-01 |
Pos logit contributions | |
antioxid | +0.553 |
annoyance | +0.536 |
pleas | +0.526 |
Rate | +0.512 |
gery | +0.506 |
Neg logit contributions | |
uala | -0.853 |
eni | -0.755 |
itton | -0.660 |
Devi | -0.651 |
atin | -0.644 |
Token |
|
Token ID | 198 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
uala | +0.748 |
eni | +0.661 |
itton | +0.562 |
Devi | +0.549 |
atin | +0.548 |
Neg logit contributions | |
antioxid | -0.595 |
annoyance | -0.570 |
pleas | -0.548 |
\\\\\\\\ | -0.545 |
reven | -0.542 |
Token | When |
Token ID | 2215 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
antioxid | +0.052 |
annoyance | +0.050 |
pleas | +0.049 |
regression | +0.048 |
reven | +0.048 |
Neg logit contributions | |
uala | -0.073 |
eni | -0.065 |
itton | -0.056 |
atin | -0.055 |
nil | -0.054 |
Token | you |
Token ID | 345 |
Feature activation | -4.43e-01 |
Pos logit contributions | |
uala | +1.456 |
eni | +1.297 |
itton | +1.145 |
Devi | +1.134 |
atin | +1.119 |
Neg logit contributions | |
antioxid | -0.795 |
annoyance | -0.759 |
\\\\\\\\ | -0.741 |
pleas | -0.741 |
Rate | -0.740 |
Token | say |
Token ID | 910 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
uala | +2.083 |
eni | +1.867 |
itton | +1.619 |
Devi | +1.544 |
atin | +1.539 |
Neg logit contributions | |
antioxid | -1.588 |
annoyance | -1.518 |
\\\\\\\\ | -1.477 |
pleas | -1.471 |
Rate | -1.464 |
Token | this |
Token ID | 428 |
Feature activation | -5.53e-01 |
Pos logit contributions | |
uala | +5.462 |
eni | +4.865 |
Devi | +4.293 |
atin | +4.223 |
itton | +4.210 |
Neg logit contributions | |
antioxid | -3.229 |
Rate | -3.036 |
ONSORED | -3.033 |
\\\\\\\\ | -2.996 |
annoyance | -2.983 |
Token | , |
Token ID | 11 |
Feature activation | -5.19e-01 |
Pos logit contributions | |
uala | +2.711 |
eni | +2.421 |
itton | +2.091 |
Devi | +2.064 |
atin | +2.038 |
Neg logit contributions | |
antioxid | -1.781 |
annoyance | -1.706 |
Rate | -1.704 |
pleas | -1.694 |
\\\\\\\\ | -1.690 |
Token | it |
Token ID | 340 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
uala | +2.660 |
eni | +2.368 |
itton | +2.090 |
Devi | +2.080 |
atin | +2.041 |
Neg logit contributions | |
antioxid | -1.571 |
annoyance | -1.493 |
\\\\\\\\ | -1.488 |
ONSORED | -1.481 |
Rate | -1.477 |
Token | tells |
Token ID | 4952 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
uala | +1.470 |
eni | +1.320 |
itton | +1.166 |
Devi | +1.134 |
atin | +1.128 |
Neg logit contributions | |
antioxid | -0.805 |
annoyance | -0.766 |
Rate | -0.745 |
pleas | -0.744 |
\\\\\\\\ | -0.732 |
Token | me |
Token ID | 502 |
Feature activation | -4.90e-01 |
Pos logit contributions | |
uala | +1.427 |
eni | +1.286 |
itton | +1.132 |
Devi | +1.110 |
atin | +1.094 |
Neg logit contributions | |
antioxid | -0.803 |
annoyance | -0.768 |
pleas | -0.754 |
Rate | -0.749 |
\\\\\\\\ | -0.736 |
Token | me |
Token ID | 502 |
Feature activation | -5.14e-01 |
Pos logit contributions | |
uala | +1.666 |
eni | +1.489 |
itton | +1.318 |
Devi | +1.288 |
atin | +1.284 |
Neg logit contributions | |
antioxid | -0.946 |
annoyance | -0.911 |
pleas | -0.879 |
Rate | -0.866 |
---------- | -0.855 |
Token | � |
Token ID | 447 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
uala | +2.615 |
eni | +2.334 |
itton | +2.043 |
Devi | +2.000 |
atin | +1.977 |
Neg logit contributions | |
antioxid | -1.619 |
annoyance | -1.578 |
pleas | -1.535 |
Rate | -1.515 |
gery | -1.503 |
Token | � |
Token ID | 247 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
antioxid | +0.686 |
annoyance | +0.665 |
pleas | +0.658 |
Rate | +0.636 |
± | +0.634 |
Neg logit contributions | |
uala | -1.512 |
eni | -1.362 |
itton | -1.221 |
atin | -1.184 |
Devi | -1.176 |
Token | and |
Token ID | 290 |
Feature activation | -1.61e-01 |
Pos logit contributions | |
antioxid | +0.725 |
annoyance | +0.704 |
pleas | +0.693 |
Rate | +0.676 |
± | +0.666 |
Neg logit contributions | |
uala | -1.355 |
eni | -1.213 |
itton | -1.077 |
atin | -1.046 |
Devi | -1.040 |
Token | all |
Token ID | 477 |
Feature activation | -4.11e-01 |
Pos logit contributions | |
uala | +0.848 |
eni | +0.756 |
itton | +0.667 |
Devi | +0.651 |
atin | +0.648 |
Neg logit contributions | |
antioxid | -0.485 |
annoyance | -0.466 |
pleas | -0.460 |
Rate | -0.452 |
\\\\\\\\ | -0.446 |
Token | that |
Token ID | 326 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
uala | +2.175 |
eni | +1.960 |
itton | +1.724 |
atin | +1.682 |
Devi | +1.667 |
Neg logit contributions | |
antioxid | -1.214 |
annoyance | -1.164 |
pleas | -1.143 |
Rate | -1.134 |
\\\\\\\\ | -1.105 |
Token | stuff |
Token ID | 3404 |
Feature activation | -9.25e-02 |
Pos logit contributions | |
uala | +6.249 |
eni | +5.571 |
itton | +4.892 |
atin | +4.833 |
Devi | +4.756 |
Neg logit contributions | |
antioxid | -3.846 |
annoyance | -3.704 |
Rate | -3.680 |
ONSORED | -3.632 |
pleas | -3.623 |
Token | , |
Token ID | 11 |
Feature activation | -3.19e-02 |
Pos logit contributions | |
uala | +0.471 |
eni | +0.419 |
itton | +0.368 |
atin | +0.357 |
Devi | +0.355 |
Neg logit contributions | |
antioxid | -0.295 |
annoyance | -0.284 |
pleas | -0.281 |
Rate | -0.278 |
\\\\\\\\ | -0.271 |
Token | and |
Token ID | 290 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
uala | +0.175 |
eni | +0.156 |
itton | +0.140 |
Devi | +0.136 |
atin | +0.136 |
Neg logit contributions | |
antioxid | -0.089 |
annoyance | -0.086 |
pleas | -0.084 |
Rate | -0.083 |
gery | -0.081 |
Token | I |
Token ID | 314 |
Feature activation | +1.84e-01 |
Pos logit contributions | |
uala | +1.224 |
eni | +1.092 |
itton | +0.966 |
Devi | +0.944 |
atin | +0.937 |
Neg logit contributions | |
antioxid | -0.691 |
annoyance | -0.660 |
pleas | -0.649 |
Rate | -0.642 |
\\\\\\\\ | -0.635 |
Token | don |
Token ID | 836 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
antioxid | +0.604 |
annoyance | +0.590 |
pleas | +0.582 |
Rate | +0.568 |
± | +0.563 |
Neg logit contributions | |
uala | -0.919 |
eni | -0.816 |
itton | -0.717 |
atin | -0.692 |
Devi | -0.689 |
Token | ing |
Token ID | 278 |
Feature activation | +4.47e-02 |
Pos logit contributions | |
antioxid | +2.044 |
annoyance | +2.001 |
pleas | +1.987 |
± | +1.928 |
Rate | +1.922 |
Neg logit contributions | |
uala | -3.279 |
eni | -2.903 |
itton | -2.567 |
Devi | -2.473 |
atin | -2.470 |
Token | lately |
Token ID | 16537 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
antioxid | +0.143 |
annoyance | +0.139 |
pleas | +0.137 |
Rate | +0.135 |
---------- | +0.133 |
Neg logit contributions | |
uala | -0.226 |
eni | -0.202 |
itton | -0.178 |
atin | -0.171 |
Devi | -0.171 |
Token | ? |
Token ID | 30 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
antioxid | +0.487 |
annoyance | +0.475 |
pleas | +0.469 |
Rate | +0.459 |
---------- | +0.453 |
Neg logit contributions | |
uala | -0.706 |
eni | -0.626 |
itton | -0.548 |
atin | -0.528 |
Devi | -0.527 |
Token | Well |
Token ID | 3894 |
Feature activation | -4.23e-01 |
Pos logit contributions | |
antioxid | +0.058 |
annoyance | +0.057 |
pleas | +0.056 |
Rate | +0.054 |
gery | +0.054 |
Neg logit contributions | |
uala | -0.093 |
eni | -0.083 |
itton | -0.073 |
Devi | -0.071 |
atin | -0.071 |
Token | , |
Token ID | 11 |
Feature activation | -1.97e-01 |
Pos logit contributions | |
uala | +2.023 |
eni | +1.781 |
itton | +1.563 |
Devi | +1.509 |
atin | +1.504 |
Neg logit contributions | |
antioxid | -1.465 |
annoyance | -1.422 |
pleas | -1.399 |
Rate | -1.380 |
gery | -1.366 |
Token | fuck |
Token ID | 5089 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
uala | +1.009 |
eni | +0.898 |
itton | +0.800 |
Devi | +0.777 |
atin | +0.771 |
Neg logit contributions | |
antioxid | -0.607 |
annoyance | -0.582 |
pleas | -0.574 |
\\\\\\\\ | -0.568 |
Rate | -0.566 |
Token | your |
Token ID | 534 |
Feature activation | +2.36e-02 |
Pos logit contributions | |
uala | +5.386 |
eni | +4.765 |
itton | +4.204 |
atin | +4.141 |
Devi | +4.079 |
Neg logit contributions | |
antioxid | -3.135 |
annoyance | -2.970 |
pleas | -2.934 |
Rate | -2.898 |
---------- | -2.860 |
Token | homebrew |
Token ID | 45729 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
antioxid | +0.074 |
annoyance | +0.071 |
pleas | +0.070 |
Rate | +0.069 |
---------- | +0.069 |
Neg logit contributions | |
uala | -0.121 |
eni | -0.108 |
itton | -0.095 |
atin | -0.092 |
Devi | -0.092 |
Token | ing |
Token ID | 278 |
Feature activation | +1.91e-02 |
Pos logit contributions | |
antioxid | +0.939 |
annoyance | +0.917 |
pleas | +0.906 |
Rate | +0.884 |
± | +0.877 |
Neg logit contributions | |
uala | -1.417 |
eni | -1.257 |
itton | -1.105 |
atin | -1.065 |
Devi | -1.061 |
Token | . |
Token ID | 13 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
antioxid | +0.060 |
annoyance | +0.058 |
pleas | +0.057 |
Rate | +0.056 |
\\\\\\\\ | +0.056 |
Neg logit contributions | |
uala | -0.098 |
eni | -0.087 |
itton | -0.077 |
atin | -0.074 |
Devi | -0.074 |
Token | Give |
Token ID | 13786 |
Feature activation | +9.24e-02 |
Pos logit contributions | |
uala | +0.530 |
eni | +0.471 |
itton | +0.415 |
Devi | +0.404 |
atin | +0.402 |
Neg logit contributions | |
antioxid | -0.331 |
annoyance | -0.322 |
pleas | -0.317 |
Rate | -0.309 |
---------- | -0.304 |
Token | , |
Token ID | 11 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
uala | +2.976 |
eni | +2.578 |
itton | +2.212 |
atin | +2.146 |
Devi | +2.133 |
Neg logit contributions | |
antioxid | -2.643 |
annoyance | -2.541 |
\\\\\\\\ | -2.505 |
ONSORED | -2.485 |
pleas | -2.477 |
Token | a |
Token ID | 257 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
uala | +0.714 |
eni | +0.635 |
itton | +0.562 |
Devi | +0.547 |
atin | +0.547 |
Neg logit contributions | |
antioxid | -0.419 |
annoyance | -0.403 |
pleas | -0.399 |
Rate | -0.389 |
\\\\\\\\ | -0.389 |
Token | fluid |
Token ID | 11711 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
antioxid | +0.894 |
annoyance | +0.873 |
pleas | +0.862 |
Rate | +0.841 |
± | +0.834 |
Neg logit contributions | |
uala | -1.414 |
eni | -1.256 |
itton | -1.107 |
atin | -1.069 |
Devi | -1.065 |
Token | with |
Token ID | 351 |
Feature activation | +4.11e-02 |
Pos logit contributions | |
uala | +1.012 |
eni | +0.905 |
itton | +0.809 |
atin | +0.794 |
Devi | +0.785 |
Neg logit contributions | |
antioxid | -0.498 |
annoyance | -0.472 |
pleas | -0.469 |
\\\\\\\\ | -0.464 |
Rate | -0.456 |
Token | some |
Token ID | 617 |
Feature activation | -3.15e-01 |
Pos logit contributions | |
antioxid | +0.120 |
annoyance | +0.116 |
pleas | +0.115 |
\\\\\\\\ | +0.112 |
Rate | +0.112 |
Neg logit contributions | |
uala | -0.218 |
eni | -0.195 |
itton | -0.172 |
Devi | -0.168 |
atin | -0.168 |
Token | uniform |
Token ID | 8187 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
uala | +1.645 |
eni | +1.467 |
itton | +1.291 |
Devi | +1.264 |
atin | +1.255 |
Neg logit contributions | |
antioxid | -0.943 |
annoyance | -0.904 |
pleas | -0.894 |
\\\\\\\\ | -0.891 |
gery | -0.882 |
Token | ambient |
Token ID | 25237 |
Feature activation | +2.80e-01 |
Pos logit contributions | |
uala | +5.476 |
eni | +4.863 |
itton | +4.225 |
atin | +4.179 |
Devi | +4.127 |
Neg logit contributions | |
antioxid | -3.112 |
ONSORED | -2.937 |
annoyance | -2.932 |
pleas | -2.930 |
gery | -2.911 |
Token | density |
Token ID | 12109 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
antioxid | +0.784 |
annoyance | +0.759 |
pleas | +0.751 |
Rate | +0.729 |
---------- | +0.720 |
Neg logit contributions | |
uala | -1.531 |
eni | -1.372 |
itton | -1.222 |
atin | -1.185 |
Devi | -1.183 |
Token | ( |
Token ID | 357 |
Feature activation | -4.98e-01 |
Pos logit contributions | |
uala | +0.924 |
eni | +0.827 |
itton | +0.727 |
Devi | +0.709 |
atin | +0.705 |
Neg logit contributions | |
antioxid | -0.561 |
annoyance | -0.535 |
pleas | -0.532 |
\\\\\\\\ | -0.513 |
Rate | -0.513 |
Token | as |
Token ID | 292 |
Feature activation | -6.63e-02 |
Pos logit contributions | |
uala | +2.214 |
eni | +1.942 |
itton | +1.656 |
atin | +1.625 |
nil | +1.605 |
Neg logit contributions | |
antioxid | -1.902 |
annoyance | -1.848 |
pleas | -1.828 |
\\\\\\\\ | -1.765 |
gery | -1.765 |
Token | the |
Token ID | 262 |
Feature activation | -4.36e-01 |
Pos logit contributions | |
uala | +0.351 |
eni | +0.313 |
itton | +0.277 |
atin | +0.270 |
Devi | +0.269 |
Neg logit contributions | |
antioxid | -0.199 |
annoyance | -0.191 |
pleas | -0.189 |
Rate | -0.183 |
\\\\\\\\ | -0.182 |
Token | get |
Token ID | 651 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
antioxid | +0.269 |
annoyance | +0.260 |
pleas | +0.255 |
\\\\\\\\ | +0.253 |
Rate | +0.251 |
Neg logit contributions | |
uala | -0.375 |
eni | -0.333 |
itton | -0.292 |
atin | -0.280 |
Devi | -0.278 |
Token | at |
Token ID | 379 |
Feature activation | -4.76e-01 |
Pos logit contributions | |
uala | +0.902 |
eni | +0.807 |
itton | +0.710 |
Devi | +0.693 |
atin | +0.692 |
Neg logit contributions | |
antioxid | -0.506 |
annoyance | -0.489 |
\\\\\\\\ | -0.486 |
Rate | -0.482 |
pleas | -0.476 |
Token | least |
Token ID | 1551 |
Feature activation | +5.87e-01 |
Pos logit contributions | |
uala | +2.332 |
eni | +2.085 |
itton | +1.818 |
atin | +1.760 |
Devi | +1.729 |
Neg logit contributions | |
antioxid | -1.592 |
annoyance | -1.532 |
\\\\\\\\ | -1.493 |
pleas | -1.478 |
gery | -1.465 |
Token | 8 |
Token ID | 807 |
Feature activation | -5.20e-03 |
Pos logit contributions | |
antioxid | +1.794 |
annoyance | +1.758 |
pleas | +1.740 |
± | +1.683 |
Rate | +1.676 |
Neg logit contributions | |
uala | -3.060 |
eni | -2.725 |
itton | -2.419 |
atin | -2.331 |
Devi | -2.323 |
Token | 1 |
Token ID | 352 |
Feature activation | +8.55e-03 |
Pos logit contributions | |
uala | +0.032 |
eni | +0.029 |
itton | +0.026 |
Devi | +0.025 |
atin | +0.025 |
Neg logit contributions | |
antioxid | -0.012 |
annoyance | -0.011 |
pleas | -0.011 |
Rate | -0.011 |
\\\\\\\\ | -0.010 |
Token | / |
Token ID | 14 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
antioxid | +0.023 |
annoyance | +0.022 |
pleas | +0.022 |
Rate | +0.021 |
---------- | +0.021 |
Neg logit contributions | |
uala | -0.048 |
eni | -0.043 |
itton | -0.038 |
atin | -0.037 |
Devi | -0.037 |
Token | 2 |
Token ID | 17 |
Feature activation | -6.80e-02 |
Pos logit contributions | |
uala | +4.291 |
eni | +3.562 |
atin | +2.975 |
� | +2.813 |
etta | +2.802 |
Neg logit contributions | |
antioxid | -5.250 |
annoyance | -5.068 |
reven | -4.998 |
\\\\\\\\ | -4.964 |
pleas | -4.929 |
Token | hours |
Token ID | 2250 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
uala | +0.434 |
eni | +0.397 |
itton | +0.360 |
Devi | +0.351 |
atin | +0.351 |
Neg logit contributions | |
antioxid | -0.127 |
annoyance | -0.119 |
Rate | -0.114 |
pleas | -0.112 |
\\\\\\\\ | -0.112 |
Token | of |
Token ID | 286 |
Feature activation | +4.98e-01 |
Pos logit contributions | |
antioxid | +0.443 |
annoyance | +0.424 |
pleas | +0.414 |
Rate | +0.413 |
\\\\\\\\ | +0.412 |
Neg logit contributions | |
uala | -0.998 |
eni | -0.901 |
itton | -0.805 |
atin | -0.784 |
Devi | -0.783 |
Token | sleep |
Token ID | 3993 |
Feature activation | +9.57e-02 |
Pos logit contributions | |
antioxid | +1.564 |
annoyance | +1.532 |
pleas | +1.516 |
Rate | +1.462 |
± | +1.461 |
Neg logit contributions | |
uala | -2.550 |
eni | -2.270 |
itton | -2.007 |
atin | -1.938 |
Devi | -1.926 |
Token | a |
Token ID | 257 |
Feature activation | -5.64e-01 |
Pos logit contributions | |
antioxid | +0.278 |
annoyance | +0.267 |
pleas | +0.262 |
Rate | +0.260 |
\\\\\\\\ | +0.257 |
Neg logit contributions | |
uala | -0.512 |
eni | -0.460 |
itton | -0.408 |
atin | -0.395 |
Devi | -0.395 |