Token | we |
Token ID | 356 |
Feature activation | -8.41e+00 |
Pos logit contributions | |
WAY | +2.513 |
PET | +2.283 |
ARE | +2.098 |
VER | +2.066 |
ggle | +2.065 |
Neg logit contributions | |
ividual | -2.811 |
anonymity | -2.735 |
favorite | -2.627 |
important | -2.515 |
-) | -2.505 |
Token | work |
Token ID | 670 |
Feature activation | -3.11e+00 |
Pos logit contributions | |
WAY | +5.842 |
PET | +5.287 |
ggle | +4.882 |
ARE | +4.841 |
respectively | +4.804 |
Neg logit contributions | |
ividual | -7.415 |
anonymity | -7.322 |
favorite | -6.967 |
important | -6.747 |
interstitial | -6.646 |
Token | . |
Token ID | 13 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
WAY | +2.435 |
PET | +2.216 |
ARE | +2.033 |
ggle | +2.002 |
VER | +1.993 |
Neg logit contributions | |
ividual | -2.618 |
anonymity | -2.572 |
favorite | -2.447 |
important | -2.363 |
-) | -2.344 |
Token | It |
Token ID | 632 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
anonymity | +8.641 |
-) | +8.603 |
important | +8.471 |
favorite | +8.412 |
ividual | +8.229 |
Neg logit contributions | |
WAY | -10.291 |
PET | -9.447 |
ggle | -9.103 |
VERT | -8.898 |
ARE | -8.683 |
Token | would |
Token ID | 561 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
anonymity | +6.691 |
ividual | +6.649 |
important | +6.198 |
-) | +6.039 |
favorite | +6.016 |
Neg logit contributions | |
WAY | -10.000 |
PET | -9.108 |
ARE | -8.687 |
VERT | -8.544 |
TW | -8.170 |
Token | have |
Token ID | 423 |
Feature activation | +2.71e+01 |
Pos logit contributions | |
anonymity | +11.179 |
ividual | +10.510 |
spoil | +10.164 |
-) | +10.022 |
favorite | +9.843 |
Neg logit contributions | |
WAY | -16.701 |
PET | -15.205 |
ARE | -14.715 |
VERT | -14.545 |
Charges | -14.052 |
Token | been |
Token ID | 587 |
Feature activation | +8.16e+00 |
Pos logit contributions | |
anonymity | +12.352 |
important | +11.261 |
-) | +10.502 |
spoil | +10.344 |
ividual | +10.116 |
Neg logit contributions | |
WAY | -22.191 |
PET | -21.428 |
VERT | -19.364 |
ARE | -19.108 |
Charges | -19.038 |
Token | nice |
Token ID | 3621 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
anonymity | +5.899 |
ividual | +5.471 |
important | +5.281 |
favorite | +5.222 |
-) | +5.079 |
Neg logit contributions | |
WAY | -6.894 |
PET | -6.599 |
ARE | -6.055 |
VERT | -5.839 |
TW | -5.777 |
Token | to |
Token ID | 284 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
anonymity | +8.052 |
ividual | +7.632 |
important | +7.028 |
-) | +6.938 |
favorite | +6.937 |
Neg logit contributions | |
WAY | -11.996 |
PET | -11.073 |
ARE | -10.326 |
ggle | -10.252 |
Charges | -10.211 |
Token | win |
Token ID | 1592 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
anonymity | +7.638 |
ividual | +7.033 |
favorite | +6.663 |
-) | +6.632 |
important | +6.496 |
Neg logit contributions | |
WAY | -9.556 |
PET | -8.783 |
ARE | -8.280 |
VERT | -8.121 |
VER | -8.086 |
Token | it |
Token ID | 340 |
Feature activation | +9.36e+00 |
Pos logit contributions | |
anonymity | +10.965 |
important | +9.925 |
ividual | +9.899 |
-) | +9.352 |
favorite | +9.149 |
Neg logit contributions | |
WAY | -13.400 |
PET | -12.190 |
ARE | -11.605 |
VERT | -11.069 |
TW | -10.918 |
Token | The |
Token ID | 464 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
anonymity | +1.628 |
ividual | +1.609 |
favorite | +1.565 |
important | +1.521 |
-) | +1.497 |
Neg logit contributions | |
WAY | -1.433 |
PET | -1.286 |
ggle | -1.190 |
ARE | -1.173 |
respectively | -1.166 |
Token | non |
Token ID | 1729 |
Feature activation | +1.59e+01 |
Pos logit contributions | |
anonymity | +0.089 |
ividual | +0.089 |
favorite | +0.082 |
important | +0.080 |
-) | +0.079 |
Neg logit contributions | |
WAY | -0.104 |
PET | -0.096 |
ARE | -0.089 |
ggle | -0.088 |
VER | -0.087 |
Token | - |
Token ID | 12 |
Feature activation | +5.30e+00 |
Pos logit contributions | |
anonymity | +8.375 |
ividual | +7.858 |
-) | +7.700 |
important | +7.279 |
favorite | +6.952 |
Neg logit contributions | |
WAY | -14.665 |
PET | -13.569 |
ARE | -12.805 |
ggle | -12.471 |
VERT | -12.433 |
Token | profit |
Token ID | 9183 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
anonymity | +3.301 |
ividual | +3.251 |
favorite | +3.118 |
important | +3.086 |
-) | +2.936 |
Neg logit contributions | |
WAY | -5.061 |
PET | -4.563 |
ARE | -4.388 |
ggle | -4.354 |
respectively | -4.305 |
Token | , |
Token ID | 11 |
Feature activation | +3.85e+00 |
Pos logit contributions | |
anonymity | +2.280 |
ividual | +2.211 |
favorite | +2.050 |
important | +1.992 |
-) | +1.973 |
Neg logit contributions | |
WAY | -2.995 |
PET | -2.744 |
ARE | -2.563 |
VERT | -2.522 |
ggle | -2.512 |
Token | self |
Token ID | 2116 |
Feature activation | +2.63e+01 |
Pos logit contributions | |
anonymity | +3.509 |
ividual | +3.455 |
favorite | +3.238 |
important | +3.195 |
-) | +3.182 |
Neg logit contributions | |
WAY | -2.726 |
PET | -2.428 |
ARE | -2.191 |
ggle | -2.166 |
VERT | -2.161 |
Token | - |
Token ID | 12 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
anonymity | +13.827 |
-) | +13.563 |
important | +12.837 |
ividual | +12.327 |
pecially | +12.217 |
Neg logit contributions | |
WAY | -20.032 |
PET | -18.165 |
ggle | -16.706 |
TW | -16.514 |
vati | -16.397 |
Token | govern |
Token ID | 47866 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
important | +9.251 |
favorite | +8.850 |
anonymity | +8.655 |
-) | +8.591 |
ividual | +8.522 |
Neg logit contributions | |
WAY | -13.349 |
PET | -11.481 |
ARE | -11.103 |
Charges | -11.050 |
ggle | -11.018 |
Token | ed |
Token ID | 276 |
Feature activation | +9.06e+00 |
Pos logit contributions | |
ividual | +1.329 |
anonymity | +1.309 |
favorite | +1.235 |
important | +1.195 |
-) | +1.179 |
Neg logit contributions | |
WAY | -1.716 |
PET | -1.576 |
ARE | -1.470 |
ggle | -1.449 |
VER | -1.444 |
Token | organisation |
Token ID | 12684 |
Feature activation | +7.41e-01 |
Pos logit contributions | |
anonymity | +6.560 |
ividual | +6.045 |
favorite | +5.531 |
important | +5.446 |
-) | +5.441 |
Neg logit contributions | |
WAY | -7.727 |
PET | -7.141 |
VERT | -6.632 |
ARE | -6.519 |
VER | -6.510 |
Token | " |
Token ID | 366 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
anonymity | +0.584 |
ividual | +0.579 |
favorite | +0.543 |
important | +0.526 |
-) | +0.523 |
Neg logit contributions | |
WAY | -0.620 |
PET | -0.565 |
ARE | -0.521 |
ggle | -0.512 |
VER | -0.511 |
Token | f |
Token ID | 69 |
Feature activation | +6.08e+00 |
Pos logit contributions | |
ividual | +5.079 |
anonymity | +5.060 |
favorite | +5.023 |
important | +4.915 |
-) | +4.833 |
Neg logit contributions | |
WAY | -4.830 |
PET | -4.409 |
ggle | -4.076 |
ARE | -3.991 |
VERT | -3.918 |
Token | inn |
Token ID | 3732 |
Feature activation | +6.68e+00 |
Pos logit contributions | |
ividual | +3.852 |
anonymity | +3.734 |
favorite | +3.509 |
-) | +3.440 |
important | +3.394 |
Neg logit contributions | |
WAY | -5.876 |
PET | -5.435 |
ARE | -5.061 |
VERT | -5.017 |
VER | -4.994 |
Token | ish |
Token ID | 680 |
Feature activation | +9.71e+00 |
Pos logit contributions | |
ividual | +3.922 |
anonymity | +3.868 |
favorite | +3.646 |
-) | +3.601 |
important | +3.511 |
Neg logit contributions | |
WAY | -6.705 |
PET | -6.204 |
ARE | -5.821 |
VERT | -5.780 |
ggle | -5.747 |
Token | , |
Token ID | 11 |
Feature activation | +6.19e+00 |
Pos logit contributions | |
anonymity | +7.381 |
ividual | +7.167 |
-) | +6.996 |
favorite | +6.933 |
important | +6.819 |
Neg logit contributions | |
WAY | -7.588 |
PET | -6.884 |
ARE | -6.345 |
VERT | -6.324 |
VER | -6.263 |
Token | published |
Token ID | 3199 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
anonymity | +4.684 |
ividual | +4.652 |
favorite | +4.332 |
-) | +4.318 |
important | +4.277 |
Neg logit contributions | |
WAY | -5.164 |
PET | -4.714 |
ARE | -4.354 |
ggle | -4.352 |
VERT | -4.259 |
Token | Jun |
Token ID | 7653 |
Feature activation | +2.61e+01 |
Pos logit contributions | |
anonymity | +9.040 |
-) | +8.504 |
ividual | +8.484 |
favorite | +8.176 |
important | +7.847 |
Neg logit contributions | |
WAY | -12.225 |
PET | -11.372 |
ARE | -10.548 |
VERT | -10.389 |
AMY | -10.230 |
Token | - |
Token ID | 12 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
-) | +13.567 |
anonymity | +11.963 |
favorite | +11.475 |
)- | +10.885 |
ividual | +10.836 |
Neg logit contributions | |
WAY | -19.012 |
PET | -18.212 |
ggle | -16.883 |
Charges | -16.665 |
VERT | -16.374 |
Token | 11 |
Token ID | 1157 |
Feature activation | +1.87e+01 |
Pos logit contributions | |
favorite | +6.784 |
-) | +6.676 |
anonymity | +6.445 |
important | +6.436 |
ividual | +6.223 |
Neg logit contributions | |
WAY | -10.901 |
PET | -10.210 |
ggle | -9.783 |
POL | -9.433 |
strides | -9.425 |
Token | - |
Token ID | 12 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
-) | +9.604 |
anonymity | +9.171 |
ividual | +8.651 |
favorite | +8.112 |
important | +7.951 |
Neg logit contributions | |
WAY | -16.518 |
PET | -15.507 |
ggle | -14.689 |
ARE | -14.302 |
VERT | -14.220 |
Token | 2014 |
Token ID | 4967 |
Feature activation | +9.42e+00 |
Pos logit contributions | |
ividual | +1.975 |
anonymity | +1.969 |
favorite | +1.858 |
important | +1.822 |
-) | +1.814 |
Neg logit contributions | |
WAY | -2.294 |
PET | -2.101 |
ggle | -1.937 |
ARE | -1.922 |
VER | -1.902 |
Token | at |
Token ID | 379 |
Feature activation | +3.43e+00 |
Pos logit contributions | |
ividual | +4.999 |
anonymity | +4.998 |
-) | +4.862 |
favorite | +4.610 |
important | +4.544 |
Neg logit contributions | |
WAY | -9.339 |
PET | -8.722 |
ggle | -8.264 |
ARE | -8.147 |
VERT | -8.084 |
Token |
|
Token ID | 198 |
Feature activation | -7.40e+00 |
Pos logit contributions | |
WAY | +1.054 |
PET | +0.946 |
ARE | +0.851 |
VER | +0.837 |
TW | +0.830 |
Neg logit contributions | |
ividual | -1.530 |
anonymity | -1.483 |
favorite | -1.390 |
important | -1.354 |
interstitial | -1.353 |
Token | Q |
Token ID | 48 |
Feature activation | -5.15e+00 |
Pos logit contributions | |
WAY | +5.013 |
PET | +4.554 |
ARE | +4.108 |
VER | +4.006 |
TW | +3.978 |
Neg logit contributions | |
ividual | -7.152 |
anonymity | -6.899 |
favorite | -6.437 |
important | -6.273 |
-) | -6.203 |
Token | : |
Token ID | 25 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
WAY | +3.606 |
PET | +3.259 |
ARE | +2.945 |
TW | +2.915 |
VER | +2.913 |
Neg logit contributions | |
ividual | -4.967 |
anonymity | -4.743 |
interstitial | -4.328 |
favorite | -4.314 |
important | -4.233 |
Token | It |
Token ID | 632 |
Feature activation | +3.37e-01 |
Pos logit contributions | |
WAY | +8.452 |
PET | +7.484 |
ARE | +6.938 |
POL | +6.838 |
VER | +6.770 |
Neg logit contributions | |
ividual | -11.145 |
anonymity | -10.358 |
interstitial | -9.773 |
favorite | -9.738 |
umatic | -9.493 |
Token | would |
Token ID | 561 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
ividual | +0.264 |
anonymity | +0.261 |
favorite | +0.245 |
important | +0.239 |
-) | +0.237 |
Neg logit contributions | |
WAY | -0.284 |
PET | -0.260 |
ARE | -0.240 |
ggle | -0.235 |
VER | -0.234 |
Token | have |
Token ID | 423 |
Feature activation | +2.61e+01 |
Pos logit contributions | |
anonymity | +10.360 |
ividual | +10.024 |
-) | +9.709 |
favorite | +9.324 |
spoil | +9.321 |
Neg logit contributions | |
WAY | -14.847 |
PET | -13.398 |
ARE | -13.034 |
VERT | -12.502 |
Charges | -12.306 |
Token | created |
Token ID | 2727 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
anonymity | +14.264 |
-) | +13.605 |
ividual | +13.342 |
important | +13.228 |
spoil | +12.847 |
Neg logit contributions | |
WAY | -18.299 |
PET | -16.888 |
ARE | -15.768 |
Charges | -15.384 |
VERT | -15.313 |
Token | just |
Token ID | 655 |
Feature activation | +7.69e+00 |
Pos logit contributions | |
anonymity | +2.586 |
ividual | +2.518 |
favorite | +2.337 |
important | +2.302 |
-) | +2.284 |
Neg logit contributions | |
WAY | -2.548 |
PET | -2.359 |
ARE | -2.128 |
VERT | -2.098 |
ggle | -2.097 |
Token | too |
Token ID | 1165 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
anonymity | +5.966 |
ividual | +5.756 |
favorite | +5.248 |
-) | +5.202 |
important | +5.196 |
Neg logit contributions | |
WAY | -6.261 |
PET | -5.819 |
ARE | -5.372 |
ggle | -5.271 |
VERT | -5.243 |
Token | much |
Token ID | 881 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
anonymity | +1.322 |
ividual | +1.315 |
favorite | +1.234 |
important | +1.212 |
-) | +1.197 |
Neg logit contributions | |
WAY | -1.356 |
PET | -1.238 |
ARE | -1.134 |
ggle | -1.117 |
VERT | -1.105 |
Token | tension |
Token ID | 12097 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
anonymity | +1.946 |
ividual | +1.879 |
favorite | +1.753 |
important | +1.725 |
-) | +1.709 |
Neg logit contributions | |
WAY | -1.983 |
PET | -1.824 |
ARE | -1.670 |
VERT | -1.634 |
ggle | -1.632 |
Token | funny |
Token ID | 8258 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
anonymity | +4.576 |
ividual | +4.384 |
important | +4.197 |
favorite | +4.168 |
-) | +4.065 |
Neg logit contributions | |
WAY | -4.721 |
PET | -4.363 |
ARE | -4.053 |
ggle | -3.888 |
TW | -3.884 |
Token | . |
Token ID | 13 |
Feature activation | +4.74e+00 |
Pos logit contributions | |
WAY | +2.025 |
PET | +1.853 |
ARE | +1.704 |
ggle | +1.681 |
VER | +1.673 |
Neg logit contributions | |
ividual | -1.969 |
anonymity | -1.935 |
favorite | -1.833 |
important | -1.773 |
-) | -1.754 |
Token | But |
Token ID | 887 |
Feature activation | +6.91e+00 |
Pos logit contributions | |
anonymity | +3.634 |
ividual | +3.590 |
favorite | +3.495 |
important | +3.454 |
-) | +3.444 |
Neg logit contributions | |
WAY | -3.780 |
PET | -3.420 |
ARE | -3.189 |
ggle | -3.168 |
VERT | -3.116 |
Token | it |
Token ID | 340 |
Feature activation | +7.55e+00 |
Pos logit contributions | |
anonymity | +5.522 |
ividual | +5.296 |
important | +5.044 |
favorite | +5.007 |
-) | +4.980 |
Neg logit contributions | |
WAY | -5.480 |
PET | -4.973 |
ARE | -4.573 |
VERT | -4.474 |
TW | -4.470 |
Token | must |
Token ID | 1276 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
ividual | +5.077 |
anonymity | +5.030 |
favorite | +4.684 |
important | +4.667 |
-) | +4.652 |
Neg logit contributions | |
WAY | -6.920 |
PET | -6.249 |
ARE | -5.883 |
VERT | -5.762 |
TW | -5.672 |
Token | have |
Token ID | 423 |
Feature activation | +2.47e+01 |
Pos logit contributions | |
ividual | +7.805 |
anonymity | +7.798 |
-) | +7.363 |
favorite | +7.154 |
important | +6.978 |
Neg logit contributions | |
WAY | -11.731 |
PET | -10.332 |
ARE | -9.998 |
VERT | -9.727 |
JECT | -9.696 |
Token | been |
Token ID | 587 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
anonymity | +13.560 |
important | +12.595 |
ividual | +12.179 |
-) | +11.980 |
spoil | +11.670 |
Neg logit contributions | |
WAY | -18.687 |
PET | -16.496 |
ARE | -15.689 |
VERT | -15.427 |
TW | -15.281 |
Token | so |
Token ID | 523 |
Feature activation | +5.86e+00 |
Pos logit contributions | |
anonymity | +7.479 |
ividual | +6.948 |
important | +6.820 |
favorite | +6.714 |
-) | +6.535 |
Neg logit contributions | |
WAY | -8.060 |
PET | -7.394 |
ARE | -6.989 |
VERT | -6.616 |
Charges | -6.601 |
Token | weird |
Token ID | 7650 |
Feature activation | +6.79e+00 |
Pos logit contributions | |
anonymity | +4.285 |
ividual | +4.219 |
important | +4.036 |
favorite | +3.973 |
-) | +3.830 |
Neg logit contributions | |
WAY | -5.033 |
PET | -4.561 |
ARE | -4.246 |
TW | -4.113 |
VERT | -4.106 |
Token | on |
Token ID | 319 |
Feature activation | +4.03e+00 |
Pos logit contributions | |
anonymity | +4.852 |
ividual | +4.796 |
important | +4.495 |
favorite | +4.477 |
-) | +4.400 |
Neg logit contributions | |
WAY | -5.826 |
PET | -5.326 |
ARE | -4.980 |
TW | -4.869 |
VERT | -4.864 |
Token | the |
Token ID | 262 |
Feature activation | +8.04e+00 |
Pos logit contributions | |
anonymity | +3.364 |
ividual | +3.207 |
favorite | +3.074 |
important | +3.026 |
-) | +2.990 |
Neg logit contributions | |
WAY | -3.177 |
PET | -2.864 |
ARE | -2.665 |
VER | -2.590 |
ggle | -2.559 |
Token | most |
Token ID | 749 |
Feature activation | +5.82e-01 |
Pos logit contributions | |
ividual | +1.689 |
anonymity | +1.685 |
favorite | +1.567 |
important | +1.529 |
-) | +1.521 |
Neg logit contributions | |
WAY | -1.676 |
PET | -1.537 |
ARE | -1.410 |
ggle | -1.384 |
TW | -1.375 |
Token | cases |
Token ID | 2663 |
Feature activation | +5.41e+00 |
Pos logit contributions | |
ividual | +0.594 |
anonymity | +0.591 |
favorite | +0.561 |
important | +0.550 |
-) | +0.545 |
Neg logit contributions | |
WAY | -0.353 |
PET | -0.313 |
ARE | -0.276 |
ggle | -0.271 |
TW | -0.268 |
Token | the |
Token ID | 262 |
Feature activation | +9.44e-01 |
Pos logit contributions | |
anonymity | +4.153 |
ividual | +4.052 |
favorite | +3.708 |
important | +3.673 |
-) | +3.644 |
Neg logit contributions | |
WAY | -4.572 |
PET | -4.170 |
ggle | -3.838 |
ARE | -3.810 |
TW | -3.774 |
Token | disease |
Token ID | 4369 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
anonymity | +0.775 |
ividual | +0.774 |
favorite | +0.723 |
important | +0.702 |
-) | +0.695 |
Neg logit contributions | |
WAY | -0.759 |
PET | -0.693 |
ARE | -0.633 |
ggle | -0.628 |
TW | -0.618 |
Token | is |
Token ID | 318 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
ividual | +0.527 |
anonymity | +0.522 |
favorite | +0.489 |
important | +0.475 |
-) | +0.472 |
Neg logit contributions | |
WAY | -0.543 |
PET | -0.494 |
ARE | -0.454 |
ggle | -0.450 |
TW | -0.445 |
Token | self |
Token ID | 2116 |
Feature activation | +2.44e+01 |
Pos logit contributions | |
anonymity | +2.704 |
ividual | +2.684 |
favorite | +2.518 |
important | +2.444 |
-) | +2.440 |
Neg logit contributions | |
WAY | -2.971 |
PET | -2.718 |
ARE | -2.519 |
ggle | -2.465 |
TW | -2.453 |
Token | - |
Token ID | 12 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
-) | +13.075 |
anonymity | +12.686 |
important | +12.381 |
pecially | +12.172 |
ividual | +11.984 |
Neg logit contributions | |
WAY | -19.846 |
PET | -17.490 |
ggle | -16.651 |
TW | -16.527 |
VERT | -16.061 |
Token | lim |
Token ID | 2475 |
Feature activation | -9.46e-01 |
Pos logit contributions | |
important | +7.688 |
favorite | +7.460 |
ividual | +7.323 |
-) | +7.030 |
contained | +6.855 |
Neg logit contributions | |
WAY | -12.962 |
PET | -11.540 |
ARE | -11.133 |
ggle | -11.000 |
VERT | -10.775 |
Token | iting |
Token ID | 1780 |
Feature activation | +9.46e-01 |
Pos logit contributions | |
WAY | +1.165 |
PET | +1.105 |
ggle | +1.039 |
ARE | +1.037 |
VER | +1.030 |
Neg logit contributions | |
ividual | -0.371 |
anonymity | -0.362 |
favorite | -0.318 |
important | -0.293 |
-) | -0.288 |
Token | ," |
Token ID | 553 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
ividual | +0.761 |
anonymity | +0.751 |
favorite | +0.703 |
important | +0.689 |
-) | +0.678 |
Neg logit contributions | |
WAY | -0.777 |
PET | -0.710 |
ARE | -0.655 |
ggle | -0.644 |
TW | -0.641 |
Token | he |
Token ID | 339 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
ividual | +2.089 |
anonymity | +2.075 |
favorite | +1.969 |
important | +1.931 |
-) | +1.913 |
Neg logit contributions | |
WAY | -1.457 |
PET | -1.302 |
ARE | -1.181 |
ggle | -1.173 |
TW | -1.138 |
Token | Foundation |
Token ID | 5693 |
Feature activation | +2.65e+00 |
Pos logit contributions | |
WAY | +1.004 |
PET | +0.912 |
ARE | +0.835 |
ggle | +0.821 |
VER | +0.819 |
Neg logit contributions | |
ividual | -1.116 |
anonymity | -1.094 |
favorite | -1.037 |
important | -1.008 |
-) | -0.997 |
Token | : |
Token ID | 25 |
Feature activation | -6.80e+00 |
Pos logit contributions | |
anonymity | +2.026 |
ividual | +2.024 |
favorite | +1.896 |
important | +1.824 |
-) | +1.802 |
Neg logit contributions | |
WAY | -2.235 |
PET | -2.066 |
ARE | -1.900 |
ggle | -1.885 |
VERT | -1.869 |
Token | " |
Token ID | 366 |
Feature activation | -7.73e+00 |
Pos logit contributions | |
WAY | +4.202 |
PET | +3.719 |
ARE | +3.346 |
TW | +3.227 |
ggle | +3.207 |
Neg logit contributions | |
ividual | -6.668 |
anonymity | -6.545 |
favorite | -6.315 |
important | -6.146 |
-) | -6.096 |
Token | 9 |
Token ID | 24 |
Feature activation | +6.14e+00 |
Pos logit contributions | |
WAY | +5.397 |
PET | +4.916 |
ARE | +4.452 |
TW | +4.303 |
VER | +4.296 |
Neg logit contributions | |
ividual | -7.076 |
anonymity | -6.917 |
favorite | -6.469 |
-) | -6.304 |
important | -6.295 |
Token | - |
Token ID | 12 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
ividual | +3.640 |
anonymity | +3.607 |
favorite | +3.291 |
-) | +3.251 |
important | +3.181 |
Neg logit contributions | |
WAY | -5.971 |
PET | -5.745 |
ggle | -5.275 |
ARE | -5.260 |
VER | -5.241 |
Token | to |
Token ID | 1462 |
Feature activation | +2.42e+01 |
Pos logit contributions | |
ividual | +2.707 |
anonymity | +2.664 |
favorite | +2.558 |
important | +2.482 |
-) | +2.447 |
Neg logit contributions | |
WAY | -2.621 |
PET | -2.396 |
ARE | -2.210 |
ggle | -2.183 |
VER | -2.175 |
Token | - |
Token ID | 12 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
-) | +10.267 |
favorite | +9.212 |
-$ | +8.891 |
important | +8.715 |
anonymity | +8.075 |
Neg logit contributions | |
WAY | -21.116 |
��� | -19.674 |
PET | -19.541 |
eleph | -19.312 |
VERT | -19.040 |
Token | 5 |
Token ID | 20 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
favorite | +7.041 |
important | +6.708 |
-) | +6.598 |
anonymity | +6.508 |
ividual | +6.435 |
Neg logit contributions | |
WAY | -11.481 |
PET | -10.509 |
ggle | -10.181 |
POL | -10.143 |
VERT | -10.018 |
Token | Working |
Token ID | 14594 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
ividual | +6.543 |
anonymity | +6.281 |
favorite | +5.989 |
important | +5.779 |
-) | +5.741 |
Neg logit contributions | |
WAY | -8.780 |
PET | -8.266 |
VERT | -7.722 |
ARE | -7.636 |
ggle | -7.536 |
Token | Women |
Token ID | 6926 |
Feature activation | -2.80e+00 |
Pos logit contributions | |
WAY | +4.948 |
PET | +3.826 |
ARE | +3.723 |
TW | +3.568 |
respectively | +3.523 |
Neg logit contributions | |
ividual | -12.356 |
anonymity | -12.321 |
favorite | -11.804 |
interstitial | -11.721 |
important | -11.365 |
Token | Education |
Token ID | 7868 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
WAY | +2.210 |
PET | +2.008 |
ARE | +1.848 |
ggle | +1.819 |
VER | +1.804 |
Neg logit contributions | |
ividual | -2.336 |
anonymity | -2.306 |
favorite | -2.183 |
important | -2.112 |
-) | -2.094 |
Token | people |
Token ID | 661 |
Feature activation | +4.61e+00 |
Pos logit contributions | |
ividual | +2.080 |
anonymity | +2.067 |
favorite | +1.924 |
important | +1.896 |
-) | +1.856 |
Neg logit contributions | |
WAY | -1.986 |
PET | -1.797 |
ARE | -1.640 |
ggle | -1.631 |
TW | -1.612 |
Token | and |
Token ID | 290 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ividual | +3.416 |
anonymity | +3.357 |
favorite | +3.088 |
important | +3.071 |
-) | +2.978 |
Neg logit contributions | |
WAY | -4.021 |
PET | -3.712 |
ARE | -3.406 |
TW | -3.386 |
VERT | -3.376 |
Token | not |
Token ID | 407 |
Feature activation | +5.84e+00 |
Pos logit contributions | |
ividual | +1.098 |
anonymity | +1.096 |
favorite | +1.016 |
important | +0.996 |
-) | +0.979 |
Neg logit contributions | |
WAY | -1.159 |
PET | -1.053 |
ARE | -0.967 |
ggle | -0.957 |
TW | -0.952 |
Token | just |
Token ID | 655 |
Feature activation | +7.22e+00 |
Pos logit contributions | |
ividual | +4.613 |
anonymity | +4.556 |
important | +4.147 |
favorite | +4.138 |
-) | +4.098 |
Neg logit contributions | |
WAY | -4.799 |
PET | -4.354 |
ARE | -3.967 |
TW | -3.954 |
VER | -3.907 |
Token | their |
Token ID | 511 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
ividual | +5.707 |
anonymity | +5.626 |
important | +5.213 |
favorite | +5.108 |
-) | +5.056 |
Neg logit contributions | |
WAY | -5.838 |
PET | -5.225 |
ARE | -4.778 |
TW | -4.771 |
VERT | -4.723 |
Token | self |
Token ID | 2116 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
ividual | +8.591 |
anonymity | +8.490 |
important | +7.845 |
favorite | +7.770 |
-) | +7.447 |
Neg logit contributions | |
WAY | -7.598 |
PET | -6.793 |
TW | -6.182 |
VERT | -6.123 |
VER | -6.116 |
Token | - |
Token ID | 12 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
ividual | +13.914 |
important | +13.635 |
anonymity | +13.412 |
-) | +13.149 |
favorite | +12.358 |
Neg logit contributions | |
WAY | -18.272 |
PET | -16.460 |
TW | -15.346 |
ggle | -15.144 |
VERT | -14.955 |
Token | interest |
Token ID | 9446 |
Feature activation | +8.33e+00 |
Pos logit contributions | |
important | +8.944 |
ividual | +8.280 |
favorite | +8.274 |
involved | +7.311 |
-) | +7.161 |
Neg logit contributions | |
WAY | -16.860 |
PET | -14.899 |
VERT | -14.205 |
ggle | -14.161 |
TW | -14.085 |
Token | . |
Token ID | 13 |
Feature activation | +4.47e+00 |
Pos logit contributions | |
ividual | +5.379 |
anonymity | +5.243 |
favorite | +4.762 |
important | +4.709 |
-) | +4.590 |
Neg logit contributions | |
WAY | -7.866 |
PET | -7.184 |
ARE | -6.710 |
TW | -6.678 |
VERT | -6.609 |
Token |
|
Token ID | 198 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
anonymity | +3.465 |
ividual | +3.439 |
favorite | +3.321 |
important | +3.264 |
-) | +3.262 |
Neg logit contributions | |
WAY | -3.570 |
PET | -3.273 |
ggle | -3.017 |
ARE | -2.964 |
VERT | -2.962 |
Token |
|
Token ID | 198 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ividual | +1.388 |
anonymity | +1.372 |
favorite | +1.309 |
important | +1.273 |
-) | +1.261 |
Neg logit contributions | |
WAY | -1.145 |
PET | -1.035 |
ARE | -0.941 |
ggle | -0.927 |
VER | -0.919 |
Token | of |
Token ID | 286 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
anonymity | +7.777 |
ividual | +7.768 |
-) | +7.458 |
favorite | +7.308 |
important | +7.180 |
Neg logit contributions | |
WAY | -10.330 |
PET | -9.466 |
ARE | -9.099 |
VERT | -8.890 |
ggle | -8.811 |
Token | Catalonia |
Token ID | 33859 |
Feature activation | +4.19e+00 |
Pos logit contributions | |
anonymity | +7.814 |
ividual | +7.682 |
important | +7.121 |
-) | +6.976 |
favorite | +6.929 |
Neg logit contributions | |
WAY | -9.357 |
PET | -8.557 |
ggle | -7.795 |
ARE | -7.738 |
VERT | -7.728 |
Token | � |
Token ID | 447 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
ividual | +3.073 |
anonymity | +3.035 |
favorite | +2.807 |
-) | +2.802 |
important | +2.777 |
Neg logit contributions | |
WAY | -3.672 |
PET | -3.367 |
ARE | -3.115 |
ggle | -3.098 |
VERT | -3.065 |
Token | � |
Token ID | 247 |
Feature activation | +7.69e+00 |
Pos logit contributions | |
ividual | +2.319 |
anonymity | +2.308 |
favorite | +2.221 |
-) | +2.182 |
important | +2.171 |
Neg logit contributions | |
WAY | -1.519 |
PET | -1.364 |
ARE | -1.220 |
ggle | -1.182 |
VERT | -1.172 |
Token | s |
Token ID | 82 |
Feature activation | +9.39e+00 |
Pos logit contributions | |
ividual | +5.255 |
anonymity | +5.078 |
favorite | +4.886 |
-) | +4.864 |
important | +4.805 |
Neg logit contributions | |
WAY | -6.798 |
PET | -6.288 |
ggle | -5.857 |
ARE | -5.807 |
VERT | -5.764 |
Token | self |
Token ID | 2116 |
Feature activation | +2.40e+01 |
Pos logit contributions | |
anonymity | +7.806 |
ividual | +7.651 |
important | +7.229 |
-) | +7.191 |
favorite | +7.156 |
Neg logit contributions | |
WAY | -6.833 |
PET | -6.189 |
VERT | -5.631 |
ggle | -5.627 |
ISON | -5.506 |
Token | - |
Token ID | 12 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
-) | +14.524 |
important | +13.431 |
ividual | +13.417 |
anonymity | +13.075 |
favorite | +11.952 |
Neg logit contributions | |
WAY | -18.158 |
PET | -16.588 |
ggle | -15.233 |
Charges | -15.072 |
VERT | -14.944 |
Token | rule |
Token ID | 25135 |
Feature activation | +4.61e+00 |
Pos logit contributions | |
important | +8.927 |
ividual | +8.521 |
favorite | +8.335 |
anonymity | +8.271 |
-) | +8.191 |
Neg logit contributions | |
WAY | -12.151 |
PET | -10.695 |
VERT | -10.220 |
Charges | -10.206 |
ggle | -10.119 |
Token | institutions |
Token ID | 6712 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
ividual | +3.175 |
anonymity | +3.146 |
favorite | +2.939 |
-) | +2.916 |
important | +2.894 |
Neg logit contributions | |
WAY | -4.175 |
PET | -3.870 |
ARE | -3.583 |
VERT | -3.563 |
ggle | -3.530 |
Token | ). |
Token ID | 737 |
Feature activation | +7.18e+00 |
Pos logit contributions | |
ividual | +7.329 |
anonymity | +7.052 |
-) | +6.955 |
favorite | +6.674 |
important | +6.632 |
Neg logit contributions | |
WAY | -9.741 |
PET | -9.042 |
VERT | -8.476 |
ggle | -8.401 |
ARE | -8.302 |
Token |
|
Token ID | 198 |
Feature activation | +3.71e+00 |
Pos logit contributions | |
anonymity | +5.186 |
ividual | +5.151 |
favorite | +5.057 |
-) | +5.031 |
important | +4.980 |
Neg logit contributions | |
WAY | -5.776 |
PET | -5.280 |
ggle | -4.983 |
ARE | -4.876 |
VERT | -4.786 |
Token | to |
Token ID | 284 |
Feature activation | -7.51e-02 |
Pos logit contributions | |
ividual | +2.813 |
anonymity | +2.805 |
favorite | +2.586 |
important | +2.530 |
-) | +2.473 |
Neg logit contributions | |
WAY | -3.331 |
PET | -3.081 |
ARE | -2.871 |
TW | -2.793 |
VERT | -2.789 |
Token | have |
Token ID | 423 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
WAY | +0.062 |
PET | +0.057 |
ARE | +0.053 |
VER | +0.052 |
VERT | +0.051 |
Neg logit contributions | |
ividual | -0.060 |
anonymity | -0.059 |
favorite | -0.056 |
important | -0.054 |
-) | -0.054 |
Token | a |
Token ID | 257 |
Feature activation | -2.39e+00 |
Pos logit contributions | |
anonymity | +1.514 |
ividual | +1.509 |
favorite | +1.419 |
important | +1.392 |
-) | +1.373 |
Neg logit contributions | |
WAY | -1.215 |
PET | -1.103 |
ARE | -0.996 |
ggle | -0.974 |
VER | -0.970 |
Token | none |
Token ID | 4844 |
Feature activation | +2.92e+00 |
Pos logit contributions | |
WAY | +1.907 |
PET | +1.741 |
ARE | +1.596 |
ggle | +1.575 |
VER | +1.565 |
Neg logit contributions | |
ividual | -1.973 |
anonymity | -1.939 |
favorite | -1.839 |
important | -1.784 |
-) | -1.765 |
Token | - |
Token ID | 12 |
Feature activation | -4.42e+00 |
Pos logit contributions | |
ividual | +2.185 |
anonymity | +2.162 |
favorite | +2.075 |
important | +2.010 |
-) | +1.946 |
Neg logit contributions | |
WAY | -2.515 |
PET | -2.297 |
ARE | -2.148 |
VERT | -2.071 |
TW | -2.070 |
Token | too |
Token ID | 18820 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
WAY | +3.558 |
PET | +3.264 |
ARE | +2.984 |
VER | +2.935 |
TW | +2.915 |
Neg logit contributions | |
ividual | -3.665 |
anonymity | -3.590 |
favorite | -3.338 |
-) | -3.253 |
important | -3.229 |
Token | - |
Token ID | 12 |
Feature activation | -4.57e-01 |
Pos logit contributions | |
-) | +13.499 |
anonymity | +13.446 |
favorite | +12.997 |
important | +12.851 |
ividual | +12.044 |
Neg logit contributions | |
WAY | -17.493 |
PET | -15.685 |
ggle | -14.855 |
ARE | -14.722 |
Fuck | -14.574 |
Token | sub |
Token ID | 7266 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
WAY | +0.400 |
PET | +0.367 |
ARE | +0.340 |
ggle | +0.337 |
VER | +0.332 |
Neg logit contributions | |
ividual | -0.340 |
anonymity | -0.336 |
favorite | -0.323 |
important | -0.312 |
-) | -0.306 |
Token | tle |
Token ID | 7100 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
ividual | +8.191 |
anonymity | +8.188 |
-) | +8.095 |
favorite | +8.073 |
important | +7.980 |
Neg logit contributions | |
WAY | -10.504 |
PET | -9.587 |
ARE | -9.482 |
Charges | -9.257 |
ggle | -9.158 |
Token | dig |
Token ID | 3100 |
Feature activation | -9.86e-01 |
Pos logit contributions | |
ividual | +1.513 |
anonymity | +1.511 |
favorite | +1.423 |
important | +1.380 |
-) | +1.367 |
Neg logit contributions | |
WAY | -1.491 |
PET | -1.368 |
ARE | -1.252 |
VER | -1.232 |
ggle | -1.228 |
Token | at |
Token ID | 379 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
WAY | +0.801 |
PET | +0.733 |
ARE | +0.675 |
ggle | +0.661 |
VER | +0.659 |
Neg logit contributions | |
ividual | -0.804 |
anonymity | -0.791 |
favorite | -0.749 |
important | -0.727 |
-) | -0.719 |
Token | , |
Token ID | 11 |
Feature activation | -2.93e+00 |
Pos logit contributions | |
WAY | +3.503 |
PET | +3.196 |
ARE | +2.923 |
VER | +2.890 |
ggle | +2.890 |
Neg logit contributions | |
ividual | -3.880 |
anonymity | -3.794 |
favorite | -3.639 |
important | -3.497 |
-) | -3.494 |
Token | composed |
Token ID | 13160 |
Feature activation | -4.80e+00 |
Pos logit contributions | |
WAY | +2.332 |
PET | +2.130 |
ARE | +1.949 |
ggle | +1.922 |
VER | +1.919 |
Neg logit contributions | |
ividual | -2.428 |
anonymity | -2.379 |
favorite | -2.269 |
important | -2.191 |
-) | -2.170 |
Token | of |
Token ID | 286 |
Feature activation | -2.83e+00 |
Pos logit contributions | |
WAY | +3.700 |
PET | +3.370 |
ARE | +3.072 |
ggle | +3.063 |
VER | +3.050 |
Neg logit contributions | |
ividual | -4.052 |
anonymity | -3.939 |
favorite | -3.784 |
important | -3.661 |
-) | -3.624 |
Token | what |
Token ID | 644 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
WAY | +2.266 |
PET | +2.068 |
ARE | +1.899 |
ggle | +1.870 |
VER | +1.862 |
Neg logit contributions | |
ividual | -2.332 |
anonymity | -2.289 |
favorite | -2.176 |
important | -2.109 |
-) | -2.088 |
Token | must |
Token ID | 1276 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
ividual | +0.213 |
anonymity | +0.211 |
favorite | +0.196 |
important | +0.191 |
-) | +0.189 |
Neg logit contributions | |
WAY | -0.268 |
PET | -0.247 |
ARE | -0.229 |
ggle | -0.226 |
TW | -0.224 |
Token | have |
Token ID | 423 |
Feature activation | +2.36e+01 |
Pos logit contributions | |
ividual | +8.646 |
anonymity | +8.622 |
-) | +7.973 |
favorite | +7.736 |
important | +7.480 |
Neg logit contributions | |
WAY | -12.033 |
PET | -10.641 |
ARE | -10.186 |
VERT | -10.127 |
JECT | -10.048 |
Token | amounted |
Token ID | 30008 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
anonymity | +12.009 |
ividual | +11.659 |
favorite | +10.600 |
important | +10.575 |
pecially | +10.356 |
Neg logit contributions | |
WAY | -18.466 |
PET | -17.051 |
ARE | -15.768 |
JECT | -15.601 |
FY | -15.550 |
Token | to |
Token ID | 284 |
Feature activation | +4.28e+00 |
Pos logit contributions | |
anonymity | +2.612 |
ividual | +2.590 |
favorite | +2.411 |
important | +2.357 |
-) | +2.329 |
Neg logit contributions | |
WAY | -3.103 |
PET | -2.856 |
ARE | -2.639 |
ggle | -2.586 |
VER | -2.567 |
Token | literally |
Token ID | 7360 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
anonymity | +3.468 |
ividual | +3.369 |
favorite | +3.190 |
important | +3.120 |
-) | +3.062 |
Neg logit contributions | |
WAY | -3.433 |
PET | -3.130 |
ARE | -2.880 |
ggle | -2.803 |
VERT | -2.773 |
Token | hundreds |
Token ID | 5179 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
anonymity | +7.730 |
ividual | +7.236 |
favorite | +6.796 |
important | +6.757 |
-) | +6.546 |
Neg logit contributions | |
WAY | -8.265 |
PET | -7.511 |
ARE | -7.091 |
ggle | -6.784 |
VERT | -6.669 |
Token | of |
Token ID | 286 |
Feature activation | -4.26e+00 |
Pos logit contributions | |
ividual | +1.128 |
anonymity | +1.111 |
favorite | +1.045 |
important | +1.008 |
-) | +1.001 |
Neg logit contributions | |
WAY | -1.229 |
PET | -1.127 |
ARE | -1.040 |
ggle | -1.019 |
VER | -1.014 |
Token | the |
Token ID | 262 |
Feature activation | -2.10e-02 |
Pos logit contributions | |
WAY | +0.750 |
PET | +0.684 |
ARE | +0.623 |
ggle | +0.618 |
TW | +0.609 |
Neg logit contributions | |
ividual | -0.842 |
anonymity | -0.834 |
favorite | -0.789 |
important | -0.774 |
-) | -0.760 |
Token | subtle |
Token ID | 11800 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
WAY | +0.017 |
PET | +0.016 |
ARE | +0.014 |
ggle | +0.014 |
VER | +0.014 |
Neg logit contributions | |
ividual | -0.017 |
anonymity | -0.017 |
favorite | -0.016 |
important | -0.016 |
-) | -0.015 |
Token | and |
Token ID | 290 |
Feature activation | +4.97e+00 |
Pos logit contributions | |
anonymity | +1.172 |
ividual | +1.171 |
favorite | +1.085 |
important | +1.064 |
-) | +1.032 |
Neg logit contributions | |
WAY | -1.388 |
PET | -1.288 |
ARE | -1.191 |
ggle | -1.176 |
VER | -1.167 |
Token | not |
Token ID | 407 |
Feature activation | +9.48e+00 |
Pos logit contributions | |
anonymity | +3.986 |
ividual | +3.945 |
favorite | +3.684 |
important | +3.682 |
-) | +3.549 |
Neg logit contributions | |
WAY | -3.986 |
PET | -3.629 |
ARE | -3.365 |
TW | -3.276 |
VERT | -3.246 |
Token | - |
Token ID | 12 |
Feature activation | +3.05e+00 |
Pos logit contributions | |
anonymity | +7.580 |
ividual | +7.470 |
important | +7.310 |
favorite | +7.146 |
-) | +7.092 |
Neg logit contributions | |
WAY | -7.156 |
PET | -6.334 |
ARE | -5.866 |
TW | -5.707 |
VER | -5.649 |
Token | so |
Token ID | 568 |
Feature activation | +2.35e+01 |
Pos logit contributions | |
anonymity | +2.479 |
ividual | +2.478 |
favorite | +2.424 |
important | +2.392 |
-) | +2.291 |
Neg logit contributions | |
WAY | -2.394 |
PET | -2.156 |
ARE | -1.985 |
ggle | -1.968 |
POL | -1.930 |
Token | - |
Token ID | 12 |
Feature activation | +5.18e+00 |
Pos logit contributions | |
-) | +12.348 |
important | +12.206 |
anonymity | +11.615 |
favorite | +11.500 |
ividual | +10.942 |
Neg logit contributions | |
WAY | -18.196 |
PET | -16.836 |
ARE | -16.012 |
ISON | -15.442 |
POL | -15.298 |
Token | sub |
Token ID | 7266 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
important | +3.587 |
anonymity | +3.557 |
ividual | +3.552 |
favorite | +3.544 |
-) | +3.292 |
Neg logit contributions | |
WAY | -4.572 |
PET | -4.172 |
ARE | -3.912 |
ggle | -3.852 |
POL | -3.831 |
Token | tle |
Token ID | 7100 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
-) | +8.626 |
ividual | +8.595 |
important | +8.404 |
anonymity | +8.216 |
favorite | +8.034 |
Neg logit contributions | |
WAY | -11.852 |
PET | -10.866 |
ARE | -10.687 |
Charges | -10.373 |
USH | -10.177 |
Token | emotions |
Token ID | 10825 |
Feature activation | +4.65e-01 |
Pos logit contributions | |
anonymity | +1.247 |
ividual | +1.241 |
favorite | +1.161 |
important | +1.149 |
-) | +1.116 |
Neg logit contributions | |
WAY | -1.230 |
PET | -1.139 |
ARE | -1.035 |
ggle | -1.028 |
VER | -1.014 |
Token | Robert |
Token ID | 5199 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
ividual | +0.377 |
anonymity | +0.375 |
favorite | +0.352 |
important | +0.344 |
-) | +0.338 |
Neg logit contributions | |
WAY | -0.379 |
PET | -0.348 |
ARE | -0.318 |
ggle | -0.315 |
VERT | -0.310 |
Token | complaints |
Token ID | 9687 |
Feature activation | +6.81e+00 |
Pos logit contributions | |
WAY | +0.429 |
PET | +0.376 |
ARE | +0.332 |
ggle | +0.325 |
VER | +0.321 |
Neg logit contributions | |
ividual | -0.762 |
anonymity | -0.756 |
favorite | -0.722 |
important | -0.706 |
-) | -0.700 |
Token | under |
Token ID | 739 |
Feature activation | -5.95e+00 |
Pos logit contributions | |
anonymity | +5.172 |
ividual | +5.164 |
favorite | +4.682 |
important | +4.650 |
-) | +4.585 |
Neg logit contributions | |
WAY | -5.672 |
PET | -5.167 |
ARE | -4.820 |
VERT | -4.805 |
ggle | -4.778 |
Token | these |
Token ID | 777 |
Feature activation | -2.59e+00 |
Pos logit contributions | |
WAY | +4.383 |
PET | +3.939 |
ARE | +3.611 |
VER | +3.529 |
VERT | +3.489 |
Neg logit contributions | |
ividual | -5.260 |
anonymity | -5.095 |
favorite | -4.896 |
important | -4.758 |
-) | -4.714 |
Token | � |
Token ID | 564 |
Feature activation | +9.78e-01 |
Pos logit contributions | |
WAY | +1.905 |
PET | +1.723 |
ARE | +1.569 |
ggle | +1.538 |
VER | +1.533 |
Neg logit contributions | |
ividual | -2.304 |
anonymity | -2.268 |
favorite | -2.161 |
important | -2.100 |
-) | -2.080 |
Token | � |
Token ID | 250 |
Feature activation | +5.25e+00 |
Pos logit contributions | |
ividual | +1.051 |
anonymity | +1.042 |
favorite | +1.005 |
important | +0.983 |
-) | +0.974 |
Neg logit contributions | |
WAY | -0.534 |
PET | -0.464 |
ARE | -0.407 |
ggle | -0.397 |
VER | -0.393 |
Token | self |
Token ID | 944 |
Feature activation | +2.34e+01 |
Pos logit contributions | |
anonymity | +3.755 |
favorite | +3.725 |
important | +3.692 |
ividual | +3.691 |
-) | +3.461 |
Neg logit contributions | |
WAY | -4.452 |
PET | -4.061 |
ggle | -3.833 |
ARE | -3.723 |
VERT | -3.694 |
Token | - |
Token ID | 12 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
anonymity | +14.772 |
-) | +14.600 |
ividual | +14.314 |
important | +14.308 |
pecially | +14.105 |
Neg logit contributions | |
WAY | -16.550 |
PET | -14.303 |
VERT | -13.696 |
TW | -13.652 |
ggle | -13.116 |
Token | imposed |
Token ID | 36457 |
Feature activation | +6.75e+00 |
Pos logit contributions | |
favorite | +8.670 |
important | +8.669 |
anonymity | +8.302 |
ividual | +8.032 |
-) | +8.018 |
Neg logit contributions | |
WAY | -11.218 |
PET | -9.692 |
VERT | -9.547 |
ARE | -9.544 |
ggle | -9.442 |
Token | , |
Token ID | 11 |
Feature activation | +5.85e+00 |
Pos logit contributions | |
anonymity | +5.548 |
ividual | +5.311 |
favorite | +5.019 |
-) | +4.892 |
important | +4.826 |
Neg logit contributions | |
WAY | -5.292 |
PET | -4.783 |
ggle | -4.427 |
ARE | -4.395 |
VERT | -4.296 |
Token | inf |
Token ID | 1167 |
Feature activation | +7.44e+00 |
Pos logit contributions | |
anonymity | +4.969 |
ividual | +4.868 |
favorite | +4.614 |
-) | +4.504 |
important | +4.502 |
Neg logit contributions | |
WAY | -4.425 |
PET | -3.944 |
ARE | -3.607 |
ggle | -3.599 |
TW | -3.497 |
Token | lex |
Token ID | 2588 |
Feature activation | +4.83e+00 |
Pos logit contributions | |
ividual | +4.468 |
anonymity | +4.324 |
favorite | +4.213 |
important | +4.133 |
-) | +4.055 |
Neg logit contributions | |
WAY | -7.432 |
PET | -6.610 |
ggle | -6.403 |
ARE | -6.342 |
VER | -6.211 |
Token | their |
Token ID | 511 |
Feature activation | -3.16e-01 |
Pos logit contributions | |
anonymity | +2.329 |
ividual | +2.307 |
favorite | +2.139 |
important | +2.112 |
-) | +2.073 |
Neg logit contributions | |
WAY | -2.477 |
PET | -2.287 |
ARE | -2.081 |
ggle | -2.062 |
VERT | -2.051 |
Token | ambitions |
Token ID | 22455 |
Feature activation | +2.94e+00 |
Pos logit contributions | |
WAY | +0.243 |
PET | +0.222 |
ARE | +0.202 |
ggle | +0.199 |
VER | +0.199 |
Neg logit contributions | |
ividual | -0.269 |
anonymity | -0.269 |
favorite | -0.254 |
important | -0.246 |
-) | -0.243 |
Token | were |
Token ID | 547 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
ividual | +2.432 |
anonymity | +2.411 |
favorite | +2.238 |
important | +2.221 |
-) | +2.192 |
Neg logit contributions | |
WAY | -2.334 |
PET | -2.135 |
ARE | -1.934 |
VERT | -1.909 |
VER | -1.907 |
Token | not |
Token ID | 407 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
WAY | +3.534 |
PET | +3.206 |
ARE | +2.937 |
ggle | +2.921 |
VER | +2.902 |
Neg logit contributions | |
ividual | -3.801 |
anonymity | -3.674 |
favorite | -3.543 |
important | -3.399 |
-) | -3.364 |
Token | always |
Token ID | 1464 |
Feature activation | -8.99e+00 |
Pos logit contributions | |
WAY | +3.545 |
PET | +3.237 |
ARE | +2.970 |
ggle | +2.949 |
VER | +2.927 |
Neg logit contributions | |
ividual | -3.772 |
anonymity | -3.639 |
favorite | -3.508 |
important | -3.370 |
-) | -3.334 |
Token | self |
Token ID | 2116 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
WAY | +6.785 |
PET | +6.213 |
ggle | +5.747 |
respectively | +5.746 |
ARE | +5.730 |
Neg logit contributions | |
ividual | -7.418 |
anonymity | -6.904 |
favorite | -6.795 |
interstitial | -6.555 |
important | -6.490 |
Token | less |
Token ID | 1203 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
important | +12.327 |
-) | +11.980 |
anonymity | +11.662 |
ividual | +11.537 |
favorite | +11.006 |
Neg logit contributions | |
WAY | -18.778 |
PET | -16.895 |
TW | -16.155 |
Ton | -15.597 |
VERT | -15.460 |
Token | ".[ |
Token ID | 42924 |
Feature activation | +9.50e-01 |
Pos logit contributions | |
WAY | +1.445 |
PET | +1.305 |
ARE | +1.188 |
ggle | +1.164 |
VER | +1.160 |
Neg logit contributions | |
ividual | -1.754 |
anonymity | -1.732 |
favorite | -1.645 |
important | -1.603 |
-) | -1.585 |
Token | 39 |
Token ID | 2670 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
ividual | +0.755 |
anonymity | +0.746 |
favorite | +0.713 |
important | +0.701 |
-) | +0.687 |
Neg logit contributions | |
WAY | -0.776 |
PET | -0.706 |
ARE | -0.657 |
ggle | -0.654 |
VER | -0.645 |
Token | ] |
Token ID | 60 |
Feature activation | -2.80e+00 |
Pos logit contributions | |
WAY | +1.991 |
PET | +1.848 |
ARE | +1.689 |
TW | +1.683 |
VER | +1.675 |
Neg logit contributions | |
ividual | -1.706 |
anonymity | -1.648 |
favorite | -1.518 |
interstitial | -1.459 |
important | -1.455 |
Token |
|
Token ID | 198 |
Feature activation | +5.12e-01 |
Pos logit contributions | |
WAY | +2.055 |
PET | +1.856 |
ARE | +1.687 |
VER | +1.649 |
ggle | +1.649 |
Neg logit contributions | |
ividual | -2.517 |
anonymity | -2.475 |
favorite | -2.350 |
important | -2.281 |
-) | -2.254 |
Token | , |
Token ID | 11 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
ividual | +2.752 |
anonymity | +2.733 |
favorite | +2.518 |
important | +2.474 |
-) | +2.451 |
Neg logit contributions | |
WAY | -3.084 |
PET | -2.774 |
ARE | -2.620 |
ggle | -2.605 |
VERT | -2.553 |
Token | the |
Token ID | 262 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
ividual | +1.133 |
anonymity | +1.126 |
favorite | +1.048 |
important | +1.030 |
-) | +1.013 |
Neg logit contributions | |
WAY | -1.136 |
PET | -1.029 |
ARE | -0.956 |
ggle | -0.944 |
VER | -0.928 |
Token | Commonwealth |
Token ID | 17165 |
Feature activation | -9.23e+00 |
Pos logit contributions | |
ividual | +0.186 |
anonymity | +0.184 |
favorite | +0.173 |
important | +0.168 |
-) | +0.166 |
Neg logit contributions | |
WAY | -0.195 |
PET | -0.178 |
ARE | -0.164 |
ggle | -0.162 |
VER | -0.161 |
Token | Parliament |
Token ID | 8411 |
Feature activation | -6.84e+00 |
Pos logit contributions | |
WAY | +6.371 |
PET | +5.837 |
respectively | +5.289 |
VER | +5.214 |
ARE | +5.194 |
Neg logit contributions | |
ividual | -8.102 |
anonymity | -7.849 |
favorite | -7.655 |
important | -7.314 |
-) | -7.230 |
Token | abolished |
Token ID | 32424 |
Feature activation | +4.40e+00 |
Pos logit contributions | |
WAY | +5.353 |
PET | +4.879 |
respectively | +4.507 |
ARE | +4.456 |
VER | +4.439 |
Neg logit contributions | |
ividual | -5.570 |
anonymity | -5.427 |
favorite | -5.214 |
important | -5.004 |
-) | -4.941 |
Token | self |
Token ID | 2116 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
anonymity | +3.509 |
ividual | +3.435 |
favorite | +3.204 |
important | +3.145 |
-) | +3.097 |
Neg logit contributions | |
WAY | -3.641 |
PET | -3.319 |
ARE | -3.045 |
ggle | -3.004 |
TW | -2.985 |
Token | - |
Token ID | 12 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
anonymity | +13.961 |
ividual | +13.913 |
-) | +13.480 |
important | +13.440 |
favorite | +12.527 |
Neg logit contributions | |
WAY | -17.055 |
PET | -15.272 |
ggle | -14.040 |
VERT | -14.007 |
TW | -13.872 |
Token | government |
Token ID | 14480 |
Feature activation | +4.65e+00 |
Pos logit contributions | |
important | +8.857 |
favorite | +8.552 |
anonymity | +8.544 |
ividual | +8.434 |
-) | +7.879 |
Neg logit contributions | |
WAY | -12.609 |
PET | -10.903 |
ggle | -10.802 |
VERT | -10.604 |
ARE | -10.493 |
Token | , |
Token ID | 11 |
Feature activation | +4.45e+00 |
Pos logit contributions | |
anonymity | +3.546 |
ividual | +3.425 |
favorite | +3.210 |
important | +3.184 |
-) | +3.090 |
Neg logit contributions | |
WAY | -3.998 |
PET | -3.624 |
ARE | -3.361 |
VERT | -3.359 |
ggle | -3.317 |
Token | integrating |
Token ID | 32029 |
Feature activation | +3.96e+00 |
Pos logit contributions | |
anonymity | +3.418 |
ividual | +3.382 |
favorite | +3.095 |
important | +3.064 |
-) | +3.032 |
Neg logit contributions | |
WAY | -3.796 |
PET | -3.442 |
ARE | -3.192 |
ggle | -3.177 |
VERT | -3.152 |
Token | Norfolk |
Token ID | 32134 |
Feature activation | +3.92e+00 |
Pos logit contributions | |
anonymity | +3.125 |
ividual | +3.101 |
favorite | +2.875 |
important | +2.855 |
-) | +2.781 |
Neg logit contributions | |
WAY | -3.290 |
PET | -2.989 |
ARE | -2.752 |
ggle | -2.718 |
VERT | -2.697 |
Token | extra |
Token ID | 3131 |
Feature activation | +4.90e+00 |
Pos logit contributions | |
WAY | +3.740 |
PET | +3.390 |
ARE | +3.112 |
ggle | +3.095 |
VER | +3.089 |
Neg logit contributions | |
ividual | -3.895 |
anonymity | -3.733 |
favorite | -3.622 |
important | -3.467 |
-) | -3.456 |
Token | pressure |
Token ID | 3833 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
anonymity | +3.844 |
ividual | +3.728 |
important | +3.591 |
favorite | +3.495 |
-) | +3.419 |
Neg logit contributions | |
WAY | -3.999 |
PET | -3.711 |
ARE | -3.404 |
ggle | -3.334 |
TW | -3.323 |
Token | . |
Token ID | 13 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
ividual | +0.825 |
anonymity | +0.815 |
favorite | +0.766 |
important | +0.749 |
-) | +0.735 |
Neg logit contributions | |
WAY | -0.928 |
PET | -0.852 |
ARE | -0.791 |
ggle | -0.777 |
TW | -0.770 |
Token | It |
Token ID | 632 |
Feature activation | +7.67e+00 |
Pos logit contributions | |
anonymity | +2.492 |
ividual | +2.486 |
favorite | +2.394 |
important | +2.340 |
-) | +2.339 |
Neg logit contributions | |
WAY | -2.480 |
PET | -2.259 |
ggle | -2.089 |
ARE | -2.073 |
VERT | -2.027 |
Token | would |
Token ID | 561 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
ividual | +4.997 |
anonymity | +4.797 |
favorite | +4.489 |
important | +4.486 |
-) | +4.395 |
Neg logit contributions | |
WAY | -7.227 |
PET | -6.668 |
ARE | -6.239 |
VERT | -6.081 |
ggle | -6.038 |
Token | have |
Token ID | 423 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
ividual | +7.937 |
anonymity | +7.828 |
favorite | +7.202 |
-) | +7.111 |
important | +7.055 |
Neg logit contributions | |
WAY | -10.030 |
PET | -9.019 |
ARE | -8.497 |
VERT | -8.285 |
VER | -8.165 |
Token | been |
Token ID | 587 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
anonymity | +11.026 |
important | +10.404 |
ividual | +10.307 |
-) | +9.863 |
umatic | +9.385 |
Neg logit contributions | |
WAY | -19.143 |
PET | -18.238 |
VERT | -16.350 |
ARE | -16.310 |
ggle | -16.155 |
Token | great |
Token ID | 1049 |
Feature activation | +7.40e+00 |
Pos logit contributions | |
anonymity | +1.545 |
ividual | +1.534 |
favorite | +1.439 |
important | +1.414 |
-) | +1.380 |
Neg logit contributions | |
WAY | -1.657 |
PET | -1.538 |
ARE | -1.419 |
ggle | -1.370 |
VERT | -1.370 |
Token | to |
Token ID | 284 |
Feature activation | +5.29e+00 |
Pos logit contributions | |
anonymity | +5.236 |
ividual | +5.079 |
favorite | +4.713 |
important | +4.619 |
-) | +4.539 |
Neg logit contributions | |
WAY | -6.490 |
PET | -6.015 |
ARE | -5.558 |
ggle | -5.550 |
VERT | -5.424 |
Token | come |
Token ID | 1282 |
Feature activation | +6.95e+00 |
Pos logit contributions | |
anonymity | +3.945 |
ividual | +3.812 |
favorite | +3.612 |
-) | +3.506 |
important | +3.497 |
Neg logit contributions | |
WAY | -4.562 |
PET | -4.192 |
ARE | -3.887 |
VERT | -3.799 |
VER | -3.798 |
Token | in |
Token ID | 287 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
anonymity | +5.357 |
ividual | +5.225 |
favorite | +4.983 |
important | +4.852 |
-) | +4.834 |
Neg logit contributions | |
WAY | -5.675 |
PET | -5.206 |
ARE | -4.801 |
VERT | -4.676 |
TW | -4.624 |
Token |
|
Token ID | 198 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
ividual | +1.995 |
anonymity | +1.977 |
favorite | +1.906 |
important | +1.840 |
-) | +1.832 |
Neg logit contributions | |
WAY | -1.934 |
PET | -1.760 |
ARE | -1.625 |
ggle | -1.609 |
VERT | -1.585 |
Token |
|
Token ID | 198 |
Feature activation | +7.99e-01 |
Pos logit contributions | |
ividual | +1.220 |
anonymity | +1.206 |
favorite | +1.151 |
important | +1.119 |
-) | +1.109 |
Neg logit contributions | |
WAY | -1.005 |
PET | -0.908 |
ARE | -0.826 |
ggle | -0.813 |
VER | -0.806 |
Token | But |
Token ID | 1537 |
Feature activation | +3.71e+00 |
Pos logit contributions | |
ividual | +0.670 |
anonymity | +0.668 |
favorite | +0.651 |
important | +0.628 |
-) | +0.621 |
Neg logit contributions | |
WAY | -0.604 |
PET | -0.545 |
ggle | -0.500 |
ARE | -0.498 |
respectively | -0.490 |
Token | what |
Token ID | 644 |
Feature activation | -3.84e+00 |
Pos logit contributions | |
anonymity | +2.995 |
ividual | +2.954 |
favorite | +2.769 |
important | +2.702 |
-) | +2.668 |
Neg logit contributions | |
WAY | -2.987 |
PET | -2.744 |
ARE | -2.504 |
VERT | -2.462 |
ggle | -2.445 |
Token | must |
Token ID | 1276 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
WAY | +3.182 |
PET | +2.914 |
ARE | +2.713 |
VER | +2.669 |
ggle | +2.658 |
Neg logit contributions | |
ividual | -3.048 |
anonymity | -2.947 |
favorite | -2.825 |
important | -2.722 |
-) | -2.695 |
Token | have |
Token ID | 423 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
anonymity | +7.771 |
ividual | +7.553 |
favorite | +7.098 |
-) | +7.016 |
important | +6.912 |
Neg logit contributions | |
WAY | -8.865 |
PET | -7.888 |
VERT | -7.313 |
ARE | -7.113 |
VER | -7.070 |
Token | sounded |
Token ID | 14846 |
Feature activation | +6.96e-01 |
Pos logit contributions | |
anonymity | +12.593 |
important | +11.361 |
ividual | +11.010 |
favorite | +10.767 |
-) | +10.714 |
Neg logit contributions | |
WAY | -17.291 |
PET | -15.754 |
Charges | -14.467 |
VERT | -14.461 |
Fuck | -14.073 |
Token | like |
Token ID | 588 |
Feature activation | +3.22e+00 |
Pos logit contributions | |
anonymity | +0.514 |
ividual | +0.513 |
favorite | +0.481 |
important | +0.469 |
-) | +0.460 |
Neg logit contributions | |
WAY | -0.609 |
PET | -0.567 |
ARE | -0.520 |
TW | -0.510 |
VERT | -0.510 |
Token | a |
Token ID | 257 |
Feature activation | +2.59e+00 |
Pos logit contributions | |
anonymity | +2.620 |
ividual | +2.522 |
favorite | +2.382 |
important | +2.342 |
-) | +2.298 |
Neg logit contributions | |
WAY | -2.604 |
PET | -2.401 |
ARE | -2.201 |
VERT | -2.147 |
ggle | -2.131 |
Token | good |
Token ID | 922 |
Feature activation | -4.87e+00 |
Pos logit contributions | |
anonymity | +2.052 |
ividual | +2.028 |
favorite | +1.929 |
important | +1.878 |
-) | +1.853 |
Neg logit contributions | |
WAY | -2.118 |
PET | -1.932 |
ARE | -1.797 |
TW | -1.743 |
VERT | -1.721 |
Token | idea |
Token ID | 2126 |
Feature activation | +7.29e+00 |
Pos logit contributions | |
WAY | +3.832 |
PET | +3.477 |
ARE | +3.185 |
ggle | +3.139 |
TW | +3.112 |
Neg logit contributions | |
ividual | -4.090 |
anonymity | -3.964 |
favorite | -3.796 |
important | -3.676 |
-) | -3.627 |
Token | or |
Token ID | 393 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
WAY | +0.235 |
PET | +0.219 |
ARE | +0.205 |
ggle | +0.203 |
VER | +0.201 |
Neg logit contributions | |
ividual | -0.144 |
anonymity | -0.141 |
favorite | -0.131 |
important | -0.126 |
-) | -0.124 |
Token | another |
Token ID | 1194 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
ividual | +0.107 |
anonymity | +0.106 |
favorite | +0.099 |
important | +0.096 |
-) | +0.095 |
Neg logit contributions | |
WAY | -0.116 |
PET | -0.106 |
ARE | -0.099 |
ggle | -0.097 |
VER | -0.096 |
Token | of |
Token ID | 286 |
Feature activation | +3.82e+00 |
Pos logit contributions | |
WAY | +1.058 |
PET | +0.969 |
ARE | +0.894 |
ggle | +0.879 |
VER | +0.874 |
Neg logit contributions | |
ividual | -1.002 |
anonymity | -0.986 |
favorite | -0.931 |
important | -0.904 |
-) | -0.892 |
Token | his |
Token ID | 465 |
Feature activation | +7.24e+00 |
Pos logit contributions | |
ividual | +2.959 |
anonymity | +2.942 |
favorite | +2.723 |
important | +2.710 |
-) | +2.642 |
Neg logit contributions | |
WAY | -3.177 |
PET | -2.922 |
ARE | -2.689 |
ggle | -2.643 |
TW | -2.629 |
Token | " |
Token ID | 366 |
Feature activation | +8.71e+00 |
Pos logit contributions | |
anonymity | +5.414 |
ividual | +5.318 |
favorite | +5.017 |
important | +4.997 |
-) | +4.811 |
Neg logit contributions | |
WAY | -5.980 |
PET | -5.526 |
VER | -5.020 |
ARE | -5.020 |
ggle | -4.986 |
Token | near |
Token ID | 40093 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
favorite | +6.129 |
important | +5.928 |
ividual | +5.893 |
anonymity | +5.734 |
-) | +5.461 |
Neg logit contributions | |
WAY | -7.327 |
PET | -6.596 |
respectively | -6.246 |
ggle | -6.235 |
POL | -6.092 |
Token | abroad |
Token ID | 10522 |
Feature activation | +9.08e+00 |
Pos logit contributions | |
anonymity | +14.653 |
ividual | +13.727 |
-) | +13.712 |
favorite | +13.179 |
important | +12.561 |
Neg logit contributions | |
WAY | -15.404 |
PET | -14.293 |
VERT | -13.341 |
Charges | -13.053 |
TW | -12.959 |
Token | ." |
Token ID | 526 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
ividual | +6.442 |
anonymity | +6.422 |
favorite | +6.051 |
important | +5.849 |
-) | +5.556 |
Neg logit contributions | |
WAY | -7.670 |
PET | -7.136 |
VERT | -6.500 |
VER | -6.373 |
ARE | -6.354 |
Token | He |
Token ID | 679 |
Feature activation | -3.71e+00 |
Pos logit contributions | |
WAY | +0.173 |
PET | +0.158 |
ARE | +0.144 |
ggle | +0.142 |
VER | +0.141 |
Neg logit contributions | |
ividual | -0.187 |
anonymity | -0.185 |
favorite | -0.176 |
important | -0.171 |
-) | -0.170 |
Token | is |
Token ID | 318 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
WAY | +2.969 |
PET | +2.720 |
ARE | +2.495 |
ggle | +2.464 |
VER | +2.449 |
Neg logit contributions | |
ividual | -3.037 |
anonymity | -2.990 |
favorite | -2.837 |
important | -2.738 |
-) | -2.705 |
Token | at |
Token ID | 379 |
Feature activation | +8.70e-01 |
Pos logit contributions | |
WAY | +2.371 |
PET | +2.183 |
ARE | +2.016 |
ggle | +1.989 |
VER | +1.984 |
Neg logit contributions | |
ividual | -2.028 |
anonymity | -1.976 |
favorite | -1.873 |
important | -1.801 |
-) | -1.781 |
Token | - |
Token ID | 12 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
anonymity | +2.588 |
ividual | +2.564 |
favorite | +2.378 |
-) | +2.304 |
important | +2.294 |
Neg logit contributions | |
WAY | -4.684 |
PET | -4.310 |
ARE | -4.062 |
ggle | -4.054 |
VER | -4.042 |
Token | to |
Token ID | 1462 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
ividual | +2.064 |
anonymity | +2.030 |
favorite | +1.990 |
important | +1.934 |
-) | +1.899 |
Neg logit contributions | |
WAY | -2.138 |
PET | -1.914 |
ggle | -1.782 |
ARE | -1.779 |
VER | -1.755 |
Token | - |
Token ID | 12 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
-) | +8.612 |
favorite | +8.257 |
anonymity | +7.825 |
important | +7.206 |
ividual | +6.889 |
Neg logit contributions | |
WAY | -20.900 |
PET | -19.300 |
VERT | -18.338 |
ARE | -18.226 |
ggle | -17.967 |
Token | back |
Token ID | 1891 |
Feature activation | +9.17e+00 |
Pos logit contributions | |
favorite | +7.791 |
anonymity | +7.211 |
important | +7.142 |
ividual | +6.876 |
-) | +6.762 |
Neg logit contributions | |
WAY | -10.672 |
PET | -9.658 |
ggle | -9.222 |
Defendant | -9.170 |
Defendants | -9.086 |
Token | - |
Token ID | 12 |
Feature activation | +5.66e+00 |
Pos logit contributions | |
anonymity | +6.594 |
ividual | +6.424 |
favorite | +6.189 |
important | +6.060 |
-) | +5.950 |
Neg logit contributions | |
WAY | -7.642 |
PET | -6.937 |
ARE | -6.559 |
ggle | -6.474 |
VERT | -6.365 |
Token | to |
Token ID | 1462 |
Feature activation | +2.22e+01 |
Pos logit contributions | |
ividual | +4.214 |
favorite | +4.196 |
anonymity | +4.126 |
important | +4.033 |
-) | +3.905 |
Neg logit contributions | |
WAY | -4.707 |
PET | -4.200 |
ggle | -4.016 |
ARE | -3.923 |
POL | -3.846 |
Token | - |
Token ID | 12 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
-) | +10.675 |
anonymity | +10.428 |
favorite | +10.397 |
important | +9.771 |
ividual | +9.737 |
Neg logit contributions | |
WAY | -18.905 |
PET | -17.268 |
ARE | -16.398 |
VERT | -16.209 |
POL | -15.973 |
Token | back |
Token ID | 1891 |
Feature activation | +9.17e+00 |
Pos logit contributions | |
favorite | +7.467 |
anonymity | +7.043 |
important | +6.901 |
ividual | +6.766 |
-) | +6.603 |
Neg logit contributions | |
WAY | -9.560 |
PET | -8.665 |
ggle | -8.246 |
Defendant | -8.104 |
ARE | -8.078 |
Token | - |
Token ID | 12 |
Feature activation | +3.28e+00 |
Pos logit contributions | |
anonymity | +6.643 |
ividual | +6.483 |
favorite | +6.229 |
important | +6.110 |
-) | +6.026 |
Neg logit contributions | |
WAY | -7.559 |
PET | -6.911 |
ARE | -6.517 |
ggle | -6.377 |
VERT | -6.352 |
Token | to |
Token ID | 1462 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
ividual | +2.593 |
anonymity | +2.540 |
favorite | +2.516 |
important | +2.427 |
-) | +2.379 |
Neg logit contributions | |
WAY | -2.665 |
PET | -2.403 |
ARE | -2.237 |
ggle | -2.234 |
VERT | -2.164 |
Token | - |
Token ID | 12 |
Feature activation | +7.82e+00 |
Pos logit contributions | |
-) | +7.660 |
favorite | +7.629 |
anonymity | +7.612 |
ividual | +7.305 |
important | +6.913 |
Neg logit contributions | |
WAY | -16.790 |
PET | -15.297 |
ARE | -14.764 |
VERT | -14.241 |
TW | -14.222 |
Token | - |
Token ID | 12 |
Feature activation | -5.21e+00 |
Pos logit contributions | |
anonymity | +3.192 |
ividual | +3.112 |
favorite | +2.988 |
-) | +2.890 |
important | +2.856 |
Neg logit contributions | |
WAY | -7.860 |
PET | -7.391 |
ARE | -6.967 |
VERT | -6.926 |
VER | -6.866 |
Token | high |
Token ID | 8929 |
Feature activation | +6.20e+00 |
Pos logit contributions | |
WAY | +4.631 |
PET | +4.271 |
ARE | +3.953 |
ggle | +3.911 |
TW | +3.889 |
Neg logit contributions | |
ividual | -3.834 |
anonymity | -3.737 |
favorite | -3.430 |
-) | -3.317 |
important | -3.298 |
Token | - |
Token ID | 12 |
Feature activation | -7.92e+00 |
Pos logit contributions | |
anonymity | +4.632 |
ividual | +4.535 |
favorite | +4.392 |
-) | +4.312 |
important | +4.216 |
Neg logit contributions | |
WAY | -4.796 |
PET | -4.671 |
VERT | -4.311 |
ARE | -4.265 |
ggle | -4.222 |
Token | price |
Token ID | 20888 |
Feature activation | +6.58e+00 |
Pos logit contributions | |
WAY | +6.971 |
PET | +6.311 |
ARE | +5.856 |
TW | +5.811 |
ggle | +5.776 |
Neg logit contributions | |
ividual | -5.872 |
anonymity | -5.730 |
favorite | -5.213 |
-) | -5.078 |
important | -4.993 |
Token | - |
Token ID | 12 |
Feature activation | -5.20e+00 |
Pos logit contributions | |
anonymity | +2.643 |
ividual | +2.559 |
favorite | +2.407 |
-) | +2.307 |
important | +2.173 |
Neg logit contributions | |
WAY | -7.580 |
PET | -7.235 |
VERT | -6.821 |
ARE | -6.772 |
TW | -6.762 |
Token | of |
Token ID | 1659 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
WAY | +3.897 |
PET | +3.546 |
ARE | +3.232 |
ggle | +3.158 |
VER | +3.154 |
Neg logit contributions | |
ividual | -4.569 |
anonymity | -4.477 |
favorite | -4.186 |
-) | -4.074 |
important | -4.058 |
Token | - |
Token ID | 12 |
Feature activation | +5.60e+00 |
Pos logit contributions | |
anonymity | +8.942 |
-) | +8.622 |
favorite | +7.668 |
important | +7.281 |
ividual | +7.082 |
Neg logit contributions | |
WAY | -20.624 |
PET | -19.409 |
VERT | -18.372 |
Defendant | -18.237 |
ARE | -18.187 |
Token | the |
Token ID | 1169 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
anonymity | +4.058 |
ividual | +4.031 |
favorite | +3.987 |
important | +3.901 |
-) | +3.742 |
Neg logit contributions | |
WAY | -4.707 |
PET | -4.282 |
ARE | -3.987 |
ggle | -3.966 |
respectively | -3.944 |
Token | - |
Token ID | 12 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
-) | +6.071 |
anonymity | +6.031 |
favorite | +5.724 |
important | +5.497 |
ividual | +5.328 |
Neg logit contributions | |
WAY | -17.466 |
PET | -16.227 |
VERT | -15.594 |
VER | -15.344 |
ARE | -15.207 |
Token | trans |
Token ID | 7645 |
Feature activation | +5.55e+00 |
Pos logit contributions | |
ividual | +0.781 |
anonymity | +0.776 |
favorite | +0.749 |
important | +0.727 |
-) | +0.708 |
Neg logit contributions | |
WAY | -0.891 |
PET | -0.813 |
ARE | -0.754 |
ggle | -0.747 |
VER | -0.742 |
Token | - |
Token ID | 12 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
anonymity | +2.855 |
ividual | +2.767 |
favorite | +2.627 |
-) | +2.614 |
important | +2.562 |
Neg logit contributions | |
WAY | -5.873 |
PET | -5.525 |
ARE | -5.208 |
ggle | -5.181 |
VER | -5.127 |
Token | aim |
Token ID | 4031 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
WAY | +3.293 |
PET | +2.969 |
ARE | +2.735 |
ggle | +2.693 |
VER | +2.665 |
Neg logit contributions | |
ividual | -3.917 |
anonymity | -3.852 |
favorite | -3.666 |
important | -3.565 |
-) | -3.479 |
Token | to |
Token ID | 284 |
Feature activation | -6.98e-01 |
Pos logit contributions | |
WAY | +1.581 |
PET | +1.447 |
ARE | +1.332 |
ggle | +1.312 |
VER | +1.306 |
Neg logit contributions | |
ividual | -1.518 |
anonymity | -1.494 |
favorite | -1.414 |
important | -1.370 |
-) | -1.354 |
Token | answer |
Token ID | 3280 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
WAY | +0.510 |
PET | +0.460 |
ARE | +0.418 |
VER | +0.408 |
ggle | +0.408 |
Neg logit contributions | |
ividual | -0.625 |
anonymity | -0.621 |
favorite | -0.588 |
important | -0.574 |
-) | -0.569 |
Token | here |
Token ID | 994 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
ividual | +1.074 |
anonymity | +1.062 |
favorite | +0.993 |
important | +0.968 |
-) | +0.963 |
Neg logit contributions | |
WAY | -1.165 |
PET | -1.069 |
ARE | -0.984 |
ggle | -0.970 |
VER | -0.959 |
Token | is |
Token ID | 318 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
ividual | +0.361 |
anonymity | +0.356 |
favorite | +0.337 |
important | +0.328 |
-) | +0.325 |
Neg logit contributions | |
WAY | -0.364 |
PET | -0.333 |
ARE | -0.304 |
ggle | -0.302 |
VER | -0.298 |
Token | , |
Token ID | 11 |
Feature activation | -3.01e+01 |
Pos logit contributions | |
WAY | +13.872 |
PET | +12.361 |
POL | +12.298 |
respectively | +12.141 |
VER | +12.042 |
Neg logit contributions | |
ividual | -15.035 |
interstitial | -14.074 |
favorite | -14.072 |
anonymity | -13.837 |
pecially | -13.119 |
Token | which |
Token ID | 543 |
Feature activation | -5.18e+00 |
Pos logit contributions | |
respectively | +16.401 |
WAY | +16.244 |
ARE | +15.203 |
POL | +15.090 |
PET | +14.704 |
Neg logit contributions | |
ividual | -18.883 |
interstitial | -17.902 |
anonymity | -17.099 |
favorite | -16.991 |
important | -16.163 |
Token | way |
Token ID | 835 |
Feature activation | -9.83e+00 |
Pos logit contributions | |
WAY | +3.965 |
PET | +3.589 |
ARE | +3.293 |
VER | +3.233 |
ggle | +3.196 |
Neg logit contributions | |
ividual | -4.402 |
anonymity | -4.254 |
favorite | -4.135 |
important | -3.986 |
-) | -3.916 |
Token | ? |
Token ID | 5633 |
Feature activation | -3.54e+00 |
Pos logit contributions | |
WAY | +6.879 |
PET | +6.137 |
ARE | +5.750 |
VER | +5.669 |
POL | +5.563 |
Neg logit contributions | |
ividual | -8.645 |
anonymity | -8.225 |
favorite | -8.078 |
important | -7.810 |
interstitial | -7.668 |
Token | How |
Token ID | 1374 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
WAY | +2.630 |
PET | +2.378 |
ARE | +2.170 |
VER | +2.127 |
ggle | +2.125 |
Neg logit contributions | |
ividual | -3.120 |
anonymity | -3.065 |
favorite | -2.923 |
important | -2.829 |
-) | -2.793 |
Token | would |
Token ID | 561 |
Feature activation | +3.71e+00 |
Pos logit contributions | |
WAY | +8.183 |
PET | +7.302 |
ARE | +6.970 |
VER | +6.849 |
POL | +6.813 |
Neg logit contributions | |
ividual | -10.535 |
favorite | -9.973 |
anonymity | -9.951 |
interstitial | -9.635 |
important | -9.301 |
Token | on |
Token ID | 319 |
Feature activation | -4.64e+00 |
Pos logit contributions | |
WAY | +6.822 |
PET | +6.276 |
respectively | +5.779 |
VER | +5.675 |
ARE | +5.631 |
Neg logit contributions | |
ividual | -7.560 |
anonymity | -7.314 |
favorite | -7.105 |
interstitial | -6.853 |
important | -6.794 |
Token | Ubuntu |
Token ID | 14949 |
Feature activation | -5.21e+00 |
Pos logit contributions | |
WAY | +3.325 |
PET | +2.979 |
ARE | +2.716 |
ggle | +2.675 |
VER | +2.650 |
Neg logit contributions | |
ividual | -4.182 |
anonymity | -4.096 |
favorite | -3.942 |
important | -3.819 |
-) | -3.771 |
Token | and |
Token ID | 290 |
Feature activation | -8.25e+00 |
Pos logit contributions | |
WAY | +4.125 |
PET | +3.733 |
ARE | +3.423 |
VER | +3.406 |
respectively | +3.397 |
Neg logit contributions | |
ividual | -4.280 |
anonymity | -4.177 |
favorite | -4.024 |
important | -3.845 |
-) | -3.826 |
Token | Fedora |
Token ID | 32245 |
Feature activation | -7.31e+00 |
Pos logit contributions | |
WAY | +5.407 |
PET | +4.841 |
respectively | +4.356 |
ggle | +4.340 |
ARE | +4.335 |
Neg logit contributions | |
ividual | -7.822 |
anonymity | -7.461 |
favorite | -7.236 |
important | -7.011 |
interstitial | -6.955 |
Token | to |
Token ID | 284 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
WAY | +5.668 |
PET | +5.175 |
respectively | +4.850 |
ARE | +4.714 |
VER | +4.691 |
Neg logit contributions | |
ividual | -5.979 |
anonymity | -5.801 |
favorite | -5.628 |
important | -5.385 |
interstitial | -5.351 |
Token | see |
Token ID | 766 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
WAY | +6.960 |
PET | +6.176 |
respectively | +5.922 |
ggle | +5.868 |
lengths | +5.691 |
Neg logit contributions | |
ividual | -10.102 |
anonymity | -9.533 |
favorite | -9.417 |
interstitial | -9.308 |
important | -9.089 |
Token | how |
Token ID | 703 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
respectively | +11.630 |
WAY | +11.183 |
strides | +9.910 |
lengths | +9.802 |
ARE | +9.732 |
Neg logit contributions | |
ividual | -21.459 |
interstitial | -20.200 |
anonymity | -19.516 |
favorite | -19.141 |
important | -18.980 |
Token | the |
Token ID | 262 |
Feature activation | -9.18e+00 |
Pos logit contributions | |
WAY | +8.073 |
PET | +7.311 |
respectively | +7.182 |
VER | +6.933 |
ggle | +6.876 |
Neg logit contributions | |
ividual | -10.289 |
favorite | -9.599 |
anonymity | -9.510 |
interstitial | -9.366 |
important | -8.952 |
Token | experiences |
Token ID | 6461 |
Feature activation | -3.06e+00 |
Pos logit contributions | |
WAY | +6.248 |
PET | +5.656 |
respectively | +5.269 |
TW | +5.118 |
ARE | +5.098 |
Neg logit contributions | |
ividual | -8.199 |
anonymity | -7.681 |
favorite | -7.634 |
interstitial | -7.365 |
important | -7.360 |
Token | would |
Token ID | 561 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
WAY | +2.540 |
PET | +2.325 |
ARE | +2.145 |
ggle | +2.116 |
VER | +2.105 |
Neg logit contributions | |
ividual | -2.416 |
anonymity | -2.373 |
favorite | -2.259 |
important | -2.181 |
-) | -2.145 |
Token | compare |
Token ID | 8996 |
Feature activation | -7.75e+00 |
Pos logit contributions | |
WAY | +1.733 |
PET | +1.593 |
ARE | +1.473 |
ggle | +1.454 |
VER | +1.446 |
Neg logit contributions | |
ividual | -1.523 |
anonymity | -1.497 |
favorite | -1.415 |
important | -1.368 |
-) | -1.346 |
Token | common |
Token ID | 2219 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
WAY | +0.973 |
PET | +0.887 |
ARE | +0.812 |
ggle | +0.799 |
VER | +0.795 |
Neg logit contributions | |
ividual | -1.030 |
anonymity | -1.019 |
favorite | -0.963 |
important | -0.938 |
-) | -0.926 |
Token | question |
Token ID | 1808 |
Feature activation | -9.42e+00 |
Pos logit contributions | |
WAY | +9.039 |
PET | +7.941 |
ARE | +7.524 |
strides | +7.402 |
lengths | +7.313 |
Neg logit contributions | |
ividual | -10.499 |
favorite | -9.668 |
important | -9.389 |
anonymity | -9.329 |
-) | -9.251 |
Token | from |
Token ID | 422 |
Feature activation | -7.20e+00 |
Pos logit contributions | |
WAY | +6.664 |
PET | +6.150 |
ARE | +5.648 |
respectively | +5.472 |
TW | +5.468 |
Neg logit contributions | |
ividual | -7.906 |
anonymity | -7.671 |
favorite | -7.528 |
important | -7.266 |
-) | -7.132 |
Token | colleagues |
Token ID | 7810 |
Feature activation | +7.81e+00 |
Pos logit contributions | |
WAY | +5.119 |
PET | +4.616 |
ARE | +4.243 |
ggle | +4.137 |
VER | +4.131 |
Neg logit contributions | |
ividual | -6.375 |
anonymity | -6.145 |
favorite | -6.070 |
important | -5.822 |
-) | -5.733 |
Token | has |
Token ID | 468 |
Feature activation | -6.38e-01 |
Pos logit contributions | |
ividual | +5.619 |
anonymity | +5.608 |
favorite | +5.040 |
important | +4.961 |
-) | +4.952 |
Neg logit contributions | |
WAY | -6.784 |
PET | -6.204 |
ARE | -5.755 |
ggle | -5.690 |
VER | -5.654 |
Token | been |
Token ID | 587 |
Feature activation | -2.48e+01 |
Pos logit contributions | |
WAY | +0.705 |
PET | +0.659 |
ARE | +0.621 |
ggle | +0.613 |
VER | +0.611 |
Neg logit contributions | |
ividual | -0.334 |
anonymity | -0.326 |
favorite | -0.299 |
important | -0.285 |
-) | -0.280 |
Token | � |
Token ID | 564 |
Feature activation | -5.93e+00 |
Pos logit contributions | |
WAY | +15.478 |
PET | +13.703 |
ARE | +13.552 |
POL | +13.395 |
VER | +13.103 |
Neg logit contributions | |
ividual | -16.473 |
favorite | -15.547 |
interstitial | -15.316 |
pecially | -15.042 |
anonymity | -15.021 |
Token | � |
Token ID | 250 |
Feature activation | -6.72e+00 |
Pos logit contributions | |
WAY | +3.419 |
PET | +2.970 |
ARE | +2.665 |
VER | +2.601 |
� | +2.568 |
Neg logit contributions | |
ividual | -6.200 |
anonymity | -6.045 |
favorite | -5.713 |
important | -5.596 |
-) | -5.518 |
Token | W |
Token ID | 54 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
WAY | +5.923 |
PET | +5.464 |
ARE | +5.141 |
VER | +5.055 |
ggle | +5.005 |
Neg logit contributions | |
ividual | -4.882 |
anonymity | -4.724 |
favorite | -4.424 |
important | -4.241 |
-) | -4.199 |
Token | eren |
Token ID | 14226 |
Feature activation | -1.52e+01 |
Pos logit contributions | |
WAY | +10.338 |
PET | +9.743 |
ARE | +9.496 |
TW | +9.258 |
VER | +9.255 |
Neg logit contributions | |
ividual | -8.154 |
anonymity | -8.028 |
favorite | -7.472 |
important | -7.020 |
interstitial | -6.994 |
Token | � |
Token ID | 447 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
WAY | +9.797 |
PET | +9.022 |
TW | +8.538 |
ggle | +8.311 |
ARE | +8.236 |
Neg logit contributions | |
ividual | -12.215 |
anonymity | -11.968 |
favorite | -11.467 |
interstitial | -11.059 |
inav | -10.722 |
Token | conscious |
Token ID | 16796 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
WAY | +2.808 |
PET | +2.544 |
ARE | +2.353 |
ggle | +2.308 |
VER | +2.287 |
Neg logit contributions | |
ividual | -2.945 |
anonymity | -2.878 |
favorite | -2.714 |
important | -2.627 |
-) | -2.585 |
Token | a |
Token ID | 257 |
Feature activation | +5.88e+00 |
Pos logit contributions | |
ividual | +2.131 |
anonymity | +2.128 |
favorite | +2.002 |
important | +1.951 |
-) | +1.925 |
Neg logit contributions | |
WAY | -2.081 |
PET | -1.908 |
ARE | -1.750 |
ggle | -1.719 |
VER | -1.698 |
Token | low |
Token ID | 1877 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
anonymity | +4.528 |
ividual | +4.453 |
favorite | +4.306 |
-) | +4.135 |
important | +4.099 |
Neg logit contributions | |
WAY | -4.850 |
PET | -4.474 |
ARE | -4.109 |
TW | -4.016 |
ggle | -4.012 |
Token | grade |
Token ID | 9559 |
Feature activation | +7.11e+00 |
Pos logit contributions | |
anonymity | +1.460 |
ividual | +1.451 |
favorite | +1.385 |
important | +1.332 |
-) | +1.328 |
Neg logit contributions | |
WAY | -1.496 |
PET | -1.375 |
ARE | -1.262 |
ggle | -1.245 |
VERT | -1.232 |
Token | is |
Token ID | 318 |
Feature activation | -9.18e+00 |
Pos logit contributions | |
anonymity | +5.196 |
ividual | +4.964 |
favorite | +4.829 |
important | +4.675 |
-) | +4.657 |
Neg logit contributions | |
WAY | -6.126 |
PET | -5.645 |
ARE | -5.193 |
ggle | -5.075 |
VERT | -5.068 |
Token | wondering |
Token ID | 11263 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
WAY | +6.538 |
PET | +5.833 |
ggle | +5.320 |
ARE | +5.309 |
VER | +5.249 |
Neg logit contributions | |
ividual | -8.022 |
anonymity | -7.469 |
favorite | -7.453 |
-) | -7.078 |
important | -7.039 |
Token | who |
Token ID | 508 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
WAY | +11.985 |
respectively | +11.131 |
ARE | +10.277 |
PET | +10.233 |
lengths | +10.168 |
Neg logit contributions | |
ividual | -20.041 |
interstitial | -18.375 |
anonymity | -17.729 |
favorite | -17.539 |
important | -17.234 |
Token | it |
Token ID | 340 |
Feature activation | +8.02e-02 |
Pos logit contributions | |
WAY | +0.101 |
PET | +0.093 |
ARE | +0.085 |
ggle | +0.084 |
VERT | +0.083 |
Neg logit contributions | |
ividual | -0.099 |
anonymity | -0.099 |
favorite | -0.093 |
important | -0.091 |
-) | -0.090 |
Token | could |
Token ID | 714 |
Feature activation | +8.42e+00 |
Pos logit contributions | |
ividual | +0.064 |
anonymity | +0.063 |
favorite | +0.060 |
important | +0.058 |
-) | +0.058 |
Neg logit contributions | |
WAY | -0.067 |
PET | -0.061 |
ARE | -0.056 |
ggle | -0.055 |
VER | -0.055 |
Token | have |
Token ID | 423 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
anonymity | +5.982 |
ividual | +5.963 |
favorite | +5.610 |
-) | +5.376 |
important | +5.365 |
Neg logit contributions | |
WAY | -7.268 |
PET | -6.656 |
ARE | -6.114 |
VERT | -6.099 |
VER | -6.019 |
Token | been |
Token ID | 587 |
Feature activation | +3.63e+00 |
Pos logit contributions | |
anonymity | +10.429 |
important | +9.678 |
favorite | +9.564 |
ividual | +9.557 |
-) | +9.136 |
Neg logit contributions | |
WAY | -12.231 |
PET | -11.644 |
VERT | -10.379 |
ggle | -10.304 |
TW | -10.303 |
Token | not |
Token ID | 407 |
Feature activation | -7.90e+00 |
Pos logit contributions | |
WAY | +2.403 |
PET | +2.212 |
ARE | +2.038 |
ggle | +2.012 |
VER | +2.005 |
Neg logit contributions | |
ividual | -2.211 |
anonymity | -2.173 |
favorite | -2.056 |
important | -1.989 |
-) | -1.967 |
Token | use |
Token ID | 779 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
WAY | +5.755 |
PET | +5.347 |
ggle | +4.921 |
ARE | +4.851 |
VER | +4.807 |
Neg logit contributions | |
ividual | -6.616 |
anonymity | -6.429 |
favorite | -6.184 |
important | -6.027 |
interstitial | -6.021 |
Token | crack |
Token ID | 8469 |
Feature activation | -6.76e+00 |
Pos logit contributions | |
WAY | +1.502 |
PET | +1.361 |
ARE | +1.241 |
ggle | +1.221 |
VER | +1.215 |
Neg logit contributions | |
ividual | -1.750 |
anonymity | -1.721 |
favorite | -1.640 |
important | -1.594 |
-) | -1.577 |
Token | cocaine |
Token ID | 15144 |
Feature activation | -8.31e+00 |
Pos logit contributions | |
WAY | +4.509 |
PET | +4.091 |
ARE | +3.675 |
ggle | +3.663 |
VER | +3.632 |
Neg logit contributions | |
ividual | -6.284 |
anonymity | -6.087 |
favorite | -5.941 |
important | -5.742 |
-) | -5.653 |
Token | , |
Token ID | 11 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
WAY | +6.884 |
PET | +6.345 |
VER | +5.822 |
ARE | +5.815 |
ggle | +5.809 |
Neg logit contributions | |
ividual | -6.224 |
anonymity | -6.038 |
favorite | -5.801 |
important | -5.617 |
interstitial | -5.496 |
Token | nor |
Token ID | 4249 |
Feature activation | -2.44e+01 |
Pos logit contributions | |
WAY | +10.489 |
PET | +9.777 |
TW | +9.064 |
ARE | +9.011 |
POL | +8.948 |
Neg logit contributions | |
ividual | -10.052 |
anonymity | -9.489 |
favorite | -9.301 |
important | -8.946 |
interstitial | -8.832 |
Token | am |
Token ID | 716 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
WAY | +13.484 |
PET | +12.080 |
POL | +11.851 |
ever | +11.831 |
ARE | +11.764 |
Neg logit contributions | |
ividual | -18.392 |
favorite | -17.404 |
important | -16.782 |
interstitial | -16.295 |
anonymity | -16.251 |
Token | I |
Token ID | 314 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
WAY | +7.462 |
PET | +6.627 |
VER | +5.795 |
ARE | +5.751 |
POL | +5.742 |
Neg logit contributions | |
ividual | -13.386 |
favorite | -13.107 |
anonymity | -13.075 |
important | -12.330 |
inav | -12.306 |
Token | an |
Token ID | 281 |
Feature activation | -8.57e+00 |
Pos logit contributions | |
WAY | +12.184 |
PET | +11.059 |
ARE | +10.490 |
POL | +10.467 |
VER | +10.339 |
Neg logit contributions | |
ividual | -11.909 |
favorite | -11.319 |
anonymity | -11.110 |
inav | -10.959 |
interstitial | -10.444 |
Token | addict |
Token ID | 19678 |
Feature activation | -4.56e+00 |
Pos logit contributions | |
WAY | +4.730 |
PET | +4.076 |
ARE | +3.743 |
TW | +3.538 |
POL | +3.510 |
Neg logit contributions | |
ividual | -8.691 |
anonymity | -8.489 |
favorite | -8.391 |
important | -8.027 |
-) | -7.977 |
Token | of |
Token ID | 286 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
WAY | +4.003 |
PET | +3.707 |
ARE | +3.426 |
ggle | +3.397 |
VER | +3.372 |
Neg logit contributions | |
ividual | -3.317 |
anonymity | -3.296 |
favorite | -3.090 |
important | -2.987 |
-) | -2.939 |
Token | . |
Token ID | 13 |
Feature activation | -4.63e+00 |
Pos logit contributions | |
anonymity | +0.969 |
ividual | +0.959 |
favorite | +0.891 |
important | +0.872 |
-) | +0.853 |
Neg logit contributions | |
WAY | -1.115 |
PET | -1.030 |
ARE | -0.946 |
ggle | -0.936 |
VERT | -0.929 |
Token | " |
Token ID | 366 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
WAY | +2.973 |
PET | +2.641 |
ARE | +2.373 |
VER | +2.310 |
TW | +2.300 |
Neg logit contributions | |
ividual | -4.559 |
anonymity | -4.464 |
favorite | -4.285 |
important | -4.157 |
-) | -4.124 |
Token | I |
Token ID | 40 |
Feature activation | -5.21e+00 |
Pos logit contributions | |
WAY | +7.600 |
PET | +7.028 |
ARE | +6.395 |
VER | +6.232 |
TW | +6.189 |
Neg logit contributions | |
ividual | -9.995 |
anonymity | -9.401 |
favorite | -8.588 |
interstitial | -8.518 |
umatic | -8.486 |
Token | am |
Token ID | 716 |
Feature activation | -8.13e+00 |
Pos logit contributions | |
WAY | +3.980 |
PET | +3.620 |
ARE | +3.308 |
ggle | +3.292 |
VER | +3.257 |
Neg logit contributions | |
ividual | -4.413 |
anonymity | -4.309 |
favorite | -4.142 |
important | -4.007 |
interstitial | -3.934 |
Token | wondering |
Token ID | 11263 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
WAY | +6.540 |
PET | +5.947 |
ARE | +5.471 |
respectively | +5.409 |
VER | +5.409 |
Neg logit contributions | |
ividual | -6.481 |
anonymity | -6.049 |
favorite | -6.029 |
important | -5.704 |
interstitial | -5.695 |
Token | , |
Token ID | 11 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
WAY | +10.195 |
respectively | +9.123 |
PET | +9.024 |
ARE | +8.748 |
POL | +8.634 |
Neg logit contributions | |
ividual | -17.268 |
interstitial | -16.246 |
favorite | -15.731 |
anonymity | -15.682 |
important | -14.985 |
Token | why |
Token ID | 1521 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
WAY | +14.550 |
respectively | +13.841 |
ARE | +13.438 |
PET | +13.285 |
POL | +12.903 |
Neg logit contributions | |
ividual | -16.985 |
interstitial | -15.997 |
favorite | -15.836 |
anonymity | -15.152 |
important | -14.824 |
Token | is |
Token ID | 318 |
Feature activation | -5.49e-01 |
Pos logit contributions | |
WAY | +8.866 |
PET | +8.290 |
respectively | +7.623 |
ARE | +7.590 |
POL | +7.546 |
Neg logit contributions | |
ividual | -11.595 |
favorite | -10.811 |
interstitial | -10.512 |
anonymity | -10.239 |
important | -10.230 |
Token | the |
Token ID | 262 |
Feature activation | -5.99e+00 |
Pos logit contributions | |
WAY | +0.438 |
PET | +0.398 |
ARE | +0.366 |
ggle | +0.361 |
VER | +0.356 |
Neg logit contributions | |
anonymity | -0.455 |
ividual | -0.454 |
favorite | -0.423 |
important | -0.416 |
-) | -0.409 |
Token | Finance |
Token ID | 15007 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
WAY | +4.195 |
PET | +3.784 |
ARE | +3.421 |
VER | +3.340 |
ggle | +3.335 |
Neg logit contributions | |
ividual | -5.506 |
anonymity | -5.262 |
favorite | -5.184 |
important | -4.981 |
-) | -4.952 |
Token | Minister |
Token ID | 4139 |
Feature activation | -6.22e+00 |
Pos logit contributions | |
WAY | +5.476 |
PET | +4.611 |
ARE | +4.064 |
POL | +3.957 |
TW | +3.846 |
Neg logit contributions | |
ividual | -12.653 |
anonymity | -12.219 |
favorite | -12.189 |
interstitial | -11.676 |
-) | -11.656 |
Token | %). |
Token ID | 18823 |
Feature activation | +4.52e+00 |
Pos logit contributions | |
ividual | +3.316 |
anonymity | +3.297 |
favorite | +3.062 |
-) | +3.060 |
important | +3.039 |
Neg logit contributions | |
WAY | -5.345 |
PET | -4.925 |
ggle | -4.612 |
ARE | -4.600 |
VERT | -4.530 |
Token | It |
Token ID | 632 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
anonymity | +3.381 |
ividual | +3.363 |
favorite | +3.236 |
-) | +3.182 |
important | +3.174 |
Neg logit contributions | |
WAY | -3.744 |
PET | -3.396 |
ggle | -3.185 |
ARE | -3.152 |
VERT | -3.073 |
Token | remains |
Token ID | 3793 |
Feature activation | -9.97e+00 |
Pos logit contributions | |
WAY | +1.083 |
PET | +0.991 |
ARE | +0.912 |
ggle | +0.898 |
VER | +0.894 |
Neg logit contributions | |
ividual | -1.052 |
anonymity | -1.036 |
favorite | -0.981 |
important | -0.950 |
-) | -0.939 |
Token | to |
Token ID | 284 |
Feature activation | -6.34e+00 |
Pos logit contributions | |
WAY | +6.999 |
PET | +6.371 |
respectively | +5.856 |
VER | +5.844 |
POL | +5.800 |
Neg logit contributions | |
ividual | -8.767 |
anonymity | -8.042 |
favorite | -7.986 |
interstitial | -7.651 |
-) | -7.618 |
Token | be |
Token ID | 307 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
WAY | +5.880 |
PET | +5.499 |
ggle | +5.169 |
ARE | +5.123 |
respectively | +5.063 |
Neg logit contributions | |
ividual | -4.197 |
anonymity | -3.946 |
favorite | -3.860 |
important | -3.608 |
interstitial | -3.604 |
Token | seen |
Token ID | 1775 |
Feature activation | -2.42e+01 |
Pos logit contributions | |
WAY | +8.197 |
PET | +7.282 |
ggle | +6.608 |
respectively | +6.505 |
POL | +6.426 |
Neg logit contributions | |
ividual | -13.862 |
anonymity | -13.257 |
favorite | -12.950 |
interstitial | -12.793 |
-) | -12.417 |
Token | whether |
Token ID | 1771 |
Feature activation | -5.65e+00 |
Pos logit contributions | |
WAY | +11.726 |
respectively | +10.944 |
PET | +10.759 |
POL | +9.992 |
ARE | +9.801 |
Neg logit contributions | |
ividual | -19.435 |
interstitial | -18.551 |
anonymity | -18.077 |
favorite | -18.017 |
important | -17.449 |
Token | the |
Token ID | 262 |
Feature activation | -5.17e+00 |
Pos logit contributions | |
WAY | +4.639 |
PET | +4.279 |
ARE | +3.936 |
VER | +3.882 |
ggle | +3.861 |
Neg logit contributions | |
ividual | -4.424 |
anonymity | -4.289 |
favorite | -4.149 |
important | -3.961 |
-) | -3.909 |
Token | C |
Token ID | 327 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
WAY | +4.640 |
PET | +4.275 |
ARE | +3.951 |
VER | +3.910 |
ggle | +3.905 |
Neg logit contributions | |
ividual | -3.714 |
anonymity | -3.578 |
favorite | -3.446 |
important | -3.280 |
-) | -3.246 |
Token | UP |
Token ID | 8577 |
Feature activation | -6.42e+00 |
Pos logit contributions | |
WAY | +1.152 |
PET | +1.038 |
ARE | +0.945 |
VER | +0.926 |
ggle | +0.921 |
Neg logit contributions | |
ividual | -1.484 |
anonymity | -1.461 |
favorite | -1.388 |
important | -1.349 |
-) | -1.327 |
Token | will |
Token ID | 481 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
WAY | +5.013 |
PET | +4.627 |
ARE | +4.228 |
VER | +4.175 |
ggle | +4.172 |
Neg logit contributions | |
ividual | -5.270 |
anonymity | -5.153 |
favorite | -4.945 |
important | -4.777 |
-) | -4.672 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+00 |
Pos logit contributions | |
WAY | +1.184 |
PET | +1.066 |
ARE | +0.956 |
VER | +0.939 |
TW | +0.936 |
Neg logit contributions | |
ividual | -1.755 |
anonymity | -1.699 |
favorite | -1.589 |
interstitial | -1.556 |
important | -1.549 |
Token | He |
Token ID | 1544 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
WAY | +2.962 |
PET | +2.683 |
ARE | +2.411 |
VER | +2.362 |
TW | +2.343 |
Neg logit contributions | |
ividual | -4.025 |
anonymity | -3.911 |
favorite | -3.667 |
important | -3.583 |
-) | -3.550 |
Token | then |
Token ID | 788 |
Feature activation | -5.91e+00 |
Pos logit contributions | |
WAY | +2.459 |
PET | +2.272 |
ARE | +2.106 |
ggle | +2.086 |
VER | +2.074 |
Neg logit contributions | |
ividual | -1.920 |
anonymity | -1.877 |
favorite | -1.772 |
important | -1.706 |
-) | -1.681 |
Token | asks |
Token ID | 7893 |
Feature activation | -1.69e+01 |
Pos logit contributions | |
WAY | +5.053 |
PET | +4.657 |
ggle | +4.271 |
ARE | +4.270 |
strides | +4.252 |
Neg logit contributions | |
ividual | -4.432 |
anonymity | -4.222 |
favorite | -4.098 |
important | -3.919 |
interstitial | -3.861 |
Token | : |
Token ID | 25 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
WAY | +10.272 |
PET | +9.087 |
respectively | +8.700 |
ARE | +8.504 |
POL | +8.395 |
Neg logit contributions | |
ividual | -14.532 |
favorite | -13.459 |
anonymity | -12.961 |
interstitial | -12.897 |
-) | -12.745 |
Token | " |
Token ID | 366 |
Feature activation | -2.40e+01 |
Pos logit contributions | |
WAY | +9.506 |
PET | +8.551 |
ARE | +8.294 |
respectively | +7.898 |
TW | +7.487 |
Neg logit contributions | |
ividual | -18.503 |
anonymity | -17.323 |
favorite | -17.058 |
interstitial | -16.822 |
important | -16.358 |
Token | Is |
Token ID | 3792 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
WAY | +14.206 |
PET | +13.630 |
ARE | +12.794 |
Are | +12.371 |
VER | +12.056 |
Neg logit contributions | |
ividual | -20.221 |
anonymity | -18.453 |
interstitial | -16.734 |
umatic | -16.667 |
romeda | -16.237 |
Token | there |
Token ID | 612 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
anonymity | +2.265 |
ividual | +2.219 |
favorite | +2.065 |
important | +2.026 |
-) | +2.000 |
Neg logit contributions | |
WAY | -2.833 |
PET | -2.603 |
ARE | -2.430 |
ggle | -2.394 |
TW | -2.363 |
Token | really |
Token ID | 1107 |
Feature activation | -6.47e+00 |
Pos logit contributions | |
WAY | +7.502 |
PET | +6.694 |
VER | +6.167 |
ARE | +6.065 |
respectively | +6.013 |
Neg logit contributions | |
ividual | -10.428 |
favorite | -9.896 |
anonymity | -9.451 |
interstitial | -9.409 |
important | -9.244 |
Token | such |
Token ID | 884 |
Feature activation | -3.74e+00 |
Pos logit contributions | |
WAY | +4.736 |
PET | +4.255 |
ARE | +3.895 |
VER | +3.889 |
ggle | +3.850 |
Neg logit contributions | |
ividual | -5.669 |
favorite | -5.333 |
anonymity | -5.322 |
important | -5.060 |
-) | -5.044 |
Token | a |
Token ID | 257 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
WAY | +2.746 |
PET | +2.481 |
ARE | +2.274 |
ggle | +2.220 |
VER | +2.220 |
Neg logit contributions | |
ividual | -3.318 |
anonymity | -3.217 |
favorite | -3.115 |
important | -3.007 |
-) | -2.983 |
Token | both |
Token ID | 1111 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
ividual | +0.487 |
anonymity | +0.486 |
favorite | +0.459 |
important | +0.446 |
-) | +0.444 |
Neg logit contributions | |
WAY | -0.406 |
PET | -0.370 |
ARE | -0.337 |
ggle | -0.329 |
VER | -0.328 |
Token | Fedora |
Token ID | 32245 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
WAY | +2.515 |
PET | +2.286 |
ARE | +2.083 |
ggle | +2.048 |
VER | +2.045 |
Neg logit contributions | |
ividual | -2.873 |
anonymity | -2.807 |
favorite | -2.681 |
important | -2.606 |
-) | -2.572 |
Token | and |
Token ID | 290 |
Feature activation | -2.48e+00 |
Pos logit contributions | |
ividual | +0.818 |
anonymity | +0.812 |
favorite | +0.764 |
important | +0.742 |
-) | +0.735 |
Neg logit contributions | |
WAY | -0.846 |
PET | -0.775 |
ARE | -0.716 |
ggle | -0.716 |
TW | -0.700 |
Token | Ubuntu |
Token ID | 14949 |
Feature activation | -7.20e+00 |
Pos logit contributions | |
WAY | +1.751 |
PET | +1.576 |
ARE | +1.426 |
ggle | +1.400 |
VER | +1.393 |
Neg logit contributions | |
ividual | -2.288 |
anonymity | -2.256 |
favorite | -2.151 |
important | -2.094 |
-) | -2.073 |
Token | to |
Token ID | 284 |
Feature activation | -5.11e+00 |
Pos logit contributions | |
WAY | +5.579 |
PET | +5.028 |
respectively | +4.680 |
VER | +4.599 |
ARE | +4.572 |
Neg logit contributions | |
ividual | -6.006 |
anonymity | -5.772 |
favorite | -5.590 |
important | -5.351 |
-) | -5.309 |
Token | see |
Token ID | 766 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
WAY | +3.833 |
PET | +3.461 |
ggle | +3.170 |
ARE | +3.159 |
VER | +3.097 |
Neg logit contributions | |
ividual | -4.437 |
anonymity | -4.289 |
favorite | -4.142 |
important | -4.011 |
-) | -3.928 |
Token | how |
Token ID | 703 |
Feature activation | -8.64e+00 |
Pos logit contributions | |
WAY | +10.622 |
respectively | +10.149 |
strides | +8.947 |
ARE | +8.944 |
lengths | +8.926 |
Neg logit contributions | |
ividual | -20.424 |
interstitial | -19.203 |
favorite | -18.585 |
anonymity | -18.389 |
important | -18.098 |
Token | this |
Token ID | 428 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
WAY | +6.880 |
PET | +6.337 |
respectively | +5.884 |
ggle | +5.878 |
VER | +5.853 |
Neg logit contributions | |
ividual | -6.721 |
anonymity | -6.328 |
favorite | -6.245 |
interstitial | -5.906 |
important | -5.889 |
Token | uns |
Token ID | 5576 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
WAY | +1.245 |
PET | +1.138 |
ARE | +1.049 |
ggle | +1.032 |
VER | +1.027 |
Neg logit contributions | |
ividual | -1.192 |
anonymity | -1.177 |
favorite | -1.110 |
important | -1.076 |
-) | -1.065 |
Token | ung |
Token ID | 2150 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
ividual | +6.767 |
anonymity | +6.597 |
cient | +6.426 |
important | +6.376 |
favorite | +6.225 |
Neg logit contributions | |
WAY | -10.293 |
PET | -9.493 |
ggle | -8.901 |
ARE | -8.876 |
ISON | -8.722 |
Token | third |
Token ID | 2368 |
Feature activation | +5.97e+00 |
Pos logit contributions | |
anonymity | +9.097 |
ividual | +8.490 |
favorite | +8.164 |
important | +7.843 |
-) | +7.824 |
Neg logit contributions | |
WAY | -8.743 |
PET | -7.898 |
ARE | -7.306 |
Charges | -7.185 |
VERT | -7.080 |
Token | people |
Token ID | 661 |
Feature activation | +2.77e+00 |
Pos logit contributions | |
anonymity | +2.362 |
ividual | +2.345 |
favorite | +2.237 |
important | +2.184 |
-) | +2.134 |
Neg logit contributions | |
WAY | -1.668 |
PET | -1.527 |
ARE | -1.345 |
ggle | -1.340 |
VER | -1.317 |
Token | were |
Token ID | 547 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
anonymity | +2.259 |
ividual | +2.233 |
favorite | +2.120 |
important | +2.047 |
-) | +2.022 |
Neg logit contributions | |
WAY | -2.213 |
PET | -2.028 |
ARE | -1.843 |
VERT | -1.810 |
VER | -1.806 |
Token | asking |
Token ID | 4737 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
WAY | +1.188 |
PET | +1.095 |
ARE | +1.015 |
ggle | +1.001 |
VER | +0.997 |
Neg logit contributions | |
ividual | -0.975 |
anonymity | -0.959 |
favorite | -0.902 |
important | -0.872 |
-) | -0.861 |
Token | me |
Token ID | 502 |
Feature activation | -7.78e+00 |
Pos logit contributions | |
WAY | +8.566 |
PET | +7.277 |
ARE | +6.911 |
VER | +6.875 |
respectively | +6.854 |
Neg logit contributions | |
ividual | -12.654 |
favorite | -11.570 |
anonymity | -11.474 |
interstitial | -11.355 |
-) | -11.211 |
Token | , |
Token ID | 11 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
WAY | +5.370 |
PET | +4.814 |
ARE | +4.429 |
VER | +4.375 |
respectively | +4.311 |
Neg logit contributions | |
ividual | -7.046 |
anonymity | -6.724 |
favorite | -6.554 |
important | -6.326 |
-) | -6.271 |
Token | ' |
Token ID | 705 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
WAY | +9.970 |
PET | +8.546 |
ARE | +8.395 |
respectively | +8.215 |
VER | +8.075 |
Neg logit contributions | |
ividual | -14.092 |
anonymity | -13.054 |
favorite | -12.815 |
important | -12.436 |
interstitial | -12.387 |
Token | how |
Token ID | 4919 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
WAY | +15.631 |
PET | +14.286 |
ARE | +14.273 |
Are | +13.861 |
Fuck | +13.487 |
Neg logit contributions | |
ividual | -17.271 |
anonymity | -16.010 |
umatic | -13.831 |
-) | -13.735 |
agascar | -13.677 |
Token | do |
Token ID | 466 |
Feature activation | -5.35e+00 |
Pos logit contributions | |
WAY | +7.178 |
PET | +6.567 |
ARE | +6.141 |
VER | +6.043 |
ggle | +5.815 |
Neg logit contributions | |
ividual | -11.371 |
anonymity | -10.629 |
favorite | -10.456 |
interstitial | -10.214 |
important | -9.986 |
Token | you |
Token ID | 345 |
Feature activation | -3.84e+00 |
Pos logit contributions | |
WAY | +3.800 |
PET | +3.410 |
ARE | +3.133 |
VER | +3.080 |
ggle | +3.052 |
Neg logit contributions | |
ividual | -4.824 |
anonymity | -4.705 |
favorite | -4.519 |
important | -4.386 |
-) | -4.356 |
Token | do |
Token ID | 466 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
WAY | +2.854 |
PET | +2.586 |
ARE | +2.340 |
ggle | +2.332 |
VER | +2.308 |
Neg logit contributions | |
ividual | -3.386 |
anonymity | -3.293 |
favorite | -3.153 |
important | -3.063 |
-) | -3.034 |
Token | your |
Token ID | 534 |
Feature activation | +5.34e+00 |
Pos logit contributions | |
anonymity | +1.452 |
ividual | +1.442 |
favorite | +1.352 |
important | +1.315 |
-) | +1.283 |
Neg logit contributions | |
WAY | -1.639 |
PET | -1.504 |
ARE | -1.392 |
ggle | -1.362 |
TW | -1.352 |
Token | . |
Token ID | 13 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
WAY | +6.530 |
PET | +5.731 |
ggle | +5.302 |
ARE | +5.282 |
respectively | +5.272 |
Neg logit contributions | |
ividual | -7.795 |
anonymity | -7.508 |
favorite | -7.167 |
-) | -6.995 |
important | -6.944 |
Token | It |
Token ID | 632 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
WAY | +1.045 |
PET | +0.953 |
ARE | +0.874 |
ggle | +0.862 |
VER | +0.854 |
Neg logit contributions | |
ividual | -1.100 |
anonymity | -1.087 |
favorite | -1.033 |
important | -1.004 |
-) | -0.993 |
Token | remains |
Token ID | 3793 |
Feature activation | -5.79e+00 |
Pos logit contributions | |
WAY | +1.264 |
PET | +1.156 |
ARE | +1.064 |
ggle | +1.047 |
VER | +1.042 |
Neg logit contributions | |
ividual | -1.232 |
anonymity | -1.213 |
favorite | -1.148 |
important | -1.114 |
-) | -1.101 |
Token | to |
Token ID | 284 |
Feature activation | -4.55e+00 |
Pos logit contributions | |
WAY | +4.515 |
PET | +4.059 |
ggle | +3.735 |
ARE | +3.728 |
VER | +3.696 |
Neg logit contributions | |
ividual | -4.900 |
anonymity | -4.667 |
favorite | -4.490 |
-) | -4.319 |
important | -4.308 |
Token | be |
Token ID | 307 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
WAY | +4.473 |
PET | +4.170 |
ARE | +3.910 |
ggle | +3.903 |
VER | +3.850 |
Neg logit contributions | |
ividual | -2.890 |
anonymity | -2.748 |
favorite | -2.608 |
important | -2.480 |
-) | -2.440 |
Token | seen |
Token ID | 1775 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
WAY | +8.000 |
PET | +6.954 |
ggle | +6.407 |
VER | +6.219 |
ARE | +6.157 |
Neg logit contributions | |
ividual | -13.876 |
anonymity | -13.212 |
favorite | -12.582 |
interstitial | -12.535 |
-) | -12.409 |
Token | whether |
Token ID | 1771 |
Feature activation | -6.85e+00 |
Pos logit contributions | |
WAY | +11.189 |
PET | +9.881 |
respectively | +9.732 |
ARE | +9.259 |
POL | +8.951 |
Neg logit contributions | |
ividual | -19.738 |
anonymity | -18.741 |
interstitial | -18.333 |
favorite | -17.808 |
pecially | -17.766 |
Token | this |
Token ID | 428 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
WAY | +4.996 |
PET | +4.509 |
ARE | +4.106 |
VER | +4.077 |
TW | +4.042 |
Neg logit contributions | |
ividual | -6.016 |
anonymity | -5.776 |
favorite | -5.629 |
important | -5.403 |
-) | -5.361 |
Token | sort |
Token ID | 3297 |
Feature activation | -6.94e-01 |
Pos logit contributions | |
anonymity | +1.691 |
ividual | +1.663 |
favorite | +1.575 |
important | +1.545 |
-) | +1.515 |
Neg logit contributions | |
WAY | -1.561 |
PET | -1.423 |
ARE | -1.301 |
ggle | -1.276 |
VERT | -1.273 |
Token | of |
Token ID | 286 |
Feature activation | +5.55e-01 |
Pos logit contributions | |
WAY | +0.540 |
PET | +0.492 |
ARE | +0.451 |
ggle | +0.441 |
VER | +0.440 |
Neg logit contributions | |
ividual | -0.592 |
anonymity | -0.579 |
favorite | -0.548 |
important | -0.532 |
-) | -0.525 |
Token | outside |
Token ID | 2354 |
Feature activation | +9.19e+00 |
Pos logit contributions | |
anonymity | +0.483 |
ividual | +0.477 |
favorite | +0.449 |
important | +0.440 |
-) | +0.433 |
Neg logit contributions | |
WAY | -0.422 |
PET | -0.383 |
ARE | -0.348 |
VER | -0.341 |
ggle | -0.340 |
Token | the |
Token ID | 262 |
Feature activation | +3.92e+00 |
Pos logit contributions | |
anonymity | +0.523 |
ividual | +0.516 |
favorite | +0.488 |
important | +0.472 |
-) | +0.463 |
Neg logit contributions | |
WAY | -0.547 |
PET | -0.497 |
ARE | -0.459 |
VERT | -0.448 |
VER | -0.444 |
Token | video |
Token ID | 2008 |
Feature activation | +2.42e+00 |
Pos logit contributions | |
anonymity | +3.400 |
ividual | +3.234 |
favorite | +3.106 |
important | +3.060 |
-) | +2.973 |
Neg logit contributions | |
WAY | -3.012 |
PET | -2.671 |
ARE | -2.473 |
VERT | -2.420 |
TW | -2.390 |
Token | can |
Token ID | 460 |
Feature activation | -6.58e+00 |
Pos logit contributions | |
anonymity | +1.843 |
ividual | +1.843 |
favorite | +1.700 |
important | +1.670 |
-) | +1.639 |
Neg logit contributions | |
WAY | -2.084 |
PET | -1.914 |
ARE | -1.748 |
VERT | -1.741 |
ggle | -1.727 |
Token | be |
Token ID | 307 |
Feature activation | -4.07e+00 |
Pos logit contributions | |
WAY | +6.367 |
PET | +5.944 |
ggle | +5.586 |
ARE | +5.520 |
VER | +5.504 |
Neg logit contributions | |
ividual | -4.112 |
anonymity | -4.012 |
favorite | -3.760 |
important | -3.584 |
-) | -3.499 |
Token | heard |
Token ID | 2982 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
WAY | +3.172 |
PET | +2.879 |
ARE | +2.648 |
ggle | +2.619 |
VER | +2.593 |
Neg logit contributions | |
ividual | -3.434 |
anonymity | -3.353 |
favorite | -3.191 |
important | -3.092 |
-) | -3.068 |
Token | asking |
Token ID | 4737 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
ividual | +0.819 |
anonymity | +0.818 |
favorite | +0.753 |
important | +0.731 |
-) | +0.716 |
Neg logit contributions | |
WAY | -1.133 |
PET | -1.051 |
ARE | -0.977 |
VERT | -0.959 |
TW | -0.955 |
Token | � |
Token ID | 564 |
Feature activation | -4.37e+00 |
Pos logit contributions | |
WAY | +14.706 |
POL | +13.272 |
PET | +13.089 |
Defendant | +13.006 |
Defendants | +12.653 |
Neg logit contributions | |
ividual | -16.525 |
favorite | -15.692 |
-) | -15.070 |
important | -14.831 |
anonymity | -14.810 |
Token | � |
Token ID | 250 |
Feature activation | -6.45e+00 |
Pos logit contributions | |
WAY | +2.386 |
PET | +2.086 |
ARE | +1.822 |
ggle | +1.781 |
VER | +1.766 |
Neg logit contributions | |
ividual | -4.721 |
anonymity | -4.651 |
favorite | -4.433 |
important | -4.346 |
-) | -4.304 |
Token | What |
Token ID | 2061 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
WAY | +5.490 |
PET | +5.059 |
ARE | +4.687 |
VER | +4.636 |
ggle | +4.579 |
Neg logit contributions | |
ividual | -4.949 |
anonymity | -4.847 |
favorite | -4.500 |
important | -4.352 |
-) | -4.321 |
Token | flavor |
Token ID | 9565 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
WAY | +11.156 |
PET | +10.345 |
ARE | +9.878 |
VER | +9.765 |
POL | +9.710 |
Neg logit contributions | |
ividual | -11.112 |
anonymity | -10.455 |
favorite | -10.241 |
interstitial | -10.003 |
important | -9.885 |
Token | ? |
Token ID | 30 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
WAY | +8.531 |
PET | +7.884 |
ARE | +7.487 |
ggle | +7.304 |
VER | +7.260 |
Neg logit contributions | |
ividual | -7.869 |
anonymity | -7.616 |
favorite | -7.122 |
interstitial | -7.119 |
important | -7.037 |
Token | to |
Token ID | 284 |
Feature activation | -9.15e+00 |
Pos logit contributions | |
WAY | +3.126 |
PET | +2.858 |
ARE | +2.622 |
ggle | +2.579 |
VER | +2.573 |
Neg logit contributions | |
ividual | -3.195 |
anonymity | -3.138 |
favorite | -2.984 |
important | -2.893 |
-) | -2.858 |
Token | exercise |
Token ID | 5517 |
Feature activation | +4.55e+00 |
Pos logit contributions | |
WAY | +6.198 |
PET | +5.629 |
TW | +5.031 |
respectively | +5.016 |
ggle | +4.993 |
Neg logit contributions | |
ividual | -8.235 |
anonymity | -8.073 |
favorite | -7.793 |
important | -7.575 |
interstitial | -7.526 |
Token | that |
Token ID | 326 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
anonymity | +3.985 |
ividual | +3.884 |
favorite | +3.644 |
important | +3.576 |
-) | +3.504 |
Neg logit contributions | |
WAY | -3.409 |
PET | -3.078 |
ARE | -2.834 |
ggle | -2.788 |
VERT | -2.717 |
Token | discretion |
Token ID | 14130 |
Feature activation | +6.75e+00 |
Pos logit contributions | |
anonymity | +6.022 |
ividual | +5.684 |
important | +5.290 |
favorite | +5.201 |
-) | +4.831 |
Neg logit contributions | |
WAY | -10.133 |
PET | -9.302 |
ARE | -8.917 |
VERT | -8.911 |
TW | -8.833 |
Token | will |
Token ID | 481 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
anonymity | +4.810 |
ividual | +4.786 |
important | +4.374 |
favorite | +4.296 |
-) | +4.216 |
Neg logit contributions | |
WAY | -5.952 |
PET | -5.454 |
ARE | -5.127 |
VERT | -5.109 |
TW | -4.945 |
Token | determine |
Token ID | 5004 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
WAY | +1.007 |
PET | +0.925 |
ARE | +0.856 |
ggle | +0.842 |
VER | +0.839 |
Neg logit contributions | |
ividual | -0.878 |
anonymity | -0.865 |
favorite | -0.814 |
important | -0.790 |
-) | -0.780 |
Token | Bob |
Token ID | 5811 |
Feature activation | -5.55e+00 |
Pos logit contributions | |
WAY | +12.466 |
PET | +11.093 |
respectively | +10.878 |
Defendant | +10.842 |
lengths | +10.682 |
Neg logit contributions | |
ividual | -17.785 |
interstitial | -16.826 |
favorite | -16.583 |
anonymity | -16.547 |
-) | -16.110 |
Token | McDonnell |
Token ID | 39441 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
WAY | +2.749 |
PET | +2.436 |
ARE | +2.057 |
VER | +2.021 |
ggle | +2.002 |
Neg logit contributions | |
ividual | -6.106 |
anonymity | -6.095 |
favorite | -5.847 |
important | -5.684 |
-) | -5.654 |
Token | � |
Token ID | 447 |
Feature activation | +2.54e+00 |
Pos logit contributions | |
WAY | +11.588 |
PET | +10.727 |
TW | +10.083 |
VER | +10.076 |
POL | +9.941 |
Neg logit contributions | |
ividual | -8.433 |
anonymity | -8.316 |
favorite | -7.895 |
important | -7.657 |
-) | -7.572 |
Token | � |
Token ID | 247 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
ividual | +2.294 |
anonymity | +2.264 |
favorite | +2.166 |
important | +2.104 |
-) | +2.089 |
Neg logit contributions | |
WAY | -1.828 |
PET | -1.651 |
ARE | -1.498 |
ggle | -1.468 |
VER | -1.464 |
Token | s |
Token ID | 82 |
Feature activation | -1.45e+01 |
Pos logit contributions | |
WAY | +3.048 |
PET | +2.816 |
ARE | +2.602 |
ggle | +2.574 |
VER | +2.571 |
Neg logit contributions | |
ividual | -2.479 |
anonymity | -2.441 |
favorite | -2.285 |
important | -2.210 |
-) | -2.184 |
Token | yet |
Token ID | 1865 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
anonymity | +1.887 |
ividual | +1.880 |
favorite | +1.766 |
important | +1.707 |
-) | +1.683 |
Neg logit contributions | |
WAY | -2.040 |
PET | -1.897 |
ARE | -1.726 |
ggle | -1.698 |
VERT | -1.697 |
Token | again |
Token ID | 757 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
WAY | +2.098 |
PET | +1.891 |
ARE | +1.714 |
ggle | +1.688 |
VER | +1.674 |
Neg logit contributions | |
ividual | -2.735 |
anonymity | -2.693 |
favorite | -2.571 |
important | -2.501 |
-) | -2.477 |
Token | today |
Token ID | 1909 |
Feature activation | +6.02e-01 |
Pos logit contributions | |
WAY | +2.249 |
PET | +2.045 |
ARE | +1.888 |
ggle | +1.859 |
VER | +1.854 |
Neg logit contributions | |
ividual | -2.251 |
anonymity | -2.209 |
favorite | -2.097 |
important | -2.030 |
-) | -2.010 |
Token | , |
Token ID | 11 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
ividual | +0.461 |
anonymity | +0.457 |
favorite | +0.428 |
important | +0.416 |
-) | +0.409 |
Neg logit contributions | |
WAY | -0.517 |
PET | -0.477 |
ARE | -0.438 |
ggle | -0.432 |
VER | -0.429 |
Token | and |
Token ID | 290 |
Feature activation | -3.77e+00 |
Pos logit contributions | |
ividual | +0.824 |
anonymity | +0.821 |
favorite | +0.768 |
important | +0.744 |
-) | +0.734 |
Neg logit contributions | |
WAY | -0.891 |
PET | -0.815 |
ARE | -0.751 |
ggle | -0.744 |
VERT | -0.736 |
Token | wonders |
Token ID | 19294 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
WAY | +2.935 |
PET | +2.669 |
ARE | +2.457 |
ggle | +2.415 |
VER | +2.397 |
Neg logit contributions | |
ividual | -3.179 |
anonymity | -3.103 |
favorite | -2.959 |
important | -2.877 |
-) | -2.839 |
Token | what |
Token ID | 644 |
Feature activation | -7.93e+00 |
Pos logit contributions | |
WAY | +11.525 |
respectively | +10.542 |
ARE | +9.975 |
PET | +9.920 |
POL | +9.767 |
Neg logit contributions | |
ividual | -18.897 |
anonymity | -17.211 |
interstitial | -17.177 |
favorite | -16.623 |
important | -16.244 |
Token | is |
Token ID | 318 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
WAY | +6.080 |
PET | +5.550 |
ARE | +5.210 |
VER | +5.081 |
strides | +5.011 |
Neg logit contributions | |
ividual | -6.645 |
anonymity | -6.257 |
favorite | -6.139 |
important | -5.904 |
-) | -5.841 |
Token | to |
Token ID | 284 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
anonymity | +1.384 |
ividual | +1.368 |
favorite | +1.290 |
important | +1.276 |
-) | +1.241 |
Neg logit contributions | |
WAY | -1.635 |
PET | -1.513 |
ARE | -1.390 |
ggle | -1.370 |
VERT | -1.362 |
Token | be |
Token ID | 307 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
ividual | +0.899 |
anonymity | +0.893 |
favorite | +0.833 |
important | +0.815 |
-) | +0.795 |
Neg logit contributions | |
WAY | -1.082 |
PET | -0.996 |
ARE | -0.910 |
VER | -0.905 |
VERT | -0.902 |
Token | done |
Token ID | 1760 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
ividual | +1.438 |
anonymity | +1.434 |
favorite | +1.358 |
important | +1.317 |
-) | +1.282 |
Neg logit contributions | |
WAY | -1.794 |
PET | -1.659 |
ARE | -1.526 |
ggle | -1.522 |
VER | -1.504 |
Token | where |
Token ID | 810 |
Feature activation | -7.30e+00 |
Pos logit contributions | |
WAY | +3.147 |
PET | +2.854 |
ARE | +2.596 |
VER | +2.558 |
ggle | +2.557 |
Neg logit contributions | |
ividual | -3.671 |
anonymity | -3.573 |
favorite | -3.410 |
important | -3.311 |
-) | -3.259 |
Token | things |
Token ID | 1243 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
WAY | +4.907 |
PET | +4.404 |
ARE | +4.017 |
VER | +3.961 |
ggle | +3.936 |
Neg logit contributions | |
ividual | -6.782 |
anonymity | -6.483 |
favorite | -6.320 |
important | -6.126 |
-) | -6.018 |
Token | seem |
Token ID | 1283 |
Feature activation | -6.50e+00 |
Pos logit contributions | |
WAY | +1.998 |
PET | +1.833 |
ARE | +1.694 |
ggle | +1.669 |
VER | +1.662 |
Neg logit contributions | |
ividual | -1.795 |
anonymity | -1.765 |
favorite | -1.668 |
important | -1.613 |
-) | -1.593 |
Token | to |
Token ID | 284 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
WAY | +5.096 |
PET | +4.605 |
ARE | +4.245 |
ggle | +4.222 |
VER | +4.206 |
Neg logit contributions | |
ividual | -5.446 |
anonymity | -5.268 |
favorite | -4.979 |
important | -4.804 |
interstitial | -4.740 |
Token | be |
Token ID | 307 |
Feature activation | -7.13e+00 |
Pos logit contributions | |
WAY | +1.826 |
PET | +1.687 |
ARE | +1.569 |
ggle | +1.548 |
VER | +1.541 |
Neg logit contributions | |
ividual | -1.381 |
anonymity | -1.358 |
favorite | -1.274 |
important | -1.229 |
-) | -1.213 |
Token | going |
Token ID | 1016 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
WAY | +6.263 |
PET | +5.728 |
ggle | +5.294 |
ARE | +5.281 |
VER | +5.267 |
Neg logit contributions | |
ividual | -5.320 |
anonymity | -5.060 |
favorite | -4.734 |
important | -4.555 |
interstitial | -4.473 |
Token | comparatively |
Token ID | 31188 |
Feature activation | -1.52e+01 |
Pos logit contributions | |
WAY | +13.548 |
respectively | +12.112 |
PET | +11.668 |
VER | +11.657 |
ggle | +11.593 |
Neg logit contributions | |
ividual | -18.658 |
interstitial | -16.586 |
anonymity | -16.370 |
favorite | -15.646 |
inav | -15.512 |
Token | well |
Token ID | 880 |
Feature activation | -9.42e+00 |
Pos logit contributions | |
WAY | +8.408 |
PET | +7.134 |
respectively | +6.723 |
VER | +6.722 |
ggle | +6.679 |
Neg logit contributions | |
ividual | -15.595 |
interstitial | -14.082 |
anonymity | -13.937 |
favorite | -13.540 |
important | -13.349 |
Token | ). |
Token ID | 737 |
Feature activation | -5.24e+00 |
Pos logit contributions | |
WAY | +7.352 |
PET | +6.588 |
respectively | +6.118 |
VER | +6.099 |
ARE | +6.018 |
Neg logit contributions | |
ividual | -7.679 |
anonymity | -7.393 |
favorite | -6.984 |
interstitial | -6.778 |
important | -6.726 |
Token |
|
Token ID | 198 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
WAY | +3.782 |
PET | +3.406 |
ARE | +3.130 |
VER | +3.045 |
TW | +3.020 |
Neg logit contributions | |
ividual | -4.802 |
anonymity | -4.669 |
favorite | -4.371 |
important | -4.237 |
interstitial | -4.212 |
Token |
|
Token ID | 198 |
Feature activation | -2.84e+00 |
Pos logit contributions | |
WAY | +1.240 |
PET | +1.114 |
ARE | +1.001 |
VER | +0.986 |
TW | +0.976 |
Neg logit contributions | |
ividual | -1.832 |
anonymity | -1.774 |
favorite | -1.657 |
interstitial | -1.621 |
important | -1.614 |
Token | frequency |
Token ID | 8373 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
anonymity | +1.436 |
ividual | +1.418 |
favorite | +1.336 |
important | +1.306 |
-) | +1.286 |
Neg logit contributions | |
WAY | -1.463 |
PET | -1.356 |
ARE | -1.234 |
ggle | -1.226 |
VER | -1.210 |
Token | , |
Token ID | 11 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
WAY | +1.472 |
PET | +1.344 |
ARE | +1.238 |
ggle | +1.219 |
VER | +1.213 |
Neg logit contributions | |
ividual | -1.439 |
anonymity | -1.413 |
favorite | -1.340 |
important | -1.297 |
-) | -1.283 |
Token | and |
Token ID | 290 |
Feature activation | +6.69e+00 |
Pos logit contributions | |
anonymity | +1.437 |
ividual | +1.418 |
favorite | +1.326 |
important | +1.301 |
-) | +1.284 |
Neg logit contributions | |
WAY | -1.613 |
PET | -1.495 |
ARE | -1.382 |
ggle | -1.366 |
VER | -1.342 |
Token | asked |
Token ID | 1965 |
Feature activation | -8.80e+00 |
Pos logit contributions | |
anonymity | +5.234 |
ividual | +5.002 |
important | +4.673 |
favorite | +4.668 |
-) | +4.595 |
Neg logit contributions | |
WAY | -5.271 |
PET | -4.932 |
ggle | -4.521 |
ARE | -4.485 |
VERT | -4.376 |
Token | , |
Token ID | 11 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
WAY | +6.204 |
PET | +5.512 |
ARE | +5.127 |
respectively | +4.998 |
TW | +4.967 |
Neg logit contributions | |
ividual | -7.843 |
anonymity | -7.476 |
favorite | -7.368 |
important | -7.077 |
-) | -7.001 |
Token | " |
Token ID | 366 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
WAY | +10.190 |
PET | +8.927 |
ARE | +8.563 |
respectively | +8.485 |
VER | +8.141 |
Neg logit contributions | |
ividual | -13.735 |
anonymity | -13.003 |
favorite | -12.631 |
interstitial | -12.360 |
important | -12.136 |
Token | Ron |
Token ID | 23672 |
Feature activation | -3.78e+00 |
Pos logit contributions | |
WAY | +15.735 |
PET | +14.630 |
ARE | +14.133 |
TW | +13.345 |
Are | +13.228 |
Neg logit contributions | |
ividual | -16.718 |
anonymity | -15.735 |
interstitial | -13.801 |
-) | -13.335 |
umatic | -13.240 |
Token | . |
Token ID | 13 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
WAY | +2.905 |
PET | +2.641 |
ARE | +2.412 |
ggle | +2.372 |
VER | +2.364 |
Neg logit contributions | |
ividual | -3.244 |
anonymity | -3.196 |
favorite | -3.034 |
important | -2.938 |
-) | -2.912 |
Token | This |
Token ID | 770 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
WAY | +9.061 |
PET | +8.193 |
ARE | +7.680 |
POL | +7.369 |
TW | +7.303 |
Neg logit contributions | |
ividual | -12.242 |
anonymity | -11.618 |
favorite | -10.828 |
interstitial | -10.766 |
important | -10.603 |
Token | is |
Token ID | 318 |
Feature activation | -4.73e+00 |
Pos logit contributions | |
WAY | +1.770 |
PET | +1.611 |
ARE | +1.480 |
ggle | +1.455 |
VER | +1.449 |
Neg logit contributions | |
ividual | -1.843 |
anonymity | -1.810 |
favorite | -1.721 |
important | -1.668 |
-) | -1.651 |
Token | George |
Token ID | 4502 |
Feature activation | -4.97e+00 |
Pos logit contributions | |
WAY | +3.632 |
PET | +3.281 |
ARE | +3.009 |
ggle | +2.943 |
VER | +2.941 |
Neg logit contributions | |
ividual | -4.064 |
anonymity | -3.942 |
favorite | -3.783 |
important | -3.642 |
-) | -3.626 |
Token | So |
Token ID | 1406 |
Feature activation | -4.49e-01 |
Pos logit contributions | |
ividual | +2.036 |
anonymity | +2.028 |
favorite | +1.933 |
important | +1.899 |
-) | +1.888 |
Neg logit contributions | |
WAY | -2.328 |
PET | -2.135 |
ggle | -1.987 |
ARE | -1.978 |
VER | -1.933 |
Token | , |
Token ID | 11 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
WAY | +0.365 |
PET | +0.332 |
ARE | +0.304 |
ggle | +0.301 |
VER | +0.298 |
Neg logit contributions | |
ividual | -0.367 |
anonymity | -0.363 |
favorite | -0.341 |
important | -0.334 |
-) | -0.330 |
Token | one |
Token ID | 530 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
WAY | +1.223 |
PET | +1.118 |
ARE | +1.028 |
ggle | +1.013 |
VER | +1.007 |
Neg logit contributions | |
ividual | -1.192 |
anonymity | -1.176 |
favorite | -1.110 |
important | -1.079 |
-) | -1.066 |
Token | might |
Token ID | 1244 |
Feature activation | +4.27e+00 |
Pos logit contributions | |
WAY | +1.390 |
PET | +1.270 |
ARE | +1.165 |
ggle | +1.144 |
VER | +1.140 |
Neg logit contributions | |
ividual | -1.433 |
anonymity | -1.419 |
favorite | -1.338 |
important | -1.303 |
-) | -1.290 |
Token | ask |
Token ID | 1265 |
Feature activation | -1.88e+01 |
Pos logit contributions | |
anonymity | +3.415 |
ividual | +3.404 |
favorite | +3.216 |
-) | +3.164 |
important | +3.121 |
Neg logit contributions | |
WAY | -3.421 |
PET | -3.141 |
ARE | -2.883 |
VER | -2.822 |
VERT | -2.813 |
Token | , |
Token ID | 11 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
WAY | +10.746 |
PET | +9.379 |
respectively | +9.077 |
ARE | +8.791 |
VER | +8.784 |
Neg logit contributions | |
ividual | -16.540 |
interstitial | -15.269 |
favorite | -15.182 |
anonymity | -15.109 |
important | -14.356 |
Token | why |
Token ID | 1521 |
Feature activation | -9.46e+00 |
Pos logit contributions | |
WAY | +12.153 |
PET | +11.029 |
respectively | +10.952 |
ARE | +10.521 |
POL | +10.424 |
Neg logit contributions | |
ividual | -18.167 |
interstitial | -16.806 |
favorite | -16.505 |
anonymity | -16.162 |
important | -15.485 |
Token | go |
Token ID | 467 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
WAY | +6.893 |
PET | +6.371 |
VER | +5.859 |
ggle | +5.790 |
VERT | +5.777 |
Neg logit contributions | |
ividual | -7.967 |
favorite | -7.404 |
anonymity | -7.375 |
interstitial | -7.139 |
important | -7.051 |
Token | that |
Token ID | 326 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
WAY | +1.640 |
PET | +1.494 |
ARE | +1.371 |
ggle | +1.355 |
VER | +1.345 |
Neg logit contributions | |
ividual | -1.714 |
anonymity | -1.685 |
favorite | -1.601 |
important | -1.551 |
-) | -1.534 |
Token | one |
Token ID | 530 |
Feature activation | +3.30e+00 |
Pos logit contributions | |
anonymity | +1.727 |
ividual | +1.706 |
favorite | +1.614 |
important | +1.586 |
-) | +1.579 |
Neg logit contributions | |
WAY | -1.498 |
PET | -1.372 |
ARE | -1.256 |
VER | -1.218 |
VERT | -1.216 |
Token | small |
Token ID | 1402 |
Feature activation | +9.02e-01 |
Pos logit contributions | |
anonymity | +2.949 |
ividual | +2.945 |
favorite | +2.765 |
-) | +2.738 |
important | +2.734 |
Neg logit contributions | |
WAY | -2.292 |
PET | -2.099 |
ARE | -1.936 |
ggle | -1.868 |
VER | -1.859 |
Token | it |
Token ID | 340 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
WAY | +5.933 |
PET | +5.354 |
ARE | +4.979 |
VER | +4.942 |
TW | +4.804 |
Neg logit contributions | |
ividual | -7.098 |
anonymity | -6.789 |
favorite | -6.613 |
important | -6.320 |
-) | -6.278 |
Token | did |
Token ID | 750 |
Feature activation | -6.62e-01 |
Pos logit contributions | |
WAY | +2.234 |
PET | +2.053 |
ARE | +1.898 |
ggle | +1.869 |
VER | +1.866 |
Neg logit contributions | |
ividual | -1.986 |
anonymity | -1.955 |
favorite | -1.846 |
important | -1.782 |
-) | -1.763 |
Token | , |
Token ID | 11 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
WAY | +0.561 |
PET | +0.513 |
ARE | +0.473 |
ggle | +0.467 |
VER | +0.463 |
Neg logit contributions | |
ividual | -0.518 |
anonymity | -0.510 |
favorite | -0.480 |
important | -0.467 |
-) | -0.461 |
Token | Kaine |
Token ID | 37193 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
WAY | +3.458 |
PET | +3.148 |
ARE | +2.893 |
VER | +2.838 |
ggle | +2.824 |
Neg logit contributions | |
ividual | -3.702 |
anonymity | -3.628 |
favorite | -3.459 |
important | -3.346 |
-) | -3.309 |
Token | asked |
Token ID | 1965 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
ividual | +1.238 |
anonymity | +1.226 |
favorite | +1.148 |
important | +1.122 |
-) | +1.111 |
Neg logit contributions | |
WAY | -1.414 |
PET | -1.301 |
ARE | -1.200 |
ggle | -1.176 |
VER | -1.170 |
Token | : |
Token ID | 25 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
WAY | +11.265 |
PET | +10.028 |
VER | +9.490 |
POL | +9.430 |
respectively | +9.421 |
Neg logit contributions | |
ividual | -15.102 |
favorite | -13.838 |
anonymity | -13.814 |
interstitial | -13.234 |
important | -13.096 |
Token | � |
Token ID | 564 |
Feature activation | -9.39e+00 |
Pos logit contributions | |
WAY | +14.294 |
PET | +13.152 |
ARE | +12.934 |
VER | +12.304 |
POL | +12.280 |
Neg logit contributions | |
ividual | -16.003 |
anonymity | -15.254 |
favorite | -14.501 |
interstitial | -14.002 |
important | -13.860 |
Token | � |
Token ID | 250 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
WAY | +4.925 |
PET | +4.324 |
ARE | +3.807 |
ggle | +3.643 |
VER | +3.641 |
Neg logit contributions | |
ividual | -10.096 |
anonymity | -9.835 |
favorite | -9.210 |
-) | -9.067 |
important | -9.043 |
Token | It |
Token ID | 1026 |
Feature activation | -5.37e+00 |
Pos logit contributions | |
WAY | +11.271 |
PET | +10.482 |
ARE | +9.990 |
VER | +9.736 |
TW | +9.424 |
Neg logit contributions | |
ividual | -12.776 |
anonymity | -12.236 |
favorite | -10.892 |
-) | -10.737 |
interstitial | -10.695 |
Token | � |
Token ID | 447 |
Feature activation | +2.53e+00 |
Pos logit contributions | |
WAY | +4.298 |
PET | +3.958 |
ARE | +3.652 |
ggle | +3.608 |
VER | +3.603 |
Neg logit contributions | |
ividual | -4.266 |
anonymity | -4.226 |
favorite | -4.020 |
important | -3.837 |
-) | -3.818 |
Token | � |
Token ID | 247 |
Feature activation | +7.85e-01 |
Pos logit contributions | |
ividual | +2.551 |
anonymity | +2.523 |
favorite | +2.429 |
important | +2.378 |
-) | +2.360 |
Neg logit contributions | |
WAY | -1.540 |
PET | -1.367 |
ARE | -1.209 |
VER | -1.172 |
ggle | -1.169 |
Token | a |
Token ID | 64 |
Feature activation | +5.54e+00 |
Pos logit contributions | |
ividual | +3.607 |
anonymity | +3.569 |
favorite | +3.399 |
important | +3.356 |
-) | +3.195 |
Neg logit contributions | |
WAY | -4.979 |
PET | -4.698 |
ggle | -4.308 |
ARE | -4.287 |
VERT | -4.241 |
Token | does |
Token ID | 857 |
Feature activation | -7.67e+00 |
Pos logit contributions | |
anonymity | +3.152 |
ividual | +3.029 |
-) | +3.021 |
important | +2.867 |
favorite | +2.785 |
Neg logit contributions | |
WAY | -5.477 |
PET | -5.205 |
ggle | -4.972 |
TW | -4.804 |
AMY | -4.768 |
Token | opt |
Token ID | 2172 |
Feature activation | +5.36e+00 |
Pos logit contributions | |
WAY | +5.451 |
PET | +4.952 |
ARE | +4.546 |
ggle | +4.473 |
VER | +4.426 |
Neg logit contributions | |
ividual | -6.774 |
anonymity | -6.542 |
favorite | -6.336 |
important | -6.113 |
interstitial | -6.036 |
Token | in |
Token ID | 287 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
anonymity | +3.957 |
ividual | +3.808 |
favorite | +3.588 |
-) | +3.550 |
important | +3.545 |
Neg logit contributions | |
WAY | -4.647 |
PET | -4.303 |
ARE | -3.930 |
ggle | -3.903 |
VERT | -3.891 |
Token | : |
Token ID | 25 |
Feature activation | -3.77e+00 |
Pos logit contributions | |
ividual | +0.225 |
anonymity | +0.224 |
favorite | +0.210 |
important | +0.204 |
-) | +0.201 |
Neg logit contributions | |
WAY | -0.239 |
PET | -0.220 |
ARE | -0.202 |
ggle | -0.199 |
TW | -0.198 |
Token | what |
Token ID | 644 |
Feature activation | -2.21e+01 |
Pos logit contributions | |
WAY | +2.775 |
PET | +2.498 |
ARE | +2.290 |
VER | +2.237 |
ggle | +2.234 |
Neg logit contributions | |
ividual | -3.352 |
anonymity | -3.275 |
favorite | -3.142 |
important | -3.043 |
-) | -3.005 |
Token | does |
Token ID | 857 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
WAY | +12.850 |
PET | +11.597 |
lengths | +11.570 |
ARE | +11.360 |
strides | +11.241 |
Neg logit contributions | |
ividual | -17.899 |
interstitial | -16.367 |
favorite | -15.949 |
important | -15.405 |
inav | -15.239 |
Token | that |
Token ID | 326 |
Feature activation | +9.23e+00 |
Pos logit contributions | |
WAY | +0.290 |
PET | +0.265 |
ARE | +0.242 |
ggle | +0.239 |
VER | +0.237 |
Neg logit contributions | |
ividual | -0.292 |
anonymity | -0.291 |
favorite | -0.273 |
important | -0.266 |
-) | -0.263 |
Token | do |
Token ID | 466 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
anonymity | +7.166 |
ividual | +6.614 |
important | +6.150 |
-) | +6.132 |
favorite | +6.094 |
Neg logit contributions | |
WAY | -7.367 |
PET | -6.843 |
VERT | -6.257 |
ggle | -6.129 |
Charges | -6.072 |
Token | to |
Token ID | 284 |
Feature activation | -9.93e+00 |
Pos logit contributions | |
WAY | +1.456 |
PET | +1.335 |
ARE | +1.222 |
ggle | +1.208 |
VER | +1.196 |
Neg logit contributions | |
ividual | -1.441 |
anonymity | -1.422 |
favorite | -1.340 |
important | -1.304 |
-) | -1.287 |
Token | the |
Token ID | 262 |
Feature activation | -6.71e+00 |
Pos logit contributions | |
WAY | +6.463 |
PET | +5.602 |
ARE | +5.262 |
ggle | +5.068 |
VER | +5.068 |
Neg logit contributions | |
ividual | -9.107 |
favorite | -8.636 |
anonymity | -8.622 |
important | -8.279 |
-) | -8.171 |
Token | This |
Token ID | 1212 |
Feature activation | +3.75e+00 |
Pos logit contributions | |
WAY | +2.742 |
PET | +2.489 |
ARE | +2.268 |
VER | +2.220 |
TW | +2.209 |
Neg logit contributions | |
ividual | -3.276 |
anonymity | -3.212 |
favorite | -3.021 |
important | -2.938 |
-) | -2.910 |
Token | is |
Token ID | 318 |
Feature activation | -3.38e+00 |
Pos logit contributions | |
anonymity | +2.899 |
ividual | +2.899 |
favorite | +2.707 |
important | +2.655 |
-) | +2.600 |
Neg logit contributions | |
WAY | -3.120 |
PET | -2.847 |
ARE | -2.639 |
ggle | -2.622 |
VER | -2.581 |
Token | the |
Token ID | 262 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
WAY | +2.568 |
PET | +2.328 |
ARE | +2.127 |
ggle | +2.094 |
VER | +2.084 |
Neg logit contributions | |
ividual | -2.925 |
anonymity | -2.867 |
favorite | -2.737 |
important | -2.644 |
-) | -2.625 |
Token | first |
Token ID | 717 |
Feature activation | -8.10e+00 |
Pos logit contributions | |
anonymity | +1.025 |
ividual | +1.019 |
favorite | +0.958 |
important | +0.933 |
-) | +0.916 |
Neg logit contributions | |
WAY | -1.172 |
PET | -1.083 |
ARE | -1.001 |
ggle | -0.982 |
VER | -0.977 |
Token | time |
Token ID | 640 |
Feature activation | -9.76e+00 |
Pos logit contributions | |
WAY | +5.649 |
PET | +5.047 |
ARE | +4.590 |
VER | +4.578 |
ggle | +4.528 |
Neg logit contributions | |
ividual | -7.274 |
anonymity | -6.952 |
favorite | -6.801 |
important | -6.457 |
inav | -6.409 |
Token | in |
Token ID | 287 |
Feature activation | -2.21e+01 |
Pos logit contributions | |
WAY | +7.076 |
PET | +6.446 |
ARE | +5.886 |
VER | +5.858 |
TW | +5.849 |
Neg logit contributions | |
ividual | -8.308 |
anonymity | -7.968 |
favorite | -7.791 |
important | -7.472 |
-) | -7.363 |
Token | over |
Token ID | 625 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
WAY | +13.462 |
PET | +12.747 |
TW | +12.008 |
VER | +11.971 |
POL | +11.792 |
Neg logit contributions | |
ividual | -15.644 |
anonymity | -14.891 |
favorite | -14.791 |
important | -14.330 |
pecially | -14.125 |
Token | 80 |
Token ID | 4019 |
Feature activation | -8.05e+00 |
Pos logit contributions | |
ividual | +0.272 |
anonymity | +0.268 |
favorite | +0.254 |
important | +0.246 |
-) | +0.244 |
Neg logit contributions | |
WAY | -0.287 |
PET | -0.262 |
ARE | -0.242 |
ggle | -0.240 |
VER | -0.236 |
Token | years |
Token ID | 812 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
WAY | +3.675 |
PET | +3.201 |
ARE | +2.704 |
TW | +2.686 |
VER | +2.626 |
Neg logit contributions | |
ividual | -9.070 |
anonymity | -9.023 |
favorite | -8.604 |
important | -8.420 |
interstitial | -8.309 |
Token | that |
Token ID | 326 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
WAY | +10.827 |
PET | +10.087 |
TW | +9.222 |
ARE | +9.214 |
respectively | +9.169 |
Neg logit contributions | |
ividual | -9.803 |
anonymity | -9.360 |
favorite | -9.097 |
important | -8.716 |
-) | -8.554 |
Token | there |
Token ID | 612 |
Feature activation | -9.40e+00 |
Pos logit contributions | |
WAY | +1.755 |
PET | +1.591 |
ARE | +1.449 |
ggle | +1.424 |
VER | +1.418 |
Neg logit contributions | |
ividual | -2.059 |
anonymity | -2.028 |
favorite | -1.931 |
important | -1.876 |
-) | -1.857 |
Token | ." |
Token ID | 526 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
WAY | +2.906 |
PET | +2.639 |
ARE | +2.407 |
ggle | +2.369 |
VER | +2.367 |
Neg logit contributions | |
ividual | -3.233 |
anonymity | -3.181 |
favorite | -3.027 |
important | -2.931 |
-) | -2.913 |
Token |
|
Token ID | 198 |
Feature activation | -4.52e-01 |
Pos logit contributions | |
ividual | +1.053 |
anonymity | +1.036 |
favorite | +0.997 |
important | +0.969 |
-) | +0.961 |
Neg logit contributions | |
WAY | -0.969 |
PET | -0.888 |
ggle | -0.808 |
ARE | -0.806 |
VERT | -0.792 |
Token |
|
Token ID | 198 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
WAY | +0.314 |
PET | +0.283 |
ARE | +0.255 |
VER | +0.250 |
TW | +0.249 |
Neg logit contributions | |
ividual | -0.430 |
anonymity | -0.420 |
favorite | -0.396 |
important | -0.385 |
-) | -0.380 |
Token | It |
Token ID | 1026 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
WAY | +1.264 |
PET | +1.143 |
ARE | +1.040 |
ggle | +1.028 |
VER | +1.017 |
Neg logit contributions | |
ividual | -1.508 |
anonymity | -1.490 |
favorite | -1.423 |
important | -1.383 |
-) | -1.369 |
Token | 's |
Token ID | 338 |
Feature activation | +3.60e+00 |
Pos logit contributions | |
ividual | +1.897 |
anonymity | +1.878 |
favorite | +1.754 |
important | +1.715 |
-) | +1.704 |
Neg logit contributions | |
WAY | -2.237 |
PET | -2.058 |
ARE | -1.899 |
VERT | -1.863 |
ggle | -1.862 |
Token | worth |
Token ID | 2861 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
anonymity | +2.898 |
ividual | +2.853 |
important | +2.673 |
favorite | +2.652 |
-) | +2.579 |
Neg logit contributions | |
WAY | -2.927 |
PET | -2.699 |
ARE | -2.455 |
VERT | -2.423 |
ggle | -2.416 |
Token | noting |
Token ID | 10820 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
anonymity | +7.016 |
ividual | +6.139 |
important | +5.806 |
-) | +5.729 |
favorite | +5.274 |
Neg logit contributions | |
WAY | -13.398 |
PET | -12.674 |
VERT | -12.114 |
ggle | -11.822 |
Fuck | -11.774 |
Token | that |
Token ID | 326 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
WAY | +0.933 |
PET | +0.853 |
ARE | +0.783 |
ggle | +0.774 |
VER | +0.768 |
Neg logit contributions | |
ividual | -0.910 |
anonymity | -0.900 |
favorite | -0.847 |
important | -0.826 |
-) | -0.814 |
Token | there |
Token ID | 612 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
anonymity | +1.945 |
ividual | +1.930 |
favorite | +1.800 |
important | +1.770 |
-) | +1.751 |
Neg logit contributions | |
WAY | -1.926 |
PET | -1.779 |
ggle | -1.609 |
ARE | -1.605 |
VERT | -1.586 |
Token | are |
Token ID | 389 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
WAY | +9.974 |
PET | +8.934 |
respectively | +8.504 |
ARE | +8.497 |
VER | +8.375 |
Neg logit contributions | |
ividual | -13.721 |
anonymity | -13.287 |
favorite | -13.160 |
important | -12.834 |
interstitial | -12.768 |
Token | many |
Token ID | 867 |
Feature activation | -7.64e+00 |
Pos logit contributions | |
WAY | +10.059 |
PET | +8.751 |
strides | +8.617 |
respectively | +8.528 |
ARE | +8.479 |
Neg logit contributions | |
ividual | -12.537 |
favorite | -11.836 |
anonymity | -11.512 |
interstitial | -11.068 |
inav | -10.976 |
Token | year |
Token ID | 614 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
WAY | +2.639 |
PET | +2.219 |
ARE | +1.944 |
VER | +1.837 |
TW | +1.830 |
Neg logit contributions | |
ividual | -6.829 |
anonymity | -6.607 |
favorite | -6.458 |
important | -6.292 |
-) | -6.248 |
Token | , |
Token ID | 11 |
Feature activation | +4.85e+00 |
Pos logit contributions | |
WAY | +1.985 |
PET | +1.809 |
ARE | +1.658 |
VER | +1.629 |
ggle | +1.625 |
Neg logit contributions | |
ividual | -2.071 |
anonymity | -2.035 |
favorite | -1.936 |
important | -1.872 |
-) | -1.856 |
Token | contrary |
Token ID | 10388 |
Feature activation | -4.97e+00 |
Pos logit contributions | |
anonymity | +4.046 |
ividual | +3.992 |
important | +3.721 |
favorite | +3.706 |
-) | +3.624 |
Neg logit contributions | |
WAY | -3.700 |
PET | -3.349 |
ggle | -3.101 |
ARE | -3.057 |
VERT | -3.039 |
Token | to |
Token ID | 284 |
Feature activation | -8.19e+00 |
Pos logit contributions | |
WAY | +3.601 |
PET | +3.249 |
ARE | +2.967 |
VER | +2.937 |
respectively | +2.930 |
Neg logit contributions | |
ividual | -4.464 |
anonymity | -4.236 |
favorite | -4.122 |
important | -3.924 |
-) | -3.892 |
Token | what |
Token ID | 644 |
Feature activation | -8.37e-02 |
Pos logit contributions | |
WAY | +5.869 |
PET | +5.242 |
ARE | +4.883 |
VER | +4.781 |
POL | +4.693 |
Neg logit contributions | |
ividual | -7.302 |
anonymity | -6.918 |
favorite | -6.718 |
important | -6.505 |
-) | -6.411 |
Token | economists |
Token ID | 16816 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
WAY | +0.066 |
PET | +0.060 |
ARE | +0.055 |
ggle | +0.054 |
VER | +0.053 |
Neg logit contributions | |
ividual | -0.070 |
anonymity | -0.070 |
favorite | -0.066 |
important | -0.064 |
-) | -0.063 |
Token | would |
Token ID | 561 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
anonymity | +8.471 |
ividual | +8.122 |
favorite | +7.802 |
-) | +7.567 |
important | +7.453 |
Neg logit contributions | |
WAY | -11.159 |
PET | -10.328 |
AMY | -9.357 |
VERT | -9.354 |
VER | -9.283 |
Token | have |
Token ID | 423 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
ividual | +8.413 |
anonymity | +8.412 |
favorite | +8.215 |
-) | +8.123 |
important | +7.537 |
Neg logit contributions | |
WAY | -10.704 |
PET | -9.834 |
VERT | -9.136 |
ARE | -9.083 |
AMY | -8.922 |
Token | expected |
Token ID | 2938 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
anonymity | +11.757 |
important | +11.274 |
ividual | +11.000 |
favorite | +10.985 |
-) | +10.981 |
Neg logit contributions | |
WAY | -14.985 |
PET | -14.618 |
AMY | -13.031 |
ggle | -13.012 |
VERT | -12.930 |
Token | , |
Token ID | 11 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
anonymity | +6.652 |
ividual | +6.353 |
favorite | +6.066 |
important | +5.920 |
-) | +5.684 |
Neg logit contributions | |
WAY | -9.141 |
PET | -8.528 |
ggle | -8.078 |
VERT | -7.764 |
ARE | -7.725 |
Token | according |
Token ID | 1864 |
Feature activation | -3.20e+00 |
Pos logit contributions | |
anonymity | +2.109 |
ividual | +2.107 |
favorite | +1.981 |
important | +1.953 |
-) | +1.913 |
Neg logit contributions | |
WAY | -1.733 |
PET | -1.566 |
ggle | -1.419 |
ARE | -1.414 |
VERT | -1.389 |
Token | , |
Token ID | 11 |
Feature activation | -5.01e-02 |
Pos logit contributions | |
WAY | +1.357 |
PET | +1.247 |
ARE | +1.152 |
ggle | +1.135 |
VER | +1.132 |
Neg logit contributions | |
ividual | -1.216 |
anonymity | -1.198 |
favorite | -1.131 |
important | -1.093 |
-) | -1.081 |
Token | � |
Token ID | 447 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
WAY | +0.041 |
PET | +0.037 |
ARE | +0.034 |
ggle | +0.034 |
VER | +0.034 |
Neg logit contributions | |
ividual | -0.041 |
anonymity | -0.040 |
favorite | -0.038 |
important | -0.037 |
-) | -0.036 |
Token | � |
Token ID | 251 |
Feature activation | -6.31e-01 |
Pos logit contributions | |
ividual | +1.016 |
anonymity | +1.005 |
favorite | +0.967 |
important | +0.938 |
-) | +0.932 |
Neg logit contributions | |
WAY | -0.806 |
PET | -0.728 |
ARE | -0.660 |
VER | -0.646 |
ggle | -0.646 |
Token | B |
Token ID | 347 |
Feature activation | +5.77e+00 |
Pos logit contributions | |
WAY | +0.545 |
PET | +0.500 |
ARE | +0.463 |
ggle | +0.457 |
VER | +0.453 |
Neg logit contributions | |
ividual | -0.482 |
anonymity | -0.474 |
favorite | -0.448 |
important | -0.434 |
-) | -0.428 |
Token | amber |
Token ID | 7789 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
ividual | +3.992 |
anonymity | +3.850 |
favorite | +3.703 |
important | +3.580 |
-) | +3.539 |
Neg logit contributions | |
WAY | -5.301 |
PET | -4.873 |
ARE | -4.505 |
ggle | -4.486 |
POL | -4.466 |
Token | ger |
Token ID | 1362 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
ividual | +2.497 |
anonymity | +2.455 |
favorite | +2.338 |
important | +2.262 |
-) | +2.247 |
Neg logit contributions | |
WAY | -2.708 |
PET | -2.478 |
ARE | -2.304 |
VER | -2.239 |
ggle | -2.233 |
Token | said |
Token ID | 531 |
Feature activation | +7.45e+00 |
Pos logit contributions | |
anonymity | +6.026 |
ividual | +5.884 |
favorite | +5.443 |
important | +5.191 |
-) | +5.112 |
Neg logit contributions | |
WAY | -13.600 |
PET | -12.886 |
ggle | -12.177 |
ARE | -11.977 |
VER | -11.762 |
Token | . |
Token ID | 13 |
Feature activation | +6.19e+00 |
Pos logit contributions | |
anonymity | +4.853 |
ividual | +4.847 |
favorite | +4.411 |
important | +4.349 |
-) | +4.183 |
Neg logit contributions | |
WAY | -6.820 |
PET | -6.323 |
ggle | -5.857 |
ARE | -5.843 |
VERT | -5.745 |
Token | � |
Token ID | 564 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
anonymity | +4.645 |
ividual | +4.637 |
favorite | +4.467 |
-) | +4.381 |
important | +4.342 |
Neg logit contributions | |
WAY | -4.878 |
PET | -4.486 |
ggle | -4.185 |
VERT | -4.097 |
ARE | -4.087 |
Token | � |
Token ID | 250 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
WAY | +0.913 |
PET | +0.799 |
ARE | +0.703 |
ggle | +0.684 |
VER | +0.681 |
Neg logit contributions | |
ividual | -1.706 |
anonymity | -1.688 |
favorite | -1.622 |
important | -1.584 |
-) | -1.570 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.29e+00 |
Pos logit contributions | |
anonymity | +2.154 |
ividual | +2.148 |
favorite | +2.077 |
important | +2.033 |
-) | +2.000 |
Neg logit contributions | |
WAY | -1.801 |
PET | -1.624 |
ggle | -1.496 |
ARE | -1.473 |
respectively | -1.455 |
Token | Here |
Token ID | 4342 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
anonymity | +2.750 |
favorite | +2.723 |
ividual | +2.695 |
important | +2.657 |
-) | +2.616 |
Neg logit contributions | |
WAY | -2.286 |
PET | -2.041 |
ggle | -1.924 |
respectively | -1.911 |
POL | -1.874 |
Token | are |
Token ID | 389 |
Feature activation | -9.12e+00 |
Pos logit contributions | |
WAY | +7.810 |
PET | +7.015 |
ARE | +6.670 |
VER | +6.457 |
respectively | +6.349 |
Neg logit contributions | |
ividual | -11.318 |
anonymity | -10.891 |
favorite | -10.580 |
interstitial | -10.274 |
important | -10.196 |
Token | some |
Token ID | 617 |
Feature activation | +2.44e-01 |
Pos logit contributions | |
WAY | +6.568 |
PET | +5.843 |
ARE | +5.548 |
TW | +5.347 |
VER | +5.341 |
Neg logit contributions | |
ividual | -7.892 |
anonymity | -7.533 |
favorite | -7.350 |
-) | -7.068 |
important | -7.020 |
Token | other |
Token ID | 584 |
Feature activation | -7.89e-01 |
Pos logit contributions | |
anonymity | +0.200 |
ividual | +0.200 |
favorite | +0.188 |
important | +0.183 |
-) | +0.180 |
Neg logit contributions | |
WAY | -0.196 |
PET | -0.180 |
ARE | -0.164 |
ggle | -0.162 |
VER | -0.160 |
Token | , |
Token ID | 11 |
Feature activation | +5.34e-01 |
Pos logit contributions | |
WAY | +0.619 |
PET | +0.566 |
ARE | +0.516 |
ggle | +0.509 |
VER | +0.505 |
Neg logit contributions | |
ividual | -0.662 |
anonymity | -0.657 |
favorite | -0.621 |
important | -0.605 |
-) | -0.596 |
Token | semi |
Token ID | 10663 |
Feature activation | +1.89e+01 |
Pos logit contributions | |
anonymity | +0.449 |
ividual | +0.448 |
favorite | +0.423 |
important | +0.412 |
-) | +0.407 |
Neg logit contributions | |
WAY | -0.418 |
PET | -0.382 |
ARE | -0.347 |
ggle | -0.341 |
VERT | -0.341 |
Token | - |
Token ID | 12 |
Feature activation | +5.50e+00 |
Pos logit contributions | |
important | +9.934 |
anonymity | +9.861 |
-) | +9.839 |
favorite | +9.290 |
cient | +8.958 |
Neg logit contributions | |
WAY | -16.551 |
PET | -15.168 |
ISON | -14.215 |
POL | -14.023 |
VERT | -13.939 |
Token | relevant |
Token ID | 49659 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
anonymity | +3.830 |
favorite | +3.812 |
important | +3.804 |
ividual | +3.725 |
-) | +3.562 |
Neg logit contributions | |
WAY | -4.874 |
PET | -4.398 |
ggle | -4.134 |
ARE | -4.105 |
POL | -4.073 |
Token | survey |
Token ID | 5526 |
Feature activation | -7.66e-01 |
Pos logit contributions | |
anonymity | +1.224 |
ividual | +1.210 |
favorite | +1.143 |
important | +1.120 |
-) | +1.097 |
Neg logit contributions | |
WAY | -1.147 |
PET | -1.060 |
ARE | -0.954 |
ggle | -0.949 |
VERT | -0.935 |
Token | results |
Token ID | 2482 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
WAY | +0.566 |
PET | +0.512 |
ARE | +0.465 |
ggle | +0.458 |
VER | +0.454 |
Neg logit contributions | |
ividual | -0.680 |
anonymity | -0.672 |
favorite | -0.639 |
important | -0.621 |
-) | -0.615 |
Token | to |
Token ID | 284 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
anonymity | +2.936 |
ividual | +2.899 |
favorite | +2.711 |
important | +2.684 |
-) | +2.581 |
Neg logit contributions | |
WAY | -3.718 |
PET | -3.464 |
ggle | -3.162 |
ARE | -3.161 |
VERT | -3.131 |
Token | because |
Token ID | 780 |
Feature activation | +8.23e+00 |
Pos logit contributions | |
ividual | +1.075 |
anonymity | +1.067 |
favorite | +0.996 |
important | +0.975 |
-) | +0.962 |
Neg logit contributions | |
WAY | -1.146 |
PET | -1.053 |
ARE | -0.970 |
VERT | -0.951 |
ggle | -0.950 |
Token | I |
Token ID | 314 |
Feature activation | +6.29e+00 |
Pos logit contributions | |
anonymity | +6.426 |
ividual | +6.031 |
important | +5.725 |
favorite | +5.676 |
-) | +5.649 |
Neg logit contributions | |
WAY | -6.688 |
PET | -6.197 |
ARE | -5.681 |
VERT | -5.556 |
ggle | -5.525 |
Token | was |
Token ID | 373 |
Feature activation | +3.98e+00 |
Pos logit contributions | |
anonymity | +4.690 |
ividual | +4.624 |
favorite | +4.373 |
important | +4.275 |
-) | +4.273 |
Neg logit contributions | |
WAY | -5.251 |
PET | -4.836 |
ARE | -4.427 |
VERT | -4.410 |
ggle | -4.318 |
Token | a |
Token ID | 257 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
anonymity | +3.061 |
ividual | +2.982 |
favorite | +2.794 |
important | +2.756 |
-) | +2.715 |
Neg logit contributions | |
WAY | -3.323 |
PET | -3.079 |
ARE | -2.838 |
TW | -2.782 |
ggle | -2.781 |
Token | part |
Token ID | 636 |
Feature activation | +3.08e+00 |
Pos logit contributions | |
ividual | +3.306 |
anonymity | +3.297 |
favorite | +3.117 |
-) | +3.040 |
important | +3.037 |
Neg logit contributions | |
WAY | -3.156 |
PET | -2.874 |
ARE | -2.659 |
ggle | -2.615 |
TW | -2.570 |
Token | of |
Token ID | 286 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
ividual | +2.357 |
anonymity | +2.304 |
favorite | +2.176 |
-) | +2.127 |
important | +2.098 |
Neg logit contributions | |
WAY | -2.589 |
PET | -2.393 |
ARE | -2.230 |
ggle | -2.198 |
VERT | -2.174 |
Token | the |
Token ID | 262 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
anonymity | +9.192 |
ividual | +8.924 |
-) | +8.231 |
important | +8.209 |
favorite | +8.208 |
Neg logit contributions | |
WAY | -11.236 |
PET | -10.342 |
ARE | -9.548 |
VERT | -9.385 |
ggle | -9.378 |
Token | personnel |
Token ID | 8213 |
Feature activation | +9.26e+00 |
Pos logit contributions | |
anonymity | +8.560 |
ividual | +8.373 |
favorite | +7.835 |
important | +7.762 |
-) | +7.622 |
Neg logit contributions | |
WAY | -8.162 |
PET | -7.450 |
ARE | -6.805 |
VERT | -6.773 |
ggle | -6.678 |
Token | . |
Token ID | 13 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
anonymity | +6.945 |
ividual | +6.913 |
favorite | +6.352 |
important | +6.237 |
-) | +6.085 |
Neg logit contributions | |
WAY | -7.589 |
PET | -6.862 |
VERT | -6.400 |
TW | -6.299 |
ARE | -6.290 |
Token |
|
Token ID | 198 |
Feature activation | +7.63e-01 |
Pos logit contributions | |
ividual | +1.261 |
anonymity | +1.258 |
favorite | +1.200 |
important | +1.172 |
-) | +1.163 |
Neg logit contributions | |
WAY | -1.212 |
PET | -1.108 |
ARE | -1.015 |
ggle | -1.005 |
VERT | -0.990 |
Token |
|
Token ID | 198 |
Feature activation | -4.30e+00 |
Pos logit contributions | |
ividual | +0.695 |
anonymity | +0.684 |
favorite | +0.650 |
important | +0.633 |
-) | +0.626 |
Neg logit contributions | |
WAY | -0.550 |
PET | -0.496 |
ARE | -0.450 |
ggle | -0.441 |
VER | -0.440 |
Token | commute |
Token ID | 31099 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
WAY | +1.949 |
PET | +1.713 |
ARE | +1.532 |
ggle | +1.486 |
VER | +1.477 |
Neg logit contributions | |
ividual | -3.389 |
anonymity | -3.331 |
favorite | -3.220 |
important | -3.121 |
-) | -3.102 |
Token | in |
Token ID | 287 |
Feature activation | +3.07e+00 |
Pos logit contributions | |
WAY | +1.789 |
PET | +1.632 |
ARE | +1.511 |
ggle | +1.491 |
VER | +1.487 |
Neg logit contributions | |
ividual | -1.639 |
anonymity | -1.597 |
favorite | -1.522 |
important | -1.466 |
-) | -1.449 |
Token | from |
Token ID | 422 |
Feature activation | +6.46e+00 |
Pos logit contributions | |
anonymity | +2.428 |
ividual | +2.371 |
favorite | +2.207 |
important | +2.168 |
-) | +2.135 |
Neg logit contributions | |
WAY | -2.550 |
PET | -2.373 |
ARE | -2.159 |
ggle | -2.138 |
TW | -2.096 |
Token | its |
Token ID | 663 |
Feature activation | +9.16e+00 |
Pos logit contributions | |
anonymity | +4.814 |
ividual | +4.602 |
favorite | +4.316 |
important | +4.275 |
-) | +4.190 |
Neg logit contributions | |
WAY | -5.461 |
PET | -5.133 |
ARE | -4.629 |
ggle | -4.602 |
TW | -4.523 |
Token | outskirts |
Token ID | 30140 |
Feature activation | +5.02e+00 |
Pos logit contributions | |
anonymity | +6.777 |
ividual | +6.003 |
favorite | +5.826 |
important | +5.747 |
-) | +5.664 |
Neg logit contributions | |
WAY | -7.851 |
PET | -7.322 |
ggle | -6.747 |
ARE | -6.722 |
VER | -6.630 |
Token | and |
Token ID | 290 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
ividual | +3.935 |
anonymity | +3.931 |
favorite | +3.686 |
important | +3.626 |
-) | +3.511 |
Neg logit contributions | |
WAY | -4.013 |
PET | -3.722 |
ARE | -3.423 |
ggle | -3.366 |
VERT | -3.306 |
Token | beyond |
Token ID | 3675 |
Feature activation | +5.44e+00 |
Pos logit contributions | |
anonymity | +1.307 |
ividual | +1.285 |
favorite | +1.208 |
important | +1.185 |
-) | +1.160 |
Neg logit contributions | |
WAY | -1.338 |
PET | -1.233 |
ARE | -1.128 |
ggle | -1.109 |
TW | -1.106 |
Token | . |
Token ID | 13 |
Feature activation | +3.41e+00 |
Pos logit contributions | |
anonymity | +4.072 |
ividual | +3.952 |
favorite | +3.702 |
important | +3.691 |
-) | +3.553 |
Neg logit contributions | |
WAY | -4.590 |
PET | -4.289 |
ARE | -3.929 |
ggle | -3.892 |
VERT | -3.837 |
Token | Since |
Token ID | 4619 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
ividual | +2.600 |
anonymity | +2.591 |
favorite | +2.488 |
important | +2.434 |
-) | +2.414 |
Neg logit contributions | |
WAY | -2.786 |
PET | -2.580 |
ggle | -2.378 |
ARE | -2.354 |
VER | -2.306 |
Token | 2004 |
Token ID | 5472 |
Feature activation | +5.13e+00 |
Pos logit contributions | |
WAY | +1.371 |
PET | +1.249 |
ARE | +1.147 |
ggle | +1.128 |
VER | +1.126 |
Neg logit contributions | |
ividual | -1.408 |
anonymity | -1.380 |
favorite | -1.316 |
important | -1.274 |
-) | -1.259 |
Token | the |
Token ID | 262 |
Feature activation | -6.84e+00 |
Pos logit contributions | |
anonymity | +3.851 |
ividual | +3.822 |
favorite | +3.460 |
important | +3.432 |
-) | +3.390 |
Neg logit contributions | |
WAY | -4.393 |
PET | -4.071 |
ARE | -3.777 |
ggle | -3.693 |
VERT | -3.649 |
Token | has |
Token ID | 468 |
Feature activation | +7.28e+00 |
Pos logit contributions | |
anonymity | +2.495 |
ividual | +2.488 |
favorite | +2.346 |
-) | +2.265 |
important | +2.257 |
Neg logit contributions | |
WAY | -3.020 |
PET | -2.773 |
ARE | -2.552 |
TW | -2.480 |
VERT | -2.471 |
Token | one |
Token ID | 530 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
anonymity | +5.401 |
ividual | +4.981 |
favorite | +4.874 |
important | +4.756 |
-) | +4.746 |
Neg logit contributions | |
WAY | -6.351 |
PET | -5.776 |
ARE | -5.327 |
Fuck | -5.236 |
TW | -5.188 |
Token | year |
Token ID | 614 |
Feature activation | -3.60e+00 |
Pos logit contributions | |
anonymity | +1.499 |
ividual | +1.496 |
favorite | +1.417 |
important | +1.366 |
-) | +1.365 |
Neg logit contributions | |
WAY | -1.347 |
PET | -1.222 |
ARE | -1.118 |
ggle | -1.106 |
VER | -1.086 |
Token | and |
Token ID | 290 |
Feature activation | +7.30e+00 |
Pos logit contributions | |
WAY | +2.934 |
PET | +2.679 |
ARE | +2.458 |
VER | +2.438 |
ggle | +2.421 |
Neg logit contributions | |
ividual | -2.901 |
anonymity | -2.808 |
favorite | -2.697 |
important | -2.613 |
-) | -2.573 |
Token | $ |
Token ID | 720 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
anonymity | +5.363 |
ividual | +5.031 |
favorite | +4.809 |
important | +4.663 |
-) | +4.612 |
Neg logit contributions | |
WAY | -6.326 |
PET | -5.849 |
ggle | -5.390 |
VERT | -5.308 |
ARE | -5.298 |
Token | 1 |
Token ID | 16 |
Feature activation | -7.52e-01 |
Pos logit contributions | |
WAY | +1.083 |
PET | +0.991 |
ARE | +0.913 |
VER | +0.895 |
ggle | +0.893 |
Neg logit contributions | |
ividual | -1.060 |
anonymity | -1.041 |
favorite | -0.978 |
important | -0.949 |
-) | -0.938 |
Token | . |
Token ID | 13 |
Feature activation | +4.85e+00 |
Pos logit contributions | |
WAY | +0.654 |
PET | +0.601 |
ARE | +0.556 |
ggle | +0.549 |
VER | +0.545 |
Neg logit contributions | |
ividual | -0.569 |
anonymity | -0.561 |
favorite | -0.528 |
important | -0.511 |
-) | -0.505 |
Token | 35 |
Token ID | 2327 |
Feature activation | -2.52e+00 |
Pos logit contributions | |
anonymity | +3.391 |
favorite | +3.354 |
ividual | +3.351 |
important | +3.228 |
-) | +3.221 |
Neg logit contributions | |
WAY | -4.173 |
PET | -3.810 |
ggle | -3.608 |
ARE | -3.492 |
VERT | -3.470 |
Token | million |
Token ID | 1510 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
WAY | +2.185 |
PET | +2.009 |
ARE | +1.861 |
VER | +1.829 |
ggle | +1.826 |
Neg logit contributions | |
ividual | -1.918 |
anonymity | -1.859 |
favorite | -1.764 |
important | -1.703 |
-) | -1.676 |
Token | left |
Token ID | 1364 |
Feature activation | -9.24e+00 |
Pos logit contributions | |
WAY | +7.506 |
PET | +6.748 |
respectively | +6.520 |
VER | +6.411 |
ARE | +6.329 |
Neg logit contributions | |
ividual | -9.639 |
favorite | -8.811 |
anonymity | -8.760 |
important | -8.583 |
inav | -8.453 |
Token | on |
Token ID | 319 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
WAY | +5.792 |
PET | +5.104 |
respectively | +4.776 |
VER | +4.705 |
ARE | +4.589 |
Neg logit contributions | |
ividual | -8.834 |
anonymity | -8.445 |
favorite | -8.246 |
important | -8.011 |
interstitial | -7.931 |
Token |
|
Token ID | 198 |
Feature activation | +5.58e+00 |
Pos logit contributions | |
anonymity | +3.639 |
ividual | +3.600 |
favorite | +3.466 |
important | +3.367 |
-) | +3.348 |
Neg logit contributions | |
WAY | -3.650 |
PET | -3.386 |
ggle | -3.171 |
ARE | -3.115 |
VER | -3.050 |
Token |
|
Token ID | 198 |
Feature activation | +4.85e+00 |
Pos logit contributions | |
anonymity | +4.336 |
ividual | +4.265 |
favorite | +4.235 |
important | +4.115 |
-) | +4.105 |
Neg logit contributions | |
WAY | -4.422 |
PET | -4.032 |
ggle | -3.714 |
ARE | -3.705 |
VERT | -3.614 |
Token | The |
Token ID | 464 |
Feature activation | +3.11e+00 |
Pos logit contributions | |
anonymity | +3.957 |
favorite | +3.874 |
ividual | +3.870 |
important | +3.743 |
-) | +3.685 |
Neg logit contributions | |
WAY | -3.597 |
PET | -3.254 |
ggle | -3.070 |
respectively | -2.980 |
ARE | -2.968 |
Token | reconciliation |
Token ID | 27515 |
Feature activation | +8.10e-01 |
Pos logit contributions | |
anonymity | +2.539 |
ividual | +2.481 |
favorite | +2.342 |
important | +2.292 |
-) | +2.249 |
Neg logit contributions | |
WAY | -2.478 |
PET | -2.291 |
ARE | -2.102 |
ggle | -2.083 |
VER | -2.082 |
Token | agreement |
Token ID | 4381 |
Feature activation | +6.73e+00 |
Pos logit contributions | |
ividual | +0.719 |
anonymity | +0.717 |
favorite | +0.680 |
important | +0.663 |
-) | +0.655 |
Neg logit contributions | |
WAY | -0.591 |
PET | -0.537 |
ARE | -0.488 |
ggle | -0.479 |
VER | -0.478 |
Token | came |
Token ID | 1625 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
anonymity | +5.309 |
ividual | +5.186 |
favorite | +4.878 |
important | +4.826 |
-) | +4.775 |
Neg logit contributions | |
WAY | -5.284 |
PET | -4.876 |
ARE | -4.528 |
ggle | -4.488 |
VERT | -4.399 |
Token | just |
Token ID | 655 |
Feature activation | +2.73e-01 |
Pos logit contributions | |
anonymity | +1.295 |
ividual | +1.288 |
favorite | +1.211 |
important | +1.182 |
-) | +1.167 |
Neg logit contributions | |
WAY | -1.313 |
PET | -1.211 |
ARE | -1.104 |
ggle | -1.093 |
VERT | -1.085 |
Token | days |
Token ID | 1528 |
Feature activation | +6.75e-01 |
Pos logit contributions | |
ividual | +0.247 |
anonymity | +0.245 |
favorite | +0.232 |
important | +0.228 |
-) | +0.225 |
Neg logit contributions | |
WAY | -0.196 |
PET | -0.177 |
ARE | -0.161 |
ggle | -0.158 |
VERT | -0.156 |
Token | after |
Token ID | 706 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
ividual | +0.529 |
anonymity | +0.527 |
favorite | +0.493 |
important | +0.483 |
-) | +0.475 |
Neg logit contributions | |
WAY | -0.561 |
PET | -0.514 |
ARE | -0.473 |
ggle | -0.472 |
TW | -0.462 |
Token | Turkey |
Token ID | 7137 |
Feature activation | -3.25e+00 |
Pos logit contributions | |
anonymity | +1.638 |
ividual | +1.634 |
favorite | +1.516 |
important | +1.486 |
-) | +1.464 |
Neg logit contributions | |
WAY | -1.789 |
PET | -1.648 |
ARE | -1.519 |
ggle | -1.511 |
VER | -1.493 |
Token | � |
Token ID | 447 |
Feature activation | +5.25e+00 |
Pos logit contributions | |
WAY | +2.611 |
PET | +2.386 |
ARE | +2.180 |
ggle | +2.154 |
VER | +2.150 |
Neg logit contributions | |
ividual | -2.664 |
anonymity | -2.615 |
favorite | -2.480 |
important | -2.405 |
-) | -2.366 |
Token | who |
Token ID | 508 |
Feature activation | -7.17e+00 |
Pos logit contributions | |
anonymity | +2.768 |
ividual | +2.754 |
important | +2.520 |
favorite | +2.509 |
-) | +2.430 |
Neg logit contributions | |
WAY | -3.303 |
PET | -3.017 |
ggle | -2.781 |
ARE | -2.767 |
VERT | -2.730 |
Token | do |
Token ID | 466 |
Feature activation | +2.12e+00 |
Pos logit contributions | |
WAY | +5.241 |
PET | +4.786 |
ARE | +4.446 |
respectively | +4.408 |
ggle | +4.375 |
Neg logit contributions | |
ividual | -6.184 |
anonymity | -5.999 |
favorite | -5.812 |
interstitial | -5.627 |
important | -5.568 |
Token | not |
Token ID | 407 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
ividual | +1.562 |
anonymity | +1.551 |
favorite | +1.427 |
important | +1.408 |
-) | +1.378 |
Neg logit contributions | |
WAY | -1.901 |
PET | -1.730 |
ARE | -1.601 |
ggle | -1.581 |
TW | -1.572 |
Token | have |
Token ID | 423 |
Feature activation | +2.60e+00 |
Pos logit contributions | |
WAY | +2.472 |
PET | +2.257 |
ARE | +2.052 |
ggle | +2.029 |
VER | +2.014 |
Neg logit contributions | |
ividual | -2.899 |
anonymity | -2.841 |
favorite | -2.724 |
important | -2.632 |
-) | -2.604 |
Token | jobs |
Token ID | 3946 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
anonymity | +2.197 |
ividual | +2.152 |
favorite | +1.999 |
important | +1.968 |
-) | +1.943 |
Neg logit contributions | |
WAY | -2.069 |
PET | -1.861 |
ARE | -1.680 |
ggle | -1.677 |
VER | -1.651 |
Token | . |
Token ID | 13 |
Feature activation | +5.52e+00 |
Pos logit contributions | |
ividual | +1.466 |
anonymity | +1.450 |
favorite | +1.359 |
important | +1.328 |
-) | +1.304 |
Neg logit contributions | |
WAY | -1.570 |
PET | -1.431 |
ARE | -1.321 |
ggle | -1.306 |
VER | -1.292 |
Token |
|
Token ID | 198 |
Feature activation | +3.68e+00 |
Pos logit contributions | |
ividual | +4.426 |
anonymity | +4.413 |
favorite | +4.176 |
important | +4.112 |
-) | +4.003 |
Neg logit contributions | |
WAY | -4.336 |
PET | -3.878 |
ggle | -3.647 |
ARE | -3.603 |
VERT | -3.560 |
Token |
|
Token ID | 198 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
ividual | +3.084 |
anonymity | +3.081 |
favorite | +2.976 |
important | +2.895 |
-) | +2.861 |
Neg logit contributions | |
WAY | -2.794 |
PET | -2.532 |
ARE | -2.311 |
ggle | -2.304 |
VER | -2.255 |
Token | � |
Token ID | 447 |
Feature activation | -6.67e+00 |
Pos logit contributions | |
anonymity | +1.816 |
ividual | +1.801 |
favorite | +1.771 |
important | +1.724 |
-) | +1.686 |
Neg logit contributions | |
WAY | -1.459 |
PET | -1.290 |
ggle | -1.216 |
ARE | -1.179 |
respectively | -1.172 |
Token | � |
Token ID | 250 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
WAY | +3.682 |
PET | +3.225 |
ARE | +2.791 |
ggle | +2.752 |
VER | +2.721 |
Neg logit contributions | |
ividual | -7.136 |
anonymity | -6.992 |
favorite | -6.749 |
important | -6.557 |
-) | -6.522 |
Token | Make |
Token ID | 12050 |
Feature activation | -5.06e-01 |
Pos logit contributions | |
WAY | +0.083 |
PET | +0.075 |
ARE | +0.068 |
ggle | +0.068 |
VER | +0.067 |
Neg logit contributions | |
ividual | -0.099 |
anonymity | -0.098 |
favorite | -0.094 |
important | -0.091 |
-) | -0.090 |
Token | � |
Token ID | 251 |
Feature activation | +2.41e+00 |
Pos logit contributions | |
WAY | +0.041 |
PET | +0.036 |
ARE | +0.031 |
ggle | +0.030 |
VER | +0.030 |
Neg logit contributions | |
ividual | -0.078 |
anonymity | -0.078 |
favorite | -0.075 |
important | -0.073 |
-) | -0.072 |
Token | Lat |
Token ID | 5476 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
ividual | +1.870 |
anonymity | +1.860 |
favorite | +1.755 |
important | +1.702 |
-) | +1.684 |
Neg logit contributions | |
WAY | -2.030 |
PET | -1.844 |
ARE | -1.713 |
ggle | -1.697 |
VER | -1.659 |
Token | end |
Token ID | 437 |
Feature activation | +5.21e+00 |
Pos logit contributions | |
ividual | +2.735 |
anonymity | +2.685 |
favorite | +2.574 |
important | +2.508 |
-) | +2.469 |
Neg logit contributions | |
WAY | -2.665 |
PET | -2.437 |
ARE | -2.227 |
ggle | -2.195 |
VER | -2.174 |
Token | res |
Token ID | 411 |
Feature activation | +8.34e+00 |
Pos logit contributions | |
ividual | +3.000 |
anonymity | +2.918 |
favorite | +2.791 |
important | +2.647 |
-) | +2.616 |
Neg logit contributions | |
WAY | -5.390 |
PET | -5.025 |
ARE | -4.689 |
ggle | -4.648 |
VERT | -4.619 |
Token | se |
Token ID | 325 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
ividual | +3.892 |
anonymity | +3.828 |
favorite | +3.738 |
important | +3.607 |
-) | +3.468 |
Neg logit contributions | |
WAY | -9.111 |
PET | -8.557 |
ARE | -8.076 |
ggle | -8.001 |
POL | -7.906 |
Token | said |
Token ID | 531 |
Feature activation | +5.92e+00 |
Pos logit contributions | |
anonymity | +6.085 |
ividual | +5.986 |
favorite | +5.371 |
-) | +5.093 |
important | +4.980 |
Neg logit contributions | |
WAY | -13.469 |
PET | -12.705 |
ARE | -12.018 |
ggle | -11.899 |
VER | -11.768 |
Token | . |
Token ID | 13 |
Feature activation | +2.86e+00 |
Pos logit contributions | |
anonymity | +3.972 |
ividual | +3.945 |
favorite | +3.608 |
important | +3.536 |
-) | +3.438 |
Neg logit contributions | |
WAY | -5.411 |
PET | -5.051 |
ARE | -4.646 |
ggle | -4.614 |
VERT | -4.581 |
Token |
|
Token ID | 198 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
ividual | +2.356 |
anonymity | +2.341 |
favorite | +2.231 |
important | +2.174 |
-) | +2.170 |
Neg logit contributions | |
WAY | -2.207 |
PET | -2.022 |
ARE | -1.852 |
ggle | -1.845 |
VER | -1.810 |
Token |
|
Token ID | 198 |
Feature activation | +2.57e-01 |
Pos logit contributions | |
ividual | +0.140 |
anonymity | +0.137 |
favorite | +0.129 |
important | +0.126 |
-) | +0.125 |
Neg logit contributions | |
WAY | -0.106 |
PET | -0.096 |
ARE | -0.086 |
VER | -0.085 |
ggle | -0.084 |
Token | Last |
Token ID | 5956 |
Feature activation | -7.78e+00 |
Pos logit contributions | |
ividual | +0.192 |
anonymity | +0.191 |
favorite | +0.183 |
important | +0.177 |
-) | +0.174 |
Neg logit contributions | |
WAY | -0.220 |
PET | -0.202 |
ARE | -0.187 |
ggle | -0.186 |
VER | -0.183 |
Token | November |
Token ID | 3389 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
WAY | +5.440 |
PET | +4.950 |
ARE | +4.523 |
VER | +4.372 |
TW | +4.359 |
Neg logit contributions | |
ividual | -6.926 |
anonymity | -6.687 |
favorite | -6.509 |
important | -6.218 |
-) | -6.117 |
Token | DO |
Token ID | 8410 |
Feature activation | -3.30e+00 |
Pos logit contributions | |
anonymity | +3.258 |
ividual | +3.162 |
favorite | +3.020 |
important | +2.933 |
-) | +2.901 |
Neg logit contributions | |
WAY | -3.098 |
PET | -2.874 |
ARE | -2.623 |
ggle | -2.586 |
VERT | -2.542 |
Token | A |
Token ID | 32 |
Feature activation | +5.15e+00 |
Pos logit contributions | |
WAY | +1.836 |
PET | +1.608 |
ARE | +1.411 |
VER | +1.372 |
ggle | +1.371 |
Neg logit contributions | |
ividual | -3.542 |
anonymity | -3.499 |
favorite | -3.354 |
important | -3.270 |
-) | -3.247 |
Token | and |
Token ID | 290 |
Feature activation | +2.46e+00 |
Pos logit contributions | |
anonymity | +3.962 |
ividual | +3.955 |
favorite | +3.713 |
important | +3.625 |
-) | +3.590 |
Neg logit contributions | |
WAY | -4.155 |
PET | -3.833 |
ggle | -3.568 |
ARE | -3.516 |
VERT | -3.473 |
Token | one |
Token ID | 530 |
Feature activation | -5.00e-01 |
Pos logit contributions | |
anonymity | +2.145 |
ividual | +2.115 |
favorite | +2.006 |
important | +1.953 |
-) | +1.944 |
Neg logit contributions | |
WAY | -1.833 |
PET | -1.667 |
ARE | -1.522 |
ggle | -1.507 |
VERT | -1.479 |
Token | song |
Token ID | 3496 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
WAY | +0.395 |
PET | +0.361 |
ARE | +0.330 |
ggle | +0.326 |
VER | +0.323 |
Neg logit contributions | |
ividual | -0.418 |
anonymity | -0.413 |
favorite | -0.390 |
important | -0.379 |
-) | -0.375 |
Token | with |
Token ID | 351 |
Feature activation | -1.77e+00 |
Pos logit contributions | |
WAY | +1.116 |
PET | +1.022 |
ARE | +0.939 |
ggle | +0.925 |
VER | +0.918 |
Neg logit contributions | |
ividual | -1.120 |
anonymity | -1.105 |
favorite | -1.044 |
important | -1.012 |
-) | -1.003 |
Token | N |
Token ID | 399 |
Feature activation | -2.46e+00 |
Pos logit contributions | |
WAY | +1.286 |
PET | +1.162 |
ARE | +1.055 |
ggle | +1.037 |
VER | +1.031 |
Neg logit contributions | |
ividual | -1.597 |
anonymity | -1.575 |
favorite | -1.500 |
important | -1.459 |
-) | -1.444 |
Token | ome |
Token ID | 462 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
WAY | +1.811 |
PET | +1.628 |
ARE | +1.490 |
VER | +1.456 |
ggle | +1.453 |
Neg logit contributions | |
ividual | -2.200 |
anonymity | -2.169 |
favorite | -2.059 |
important | -2.000 |
-) | -1.983 |
Token | ans |
Token ID | 504 |
Feature activation | +4.24e+00 |
Pos logit contributions | |
WAY | +2.129 |
PET | +1.949 |
ARE | +1.791 |
ggle | +1.767 |
VER | +1.759 |
Neg logit contributions | |
ividual | -2.073 |
anonymity | -2.041 |
favorite | -1.932 |
important | -1.869 |
-) | -1.848 |
Token | no |
Token ID | 3919 |
Feature activation | -2.46e+00 |
Pos logit contributions | |
ividual | +3.191 |
anonymity | +3.185 |
favorite | +3.005 |
important | +2.919 |
-) | +2.838 |
Neg logit contributions | |
WAY | -3.568 |
PET | -3.269 |
ggle | -3.033 |
ARE | -2.999 |
VERT | -2.982 |
Token | . |
Token ID | 13 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
WAY | +2.021 |
PET | +1.850 |
ARE | +1.701 |
ggle | +1.672 |
VER | +1.671 |
Neg logit contributions | |
ividual | -1.981 |
anonymity | -1.945 |
favorite | -1.843 |
important | -1.783 |
-) | -1.763 |
Token | volume |
Token ID | 6115 |
Feature activation | -7.69e+00 |
Pos logit contributions | |
WAY | +3.301 |
PET | +3.004 |
ARE | +2.748 |
ggle | +2.702 |
VER | +2.689 |
Neg logit contributions | |
ividual | -3.690 |
anonymity | -3.584 |
favorite | -3.437 |
important | -3.332 |
-) | -3.296 |
Token | . |
Token ID | 13 |
Feature activation | -1.61e-01 |
Pos logit contributions | |
WAY | +5.820 |
PET | +5.310 |
ARE | +4.879 |
VER | +4.793 |
respectively | +4.761 |
Neg logit contributions | |
ividual | -6.447 |
anonymity | -6.233 |
favorite | -5.985 |
important | -5.811 |
-) | -5.734 |
Token | There |
Token ID | 1318 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
WAY | +0.128 |
PET | +0.117 |
ARE | +0.107 |
ggle | +0.106 |
VER | +0.105 |
Neg logit contributions | |
ividual | -0.132 |
anonymity | -0.131 |
favorite | -0.125 |
important | -0.121 |
-) | -0.120 |
Token | � |
Token ID | 447 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
WAY | +8.041 |
PET | +7.385 |
ARE | +6.963 |
VER | +6.899 |
TW | +6.755 |
Neg logit contributions | |
ividual | -8.279 |
anonymity | -8.082 |
favorite | -7.744 |
important | -7.465 |
-) | -7.338 |
Token | � |
Token ID | 247 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
WAY | +0.222 |
PET | +0.200 |
ARE | +0.181 |
ggle | +0.178 |
VER | +0.176 |
Neg logit contributions | |
ividual | -0.296 |
anonymity | -0.292 |
favorite | -0.279 |
important | -0.271 |
-) | -0.268 |
Token | s |
Token ID | 82 |
Feature activation | -5.31e+00 |
Pos logit contributions | |
WAY | +1.864 |
PET | +1.719 |
ARE | +1.596 |
ggle | +1.574 |
VER | +1.572 |
Neg logit contributions | |
ividual | -1.516 |
anonymity | -1.491 |
favorite | -1.403 |
important | -1.353 |
-) | -1.335 |
Token | also |
Token ID | 635 |
Feature activation | -6.60e+00 |
Pos logit contributions | |
WAY | +4.045 |
PET | +3.638 |
ARE | +3.322 |
VER | +3.313 |
ggle | +3.312 |
Neg logit contributions | |
ividual | -4.550 |
anonymity | -4.407 |
favorite | -4.274 |
important | -4.085 |
-) | -4.070 |
Token | the |
Token ID | 262 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
WAY | +5.017 |
PET | +4.489 |
VER | +4.126 |
ARE | +4.098 |
ggle | +4.053 |
Neg logit contributions | |
ividual | -5.628 |
anonymity | -5.404 |
favorite | -5.273 |
important | -5.026 |
-) | -5.015 |
Token | fact |
Token ID | 1109 |
Feature activation | -4.46e+00 |
Pos logit contributions | |
WAY | +7.820 |
PET | +7.027 |
VER | +6.512 |
ggle | +6.370 |
ARE | +6.329 |
Neg logit contributions | |
ividual | -8.990 |
favorite | -8.382 |
anonymity | -8.367 |
interstitial | -7.893 |
-) | -7.858 |
Token | that |
Token ID | 326 |
Feature activation | +7.60e-01 |
Pos logit contributions | |
WAY | +3.454 |
PET | +3.137 |
ARE | +2.873 |
ggle | +2.839 |
VER | +2.828 |
Neg logit contributions | |
ividual | -3.759 |
anonymity | -3.681 |
favorite | -3.516 |
important | -3.393 |
-) | -3.376 |
Token | it |
Token ID | 340 |
Feature activation | -5.98e+00 |
Pos logit contributions | |
ividual | +0.609 |
anonymity | +0.608 |
favorite | +0.571 |
important | +0.556 |
-) | +0.549 |
Neg logit contributions | |
WAY | -0.625 |
PET | -0.574 |
ARE | -0.528 |
ggle | -0.516 |
VERT | -0.510 |
Token | since |
Token ID | 1201 |
Feature activation | -7.17e-01 |
Pos logit contributions | |
WAY | +3.909 |
PET | +3.534 |
ARE | +3.201 |
VER | +3.196 |
ggle | +3.178 |
Neg logit contributions | |
ividual | -4.608 |
anonymity | -4.512 |
favorite | -4.326 |
important | -4.192 |
-) | -4.157 |
Token | organized |
Token ID | 8389 |
Feature activation | +7.52e+00 |
Pos logit contributions | |
WAY | +0.592 |
PET | +0.541 |
ARE | +0.498 |
ggle | +0.491 |
VER | +0.488 |
Neg logit contributions | |
ividual | -0.575 |
anonymity | -0.568 |
favorite | -0.535 |
important | -0.519 |
-) | -0.514 |
Token | crime |
Token ID | 4065 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
anonymity | +6.843 |
ividual | +6.704 |
favorite | +6.199 |
-) | +6.145 |
important | +5.959 |
Neg logit contributions | |
WAY | -5.347 |
PET | -4.817 |
ARE | -4.322 |
TW | -4.212 |
VER | -4.203 |
Token | counter |
Token ID | 3753 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
anonymity | +1.190 |
ividual | +1.187 |
favorite | +1.104 |
important | +1.065 |
-) | +1.064 |
Neg logit contributions | |
WAY | -1.345 |
PET | -1.234 |
ARE | -1.142 |
ggle | -1.119 |
VER | -1.115 |
Token | measures |
Token ID | 47336 |
Feature activation | +6.31e+00 |
Pos logit contributions | |
anonymity | +7.419 |
ividual | +7.138 |
-) | +6.906 |
important | +6.830 |
favorite | +6.781 |
Neg logit contributions | |
WAY | -11.120 |
PET | -9.937 |
ggle | -9.425 |
TW | -9.242 |
VER | -9.189 |
Token | were |
Token ID | 547 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
anonymity | +4.905 |
ividual | +4.742 |
favorite | +4.405 |
important | +4.342 |
-) | +4.274 |
Neg logit contributions | |
WAY | -5.276 |
PET | -4.859 |
ARE | -4.389 |
ggle | -4.354 |
TW | -4.351 |
Token | enacted |
Token ID | 17814 |
Feature activation | +4.37e+00 |
Pos logit contributions | |
WAY | +2.428 |
PET | +2.217 |
ARE | +2.022 |
ggle | +2.006 |
VER | +1.997 |
Neg logit contributions | |
ividual | -2.520 |
anonymity | -2.453 |
favorite | -2.347 |
important | -2.267 |
-) | -2.246 |
Token | in |
Token ID | 287 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
anonymity | +3.272 |
ividual | +3.213 |
favorite | +3.000 |
important | +2.931 |
-) | +2.864 |
Neg logit contributions | |
WAY | -3.774 |
PET | -3.498 |
ARE | -3.212 |
ggle | -3.165 |
VERT | -3.137 |
Token | the |
Token ID | 262 |
Feature activation | +4.55e+00 |
Pos logit contributions | |
anonymity | +0.993 |
ividual | +0.987 |
favorite | +0.920 |
important | +0.895 |
-) | +0.885 |
Neg logit contributions | |
WAY | -1.066 |
PET | -0.979 |
ARE | -0.901 |
ggle | -0.886 |
VER | -0.880 |
Token | early |
Token ID | 1903 |
Feature activation | +3.29e+00 |
Pos logit contributions | |
anonymity | +3.434 |
ividual | +3.293 |
favorite | +3.067 |
important | +2.990 |
-) | +2.980 |
Neg logit contributions | |
WAY | -3.990 |
PET | -3.668 |
VER | -3.352 |
ARE | -3.346 |
ggle | -3.341 |
Token | 1990 |
Token ID | 6303 |
Feature activation | +5.44e+00 |
Pos logit contributions | |
anonymity | +2.502 |
ividual | +2.472 |
favorite | +2.275 |
important | +2.226 |
-) | +2.218 |
Neg logit contributions | |
WAY | -2.838 |
PET | -2.617 |
ggle | -2.382 |
ARE | -2.377 |
VER | -2.375 |
Token | particularly |
Token ID | 3573 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
WAY | +0.898 |
PET | +0.823 |
ARE | +0.756 |
ggle | +0.746 |
VER | +0.739 |
Neg logit contributions | |
ividual | -0.888 |
anonymity | -0.877 |
favorite | -0.828 |
important | -0.804 |
-) | -0.794 |
Token | interested |
Token ID | 4609 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
WAY | +2.317 |
PET | +2.113 |
ARE | +1.958 |
ggle | +1.928 |
VER | +1.923 |
Neg logit contributions | |
ividual | -2.158 |
anonymity | -2.104 |
favorite | -1.997 |
important | -1.923 |
-) | -1.907 |
Token | in |
Token ID | 287 |
Feature activation | +2.86e+00 |
Pos logit contributions | |
ividual | +2.009 |
anonymity | +1.979 |
favorite | +1.861 |
important | +1.802 |
-) | +1.789 |
Neg logit contributions | |
WAY | -2.330 |
PET | -2.147 |
ggle | -1.972 |
ARE | -1.968 |
VER | -1.946 |
Token | how |
Token ID | 703 |
Feature activation | -6.71e+00 |
Pos logit contributions | |
anonymity | +2.153 |
ividual | +2.112 |
favorite | +1.946 |
important | +1.903 |
-) | +1.874 |
Neg logit contributions | |
WAY | -2.498 |
PET | -2.303 |
ARE | -2.105 |
ggle | -2.093 |
TW | -2.076 |
Token | Good |
Token ID | 4599 |
Feature activation | -4.31e+00 |
Pos logit contributions | |
WAY | +5.090 |
PET | +4.635 |
ARE | +4.294 |
VER | +4.263 |
ggle | +4.189 |
Neg logit contributions | |
ividual | -5.615 |
anonymity | -5.458 |
favorite | -5.284 |
important | -5.069 |
-) | -5.040 |
Token | will |
Token ID | 10594 |
Feature activation | -3.52e+00 |
Pos logit contributions | |
WAY | +3.482 |
PET | +3.154 |
ARE | +2.918 |
VER | +2.855 |
ggle | +2.837 |
Neg logit contributions | |
ividual | -3.539 |
anonymity | -3.500 |
favorite | -3.264 |
important | -3.175 |
-) | -3.149 |
Token | determines |
Token ID | 15947 |
Feature activation | -8.84e+00 |
Pos logit contributions | |
WAY | +2.826 |
PET | +2.581 |
ARE | +2.372 |
ggle | +2.330 |
VER | +2.322 |
Neg logit contributions | |
ividual | -2.885 |
anonymity | -2.846 |
favorite | -2.695 |
important | -2.614 |
-) | -2.584 |
Token | what |
Token ID | 644 |
Feature activation | -3.88e+00 |
Pos logit contributions | |
WAY | +5.925 |
PET | +5.369 |
ARE | +4.991 |
VER | +4.862 |
ggle | +4.808 |
Neg logit contributions | |
ividual | -7.905 |
anonymity | -7.637 |
favorite | -7.437 |
important | -7.244 |
-) | -7.203 |
Token | it |
Token ID | 340 |
Feature activation | -3.75e+00 |
Pos logit contributions | |
WAY | +3.081 |
PET | +2.821 |
ARE | +2.600 |
VER | +2.549 |
ggle | +2.541 |
Neg logit contributions | |
ividual | -3.194 |
anonymity | -3.132 |
favorite | -2.995 |
important | -2.892 |
-) | -2.862 |
Token | pays |
Token ID | 13831 |
Feature activation | -5.81e+00 |
Pos logit contributions | |
WAY | +3.098 |
PET | +2.843 |
ARE | +2.621 |
ggle | +2.574 |
VER | +2.566 |
Neg logit contributions | |
ividual | -2.969 |
anonymity | -2.925 |
favorite | -2.774 |
important | -2.684 |
-) | -2.647 |
Token | in |
Token ID | 287 |
Feature activation | -3.40e+00 |
Pos logit contributions | |
WAY | +4.071 |
PET | +3.679 |
ARE | +3.373 |
VER | +3.277 |
ggle | +3.258 |
Neg logit contributions | |
ividual | -5.241 |
anonymity | -5.151 |
favorite | -4.972 |
important | -4.807 |
-) | -4.774 |
Token | treatment |
Token ID | 3513 |
Feature activation | -6.71e+00 |
Pos logit contributions | |
WAY | +4.450 |
PET | +4.009 |
ARE | +3.673 |
ggle | +3.565 |
TW | +3.558 |
Neg logit contributions | |
ividual | -5.582 |
anonymity | -5.395 |
favorite | -5.198 |
important | -5.031 |
-) | -4.994 |
Token | for |
Token ID | 329 |
Feature activation | -4.80e+00 |
Pos logit contributions | |
WAY | +4.975 |
PET | +4.553 |
ARE | +4.179 |
respectively | +4.107 |
ggle | +4.099 |
Neg logit contributions | |
ividual | -5.742 |
anonymity | -5.576 |
favorite | -5.386 |
important | -5.227 |
-) | -5.164 |
Token | all |
Token ID | 477 |
Feature activation | -7.32e+00 |
Pos logit contributions | |
WAY | +3.641 |
PET | +3.321 |
ARE | +3.029 |
ggle | +2.985 |
VER | +2.985 |
Neg logit contributions | |
ividual | -4.104 |
anonymity | -4.024 |
favorite | -3.871 |
important | -3.738 |
-) | -3.710 |
Token | , |
Token ID | 11 |
Feature activation | -2.54e-01 |
Pos logit contributions | |
WAY | +5.299 |
PET | +4.821 |
ARE | +4.376 |
VER | +4.332 |
respectively | +4.288 |
Neg logit contributions | |
ividual | -6.341 |
anonymity | -6.272 |
favorite | -6.033 |
-) | -5.807 |
important | -5.777 |
Token | � |
Token ID | 447 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
WAY | +0.206 |
PET | +0.188 |
ARE | +0.172 |
ggle | +0.171 |
VER | +0.169 |
Neg logit contributions | |
ividual | -0.207 |
anonymity | -0.204 |
favorite | -0.194 |
important | -0.188 |
-) | -0.185 |
Token | � |
Token ID | 251 |
Feature activation | -3.61e+00 |
Pos logit contributions | |
ividual | +0.127 |
anonymity | +0.126 |
favorite | +0.121 |
important | +0.118 |
-) | +0.117 |
Neg logit contributions | |
WAY | -0.069 |
PET | -0.061 |
ARE | -0.054 |
ggle | -0.052 |
VER | -0.052 |
Token | Mr |
Token ID | 1770 |
Feature activation | +6.97e+00 |
Pos logit contributions | |
WAY | +2.237 |
PET | +1.980 |
ARE | +1.761 |
VER | +1.721 |
ggle | +1.703 |
Neg logit contributions | |
ividual | -3.629 |
anonymity | -3.570 |
favorite | -3.416 |
important | -3.332 |
-) | -3.313 |
Token | . |
Token ID | 13 |
Feature activation | -4.45e+00 |
Pos logit contributions | |
anonymity | +4.442 |
ividual | +4.399 |
favorite | +4.354 |
important | +4.203 |
-) | +4.154 |
Neg logit contributions | |
WAY | -6.367 |
PET | -5.888 |
ggle | -5.508 |
ARE | -5.459 |
VER | -5.392 |
Token | Perez |
Token ID | 23058 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
WAY | +2.719 |
PET | +2.401 |
ARE | +2.143 |
ggle | +2.073 |
VER | +2.071 |
Neg logit contributions | |
ividual | -4.499 |
anonymity | -4.423 |
favorite | -4.234 |
important | -4.125 |
-) | -4.086 |
Token | said |
Token ID | 531 |
Feature activation | +6.58e+00 |
Pos logit contributions | |
anonymity | +6.012 |
ividual | +5.949 |
favorite | +5.460 |
important | +5.168 |
-) | +5.093 |
Neg logit contributions | |
WAY | -11.891 |
PET | -11.447 |
ggle | -10.748 |
VER | -10.446 |
ARE | -10.366 |
Token | . |
Token ID | 13 |
Feature activation | -5.90e-01 |
Pos logit contributions | |
anonymity | +4.377 |
ividual | +4.333 |
favorite | +3.979 |
important | +3.944 |
-) | +3.766 |
Neg logit contributions | |
WAY | -5.984 |
PET | -5.610 |
ggle | -5.176 |
ARE | -5.111 |
VERT | -5.097 |
Token |
|
Token ID | 198 |
Feature activation | -4.13e-01 |
Pos logit contributions | |
WAY | +1.989 |
PET | +1.829 |
ARE | +1.691 |
ggle | +1.668 |
VER | +1.660 |
Neg logit contributions | |
ividual | -1.723 |
anonymity | -1.694 |
favorite | -1.598 |
important | -1.544 |
-) | -1.525 |
Token |
|
Token ID | 198 |
Feature activation | -3.27e-01 |
Pos logit contributions | |
WAY | +0.287 |
PET | +0.258 |
ARE | +0.233 |
VER | +0.229 |
TW | +0.227 |
Neg logit contributions | |
ividual | -0.392 |
anonymity | -0.383 |
favorite | -0.361 |
important | -0.351 |
-) | -0.347 |
Token | making |
Token ID | 8601 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
WAY | +0.287 |
PET | +0.264 |
ARE | +0.245 |
ggle | +0.242 |
VER | +0.240 |
Neg logit contributions | |
ividual | -0.243 |
anonymity | -0.240 |
favorite | -0.228 |
important | -0.221 |
-) | -0.217 |
Token | a |
Token ID | 257 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
WAY | +10.035 |
strides | +9.172 |
PET | +9.025 |
VER | +8.474 |
ggle | +8.425 |
Neg logit contributions | |
ividual | -12.366 |
favorite | -11.313 |
anonymity | -11.034 |
interstitial | -10.490 |
important | -10.328 |
Token | lot |
Token ID | 1256 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
WAY | +7.836 |
PET | +7.256 |
ggle | +6.642 |
VER | +6.602 |
ARE | +6.546 |
Neg logit contributions | |
ividual | -8.888 |
anonymity | -8.345 |
favorite | -8.096 |
important | -7.737 |
interstitial | -7.705 |
Token | of |
Token ID | 286 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
WAY | +9.117 |
PET | +8.186 |
strides | +7.458 |
VER | +7.204 |
respectively | +7.194 |
Neg logit contributions | |
ividual | -13.646 |
anonymity | -12.783 |
favorite | -12.442 |
interstitial | -12.036 |
important | -11.923 |
Token | sense |
Token ID | 2565 |
Feature activation | -7.57e+00 |
Pos logit contributions | |
WAY | +10.334 |
strides | +9.285 |
PET | +9.086 |
POL | +8.566 |
ggle | +8.305 |
Neg logit contributions | |
ividual | -15.555 |
favorite | -14.169 |
anonymity | -13.527 |
pecially | -13.258 |
interstitial | -13.056 |
Token | . |
Token ID | 13 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
WAY | +5.777 |
PET | +5.231 |
ARE | +4.763 |
ggle | +4.731 |
VER | +4.717 |
Neg logit contributions | |
ividual | -6.357 |
anonymity | -6.196 |
favorite | -5.957 |
important | -5.670 |
-) | -5.616 |
Token | Its |
Token ID | 6363 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
anonymity | +1.676 |
ividual | +1.667 |
favorite | +1.589 |
-) | +1.563 |
important | +1.559 |
Neg logit contributions | |
WAY | -1.663 |
PET | -1.517 |
ARE | -1.398 |
ggle | -1.387 |
VER | -1.363 |
Token | admittedly |
Token ID | 33603 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
WAY | +1.724 |
PET | +1.573 |
ARE | +1.443 |
ggle | +1.421 |
VER | +1.414 |
Neg logit contributions | |
ividual | -1.779 |
anonymity | -1.749 |
favorite | -1.660 |
important | -1.610 |
-) | -1.592 |
Token | high |
Token ID | 1029 |
Feature activation | -4.38e+00 |
Pos logit contributions | |
anonymity | +8.800 |
ividual | +7.904 |
important | +7.677 |
-) | +7.669 |
favorite | +7.560 |
Neg logit contributions | |
WAY | -9.022 |
PET | -8.293 |
ARE | -7.626 |
TW | -7.427 |
ggle | -7.419 |
Token | star |
Token ID | 7364 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
ividual | +1.306 |
anonymity | +1.269 |
favorite | +1.246 |
important | +1.183 |
-) | +1.174 |
Neg logit contributions | |
WAY | -2.094 |
PET | -1.934 |
ARE | -1.807 |
ggle | -1.807 |
TW | -1.769 |
Token | red |
Token ID | 445 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
WAY | +0.186 |
PET | +0.173 |
ARE | +0.162 |
ggle | +0.161 |
VER | +0.160 |
Neg logit contributions | |
ividual | -0.114 |
anonymity | -0.111 |
favorite | -0.104 |
important | -0.100 |
-) | -0.098 |
Token | and |
Token ID | 290 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
WAY | +1.076 |
PET | +0.984 |
ARE | +0.903 |
ggle | +0.889 |
VER | +0.883 |
Neg logit contributions | |
ividual | -1.111 |
anonymity | -1.094 |
favorite | -1.036 |
important | -1.007 |
-) | -0.996 |
Token | are |
Token ID | 389 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
ividual | +1.276 |
anonymity | +1.264 |
favorite | +1.199 |
-) | +1.162 |
important | +1.158 |
Neg logit contributions | |
WAY | -1.234 |
PET | -1.125 |
ARE | -1.020 |
ggle | -1.019 |
VERT | -1.001 |
Token | the |
Token ID | 262 |
Feature activation | -2.26e+00 |
Pos logit contributions | |
WAY | +3.807 |
PET | +3.486 |
ARE | +3.231 |
VER | +3.181 |
ggle | +3.164 |
Neg logit contributions | |
ividual | -3.365 |
anonymity | -3.280 |
favorite | -3.090 |
important | -2.985 |
-) | -2.931 |
Token | only |
Token ID | 691 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
WAY | +1.919 |
PET | +1.760 |
ARE | +1.623 |
ggle | +1.599 |
VER | +1.598 |
Neg logit contributions | |
ividual | -1.762 |
anonymity | -1.730 |
favorite | -1.633 |
important | -1.583 |
-) | -1.562 |
Token | on |
Token ID | 319 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
WAY | +11.034 |
PET | +9.530 |
respectively | +9.199 |
VER | +9.129 |
ARE | +8.903 |
Neg logit contributions | |
ividual | -13.096 |
anonymity | -12.419 |
favorite | -12.305 |
interstitial | -11.768 |
pecially | -11.761 |
Token | - |
Token ID | 12 |
Feature activation | -2.83e+00 |
Pos logit contributions | |
WAY | +0.270 |
PET | +0.252 |
ARE | +0.238 |
ggle | +0.235 |
VER | +0.235 |
Neg logit contributions | |
ividual | -0.118 |
anonymity | -0.115 |
favorite | -0.106 |
important | -0.100 |
-) | -0.099 |
Token | set |
Token ID | 2617 |
Feature activation | -3.70e+00 |
Pos logit contributions | |
WAY | +2.403 |
PET | +2.208 |
ARE | +2.036 |
ggle | +2.002 |
VER | +1.997 |
Neg logit contributions | |
ividual | -2.197 |
anonymity | -2.159 |
favorite | -2.032 |
important | -1.967 |
-) | -1.947 |
Token | crew |
Token ID | 5462 |
Feature activation | -7.89e+00 |
Pos logit contributions | |
WAY | +2.775 |
PET | +2.511 |
ARE | +2.290 |
ggle | +2.253 |
VER | +2.245 |
Neg logit contributions | |
ividual | -3.239 |
anonymity | -3.188 |
favorite | -3.041 |
important | -2.947 |
-) | -2.919 |
Token | , |
Token ID | 11 |
Feature activation | -4.07e+00 |
Pos logit contributions | |
WAY | +6.129 |
PET | +5.551 |
ARE | +5.139 |
VER | +5.088 |
respectively | +5.060 |
Neg logit contributions | |
ividual | -6.442 |
anonymity | -6.274 |
favorite | -6.032 |
important | -5.756 |
-) | -5.747 |
Token | in |
Token ID | 287 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
WAY | +3.955 |
PET | +3.590 |
ARE | +3.333 |
VER | +3.292 |
respectively | +3.268 |
Neg logit contributions | |
ividual | -3.689 |
anonymity | -3.597 |
favorite | -3.424 |
important | -3.295 |
-) | -3.263 |
Token | Baltimore |
Token ID | 10346 |
Feature activation | -9.39e+00 |
Pos logit contributions | |
WAY | +2.625 |
PET | +2.389 |
ARE | +2.206 |
ggle | +2.166 |
VER | +2.163 |
Neg logit contributions | |
ividual | -2.697 |
anonymity | -2.646 |
favorite | -2.514 |
important | -2.434 |
-) | -2.414 |
Token | in |
Token ID | 287 |
Feature activation | -9.21e+00 |
Pos logit contributions | |
WAY | +6.922 |
PET | +6.142 |
VER | +5.741 |
ARE | +5.701 |
respectively | +5.672 |
Neg logit contributions | |
ividual | -7.889 |
anonymity | -7.765 |
favorite | -7.437 |
important | -7.157 |
-) | -7.086 |
Token | half |
Token ID | 2063 |
Feature activation | -8.82e+00 |
Pos logit contributions | |
WAY | +6.385 |
PET | +5.582 |
VER | +5.256 |
ARE | +5.222 |
strides | +5.215 |
Neg logit contributions | |
ividual | -8.148 |
anonymity | -7.855 |
favorite | -7.644 |
important | -7.407 |
-) | -7.293 |
Token | in |
Token ID | 287 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
WAY | +6.527 |
PET | +5.776 |
ARE | +5.348 |
respectively | +5.339 |
VER | +5.271 |
Neg logit contributions | |
ividual | -7.524 |
anonymity | -7.375 |
favorite | -7.074 |
important | -6.760 |
interstitial | -6.705 |
Token | recent |
Token ID | 2274 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
WAY | +10.145 |
strides | +8.584 |
PET | +8.484 |
respectively | +8.460 |
VER | +8.304 |
Neg logit contributions | |
ividual | -14.023 |
anonymity | -13.333 |
favorite | -13.319 |
important | -12.853 |
interstitial | -12.848 |
Token | years |
Token ID | 812 |
Feature activation | -7.95e+00 |
Pos logit contributions | |
WAY | +7.882 |
strides | +6.654 |
PET | +6.359 |
POL | +6.013 |
respectively | +5.870 |
Neg logit contributions | |
ividual | -17.262 |
favorite | -16.676 |
anonymity | -16.343 |
important | -16.264 |
interstitial | -16.043 |
Token | , |
Token ID | 11 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
WAY | +5.959 |
PET | +5.378 |
respectively | +4.897 |
ARE | +4.896 |
VER | +4.867 |
Neg logit contributions | |
ividual | -6.690 |
anonymity | -6.596 |
favorite | -6.330 |
important | -6.063 |
-) | -6.024 |
Token | and |
Token ID | 290 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
WAY | +0.134 |
PET | +0.123 |
ARE | +0.112 |
ggle | +0.111 |
VER | +0.110 |
Neg logit contributions | |
ividual | -0.135 |
anonymity | -0.133 |
favorite | -0.125 |
important | -0.122 |
-) | -0.121 |
Token | if |
Token ID | 611 |
Feature activation | -9.17e+00 |
Pos logit contributions | |
ividual | +0.929 |
anonymity | +0.928 |
favorite | +0.863 |
important | +0.851 |
-) | +0.836 |
Neg logit contributions | |
WAY | -0.923 |
PET | -0.846 |
ARE | -0.764 |
ggle | -0.763 |
VERT | -0.752 |
Token | anything |
Token ID | 1997 |
Feature activation | +6.22e+00 |
Pos logit contributions | |
WAY | +6.811 |
PET | +6.141 |
ARE | +5.879 |
VER | +5.769 |
respectively | +5.659 |
Neg logit contributions | |
ividual | -7.657 |
favorite | -7.264 |
anonymity | -7.145 |
important | -6.785 |
-) | -6.776 |
Token | of |
Token ID | 286 |
Feature activation | -8.93e+00 |
Pos logit contributions | |
WAY | +5.066 |
PET | +4.557 |
VER | +4.176 |
ARE | +4.167 |
ggle | +4.152 |
Neg logit contributions | |
ividual | -6.462 |
anonymity | -6.171 |
favorite | -6.042 |
-) | -5.812 |
important | -5.802 |
Token | school |
Token ID | 1524 |
Feature activation | -4.21e+00 |
Pos logit contributions | |
WAY | +6.694 |
PET | +6.005 |
ARE | +5.638 |
VER | +5.536 |
POL | +5.529 |
Neg logit contributions | |
ividual | -7.503 |
anonymity | -7.070 |
favorite | -6.995 |
-) | -6.672 |
important | -6.667 |
Token | systems |
Token ID | 3341 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
WAY | +4.527 |
PET | +4.214 |
ARE | +3.995 |
VER | +3.923 |
ggle | +3.914 |
Neg logit contributions | |
ividual | -2.312 |
anonymity | -2.201 |
favorite | -2.061 |
important | -1.948 |
-) | -1.880 |
Token | throughout |
Token ID | 3690 |
Feature activation | -2.56e+00 |
Pos logit contributions | |
WAY | +1.294 |
PET | +1.174 |
ARE | +1.071 |
ggle | +1.053 |
VER | +1.047 |
Neg logit contributions | |
ividual | -1.488 |
anonymity | -1.468 |
favorite | -1.395 |
important | -1.356 |
-) | -1.341 |
Token | Maryland |
Token ID | 10769 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
WAY | +2.082 |
PET | +1.901 |
ARE | +1.749 |
ggle | +1.721 |
VER | +1.714 |
Neg logit contributions | |
ividual | -2.076 |
anonymity | -2.044 |
favorite | -1.936 |
important | -1.877 |
-) | -1.856 |
Token | for |
Token ID | 329 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
WAY | +7.652 |
PET | +6.896 |
VER | +6.394 |
respectively | +6.350 |
ARE | +6.270 |
Neg logit contributions | |
ividual | -9.613 |
anonymity | -9.385 |
favorite | -9.053 |
-) | -8.783 |
important | -8.706 |
Token | many |
Token ID | 867 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
WAY | +10.897 |
strides | +9.530 |
respectively | +9.392 |
PET | +9.273 |
VER | +9.087 |
Neg logit contributions | |
ividual | -15.400 |
favorite | -14.405 |
interstitial | -14.319 |
anonymity | -14.214 |
important | -13.889 |
Token | years |
Token ID | 812 |
Feature activation | -7.68e+00 |
Pos logit contributions | |
WAY | +6.009 |
PET | +4.878 |
strides | +4.740 |
lengths | +4.393 |
respectively | +4.343 |
Neg logit contributions | |
ividual | -15.136 |
anonymity | -14.819 |
favorite | -14.744 |
interstitial | -14.611 |
-) | -14.166 |
Token | . |
Token ID | 13 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
WAY | +5.742 |
PET | +5.220 |
ARE | +4.743 |
VER | +4.717 |
respectively | +4.692 |
Neg logit contributions | |
ividual | -6.503 |
anonymity | -6.359 |
favorite | -6.115 |
important | -5.881 |
-) | -5.835 |
Token | Parents |
Token ID | 28231 |
Feature activation | +4.38e+00 |
Pos logit contributions | |
WAY | +1.244 |
PET | +1.130 |
ARE | +1.032 |
ggle | +1.021 |
VER | +1.010 |
Neg logit contributions | |
ividual | -1.371 |
anonymity | -1.355 |
favorite | -1.289 |
important | -1.254 |
-) | -1.241 |
Token | who |
Token ID | 508 |
Feature activation | -9.18e+00 |
Pos logit contributions | |
anonymity | +3.543 |
ividual | +3.469 |
favorite | +3.231 |
important | +3.197 |
-) | +3.167 |
Neg logit contributions | |
WAY | -3.521 |
PET | -3.249 |
VERT | -2.919 |
ARE | -2.912 |
TW | -2.898 |
Token | , |
Token ID | 11 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
ividual | +0.138 |
anonymity | +0.138 |
favorite | +0.129 |
important | +0.126 |
-) | +0.123 |
Neg logit contributions | |
WAY | -0.143 |
PET | -0.131 |
ARE | -0.120 |
ggle | -0.119 |
VER | -0.117 |
Token | this |
Token ID | 428 |
Feature activation | +2.65e+00 |
Pos logit contributions | |
WAY | +1.184 |
PET | +1.073 |
ARE | +0.976 |
ggle | +0.960 |
VER | +0.954 |
Neg logit contributions | |
ividual | -1.400 |
anonymity | -1.383 |
favorite | -1.314 |
important | -1.278 |
-) | -1.264 |
Token | was |
Token ID | 373 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
anonymity | +2.140 |
ividual | +2.121 |
favorite | +1.992 |
important | +1.944 |
-) | +1.898 |
Neg logit contributions | |
WAY | -2.161 |
PET | -1.993 |
ARE | -1.810 |
ggle | -1.808 |
TW | -1.773 |
Token | the |
Token ID | 262 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
WAY | +2.493 |
PET | +2.262 |
ARE | +2.070 |
ggle | +2.035 |
VER | +2.034 |
Neg logit contributions | |
ividual | -2.733 |
anonymity | -2.675 |
favorite | -2.550 |
important | -2.471 |
-) | -2.454 |
Token | only |
Token ID | 691 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
anonymity | +1.894 |
ividual | +1.841 |
favorite | +1.757 |
important | +1.688 |
-) | +1.646 |
Neg logit contributions | |
WAY | -2.238 |
PET | -2.101 |
ARE | -1.922 |
ggle | -1.903 |
VER | -1.886 |
Token | place |
Token ID | 1295 |
Feature activation | -1.89e+01 |
Pos logit contributions | |
WAY | +8.291 |
PET | +7.123 |
ARE | +6.859 |
strides | +6.710 |
VER | +6.707 |
Neg logit contributions | |
ividual | -9.464 |
anonymity | -8.686 |
favorite | -8.636 |
-) | -8.409 |
important | -8.337 |
Token | in |
Token ID | 287 |
Feature activation | -7.59e-01 |
Pos logit contributions | |
WAY | +11.280 |
PET | +9.584 |
respectively | +9.532 |
VER | +9.498 |
ARE | +9.206 |
Neg logit contributions | |
ividual | -15.979 |
favorite | -14.666 |
interstitial | -14.219 |
inav | -14.141 |
anonymity | -14.133 |
Token | the |
Token ID | 262 |
Feature activation | +9.66e-01 |
Pos logit contributions | |
WAY | +0.619 |
PET | +0.567 |
ARE | +0.519 |
ggle | +0.512 |
TW | +0.504 |
Neg logit contributions | |
ividual | -0.618 |
anonymity | -0.613 |
favorite | -0.577 |
important | -0.560 |
-) | -0.553 |
Token | city |
Token ID | 1748 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
anonymity | +0.665 |
ividual | +0.662 |
favorite | +0.612 |
important | +0.595 |
-) | +0.583 |
Neg logit contributions | |
WAY | -0.902 |
PET | -0.842 |
ARE | -0.775 |
ggle | -0.768 |
VER | -0.761 |
Token | of |
Token ID | 286 |
Feature activation | -6.52e-01 |
Pos logit contributions | |
WAY | +9.570 |
PET | +8.254 |
respectively | +7.894 |
VER | +7.804 |
strides | +7.608 |
Neg logit contributions | |
ividual | -13.536 |
favorite | -12.752 |
anonymity | -12.355 |
interstitial | -12.254 |
important | -12.192 |
Token | Daytona |
Token ID | 47299 |
Feature activation | -4.55e+00 |
Pos logit contributions | |
WAY | +0.594 |
PET | +0.549 |
ARE | +0.508 |
ggle | +0.501 |
VER | +0.497 |
Neg logit contributions | |
ividual | -0.465 |
anonymity | -0.465 |
favorite | -0.433 |
important | -0.419 |
-) | -0.412 |