Token | gospel |
Token ID | 21443 |
Feature activation | +9.20e-01 |
Pos logit contributions | |
newfound | +16.101 |
companions | +16.050 |
unborn | +15.794 |
enduring | +15.662 |
awakening | +15.206 |
Neg logit contributions | |
libel | -12.478 |
offensive | -10.511 |
rubbish | -9.923 |
ograph | -9.776 |
ictionary | -9.572 |
Token | : |
Token ID | 25 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
companions | +10.775 |
unborn | +10.484 |
newfound | +10.348 |
enduring | +10.292 |
blessings | +10.172 |
Neg logit contributions | |
libel | -10.238 |
offensive | -8.647 |
rubbish | -8.431 |
Serie | -8.256 |
vitro | -7.876 |
Token | Jesus |
Token ID | 5803 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
companions | +28.406 |
blessings | +27.239 |
enduring | +27.006 |
unborn | +26.970 |
healing | +26.518 |
Neg logit contributions | |
libel | -17.187 |
ictionary | -14.395 |
offensive | -14.112 |
ograph | -13.543 |
rubbish | -13.489 |
Token | � |
Token ID | 447 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
unborn | +21.460 |
companions | +21.158 |
enduring | +20.747 |
awakened | +20.699 |
awakening | +20.591 |
Neg logit contributions | |
libel | -17.259 |
rubbish | -14.323 |
offensive | -13.682 |
Serie | -13.138 |
vitro | -13.126 |
Token | � |
Token ID | 247 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
libel | +1.918 |
rubbish | +1.493 |
offensive | +1.480 |
Serie | +1.389 |
punt | +1.388 |
Neg logit contributions | |
companions | -2.665 |
unborn | -2.630 |
newfound | -2.615 |
grandchildren | -2.574 |
caregivers | -2.525 |
Token | s |
Token ID | 82 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
companions | +15.731 |
unborn | +15.142 |
blessings | +15.040 |
grandchildren | +14.916 |
followers | +14.898 |
Neg logit contributions | |
libel | -15.281 |
rubbish | -13.145 |
offensive | -12.141 |
punt | -11.933 |
tabloid | -11.871 |
Token | birth |
Token ID | 4082 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
companions | +31.143 |
unborn | +30.751 |
enduring | +30.221 |
arrival | +29.902 |
newfound | +29.794 |
Neg logit contributions | |
libel | -17.035 |
ograph | -14.204 |
ictionary | -13.636 |
offensive | -13.626 |
England | -13.279 |
Token | , |
Token ID | 11 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
companions | +13.490 |
unborn | +13.256 |
attendants | +12.849 |
blessings | +12.588 |
newfound | +12.536 |
Neg logit contributions | |
libel | -13.753 |
rubbish | -11.957 |
Serie | -11.537 |
offensive | -11.475 |
vitro | -11.132 |
Token | death |
Token ID | 1918 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
companions | +28.356 |
unborn | +26.896 |
blessings | +26.633 |
enduring | +26.468 |
Resurrection | +26.312 |
Neg logit contributions | |
libel | -17.859 |
offensive | -15.546 |
ictionary | -15.172 |
rubbish | -14.907 |
ograph | -14.777 |
Token | , |
Token ID | 11 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
companions | +16.872 |
unborn | +16.316 |
blessings | +15.793 |
awakening | +15.673 |
attendants | +15.582 |
Neg logit contributions | |
libel | -19.374 |
rubbish | -17.217 |
offensive | -16.411 |
Serie | -16.057 |
wik | -15.885 |
Token | and |
Token ID | 290 |
Feature activation | +2.67e+00 |
Pos logit contributions | |
companions | +23.125 |
blessings | +22.423 |
unborn | +22.113 |
healing | +21.683 |
awakening | +21.669 |
Neg logit contributions | |
libel | -17.970 |
offensive | -16.014 |
ograph | -15.274 |
rubbish | -15.245 |
ictionary | -14.831 |
Token | nation |
Token ID | 3277 |
Feature activation | +9.10e-01 |
Pos logit contributions | |
grandchildren | +24.130 |
unborn | +23.669 |
newfound | +23.406 |
companions | +23.094 |
awakening | +22.995 |
Neg logit contributions | |
libel | -17.518 |
offensive | -15.274 |
ograph | -14.849 |
Serie | -14.354 |
ictionary | -14.341 |
Token | . |
Token ID | 13 |
Feature activation | +7.18e-01 |
Pos logit contributions | |
unborn | +10.288 |
grandchildren | +10.177 |
companions | +10.089 |
enduring | +9.879 |
newfound | +9.875 |
Neg logit contributions | |
libel | -10.430 |
rubbish | -8.890 |
offensive | -8.574 |
Serie | -8.369 |
punt | -8.172 |
Token | I |
Token ID | 314 |
Feature activation | +6.32e-01 |
Pos logit contributions | |
grandchildren | +7.468 |
unborn | +7.430 |
companions | +7.385 |
survivors | +7.144 |
newfound | +7.093 |
Neg logit contributions | |
libel | -9.324 |
rubbish | -8.033 |
offensive | -7.810 |
vitro | -7.551 |
advert | -7.374 |
Token | wish |
Token ID | 4601 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
companions | +7.431 |
unborn | +7.382 |
grandchildren | +7.316 |
newfound | +7.216 |
awakened | +7.205 |
Neg logit contributions | |
libel | -7.464 |
offensive | -6.372 |
rubbish | -6.297 |
Serie | -6.048 |
vitro | -5.886 |
Token | you |
Token ID | 345 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
companions | +17.732 |
grandchildren | +17.613 |
unborn | +17.464 |
survivors | +17.339 |
blessings | +16.991 |
Neg logit contributions | |
libel | -15.317 |
offensive | -13.659 |
rubbish | -12.975 |
ictionary | -12.836 |
vitro | -12.749 |
Token | the |
Token ID | 262 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
blessings | +27.884 |
companions | +27.720 |
grandchildren | +27.436 |
newfound | +26.636 |
enduring | +26.302 |
Neg logit contributions | |
libel | -19.925 |
offensive | -15.714 |
rubbish | -15.699 |
vitro | -15.547 |
ograph | -15.332 |
Token | best |
Token ID | 1266 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
blessings | +28.969 |
companions | +28.134 |
grandchildren | +27.134 |
enduring | +26.935 |
newfound | +26.799 |
Neg logit contributions | |
libel | -19.852 |
offensive | -16.748 |
rubbish | -16.192 |
ictionary | -16.111 |
vitro | -16.024 |
Token | and |
Token ID | 290 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
grandchildren | +15.461 |
unborn | +15.459 |
companions | +15.381 |
blessings | +15.034 |
remaining | +14.696 |
Neg logit contributions | |
libel | -15.503 |
rubbish | -13.212 |
offensive | -12.935 |
vitro | -12.553 |
advert | -12.194 |
Token | the |
Token ID | 262 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
blessings | +23.966 |
grandchildren | +23.852 |
companions | +23.799 |
unborn | +23.244 |
newfound | +23.078 |
Neg logit contributions | |
libel | -17.540 |
offensive | -15.212 |
ictionary | -14.692 |
vitro | -14.665 |
rubbish | -14.601 |
Token | best |
Token ID | 1266 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
blessings | +31.912 |
companions | +30.953 |
grandchildren | +30.415 |
unborn | +30.033 |
newfound | +29.645 |
Neg logit contributions | |
libel | -16.923 |
offensive | -14.364 |
rubbish | -13.968 |
ictionary | -13.863 |
Anyway | -13.808 |
Token | of |
Token ID | 286 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
grandchildren | +17.917 |
blessings | +17.855 |
companions | +17.652 |
unborn | +17.461 |
arrival | +16.740 |
Neg logit contributions | |
libel | -15.507 |
rubbish | -13.057 |
offensive | -12.767 |
vitro | -12.419 |
Serie | -12.233 |
Token | with |
Token ID | 351 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
companions | +15.987 |
awakening | +15.729 |
unborn | +15.418 |
enduring | +15.223 |
grandchildren | +15.184 |
Neg logit contributions | |
libel | -14.092 |
offensive | -11.099 |
rubbish | -11.048 |
Serie | -10.641 |
vitro | -10.622 |
Token | a |
Token ID | 257 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
companions | +21.131 |
newfound | +20.179 |
blessings | +20.055 |
survivors | +20.026 |
grandchildren | +19.811 |
Neg logit contributions | |
libel | -15.663 |
offensive | -12.397 |
ictionary | -11.627 |
pub | -11.445 |
rubbish | -11.357 |
Token | view |
Token ID | 1570 |
Feature activation | +7.71e-01 |
Pos logit contributions | |
newfound | +19.668 |
companions | +19.245 |
awakening | +18.592 |
sunrise | +18.197 |
enduring | +18.131 |
Neg logit contributions | |
libel | -15.120 |
offensive | -12.898 |
ograph | -11.583 |
rubbish | -11.552 |
redit | -11.551 |
Token | to |
Token ID | 284 |
Feature activation | +2.42e+00 |
Pos logit contributions | |
companions | +7.574 |
awakening | +7.369 |
unborn | +7.342 |
newfound | +7.081 |
grandchildren | +7.058 |
Neg logit contributions | |
libel | -10.445 |
offensive | -8.892 |
rubbish | -8.746 |
Serie | -8.572 |
punt | -8.420 |
Token | ensuring |
Token ID | 13359 |
Feature activation | +2.95e+00 |
Pos logit contributions | |
awakening | +25.121 |
companions | +24.471 |
enduring | +24.182 |
healing | +23.544 |
unborn | +23.468 |
Neg logit contributions | |
libel | -17.605 |
offensive | -14.779 |
ictionary | -13.871 |
ograph | -13.684 |
shit | -13.524 |
Token | the |
Token ID | 262 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
companions | +26.390 |
unborn | +26.223 |
enduring | +25.940 |
grandchildren | +25.816 |
survivors | +25.790 |
Neg logit contributions | |
libel | -20.182 |
offensive | -16.332 |
ictionary | -16.143 |
ograph | -15.895 |
Serie | -15.413 |
Token | future |
Token ID | 2003 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
companions | +30.096 |
unborn | +30.085 |
blessings | +29.571 |
enduring | +29.340 |
awakening | +29.196 |
Neg logit contributions | |
libel | -19.373 |
offensive | -15.281 |
ograph | -15.204 |
ictionary | -15.035 |
shit | -14.565 |
Token | health |
Token ID | 1535 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
companions | +21.585 |
unborn | +20.601 |
blessings | +20.407 |
grandchildren | +20.404 |
enduring | +19.776 |
Neg logit contributions | |
libel | -17.950 |
offensive | -14.994 |
ograph | -14.331 |
ictionary | -13.746 |
shit | -13.716 |
Token | of |
Token ID | 286 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
companions | +14.136 |
unborn | +13.409 |
blessings | +13.078 |
awakening | +13.023 |
grandchildren | +12.952 |
Neg logit contributions | |
libel | -15.237 |
offensive | -13.115 |
rubbish | -12.855 |
vitro | -12.381 |
punt | -12.172 |
Token | the |
Token ID | 262 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
unborn | +15.528 |
companions | +15.240 |
grandchildren | +15.026 |
survivors | +14.831 |
newfound | +14.284 |
Neg logit contributions | |
libel | -14.878 |
offensive | -12.269 |
ograph | -11.706 |
advert | -11.471 |
rubbish | -11.435 |
Token | planet |
Token ID | 5440 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
unborn | +20.298 |
companions | +19.779 |
grandchildren | +19.248 |
survivors | +19.170 |
remaining | +18.708 |
Neg logit contributions | |
libel | -17.444 |
offensive | -14.926 |
ograph | -14.262 |
ictionary | -14.135 |
advert | -13.667 |
Token | by |
Token ID | 416 |
Feature activation | +9.61e-01 |
Pos logit contributions | |
companions | +7.088 |
unborn | +7.024 |
newfound | +6.914 |
grandchildren | +6.864 |
survivors | +6.746 |
Neg logit contributions | |
libel | -6.869 |
rubbish | -5.768 |
offensive | -5.643 |
Serie | -5.454 |
punt | -5.426 |
Token | our |
Token ID | 674 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
newfound | +11.419 |
companions | +11.296 |
unborn | +11.126 |
grandchildren | +11.084 |
awakening | +11.081 |
Neg logit contributions | |
libel | -10.337 |
rubbish | -8.572 |
offensive | -8.271 |
Serie | -8.169 |
ograph | -8.112 |
Token | technologies |
Token ID | 8514 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
newfound | +22.730 |
grandchildren | +21.925 |
companions | +21.747 |
awakening | +21.247 |
arrival | +21.189 |
Neg logit contributions | |
libel | -15.791 |
offensive | -13.104 |
ictionary | -12.858 |
ograph | -12.697 |
Serie | -12.691 |
Token | and |
Token ID | 290 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
companions | +17.712 |
grandchildren | +17.629 |
unborn | +17.573 |
enduring | +17.538 |
newfound | +17.463 |
Neg logit contributions | |
libel | -17.916 |
rubbish | -14.861 |
offensive | -14.530 |
Serie | -14.286 |
advert | -13.945 |
Token | enjoy |
Token ID | 2883 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
companions | +18.585 |
newfound | +18.564 |
grandchildren | +18.332 |
enduring | +18.261 |
survivors | +17.875 |
Neg logit contributions | |
libel | -15.365 |
offensive | -12.696 |
Serie | -12.687 |
rubbish | -12.328 |
ictionary | -12.129 |
Token | their |
Token ID | 511 |
Feature activation | +3.29e+00 |
Pos logit contributions | |
newfound | +26.635 |
enduring | +26.395 |
companions | +25.617 |
grandchildren | +24.800 |
blessings | +24.565 |
Neg logit contributions | |
libel | -18.850 |
rubbish | -15.609 |
ograph | -15.011 |
offensive | -14.847 |
shit | -14.712 |
Token | abundant |
Token ID | 23263 |
Feature activation | +2.43e+00 |
Pos logit contributions | |
blessings | +31.101 |
newfound | +30.645 |
enduring | +30.392 |
companions | +30.113 |
arrival | +28.885 |
Neg logit contributions | |
libel | -18.404 |
offensive | -15.791 |
ograph | -15.738 |
England | -15.293 |
Serie | -15.171 |
Token | bounty |
Token ID | 24180 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
blessings | +25.348 |
companions | +25.067 |
newfound | +24.265 |
grandchildren | +23.639 |
vitality | +23.427 |
Neg logit contributions | |
libel | -17.574 |
offensive | -15.149 |
ictionary | -14.952 |
England | -14.558 |
shit | -14.462 |
Token | , |
Token ID | 11 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
companions | +15.719 |
unborn | +15.313 |
grandchildren | +15.221 |
blessings | +15.045 |
remaining | +14.900 |
Neg logit contributions | |
libel | -16.367 |
rubbish | -13.465 |
offensive | -13.084 |
advert | -12.850 |
Serie | -12.457 |
Token | we |
Token ID | 356 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
companions | +18.931 |
enduring | +18.682 |
newfound | +18.576 |
grandchildren | +18.527 |
survivors | +18.436 |
Neg logit contributions | |
libel | -17.170 |
rubbish | -14.533 |
offensive | -14.391 |
ictionary | -14.055 |
ograph | -13.939 |
Token | must |
Token ID | 1276 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
companions | +10.590 |
grandchildren | +10.498 |
survivors | +10.115 |
unborn | +10.110 |
awakened | +9.950 |
Neg logit contributions | |
libel | -15.542 |
offensive | -13.341 |
rubbish | -13.339 |
Serie | -12.896 |
vitro | -12.742 |
Token | Great |
Token ID | 3878 |
Feature activation | +2.43e+00 |
Pos logit contributions | |
grandchildren | +21.830 |
unborn | +21.787 |
companions | +20.981 |
blessings | +20.719 |
followers | +20.684 |
Neg logit contributions | |
libel | -14.229 |
rubbish | -11.837 |
offensive | -11.758 |
vitro | -11.369 |
Serie | -10.908 |
Token | day |
Token ID | 1110 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
grandchildren | +26.637 |
unborn | +25.932 |
blessings | +25.696 |
newfound | +25.690 |
companions | +25.419 |
Neg logit contributions | |
libel | -14.928 |
offensive | -12.129 |
rubbish | -11.923 |
Serie | -11.419 |
redit | -11.179 |
Token | 2 |
Token ID | 362 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
unborn | +20.461 |
grandchildren | +20.129 |
companions | +20.047 |
blessings | +19.674 |
awakening | +19.437 |
Neg logit contributions | |
libel | -15.933 |
offensive | -13.542 |
rubbish | -13.112 |
vitro | -12.629 |
Serie | -12.167 |
Token | announce |
Token ID | 5453 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
grandchildren | +20.872 |
unborn | +20.693 |
blessings | +20.144 |
companions | +20.074 |
newfound | +19.858 |
Neg logit contributions | |
libel | -13.653 |
rubbish | -11.220 |
offensive | -11.061 |
vitro | -10.602 |
Serie | -10.574 |
Token | 2 |
Token ID | 362 |
Feature activation | +2.47e+00 |
Pos logit contributions | |
unborn | +19.293 |
grandchildren | +18.608 |
newfound | +18.286 |
companions | +18.199 |
arrival | +18.170 |
Neg logit contributions | |
libel | -12.904 |
rubbish | -10.688 |
offensive | -10.512 |
Serie | -9.911 |
vitro | -9.676 |
Token | the |
Token ID | 262 |
Feature activation | +3.29e+00 |
Pos logit contributions | |
unborn | +27.208 |
grandchildren | +26.619 |
blessings | +25.770 |
companions | +25.562 |
newfound | +25.108 |
Neg logit contributions | |
libel | -13.764 |
offensive | -11.449 |
rubbish | -11.193 |
Serie | -10.614 |
ictionary | -10.432 |
Token | social |
Token ID | 1919 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
unborn | +32.261 |
grandchildren | +31.523 |
arrival | +30.731 |
blessings | +30.377 |
newfound | +29.451 |
Neg logit contributions | |
libel | -15.061 |
offensive | -11.935 |
rubbish | -11.381 |
Anyway | -11.248 |
ictionary | -11.234 |
Token | media |
Token ID | 2056 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
companions | +17.485 |
awakening | +16.944 |
blessings | +16.701 |
unborn | +16.641 |
grandchildren | +16.555 |
Neg logit contributions | |
libel | -12.997 |
offensive | -10.957 |
vitro | -10.818 |
rubbish | -10.763 |
Serie | -10.568 |
Token | world |
Token ID | 995 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
companions | +17.209 |
grandchildren | +16.718 |
awakening | +16.650 |
followers | +16.622 |
newfound | +16.466 |
Neg logit contributions | |
libel | -12.058 |
offensive | -9.959 |
vitro | -9.551 |
Serie | -9.438 |
rubbish | -9.275 |
Token | !!! |
Token ID | 10185 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
companions | +18.777 |
awakening | +18.321 |
newfound | +18.296 |
grandchildren | +18.287 |
blessings | +18.128 |
Neg logit contributions | |
libel | -14.419 |
offensive | -12.404 |
vitro | -11.701 |
rubbish | -11.555 |
Serie | -11.299 |
Token | Exc |
Token ID | 25268 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
unborn | +17.047 |
newfound | +16.803 |
blessings | +16.635 |
grandchildren | +16.629 |
companions | +16.412 |
Neg logit contributions | |
libel | -13.843 |
offensive | -11.339 |
rubbish | -11.181 |
vitro | -10.923 |
Serie | -10.327 |
Token | wish |
Token ID | 4601 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
companions | +7.431 |
unborn | +7.382 |
grandchildren | +7.316 |
newfound | +7.216 |
awakened | +7.205 |
Neg logit contributions | |
libel | -7.464 |
offensive | -6.372 |
rubbish | -6.297 |
Serie | -6.048 |
vitro | -5.886 |
Token | you |
Token ID | 345 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
companions | +17.732 |
grandchildren | +17.613 |
unborn | +17.464 |
survivors | +17.339 |
blessings | +16.991 |
Neg logit contributions | |
libel | -15.317 |
offensive | -13.659 |
rubbish | -12.975 |
ictionary | -12.836 |
vitro | -12.749 |
Token | the |
Token ID | 262 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
blessings | +27.884 |
companions | +27.720 |
grandchildren | +27.436 |
newfound | +26.636 |
enduring | +26.302 |
Neg logit contributions | |
libel | -19.925 |
offensive | -15.714 |
rubbish | -15.699 |
vitro | -15.547 |
ograph | -15.332 |
Token | best |
Token ID | 1266 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
blessings | +28.969 |
companions | +28.134 |
grandchildren | +27.134 |
enduring | +26.935 |
newfound | +26.799 |
Neg logit contributions | |
libel | -19.852 |
offensive | -16.748 |
rubbish | -16.192 |
ictionary | -16.111 |
vitro | -16.024 |
Token | and |
Token ID | 290 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
grandchildren | +15.461 |
unborn | +15.459 |
companions | +15.381 |
blessings | +15.034 |
remaining | +14.696 |
Neg logit contributions | |
libel | -15.503 |
rubbish | -13.212 |
offensive | -12.935 |
vitro | -12.553 |
advert | -12.194 |
Token | the |
Token ID | 262 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
blessings | +23.966 |
grandchildren | +23.852 |
companions | +23.799 |
unborn | +23.244 |
newfound | +23.078 |
Neg logit contributions | |
libel | -17.540 |
offensive | -15.212 |
ictionary | -14.692 |
vitro | -14.665 |
rubbish | -14.601 |
Token | best |
Token ID | 1266 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
blessings | +31.912 |
companions | +30.953 |
grandchildren | +30.415 |
unborn | +30.033 |
newfound | +29.645 |
Neg logit contributions | |
libel | -16.923 |
offensive | -14.364 |
rubbish | -13.968 |
ictionary | -13.863 |
Anyway | -13.808 |
Token | of |
Token ID | 286 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
grandchildren | +17.917 |
blessings | +17.855 |
companions | +17.652 |
unborn | +17.461 |
arrival | +16.740 |
Neg logit contributions | |
libel | -15.507 |
rubbish | -13.057 |
offensive | -12.767 |
vitro | -12.419 |
Serie | -12.233 |
Token | luck |
Token ID | 8458 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
newfound | +18.659 |
grandchildren | +18.604 |
companions | +18.514 |
blessings | +18.458 |
enduring | +18.383 |
Neg logit contributions | |
libel | -15.573 |
rubbish | -13.106 |
offensive | -12.567 |
advert | -12.292 |
Serie | -12.284 |
Token | in |
Token ID | 287 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
unborn | +17.019 |
companions | +16.575 |
grandchildren | +16.430 |
enduring | +16.367 |
remaining | +16.135 |
Neg logit contributions | |
libel | -16.528 |
rubbish | -14.523 |
offensive | -13.880 |
vitro | -13.284 |
Serie | -13.143 |
Token | the |
Token ID | 262 |
Feature activation | +2.07e+00 |
Pos logit contributions | |
unborn | +15.224 |
newfound | +15.177 |
remaining | +15.160 |
enduring | +15.126 |
awakening | +14.975 |
Neg logit contributions | |
libel | -14.380 |
rubbish | -12.270 |
ictionary | -11.721 |
ograph | -11.656 |
offensive | -11.646 |
Token | ö |
Token ID | 9101 |
Feature activation | +3.40e-01 |
Pos logit contributions | |
companions | +11.604 |
newfound | +11.356 |
unborn | +11.252 |
awakened | +10.977 |
grandchildren | +10.976 |
Neg logit contributions | |
libel | -11.360 |
rubbish | -8.821 |
tabloid | -8.581 |
Serie | -8.367 |
offensive | -8.277 |
Token | ng |
Token ID | 782 |
Feature activation | +2.26e-01 |
Pos logit contributions | |
companions | +4.305 |
grandchildren | +4.240 |
newfound | +4.204 |
unborn | +4.199 |
awakened | +4.049 |
Neg logit contributions | |
libel | -3.977 |
rubbish | -3.215 |
offensive | -3.039 |
tabloid | -2.996 |
Serie | -2.987 |
Token | ke |
Token ID | 365 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
companions | +3.078 |
newfound | +2.998 |
grandchildren | +2.992 |
unborn | +2.987 |
awakening | +2.895 |
Neg logit contributions | |
libel | -2.575 |
rubbish | -2.052 |
offensive | -1.962 |
advert | -1.910 |
punt | -1.888 |
Token | ( |
Token ID | 357 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
companions | +2.111 |
unborn | +2.071 |
newfound | +2.064 |
grandchildren | +2.063 |
enduring | +1.984 |
Neg logit contributions | |
libel | -1.892 |
rubbish | -1.541 |
offensive | -1.513 |
advert | -1.430 |
vitro | -1.409 |
Token | meaning |
Token ID | 24815 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
companions | +18.593 |
blessings | +18.467 |
grandchildren | +18.358 |
newfound | +18.323 |
unborn | +18.176 |
Neg logit contributions | |
libel | -14.955 |
rubbish | -11.679 |
advert | -11.660 |
tabloid | -11.559 |
vitro | -11.331 |
Token | " |
Token ID | 366 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
companions | +28.370 |
unborn | +28.277 |
blessings | +28.257 |
grandchildren | +27.879 |
newfound | +27.157 |
Neg logit contributions | |
libel | -16.147 |
offensive | -12.846 |
vitro | -12.314 |
advert | -11.963 |
Anyway | -11.783 |
Token | et |
Token ID | 316 |
Feature activation | +9.04e-01 |
Pos logit contributions | |
companions | +26.811 |
blessings | +26.606 |
unborn | +26.567 |
grandchildren | +26.284 |
newfound | +25.737 |
Neg logit contributions | |
libel | -18.473 |
tabloid | -14.828 |
Serie | -14.559 |
advert | -14.491 |
punt | -14.037 |
Token | ernal |
Token ID | 35220 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
companions | +8.311 |
unborn | +7.876 |
newfound | +7.542 |
blessings | +7.507 |
grandchildren | +7.457 |
Neg logit contributions | |
libel | -12.335 |
Serie | -10.170 |
offensive | -10.075 |
rubbish | -10.034 |
advert | -9.994 |
Token | " |
Token ID | 1 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
companions | +24.690 |
blessings | +24.088 |
unborn | +24.067 |
awakening | +23.746 |
grandchildren | +23.487 |
Neg logit contributions | |
libel | -15.985 |
offensive | -13.755 |
Serie | -12.935 |
vitro | -12.396 |
pub | -12.173 |
Token | in |
Token ID | 287 |
Feature activation | -7.87e-01 |
Pos logit contributions | |
companions | +12.050 |
unborn | +11.742 |
grandchildren | +11.491 |
blessings | +11.444 |
newfound | +11.421 |
Neg logit contributions | |
libel | -10.731 |
offensive | -8.917 |
rubbish | -8.572 |
vitro | -8.421 |
Serie | -8.391 |
Token | the |
Token ID | 262 |
Feature activation | +7.30e-02 |
Pos logit contributions | |
libel | +9.132 |
rubbish | +7.447 |
offensive | +7.265 |
Serie | +6.946 |
advert | +6.926 |
Neg logit contributions | |
companions | -9.991 |
newfound | -9.863 |
unborn | -9.847 |
grandchildren | -9.723 |
caregivers | -9.524 |
Token | � |
Token ID | 447 |
Feature activation | -6.42e-01 |
Pos logit contributions | |
companions | +10.010 |
newfound | +9.692 |
survivors | +9.624 |
unborn | +9.572 |
grandchildren | +9.489 |
Neg logit contributions | |
libel | -8.724 |
rubbish | -6.982 |
offensive | -6.962 |
punt | -6.591 |
ograph | -6.576 |
Token | � |
Token ID | 247 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
libel | +7.291 |
rubbish | +5.876 |
offensive | +5.709 |
advert | +5.444 |
Serie | +5.416 |
Neg logit contributions | |
companions | -8.818 |
newfound | -8.662 |
unborn | -8.661 |
grandchildren | -8.552 |
caregivers | -8.327 |
Token | s |
Token ID | 82 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
companions | +12.724 |
newfound | +12.592 |
grandchildren | +12.355 |
unborn | +12.315 |
survivors | +12.227 |
Neg logit contributions | |
libel | -11.199 |
rubbish | -8.948 |
punt | -8.651 |
offensive | -8.456 |
advert | -8.269 |
Token | search |
Token ID | 2989 |
Feature activation | +5.74e-01 |
Pos logit contributions | |
newfound | +26.557 |
companions | +25.898 |
unborn | +25.509 |
arrival | +25.258 |
enduring | +24.827 |
Neg logit contributions | |
libel | -14.810 |
ograph | -11.745 |
offensive | -11.111 |
England | -10.812 |
pub | -10.812 |
Token | for |
Token ID | 329 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
companions | +7.636 |
newfound | +7.220 |
unborn | +7.036 |
survivors | +6.999 |
grandchildren | +6.942 |
Neg logit contributions | |
libel | -6.468 |
rubbish | -5.204 |
offensive | -5.014 |
Serie | -4.916 |
punt | -4.782 |
Token | their |
Token ID | 511 |
Feature activation | +3.22e+00 |
Pos logit contributions | |
companions | +24.241 |
newfound | +23.428 |
survivors | +23.145 |
unborn | +22.184 |
grandchildren | +21.968 |
Neg logit contributions | |
libel | -16.056 |
punt | -13.140 |
ograph | -12.819 |
offensive | -12.532 |
rubbish | -12.238 |
Token | lost |
Token ID | 2626 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
newfound | +31.385 |
companions | +30.937 |
unborn | +30.006 |
remaining | +29.271 |
survivors | +29.166 |
Neg logit contributions | |
libel | -17.101 |
ograph | -13.644 |
offensive | -13.578 |
Anyway | -12.738 |
vitro | -12.651 |
Token | leader |
Token ID | 3554 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
companions | +27.526 |
newfound | +25.694 |
unborn | +25.531 |
souls | +25.245 |
survivors | +25.180 |
Neg logit contributions | |
libel | -16.240 |
offensive | -13.963 |
ograph | -13.783 |
ictionary | -13.069 |
rubbish | -12.701 |
Token | O |
Token ID | 440 |
Feature activation | +6.71e-01 |
Pos logit contributions | |
companions | +13.904 |
unborn | +13.571 |
newfound | +13.545 |
awakening | +13.281 |
survivors | +13.098 |
Neg logit contributions | |
libel | -12.815 |
rubbish | -10.375 |
punt | -10.135 |
offensive | -10.122 |
vitro | -9.777 |
Token | der |
Token ID | 1082 |
Feature activation | +7.03e-01 |
Pos logit contributions | |
companions | +9.714 |
newfound | +9.567 |
unborn | +9.456 |
grandchildren | +9.395 |
blessings | +9.117 |
Neg logit contributions | |
libel | -6.396 |
rubbish | -4.912 |
offensive | -4.738 |
punt | -4.684 |
advert | -4.623 |
Token | us |
Token ID | 385 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
companions | +7.522 |
newfound | +7.387 |
grandchildren | +7.315 |
unborn | +7.171 |
survivors | +7.040 |
Neg logit contributions | |
libel | -9.414 |
rubbish | -7.889 |
offensive | -7.569 |
advert | -7.385 |
punt | -7.336 |
Token | our |
Token ID | 674 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
unborn | +12.849 |
grandchildren | +12.557 |
companions | +12.486 |
newfound | +12.277 |
survivors | +12.217 |
Neg logit contributions | |
libel | -11.650 |
offensive | -9.533 |
rubbish | -9.510 |
ograph | -9.348 |
Serie | -9.141 |
Token | nation |
Token ID | 3277 |
Feature activation | +9.10e-01 |
Pos logit contributions | |
grandchildren | +24.130 |
unborn | +23.669 |
newfound | +23.406 |
companions | +23.094 |
awakening | +22.995 |
Neg logit contributions | |
libel | -17.518 |
offensive | -15.274 |
ograph | -14.849 |
Serie | -14.354 |
ictionary | -14.341 |
Token | . |
Token ID | 13 |
Feature activation | +7.18e-01 |
Pos logit contributions | |
unborn | +10.288 |
grandchildren | +10.177 |
companions | +10.089 |
enduring | +9.879 |
newfound | +9.875 |
Neg logit contributions | |
libel | -10.430 |
rubbish | -8.890 |
offensive | -8.574 |
Serie | -8.369 |
punt | -8.172 |
Token | I |
Token ID | 314 |
Feature activation | +6.32e-01 |
Pos logit contributions | |
grandchildren | +7.468 |
unborn | +7.430 |
companions | +7.385 |
survivors | +7.144 |
newfound | +7.093 |
Neg logit contributions | |
libel | -9.324 |
rubbish | -8.033 |
offensive | -7.810 |
vitro | -7.551 |
advert | -7.374 |
Token | wish |
Token ID | 4601 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
companions | +7.431 |
unborn | +7.382 |
grandchildren | +7.316 |
newfound | +7.216 |
awakened | +7.205 |
Neg logit contributions | |
libel | -7.464 |
offensive | -6.372 |
rubbish | -6.297 |
Serie | -6.048 |
vitro | -5.886 |
Token | you |
Token ID | 345 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
companions | +17.732 |
grandchildren | +17.613 |
unborn | +17.464 |
survivors | +17.339 |
blessings | +16.991 |
Neg logit contributions | |
libel | -15.317 |
offensive | -13.659 |
rubbish | -12.975 |
ictionary | -12.836 |
vitro | -12.749 |
Token | the |
Token ID | 262 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
blessings | +27.884 |
companions | +27.720 |
grandchildren | +27.436 |
newfound | +26.636 |
enduring | +26.302 |
Neg logit contributions | |
libel | -19.925 |
offensive | -15.714 |
rubbish | -15.699 |
vitro | -15.547 |
ograph | -15.332 |
Token | best |
Token ID | 1266 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
blessings | +28.969 |
companions | +28.134 |
grandchildren | +27.134 |
enduring | +26.935 |
newfound | +26.799 |
Neg logit contributions | |
libel | -19.852 |
offensive | -16.748 |
rubbish | -16.192 |
ictionary | -16.111 |
vitro | -16.024 |
Token | and |
Token ID | 290 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
grandchildren | +15.461 |
unborn | +15.459 |
companions | +15.381 |
blessings | +15.034 |
remaining | +14.696 |
Neg logit contributions | |
libel | -15.503 |
rubbish | -13.212 |
offensive | -12.935 |
vitro | -12.553 |
advert | -12.194 |
Token | the |
Token ID | 262 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
blessings | +23.966 |
grandchildren | +23.852 |
companions | +23.799 |
unborn | +23.244 |
newfound | +23.078 |
Neg logit contributions | |
libel | -17.540 |
offensive | -15.212 |
ictionary | -14.692 |
vitro | -14.665 |
rubbish | -14.601 |
Token | best |
Token ID | 1266 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
blessings | +31.912 |
companions | +30.953 |
grandchildren | +30.415 |
unborn | +30.033 |
newfound | +29.645 |
Neg logit contributions | |
libel | -16.923 |
offensive | -14.364 |
rubbish | -13.968 |
ictionary | -13.863 |
Anyway | -13.808 |
Token | one |
Token ID | 530 |
Feature activation | +7.11e-01 |
Pos logit contributions | |
companions | +17.957 |
awakening | +17.744 |
unborn | +17.728 |
blessings | +17.188 |
enduring | +17.180 |
Neg logit contributions | |
libel | -15.576 |
offensive | -12.651 |
ictionary | -12.189 |
vitro | -12.138 |
rubbish | -11.967 |
Token | must |
Token ID | 1276 |
Feature activation | +9.67e-01 |
Pos logit contributions | |
companions | +8.095 |
awakening | +7.819 |
newfound | +7.808 |
unborn | +7.768 |
awakened | +7.679 |
Neg logit contributions | |
libel | -8.764 |
offensive | -7.403 |
rubbish | -7.133 |
vitro | -6.907 |
ograph | -6.904 |
Token | have |
Token ID | 423 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
companions | +11.396 |
unborn | +10.996 |
awakened | +10.788 |
awakening | +10.771 |
grandchildren | +10.762 |
Neg logit contributions | |
libel | -10.565 |
offensive | -8.903 |
Serie | -8.569 |
rubbish | -8.273 |
England | -8.156 |
Token | faith |
Token ID | 4562 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
companions | +18.639 |
newfound | +17.902 |
awakening | +17.863 |
awakened | +17.779 |
grandchildren | +17.697 |
Neg logit contributions | |
libel | -16.024 |
offensive | -13.043 |
ograph | -12.297 |
ictionary | -12.131 |
rubbish | -12.097 |
Token | in |
Token ID | 287 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
companions | +14.228 |
unborn | +13.666 |
newfound | +13.602 |
awakening | +13.583 |
remaining | +13.517 |
Neg logit contributions | |
libel | -15.359 |
offensive | -12.398 |
rubbish | -12.368 |
advert | -11.874 |
Serie | -11.857 |
Token | our |
Token ID | 674 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
companions | +20.260 |
awakening | +19.883 |
unborn | +19.472 |
blessings | +19.396 |
souls | +19.339 |
Neg logit contributions | |
libel | -15.914 |
offensive | -12.755 |
ictionary | -12.662 |
ograph | -12.578 |
rubbish | -12.092 |
Token | HS |
Token ID | 18070 |
Feature activation | +1.98e+00 |
Pos logit contributions | |
companions | +30.309 |
awakening | +29.144 |
newfound | +29.049 |
arrival | +28.956 |
souls | +28.883 |
Neg logit contributions | |
libel | -18.632 |
ictionary | -15.929 |
offensive | -15.729 |
ograph | -15.541 |
England | -14.505 |
Token | that |
Token ID | 326 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
companions | +20.133 |
awakening | +19.193 |
arrival | +19.155 |
grandchildren | +18.895 |
blessings | +18.762 |
Neg logit contributions | |
libel | -17.527 |
rubbish | -14.125 |
offensive | -13.728 |
vitro | -13.427 |
Serie | -13.024 |
Token | they |
Token ID | 484 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
companions | +26.715 |
awakening | +26.251 |
blessings | +25.927 |
arrival | +25.860 |
unborn | +25.721 |
Neg logit contributions | |
libel | -20.089 |
ictionary | -16.766 |
offensive | -15.888 |
ograph | -15.378 |
redit | -14.917 |
Token | will |
Token ID | 481 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
awakened | +17.178 |
unborn | +17.098 |
grandchildren | +16.960 |
companions | +16.882 |
arrival | +16.559 |
Neg logit contributions | |
libel | -19.218 |
offensive | -16.559 |
Serie | -15.695 |
rubbish | -15.550 |
Yugoslavia | -14.834 |
Token | arrange |
Token ID | 21674 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
companions | +18.482 |
arrival | +17.997 |
awakening | +17.763 |
awakened | +17.637 |
enduring | +17.634 |
Neg logit contributions | |
libel | -17.980 |
offensive | -15.478 |
Serie | -14.244 |
ictionary | -13.974 |
football | -13.913 |
Token | American |
Token ID | 1605 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
enduring | +22.950 |
unborn | +22.480 |
awakened | +21.947 |
awakening | +21.781 |
companions | +21.069 |
Neg logit contributions | |
libel | -18.544 |
rubbish | -14.894 |
pub | -14.622 |
vitro | -14.372 |
punt | -14.279 |
Token | hero |
Token ID | 4293 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
companions | +14.811 |
unborn | +14.659 |
enduring | +14.421 |
grandchildren | +14.347 |
awakening | +14.345 |
Neg logit contributions | |
libel | -15.848 |
offensive | -13.833 |
rubbish | -13.488 |
vitro | -12.816 |
advert | -12.747 |
Token | & |
Token ID | 1222 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
unborn | +15.055 |
companions | +14.520 |
awakened | +14.502 |
enduring | +14.496 |
awakening | +14.330 |
Neg logit contributions | |
libel | -16.122 |
rubbish | -13.722 |
offensive | -13.190 |
punt | -13.009 |
vitro | -12.735 |
Token | one |
Token ID | 530 |
Feature activation | +6.31e-01 |
Pos logit contributions | |
enduring | +21.494 |
companions | +21.264 |
unborn | +21.212 |
newfound | +20.739 |
survivors | +20.686 |
Neg logit contributions | |
libel | -15.329 |
rubbish | -12.676 |
vitro | -12.013 |
offensive | -11.876 |
Serie | -11.598 |
Token | of |
Token ID | 286 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
unborn | +7.723 |
companions | +7.683 |
newfound | +7.468 |
enduring | +7.461 |
grandchildren | +7.435 |
Neg logit contributions | |
libel | -7.161 |
offensive | -5.905 |
rubbish | -5.881 |
vitro | -5.574 |
advert | -5.511 |
Token | the |
Token ID | 262 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
companions | +13.438 |
unborn | +13.111 |
enduring | +13.057 |
grandchildren | +12.976 |
survivors | +12.951 |
Neg logit contributions | |
libel | -9.487 |
offensive | -7.664 |
rubbish | -7.663 |
advert | -7.388 |
ograph | -7.122 |
Token | brav |
Token ID | 49025 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
companions | +29.369 |
survivors | +28.521 |
enduring | +28.322 |
blessings | +28.226 |
grandchildren | +28.076 |
Neg logit contributions | |
libel | -18.079 |
ictionary | -14.916 |
offensive | -14.862 |
Anyway | -14.478 |
ograph | -14.367 |
Token | est |
Token ID | 395 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
companions | +8.812 |
unborn | +7.965 |
survivors | +7.931 |
grandchildren | +7.893 |
souls | +7.828 |
Neg logit contributions | |
libel | -17.905 |
rubbish | -15.144 |
vitro | -15.050 |
offensive | -14.825 |
punt | -14.778 |
Token | fighters |
Token ID | 8486 |
Feature activation | +6.35e-01 |
Pos logit contributions | |
companions | +15.925 |
survivors | +15.312 |
unborn | +15.155 |
grandchildren | +14.754 |
blessings | +14.644 |
Neg logit contributions | |
libel | -13.274 |
offensive | -11.504 |
rubbish | -11.265 |
vitro | -11.004 |
ictionary | -10.888 |
Token | I |
Token ID | 314 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
companions | +8.196 |
unborn | +8.125 |
survivors | +7.916 |
grandchildren | +7.844 |
enduring | +7.786 |
Neg logit contributions | |
libel | -6.761 |
rubbish | -5.747 |
offensive | -5.550 |
vitro | -5.224 |
advert | -5.173 |
Token | � |
Token ID | 447 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
companions | +2.561 |
unborn | +2.523 |
newfound | +2.477 |
grandchildren | +2.461 |
awakened | +2.418 |
Neg logit contributions | |
libel | -2.472 |
rubbish | -2.097 |
offensive | -2.037 |
Serie | -1.966 |
vitro | -1.929 |
Token | Jedi |
Token ID | 16147 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
companions | +2.922 |
newfound | +2.892 |
unborn | +2.883 |
grandchildren | +2.789 |
blessings | +2.773 |
Neg logit contributions | |
libel | -2.586 |
rubbish | -2.103 |
offensive | -2.034 |
Serie | -1.991 |
vitro | -1.983 |
Token | acts |
Token ID | 6529 |
Feature activation | -6.71e-02 |
Pos logit contributions | |
companions | +0.335 |
unborn | +0.330 |
newfound | +0.327 |
grandchildren | +0.319 |
awakening | +0.316 |
Neg logit contributions | |
libel | -0.398 |
rubbish | -0.334 |
offensive | -0.329 |
Serie | -0.317 |
vitro | -0.314 |
Token | self |
Token ID | 2116 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
libel | +0.793 |
rubbish | +0.650 |
offensive | +0.639 |
Serie | +0.615 |
vitro | +0.612 |
Neg logit contributions | |
companions | -0.876 |
unborn | -0.871 |
newfound | -0.863 |
grandchildren | -0.843 |
awakening | -0.834 |
Token | lessly |
Token ID | 8613 |
Feature activation | +7.96e-01 |
Pos logit contributions | |
companions | +6.184 |
unborn | +6.184 |
newfound | +6.147 |
awakened | +6.028 |
awakening | +6.027 |
Neg logit contributions | |
libel | -4.790 |
rubbish | -3.862 |
offensive | -3.679 |
punt | -3.620 |
vitro | -3.603 |
Token | for |
Token ID | 329 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
unborn | +9.335 |
companions | +9.207 |
newfound | +9.047 |
awakening | +9.038 |
enduring | +8.920 |
Neg logit contributions | |
libel | -8.867 |
rubbish | -7.300 |
offensive | -7.212 |
vitro | -7.030 |
punt | -6.941 |
Token | the |
Token ID | 262 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
unborn | +20.482 |
companions | +20.365 |
awakening | +20.158 |
survivors | +19.721 |
blessings | +19.648 |
Neg logit contributions | |
libel | -11.878 |
ograph | -9.977 |
rubbish | -9.903 |
vitro | -9.748 |
ictionary | -9.325 |
Token | common |
Token ID | 2219 |
Feature activation | +2.07e+00 |
Pos logit contributions | |
unborn | +32.334 |
companions | +31.369 |
awakening | +31.145 |
blessings | +30.598 |
survivors | +30.278 |
Neg logit contributions | |
libel | -13.977 |
ograph | -12.564 |
ictionary | -11.496 |
Anyway | -11.125 |
offensive | -10.933 |
Token | man |
Token ID | 582 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
unborn | +21.656 |
companions | +21.329 |
blessings | +20.694 |
awakening | +20.630 |
enduring | +20.032 |
Neg logit contributions | |
libel | -16.406 |
ograph | -13.516 |
rubbish | -13.150 |
vitro | -12.941 |
offensive | -12.797 |
Token | - |
Token ID | 12 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
unborn | +19.633 |
companions | +18.799 |
awakening | +18.768 |
grandchildren | +18.416 |
survivors | +18.345 |
Neg logit contributions | |
libel | -14.612 |
rubbish | -12.061 |
offensive | -11.819 |
punt | -11.645 |
Serie | -11.334 |
Token | NOT |
Token ID | 11929 |
Feature activation | -3.77e-01 |
Pos logit contributions | |
unborn | +16.259 |
companions | +15.938 |
newfound | +15.668 |
awakening | +15.418 |
grandchildren | +15.356 |
Neg logit contributions | |
libel | -12.626 |
rubbish | -10.267 |
Serie | -9.583 |
tabloid | -9.556 |
punt | -9.465 |
Token | lie |
Token ID | 6486 |
Feature activation | +4.51e-02 |
Pos logit contributions | |
libel | +4.851 |
rubbish | +4.026 |
offensive | +3.927 |
advert | +3.767 |
Serie | +3.763 |
Neg logit contributions | |
companions | -4.613 |
unborn | -4.529 |
newfound | -4.516 |
grandchildren | -4.462 |
awakening | -4.327 |
Token | ultimately |
Token ID | 6165 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
companions | +9.641 |
unborn | +9.496 |
grandchildren | +9.419 |
newfound | +9.242 |
enduring | +9.131 |
Neg logit contributions | |
libel | -8.359 |
offensive | -6.966 |
rubbish | -6.902 |
Serie | -6.526 |
vitro | -6.520 |
Token | , |
Token ID | 11 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
unborn | +13.916 |
companions | +13.455 |
newfound | +13.000 |
grandchildren | +12.930 |
enduring | +12.909 |
Neg logit contributions | |
libel | -16.054 |
rubbish | -13.569 |
offensive | -13.229 |
Serie | -13.192 |
tabloid | -13.076 |
Token | to |
Token ID | 284 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
unborn | +15.408 |
grandchildren | +14.978 |
companions | +14.970 |
newfound | +14.726 |
blessings | +14.640 |
Neg logit contributions | |
libel | -14.358 |
rubbish | -12.156 |
advert | -11.811 |
punt | -11.744 |
offensive | -11.721 |
Token | deny |
Token ID | 10129 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
companions | +5.158 |
unborn | +5.144 |
grandchildren | +5.097 |
newfound | +5.034 |
awakening | +4.916 |
Neg logit contributions | |
libel | -5.363 |
offensive | -4.608 |
rubbish | -4.440 |
Serie | -4.348 |
vitro | -4.248 |
Token | us |
Token ID | 514 |
Feature activation | +2.25e+00 |
Pos logit contributions | |
unborn | +16.951 |
survivors | +16.525 |
grandchildren | +16.297 |
companions | +16.286 |
enduring | +16.056 |
Neg logit contributions | |
libel | -13.900 |
rubbish | -11.575 |
offensive | -11.509 |
advert | -11.121 |
punt | -10.951 |
Token | our |
Token ID | 674 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
grandchildren | +22.971 |
companions | +22.829 |
unborn | +22.817 |
newfound | +22.670 |
enduring | +22.606 |
Neg logit contributions | |
libel | -16.393 |
offensive | -13.888 |
rubbish | -13.620 |
vitro | -13.138 |
ograph | -13.056 |
Token | future |
Token ID | 2003 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
grandchildren | +30.772 |
unborn | +30.332 |
newfound | +30.052 |
blessings | +29.217 |
companions | +29.196 |
Neg logit contributions | |
libel | -16.293 |
offensive | -14.890 |
ograph | -14.367 |
Anyway | -13.235 |
pub | -13.180 |
Token | . |
Token ID | 13 |
Feature activation | +3.84e-01 |
Pos logit contributions | |
companions | +16.218 |
grandchildren | +16.045 |
unborn | +15.504 |
survivors | +15.210 |
blessings | +15.160 |
Neg logit contributions | |
libel | -14.744 |
rubbish | -12.583 |
offensive | -12.574 |
punt | -11.910 |
advert | -11.778 |
Token |
|
Token ID | 198 |
Feature activation | +3.61e-01 |
Pos logit contributions | |
unborn | +3.941 |
companions | +3.868 |
grandchildren | +3.867 |
newfound | +3.735 |
survivors | +3.717 |
Neg logit contributions | |
libel | -5.377 |
rubbish | -4.599 |
offensive | -4.442 |
vitro | -4.341 |
advert | -4.321 |
Token |
|
Token ID | 198 |
Feature activation | +4.69e-02 |
Pos logit contributions | |
companions | +4.143 |
unborn | +4.048 |
newfound | +4.042 |
grandchildren | +4.013 |
blessings | +3.869 |
Neg logit contributions | |
libel | -4.848 |
rubbish | -4.058 |
offensive | -3.929 |
advert | -3.796 |
vitro | -3.765 |
Token | A |
Token ID | 32 |
Feature activation | +8.30e-02 |
Pos logit contributions | |
companions | +0.595 |
unborn | +0.587 |
newfound | +0.584 |
grandchildren | +0.581 |
blessings | +0.565 |
Neg logit contributions | |
libel | -0.578 |
rubbish | -0.477 |
offensive | -0.448 |
advert | -0.446 |
punt | -0.441 |
Token | une |
Token ID | 1726 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
newfound | +10.613 |
companions | +10.529 |
grandchildren | +10.351 |
unborn | +10.217 |
awakening | +10.056 |
Neg logit contributions | |
libel | -21.301 |
rubbish | -18.220 |
Serie | -17.332 |
tabloid | -17.298 |
punt | -17.212 |
Token | Mik |
Token ID | 17722 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
awakening | +12.845 |
companions | +12.567 |
newfound | +12.441 |
enduring | +12.374 |
unborn | +12.279 |
Neg logit contributions | |
libel | -16.269 |
rubbish | -13.794 |
offensive | -13.626 |
vitro | -13.034 |
England | -12.712 |
Token | u |
Token ID | 84 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
grandchildren | +11.765 |
companions | +11.747 |
newfound | +11.539 |
unborn | +11.443 |
awakening | +11.075 |
Neg logit contributions | |
libel | -15.112 |
rubbish | -12.571 |
Serie | -12.042 |
tabloid | -11.980 |
offensive | -11.924 |
Token | � |
Token ID | 447 |
Feature activation | -4.14e-01 |
Pos logit contributions | |
awakening | +21.522 |
companions | +20.603 |
awakened | +20.492 |
enduring | +20.441 |
unborn | +20.221 |
Neg logit contributions | |
libel | -17.460 |
rubbish | -14.137 |
offensive | -13.894 |
vitro | -13.164 |
redit | -12.650 |
Token | � |
Token ID | 247 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
libel | +4.363 |
rubbish | +3.448 |
offensive | +3.330 |
advert | +3.160 |
Serie | +3.149 |
Neg logit contributions | |
companions | -6.075 |
unborn | -5.971 |
newfound | -5.970 |
grandchildren | -5.893 |
awakening | -5.764 |
Token | s |
Token ID | 82 |
Feature activation | +3.13e+00 |
Pos logit contributions | |
awakening | +15.697 |
companions | +15.329 |
grandchildren | +15.170 |
newfound | +15.154 |
arrival | +15.137 |
Neg logit contributions | |
libel | -15.918 |
rubbish | -13.150 |
offensive | -12.348 |
vitro | -12.044 |
punt | -11.825 |
Token | � |
Token ID | 564 |
Feature activation | +8.05e-02 |
Pos logit contributions | |
awakening | +29.543 |
arrival | +29.464 |
newfound | +29.364 |
companions | +28.982 |
unborn | +28.376 |
Neg logit contributions | |
libel | -17.286 |
England | -13.753 |
offensive | -13.644 |
rubbish | -13.341 |
redit | -12.915 |
Token | � |
Token ID | 250 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
companions | +1.209 |
newfound | +1.193 |
unborn | +1.184 |
grandchildren | +1.165 |
awakening | +1.151 |
Neg logit contributions | |
libel | -0.819 |
rubbish | -0.641 |
offensive | -0.605 |
advert | -0.587 |
Serie | -0.581 |
Token | loss |
Token ID | 22462 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
companions | +17.818 |
awakening | +17.723 |
newfound | +17.546 |
grandchildren | +17.380 |
arrival | +17.354 |
Neg logit contributions | |
libel | -15.771 |
rubbish | -12.359 |
advert | -11.449 |
tabloid | -11.351 |
punt | -11.261 |
Token | of |
Token ID | 286 |
Feature activation | +2.28e+00 |
Pos logit contributions | |
companions | +15.537 |
awakening | +15.531 |
unborn | +15.357 |
newfound | +14.960 |
remaining | +14.875 |
Neg logit contributions | |
libel | -13.828 |
rubbish | -11.922 |
offensive | -11.008 |
Serie | -10.607 |
England | -10.498 |
Token | song |
Token ID | 3496 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
companions | +25.143 |
newfound | +23.659 |
unborn | +23.573 |
awakening | +23.530 |
grandchildren | +23.391 |
Neg logit contributions | |
libel | -15.477 |
rubbish | -12.660 |
England | -12.493 |
offensive | -12.429 |
ograph | -12.165 |
Token | Unt |
Token ID | 26970 |
Feature activation | +8.04e-01 |
Pos logit contributions | |
newfound | +15.067 |
unborn | +14.898 |
companions | +14.523 |
remaining | +14.486 |
followers | +14.304 |
Neg logit contributions | |
libel | -17.275 |
offensive | -14.373 |
rubbish | -14.218 |
advert | -13.015 |
Yugoslavia | -12.901 |
Token | app |
Token ID | 1324 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
companions | +8.229 |
newfound | +8.082 |
unborn | +8.023 |
grandchildren | +7.848 |
awakened | +7.619 |
Neg logit contributions | |
libel | -11.183 |
rubbish | -9.270 |
Serie | -8.839 |
offensive | -8.794 |
punt | -8.714 |
Token | d |
Token ID | 67 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
companions | +5.367 |
newfound | +5.276 |
unborn | +5.208 |
grandchildren | +5.156 |
enduring | +5.039 |
Neg logit contributions | |
libel | -5.430 |
rubbish | -4.383 |
offensive | -4.246 |
Serie | -4.087 |
vitro | -4.064 |
Token | user |
Token ID | 2836 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
newfound | +15.898 |
companions | +15.675 |
followers | +15.575 |
arrival | +15.215 |
unborn | +15.189 |
Neg logit contributions | |
libel | -17.362 |
offensive | -14.267 |
rubbish | -14.042 |
vitro | -12.782 |
Yugoslavia | -12.695 |
Token | for |
Token ID | 329 |
Feature activation | +2.89e+00 |
Pos logit contributions | |
companions | +15.584 |
enduring | +15.257 |
newfound | +15.173 |
unborn | +15.074 |
remaining | +14.834 |
Neg logit contributions | |
libel | -17.360 |
offensive | -14.633 |
rubbish | -14.458 |
vitro | -13.177 |
advert | -12.959 |
Token | your |
Token ID | 534 |
Feature activation | +3.09e+00 |
Pos logit contributions | |
enduring | +25.399 |
newfound | +24.602 |
companions | +24.563 |
remaining | +24.456 |
blessings | +24.431 |
Neg logit contributions | |
libel | -21.297 |
offensive | -17.034 |
rubbish | -16.576 |
ictionary | -16.394 |
redit | -16.159 |
Token | continued |
Token ID | 3767 |
Feature activation | +2.80e+00 |
Pos logit contributions | |
newfound | +27.758 |
blessings | +27.222 |
companions | +27.157 |
enduring | +26.847 |
arrival | +25.688 |
Neg logit contributions | |
libel | -21.369 |
offensive | -16.695 |
rubbish | -16.206 |
redit | -15.668 |
uphem | -15.372 |
Token | support |
Token ID | 1104 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
companions | +24.327 |
blessings | +23.995 |
enduring | +22.899 |
newfound | +22.861 |
followers | +22.390 |
Neg logit contributions | |
libel | -22.078 |
uphem | -17.621 |
offensive | -17.492 |
rubbish | -17.312 |
ograph | -17.199 |
Token | . |
Token ID | 13 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
companions | +14.311 |
unborn | +13.513 |
newfound | +13.433 |
enduring | +13.269 |
grandchildren | +13.202 |
Neg logit contributions | |
libel | -17.074 |
rubbish | -14.280 |
offensive | -13.679 |
vitro | -12.972 |
counterfe | -12.960 |
Token | We |
Token ID | 775 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
companions | +13.177 |
Guests | +13.004 |
unborn | +12.975 |
newfound | +12.881 |
grandchildren | +12.878 |
Neg logit contributions | |
libel | -15.989 |
rubbish | -13.313 |
offensive | -12.966 |
vitro | -12.459 |
advert | -12.117 |
Token | also |
Token ID | 635 |
Feature activation | +8.22e-01 |
Pos logit contributions | |
unborn | +11.621 |
companions | +11.467 |
grandchildren | +11.366 |
newfound | +11.287 |
awakened | +11.261 |
Neg logit contributions | |
libel | -12.448 |
offensive | -10.590 |
rubbish | -10.417 |
Serie | -9.946 |
vitro | -9.767 |
Token | have |
Token ID | 423 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
companions | +11.396 |
unborn | +10.996 |
awakened | +10.788 |
awakening | +10.771 |
grandchildren | +10.762 |
Neg logit contributions | |
libel | -10.565 |
offensive | -8.903 |
Serie | -8.569 |
rubbish | -8.273 |
England | -8.156 |
Token | faith |
Token ID | 4562 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
companions | +18.639 |
newfound | +17.902 |
awakening | +17.863 |
awakened | +17.779 |
grandchildren | +17.697 |
Neg logit contributions | |
libel | -16.024 |
offensive | -13.043 |
ograph | -12.297 |
ictionary | -12.131 |
rubbish | -12.097 |
Token | in |
Token ID | 287 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
companions | +14.228 |
unborn | +13.666 |
newfound | +13.602 |
awakening | +13.583 |
remaining | +13.517 |
Neg logit contributions | |
libel | -15.359 |
offensive | -12.398 |
rubbish | -12.368 |
advert | -11.874 |
Serie | -11.857 |
Token | our |
Token ID | 674 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
companions | +20.260 |
awakening | +19.883 |
unborn | +19.472 |
blessings | +19.396 |
souls | +19.339 |
Neg logit contributions | |
libel | -15.914 |
offensive | -12.755 |
ictionary | -12.662 |
ograph | -12.578 |
rubbish | -12.092 |
Token | HS |
Token ID | 18070 |
Feature activation | +1.98e+00 |
Pos logit contributions | |
companions | +30.309 |
awakening | +29.144 |
newfound | +29.049 |
arrival | +28.956 |
souls | +28.883 |
Neg logit contributions | |
libel | -18.632 |
ictionary | -15.929 |
offensive | -15.729 |
ograph | -15.541 |
England | -14.505 |
Token | that |
Token ID | 326 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
companions | +20.133 |
awakening | +19.193 |
arrival | +19.155 |
grandchildren | +18.895 |
blessings | +18.762 |
Neg logit contributions | |
libel | -17.527 |
rubbish | -14.125 |
offensive | -13.728 |
vitro | -13.427 |
Serie | -13.024 |
Token | they |
Token ID | 484 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
companions | +26.715 |
awakening | +26.251 |
blessings | +25.927 |
arrival | +25.860 |
unborn | +25.721 |
Neg logit contributions | |
libel | -20.089 |
ictionary | -16.766 |
offensive | -15.888 |
ograph | -15.378 |
redit | -14.917 |
Token | will |
Token ID | 481 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
awakened | +17.178 |
unborn | +17.098 |
grandchildren | +16.960 |
companions | +16.882 |
arrival | +16.559 |
Neg logit contributions | |
libel | -19.218 |
offensive | -16.559 |
Serie | -15.695 |
rubbish | -15.550 |
Yugoslavia | -14.834 |
Token | arrange |
Token ID | 21674 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
companions | +18.482 |
arrival | +17.997 |
awakening | +17.763 |
awakened | +17.637 |
enduring | +17.634 |
Neg logit contributions | |
libel | -17.980 |
offensive | -15.478 |
Serie | -14.244 |
ictionary | -13.974 |
football | -13.913 |
Token | the |
Token ID | 262 |
Feature activation | +2.25e+00 |
Pos logit contributions | |
companions | +15.152 |
blessings | +14.698 |
arrival | +14.307 |
grandchildren | +14.215 |
awakening | +14.175 |
Neg logit contributions | |
libel | -14.455 |
offensive | -11.911 |
rubbish | -10.990 |
vitro | -10.966 |
advert | -10.867 |
Token | perfect |
Token ID | 2818 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
arrival | +23.438 |
companions | +23.345 |
awakening | +22.952 |
blessings | +22.800 |
newfound | +22.523 |
Neg logit contributions | |
libel | -16.977 |
ictionary | -13.728 |
offensive | -13.650 |
England | -13.161 |
redit | -12.889 |
Token | we |
Token ID | 356 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
unborn | +21.844 |
grandchildren | +21.801 |
companions | +21.644 |
survivors | +21.611 |
enduring | +21.280 |
Neg logit contributions | |
libel | -16.624 |
rubbish | -13.511 |
offensive | -13.434 |
ictionary | -13.205 |
vitro | -12.529 |
Token | choose |
Token ID | 3853 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
unborn | +17.104 |
grandchildren | +17.077 |
survivors | +16.773 |
awakened | +16.625 |
companions | +16.578 |
Neg logit contributions | |
libel | -15.861 |
offensive | -14.005 |
rubbish | -13.117 |
vitro | -12.751 |
Serie | -12.749 |
Token | to |
Token ID | 284 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
companions | +18.906 |
grandchildren | +18.246 |
unborn | +18.236 |
survivors | +17.909 |
newfound | +17.879 |
Neg logit contributions | |
libel | -15.719 |
rubbish | -12.671 |
ograph | -12.463 |
offensive | -12.376 |
punt | -12.086 |
Token | focus |
Token ID | 2962 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
companions | +12.786 |
unborn | +12.765 |
grandchildren | +12.689 |
enduring | +12.329 |
newfound | +12.325 |
Neg logit contributions | |
libel | -12.205 |
offensive | -10.751 |
Serie | -9.916 |
rubbish | -9.590 |
vitro | -9.570 |
Token | on |
Token ID | 319 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
companions | +12.620 |
newfound | +12.538 |
unborn | +12.424 |
grandchildren | +12.332 |
enduring | +11.949 |
Neg logit contributions | |
libel | -13.638 |
offensive | -11.181 |
rubbish | -11.114 |
vitro | -10.567 |
Serie | -10.536 |
Token | the |
Token ID | 262 |
Feature activation | +3.04e+00 |
Pos logit contributions | |
grandchildren | +24.723 |
unborn | +24.695 |
companions | +24.549 |
survivors | +24.372 |
enduring | +23.800 |
Neg logit contributions | |
libel | -17.964 |
ictionary | -13.722 |
rubbish | -13.508 |
ograph | -13.496 |
offensive | -13.369 |
Token | time |
Token ID | 640 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
unborn | +29.609 |
companions | +29.462 |
grandchildren | +29.318 |
survivors | +28.936 |
enduring | +28.832 |
Neg logit contributions | |
libel | -17.123 |
ograph | -14.385 |
ictionary | -13.118 |
offensive | -13.100 |
redit | -13.075 |
Token | we |
Token ID | 356 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
unborn | +21.343 |
companions | +21.069 |
remaining | +21.024 |
grandchildren | +20.622 |
caregivers | +20.424 |
Neg logit contributions | |
libel | -17.752 |
rubbish | -14.456 |
offensive | -14.348 |
ograph | -13.488 |
ictionary | -13.424 |
Token | were |
Token ID | 547 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
unborn | +19.987 |
companions | +19.031 |
grandchildren | +19.003 |
awakened | +18.908 |
survivors | +18.852 |
Neg logit contributions | |
libel | -18.619 |
offensive | -16.014 |
rubbish | -15.429 |
Serie | -15.333 |
ograph | -14.895 |
Token | given |
Token ID | 1813 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
companions | +20.084 |
enduring | +19.640 |
awakened | +19.577 |
unborn | +19.540 |
survivors | +19.068 |
Neg logit contributions | |
libel | -17.112 |
offensive | -13.924 |
ictionary | -13.834 |
ograph | -13.485 |
Serie | -12.971 |
Token | to |
Token ID | 284 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
companions | +19.498 |
unborn | +19.361 |
newfound | +18.688 |
grandchildren | +18.548 |
caregivers | +18.434 |
Neg logit contributions | |
libel | -18.039 |
rubbish | -15.125 |
offensive | -14.585 |
ograph | -14.072 |
advert | -13.962 |
Token | . |
Token ID | 13 |
Feature activation | +6.69e-02 |
Pos logit contributions | |
companions | +9.747 |
unborn | +9.561 |
awakening | +9.309 |
grandchildren | +9.278 |
newfound | +9.203 |
Neg logit contributions | |
libel | -9.764 |
offensive | -7.950 |
rubbish | -7.845 |
Serie | -7.577 |
punt | -7.552 |
Token | Everything |
Token ID | 11391 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
companions | +0.888 |
unborn | +0.870 |
newfound | +0.865 |
grandchildren | +0.863 |
blessings | +0.837 |
Neg logit contributions | |
libel | -0.790 |
rubbish | -0.637 |
offensive | -0.627 |
vitro | -0.595 |
advert | -0.595 |
Token | will |
Token ID | 481 |
Feature activation | +8.11e-01 |
Pos logit contributions | |
companions | +11.031 |
unborn | +10.949 |
newfound | +10.916 |
awakened | +10.780 |
awakening | +10.780 |
Neg logit contributions | |
libel | -11.946 |
offensive | -10.042 |
vitro | -9.569 |
rubbish | -9.514 |
Serie | -9.400 |
Token | begin |
Token ID | 2221 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
companions | +8.761 |
newfound | +8.438 |
unborn | +8.354 |
awakening | +8.277 |
awakened | +8.264 |
Neg logit contributions | |
libel | -9.854 |
offensive | -8.507 |
Serie | -8.108 |
rubbish | -7.845 |
vitro | -7.813 |
Token | with |
Token ID | 351 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
awakening | +11.402 |
companions | +11.283 |
unborn | +11.182 |
newfound | +11.090 |
arrival | +10.775 |
Neg logit contributions | |
libel | -12.620 |
offensive | -10.273 |
Serie | -9.880 |
rubbish | -9.872 |
punt | -9.707 |
Token | our |
Token ID | 674 |
Feature activation | +3.03e+00 |
Pos logit contributions | |
companions | +21.338 |
awakening | +21.240 |
newfound | +20.884 |
arrival | +20.815 |
blessings | +20.725 |
Neg logit contributions | |
libel | -15.946 |
ictionary | -12.789 |
offensive | -12.651 |
ograph | -12.139 |
England | -11.805 |
Token | asc |
Token ID | 10570 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
companions | +30.130 |
arrival | +30.054 |
awakening | +29.611 |
newfound | +29.041 |
followers | +28.019 |
Neg logit contributions | |
libel | -17.148 |
ictionary | -14.573 |
offensive | -14.213 |
England | -13.594 |
redit | -13.240 |
Token | ension |
Token ID | 3004 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
companions | +10.768 |
awakening | +10.029 |
arrival | +9.944 |
newfound | +9.830 |
attendants | +9.467 |
Neg logit contributions | |
libel | -19.476 |
rubbish | -17.017 |
offensive | -16.756 |
Yugoslavia | -16.548 |
Serie | -16.376 |
Token | . |
Token ID | 13 |
Feature activation | +6.28e-01 |
Pos logit contributions | |
companions | +19.302 |
awakening | +18.918 |
arrival | +18.626 |
newfound | +17.941 |
grandchildren | +17.882 |
Neg logit contributions | |
libel | -17.037 |
offensive | -13.675 |
Serie | -13.203 |
rubbish | -12.920 |
England | -12.859 |
Token | Therefore |
Token ID | 8447 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
companions | +7.639 |
grandchildren | +7.500 |
unborn | +7.485 |
newfound | +7.320 |
survivors | +7.299 |
Neg logit contributions | |
libel | -7.478 |
offensive | -6.002 |
rubbish | -6.001 |
vitro | -5.741 |
advert | -5.659 |
Token | one |
Token ID | 530 |
Feature activation | +7.11e-01 |
Pos logit contributions | |
companions | +17.957 |
awakening | +17.744 |
unborn | +17.728 |
blessings | +17.188 |
enduring | +17.180 |
Neg logit contributions | |
libel | -15.576 |
offensive | -12.651 |
ictionary | -12.189 |
vitro | -12.138 |
rubbish | -11.967 |
Token | and |
Token ID | 290 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
unborn | +12.550 |
companions | +12.329 |
grandchildren | +11.681 |
newfound | +11.593 |
awakening | +11.542 |
Neg logit contributions | |
libel | -16.865 |
rubbish | -14.380 |
advert | -13.734 |
vitro | -13.626 |
punt | -13.560 |
Token | cre |
Token ID | 1126 |
Feature activation | +7.64e-01 |
Pos logit contributions | |
companions | +11.801 |
unborn | +11.480 |
grandchildren | +11.396 |
newfound | +11.214 |
awakened | +11.202 |
Neg logit contributions | |
libel | -11.573 |
rubbish | -9.632 |
offensive | -9.474 |
ictionary | -9.405 |
ograph | -9.255 |
Token | eds |
Token ID | 5379 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
companions | +7.214 |
unborn | +6.943 |
blessings | +6.811 |
caregivers | +6.709 |
survivors | +6.702 |
Neg logit contributions | |
libel | -11.025 |
rubbish | -9.308 |
tabloid | -9.051 |
punt | -8.846 |
Serie | -8.736 |
Token | in |
Token ID | 287 |
Feature activation | +3.78e-01 |
Pos logit contributions | |
unborn | +18.881 |
enduring | +18.033 |
companions | +18.017 |
awakening | +17.715 |
grandchildren | +17.665 |
Neg logit contributions | |
libel | -19.773 |
rubbish | -16.236 |
offensive | -16.141 |
vitro | -15.610 |
ograph | -15.548 |
Token | America |
Token ID | 2253 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
companions | +4.836 |
unborn | +4.785 |
newfound | +4.730 |
grandchildren | +4.714 |
awakening | +4.603 |
Neg logit contributions | |
libel | -4.465 |
rubbish | -3.646 |
offensive | -3.431 |
ograph | -3.407 |
advert | -3.375 |
Token | as |
Token ID | 355 |
Feature activation | +3.02e+00 |
Pos logit contributions | |
unborn | +13.330 |
enduring | +12.748 |
grandchildren | +12.691 |
companions | +12.626 |
newfound | +12.561 |
Neg logit contributions | |
libel | -15.214 |
rubbish | -12.800 |
offensive | -12.245 |
vitro | -12.065 |
Serie | -12.013 |
Token | ' |
Token ID | 705 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
companions | +26.303 |
grandchildren | +26.270 |
unborn | +25.987 |
blessings | +25.797 |
attendees | +25.607 |
Neg logit contributions | |
libel | -20.008 |
offensive | -15.821 |
ograph | -15.814 |
shit | -15.713 |
ictionary | -15.574 |
Token | not |
Token ID | 1662 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
companions | +21.920 |
newfound | +21.505 |
blessings | +21.431 |
unborn | +21.246 |
enduring | +21.145 |
Neg logit contributions | |
libel | -17.893 |
rubbish | -13.835 |
punt | -13.807 |
tabloid | -13.708 |
advert | -13.638 |
Token | a |
Token ID | 257 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
libel | +3.111 |
rubbish | +2.601 |
offensive | +2.551 |
advert | +2.472 |
Serie | +2.470 |
Neg logit contributions | |
companions | -2.501 |
unborn | -2.462 |
newfound | -2.444 |
grandchildren | -2.420 |
blessings | -2.330 |
Token | threat |
Token ID | 2372 |
Feature activation | +8.84e-02 |
Pos logit contributions | |
libel | +1.570 |
rubbish | +1.299 |
offensive | +1.287 |
advert | +1.228 |
Serie | +1.223 |
Neg logit contributions | |
companions | -1.423 |
newfound | -1.410 |
unborn | -1.395 |
grandchildren | -1.381 |
awakening | -1.338 |
Token | to |
Token ID | 284 |
Feature activation | +7.07e-01 |
Pos logit contributions | |
companions | +1.072 |
unborn | +1.070 |
grandchildren | +1.034 |
newfound | +1.031 |
awakening | +1.007 |
Neg logit contributions | |
libel | -1.138 |
rubbish | -0.942 |
offensive | -0.914 |
Serie | -0.899 |
advert | -0.895 |
Token | Live |
Token ID | 7547 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
companions | +22.353 |
attendees | +22.229 |
newfound | +21.916 |
unborn | +21.139 |
awakening | +21.044 |
Neg logit contributions | |
libel | -18.515 |
offensive | -15.248 |
rubbish | -14.546 |
England | -14.116 |
football | -14.008 |
Token | Quest |
Token ID | 6785 |
Feature activation | +1.78e+00 |
Pos logit contributions | |
companions | +13.622 |
attendees | +12.907 |
arrival | +12.670 |
grandchildren | +12.530 |
newfound | +12.487 |
Neg logit contributions | |
libel | -14.405 |
rubbish | -12.013 |
offensive | -11.784 |
vitro | -10.768 |
punt | -10.543 |
Token | Mode |
Token ID | 10363 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
companions | +18.908 |
awakening | +17.858 |
attendees | +17.598 |
arrival | +17.395 |
blessings | +17.313 |
Neg logit contributions | |
libel | -16.600 |
offensive | -13.437 |
rubbish | -13.013 |
vitro | -12.657 |
redit | -12.285 |
Token | � |
Token ID | 447 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
companions | +18.289 |
awakening | +17.834 |
newfound | +17.188 |
arrival | +17.138 |
attendees | +17.039 |
Neg logit contributions | |
libel | -18.164 |
offensive | -14.788 |
rubbish | -14.602 |
vitro | -14.111 |
Anyway | -13.779 |
Token | � |
Token ID | 247 |
Feature activation | +2.42e+00 |
Pos logit contributions | |
libel | +3.039 |
rubbish | +2.537 |
offensive | +2.452 |
vitro | +2.343 |
advert | +2.342 |
Neg logit contributions | |
companions | -2.897 |
newfound | -2.842 |
unborn | -2.827 |
grandchildren | -2.782 |
awakening | -2.723 |
Token | s |
Token ID | 82 |
Feature activation | +3.02e+00 |
Pos logit contributions | |
companions | +22.944 |
newfound | +22.318 |
attendees | +22.216 |
awakening | +22.156 |
arrival | +21.929 |
Neg logit contributions | |
libel | -18.369 |
rubbish | -14.654 |
vitro | -13.097 |
offensive | -13.016 |
punt | -12.999 |
Token | Event |
Token ID | 8558 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
arrival | +27.235 |
companions | +27.030 |
newfound | +26.605 |
awakening | +26.350 |
attendees | +25.978 |
Neg logit contributions | |
libel | -18.786 |
rubbish | -14.554 |
offensive | -13.954 |
vitro | -13.549 |
redit | -12.713 |
Token | Qu |
Token ID | 2264 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
companions | +17.888 |
attendees | +16.645 |
awakening | +16.182 |
followers | +16.028 |
newfound | +16.004 |
Neg logit contributions | |
libel | -19.783 |
offensive | -16.750 |
rubbish | -16.365 |
vitro | -15.296 |
punt | -15.208 |
Token | ests |
Token ID | 3558 |
Feature activation | +2.54e+00 |
Pos logit contributions | |
companions | +9.615 |
newfound | +9.076 |
grandchildren | +8.997 |
unborn | +8.909 |
attendees | +8.835 |
Neg logit contributions | |
libel | -15.639 |
rubbish | -12.959 |
offensive | -12.429 |
punt | -12.418 |
tabloid | -12.318 |
Token | and |
Token ID | 290 |
Feature activation | +2.62e+00 |
Pos logit contributions | |
companions | +21.318 |
newfound | +20.567 |
awakening | +20.461 |
arrival | +20.308 |
unborn | +19.956 |
Neg logit contributions | |
libel | -20.949 |
rubbish | -17.351 |
offensive | -16.715 |
vitro | -16.056 |
punt | -15.691 |
Token | Special |
Token ID | 6093 |
Feature activation | +6.98e-01 |
Pos logit contributions | |
companions | +24.397 |
newfound | +23.993 |
awakening | +22.947 |
arrival | +22.934 |
blessings | +22.768 |
Neg logit contributions | |
libel | -19.271 |
offensive | -15.321 |
rubbish | -14.996 |
vitro | -14.324 |
ictionary | -13.993 |
Token | . |
Token ID | 13 |
Feature activation | -3.19e+00 |
Pos logit contributions | |
libel | +31.281 |
rubbish | +29.626 |
cricket | +28.617 |
England | +28.126 |
racket | +28.013 |
Neg logit contributions | |
ollower | -16.219 |
newfound | -15.480 |
companions | -15.464 |
unborn | -15.426 |
caregivers | -14.966 |
Token | They |
Token ID | 1119 |
Feature activation | -2.38e+00 |
Pos logit contributions | |
Anyway | +26.453 |
England | +26.402 |
libel | +25.993 |
Bangladesh | +25.171 |
Fifa | +25.165 |
Neg logit contributions | |
newfound | -22.062 |
unborn | -21.531 |
companions | -21.490 |
awakening | -21.253 |
caregivers | -20.367 |
Token | have |
Token ID | 423 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
libel | +26.106 |
rubbish | +22.852 |
penal | +22.524 |
analyse | +22.106 |
punt | +21.922 |
Neg logit contributions | |
companions | -16.654 |
awakening | -16.157 |
newfound | -16.135 |
unborn | -15.929 |
grandchildren | -15.531 |
Token | a |
Token ID | 257 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
libel | +28.358 |
rubbish | +25.676 |
penal | +24.643 |
England | +23.977 |
Serie | +23.872 |
Neg logit contributions | |
reetings | -13.638 |
companions | -13.390 |
ollower | -13.019 |
unborn | -12.970 |
caregivers | -12.918 |
Token | system |
Token ID | 1080 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
libel | +28.129 |
rubbish | +24.738 |
racket | +23.831 |
punt | +23.470 |
penal | +23.411 |
Neg logit contributions | |
companions | -14.680 |
unborn | -14.175 |
caregivers | -14.024 |
reetings | -14.020 |
grandchildren | -13.778 |
Token | in |
Token ID | 287 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
libel | +22.081 |
rubbish | +19.314 |
advert | +18.288 |
bullshit | +17.819 |
penal | +17.758 |
Neg logit contributions | |
companions | -16.978 |
newfound | -16.717 |
grandchildren | -16.345 |
unborn | -16.265 |
caregivers | -15.953 |
Token | place |
Token ID | 1295 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
libel | +30.973 |
England | +28.848 |
cricket | +27.878 |
Switzerland | +27.345 |
vitro | +27.107 |
Neg logit contributions | |
reetings | -21.438 |
companions | -21.381 |
newfound | -21.137 |
grandchildren | -21.019 |
unborn | -20.866 |
Token | . |
Token ID | 13 |
Feature activation | -2.85e+00 |
Pos logit contributions | |
libel | +25.806 |
rubbish | +22.798 |
advert | +21.866 |
penal | +21.725 |
England | +21.319 |
Neg logit contributions | |
newfound | -18.034 |
companions | -17.921 |
grandchildren | -17.361 |
unborn | -17.176 |
reetings | -17.104 |
Token |
|
Token ID | 198 |
Feature activation | -8.09e-01 |
Pos logit contributions | |
libel | +25.423 |
England | +25.137 |
Anyway | +24.999 |
Switzerland | +24.280 |
Fifa | +24.215 |
Neg logit contributions | |
newfound | -20.401 |
companions | -20.055 |
unborn | -19.854 |
awakening | -19.473 |
caregivers | -18.640 |
Token |
|
Token ID | 198 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
libel | +6.801 |
offensive | +5.384 |
Anyway | +5.263 |
rubbish | +5.231 |
England | +5.088 |
Neg logit contributions | |
companions | -11.828 |
unborn | -11.792 |
newfound | -11.781 |
caregivers | -11.683 |
awakening | -11.646 |
Token | " |
Token ID | 1 |
Feature activation | -3.37e+00 |
Pos logit contributions | |
libel | +16.513 |
offensive | +13.976 |
England | +13.303 |
rubbish | +13.294 |
Anyway | +13.051 |
Neg logit contributions | |
companions | -18.981 |
unborn | -18.631 |
newfound | -18.478 |
grandchildren | -18.311 |
caregivers | -18.294 |
Token | think |
Token ID | 892 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
libel | +26.222 |
rubbish | +24.136 |
penal | +23.003 |
analyse | +22.963 |
punt | +22.878 |
Neg logit contributions | |
newfound | -20.841 |
unborn | -20.429 |
companions | -19.836 |
grandchildren | -19.308 |
occupants | -19.299 |
Token | you |
Token ID | 345 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
libel | +29.520 |
England | +26.126 |
cricket | +26.027 |
rubbish | +25.978 |
racket | +25.165 |
Neg logit contributions | |
newfound | -14.759 |
companions | -14.641 |
unborn | -14.566 |
reetings | -13.889 |
awakened | -13.801 |
Token | should |
Token ID | 815 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
libel | +23.037 |
rubbish | +20.165 |
punt | +19.446 |
penal | +18.924 |
England | +18.762 |
Neg logit contributions | |
companions | -17.283 |
newfound | -17.203 |
unborn | -17.025 |
awakening | -16.129 |
grandchildren | -16.124 |
Token | see |
Token ID | 766 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
libel | +30.938 |
rubbish | +28.148 |
penal | +27.941 |
punt | +27.730 |
analyse | +27.097 |
Neg logit contributions | |
newfound | -18.810 |
unborn | -18.175 |
companions | -18.052 |
awakening | -17.237 |
caregivers | -17.218 |
Token | ch |
Token ID | 442 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
libel | +33.205 |
rubbish | +29.824 |
England | +29.683 |
cricket | +29.593 |
racket | +28.851 |
Neg logit contributions | |
companions | -13.306 |
ollower | -13.286 |
newfound | -13.247 |
unborn | -13.141 |
reetings | -13.012 |
Token | ucking |
Token ID | 19296 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
libel | +5.165 |
rubbish | +4.075 |
offensive | +3.937 |
advert | +3.700 |
punt | +3.670 |
Neg logit contributions | |
companions | -7.735 |
unborn | -7.610 |
newfound | -7.606 |
grandchildren | -7.502 |
caregivers | -7.339 |
Token | as |
Token ID | 355 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
libel | +34.369 |
cricket | +32.301 |
rubbish | +31.992 |
racket | +31.351 |
penal | +31.173 |
Neg logit contributions | |
ollower | -15.977 |
companions | -15.143 |
unborn | -14.570 |
newfound | -14.484 |
caregivers | -14.453 |
Token | a |
Token ID | 257 |
Feature activation | -3.27e+00 |
Pos logit contributions | |
libel | +35.062 |
rubbish | +32.132 |
racket | +31.160 |
penal | +31.017 |
cricket | +30.909 |
Neg logit contributions | |
ollower | -17.233 |
reetings | -17.214 |
companions | -16.973 |
unborn | -16.895 |
grandchildren | -16.571 |
Token | crime |
Token ID | 4065 |
Feature activation | -3.05e+00 |
Pos logit contributions | |
libel | +33.695 |
penal | +30.030 |
rubbish | +29.751 |
racket | +29.609 |
cricket | +29.527 |
Neg logit contributions | |
reetings | -17.475 |
ollower | -16.526 |
companions | -16.477 |
unborn | -16.324 |
grandchildren | -16.322 |
Token | . |
Token ID | 13 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
libel | +30.018 |
rubbish | +26.093 |
racket | +25.950 |
penal | +24.894 |
advert | +24.839 |
Neg logit contributions | |
companions | -18.335 |
newfound | -18.127 |
grandchildren | -18.044 |
unborn | -18.023 |
caregivers | -17.739 |
Token | I |
Token ID | 314 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
England | +27.919 |
Anyway | +27.254 |
Bangladesh | +26.916 |
libel | +26.716 |
Fifa | +26.515 |
Neg logit contributions | |
newfound | -23.061 |
unborn | -22.458 |
companions | -21.953 |
awakening | -21.903 |
awakened | -20.941 |
Token | The |
Token ID | 464 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
England | +25.030 |
Anyway | +24.794 |
Football | +24.322 |
libel | +23.240 |
Basically | +23.059 |
Neg logit contributions | |
unborn | -26.459 |
companions | -25.802 |
newfound | -25.573 |
awakening | -25.082 |
caregivers | -25.045 |
Token | ICC |
Token ID | 32300 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
libel | +27.016 |
rubbish | +24.034 |
racket | +23.510 |
England | +23.314 |
cricket | +23.003 |
Neg logit contributions | |
companions | -12.083 |
newfound | -11.587 |
unborn | -11.530 |
grandchildren | -11.466 |
caregivers | -10.761 |
Token | has |
Token ID | 468 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
libel | +31.677 |
penal | +28.109 |
rubbish | +27.895 |
advert | +27.762 |
racket | +27.629 |
Neg logit contributions | |
newfound | -16.143 |
unborn | -16.134 |
companions | -16.107 |
grandchildren | -14.863 |
caregivers | -14.860 |
Token | a |
Token ID | 257 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
libel | +24.824 |
rubbish | +22.070 |
penal | +21.097 |
advert | +20.798 |
racket | +20.622 |
Neg logit contributions | |
companions | -13.362 |
unborn | -12.967 |
caregivers | -12.724 |
reetings | -12.702 |
newfound | -12.694 |
Token | rule |
Token ID | 3896 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
libel | +24.848 |
rubbish | +21.672 |
racket | +20.971 |
penal | +20.522 |
punt | +20.428 |
Neg logit contributions | |
companions | -13.405 |
unborn | -13.115 |
caregivers | -12.923 |
grandchildren | -12.512 |
occupants | -12.217 |
Token | in |
Token ID | 287 |
Feature activation | -3.84e+00 |
Pos logit contributions | |
libel | +21.663 |
rubbish | +18.242 |
advert | +17.561 |
offensive | +17.495 |
racket | +17.417 |
Neg logit contributions | |
companions | -15.812 |
newfound | -15.628 |
grandchildren | -15.127 |
unborn | -15.097 |
caregivers | -14.730 |
Token | place |
Token ID | 1295 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
libel | +36.324 |
England | +33.115 |
cricket | +32.640 |
racket | +32.121 |
Switzerland | +31.447 |
Neg logit contributions | |
companions | -16.799 |
caregivers | -16.533 |
newfound | -16.374 |
unborn | -16.348 |
grandchildren | -16.253 |
Token | . |
Token ID | 13 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
libel | +26.914 |
penal | +22.947 |
rubbish | +22.914 |
advert | +22.678 |
racket | +21.816 |
Neg logit contributions | |
newfound | -18.320 |
companions | -18.178 |
grandchildren | -17.586 |
unborn | -17.267 |
reetings | -17.006 |
Token | When |
Token ID | 1649 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
England | +26.725 |
libel | +26.221 |
Anyway | +25.822 |
Fifa | +25.547 |
Switzerland | +25.436 |
Neg logit contributions | |
newfound | -21.879 |
companions | -21.253 |
unborn | -20.935 |
awakening | -20.810 |
awakened | -20.071 |
Token | they |
Token ID | 484 |
Feature activation | -3.01e+00 |
Pos logit contributions | |
libel | +28.451 |
England | +25.240 |
rubbish | +25.121 |
racket | +24.939 |
cricket | +24.876 |
Neg logit contributions | |
newfound | -15.445 |
companions | -15.373 |
unborn | -14.671 |
grandchildren | -14.384 |
reetings | -14.082 |
Token | reviewed |
Token ID | 11765 |
Feature activation | -3.79e+00 |
Pos logit contributions | |
libel | +29.969 |
penal | +27.445 |
punt | +27.168 |
rubbish | +26.315 |
analyse | +25.862 |
Neg logit contributions | |
companions | -18.228 |
newfound | -18.042 |
unborn | -17.409 |
awakening | -17.050 |
caregivers | -16.428 |
Token | When |
Token ID | 1649 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
England | +26.725 |
libel | +26.221 |
Anyway | +25.822 |
Fifa | +25.547 |
Switzerland | +25.436 |
Neg logit contributions | |
newfound | -21.879 |
companions | -21.253 |
unborn | -20.935 |
awakening | -20.810 |
awakened | -20.071 |
Token | they |
Token ID | 484 |
Feature activation | -3.01e+00 |
Pos logit contributions | |
libel | +28.451 |
England | +25.240 |
rubbish | +25.121 |
racket | +24.939 |
cricket | +24.876 |
Neg logit contributions | |
newfound | -15.445 |
companions | -15.373 |
unborn | -14.671 |
grandchildren | -14.384 |
reetings | -14.082 |
Token | reviewed |
Token ID | 11765 |
Feature activation | -3.79e+00 |
Pos logit contributions | |
libel | +29.969 |
penal | +27.445 |
punt | +27.168 |
rubbish | +26.315 |
analyse | +25.862 |
Neg logit contributions | |
companions | -18.228 |
newfound | -18.042 |
unborn | -17.409 |
awakening | -17.050 |
caregivers | -16.428 |
Token | a |
Token ID | 257 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
libel | +35.603 |
England | +32.327 |
cricket | +32.165 |
rubbish | +31.117 |
racket | +30.798 |
Neg logit contributions | |
companions | -16.413 |
ollower | -15.847 |
newfound | -15.810 |
reetings | -15.713 |
unborn | -15.569 |
Token | lot |
Token ID | 1256 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
libel | +33.275 |
cricket | +29.753 |
racket | +29.706 |
rubbish | +28.712 |
penal | +28.666 |
Neg logit contributions | |
reetings | -17.030 |
companions | -16.759 |
grandchildren | -16.543 |
caregivers | -16.324 |
unborn | -16.245 |
Token | of |
Token ID | 286 |
Feature activation | -3.82e+00 |
Pos logit contributions | |
libel | +26.346 |
rubbish | +22.751 |
offensive | +21.196 |
racket | +21.011 |
England | +20.770 |
Neg logit contributions | |
companions | -17.641 |
newfound | -17.430 |
grandchildren | -16.780 |
unborn | -16.659 |
awakening | -16.381 |
Token | old |
Token ID | 1468 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
libel | +36.436 |
cricket | +33.319 |
rubbish | +32.901 |
racket | +32.550 |
England | +32.264 |
Neg logit contributions | |
ollower | -15.599 |
companions | -15.362 |
reetings | -15.084 |
unborn | -14.722 |
grandchildren | -14.381 |
Token | film |
Token ID | 2646 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
libel | +36.516 |
cricket | +32.864 |
rubbish | +32.794 |
racket | +32.639 |
England | +32.494 |
Neg logit contributions | |
newfound | -15.324 |
unborn | -15.232 |
ollower | -14.774 |
caregivers | -14.583 |
companions | -14.415 |
Token | footage |
Token ID | 9640 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
libel | +27.100 |
rubbish | +23.677 |
offensive | +22.595 |
advert | +22.537 |
ograph | +22.118 |
Neg logit contributions | |
newfound | -14.471 |
unborn | -14.333 |
grandchildren | -13.872 |
companions | -13.782 |
caregivers | -13.350 |
Token | they |
Token ID | 484 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
libel | +25.729 |
rubbish | +22.265 |
advert | +20.972 |
offensive | +20.752 |
England | +20.646 |
Neg logit contributions | |
companions | -15.978 |
newfound | -15.944 |
unborn | -15.645 |
grandchildren | -15.099 |
caregivers | -15.068 |
Token | actually |
Token ID | 1682 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
libel | +23.314 |
rubbish | +20.310 |
penal | +19.787 |
advert | +19.486 |
punt | +19.138 |
Neg logit contributions | |
companions | -16.029 |
newfound | -15.757 |
unborn | -15.569 |
grandchildren | -15.197 |
caregivers | -15.141 |
Token | in |
Token ID | 287 |
Feature activation | -3.84e+00 |
Pos logit contributions | |
libel | +21.663 |
rubbish | +18.242 |
advert | +17.561 |
offensive | +17.495 |
racket | +17.417 |
Neg logit contributions | |
companions | -15.812 |
newfound | -15.628 |
grandchildren | -15.127 |
unborn | -15.097 |
caregivers | -14.730 |
Token | place |
Token ID | 1295 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
libel | +36.324 |
England | +33.115 |
cricket | +32.640 |
racket | +32.121 |
Switzerland | +31.447 |
Neg logit contributions | |
companions | -16.799 |
caregivers | -16.533 |
newfound | -16.374 |
unborn | -16.348 |
grandchildren | -16.253 |
Token | . |
Token ID | 13 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
libel | +26.914 |
penal | +22.947 |
rubbish | +22.914 |
advert | +22.678 |
racket | +21.816 |
Neg logit contributions | |
newfound | -18.320 |
companions | -18.178 |
grandchildren | -17.586 |
unborn | -17.267 |
reetings | -17.006 |
Token | When |
Token ID | 1649 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
England | +26.725 |
libel | +26.221 |
Anyway | +25.822 |
Fifa | +25.547 |
Switzerland | +25.436 |
Neg logit contributions | |
newfound | -21.879 |
companions | -21.253 |
unborn | -20.935 |
awakening | -20.810 |
awakened | -20.071 |
Token | they |
Token ID | 484 |
Feature activation | -3.01e+00 |
Pos logit contributions | |
libel | +28.451 |
England | +25.240 |
rubbish | +25.121 |
racket | +24.939 |
cricket | +24.876 |
Neg logit contributions | |
newfound | -15.445 |
companions | -15.373 |
unborn | -14.671 |
grandchildren | -14.384 |
reetings | -14.082 |
Token | reviewed |
Token ID | 11765 |
Feature activation | -3.79e+00 |
Pos logit contributions | |
libel | +29.969 |
penal | +27.445 |
punt | +27.168 |
rubbish | +26.315 |
analyse | +25.862 |
Neg logit contributions | |
companions | -18.228 |
newfound | -18.042 |
unborn | -17.409 |
awakening | -17.050 |
caregivers | -16.428 |
Token | a |
Token ID | 257 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
libel | +35.603 |
England | +32.327 |
cricket | +32.165 |
rubbish | +31.117 |
racket | +30.798 |
Neg logit contributions | |
companions | -16.413 |
ollower | -15.847 |
newfound | -15.810 |
reetings | -15.713 |
unborn | -15.569 |
Token | lot |
Token ID | 1256 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
libel | +33.275 |
cricket | +29.753 |
racket | +29.706 |
rubbish | +28.712 |
penal | +28.666 |
Neg logit contributions | |
reetings | -17.030 |
companions | -16.759 |
grandchildren | -16.543 |
caregivers | -16.324 |
unborn | -16.245 |
Token | of |
Token ID | 286 |
Feature activation | -3.82e+00 |
Pos logit contributions | |
libel | +26.346 |
rubbish | +22.751 |
offensive | +21.196 |
racket | +21.011 |
England | +20.770 |
Neg logit contributions | |
companions | -17.641 |
newfound | -17.430 |
grandchildren | -16.780 |
unborn | -16.659 |
awakening | -16.381 |
Token | old |
Token ID | 1468 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
libel | +36.436 |
cricket | +33.319 |
rubbish | +32.901 |
racket | +32.550 |
England | +32.264 |
Neg logit contributions | |
ollower | -15.599 |
companions | -15.362 |
reetings | -15.084 |
unborn | -14.722 |
grandchildren | -14.381 |
Token | film |
Token ID | 2646 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
libel | +36.516 |
cricket | +32.864 |
rubbish | +32.794 |
racket | +32.639 |
England | +32.494 |
Neg logit contributions | |
newfound | -15.324 |
unborn | -15.232 |
ollower | -14.774 |
caregivers | -14.583 |
companions | -14.415 |
Token | they |
Token ID | 484 |
Feature activation | -3.01e+00 |
Pos logit contributions | |
libel | +28.451 |
England | +25.240 |
rubbish | +25.121 |
racket | +24.939 |
cricket | +24.876 |
Neg logit contributions | |
newfound | -15.445 |
companions | -15.373 |
unborn | -14.671 |
grandchildren | -14.384 |
reetings | -14.082 |
Token | reviewed |
Token ID | 11765 |
Feature activation | -3.79e+00 |
Pos logit contributions | |
libel | +29.969 |
penal | +27.445 |
punt | +27.168 |
rubbish | +26.315 |
analyse | +25.862 |
Neg logit contributions | |
companions | -18.228 |
newfound | -18.042 |
unborn | -17.409 |
awakening | -17.050 |
caregivers | -16.428 |
Token | a |
Token ID | 257 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
libel | +35.603 |
England | +32.327 |
cricket | +32.165 |
rubbish | +31.117 |
racket | +30.798 |
Neg logit contributions | |
companions | -16.413 |
ollower | -15.847 |
newfound | -15.810 |
reetings | -15.713 |
unborn | -15.569 |
Token | lot |
Token ID | 1256 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
libel | +33.275 |
cricket | +29.753 |
racket | +29.706 |
rubbish | +28.712 |
penal | +28.666 |
Neg logit contributions | |
reetings | -17.030 |
companions | -16.759 |
grandchildren | -16.543 |
caregivers | -16.324 |
unborn | -16.245 |
Token | of |
Token ID | 286 |
Feature activation | -3.82e+00 |
Pos logit contributions | |
libel | +26.346 |
rubbish | +22.751 |
offensive | +21.196 |
racket | +21.011 |
England | +20.770 |
Neg logit contributions | |
companions | -17.641 |
newfound | -17.430 |
grandchildren | -16.780 |
unborn | -16.659 |
awakening | -16.381 |
Token | old |
Token ID | 1468 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
libel | +36.436 |
cricket | +33.319 |
rubbish | +32.901 |
racket | +32.550 |
England | +32.264 |
Neg logit contributions | |
ollower | -15.599 |
companions | -15.362 |
reetings | -15.084 |
unborn | -14.722 |
grandchildren | -14.381 |
Token | film |
Token ID | 2646 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
libel | +36.516 |
cricket | +32.864 |
rubbish | +32.794 |
racket | +32.639 |
England | +32.494 |
Neg logit contributions | |
newfound | -15.324 |
unborn | -15.232 |
ollower | -14.774 |
caregivers | -14.583 |
companions | -14.415 |
Token | footage |
Token ID | 9640 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
libel | +27.100 |
rubbish | +23.677 |
offensive | +22.595 |
advert | +22.537 |
ograph | +22.118 |
Neg logit contributions | |
newfound | -14.471 |
unborn | -14.333 |
grandchildren | -13.872 |
companions | -13.782 |
caregivers | -13.350 |
Token | they |
Token ID | 484 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
libel | +25.729 |
rubbish | +22.265 |
advert | +20.972 |
offensive | +20.752 |
England | +20.646 |
Neg logit contributions | |
companions | -15.978 |
newfound | -15.944 |
unborn | -15.645 |
grandchildren | -15.099 |
caregivers | -15.068 |
Token | actually |
Token ID | 1682 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
libel | +23.314 |
rubbish | +20.310 |
penal | +19.787 |
advert | +19.486 |
punt | +19.138 |
Neg logit contributions | |
companions | -16.029 |
newfound | -15.757 |
unborn | -15.569 |
grandchildren | -15.197 |
caregivers | -15.141 |
Token | found |
Token ID | 1043 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
libel | +27.851 |
penal | +24.919 |
rubbish | +24.606 |
advert | +23.857 |
analyse | +23.640 |
Neg logit contributions | |
companions | -16.324 |
newfound | -15.806 |
unborn | -15.555 |
awakening | -15.378 |
caregivers | -15.259 |
Token | and |
Token ID | 290 |
Feature activation | -2.16e+00 |
Pos logit contributions | |
libel | +26.505 |
rubbish | +24.176 |
England | +22.629 |
punt | +22.454 |
advert | +22.385 |
Neg logit contributions | |
reetings | -15.173 |
companions | -15.052 |
ollower | -14.673 |
attendees | -14.656 |
Guests | -14.403 |
Token | view |
Token ID | 1570 |
Feature activation | -2.44e+00 |
Pos logit contributions | |
libel | +26.291 |
rubbish | +24.032 |
England | +22.449 |
cricket | +22.402 |
punt | +22.214 |
Neg logit contributions | |
companions | -13.875 |
newfound | -13.790 |
unborn | -13.566 |
awakening | -12.862 |
reetings | -12.773 |
Token | it |
Token ID | 340 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
libel | +28.580 |
rubbish | +26.131 |
cricket | +25.466 |
England | +25.106 |
offensive | +25.003 |
Neg logit contributions | |
companions | -14.628 |
newfound | -14.571 |
unborn | -14.333 |
grandchildren | -13.809 |
awakened | -13.719 |
Token | like |
Token ID | 588 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
libel | +26.729 |
rubbish | +24.751 |
advert | +22.399 |
penal | +22.328 |
offensive | +22.193 |
Neg logit contributions | |
unborn | -16.984 |
grandchildren | -16.892 |
newfound | -16.879 |
companions | -16.735 |
reetings | -16.014 |
Token | that |
Token ID | 326 |
Feature activation | -2.82e+00 |
Pos logit contributions | |
libel | +26.192 |
rubbish | +24.016 |
racket | +22.227 |
cricket | +21.935 |
tabloid | +21.891 |
Neg logit contributions | |
companions | -14.115 |
newfound | -14.033 |
unborn | -13.835 |
grandchildren | -13.250 |
reetings | -13.191 |
Token | . |
Token ID | 13 |
Feature activation | -3.71e+00 |
Pos logit contributions | |
libel | +29.757 |
rubbish | +27.184 |
advert | +25.377 |
England | +25.084 |
offensive | +24.819 |
Neg logit contributions | |
companions | -16.930 |
newfound | -16.710 |
unborn | -16.352 |
grandchildren | -16.024 |
reetings | -15.611 |
Token | You |
Token ID | 921 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
England | +28.051 |
Anyway | +27.980 |
Bangladesh | +26.880 |
Fifa | +26.722 |
Football | +26.537 |
Neg logit contributions | |
newfound | -23.637 |
unborn | -22.690 |
companions | -22.326 |
awakening | -22.149 |
awakened | -21.185 |
Token | have |
Token ID | 423 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
libel | +24.341 |
rubbish | +21.452 |
punt | +20.866 |
analyse | +20.356 |
penal | +20.013 |
Neg logit contributions | |
newfound | -18.083 |
companions | -18.036 |
unborn | -17.327 |
awakening | -16.830 |
grandchildren | -16.667 |
Token | a |
Token ID | 257 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
libel | +27.829 |
rubbish | +25.182 |
England | +23.862 |
cricket | +23.681 |
racket | +23.624 |
Neg logit contributions | |
companions | -13.576 |
newfound | -13.337 |
reetings | -13.261 |
unborn | -13.081 |
ollower | -12.934 |
Token | technical |
Token ID | 6276 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
libel | +27.086 |
rubbish | +24.141 |
racket | +23.426 |
punt | +23.355 |
cricket | +23.219 |
Neg logit contributions | |
companions | -13.873 |
unborn | -13.511 |
reetings | -13.503 |
grandchildren | -13.402 |
attendees | -12.828 |
Token | fault |
Token ID | 8046 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
libel | +29.013 |
rubbish | +25.305 |
racket | +24.350 |
punt | +24.124 |
England | +23.992 |
Neg logit contributions | |
companions | -14.888 |
grandchildren | -14.664 |
newfound | -14.371 |
unborn | -14.195 |
reetings | -14.144 |
Token | scoring |
Token ID | 9689 |
Feature activation | -2.59e+00 |
Pos logit contributions | |
libel | +24.489 |
rubbish | +21.583 |
England | +21.392 |
Serie | +20.423 |
punt | +20.423 |
Neg logit contributions | |
companions | -15.108 |
unborn | -14.922 |
newfound | -14.582 |
caregivers | -14.374 |
grandchildren | -14.097 |
Token | those |
Token ID | 883 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
libel | +29.348 |
rubbish | +26.093 |
England | +26.048 |
punt | +24.917 |
cricket | +24.672 |
Neg logit contributions | |
unborn | -14.848 |
ollower | -14.361 |
companions | -14.275 |
caregivers | -13.929 |
newfound | -13.887 |
Token | two |
Token ID | 734 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
libel | +24.911 |
rubbish | +21.837 |
England | +21.336 |
punt | +21.183 |
advert | +20.437 |
Neg logit contributions | |
unborn | -13.568 |
companions | -12.879 |
caregivers | -12.763 |
newfound | -12.376 |
awakening | -12.083 |
Token | 50 |
Token ID | 2026 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
libel | +26.929 |
rubbish | +24.027 |
England | +23.042 |
punt | +22.834 |
advert | +22.265 |
Neg logit contributions | |
unborn | -13.366 |
companions | -12.621 |
caregivers | -12.527 |
newfound | -12.233 |
awakening | -12.070 |
Token | s |
Token ID | 82 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
libel | +26.800 |
rubbish | +23.406 |
offensive | +22.936 |
England | +22.828 |
punt | +22.463 |
Neg logit contributions | |
unborn | -15.143 |
companions | -14.524 |
caregivers | -14.503 |
newfound | -14.036 |
awakening | -13.742 |
Token | in |
Token ID | 287 |
Feature activation | -3.69e+00 |
Pos logit contributions | |
libel | +24.693 |
rubbish | +22.016 |
England | +20.902 |
punt | +20.489 |
offensive | +20.450 |
Neg logit contributions | |
unborn | -15.939 |
newfound | -15.671 |
companions | -15.601 |
caregivers | -14.862 |
grandchildren | -14.338 |
Token | really |
Token ID | 1107 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
libel | +33.795 |
England | +32.124 |
Jama | +30.050 |
Bangladesh | +30.021 |
cricket | +29.763 |
Neg logit contributions | |
ollower | -16.972 |
unborn | -16.940 |
companions | -16.198 |
caregivers | -15.784 |
newfound | -15.510 |
Token | difficult |
Token ID | 2408 |
Feature activation | -2.99e+00 |
Pos logit contributions | |
libel | +26.512 |
rubbish | +24.266 |
England | +22.888 |
offensive | +22.470 |
Serie | +22.464 |
Neg logit contributions | |
companions | -12.785 |
unborn | -12.672 |
grandchildren | -12.107 |
newfound | -11.724 |
caregivers | -11.715 |
Token | conditions |
Token ID | 3403 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
libel | +31.473 |
England | +28.960 |
cricket | +28.412 |
rubbish | +27.458 |
Bangladesh | +26.981 |
Neg logit contributions | |
unborn | -16.455 |
ollower | -15.928 |
newfound | -15.412 |
grandchildren | -14.832 |
caregivers | -14.749 |
Token | and |
Token ID | 290 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
libel | +25.105 |
rubbish | +22.337 |
England | +21.571 |
penal | +20.994 |
advert | +20.720 |
Neg logit contributions | |
companions | -16.249 |
newfound | -16.159 |
unborn | -16.062 |
grandchildren | -15.535 |
caregivers | -15.390 |
Token | winning |
Token ID | 5442 |
Feature activation | -2.82e+00 |
Pos logit contributions | |
libel | +21.325 |
rubbish | +19.056 |
England | +18.282 |
punt | +18.065 |
offensive | +17.775 |
Neg logit contributions | |
unborn | -10.787 |
companions | -10.680 |
newfound | -10.289 |
grandchildren | -10.126 |
caregivers | -10.024 |
Token | you |
Token ID | 345 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
libel | +29.520 |
England | +26.126 |
cricket | +26.027 |
rubbish | +25.978 |
racket | +25.165 |
Neg logit contributions | |
newfound | -14.759 |
companions | -14.641 |
unborn | -14.566 |
reetings | -13.889 |
awakened | -13.801 |
Token | should |
Token ID | 815 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
libel | +23.037 |
rubbish | +20.165 |
punt | +19.446 |
penal | +18.924 |
England | +18.762 |
Neg logit contributions | |
companions | -17.283 |
newfound | -17.203 |
unborn | -17.025 |
awakening | -16.129 |
grandchildren | -16.124 |
Token | see |
Token ID | 766 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
libel | +30.938 |
rubbish | +28.148 |
penal | +27.941 |
punt | +27.730 |
analyse | +27.097 |
Neg logit contributions | |
newfound | -18.810 |
unborn | -18.175 |
companions | -18.052 |
awakening | -17.237 |
caregivers | -17.218 |
Token | ch |
Token ID | 442 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
libel | +33.205 |
rubbish | +29.824 |
England | +29.683 |
cricket | +29.593 |
racket | +28.851 |
Neg logit contributions | |
companions | -13.306 |
ollower | -13.286 |
newfound | -13.247 |
unborn | -13.141 |
reetings | -13.012 |
Token | ucking |
Token ID | 19296 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
libel | +5.165 |
rubbish | +4.075 |
offensive | +3.937 |
advert | +3.700 |
punt | +3.670 |
Neg logit contributions | |
companions | -7.735 |
unborn | -7.610 |
newfound | -7.606 |
grandchildren | -7.502 |
caregivers | -7.339 |
Token | as |
Token ID | 355 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
libel | +34.369 |
cricket | +32.301 |
rubbish | +31.992 |
racket | +31.351 |
penal | +31.173 |
Neg logit contributions | |
ollower | -15.977 |
companions | -15.143 |
unborn | -14.570 |
newfound | -14.484 |
caregivers | -14.453 |
Token | a |
Token ID | 257 |
Feature activation | -3.27e+00 |
Pos logit contributions | |
libel | +35.062 |
rubbish | +32.132 |
racket | +31.160 |
penal | +31.017 |
cricket | +30.909 |
Neg logit contributions | |
ollower | -17.233 |
reetings | -17.214 |
companions | -16.973 |
unborn | -16.895 |
grandchildren | -16.571 |
Token | crime |
Token ID | 4065 |
Feature activation | -3.05e+00 |
Pos logit contributions | |
libel | +33.695 |
penal | +30.030 |
rubbish | +29.751 |
racket | +29.609 |
cricket | +29.527 |
Neg logit contributions | |
reetings | -17.475 |
ollower | -16.526 |
companions | -16.477 |
unborn | -16.324 |
grandchildren | -16.322 |
Token | . |
Token ID | 13 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
libel | +30.018 |
rubbish | +26.093 |
racket | +25.950 |
penal | +24.894 |
advert | +24.839 |
Neg logit contributions | |
companions | -18.335 |
newfound | -18.127 |
grandchildren | -18.044 |
unborn | -18.023 |
caregivers | -17.739 |
Token | I |
Token ID | 314 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
England | +27.919 |
Anyway | +27.254 |
Bangladesh | +26.916 |
libel | +26.716 |
Fifa | +26.515 |
Neg logit contributions | |
newfound | -23.061 |
unborn | -22.458 |
companions | -21.953 |
awakening | -21.903 |
awakened | -20.941 |
Token | think |
Token ID | 892 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
libel | +26.789 |
rubbish | +23.367 |
punt | +23.033 |
analyse | +22.666 |
penal | +22.541 |
Neg logit contributions | |
newfound | -20.776 |
companions | -20.481 |
awakening | -20.192 |
unborn | -19.968 |
occupants | -19.333 |
Token | ch |
Token ID | 442 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
libel | +33.205 |
rubbish | +29.824 |
England | +29.683 |
cricket | +29.593 |
racket | +28.851 |
Neg logit contributions | |
companions | -13.306 |
ollower | -13.286 |
newfound | -13.247 |
unborn | -13.141 |
reetings | -13.012 |
Token | ucking |
Token ID | 19296 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
libel | +5.165 |
rubbish | +4.075 |
offensive | +3.937 |
advert | +3.700 |
punt | +3.670 |
Neg logit contributions | |
companions | -7.735 |
unborn | -7.610 |
newfound | -7.606 |
grandchildren | -7.502 |
caregivers | -7.339 |
Token | as |
Token ID | 355 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
libel | +34.369 |
cricket | +32.301 |
rubbish | +31.992 |
racket | +31.351 |
penal | +31.173 |
Neg logit contributions | |
ollower | -15.977 |
companions | -15.143 |
unborn | -14.570 |
newfound | -14.484 |
caregivers | -14.453 |
Token | a |
Token ID | 257 |
Feature activation | -3.27e+00 |
Pos logit contributions | |
libel | +35.062 |
rubbish | +32.132 |
racket | +31.160 |
penal | +31.017 |
cricket | +30.909 |
Neg logit contributions | |
ollower | -17.233 |
reetings | -17.214 |
companions | -16.973 |
unborn | -16.895 |
grandchildren | -16.571 |
Token | crime |
Token ID | 4065 |
Feature activation | -3.05e+00 |
Pos logit contributions | |
libel | +33.695 |
penal | +30.030 |
rubbish | +29.751 |
racket | +29.609 |
cricket | +29.527 |
Neg logit contributions | |
reetings | -17.475 |
ollower | -16.526 |
companions | -16.477 |
unborn | -16.324 |
grandchildren | -16.322 |
Token | . |
Token ID | 13 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
libel | +30.018 |
rubbish | +26.093 |
racket | +25.950 |
penal | +24.894 |
advert | +24.839 |
Neg logit contributions | |
companions | -18.335 |
newfound | -18.127 |
grandchildren | -18.044 |
unborn | -18.023 |
caregivers | -17.739 |
Token | I |
Token ID | 314 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
England | +27.919 |
Anyway | +27.254 |
Bangladesh | +26.916 |
libel | +26.716 |
Fifa | +26.515 |
Neg logit contributions | |
newfound | -23.061 |
unborn | -22.458 |
companions | -21.953 |
awakening | -21.903 |
awakened | -20.941 |
Token | think |
Token ID | 892 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
libel | +26.789 |
rubbish | +23.367 |
punt | +23.033 |
analyse | +22.666 |
penal | +22.541 |
Neg logit contributions | |
newfound | -20.776 |
companions | -20.481 |
awakening | -20.192 |
unborn | -19.968 |
occupants | -19.333 |
Token | it |
Token ID | 340 |
Feature activation | -2.54e+00 |
Pos logit contributions | |
libel | +30.328 |
rubbish | +26.994 |
cricket | +26.557 |
England | +26.330 |
racket | +25.941 |
Neg logit contributions | |
newfound | -14.889 |
companions | -14.633 |
unborn | -14.506 |
reetings | -14.092 |
ollower | -13.778 |
Token | is |
Token ID | 318 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
libel | +27.160 |
rubbish | +23.753 |
advert | +23.175 |
penal | +22.863 |
offensive | +22.038 |
Neg logit contributions | |
companions | -17.994 |
newfound | -17.960 |
unborn | -17.550 |
grandchildren | -17.489 |
reetings | -16.703 |
Token | just |
Token ID | 655 |
Feature activation | -2.96e+00 |
Pos logit contributions | |
libel | +32.013 |
rubbish | +29.589 |
penal | +27.245 |
racket | +27.157 |
bullshit | +26.891 |
Neg logit contributions | |
ollower | -15.642 |
unborn | -15.297 |
companions | -15.114 |
reetings | -14.991 |
grandchildren | -14.803 |
Token | be |
Token ID | 307 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
libel | +14.281 |
rubbish | +12.137 |
punt | +11.399 |
offensive | +11.218 |
advert | +11.218 |
Neg logit contributions | |
companions | -13.095 |
newfound | -12.995 |
unborn | -12.970 |
grandchildren | -12.783 |
caregivers | -12.465 |
Token | corrected |
Token ID | 19267 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
libel | +18.448 |
rubbish | +15.820 |
advert | +15.092 |
penal | +14.984 |
punt | +14.846 |
Neg logit contributions | |
companions | -12.607 |
unborn | -12.174 |
newfound | -12.080 |
grandchildren | -12.013 |
blessings | -11.635 |
Token | . |
Token ID | 13 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
libel | +16.810 |
rubbish | +14.278 |
offensive | +13.560 |
advert | +13.367 |
vitro | +13.246 |
Neg logit contributions | |
newfound | -14.834 |
companions | -14.820 |
unborn | -14.591 |
grandchildren | -14.416 |
caregivers | -13.905 |
Token |
|
Token ID | 198 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
libel | +17.526 |
Serie | +14.747 |
rubbish | +14.636 |
offensive | +14.572 |
England | +14.564 |
Neg logit contributions | |
companions | -15.471 |
unborn | -15.370 |
newfound | -15.231 |
grandchildren | -14.830 |
awakening | -14.655 |
Token |
|
Token ID | 198 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
libel | +4.031 |
offensive | +3.216 |
rubbish | +3.205 |
Serie | +3.073 |
advert | +3.035 |
Neg logit contributions | |
companions | -5.446 |
unborn | -5.411 |
newfound | -5.387 |
awakening | -5.282 |
caregivers | -5.273 |
Token | " |
Token ID | 1 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
libel | +13.800 |
offensive | +11.647 |
rubbish | +11.226 |
England | +11.046 |
Anyway | +10.937 |
Neg logit contributions | |
companions | -14.820 |
unborn | -14.742 |
newfound | -14.488 |
grandchildren | -14.404 |
caregivers | -14.214 |
Token | The |
Token ID | 464 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
England | +25.030 |
Anyway | +24.794 |
Football | +24.322 |
libel | +23.240 |
Basically | +23.059 |
Neg logit contributions | |
unborn | -26.459 |
companions | -25.802 |
newfound | -25.573 |
awakening | -25.082 |
caregivers | -25.045 |
Token | ICC |
Token ID | 32300 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
libel | +27.016 |
rubbish | +24.034 |
racket | +23.510 |
England | +23.314 |
cricket | +23.003 |
Neg logit contributions | |
companions | -12.083 |
newfound | -11.587 |
unborn | -11.530 |
grandchildren | -11.466 |
caregivers | -10.761 |
Token | has |
Token ID | 468 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
libel | +31.677 |
penal | +28.109 |
rubbish | +27.895 |
advert | +27.762 |
racket | +27.629 |
Neg logit contributions | |
newfound | -16.143 |
unborn | -16.134 |
companions | -16.107 |
grandchildren | -14.863 |
caregivers | -14.860 |
Token | a |
Token ID | 257 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
libel | +24.824 |
rubbish | +22.070 |
penal | +21.097 |
advert | +20.798 |
racket | +20.622 |
Neg logit contributions | |
companions | -13.362 |
unborn | -12.967 |
caregivers | -12.724 |
reetings | -12.702 |
newfound | -12.694 |
Token | rule |
Token ID | 3896 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
libel | +24.848 |
rubbish | +21.672 |
racket | +20.971 |
penal | +20.522 |
punt | +20.428 |
Neg logit contributions | |
companions | -13.405 |
unborn | -13.115 |
caregivers | -12.923 |
grandchildren | -12.512 |
occupants | -12.217 |
Token | Indies |
Token ID | 42556 |
Feature activation | -2.40e+00 |
Pos logit contributions | |
libel | +10.279 |
rubbish | +8.052 |
offensive | +7.631 |
England | +7.302 |
Serie | +7.212 |
Neg logit contributions | |
unborn | -16.427 |
newfound | -16.280 |
companions | -16.251 |
grandchildren | -15.946 |
awakening | -15.755 |
Token | in |
Token ID | 287 |
Feature activation | -3.24e+00 |
Pos logit contributions | |
libel | +27.678 |
England | +24.981 |
rubbish | +24.817 |
cricket | +23.933 |
offensive | +23.469 |
Neg logit contributions | |
newfound | -14.744 |
unborn | -14.691 |
companions | -14.265 |
caregivers | -13.950 |
grandchildren | -13.808 |
Token | a |
Token ID | 257 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
libel | +33.024 |
England | +30.817 |
Karachi | +29.235 |
Bangladesh | +28.836 |
rubbish | +28.778 |
Neg logit contributions | |
unborn | -16.029 |
grandchildren | -15.455 |
companions | -15.421 |
ollower | -15.087 |
newfound | -15.001 |
Token | Test |
Token ID | 6208 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
libel | +25.010 |
rubbish | +22.006 |
England | +21.060 |
punt | +20.939 |
Serie | +20.789 |
Neg logit contributions | |
unborn | -14.420 |
companions | -13.551 |
grandchildren | -13.430 |
caregivers | -13.350 |
newfound | -12.952 |
Token | match |
Token ID | 2872 |
Feature activation | -2.26e+00 |
Pos logit contributions | |
libel | +28.028 |
England | +25.351 |
cricket | +24.864 |
rubbish | +24.573 |
punt | +24.104 |
Neg logit contributions | |
unborn | -17.334 |
caregivers | -16.707 |
grandchildren | -16.565 |
companions | -16.339 |
newfound | -16.054 |
Token | in |
Token ID | 287 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
libel | +25.744 |
rubbish | +22.507 |
England | +22.060 |
offensive | +21.785 |
advert | +21.430 |
Neg logit contributions | |
companions | -16.223 |
unborn | -16.141 |
newfound | -15.991 |
grandchildren | -15.716 |
caregivers | -15.555 |
Token | Kingston |
Token ID | 34612 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
libel | +33.681 |
England | +32.144 |
Karachi | +30.509 |
Switzerland | +30.174 |
Bangladesh | +30.104 |
Neg logit contributions | |
unborn | -16.553 |
grandchildren | -16.236 |
companions | -16.154 |
ollower | -16.045 |
caregivers | -15.752 |
Token | in |
Token ID | 287 |
Feature activation | -3.29e+00 |
Pos logit contributions | |
libel | +27.173 |
England | +24.234 |
rubbish | +24.208 |
advert | +22.900 |
Switzerland | +22.790 |
Neg logit contributions | |
companions | -16.526 |
unborn | -16.179 |
grandchildren | -16.027 |
newfound | -15.859 |
caregivers | -15.793 |
Token | Jamaica |
Token ID | 31620 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
libel | +32.999 |
England | +31.144 |
Karachi | +29.232 |
Bangladesh | +29.085 |
Switzerland | +28.970 |
Neg logit contributions | |
unborn | -16.443 |
grandchildren | -15.607 |
ollower | -15.564 |
companions | -15.198 |
newfound | -15.131 |
Token | , |
Token ID | 11 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
libel | +24.654 |
rubbish | +21.448 |
England | +21.242 |
advert | +20.644 |
Switzerland | +20.355 |
Neg logit contributions | |
companions | -16.193 |
unborn | -15.753 |
newfound | -15.694 |
grandchildren | -15.548 |
caregivers | -15.436 |
Token | in |
Token ID | 287 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
libel | +22.023 |
rubbish | +19.314 |
England | +19.124 |
punt | +18.457 |
Switzerland | +18.432 |
Neg logit contributions | |
unborn | -12.585 |
companions | -12.566 |
newfound | -12.194 |
grandchildren | -11.966 |
caregivers | -11.901 |
Token | You |
Token ID | 921 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
England | +28.051 |
Anyway | +27.980 |
Bangladesh | +26.880 |
Fifa | +26.722 |
Football | +26.537 |
Neg logit contributions | |
newfound | -23.637 |
unborn | -22.690 |
companions | -22.326 |
awakening | -22.149 |
awakened | -21.185 |
Token | have |
Token ID | 423 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
libel | +24.341 |
rubbish | +21.452 |
punt | +20.866 |
analyse | +20.356 |
penal | +20.013 |
Neg logit contributions | |
newfound | -18.083 |
companions | -18.036 |
unborn | -17.327 |
awakening | -16.830 |
grandchildren | -16.667 |
Token | a |
Token ID | 257 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
libel | +27.829 |
rubbish | +25.182 |
England | +23.862 |
cricket | +23.681 |
racket | +23.624 |
Neg logit contributions | |
companions | -13.576 |
newfound | -13.337 |
reetings | -13.261 |
unborn | -13.081 |
ollower | -12.934 |
Token | technical |
Token ID | 6276 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
libel | +27.086 |
rubbish | +24.141 |
racket | +23.426 |
punt | +23.355 |
cricket | +23.219 |
Neg logit contributions | |
companions | -13.873 |
unborn | -13.511 |
reetings | -13.503 |
grandchildren | -13.402 |
attendees | -12.828 |
Token | fault |
Token ID | 8046 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
libel | +29.013 |
rubbish | +25.305 |
racket | +24.350 |
punt | +24.124 |
England | +23.992 |
Neg logit contributions | |
companions | -14.888 |
grandchildren | -14.664 |
newfound | -14.371 |
unborn | -14.195 |
reetings | -14.144 |
Token | in |
Token ID | 287 |
Feature activation | -3.47e+00 |
Pos logit contributions | |
libel | +20.388 |
rubbish | +17.626 |
offensive | +16.767 |
advert | +16.586 |
racket | +16.531 |
Neg logit contributions | |
companions | -15.263 |
newfound | -15.162 |
grandchildren | -14.911 |
unborn | -14.849 |
caregivers | -14.269 |
Token | your |
Token ID | 534 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
libel | +34.140 |
England | +31.991 |
cricket | +31.967 |
offensive | +30.759 |
Bangladesh | +30.599 |
Neg logit contributions | |
newfound | -15.217 |
companions | -15.164 |
ollower | -15.077 |
unborn | -14.420 |
reetings | -14.401 |
Token | action |
Token ID | 2223 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
libel | +22.339 |
rubbish | +19.916 |
racket | +19.564 |
offensive | +18.874 |
punt | +18.864 |
Neg logit contributions | |
companions | -12.715 |
newfound | -12.598 |
awakened | -12.297 |
unborn | -12.286 |
reetings | -12.123 |
Token | , |
Token ID | 11 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
libel | +18.265 |
rubbish | +15.762 |
offensive | +15.189 |
racket | +14.890 |
advert | +14.799 |
Neg logit contributions | |
newfound | -14.669 |
companions | -14.582 |
unborn | -14.472 |
grandchildren | -14.361 |
blessings | -13.921 |
Token | go |
Token ID | 467 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
libel | +27.294 |
rubbish | +24.696 |
punt | +23.333 |
England | +23.118 |
racket | +23.081 |
Neg logit contributions | |
newfound | -14.978 |
companions | -14.573 |
unborn | -14.562 |
reetings | -14.031 |
grandchildren | -13.852 |
Token | out |
Token ID | 503 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
libel | +24.255 |
rubbish | +22.030 |
punt | +20.510 |
advert | +20.472 |
offensive | +20.421 |
Neg logit contributions | |
newfound | -16.182 |
companions | -15.995 |
unborn | -15.677 |
grandchildren | -15.443 |
attendees | -14.690 |
Token | in |
Token ID | 287 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
libel | +22.081 |
rubbish | +19.314 |
advert | +18.288 |
bullshit | +17.819 |
penal | +17.758 |
Neg logit contributions | |
companions | -16.978 |
newfound | -16.717 |
grandchildren | -16.345 |
unborn | -16.265 |
caregivers | -15.953 |
Token | place |
Token ID | 1295 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
libel | +30.973 |
England | +28.848 |
cricket | +27.878 |
Switzerland | +27.345 |
vitro | +27.107 |
Neg logit contributions | |
reetings | -21.438 |
companions | -21.381 |
newfound | -21.137 |
grandchildren | -21.019 |
unborn | -20.866 |
Token | . |
Token ID | 13 |
Feature activation | -2.85e+00 |
Pos logit contributions | |
libel | +25.806 |
rubbish | +22.798 |
advert | +21.866 |
penal | +21.725 |
England | +21.319 |
Neg logit contributions | |
newfound | -18.034 |
companions | -17.921 |
grandchildren | -17.361 |
unborn | -17.176 |
reetings | -17.104 |
Token |
|
Token ID | 198 |
Feature activation | -8.09e-01 |
Pos logit contributions | |
libel | +25.423 |
England | +25.137 |
Anyway | +24.999 |
Switzerland | +24.280 |
Fifa | +24.215 |
Neg logit contributions | |
newfound | -20.401 |
companions | -20.055 |
unborn | -19.854 |
awakening | -19.473 |
caregivers | -18.640 |
Token |
|
Token ID | 198 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
libel | +6.801 |
offensive | +5.384 |
Anyway | +5.263 |
rubbish | +5.231 |
England | +5.088 |
Neg logit contributions | |
companions | -11.828 |
unborn | -11.792 |
newfound | -11.781 |
caregivers | -11.683 |
awakening | -11.646 |
Token | " |
Token ID | 1 |
Feature activation | -3.37e+00 |
Pos logit contributions | |
libel | +16.513 |
offensive | +13.976 |
England | +13.303 |
rubbish | +13.294 |
Anyway | +13.051 |
Neg logit contributions | |
companions | -18.981 |
unborn | -18.631 |
newfound | -18.478 |
grandchildren | -18.311 |
caregivers | -18.294 |
Token | What |
Token ID | 2061 |
Feature activation | -2.57e+00 |
Pos logit contributions | |
Anyway | +24.352 |
England | +23.908 |
Football | +22.821 |
libel | +22.399 |
Basically | +21.905 |
Neg logit contributions | |
unborn | -26.339 |
newfound | -25.694 |
awakening | -25.671 |
companions | -25.620 |
caregivers | -25.022 |
Token | I |
Token ID | 314 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
libel | +29.743 |
rubbish | +26.708 |
England | +25.992 |
cricket | +25.787 |
Switzerland | +25.347 |
Neg logit contributions | |
companions | -14.917 |
newfound | -14.321 |
unborn | -14.226 |
reetings | -13.800 |
grandchildren | -13.478 |
Token | am |
Token ID | 716 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
libel | +21.448 |
rubbish | +18.808 |
advert | +17.453 |
punt | +17.412 |
analyse | +17.342 |
Neg logit contributions | |
newfound | -16.369 |
companions | -16.259 |
unborn | -16.077 |
awakening | -15.527 |
grandchildren | -15.526 |
Token | really |
Token ID | 1107 |
Feature activation | -8.73e-01 |
Pos logit contributions | |
libel | +14.002 |
rubbish | +12.167 |
offensive | +11.405 |
advert | +11.386 |
Serie | +11.198 |
Neg logit contributions | |
companions | -10.039 |
newfound | -9.947 |
unborn | -9.816 |
grandchildren | -9.682 |
blessings | -9.446 |
Token | glad |
Token ID | 9675 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
libel | +13.171 |
rubbish | +11.681 |
offensive | +10.990 |
advert | +10.923 |
punt | +10.762 |
Neg logit contributions | |
companions | -7.589 |
newfound | -7.479 |
unborn | -7.414 |
grandchildren | -7.254 |
caregivers | -6.994 |
Token | in |
Token ID | 287 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
libel | +25.744 |
rubbish | +22.507 |
England | +22.060 |
offensive | +21.785 |
advert | +21.430 |
Neg logit contributions | |
companions | -16.223 |
unborn | -16.141 |
newfound | -15.991 |
grandchildren | -15.716 |
caregivers | -15.555 |
Token | Kingston |
Token ID | 34612 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
libel | +33.681 |
England | +32.144 |
Karachi | +30.509 |
Switzerland | +30.174 |
Bangladesh | +30.104 |
Neg logit contributions | |
unborn | -16.553 |
grandchildren | -16.236 |
companions | -16.154 |
ollower | -16.045 |
caregivers | -15.752 |
Token | in |
Token ID | 287 |
Feature activation | -3.29e+00 |
Pos logit contributions | |
libel | +27.173 |
England | +24.234 |
rubbish | +24.208 |
advert | +22.900 |
Switzerland | +22.790 |
Neg logit contributions | |
companions | -16.526 |
unborn | -16.179 |
grandchildren | -16.027 |
newfound | -15.859 |
caregivers | -15.793 |
Token | Jamaica |
Token ID | 31620 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
libel | +32.999 |
England | +31.144 |
Karachi | +29.232 |
Bangladesh | +29.085 |
Switzerland | +28.970 |
Neg logit contributions | |
unborn | -16.443 |
grandchildren | -15.607 |
ollower | -15.564 |
companions | -15.198 |
newfound | -15.131 |
Token | , |
Token ID | 11 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
libel | +24.654 |
rubbish | +21.448 |
England | +21.242 |
advert | +20.644 |
Switzerland | +20.355 |
Neg logit contributions | |
companions | -16.193 |
unborn | -15.753 |
newfound | -15.694 |
grandchildren | -15.548 |
caregivers | -15.436 |
Token | in |
Token ID | 287 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
libel | +22.023 |
rubbish | +19.314 |
England | +19.124 |
punt | +18.457 |
Switzerland | +18.432 |
Neg logit contributions | |
unborn | -12.585 |
companions | -12.566 |
newfound | -12.194 |
grandchildren | -11.966 |
caregivers | -11.901 |
Token | 2006 |
Token ID | 4793 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
libel | +34.151 |
England | +31.943 |
rubbish | +30.235 |
offensive | +30.170 |
Karachi | +29.931 |
Neg logit contributions | |
unborn | -15.530 |
grandchildren | -14.780 |
caregivers | -14.664 |
companions | -14.397 |
newfound | -14.387 |
Token | . |
Token ID | 13 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
libel | +26.088 |
England | +22.677 |
rubbish | +22.506 |
cricket | +21.634 |
advert | +21.608 |
Neg logit contributions | |
unborn | -16.181 |
newfound | -15.841 |
companions | -15.782 |
caregivers | -15.669 |
grandchildren | -15.414 |
Token | The |
Token ID | 383 |
Feature activation | -9.87e-01 |
Pos logit contributions | |
England | +21.708 |
libel | +21.386 |
Anyway | +21.208 |
Switzerland | +20.277 |
Jama | +20.276 |
Neg logit contributions | |
newfound | -19.946 |
unborn | -19.936 |
companions | -19.780 |
awakening | -19.304 |
caregivers | -19.270 |
Token | series |
Token ID | 2168 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
libel | +15.018 |
rubbish | +13.111 |
offensive | +12.581 |
advert | +12.477 |
England | +12.449 |
Neg logit contributions | |
unborn | -8.057 |
companions | -8.002 |
newfound | -7.837 |
grandchildren | -7.645 |
caregivers | -7.527 |
Token | was |
Token ID | 373 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
libel | +14.820 |
rubbish | +12.829 |
offensive | +12.320 |
punt | +12.065 |
advert | +12.005 |
Neg logit contributions | |
unborn | -10.618 |
companions | -10.410 |
newfound | -10.227 |
grandchildren | -10.036 |
caregivers | -9.890 |
Token | a |
Token ID | 257 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
libel | +33.024 |
England | +30.817 |
Karachi | +29.235 |
Bangladesh | +28.836 |
rubbish | +28.778 |
Neg logit contributions | |
unborn | -16.029 |
grandchildren | -15.455 |
companions | -15.421 |
ollower | -15.087 |
newfound | -15.001 |
Token | Test |
Token ID | 6208 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
libel | +25.010 |
rubbish | +22.006 |
England | +21.060 |
punt | +20.939 |
Serie | +20.789 |
Neg logit contributions | |
unborn | -14.420 |
companions | -13.551 |
grandchildren | -13.430 |
caregivers | -13.350 |
newfound | -12.952 |
Token | match |
Token ID | 2872 |
Feature activation | -2.26e+00 |
Pos logit contributions | |
libel | +28.028 |
England | +25.351 |
cricket | +24.864 |
rubbish | +24.573 |
punt | +24.104 |
Neg logit contributions | |
unborn | -17.334 |
caregivers | -16.707 |
grandchildren | -16.565 |
companions | -16.339 |
newfound | -16.054 |
Token | in |
Token ID | 287 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
libel | +25.744 |
rubbish | +22.507 |
England | +22.060 |
offensive | +21.785 |
advert | +21.430 |
Neg logit contributions | |
companions | -16.223 |
unborn | -16.141 |
newfound | -15.991 |
grandchildren | -15.716 |
caregivers | -15.555 |
Token | Kingston |
Token ID | 34612 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
libel | +33.681 |
England | +32.144 |
Karachi | +30.509 |
Switzerland | +30.174 |
Bangladesh | +30.104 |
Neg logit contributions | |
unborn | -16.553 |
grandchildren | -16.236 |
companions | -16.154 |
ollower | -16.045 |
caregivers | -15.752 |
Token | in |
Token ID | 287 |
Feature activation | -3.29e+00 |
Pos logit contributions | |
libel | +27.173 |
England | +24.234 |
rubbish | +24.208 |
advert | +22.900 |
Switzerland | +22.790 |
Neg logit contributions | |
companions | -16.526 |
unborn | -16.179 |
grandchildren | -16.027 |
newfound | -15.859 |
caregivers | -15.793 |
Token | Jamaica |
Token ID | 31620 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
libel | +32.999 |
England | +31.144 |
Karachi | +29.232 |
Bangladesh | +29.085 |
Switzerland | +28.970 |
Neg logit contributions | |
unborn | -16.443 |
grandchildren | -15.607 |
ollower | -15.564 |
companions | -15.198 |
newfound | -15.131 |
Token | , |
Token ID | 11 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
libel | +24.654 |
rubbish | +21.448 |
England | +21.242 |
advert | +20.644 |
Switzerland | +20.355 |
Neg logit contributions | |
companions | -16.193 |
unborn | -15.753 |
newfound | -15.694 |
grandchildren | -15.548 |
caregivers | -15.436 |
Token | in |
Token ID | 287 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
libel | +22.023 |
rubbish | +19.314 |
England | +19.124 |
punt | +18.457 |
Switzerland | +18.432 |
Neg logit contributions | |
unborn | -12.585 |
companions | -12.566 |
newfound | -12.194 |
grandchildren | -11.966 |
caregivers | -11.901 |
Token | 2006 |
Token ID | 4793 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
libel | +34.151 |
England | +31.943 |
rubbish | +30.235 |
offensive | +30.170 |
Karachi | +29.931 |
Neg logit contributions | |
unborn | -15.530 |
grandchildren | -14.780 |
caregivers | -14.664 |
companions | -14.397 |
newfound | -14.387 |
Token | . |
Token ID | 13 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
libel | +26.088 |
England | +22.677 |
rubbish | +22.506 |
cricket | +21.634 |
advert | +21.608 |
Neg logit contributions | |
unborn | -16.181 |
newfound | -15.841 |
companions | -15.782 |
caregivers | -15.669 |
grandchildren | -15.414 |
Token | industry |
Token ID | 2831 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
libel | +28.829 |
racket | +25.314 |
rubbish | +25.136 |
Switzerland | +24.760 |
Brussels | +24.438 |
Neg logit contributions | |
unborn | -15.503 |
grandchildren | -14.497 |
newfound | -14.343 |
companions | -14.320 |
awakened | -13.988 |
Token | had |
Token ID | 550 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
libel | +25.533 |
rubbish | +22.080 |
advert | +21.852 |
Switzerland | +21.617 |
racket | +21.465 |
Neg logit contributions | |
unborn | -16.583 |
newfound | -16.507 |
companions | -15.749 |
awakening | -15.579 |
reetings | -15.513 |
Token | been |
Token ID | 587 |
Feature activation | -2.54e+00 |
Pos logit contributions | |
libel | +23.126 |
rubbish | +20.060 |
advert | +19.322 |
penal | +19.185 |
racket | +19.132 |
Neg logit contributions | |
unborn | -15.127 |
companions | -14.899 |
newfound | -14.758 |
awakening | -14.472 |
grandchildren | -14.425 |
Token | caught |
Token ID | 4978 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
libel | +27.543 |
penal | +25.148 |
rubbish | +24.194 |
fined | +23.527 |
Brussels | +23.099 |
Neg logit contributions | |
unborn | -17.107 |
companions | -17.043 |
grandchildren | -16.838 |
newfound | -16.749 |
reetings | -16.284 |
Token | engaging |
Token ID | 11932 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
libel | +26.586 |
rubbish | +23.167 |
racket | +22.286 |
advert | +22.186 |
illegally | +22.042 |
Neg logit contributions | |
newfound | -17.241 |
grandchildren | -17.108 |
unborn | -16.929 |
companions | -16.519 |
caregivers | -16.476 |
Token | in |
Token ID | 287 |
Feature activation | -3.29e+00 |
Pos logit contributions | |
libel | +26.171 |
rubbish | +22.892 |
advert | +22.248 |
Switzerland | +22.222 |
Brussels | +22.160 |
Neg logit contributions | |
unborn | -16.477 |
awakening | -16.222 |
newfound | -15.790 |
awakened | -15.695 |
companions | -15.670 |
Token | price |
Token ID | 2756 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
libel | +33.189 |
racket | +29.507 |
rubbish | +29.140 |
advert | +27.996 |
Switzerland | +27.712 |
Neg logit contributions | |
unborn | -17.993 |
reetings | -17.609 |
grandchildren | -17.038 |
companions | -16.895 |
ollower | -16.835 |
Token | - |
Token ID | 12 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
libel | +23.739 |
rubbish | +20.252 |
advert | +19.264 |
racket | +19.151 |
counterfe | +18.897 |
Neg logit contributions | |
unborn | -15.940 |
newfound | -15.542 |
grandchildren | -15.126 |
companions | -14.997 |
caregivers | -14.740 |
Token | fix |
Token ID | 13049 |
Feature activation | -9.69e-01 |
Pos logit contributions | |
libel | +17.314 |
offensive | +14.570 |
rubbish | +14.236 |
football | +13.350 |
pub | +13.224 |
Neg logit contributions | |
unborn | -17.956 |
companions | -17.719 |
grandchildren | -17.558 |
newfound | -17.409 |
caregivers | -17.099 |
Token | ing |
Token ID | 278 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
libel | +7.666 |
rubbish | +5.850 |
offensive | +5.509 |
advert | +5.079 |
vitro | +5.034 |
Neg logit contributions | |
unborn | -15.169 |
companions | -15.137 |
newfound | -14.949 |
grandchildren | -14.865 |
caregivers | -14.639 |
Token | . |
Token ID | 13 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
libel | +28.343 |
rubbish | +24.987 |
racket | +24.844 |
advert | +23.877 |
Switzerland | +23.722 |
Neg logit contributions | |
unborn | -18.544 |
reetings | -18.134 |
newfound | -17.599 |
companions | -17.595 |
ollower | -17.136 |
Token | , |
Token ID | 11 |
Feature activation | -3.84e-01 |
Pos logit contributions | |
libel | +7.572 |
rubbish | +6.236 |
offensive | +6.044 |
advert | +5.795 |
Serie | +5.771 |
Neg logit contributions | |
companions | -8.289 |
unborn | -8.198 |
newfound | -8.188 |
grandchildren | -8.046 |
caregivers | -7.825 |
Token | it |
Token ID | 340 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
libel | +4.936 |
rubbish | +4.091 |
offensive | +3.993 |
advert | +3.834 |
Serie | +3.819 |
Neg logit contributions | |
companions | -4.673 |
unborn | -4.581 |
newfound | -4.578 |
grandchildren | -4.514 |
caregivers | -4.379 |
Token | 's |
Token ID | 338 |
Feature activation | -3.93e-01 |
Pos logit contributions | |
libel | +11.735 |
rubbish | +9.774 |
offensive | +9.331 |
advert | +9.318 |
punt | +9.023 |
Neg logit contributions | |
unborn | -12.448 |
companions | -12.445 |
grandchildren | -12.327 |
newfound | -12.296 |
caregivers | -11.826 |
Token | different |
Token ID | 1180 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
libel | +5.247 |
rubbish | +4.413 |
offensive | +4.281 |
advert | +4.126 |
Serie | +4.118 |
Neg logit contributions | |
companions | -4.530 |
unborn | -4.458 |
newfound | -4.424 |
grandchildren | -4.377 |
caregivers | -4.246 |
Token | than |
Token ID | 621 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
libel | +16.396 |
rubbish | +14.021 |
offensive | +13.296 |
Serie | +13.285 |
Switzerland | +13.224 |
Neg logit contributions | |
unborn | -13.934 |
newfound | -13.716 |
companions | -13.662 |
grandchildren | -13.431 |
caregivers | -13.211 |
Token | in |
Token ID | 287 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
libel | +28.403 |
Switzerland | +26.250 |
England | +25.690 |
rubbish | +25.415 |
Serie | +25.206 |
Neg logit contributions | |
unborn | -15.142 |
companions | -14.566 |
newfound | -14.190 |
grandchildren | -13.977 |
caregivers | -13.616 |
Token | Sweden |
Token ID | 10710 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
libel | +32.406 |
Switzerland | +31.073 |
England | +30.515 |
Brussels | +29.051 |
Serie | +28.972 |
Neg logit contributions | |
unborn | -16.148 |
newfound | -15.330 |
companions | -15.286 |
grandchildren | -15.264 |
blessings | -15.082 |
Token | ." |
Token ID | 526 |
Feature activation | +5.77e-02 |
Pos logit contributions | |
libel | +19.873 |
rubbish | +17.146 |
Switzerland | +16.272 |
offensive | +16.243 |
England | +16.049 |
Neg logit contributions | |
companions | -16.895 |
newfound | -16.749 |
unborn | -16.653 |
grandchildren | -16.214 |
caregivers | -15.880 |
Token |
|
Token ID | 198 |
Feature activation | +7.68e-02 |
Pos logit contributions | |
companions | +0.662 |
unborn | +0.650 |
newfound | +0.647 |
grandchildren | +0.641 |
blessings | +0.620 |
Neg logit contributions | |
libel | -0.781 |
rubbish | -0.653 |
offensive | -0.634 |
advert | -0.616 |
vitro | -0.614 |
Token |
|
Token ID | 198 |
Feature activation | -4.44e-01 |
Pos logit contributions | |
companions | +0.972 |
unborn | +0.956 |
newfound | +0.955 |
grandchildren | +0.939 |
caregivers | +0.918 |
Neg logit contributions | |
libel | -0.951 |
rubbish | -0.782 |
offensive | -0.768 |
advert | -0.733 |
Serie | -0.732 |
Token | He |
Token ID | 1544 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
libel | +5.331 |
rubbish | +4.354 |
offensive | +4.288 |
Serie | +4.061 |
advert | +4.053 |
Neg logit contributions | |
companions | -5.745 |
unborn | -5.647 |
newfound | -5.628 |
grandchildren | -5.562 |
caregivers | -5.418 |
Token | should |
Token ID | 815 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
libel | +23.037 |
rubbish | +20.165 |
punt | +19.446 |
penal | +18.924 |
England | +18.762 |
Neg logit contributions | |
companions | -17.283 |
newfound | -17.203 |
unborn | -17.025 |
awakening | -16.129 |
grandchildren | -16.124 |
Token | see |
Token ID | 766 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
libel | +30.938 |
rubbish | +28.148 |
penal | +27.941 |
punt | +27.730 |
analyse | +27.097 |
Neg logit contributions | |
newfound | -18.810 |
unborn | -18.175 |
companions | -18.052 |
awakening | -17.237 |
caregivers | -17.218 |
Token | ch |
Token ID | 442 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
libel | +33.205 |
rubbish | +29.824 |
England | +29.683 |
cricket | +29.593 |
racket | +28.851 |
Neg logit contributions | |
companions | -13.306 |
ollower | -13.286 |
newfound | -13.247 |
unborn | -13.141 |
reetings | -13.012 |
Token | ucking |
Token ID | 19296 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
libel | +5.165 |
rubbish | +4.075 |
offensive | +3.937 |
advert | +3.700 |
punt | +3.670 |
Neg logit contributions | |
companions | -7.735 |
unborn | -7.610 |
newfound | -7.606 |
grandchildren | -7.502 |
caregivers | -7.339 |
Token | as |
Token ID | 355 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
libel | +34.369 |
cricket | +32.301 |
rubbish | +31.992 |
racket | +31.351 |
penal | +31.173 |
Neg logit contributions | |
ollower | -15.977 |
companions | -15.143 |
unborn | -14.570 |
newfound | -14.484 |
caregivers | -14.453 |
Token | a |
Token ID | 257 |
Feature activation | -3.27e+00 |
Pos logit contributions | |
libel | +35.062 |
rubbish | +32.132 |
racket | +31.160 |
penal | +31.017 |
cricket | +30.909 |
Neg logit contributions | |
ollower | -17.233 |
reetings | -17.214 |
companions | -16.973 |
unborn | -16.895 |
grandchildren | -16.571 |
Token | crime |
Token ID | 4065 |
Feature activation | -3.05e+00 |
Pos logit contributions | |
libel | +33.695 |
penal | +30.030 |
rubbish | +29.751 |
racket | +29.609 |
cricket | +29.527 |
Neg logit contributions | |
reetings | -17.475 |
ollower | -16.526 |
companions | -16.477 |
unborn | -16.324 |
grandchildren | -16.322 |
Token | . |
Token ID | 13 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
libel | +30.018 |
rubbish | +26.093 |
racket | +25.950 |
penal | +24.894 |
advert | +24.839 |
Neg logit contributions | |
companions | -18.335 |
newfound | -18.127 |
grandchildren | -18.044 |
unborn | -18.023 |
caregivers | -17.739 |
Token | I |
Token ID | 314 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
England | +27.919 |
Anyway | +27.254 |
Bangladesh | +26.916 |
libel | +26.716 |
Fifa | +26.515 |
Neg logit contributions | |
newfound | -23.061 |
unborn | -22.458 |
companions | -21.953 |
awakening | -21.903 |
awakened | -20.941 |
Token | think |
Token ID | 892 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
libel | +26.789 |
rubbish | +23.367 |
punt | +23.033 |
analyse | +22.666 |
penal | +22.541 |
Neg logit contributions | |
newfound | -20.776 |
companions | -20.481 |
awakening | -20.192 |
unborn | -19.968 |
occupants | -19.333 |
Token | it |
Token ID | 340 |
Feature activation | -2.54e+00 |
Pos logit contributions | |
libel | +30.328 |
rubbish | +26.994 |
cricket | +26.557 |
England | +26.330 |
racket | +25.941 |
Neg logit contributions | |
newfound | -14.889 |
companions | -14.633 |
unborn | -14.506 |
reetings | -14.092 |
ollower | -13.778 |
Token | them |
Token ID | 606 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
libel | +24.160 |
rubbish | +21.356 |
England | +20.560 |
Serie | +20.474 |
offensive | +20.407 |
Neg logit contributions | |
unborn | -10.694 |
companions | -10.425 |
newfound | -10.141 |
caregivers | -9.912 |
grandchildren | -9.844 |
Token | the |
Token ID | 262 |
Feature activation | -4.51e-01 |
Pos logit contributions | |
libel | +20.567 |
rubbish | +18.167 |
offensive | +17.277 |
Serie | +17.237 |
advert | +17.218 |
Neg logit contributions | |
unborn | -10.299 |
companions | -10.159 |
newfound | -9.708 |
caregivers | -9.659 |
grandchildren | -9.483 |
Token | benefit |
Token ID | 4414 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
libel | +7.076 |
rubbish | +6.094 |
offensive | +5.958 |
advert | +5.790 |
Serie | +5.773 |
Neg logit contributions | |
companions | -4.169 |
unborn | -4.065 |
newfound | -4.052 |
grandchildren | -3.973 |
caregivers | -3.832 |
Token | of |
Token ID | 286 |
Feature activation | -8.96e-01 |
Pos logit contributions | |
libel | +17.503 |
rubbish | +14.350 |
advert | +13.658 |
offensive | +13.593 |
vitro | +13.326 |
Neg logit contributions | |
companions | -16.728 |
newfound | -16.654 |
unborn | -16.564 |
grandchildren | -16.430 |
awakening | -15.990 |
Token | doubt |
Token ID | 4719 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
libel | +10.276 |
rubbish | +8.344 |
offensive | +8.090 |
advert | +7.834 |
Serie | +7.753 |
Neg logit contributions | |
companions | -11.547 |
unborn | -11.429 |
newfound | -11.329 |
grandchildren | -11.236 |
caregivers | -10.952 |
Token | . |
Token ID | 13 |
Feature activation | -3.27e+00 |
Pos logit contributions | |
libel | +20.483 |
rubbish | +17.726 |
advert | +16.240 |
offensive | +16.239 |
punt | +16.063 |
Neg logit contributions | |
companions | -15.342 |
newfound | -15.304 |
unborn | -15.212 |
caregivers | -14.669 |
grandchildren | -14.641 |
Token | The |
Token ID | 383 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
England | +26.191 |
Anyway | +25.899 |
libel | +25.630 |
Switzerland | +25.032 |
Fifa | +24.946 |
Neg logit contributions | |
newfound | -22.936 |
unborn | -22.468 |
companions | -22.069 |
awakening | -21.979 |
caregivers | -20.901 |
Token | ICC |
Token ID | 32300 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
libel | +23.739 |
rubbish | +20.849 |
racket | +19.987 |
England | +19.985 |
Serie | +19.869 |
Neg logit contributions | |
companions | -11.123 |
newfound | -10.777 |
unborn | -10.712 |
grandchildren | -10.315 |
awakened | -10.153 |
Token | is |
Token ID | 318 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
libel | +30.490 |
rubbish | +27.178 |
penal | +26.886 |
advert | +26.865 |
England | +26.718 |
Neg logit contributions | |
unborn | -15.876 |
newfound | -15.752 |
companions | -15.669 |
caregivers | -14.613 |
grandchildren | -14.449 |
Token | being |
Token ID | 852 |
Feature activation | -2.16e+00 |
Pos logit contributions | |
libel | +25.399 |
rubbish | +23.285 |
penal | +21.704 |
Serie | +21.364 |
England | +21.340 |
Neg logit contributions | |
companions | -13.250 |
newfound | -12.862 |
unborn | -12.808 |
grandchildren | -12.496 |
caregivers | -12.147 |
Token | more |
Token ID | 517 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
libel | +27.720 |
rubbish | +25.019 |
penal | +23.574 |
advert | +22.997 |
bullshit | +22.800 |
Neg logit contributions | |
newfound | -13.791 |
unborn | -13.718 |
companions | -13.715 |
grandchildren | -13.561 |
reetings | -13.354 |
Token | the |
Token ID | 262 |
Feature activation | +7.60e-01 |
Pos logit contributions | |
libel | +0.542 |
rubbish | +0.434 |
offensive | +0.424 |
vitro | +0.403 |
Serie | +0.401 |
Neg logit contributions | |
companions | -0.648 |
newfound | -0.639 |
unborn | -0.626 |
grandchildren | -0.622 |
awakening | -0.621 |
Token | course |
Token ID | 1781 |
Feature activation | +8.91e-01 |
Pos logit contributions | |
companions | +9.398 |
newfound | +9.298 |
awakening | +9.170 |
grandchildren | +9.112 |
arrival | +9.103 |
Neg logit contributions | |
libel | -8.299 |
offensive | -6.736 |
rubbish | -6.656 |
vitro | -6.501 |
ograph | -6.391 |
Token | of |
Token ID | 286 |
Feature activation | +9.22e-01 |
Pos logit contributions | |
companions | +11.040 |
newfound | +10.649 |
unborn | +10.619 |
survivors | +10.583 |
grandchildren | +10.559 |
Neg logit contributions | |
libel | -9.897 |
rubbish | -8.202 |
offensive | -7.901 |
Serie | -7.728 |
vitro | -7.573 |
Token | the |
Token ID | 262 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
companions | +11.051 |
newfound | +10.748 |
enduring | +10.689 |
awakening | +10.661 |
survivors | +10.583 |
Neg logit contributions | |
libel | -10.025 |
rubbish | -8.005 |
offensive | -7.972 |
vitro | -7.699 |
Anyway | -7.580 |
Token | game |
Token ID | 983 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
companions | +12.532 |
newfound | +12.317 |
survivors | +12.160 |
enduring | +11.996 |
awakening | +11.995 |
Neg logit contributions | |
libel | -10.765 |
rubbish | -8.621 |
offensive | -8.590 |
vitro | -8.339 |
Anyway | -8.134 |
Token | , |
Token ID | 11 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
survivors | +17.577 |
companions | +17.145 |
attendees | +16.781 |
caregivers | +16.472 |
enduring | +16.415 |
Neg logit contributions | |
libel | -17.073 |
rubbish | -13.803 |
offensive | -13.216 |
Anyway | -13.194 |
redit | -13.078 |
Token | players |
Token ID | 1938 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
survivors | +18.652 |
companions | +18.497 |
newfound | +17.715 |
attendees | +17.543 |
followers | +17.395 |
Neg logit contributions | |
libel | -15.794 |
offensive | -12.353 |
vitro | -12.228 |
rubbish | -12.169 |
redit | -12.025 |
Token | must |
Token ID | 1276 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
companions | +16.095 |
survivors | +15.571 |
awakened | +15.521 |
unborn | +15.512 |
newfound | +15.476 |
Neg logit contributions | |
libel | -14.023 |
offensive | -12.129 |
rubbish | -11.508 |
Anyway | -11.364 |
vitro | -11.343 |
Token | explore |
Token ID | 7301 |
Feature activation | +6.76e-01 |
Pos logit contributions | |
companions | +13.325 |
newfound | +12.694 |
survivors | +12.663 |
unborn | +12.509 |
enduring | +12.450 |
Neg logit contributions | |
libel | -11.631 |
offensive | -10.044 |
Serie | -9.453 |
rubbish | -9.314 |
vitro | -9.293 |
Token | the |
Token ID | 262 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
newfound | +8.312 |
companions | +8.242 |
enduring | +7.974 |
survivors | +7.951 |
unborn | +7.925 |
Neg logit contributions | |
libel | -7.786 |
offensive | -6.214 |
rubbish | -6.187 |
vitro | -5.998 |
advert | -5.930 |
Token | ever |
Token ID | 1683 |
Feature activation | +7.74e-01 |
Pos logit contributions | |
newfound | +17.458 |
companions | +17.143 |
survivors | +16.838 |
enduring | +16.832 |
remaining | +16.688 |
Neg logit contributions | |
libel | -13.489 |
offensive | -10.815 |
England | -10.200 |
vitro | -10.200 |
ograph | -10.167 |
Token | count |
Token ID | 954 |
Feature activation | +6.09e-01 |
Pos logit contributions | |
libel | +2.241 |
rubbish | +1.839 |
offensive | +1.810 |
Serie | +1.728 |
advert | +1.724 |
Neg logit contributions | |
companions | -2.306 |
newfound | -2.278 |
unborn | -2.264 |
grandchildren | -2.222 |
awakening | -2.165 |
Token | , |
Token ID | 11 |
Feature activation | +6.42e-01 |
Pos logit contributions | |
companions | +5.847 |
unborn | +5.756 |
newfound | +5.661 |
blessings | +5.567 |
caregivers | +5.542 |
Neg logit contributions | |
libel | -8.562 |
rubbish | -7.283 |
offensive | -7.173 |
punt | -6.936 |
Serie | -6.895 |
Token | Good |
Token ID | 4599 |
Feature activation | +8.28e-01 |
Pos logit contributions | |
companions | +8.111 |
unborn | +7.952 |
newfound | +7.854 |
caregivers | +7.813 |
grandchildren | +7.804 |
Neg logit contributions | |
libel | -7.061 |
offensive | -5.891 |
rubbish | -5.644 |
Serie | -5.429 |
ograph | -5.391 |
Token | will |
Token ID | 10594 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
companions | +5.487 |
grandchildren | +5.216 |
newfound | +5.178 |
unborn | +5.144 |
blessings | +5.001 |
Neg logit contributions | |
libel | -14.165 |
rubbish | -12.417 |
offensive | -12.214 |
Serie | -12.150 |
punt | -11.997 |
Token | ie |
Token ID | 494 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
libel | +3.069 |
rubbish | +2.542 |
offensive | +2.491 |
Serie | +2.376 |
vitro | +2.371 |
Neg logit contributions | |
companions | -2.911 |
newfound | -2.852 |
unborn | -2.844 |
grandchildren | -2.812 |
caregivers | -2.741 |
Token | said |
Token ID | 531 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
companions | +1.718 |
newfound | +1.673 |
unborn | +1.664 |
grandchildren | +1.663 |
caregivers | +1.637 |
Neg logit contributions | |
libel | -1.619 |
rubbish | -1.326 |
offensive | -1.296 |
vitro | -1.232 |
Serie | -1.228 |
Token | he |
Token ID | 339 |
Feature activation | +1.28e-01 |
Pos logit contributions | |
unborn | +17.314 |
companions | +17.236 |
caregivers | +17.090 |
newfound | +16.979 |
grandchildren | +16.966 |
Neg logit contributions | |
libel | -14.968 |
offensive | -12.112 |
ictionary | -12.011 |
Anyway | -11.930 |
rubbish | -11.805 |
Token | � |
Token ID | 447 |
Feature activation | -8.03e-01 |
Pos logit contributions | |
companions | +1.603 |
newfound | +1.577 |
unborn | +1.574 |
grandchildren | +1.559 |
awakened | +1.522 |
Neg logit contributions | |
libel | -1.572 |
rubbish | -1.292 |
offensive | -1.273 |
Serie | -1.220 |
vitro | -1.195 |
Token | � |
Token ID | 247 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
libel | +7.465 |
offensive | +5.499 |
rubbish | +5.478 |
punt | +5.212 |
vitro | +5.211 |
Neg logit contributions | |
companions | -11.822 |
unborn | -11.670 |
newfound | -11.572 |
grandchildren | -11.257 |
awakening | -11.246 |
Token | d |
Token ID | 67 |
Feature activation | +4.01e-01 |
Pos logit contributions | |
companions | +2.847 |
grandchildren | +2.782 |
newfound | +2.776 |
unborn | +2.772 |
survivors | +2.685 |
Neg logit contributions | |
libel | -2.754 |
rubbish | -2.277 |
offensive | -2.187 |
Serie | -2.089 |
punt | -2.063 |
Token | be |
Token ID | 307 |
Feature activation | +1.46e-01 |
Pos logit contributions | |
companions | +4.857 |
unborn | +4.756 |
newfound | +4.736 |
grandchildren | +4.723 |
enduring | +4.569 |
Neg logit contributions | |
libel | -4.923 |
rubbish | -4.018 |
offensive | -3.981 |
Serie | -3.913 |
tabloid | -3.741 |
Token |
|
Token ID | 198 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
companions | +0.324 |
unborn | +0.319 |
newfound | +0.319 |
grandchildren | +0.313 |
caregivers | +0.307 |
Neg logit contributions | |
libel | -0.304 |
rubbish | -0.249 |
offensive | -0.245 |
Serie | -0.234 |
advert | -0.234 |
Token | Thank |
Token ID | 10449 |
Feature activation | +4.63e-01 |
Pos logit contributions | |
libel | +3.635 |
rubbish | +2.941 |
offensive | +2.851 |
advert | +2.735 |
Serie | +2.714 |
Neg logit contributions | |
companions | -4.236 |
newfound | -4.159 |
unborn | -4.154 |
grandchildren | -4.102 |
awakening | -3.993 |
Token | you |
Token ID | 345 |
Feature activation | +8.01e-01 |
Pos logit contributions | |
companions | +4.284 |
newfound | +4.114 |
blessings | +4.091 |
unborn | +4.077 |
grandchildren | +3.949 |
Neg logit contributions | |
libel | -6.909 |
offensive | -5.866 |
rubbish | -5.791 |
vitro | -5.737 |
advert | -5.644 |
Token | everyone |
Token ID | 2506 |
Feature activation | +9.24e-01 |
Pos logit contributions | |
companions | +9.713 |
newfound | +9.379 |
unborn | +9.290 |
blessings | +9.202 |
grandchildren | +9.193 |
Neg logit contributions | |
libel | -8.806 |
offensive | -7.418 |
rubbish | -7.053 |
vitro | -7.006 |
advert | -6.929 |
Token | again |
Token ID | 757 |
Feature activation | +8.67e-01 |
Pos logit contributions | |
companions | +10.758 |
newfound | +10.571 |
unborn | +10.436 |
awakening | +10.279 |
blessings | +10.198 |
Neg logit contributions | |
libel | -9.970 |
offensive | -8.521 |
vitro | -8.083 |
rubbish | -8.013 |
advert | -7.871 |
Token | for |
Token ID | 329 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
companions | +10.332 |
newfound | +9.956 |
unborn | +9.893 |
survivors | +9.854 |
blessings | +9.778 |
Neg logit contributions | |
libel | -9.454 |
offensive | -7.995 |
rubbish | -7.618 |
vitro | -7.576 |
advert | -7.556 |
Token | the |
Token ID | 262 |
Feature activation | +1.72e+00 |
Pos logit contributions | |
awakening | +17.679 |
enduring | +17.581 |
companions | +17.329 |
newfound | +17.243 |
remaining | +17.242 |
Neg logit contributions | |
libel | -15.687 |
ictionary | -13.012 |
ograph | -12.976 |
offensive | -12.896 |
vitro | -12.836 |
Token | love |
Token ID | 1842 |
Feature activation | +8.69e-01 |
Pos logit contributions | |
companions | +19.071 |
newfound | +19.051 |
blessings | +18.974 |
awakening | +18.491 |
enduring | +18.347 |
Neg logit contributions | |
libel | -14.606 |
vitro | -12.045 |
offensive | -11.841 |
ictionary | -11.574 |
ograph | -11.521 |
Token | and |
Token ID | 290 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
companions | +9.394 |
unborn | +9.350 |
newfound | +9.195 |
blessings | +9.131 |
awakening | +9.042 |
Neg logit contributions | |
libel | -10.275 |
offensive | -8.657 |
rubbish | -8.419 |
vitro | -8.365 |
Yugoslavia | -8.051 |
Token | support |
Token ID | 1104 |
Feature activation | +9.35e-01 |
Pos logit contributions | |
companions | +22.031 |
blessings | +21.949 |
newfound | +21.129 |
enduring | +20.475 |
followers | +20.263 |
Neg logit contributions | |
libel | -18.470 |
offensive | -15.034 |
vitro | -14.859 |
ograph | -14.538 |
Serie | -14.237 |
Token | , |
Token ID | 11 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
companions | +10.596 |
newfound | +10.341 |
unborn | +10.339 |
awakening | +10.063 |
blessings | +10.047 |
Neg logit contributions | |
libel | -10.515 |
offensive | -8.736 |
rubbish | -8.569 |
vitro | -8.309 |
advert | -8.082 |
Token | to |
Token ID | 284 |
Feature activation | +2.56e-01 |
Pos logit contributions | |
companions | +4.518 |
unborn | +4.513 |
newfound | +4.460 |
grandchildren | +4.245 |
awakening | +4.205 |
Neg logit contributions | |
libel | -6.154 |
rubbish | -5.253 |
offensive | -5.138 |
Serie | -5.000 |
vitro | -4.955 |
Token | increase |
Token ID | 2620 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
companions | +3.177 |
newfound | +3.125 |
unborn | +3.111 |
grandchildren | +3.043 |
awakening | +2.988 |
Neg logit contributions | |
libel | -3.103 |
offensive | -2.609 |
rubbish | -2.533 |
Serie | -2.438 |
vitro | -2.437 |
Token | the |
Token ID | 262 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
companions | +13.896 |
newfound | +13.844 |
attendees | +13.188 |
unborn | +13.003 |
followers | +12.993 |
Neg logit contributions | |
libel | -12.296 |
offensive | -10.662 |
rubbish | -10.577 |
Yugoslavia | -10.018 |
ictionary | -9.917 |
Token | diversity |
Token ID | 9573 |
Feature activation | +7.16e-01 |
Pos logit contributions | |
newfound | +19.939 |
companions | +19.785 |
unborn | +19.027 |
enduring | +18.960 |
arrival | +18.942 |
Neg logit contributions | |
libel | -13.780 |
offensive | -11.851 |
ictionary | -11.788 |
rubbish | -11.193 |
Yugoslavia | -11.129 |
Token | in |
Token ID | 287 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
companions | +8.628 |
newfound | +8.435 |
unborn | +8.434 |
awakening | +8.139 |
arrival | +8.087 |
Neg logit contributions | |
libel | -8.046 |
rubbish | -6.744 |
offensive | -6.732 |
vitro | -6.240 |
Yugoslavia | -6.215 |
Token | their |
Token ID | 511 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
companions | +4.948 |
unborn | +4.842 |
newfound | +4.819 |
grandchildren | +4.642 |
survivors | +4.623 |
Neg logit contributions | |
libel | -4.266 |
rubbish | -3.500 |
offensive | -3.402 |
punt | -3.220 |
ictionary | -3.212 |
Token | franchise |
Token ID | 8663 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
newfound | +18.556 |
companions | +18.503 |
unborn | +18.018 |
arrival | +17.460 |
visions | +17.132 |
Neg logit contributions | |
libel | -15.486 |
offensive | -12.765 |
ictionary | -12.739 |
rubbish | -12.606 |
ograph | -12.211 |
Token | , |
Token ID | 11 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
companions | +12.223 |
newfound | +11.888 |
unborn | +11.640 |
arrival | +11.341 |
survivors | +11.294 |
Neg logit contributions | |
libel | -15.219 |
rubbish | -12.510 |
offensive | -12.417 |
Serie | -11.760 |
punt | -11.705 |
Token | Warner |
Token ID | 14469 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
companions | +12.199 |
newfound | +11.946 |
unborn | +11.876 |
attendees | +11.720 |
survivors | +11.633 |
Neg logit contributions | |
libel | -11.158 |
offensive | -9.432 |
rubbish | -9.247 |
ictionary | -8.942 |
ograph | -8.775 |
Token | Bros |
Token ID | 14266 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
companions | +3.632 |
newfound | +3.559 |
unborn | +3.496 |
grandchildren | +3.457 |
awakened | +3.445 |
Neg logit contributions | |
libel | -3.483 |
rubbish | -2.948 |
offensive | -2.866 |
punt | -2.735 |
vitro | -2.708 |
Token | . |
Token ID | 13 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
companions | +3.726 |
newfound | +3.685 |
unborn | +3.663 |
grandchildren | +3.603 |
caregivers | +3.523 |
Neg logit contributions | |
libel | -3.504 |
rubbish | -2.868 |
offensive | -2.815 |
vitro | -2.685 |
punt | -2.684 |
Token | � |
Token ID | 246 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
companions | +0.607 |
newfound | +0.597 |
unborn | +0.592 |
grandchildren | +0.576 |
awakening | +0.576 |
Neg logit contributions | |
libel | -0.591 |
rubbish | -0.491 |
advert | -0.466 |
Serie | -0.460 |
offensive | -0.458 |
Token | first |
Token ID | 11085 |
Feature activation | +7.79e-01 |
Pos logit contributions | |
companions | +14.063 |
unborn | +13.861 |
blessings | +13.710 |
newfound | +13.622 |
grandchildren | +13.308 |
Neg logit contributions | |
libel | -12.308 |
rubbish | -10.049 |
punt | -9.985 |
tabloid | -9.914 |
Serie | -9.806 |
Token | shall |
Token ID | 2236 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
companions | +10.763 |
unborn | +10.548 |
blessings | +10.217 |
grandchildren | +10.202 |
awakening | +10.098 |
Neg logit contributions | |
libel | -7.394 |
rubbish | -6.003 |
offensive | -5.964 |
Serie | -5.737 |
vitro | -5.603 |
Token | be |
Token ID | 307 |
Feature activation | +6.82e-01 |
Pos logit contributions | |
companions | +4.984 |
unborn | +4.965 |
grandchildren | +4.806 |
blessings | +4.695 |
newfound | +4.592 |
Neg logit contributions | |
libel | -6.019 |
offensive | -5.070 |
rubbish | -5.051 |
Serie | -4.965 |
vitro | -4.858 |
Token | last |
Token ID | 938 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
unborn | +8.236 |
companions | +8.075 |
grandchildren | +7.869 |
awakened | +7.691 |
newfound | +7.691 |
Neg logit contributions | |
libel | -7.947 |
rubbish | -6.450 |
offensive | -6.448 |
Serie | -6.442 |
vitro | -6.429 |
Token | and |
Token ID | 290 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
unborn | +10.247 |
companions | +9.985 |
grandchildren | +9.562 |
blessings | +9.383 |
survivors | +9.314 |
Neg logit contributions | |
libel | -12.734 |
rubbish | -10.687 |
offensive | -10.665 |
Serie | -10.554 |
vitro | -10.369 |
Token | the |
Token ID | 262 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
companions | +19.521 |
unborn | +19.510 |
enduring | +18.913 |
blessings | +18.692 |
grandchildren | +18.647 |
Neg logit contributions | |
libel | -14.659 |
Serie | -12.030 |
offensive | -11.839 |
ograph | -11.768 |
vitro | -11.690 |
Token | last |
Token ID | 938 |
Feature activation | +9.52e-01 |
Pos logit contributions | |
companions | +20.898 |
unborn | +20.822 |
blessings | +20.333 |
grandchildren | +19.899 |
survivors | +19.767 |
Neg logit contributions | |
libel | -13.948 |
Serie | -11.255 |
offensive | -11.076 |
Anyway | -11.029 |
pub | -10.888 |
Token | shall |
Token ID | 2236 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
companions | +10.433 |
unborn | +10.356 |
enduring | +9.927 |
blessings | +9.920 |
survivors | +9.913 |
Neg logit contributions | |
libel | -10.917 |
offensive | -9.324 |
rubbish | -9.076 |
Serie | -9.067 |
advert | -8.990 |
Token | be |
Token ID | 307 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
companions | +5.681 |
unborn | +5.637 |
grandchildren | +5.357 |
blessings | +5.325 |
newfound | +5.222 |
Neg logit contributions | |
libel | -7.622 |
offensive | -6.606 |
Serie | -6.503 |
rubbish | -6.396 |
Anyway | -6.237 |
Token | first |
Token ID | 717 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
unborn | +14.789 |
companions | +14.297 |
enduring | +14.130 |
newfound | +14.011 |
blessings | +13.975 |
Neg logit contributions | |
libel | -13.911 |
Serie | -11.512 |
punt | -11.375 |
vitro | -11.302 |
ograph | -11.279 |
Token | team |
Token ID | 1074 |
Feature activation | +9.04e-01 |
Pos logit contributions | |
libel | +0.414 |
rubbish | +0.339 |
offensive | +0.336 |
vitro | +0.318 |
Serie | +0.315 |
Neg logit contributions | |
companions | -0.447 |
newfound | -0.432 |
unborn | -0.430 |
grandchildren | -0.426 |
blessings | -0.415 |
Token | has |
Token ID | 468 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
companions | +10.426 |
newfound | +10.113 |
unborn | +9.981 |
grandchildren | +9.895 |
caregivers | +9.793 |
Neg logit contributions | |
libel | -10.098 |
offensive | -8.410 |
rubbish | -8.356 |
Serie | -7.879 |
vitro | -7.851 |
Token | been |
Token ID | 587 |
Feature activation | +8.65e-01 |
Pos logit contributions | |
newfound | +16.241 |
companions | +16.124 |
awakened | +16.010 |
grandchildren | +15.402 |
unborn | +15.356 |
Neg logit contributions | |
libel | -14.493 |
offensive | -12.530 |
rubbish | -11.401 |
ictionary | -11.384 |
ograph | -11.174 |
Token | working |
Token ID | 1762 |
Feature activation | +3.60e-01 |
Pos logit contributions | |
companions | +10.052 |
awakened | +9.842 |
newfound | +9.822 |
awakening | +9.647 |
enduring | +9.646 |
Neg logit contributions | |
libel | -10.119 |
offensive | -8.479 |
rubbish | -7.836 |
Serie | -7.793 |
vitro | -7.675 |
Token | hard |
Token ID | 1327 |
Feature activation | +3.95e-01 |
Pos logit contributions | |
companions | +4.449 |
newfound | +4.357 |
unborn | +4.293 |
grandchildren | +4.257 |
blessings | +4.173 |
Neg logit contributions | |
libel | -4.433 |
offensive | -3.674 |
rubbish | -3.569 |
Serie | -3.402 |
punt | -3.369 |
Token | to |
Token ID | 284 |
Feature activation | +5.49e-01 |
Pos logit contributions | |
companions | +4.483 |
unborn | +4.464 |
newfound | +4.427 |
enduring | +4.291 |
awakening | +4.287 |
Neg logit contributions | |
libel | -5.174 |
rubbish | -4.252 |
offensive | -4.236 |
Serie | -4.029 |
advert | -3.984 |
Token | create |
Token ID | 2251 |
Feature activation | +8.69e-01 |
Pos logit contributions | |
companions | +6.469 |
newfound | +6.302 |
unborn | +6.162 |
grandchildren | +6.084 |
arrival | +5.978 |
Neg logit contributions | |
libel | -6.779 |
offensive | -5.765 |
rubbish | -5.464 |
vitro | -5.336 |
Serie | -5.299 |
Token | top |
Token ID | 1353 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
companions | +10.431 |
newfound | +10.423 |
enduring | +10.111 |
unborn | +9.937 |
grandchildren | +9.893 |
Neg logit contributions | |
libel | -9.460 |
offensive | -7.717 |
rubbish | -7.671 |
advert | -7.337 |
vitro | -7.296 |
Token | notch |
Token ID | 29838 |
Feature activation | +5.31e-01 |
Pos logit contributions | |
companions | +2.738 |
unborn | +2.685 |
newfound | +2.660 |
grandchildren | +2.624 |
blessings | +2.585 |
Neg logit contributions | |
libel | -1.987 |
rubbish | -1.548 |
offensive | -1.515 |
advert | -1.432 |
vitro | -1.422 |
Token | tools |
Token ID | 4899 |
Feature activation | +8.34e-01 |
Pos logit contributions | |
companions | +6.880 |
newfound | +6.567 |
unborn | +6.563 |
grandchildren | +6.507 |
blessings | +6.367 |
Neg logit contributions | |
libel | -5.982 |
offensive | -5.008 |
rubbish | -4.910 |
vitro | -4.635 |
Anyway | -4.559 |
Token | just |
Token ID | 655 |
Feature activation | +1.85e-03 |
Pos logit contributions | |
companions | +9.886 |
unborn | +9.451 |
newfound | +9.306 |
enduring | +9.120 |
grandchildren | +9.094 |
Neg logit contributions | |
libel | -9.686 |
rubbish | -7.808 |
offensive | -7.693 |
vitro | -7.459 |
punt | -7.405 |
Token | Korea |
Token ID | 4969 |
Feature activation | -7.67e-01 |
Pos logit contributions | |
libel | +4.918 |
rubbish | +3.429 |
offensive | +3.224 |
advert | +2.977 |
Serie | +2.918 |
Neg logit contributions | |
companions | -12.008 |
unborn | -11.878 |
newfound | -11.876 |
grandchildren | -11.743 |
caregivers | -11.527 |
Token | , |
Token ID | 11 |
Feature activation | -2.95e-01 |
Pos logit contributions | |
libel | +9.842 |
rubbish | +8.236 |
offensive | +7.955 |
advert | +7.838 |
Switzerland | +7.626 |
Neg logit contributions | |
companions | -8.845 |
newfound | -8.718 |
unborn | -8.613 |
grandchildren | -8.489 |
blessings | -8.259 |
Token | where |
Token ID | 810 |
Feature activation | +4.36e-01 |
Pos logit contributions | |
libel | +3.931 |
rubbish | +3.279 |
offensive | +3.207 |
advert | +3.080 |
Serie | +3.071 |
Neg logit contributions | |
companions | -3.460 |
unborn | -3.389 |
newfound | -3.386 |
grandchildren | -3.338 |
awakening | -3.234 |
Token | reports |
Token ID | 3136 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
companions | +5.254 |
unborn | +5.179 |
grandchildren | +5.087 |
newfound | +5.085 |
survivors | +5.037 |
Neg logit contributions | |
libel | -5.314 |
offensive | -4.420 |
rubbish | -4.276 |
Serie | -4.245 |
Anyway | -4.147 |
Token | have |
Token ID | 423 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
libel | +1.171 |
offensive | +0.943 |
rubbish | +0.935 |
Serie | +0.887 |
vitro | +0.878 |
Neg logit contributions | |
companions | -1.447 |
unborn | -1.421 |
newfound | -1.418 |
grandchildren | -1.400 |
survivors | -1.374 |
Token | emerged |
Token ID | 9349 |
Feature activation | -2.53e-01 |
Pos logit contributions | |
libel | +4.754 |
rubbish | +4.001 |
offensive | +3.929 |
advert | +3.774 |
Serie | +3.765 |
Neg logit contributions | |
companions | -3.792 |
newfound | -3.711 |
unborn | -3.711 |
grandchildren | -3.652 |
awakening | -3.532 |
Token | of |
Token ID | 286 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
libel | +2.914 |
rubbish | +2.360 |
offensive | +2.328 |
Serie | +2.214 |
punt | +2.206 |
Neg logit contributions | |
companions | -3.427 |
unborn | -3.372 |
newfound | -3.363 |
grandchildren | -3.321 |
awakening | -3.238 |
Token | 80 |
Token ID | 4019 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
libel | +1.665 |
rubbish | +1.383 |
offensive | +1.378 |
Serie | +1.320 |
punt | +1.314 |
Neg logit contributions | |
companions | -1.401 |
unborn | -1.379 |
newfound | -1.374 |
grandchildren | -1.353 |
survivors | -1.313 |
Token | people |
Token ID | 661 |
Feature activation | +3.67e-01 |
Pos logit contributions | |
unborn | +1.549 |
companions | +1.547 |
grandchildren | +1.499 |
newfound | +1.494 |
survivors | +1.447 |
Neg logit contributions | |
libel | -2.789 |
offensive | -2.399 |
rubbish | -2.384 |
Serie | -2.328 |
punt | -2.309 |
Token | being |
Token ID | 852 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
unborn | +3.642 |
companions | +3.598 |
newfound | +3.540 |
enduring | +3.539 |
grandchildren | +3.451 |
Neg logit contributions | |
libel | -5.272 |
offensive | -4.536 |
rubbish | -4.479 |
Serie | -4.382 |
punt | -4.338 |
Token | publicly |
Token ID | 7271 |
Feature activation | -2.89e-01 |
Pos logit contributions | |
libel | +1.648 |
rubbish | +1.367 |
offensive | +1.366 |
Serie | +1.308 |
advert | +1.296 |
Neg logit contributions | |
companions | -1.409 |
unborn | -1.392 |
newfound | -1.381 |
grandchildren | -1.361 |
enduring | -1.322 |
Token | contin |
Token ID | 18487 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
companions | +6.349 |
newfound | +6.195 |
unborn | +6.146 |
blessings | +6.146 |
grandchildren | +5.966 |
Neg logit contributions | |
libel | -5.763 |
rubbish | -4.767 |
tabloid | -4.600 |
advert | -4.460 |
Serie | -4.440 |
Token | ued |
Token ID | 1739 |
Feature activation | +4.50e-01 |
Pos logit contributions | |
companions | +3.405 |
unborn | +3.288 |
newfound | +3.206 |
grandchildren | +3.197 |
blessings | +3.177 |
Neg logit contributions | |
libel | -5.430 |
rubbish | -4.621 |
offensive | -4.501 |
Serie | -4.419 |
punt | -4.393 |
Token | ). |
Token ID | 737 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
companions | +5.492 |
unborn | +5.390 |
blessings | +5.301 |
newfound | +5.239 |
grandchildren | +5.232 |
Neg logit contributions | |
libel | -5.331 |
offensive | -4.472 |
rubbish | -4.386 |
punt | -4.159 |
Serie | -4.121 |
Token | Extreme |
Token ID | 18111 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
companions | +14.081 |
blessings | +13.534 |
Resurrection | +13.156 |
unborn | +13.151 |
enduring | +12.993 |
Neg logit contributions | |
libel | -13.646 |
rubbish | -11.396 |
offensive | -11.148 |
vitro | -10.730 |
tabloid | -10.675 |
Token | Un |
Token ID | 791 |
Feature activation | +6.53e-01 |
Pos logit contributions | |
companions | +8.591 |
blessings | +8.082 |
newfound | +8.001 |
enduring | +7.909 |
awakening | +7.902 |
Neg logit contributions | |
libel | -7.259 |
offensive | -5.943 |
rubbish | -5.855 |
vitro | -5.736 |
ograph | -5.718 |
Token | ction |
Token ID | 596 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
companions | +7.830 |
unborn | +7.644 |
newfound | +7.558 |
blessings | +7.541 |
awakened | +7.354 |
Neg logit contributions | |
libel | -7.737 |
rubbish | -6.139 |
punt | -6.064 |
Serie | -5.936 |
tabloid | -5.910 |
Token | . |
Token ID | 13 |
Feature activation | +9.42e-01 |
Pos logit contributions | |
companions | +4.655 |
unborn | +4.589 |
blessings | +4.464 |
newfound | +4.454 |
grandchildren | +4.437 |
Neg logit contributions | |
libel | -4.381 |
rubbish | -3.645 |
offensive | -3.563 |
punt | -3.426 |
advert | -3.382 |
Token | Holy |
Token ID | 7439 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
companions | +10.670 |
blessings | +10.154 |
unborn | +10.147 |
Resurrection | +9.960 |
enduring | +9.959 |
Neg logit contributions | |
libel | -10.357 |
rubbish | -8.731 |
offensive | -8.583 |
vitro | -8.283 |
ograph | -8.156 |
Token | Orders |
Token ID | 30689 |
Feature activation | +6.13e-01 |
Pos logit contributions | |
companions | +13.359 |
blessings | +12.504 |
unborn | +12.288 |
enduring | +12.203 |
grandchildren | +12.172 |
Neg logit contributions | |
libel | -12.897 |
offensive | -11.142 |
rubbish | -10.965 |
Yugoslavia | -10.847 |
racket | -10.620 |
Token | . |
Token ID | 13 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
companions | +7.311 |
unborn | +7.091 |
blessings | +6.998 |
newfound | +6.950 |
grandchildren | +6.872 |
Neg logit contributions | |
libel | -7.150 |
rubbish | -5.983 |
offensive | -5.938 |
advert | -5.586 |
punt | -5.556 |
Token | Mat |
Token ID | 6550 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
companions | +12.181 |
blessings | +11.705 |
unborn | +11.371 |
Resurrection | +11.340 |
grandchildren | +11.265 |
Neg logit contributions | |
libel | -12.061 |
rubbish | -10.110 |
offensive | -10.021 |
vitro | -9.630 |
tabloid | -9.468 |
Token | , |
Token ID | 11 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
grandchildren | +20.647 |
blessings | +20.276 |
companions | +20.213 |
unborn | +19.780 |
newfound | +19.539 |
Neg logit contributions | |
libel | -16.530 |
offensive | -13.206 |
vitro | -13.129 |
Serie | -12.456 |
ictionary | -12.317 |
Token | � |
Token ID | 564 |
Feature activation | -9.56e-02 |
Pos logit contributions | |
companions | +12.602 |
grandchildren | +12.479 |
blessings | +12.159 |
unborn | +12.087 |
newfound | +12.068 |
Neg logit contributions | |
libel | -13.921 |
vitro | -11.474 |
offensive | -11.448 |
Serie | -11.039 |
rubbish | -10.946 |
Token | � |
Token ID | 250 |
Feature activation | +4.22e-01 |
Pos logit contributions | |
libel | +1.148 |
rubbish | +0.947 |
offensive | +0.908 |
Serie | +0.884 |
advert | +0.878 |
Neg logit contributions | |
companions | -1.263 |
newfound | -1.248 |
unborn | -1.235 |
grandchildren | -1.227 |
awakening | -1.201 |
Token | My |
Token ID | 3666 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
companions | +5.243 |
grandchildren | +5.220 |
unborn | +5.150 |
newfound | +5.143 |
blessings | +5.056 |
Neg logit contributions | |
libel | -4.969 |
rubbish | -4.020 |
offensive | -3.838 |
Serie | -3.812 |
vitro | -3.808 |
Token | head |
Token ID | 1182 |
Feature activation | -4.14e-02 |
Pos logit contributions | |
grandchildren | +19.295 |
companions | +19.077 |
unborn | +18.673 |
blessings | +18.235 |
newfound | +18.228 |
Neg logit contributions | |
libel | -13.928 |
offensive | -11.173 |
vitro | -10.973 |
Serie | -10.646 |
rubbish | -10.643 |
Token | is |
Token ID | 318 |
Feature activation | +3.11e-02 |
Pos logit contributions | |
libel | +0.491 |
rubbish | +0.397 |
offensive | +0.388 |
Serie | +0.375 |
vitro | +0.370 |
Neg logit contributions | |
companions | -0.551 |
unborn | -0.540 |
newfound | -0.538 |
grandchildren | -0.532 |
awakening | -0.526 |
Token | going |
Token ID | 1016 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
companions | +0.350 |
unborn | +0.343 |
newfound | +0.343 |
awakening | +0.337 |
grandchildren | +0.335 |
Neg logit contributions | |
libel | -0.427 |
offensive | -0.356 |
rubbish | -0.354 |
vitro | -0.341 |
Serie | -0.341 |
Token | to |
Token ID | 284 |
Feature activation | -4.83e-01 |
Pos logit contributions | |
libel | +2.789 |
rubbish | +2.294 |
offensive | +2.277 |
Serie | +2.189 |
advert | +2.178 |
Neg logit contributions | |
companions | -2.502 |
unborn | -2.460 |
newfound | -2.425 |
grandchildren | -2.408 |
awakening | -2.354 |
Token | explode |
Token ID | 22818 |
Feature activation | -6.36e-01 |
Pos logit contributions | |
libel | +7.193 |
rubbish | +6.126 |
offensive | +6.006 |
advert | +5.804 |
Serie | +5.785 |
Neg logit contributions | |
companions | -4.911 |
unborn | -4.794 |
newfound | -4.792 |
grandchildren | -4.711 |
awakening | -4.541 |
Token | with |
Token ID | 351 |
Feature activation | +6.98e-01 |
Pos logit contributions | |
libel | +8.136 |
rubbish | +6.769 |
offensive | +6.571 |
advert | +6.330 |
Serie | +6.277 |
Neg logit contributions | |
companions | -7.581 |
newfound | -7.451 |
unborn | -7.384 |
grandchildren | -7.308 |
caregivers | -7.098 |
Token | cut |
Token ID | 2005 |
Feature activation | -2.02e-02 |
Pos logit contributions | |
companions | +8.438 |
newfound | +8.339 |
grandchildren | +8.295 |
unborn | +8.173 |
blessings | +7.885 |
Neg logit contributions | |
libel | -8.057 |
offensive | -6.783 |
Serie | -6.465 |
vitro | -6.395 |
rubbish | -6.351 |
Token | San |
Token ID | 2986 |
Feature activation | -4.58e-02 |
Pos logit contributions | |
libel | +16.418 |
offensive | +14.064 |
punt | +13.834 |
rubbish | +13.761 |
Serie | +13.206 |
Neg logit contributions | |
companions | -13.179 |
unborn | -13.177 |
grandchildren | -13.148 |
newfound | -12.947 |
caregivers | -12.518 |
Token | Francisco |
Token ID | 6033 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
libel | +0.501 |
rubbish | +0.403 |
offensive | +0.379 |
advert | +0.367 |
vitro | +0.367 |
Neg logit contributions | |
companions | -0.648 |
unborn | -0.637 |
newfound | -0.635 |
grandchildren | -0.624 |
blessings | -0.616 |
Token | . |
Token ID | 13 |
Feature activation | -5.99e-01 |
Pos logit contributions | |
libel | +8.045 |
rubbish | +6.499 |
offensive | +6.348 |
punt | +6.073 |
advert | +6.060 |
Neg logit contributions | |
companions | -9.189 |
unborn | -9.028 |
newfound | -9.003 |
grandchildren | -8.952 |
caregivers | -8.674 |
Token | This |
Token ID | 770 |
Feature activation | -6.45e-01 |
Pos logit contributions | |
libel | +7.170 |
rubbish | +5.870 |
offensive | +5.787 |
Serie | +5.552 |
punt | +5.516 |
Neg logit contributions | |
companions | -7.621 |
unborn | -7.507 |
newfound | -7.493 |
grandchildren | -7.387 |
awakening | -7.199 |
Token | week |
Token ID | 1285 |
Feature activation | +9.28e-02 |
Pos logit contributions | |
libel | +8.385 |
rubbish | +6.990 |
offensive | +6.869 |
punt | +6.628 |
advert | +6.586 |
Neg logit contributions | |
companions | -7.501 |
unborn | -7.353 |
grandchildren | -7.308 |
newfound | -7.265 |
caregivers | -7.056 |
Token | should |
Token ID | 815 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
companions | +1.057 |
newfound | +1.032 |
unborn | +1.031 |
grandchildren | +0.994 |
caregivers | +0.986 |
Neg logit contributions | |
libel | -1.274 |
rubbish | -1.073 |
offensive | -1.033 |
vitro | -1.011 |
Serie | -0.999 |
Token | be |
Token ID | 307 |
Feature activation | -4.93e-01 |
Pos logit contributions | |
libel | +1.973 |
rubbish | +1.637 |
offensive | +1.623 |
Serie | +1.549 |
vitro | +1.540 |
Neg logit contributions | |
companions | -1.807 |
newfound | -1.770 |
unborn | -1.758 |
grandchildren | -1.731 |
blessings | -1.688 |
Token | a |
Token ID | 257 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
libel | +6.463 |
rubbish | +5.378 |
offensive | +5.254 |
advert | +5.051 |
Serie | +5.031 |
Neg logit contributions | |
companions | -5.873 |
unborn | -5.756 |
newfound | -5.750 |
grandchildren | -5.671 |
caregivers | -5.497 |
Token | tougher |
Token ID | 20516 |
Feature activation | -8.27e-01 |
Pos logit contributions | |
libel | +1.675 |
rubbish | +1.398 |
offensive | +1.375 |
advert | +1.316 |
vitro | +1.312 |
Neg logit contributions | |
companions | -1.490 |
newfound | -1.468 |
unborn | -1.449 |
grandchildren | -1.429 |
awakening | -1.399 |
Token | task |
Token ID | 4876 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
libel | +10.116 |
rubbish | +8.248 |
offensive | +8.014 |
punt | +8.003 |
advert | +7.805 |
Neg logit contributions | |
companions | -9.758 |
unborn | -9.720 |
grandchildren | -9.693 |
newfound | -9.594 |
caregivers | -9.364 |
Token | , |
Token ID | 11 |
Feature activation | -8.62e-01 |
Pos logit contributions | |
libel | +7.057 |
rubbish | +5.719 |
offensive | +5.598 |
punt | +5.326 |
advert | +5.319 |
Neg logit contributions | |
companions | -7.800 |
unborn | -7.689 |
newfound | -7.681 |
grandchildren | -7.606 |
caregivers | -7.385 |
Token | needed |
Token ID | 2622 |
Feature activation | -3.37e-01 |
Pos logit contributions | |
libel | +1.685 |
rubbish | +1.390 |
offensive | +1.359 |
Serie | +1.304 |
advert | +1.297 |
Neg logit contributions | |
companions | -1.669 |
unborn | -1.637 |
newfound | -1.633 |
grandchildren | -1.613 |
caregivers | -1.570 |
Token | to |
Token ID | 284 |
Feature activation | -8.44e-01 |
Pos logit contributions | |
libel | +4.529 |
rubbish | +3.790 |
offensive | +3.696 |
Serie | +3.556 |
advert | +3.550 |
Neg logit contributions | |
companions | -3.988 |
unborn | -3.902 |
newfound | -3.883 |
grandchildren | -3.834 |
caregivers | -3.719 |
Token | find |
Token ID | 1064 |
Feature activation | -6.18e-03 |
Pos logit contributions | |
libel | +11.381 |
rubbish | +9.610 |
advert | +9.100 |
punt | +9.030 |
offensive | +8.970 |
Neg logit contributions | |
companions | -9.077 |
newfound | -8.907 |
unborn | -8.902 |
grandchildren | -8.737 |
caregivers | -8.494 |
Token | a |
Token ID | 257 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
libel | +0.070 |
rubbish | +0.056 |
offensive | +0.056 |
vitro | +0.053 |
Serie | +0.053 |
Neg logit contributions | |
companions | -0.085 |
newfound | -0.083 |
unborn | -0.082 |
grandchildren | -0.082 |
survivors | -0.081 |
Token | buyer |
Token ID | 17872 |
Feature activation | -4.03e-01 |
Pos logit contributions | |
companions | +1.577 |
newfound | +1.568 |
unborn | +1.534 |
grandchildren | +1.507 |
enduring | +1.488 |
Neg logit contributions | |
libel | -1.987 |
offensive | -1.674 |
rubbish | -1.657 |
vitro | -1.601 |
advert | -1.591 |
Token | to |
Token ID | 284 |
Feature activation | -7.26e-01 |
Pos logit contributions | |
libel | +4.520 |
rubbish | +3.631 |
offensive | +3.528 |
advert | +3.356 |
Serie | +3.344 |
Neg logit contributions | |
companions | -5.599 |
unborn | -5.498 |
newfound | -5.494 |
grandchildren | -5.428 |
caregivers | -5.286 |
Token | haul |
Token ID | 25647 |
Feature activation | -5.69e-01 |
Pos logit contributions | |
libel | +9.696 |
rubbish | +8.175 |
advert | +7.743 |
offensive | +7.742 |
punt | +7.705 |
Neg logit contributions | |
companions | -8.057 |
newfound | -7.903 |
unborn | -7.896 |
grandchildren | -7.749 |
awakening | -7.561 |
Token | the |
Token ID | 262 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
libel | +6.854 |
rubbish | +5.627 |
offensive | +5.447 |
advert | +5.222 |
Serie | +5.196 |
Neg logit contributions | |
companions | -7.327 |
unborn | -7.200 |
newfound | -7.190 |
grandchildren | -7.091 |
awakening | -6.909 |
Token | rust |
Token ID | 17000 |
Feature activation | -3.72e-01 |
Pos logit contributions | |
companions | +1.502 |
newfound | +1.494 |
unborn | +1.481 |
grandchildren | +1.451 |
survivors | +1.421 |
Neg logit contributions | |
libel | -1.724 |
offensive | -1.440 |
rubbish | -1.400 |
vitro | -1.372 |
Serie | -1.370 |
Token | ing |
Token ID | 278 |
Feature activation | -6.91e-01 |
Pos logit contributions | |
libel | +4.296 |
rubbish | +3.460 |
offensive | +3.390 |
advert | +3.239 |
Serie | +3.234 |
Neg logit contributions | |
companions | -5.050 |
unborn | -4.961 |
newfound | -4.950 |
grandchildren | -4.884 |
caregivers | -4.755 |
Token | relic |
Token ID | 26341 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
libel | +9.446 |
rubbish | +8.066 |
offensive | +7.674 |
advert | +7.492 |
Serie | +7.424 |
Neg logit contributions | |
companions | -7.538 |
unborn | -7.403 |
newfound | -7.372 |
grandchildren | -7.287 |
caregivers | -7.080 |
Token | the |
Token ID | 262 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
libel | +10.360 |
rubbish | +8.832 |
offensive | +8.625 |
advert | +8.402 |
Serie | +8.341 |
Neg logit contributions | |
companions | -6.913 |
newfound | -6.789 |
unborn | -6.789 |
grandchildren | -6.685 |
caregivers | -6.459 |
Token | arguments |
Token ID | 7159 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
libel | +2.406 |
rubbish | +2.029 |
offensive | +2.000 |
Serie | +1.910 |
advert | +1.907 |
Neg logit contributions | |
companions | -1.880 |
newfound | -1.835 |
unborn | -1.835 |
grandchildren | -1.799 |
awakening | -1.744 |
Token | ap |
Token ID | 2471 |
Feature activation | +9.07e-02 |
Pos logit contributions | |
libel | +1.324 |
rubbish | +1.087 |
offensive | +1.079 |
Serie | +1.018 |
vitro | +1.012 |
Neg logit contributions | |
companions | -1.408 |
unborn | -1.377 |
newfound | -1.376 |
grandchildren | -1.354 |
awakening | -1.318 |
Token | = |
Token ID | 796 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
companions | +1.104 |
newfound | +1.080 |
unborn | +1.074 |
grandchildren | +1.064 |
arrival | +1.039 |
Neg logit contributions | |
libel | -1.157 |
rubbish | -0.969 |
offensive | -0.931 |
Serie | -0.903 |
advert | -0.890 |
Token | arg |
Token ID | 1822 |
Feature activation | -6.79e-01 |
Pos logit contributions | |
libel | +2.867 |
rubbish | +2.442 |
offensive | +2.411 |
Serie | +2.313 |
advert | +2.299 |
Neg logit contributions | |
companions | -2.047 |
newfound | -1.997 |
unborn | -1.993 |
grandchildren | -1.949 |
awakening | -1.888 |
Token | parse |
Token ID | 29572 |
Feature activation | -6.68e-01 |
Pos logit contributions | |
libel | +5.975 |
rubbish | +4.632 |
offensive | +4.495 |
advert | +4.253 |
vitro | +4.227 |
Neg logit contributions | |
companions | -10.416 |
newfound | -10.364 |
unborn | -10.336 |
grandchildren | -10.236 |
blessings | -10.047 |
Token | . |
Token ID | 13 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
libel | +7.064 |
rubbish | +5.604 |
offensive | +5.396 |
advert | +5.178 |
Serie | +5.127 |
Neg logit contributions | |
companions | -9.535 |
newfound | -9.399 |
unborn | -9.389 |
grandchildren | -9.277 |
caregivers | -9.065 |
Token | Arg |
Token ID | 28100 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
libel | +2.457 |
rubbish | +1.885 |
offensive | +1.804 |
advert | +1.711 |
vitro | +1.693 |
Neg logit contributions | |
companions | -4.059 |
newfound | -4.000 |
unborn | -3.982 |
grandchildren | -3.929 |
awakening | -3.862 |
Token | ument |
Token ID | 1713 |
Feature activation | -4.16e-01 |
Pos logit contributions | |
libel | +3.935 |
rubbish | +3.206 |
offensive | +3.130 |
advert | +2.992 |
Serie | +2.984 |
Neg logit contributions | |
companions | -4.102 |
newfound | -4.009 |
unborn | -4.003 |
grandchildren | -3.964 |
caregivers | -3.846 |
Token | Parser |
Token ID | 46677 |
Feature activation | -4.92e-01 |
Pos logit contributions | |
libel | +4.141 |
rubbish | +3.206 |
offensive | +3.105 |
advert | +2.928 |
Serie | +2.911 |
Neg logit contributions | |
companions | -6.311 |
unborn | -6.200 |
newfound | -6.198 |
grandchildren | -6.141 |
awakening | -5.987 |
Token | () |
Token ID | 3419 |
Feature activation | -7.18e-01 |
Pos logit contributions | |
libel | +5.916 |
rubbish | +4.818 |
offensive | +4.713 |
advert | +4.478 |
Serie | +4.468 |
Neg logit contributions | |
companions | -6.480 |
unborn | -6.350 |
newfound | -6.343 |
grandchildren | -6.268 |
awakening | -6.097 |
Token | - |
Token ID | 12 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
libel | +9.418 |
rubbish | +8.001 |
offensive | +7.811 |
advert | +7.582 |
Serie | +7.581 |
Neg logit contributions | |
companions | -6.183 |
unborn | -6.065 |
newfound | -6.058 |
grandchildren | -5.939 |
caregivers | -5.728 |
Token | g |
Token ID | 70 |
Feature activation | +5.64e-01 |
Pos logit contributions | |
libel | +3.912 |
rubbish | +3.188 |
offensive | +3.078 |
advert | +2.976 |
Serie | +2.947 |
Neg logit contributions | |
companions | -4.374 |
newfound | -4.295 |
unborn | -4.285 |
grandchildren | -4.234 |
awakening | -4.117 |
Token | umi |
Token ID | 12994 |
Feature activation | -6.25e-01 |
Pos logit contributions | |
companions | +5.653 |
newfound | +5.380 |
unborn | +5.370 |
grandchildren | +5.296 |
survivors | +5.294 |
Neg logit contributions | |
libel | -8.010 |
rubbish | -6.755 |
punt | -6.535 |
offensive | -6.351 |
Serie | -6.340 |
Token | crime |
Token ID | 4065 |
Feature activation | -5.43e-01 |
Pos logit contributions | |
libel | +8.961 |
rubbish | +7.546 |
offensive | +7.379 |
advert | +7.155 |
Serie | +7.135 |
Neg logit contributions | |
companions | -6.535 |
unborn | -6.408 |
newfound | -6.397 |
grandchildren | -6.281 |
caregivers | -6.067 |
Token | synd |
Token ID | 11150 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
libel | +8.660 |
rubbish | +7.452 |
offensive | +7.307 |
advert | +7.098 |
Serie | +7.076 |
Neg logit contributions | |
companions | -4.854 |
newfound | -4.749 |
unborn | -4.748 |
grandchildren | -4.645 |
caregivers | -4.466 |
Token | icate |
Token ID | 5344 |
Feature activation | -4.67e-01 |
Pos logit contributions | |
libel | +1.590 |
rubbish | +1.321 |
offensive | +1.285 |
advert | +1.240 |
Serie | +1.233 |
Neg logit contributions | |
companions | -1.448 |
newfound | -1.419 |
unborn | -1.416 |
grandchildren | -1.402 |
blessings | -1.356 |
Token | , |
Token ID | 11 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
libel | +6.101 |
rubbish | +5.067 |
offensive | +4.943 |
advert | +4.767 |
Serie | +4.743 |
Neg logit contributions | |
companions | -5.563 |
unborn | -5.455 |
newfound | -5.452 |
grandchildren | -5.371 |
awakening | -5.209 |
Token | which |
Token ID | 543 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
libel | +4.041 |
rubbish | +3.287 |
offensive | +3.210 |
advert | +3.059 |
Serie | +3.040 |
Neg logit contributions | |
companions | -4.523 |
newfound | -4.438 |
unborn | -4.437 |
grandchildren | -4.381 |
awakening | -4.264 |
Token | marked |
Token ID | 7498 |
Feature activation | -6.84e-02 |
Pos logit contributions | |
libel | +14.710 |
rubbish | +12.460 |
advert | +12.237 |
offensive | +11.930 |
Serie | +11.904 |
Neg logit contributions | |
companions | -9.943 |
newfound | -9.758 |
unborn | -9.662 |
grandchildren | -9.559 |
awakening | -9.363 |
Token | its |
Token ID | 663 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
libel | +0.796 |
rubbish | +0.645 |
offensive | +0.634 |
advert | +0.599 |
vitro | +0.599 |
Neg logit contributions | |
companions | -0.919 |
newfound | -0.919 |
unborn | -0.902 |
grandchildren | -0.896 |
survivors | -0.879 |
Token | 100 |
Token ID | 1802 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
arrival | +14.603 |
newfound | +14.500 |
companions | +14.215 |
awakening | +14.094 |
enduring | +13.901 |
Neg logit contributions | |
libel | -13.378 |
offensive | -11.614 |
rubbish | -11.379 |
Anyway | -11.309 |
ictionary | -11.266 |
Token | these |
Token ID | 777 |
Feature activation | +9.17e-01 |
Pos logit contributions | |
newfound | +9.002 |
companions | +8.985 |
grandchildren | +8.694 |
unborn | +8.662 |
enduring | +8.660 |
Neg logit contributions | |
libel | -8.720 |
offensive | -7.287 |
rubbish | -6.910 |
ictionary | -6.821 |
ograph | -6.693 |
Token | were |
Token ID | 547 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
newfound | +9.886 |
companions | +9.787 |
grandchildren | +9.509 |
enduring | +9.392 |
awakened | +9.370 |
Neg logit contributions | |
libel | -11.332 |
offensive | -9.671 |
rubbish | -9.195 |
ictionary | -9.033 |
ograph | -8.974 |
Token | badly |
Token ID | 11234 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
companions | +1.153 |
newfound | +1.129 |
unborn | +1.118 |
grandchildren | +1.109 |
awakened | +1.085 |
Neg logit contributions | |
libel | -1.395 |
offensive | -1.170 |
rubbish | -1.147 |
Serie | -1.097 |
vitro | -1.095 |
Token | damaged |
Token ID | 9694 |
Feature activation | -4.60e-01 |
Pos logit contributions | |
libel | +14.167 |
rubbish | +12.383 |
advert | +11.588 |
offensive | +11.404 |
punt | +11.109 |
Neg logit contributions | |
newfound | -10.460 |
companions | -10.453 |
grandchildren | -10.255 |
unborn | -10.224 |
blessings | -10.025 |
Token | during |
Token ID | 1141 |
Feature activation | -8.25e-01 |
Pos logit contributions | |
libel | +5.472 |
rubbish | +4.462 |
offensive | +4.333 |
advert | +4.153 |
Serie | +4.132 |
Neg logit contributions | |
companions | -6.013 |
newfound | -5.915 |
unborn | -5.914 |
grandchildren | -5.829 |
caregivers | -5.672 |
Token | refuel |
Token ID | 47874 |
Feature activation | -6.89e-01 |
Pos logit contributions | |
libel | +11.276 |
rubbish | +9.563 |
offensive | +9.208 |
advert | +9.029 |
punt | +8.939 |
Neg logit contributions | |
companions | -8.819 |
unborn | -8.728 |
newfound | -8.579 |
grandchildren | -8.508 |
caregivers | -8.251 |
Token | ing |
Token ID | 278 |
Feature activation | -9.13e-01 |
Pos logit contributions | |
libel | +6.943 |
rubbish | +5.525 |
offensive | +5.311 |
advert | +5.032 |
punt | +4.967 |
Neg logit contributions | |
companions | -10.026 |
unborn | -9.924 |
newfound | -9.890 |
grandchildren | -9.799 |
caregivers | -9.579 |
Token | in |
Token ID | 287 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
libel | +11.920 |
rubbish | +10.176 |
offensive | +9.745 |
advert | +9.529 |
punt | +9.483 |
Neg logit contributions | |
companions | -9.895 |
unborn | -9.853 |
newfound | -9.771 |
grandchildren | -9.621 |
caregivers | -9.353 |
Token | 1965 |
Token ID | 17672 |
Feature activation | -4.59e-01 |
Pos logit contributions | |
libel | +20.154 |
rubbish | +17.758 |
Switzerland | +17.401 |
Yugoslavia | +17.018 |
England | +17.003 |
Neg logit contributions | |
unborn | -14.745 |
companions | -14.597 |
newfound | -14.279 |
grandchildren | -13.965 |
caregivers | -13.820 |
Token | and |
Token ID | 290 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
libel | +5.395 |
rubbish | +4.370 |
offensive | +4.266 |
advert | +4.066 |
Serie | +4.051 |
Neg logit contributions | |
companions | -6.134 |
newfound | -6.017 |
unborn | -6.013 |
grandchildren | -5.945 |
awakening | -5.788 |
Token | 1967 |
Token ID | 15904 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
companions | +1.435 |
newfound | +1.411 |
unborn | +1.400 |
grandchildren | +1.389 |
awakened | +1.361 |
Neg logit contributions | |
libel | -1.319 |
rubbish | -1.061 |
offensive | -1.057 |
advert | -0.999 |
Serie | -0.992 |
Token | show |
Token ID | 905 |
Feature activation | +3.60e-01 |
Pos logit contributions | |
libel | +11.358 |
rubbish | +9.478 |
advert | +9.011 |
punt | +8.962 |
offensive | +8.921 |
Neg logit contributions | |
companions | -10.298 |
unborn | -10.176 |
newfound | -10.099 |
grandchildren | -10.007 |
caregivers | -9.804 |
Token | your |
Token ID | 534 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
companions | +4.532 |
grandchildren | +4.473 |
newfound | +4.393 |
unborn | +4.383 |
caregivers | +4.332 |
Neg logit contributions | |
libel | -4.421 |
rubbish | -3.567 |
offensive | -3.558 |
Serie | -3.458 |
advert | -3.366 |
Token | child |
Token ID | 1200 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
grandchildren | +14.919 |
companions | +14.520 |
unborn | +14.518 |
newfound | +14.260 |
caregivers | +13.880 |
Neg logit contributions | |
libel | -13.927 |
offensive | -11.427 |
rubbish | -11.078 |
Serie | -10.970 |
football | -10.621 |
Token | how |
Token ID | 703 |
Feature activation | +4.42e-01 |
Pos logit contributions | |
companions | +2.702 |
newfound | +2.643 |
grandchildren | +2.615 |
unborn | +2.608 |
caregivers | +2.513 |
Neg logit contributions | |
libel | -2.931 |
rubbish | -2.395 |
offensive | -2.374 |
advert | -2.273 |
Serie | -2.269 |
Token | to |
Token ID | 284 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
companions | +4.340 |
unborn | +4.230 |
newfound | +4.165 |
grandchildren | +4.162 |
blessings | +4.043 |
Neg logit contributions | |
libel | -6.444 |
offensive | -5.474 |
rubbish | -5.305 |
Serie | -5.190 |
punt | -5.175 |
Token | thread |
Token ID | 4704 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
libel | +11.685 |
rubbish | +9.902 |
advert | +9.283 |
punt | +9.131 |
offensive | +9.041 |
Neg logit contributions | |
companions | -12.031 |
unborn | -11.921 |
newfound | -11.815 |
grandchildren | -11.738 |
caregivers | -11.423 |
Token | your |
Token ID | 534 |
Feature activation | +7.32e-02 |
Pos logit contributions | |
libel | +12.339 |
rubbish | +10.393 |
offensive | +9.952 |
advert | +9.604 |
vitro | +9.551 |
Neg logit contributions | |
companions | -11.994 |
unborn | -11.875 |
newfound | -11.771 |
grandchildren | -11.613 |
caregivers | -11.453 |
Token | machine |
Token ID | 4572 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
companions | +1.023 |
newfound | +1.013 |
unborn | +1.008 |
grandchildren | +0.998 |
blessings | +0.967 |
Neg logit contributions | |
libel | -0.820 |
offensive | -0.651 |
rubbish | -0.645 |
Serie | -0.612 |
advert | -0.598 |
Token | or |
Token ID | 393 |
Feature activation | -7.94e-01 |
Pos logit contributions | |
libel | +11.226 |
rubbish | +9.233 |
offensive | +8.792 |
advert | +8.753 |
vitro | +8.598 |
Neg logit contributions | |
newfound | -12.118 |
unborn | -12.100 |
companions | -12.071 |
grandchildren | -11.875 |
awakening | -11.563 |
Token | refer |
Token ID | 3522 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
libel | +9.958 |
rubbish | +8.382 |
offensive | +7.944 |
advert | +7.917 |
punt | +7.743 |
Neg logit contributions | |
companions | -9.082 |
newfound | -8.963 |
unborn | -8.963 |
grandchildren | -8.750 |
awakening | -8.544 |
Token | to |
Token ID | 284 |
Feature activation | -8.66e-01 |
Pos logit contributions | |
companions | +1.339 |
grandchildren | +1.297 |
unborn | +1.287 |
caregivers | +1.270 |
newfound | +1.268 |
Neg logit contributions | |
libel | -1.681 |
rubbish | -1.412 |
offensive | -1.396 |
Serie | -1.352 |
punt | -1.339 |
Token | sorts |
Token ID | 10524 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
libel | +27.540 |
rubbish | +25.241 |
vitro | +23.881 |
advert | +23.671 |
offensive | +23.616 |
Neg logit contributions | |
newfound | -12.648 |
grandchildren | -12.619 |
companions | -12.321 |
awakening | -12.192 |
awakened | -11.749 |
Token | of |
Token ID | 286 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
libel | +10.609 |
rubbish | +8.659 |
offensive | +7.569 |
advert | +7.563 |
vitro | +7.261 |
Neg logit contributions | |
newfound | -16.453 |
unborn | -16.346 |
companions | -16.227 |
grandchildren | -16.155 |
awakened | -16.018 |
Token | everyday |
Token ID | 10908 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
libel | +26.078 |
rubbish | +24.245 |
advert | +22.226 |
vitro | +22.034 |
Serie | +21.773 |
Neg logit contributions | |
grandchildren | -12.272 |
newfound | -12.101 |
companions | -12.005 |
awakening | -11.653 |
unborn | -11.454 |
Token | household |
Token ID | 6641 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
libel | +21.608 |
rubbish | +20.492 |
advert | +18.498 |
offensive | +17.926 |
vitro | +17.910 |
Neg logit contributions | |
newfound | -13.161 |
grandchildren | -12.817 |
awakening | -12.419 |
unborn | -12.398 |
awakened | -12.304 |
Token | products |
Token ID | 3186 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
libel | +15.236 |
rubbish | +14.101 |
offensive | +12.721 |
advert | +12.516 |
Serie | +12.101 |
Neg logit contributions | |
newfound | -11.877 |
grandchildren | -11.649 |
unborn | -11.631 |
companions | -11.392 |
awakening | -11.187 |
Token | . |
Token ID | 13 |
Feature activation | -2.52e+00 |
Pos logit contributions | |
libel | +12.316 |
rubbish | +10.410 |
offensive | +9.917 |
advert | +9.775 |
vitro | +9.552 |
Neg logit contributions | |
companions | -12.206 |
newfound | -12.142 |
unborn | -11.941 |
grandchildren | -11.870 |
awakening | -11.542 |
Token | It |
Token ID | 632 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
libel | +24.914 |
Switzerland | +23.795 |
Brussels | +23.781 |
England | +23.651 |
Serie | +23.349 |
Neg logit contributions | |
newfound | -19.412 |
awakening | -18.597 |
companions | -18.577 |
unborn | -18.434 |
awakened | -18.060 |
Token | stretches |
Token ID | 23687 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
libel | +22.485 |
advert | +20.413 |
rubbish | +20.110 |
offensive | +18.344 |
counterfe | +18.260 |
Neg logit contributions | |
newfound | -16.250 |
grandchildren | -16.113 |
companions | -15.877 |
unborn | -15.431 |
awakening | -15.198 |
Token | under |
Token ID | 739 |
Feature activation | -1.93e+00 |
Pos logit contributions | |
libel | +14.311 |
rubbish | +12.323 |
advert | +11.596 |
offensive | +11.512 |
Serie | +11.284 |
Neg logit contributions | |
newfound | -11.357 |
companions | -11.315 |
unborn | -11.057 |
grandchildren | -11.024 |
awakening | -10.773 |
Token | stress |
Token ID | 5503 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
libel | +24.775 |
rubbish | +22.990 |
offensive | +21.335 |
vitro | +20.959 |
advert | +20.829 |
Neg logit contributions | |
newfound | -13.869 |
companions | -13.610 |
grandchildren | -13.218 |
unborn | -13.187 |
awakening | -12.792 |
Token | , |
Token ID | 11 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
libel | +15.326 |
rubbish | +13.384 |
offensive | +12.835 |
advert | +12.398 |
vitro | +12.386 |
Neg logit contributions | |
newfound | -12.398 |
companions | -12.284 |
grandchildren | -11.989 |
unborn | -11.972 |
awakening | -11.477 |
Token | second |
Token ID | 1218 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
libel | +16.345 |
rubbish | +14.133 |
advert | +13.386 |
offensive | +13.376 |
punt | +13.285 |
Neg logit contributions | |
companions | -10.394 |
grandchildren | -10.146 |
unborn | -9.688 |
caregivers | -9.669 |
blessings | -9.429 |
Token | violation |
Token ID | 8747 |
Feature activation | -9.63e-01 |
Pos logit contributions | |
libel | +18.618 |
rubbish | +16.208 |
doping | +15.425 |
advert | +15.215 |
offensive | +15.196 |
Neg logit contributions | |
companions | -12.960 |
grandchildren | -12.764 |
caregivers | -12.258 |
newfound | -12.208 |
unborn | -12.136 |
Token | involving |
Token ID | 7411 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
libel | +12.588 |
rubbish | +10.568 |
offensive | +10.116 |
advert | +10.075 |
punt | +9.963 |
Neg logit contributions | |
companions | -10.371 |
grandchildren | -10.083 |
unborn | -10.002 |
newfound | -9.957 |
caregivers | -9.652 |
Token | the |
Token ID | 262 |
Feature activation | -8.34e-01 |
Pos logit contributions | |
libel | +16.889 |
rubbish | +14.655 |
offensive | +13.952 |
punt | +13.775 |
Serie | +13.768 |
Neg logit contributions | |
companions | -11.437 |
unborn | -11.182 |
grandchildren | -11.156 |
newfound | -10.946 |
caregivers | -10.782 |
Token | same |
Token ID | 976 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
libel | +11.735 |
rubbish | +10.157 |
offensive | +9.775 |
advert | +9.607 |
Serie | +9.550 |
Neg logit contributions | |
companions | -8.260 |
grandchildren | -7.970 |
unborn | -7.929 |
newfound | -7.928 |
caregivers | -7.763 |
Token | banned |
Token ID | 9301 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
libel | +22.952 |
rubbish | +20.528 |
doping | +19.888 |
advert | +19.539 |
steroids | +19.456 |
Neg logit contributions | |
grandchildren | -14.134 |
companions | -14.108 |
caregivers | -13.442 |
newfound | -13.105 |
unborn | -13.007 |
Token | substance |
Token ID | 9136 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
libel | +26.400 |
doping | +23.715 |
rubbish | +23.470 |
steroids | +22.813 |
advert | +22.205 |
Neg logit contributions | |
grandchildren | -17.803 |
companions | -16.936 |
caregivers | -16.760 |
attendants | -16.446 |
blessings | -16.100 |
Token | is |
Token ID | 318 |
Feature activation | -7.14e-01 |
Pos logit contributions | |
libel | +17.162 |
rubbish | +14.628 |
advert | +14.069 |
Serie | +13.939 |
Switzerland | +13.926 |
Neg logit contributions | |
companions | -11.991 |
grandchildren | -11.576 |
unborn | -11.464 |
newfound | -11.306 |
blessings | -11.004 |
Token | considered |
Token ID | 3177 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
libel | +10.508 |
rubbish | +8.960 |
offensive | +8.683 |
Serie | +8.514 |
advert | +8.468 |
Neg logit contributions | |
companions | -7.085 |
unborn | -6.874 |
newfound | -6.837 |
grandchildren | -6.810 |
caregivers | -6.572 |
Token | � |
Token ID | 564 |
Feature activation | -4.58e-01 |
Pos logit contributions | |
libel | +21.579 |
rubbish | +18.606 |
doping | +17.509 |
Serie | +17.463 |
offensive | +17.397 |
Neg logit contributions | |
companions | -13.678 |
grandchildren | -13.349 |
unborn | -13.124 |
caregivers | -12.874 |
newfound | -12.732 |
Token | � |
Token ID | 250 |
Feature activation | -5.94e-01 |
Pos logit contributions | |
libel | +5.310 |
rubbish | +4.315 |
offensive | +4.181 |
advert | +3.980 |
Serie | +3.978 |
Neg logit contributions | |
companions | -6.227 |
newfound | -6.115 |
unborn | -6.113 |
grandchildren | -6.019 |
awakening | -5.876 |
Token | You |
Token ID | 1639 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
Anyway | +23.493 |
England | +23.292 |
Football | +22.216 |
libel | +21.969 |
Basically | +21.229 |
Neg logit contributions | |
unborn | -26.115 |
newfound | -25.543 |
companions | -25.168 |
awakening | -24.915 |
caregivers | -24.482 |
Token | have |
Token ID | 423 |
Feature activation | -2.37e+00 |
Pos logit contributions | |
libel | +24.917 |
rubbish | +21.935 |
punt | +21.389 |
analyse | +20.851 |
penal | +20.644 |
Neg logit contributions | |
newfound | -18.046 |
companions | -17.881 |
unborn | -17.384 |
awakening | -16.717 |
grandchildren | -16.588 |
Token | ( |
Token ID | 357 |
Feature activation | -2.42e+00 |
Pos logit contributions | |
libel | +28.535 |
rubbish | +25.959 |
England | +24.752 |
cricket | +24.551 |
racket | +24.361 |
Neg logit contributions | |
companions | -13.603 |
reetings | -13.461 |
newfound | -13.426 |
unborn | -13.404 |
ollower | -13.292 |
Token | bow |
Token ID | 8176 |
Feature activation | -6.56e-01 |
Pos logit contributions | |
libel | +25.727 |
offensive | +25.378 |
England | +23.518 |
football | +23.515 |
pub | +23.055 |
Neg logit contributions | |
unborn | -17.505 |
companions | -17.424 |
caregivers | -16.973 |
grandchildren | -16.549 |
awakening | -16.528 |
Token | led |
Token ID | 992 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
libel | +8.600 |
rubbish | +7.185 |
offensive | +6.999 |
advert | +6.715 |
punt | +6.668 |
Neg logit contributions | |
companions | -7.707 |
newfound | -7.584 |
unborn | -7.556 |
grandchildren | -7.459 |
caregivers | -7.244 |
Token | ) |
Token ID | 8 |
Feature activation | -2.32e+00 |
Pos logit contributions | |
libel | +25.347 |
rubbish | +23.052 |
offensive | +22.205 |
England | +21.771 |
advert | +21.566 |
Neg logit contributions | |
unborn | -13.967 |
newfound | -13.762 |
companions | -13.705 |
caregivers | -13.368 |
grandchildren | -13.314 |
Token | a |
Token ID | 257 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
libel | +27.984 |
rubbish | +26.015 |
England | +24.585 |
offensive | +24.485 |
racket | +24.233 |
Neg logit contributions | |
newfound | -13.186 |
unborn | -13.122 |
companions | -13.115 |
awakened | -12.576 |
caregivers | -12.427 |
Token | no |
Token ID | 645 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
libel | +25.981 |
rubbish | +23.399 |
racket | +22.806 |
punt | +22.786 |
cricket | +22.031 |
Neg logit contributions | |
companions | -14.218 |
unborn | -14.037 |
caregivers | -13.833 |
grandchildren | -13.680 |
reetings | -13.389 |
Token | - |
Token ID | 12 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
libel | +22.514 |
offensive | +19.689 |
rubbish | +19.624 |
punt | +19.038 |
racket | +18.654 |
Neg logit contributions | |
companions | -14.089 |
newfound | -13.646 |
grandchildren | -13.536 |
unborn | -13.224 |
caregivers | -13.183 |
Token | ball |
Token ID | 1894 |
Feature activation | -2.53e+00 |
Pos logit contributions | |
libel | +15.234 |
offensive | +13.504 |
rubbish | +12.702 |
shit | +12.101 |
punt | +11.978 |
Neg logit contributions | |
companions | -15.361 |
newfound | -14.946 |
unborn | -14.921 |
grandchildren | -14.817 |
caregivers | -14.529 |
Token | when |
Token ID | 618 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
libel | +28.572 |
rubbish | +25.613 |
offensive | +25.385 |
racket | +24.922 |
punt | +24.822 |
Neg logit contributions | |
companions | -15.701 |
newfound | -15.190 |
caregivers | -15.181 |
grandchildren | -15.074 |
unborn | -14.728 |
Token | be |
Token ID | 307 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
libel | +14.281 |
rubbish | +12.137 |
punt | +11.399 |
offensive | +11.218 |
advert | +11.218 |
Neg logit contributions | |
companions | -13.095 |
newfound | -12.995 |
unborn | -12.970 |
grandchildren | -12.783 |
caregivers | -12.465 |
Token | corrected |
Token ID | 19267 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
libel | +18.448 |
rubbish | +15.820 |
advert | +15.092 |
penal | +14.984 |
punt | +14.846 |
Neg logit contributions | |
companions | -12.607 |
unborn | -12.174 |
newfound | -12.080 |
grandchildren | -12.013 |
blessings | -11.635 |
Token | . |
Token ID | 13 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
libel | +16.810 |
rubbish | +14.278 |
offensive | +13.560 |
advert | +13.367 |
vitro | +13.246 |
Neg logit contributions | |
newfound | -14.834 |
companions | -14.820 |
unborn | -14.591 |
grandchildren | -14.416 |
caregivers | -13.905 |
Token |
|
Token ID | 198 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
libel | +17.526 |
Serie | +14.747 |
rubbish | +14.636 |
offensive | +14.572 |
England | +14.564 |
Neg logit contributions | |
companions | -15.471 |
unborn | -15.370 |
newfound | -15.231 |
grandchildren | -14.830 |
awakening | -14.655 |
Token |
|
Token ID | 198 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
libel | +4.031 |
offensive | +3.216 |
rubbish | +3.205 |
Serie | +3.073 |
advert | +3.035 |
Neg logit contributions | |
companions | -5.446 |
unborn | -5.411 |
newfound | -5.387 |
awakening | -5.282 |
caregivers | -5.273 |
Token | " |
Token ID | 1 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
libel | +13.800 |
offensive | +11.647 |
rubbish | +11.226 |
England | +11.046 |
Anyway | +10.937 |
Neg logit contributions | |
companions | -14.820 |
unborn | -14.742 |
newfound | -14.488 |
grandchildren | -14.404 |
caregivers | -14.214 |
Token | The |
Token ID | 464 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
England | +25.030 |
Anyway | +24.794 |
Football | +24.322 |
libel | +23.240 |
Basically | +23.059 |
Neg logit contributions | |
unborn | -26.459 |
companions | -25.802 |
newfound | -25.573 |
awakening | -25.082 |
caregivers | -25.045 |
Token | ICC |
Token ID | 32300 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
libel | +27.016 |
rubbish | +24.034 |
racket | +23.510 |
England | +23.314 |
cricket | +23.003 |
Neg logit contributions | |
companions | -12.083 |
newfound | -11.587 |
unborn | -11.530 |
grandchildren | -11.466 |
caregivers | -10.761 |
Token | has |
Token ID | 468 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
libel | +31.677 |
penal | +28.109 |
rubbish | +27.895 |
advert | +27.762 |
racket | +27.629 |
Neg logit contributions | |
newfound | -16.143 |
unborn | -16.134 |
companions | -16.107 |
grandchildren | -14.863 |
caregivers | -14.860 |
Token | a |
Token ID | 257 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
libel | +24.824 |
rubbish | +22.070 |
penal | +21.097 |
advert | +20.798 |
racket | +20.622 |
Neg logit contributions | |
companions | -13.362 |
unborn | -12.967 |
caregivers | -12.724 |
reetings | -12.702 |
newfound | -12.694 |
Token | rule |
Token ID | 3896 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
libel | +24.848 |
rubbish | +21.672 |
racket | +20.971 |
penal | +20.522 |
punt | +20.428 |
Neg logit contributions | |
companions | -13.405 |
unborn | -13.115 |
caregivers | -12.923 |
grandchildren | -12.512 |
occupants | -12.217 |
Token | not |
Token ID | 407 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
libel | +14.563 |
rubbish | +12.789 |
offensive | +12.044 |
punt | +11.729 |
advert | +11.629 |
Neg logit contributions | |
unborn | -10.199 |
companions | -10.103 |
newfound | -9.983 |
grandchildren | -9.927 |
caregivers | -9.606 |
Token | types |
Token ID | 3858 |
Feature activation | -8.49e-02 |
Pos logit contributions | |
libel | +14.446 |
rubbish | +12.440 |
offensive | +11.873 |
advert | +11.599 |
punt | +11.569 |
Neg logit contributions | |
unborn | -10.002 |
companions | -9.968 |
newfound | -9.794 |
grandchildren | -9.751 |
awakening | -9.381 |
Token | of |
Token ID | 286 |
Feature activation | -5.57e-01 |
Pos logit contributions | |
libel | +0.989 |
rubbish | +0.797 |
offensive | +0.783 |
Serie | +0.748 |
vitro | +0.746 |
Neg logit contributions | |
companions | -1.143 |
newfound | -1.120 |
unborn | -1.119 |
grandchildren | -1.095 |
awakening | -1.083 |
Token | questions |
Token ID | 2683 |
Feature activation | -3.02e-01 |
Pos logit contributions | |
libel | +8.304 |
rubbish | +7.125 |
offensive | +6.926 |
advert | +6.730 |
Serie | +6.675 |
Neg logit contributions | |
companions | -5.505 |
unborn | -5.400 |
newfound | -5.388 |
grandchildren | -5.316 |
caregivers | -5.104 |
Token | covered |
Token ID | 5017 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
libel | +3.771 |
rubbish | +3.088 |
offensive | +3.024 |
Serie | +2.891 |
advert | +2.887 |
Neg logit contributions | |
companions | -3.840 |
unborn | -3.757 |
newfound | -3.754 |
grandchildren | -3.709 |
caregivers | -3.605 |
Token | in |
Token ID | 287 |
Feature activation | -2.26e+00 |
Pos logit contributions | |
libel | +17.706 |
rubbish | +14.921 |
advert | +14.432 |
offensive | +14.180 |
wik | +13.913 |
Neg logit contributions | |
unborn | -15.413 |
companions | -15.342 |
newfound | -15.323 |
grandchildren | -15.279 |
blessings | -14.831 |
Token | interview |
Token ID | 2720 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
libel | +27.924 |
rubbish | +24.277 |
wik | +23.837 |
offensive | +23.776 |
advert | +23.763 |
Neg logit contributions | |
unborn | -14.591 |
companions | -13.897 |
grandchildren | -13.749 |
newfound | -13.448 |
caregivers | -13.418 |
Token | prep |
Token ID | 3143 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
libel | +15.454 |
rubbish | +13.436 |
offensive | +12.930 |
advert | +12.754 |
vitro | +12.448 |
Neg logit contributions | |
unborn | -10.469 |
grandchildren | -10.230 |
companions | -10.229 |
newfound | -10.127 |
caregivers | -9.737 |
Token | books |
Token ID | 3835 |
Feature activation | -7.83e-01 |
Pos logit contributions | |
libel | +18.378 |
rubbish | +16.052 |
advert | +15.078 |
wik | +15.070 |
offensive | +14.993 |
Neg logit contributions | |
unborn | -15.414 |
grandchildren | -14.804 |
newfound | -14.670 |
companions | -14.559 |
caregivers | -13.989 |
Token | . |
Token ID | 13 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
libel | +8.920 |
rubbish | +7.288 |
offensive | +7.030 |
advert | +6.822 |
Serie | +6.666 |
Neg logit contributions | |
companions | -10.193 |
unborn | -10.061 |
newfound | -10.029 |
grandchildren | -9.923 |
caregivers | -9.627 |
Token | Really |
Token ID | 26392 |
Feature activation | +6.22e-02 |
Pos logit contributions | |
libel | +13.870 |
rubbish | +11.597 |
Anyway | +11.278 |
Serie | +11.185 |
Switzerland | +11.153 |
Neg logit contributions | |
unborn | -13.579 |
companions | -13.515 |
newfound | -13.404 |
grandchildren | -13.188 |
awakening | -12.960 |