Token | like |
Token ID | 588 |
Feature activation | +5.51e+00 |
Pos logit contributions | |
BY | +1.182 |
Decay | +1.149 |
than | +1.073 |
unfavorable | +1.073 |
Geological | +1.046 |
Neg logit contributions | |
genders | -1.515 |
blance | -1.473 |
aults | -1.437 |
rils | -1.422 |
rights | -1.415 |
Token | to |
Token ID | 284 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
BY | +3.759 |
Decay | +3.645 |
unfavorable | +3.430 |
than | +3.423 |
periodic | +3.345 |
Neg logit contributions | |
genders | -4.362 |
blance | -4.286 |
aults | -4.140 |
rils | -4.120 |
rights | -4.068 |
Token | reflect |
Token ID | 4079 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
BY | +6.696 |
Decay | +6.181 |
than | +6.088 |
orally | +6.074 |
periodic | +6.039 |
Neg logit contributions | |
blance | -9.304 |
genders | -9.158 |
aults | -8.901 |
rights | -8.830 |
rils | -8.823 |
Token | in |
Token ID | 287 |
Feature activation | +9.18e+00 |
Pos logit contributions | |
BY | +1.405 |
Decay | +1.365 |
unfavorable | +1.290 |
than | +1.288 |
orally | +1.255 |
Neg logit contributions | |
genders | -1.568 |
blance | -1.520 |
aults | -1.477 |
rils | -1.467 |
empowerment | -1.455 |
Token | everything |
Token ID | 2279 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
BY | +5.998 |
Decay | +5.959 |
unfavorable | +5.564 |
periodic | +5.549 |
than | +5.474 |
Neg logit contributions | |
genders | -7.189 |
blance | -7.161 |
rils | -6.853 |
itans | -6.726 |
rights | -6.726 |
Token | we |
Token ID | 356 |
Feature activation | +3.03e+01 |
Pos logit contributions | |
Decay | +10.154 |
BY | +9.967 |
unfavorable | +9.196 |
periodic | +9.005 |
orally | +8.913 |
Neg logit contributions | |
blance | -15.152 |
rils | -14.876 |
genders | -14.743 |
itans | -14.397 |
OULD | -14.086 |
Token | do |
Token ID | 466 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
Decay | +11.239 |
BY | +10.745 |
orally | +10.696 |
administr | +10.233 |
Announce | +10.099 |
Neg logit contributions | |
blance | -21.768 |
srfAttach | -20.712 |
genders | -20.704 |
サーティワン | -20.533 |
rils | -20.335 |
Token | from |
Token ID | 422 |
Feature activation | +8.95e+00 |
Pos logit contributions | |
BY | +9.463 |
Decay | +9.187 |
orally | +8.999 |
than | +8.821 |
unfavorable | +8.616 |
Neg logit contributions | |
blance | -15.691 |
rils | -15.101 |
genders | -15.031 |
itans | -14.813 |
CLS | -14.676 |
Token | the |
Token ID | 262 |
Feature activation | +6.49e+00 |
Pos logit contributions | |
BY | +5.820 |
Decay | +5.701 |
unfavorable | +5.364 |
than | +5.342 |
periodic | +5.324 |
Neg logit contributions | |
blance | -7.099 |
genders | -6.908 |
rils | -6.735 |
aults | -6.574 |
mattered | -6.544 |
Token | posters |
Token ID | 19379 |
Feature activation | +5.62e-01 |
Pos logit contributions | |
BY | +4.561 |
Decay | +4.408 |
than | +4.170 |
unfavorable | +4.153 |
periodic | +4.106 |
Neg logit contributions | |
blance | -5.016 |
genders | -4.904 |
rils | -4.693 |
mattered | -4.639 |
rights | -4.634 |
Token | that |
Token ID | 326 |
Feature activation | +7.72e+00 |
Pos logit contributions | |
BY | +0.411 |
Decay | +0.401 |
than | +0.378 |
unfavorable | +0.377 |
Geological | +0.368 |
Neg logit contributions | |
genders | -0.430 |
blance | -0.413 |
aults | -0.402 |
rils | -0.398 |
empowerment | -0.398 |
Token |
|
Token ID | 198 |
Feature activation | -5.48e+00 |
Pos logit contributions | |
BY | +0.288 |
Decay | +0.279 |
than | +0.266 |
unfavorable | +0.263 |
Geological | +0.259 |
Neg logit contributions | |
genders | -0.264 |
blance | -0.255 |
aults | -0.246 |
empowerment | -0.244 |
rils | -0.244 |
Token | Order |
Token ID | 18743 |
Feature activation | -9.06e-01 |
Pos logit contributions | |
genders | +4.372 |
blance | +4.299 |
rights | +4.217 |
aults | +4.215 |
rils | +4.141 |
Neg logit contributions | |
Decay | -3.528 |
BY | -3.387 |
unfavorable | -3.317 |
orally | -3.256 |
periodic | -3.235 |
Token | Now |
Token ID | 2735 |
Feature activation | +6.83e+00 |
Pos logit contributions | |
genders | +0.766 |
blance | +0.735 |
aults | +0.721 |
empowerment | +0.717 |
rils | +0.713 |
Neg logit contributions | |
BY | -0.590 |
Decay | -0.568 |
than | -0.535 |
unfavorable | -0.534 |
Geological | -0.519 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +7.70e+00 |
Pos logit contributions | |
BY | +4.796 |
Decay | +4.690 |
than | +4.346 |
unfavorable | +4.281 |
Geological | +4.236 |
Neg logit contributions | |
genders | -5.329 |
blance | -5.224 |
aults | -4.996 |
rils | -4.982 |
mattered | -4.904 |
Token | After |
Token ID | 3260 |
Feature activation | +9.59e+00 |
Pos logit contributions | |
BY | +5.311 |
than | +4.729 |
Decay | +4.682 |
unfavorable | +4.322 |
Geological | +4.320 |
Neg logit contributions | |
genders | -6.404 |
blance | -6.048 |
mattered | -5.955 |
empowerment | -5.903 |
aults | -5.869 |
Token | much |
Token ID | 881 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
BY | +6.737 |
Decay | +6.586 |
unfavorable | +6.330 |
than | +6.204 |
periodic | +6.142 |
Neg logit contributions | |
genders | -6.989 |
blance | -6.892 |
aults | -6.652 |
rights | -6.510 |
rils | -6.503 |
Token | talk |
Token ID | 1561 |
Feature activation | +9.63e+00 |
Pos logit contributions | |
preparation | +17.258 |
unfavorable | +16.724 |
periodic | +16.250 |
BY | +15.998 |
Decay | +15.755 |
Neg logit contributions | |
blance | -15.984 |
rights | -15.962 |
rils | -15.883 |
aults | -15.564 |
genders | -15.442 |
Token | about |
Token ID | 546 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
BY | +5.920 |
Decay | +5.802 |
unfavorable | +5.537 |
than | +5.455 |
periodic | +5.302 |
Neg logit contributions | |
genders | -7.790 |
blance | -7.659 |
rils | -7.422 |
aults | -7.419 |
itans | -7.322 |
Token | the |
Token ID | 262 |
Feature activation | -3.59e+00 |
Pos logit contributions | |
genders | +10.721 |
empowerment | +10.045 |
equality | +10.043 |
wheelchair | +9.796 |
blance | +9.741 |
Neg logit contributions | |
BY | -8.582 |
Decay | -8.104 |
than | -7.830 |
Geological | -7.640 |
orally | -7.461 |
Token | upcoming |
Token ID | 7865 |
Feature activation | -2.46e+00 |
Pos logit contributions | |
genders | +2.905 |
blance | +2.724 |
empowerment | +2.700 |
aults | +2.668 |
wheelchair | +2.645 |
Neg logit contributions | |
BY | -2.472 |
Decay | -2.378 |
than | -2.252 |
unfavorable | -2.206 |
Geological | -2.181 |
Token | Fifty |
Token ID | 35351 |
Feature activation | +4.20e+00 |
Pos logit contributions | |
genders | +1.950 |
blance | +1.841 |
aults | +1.808 |
empowerment | +1.805 |
rils | +1.782 |
Neg logit contributions | |
BY | -1.725 |
Decay | -1.675 |
than | -1.588 |
unfavorable | -1.576 |
orally | -1.540 |
Token | articles |
Token ID | 6685 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
BY | +10.459 |
unfavorable | +10.247 |
than | +10.135 |
Decay | +9.910 |
orally | +9.809 |
Neg logit contributions | |
genders | -11.024 |
blance | -10.861 |
rils | -10.722 |
aults | -10.378 |
itans | -10.352 |
Token | , |
Token ID | 11 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
unfavorable | +11.258 |
BY | +10.899 |
orally | +10.819 |
incomplete | +10.415 |
Decay | +10.225 |
Neg logit contributions | |
blance | -12.770 |
genders | -12.745 |
rils | -12.440 |
itans | -12.269 |
empowerment | -12.261 |
Token | and |
Token ID | 290 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
BY | +6.959 |
Decay | +6.616 |
unfavorable | +6.602 |
than | +6.431 |
orally | +6.365 |
Neg logit contributions | |
blance | -7.653 |
genders | -7.562 |
rils | -7.284 |
aults | -7.280 |
itans | -7.204 |
Token | arguments |
Token ID | 7159 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
BY | +11.121 |
unfavorable | +10.886 |
orally | +10.422 |
Decay | +10.392 |
incomplete | +10.327 |
Neg logit contributions | |
blance | -10.208 |
genders | -9.673 |
rils | -9.652 |
aults | -9.601 |
itans | -9.549 |
Token | , |
Token ID | 11 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
unfavorable | +11.692 |
BY | +11.542 |
orally | +11.533 |
than | +10.762 |
Decay | +10.703 |
Neg logit contributions | |
genders | -13.437 |
rils | -13.296 |
blance | -13.165 |
empowerment | -12.931 |
aults | -12.901 |
Token | partly |
Token ID | 11476 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
BY | +11.685 |
unfavorable | +11.453 |
than | +11.169 |
Decay | +11.000 |
orally | +10.984 |
Neg logit contributions | |
genders | -11.655 |
blance | -11.594 |
rils | -11.382 |
aults | -11.140 |
itans | -11.124 |
Token | also |
Token ID | 635 |
Feature activation | +2.77e+01 |
Pos logit contributions | |
BY | +15.344 |
orally | +14.891 |
unfavorable | +14.503 |
incomplete | +14.012 |
periodic | +13.671 |
Neg logit contributions | |
blance | -16.738 |
genders | -16.638 |
rils | -16.519 |
rights | -16.211 |
OULD | -16.089 |
Token | because |
Token ID | 780 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
BY | +15.110 |
unfavorable | +14.718 |
orally | +14.614 |
incomplete | +13.852 |
periodic | +13.643 |
Neg logit contributions | |
genders | -16.124 |
blance | -15.902 |
rils | -15.874 |
OULD | -15.599 |
aults | -15.428 |
Token | those |
Token ID | 883 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
BY | +9.978 |
unfavorable | +9.757 |
orally | +9.583 |
Decay | +9.455 |
periodic | +9.125 |
Neg logit contributions | |
rils | -12.025 |
blance | -11.964 |
genders | -11.808 |
aults | -11.751 |
rights | -11.426 |
Token | things |
Token ID | 1243 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
BY | +11.508 |
unfavorable | +11.318 |
Decay | +11.175 |
orally | +11.021 |
periodic | +10.887 |
Neg logit contributions | |
blance | -4.457 |
genders | -4.212 |
rils | -4.117 |
itans | -3.909 |
aults | -3.880 |
Token | that |
Token ID | 326 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
unfavorable | +13.402 |
BY | +13.354 |
orally | +12.973 |
Decay | +12.785 |
than | +12.132 |
Neg logit contributions | |
blance | -12.380 |
genders | -12.290 |
rils | -12.007 |
aults | -11.855 |
itans | -11.724 |
Token | 'll |
Token ID | 1183 |
Feature activation | +9.90e+00 |
Pos logit contributions | |
BY | +0.261 |
Decay | +0.255 |
than | +0.239 |
unfavorable | +0.239 |
Geological | +0.233 |
Neg logit contributions | |
genders | -0.284 |
blance | -0.274 |
aults | -0.267 |
rils | -0.264 |
empowerment | -0.263 |
Token | Feel |
Token ID | 18571 |
Feature activation | +7.10e+00 |
Pos logit contributions | |
Decay | +6.506 |
BY | +6.432 |
than | +5.961 |
Geological | +5.883 |
orally | +5.785 |
Neg logit contributions | |
genders | -7.758 |
blance | -7.692 |
aults | -7.357 |
rils | -7.350 |
rights | -7.306 |
Token | a |
Token ID | 257 |
Feature activation | +4.91e+00 |
Pos logit contributions | |
Decay | +4.139 |
BY | +4.101 |
than | +3.769 |
Geological | +3.676 |
unfavorable | +3.660 |
Neg logit contributions | |
genders | -6.299 |
blance | -6.132 |
aults | -5.937 |
rils | -5.889 |
rights | -5.853 |
Token | Whole |
Token ID | 23431 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
Decay | +3.217 |
BY | +3.187 |
than | +2.960 |
Geological | +2.924 |
unfavorable | +2.843 |
Neg logit contributions | |
genders | -4.123 |
blance | -3.938 |
aults | -3.851 |
empowerment | -3.837 |
rils | -3.818 |
Token | Lot |
Token ID | 15099 |
Feature activation | +1.81e+01 |
Pos logit contributions | |
Decay | +6.117 |
BY | +5.907 |
than | +5.672 |
Geological | +5.531 |
Expedition | +5.221 |
Neg logit contributions | |
genders | -8.922 |
blance | -8.640 |
rils | -8.542 |
empowerment | -8.394 |
rights | -8.346 |
Token | Better |
Token ID | 11625 |
Feature activation | +2.84e+01 |
Pos logit contributions | |
Decay | +9.798 |
BY | +9.311 |
than | +9.102 |
Regular | +8.366 |
Fish | +8.354 |
Neg logit contributions | |
genders | -14.324 |
OULD | -13.832 |
blance | -13.592 |
itans | -13.397 |
rights | -13.389 |
Token | " |
Token ID | 1 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
than | +15.495 |
Decay | +15.406 |
BY | +14.980 |
"( | +14.347 |
Geological | +14.065 |
Neg logit contributions | |
genders | -17.437 |
blance | -16.786 |
rils | -16.715 |
itans | -16.524 |
empowerment | -16.256 |
Token | ( |
Token ID | 357 |
Feature activation | +6.65e+00 |
Pos logit contributions | |
BY | +9.332 |
Decay | +9.210 |
Geological | +8.596 |
than | +8.472 |
unfavorable | +8.343 |
Neg logit contributions | |
blance | -10.007 |
genders | -9.776 |
aults | -9.495 |
rils | -9.457 |
rights | -9.218 |
Token | B |
Token ID | 33 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
BY | +5.476 |
Decay | +5.204 |
than | +5.060 |
unfavorable | +4.854 |
Geological | +4.774 |
Neg logit contributions | |
genders | -4.508 |
blance | -4.348 |
aults | -4.167 |
mattered | -4.137 |
rils | -4.136 |
Token | yr |
Token ID | 2417 |
Feature activation | +5.64e+00 |
Pos logit contributions | |
genders | +0.264 |
blance | +0.254 |
aults | +0.248 |
rils | +0.245 |
empowerment | +0.244 |
Neg logit contributions | |
BY | -0.244 |
Decay | -0.238 |
than | -0.224 |
unfavorable | -0.224 |
Geological | -0.218 |
Token | ds |
Token ID | 9310 |
Feature activation | +8.73e+00 |
Pos logit contributions | |
BY | +4.061 |
Decay | +3.871 |
than | +3.754 |
unfavorable | +3.621 |
Geological | +3.584 |
Neg logit contributions | |
genders | -4.322 |
blance | -4.138 |
mattered | -4.007 |
aults | -4.005 |
empowerment | -3.976 |
Token | notion |
Token ID | 9495 |
Feature activation | +7.17e+00 |
Pos logit contributions | |
genders | +1.051 |
blance | +0.990 |
empowerment | +0.975 |
aults | +0.970 |
mattered | +0.958 |
Neg logit contributions | |
BY | -1.090 |
Decay | -1.066 |
than | -1.004 |
unfavorable | -0.986 |
Geological | -0.966 |
Token | of |
Token ID | 286 |
Feature activation | -4.30e+00 |
Pos logit contributions | |
BY | +4.300 |
Decay | +4.179 |
unfavorable | +4.017 |
than | +3.890 |
Geological | +3.883 |
Neg logit contributions | |
genders | -6.146 |
blance | -6.003 |
aults | -5.873 |
rils | -5.858 |
rights | -5.733 |
Token | a |
Token ID | 257 |
Feature activation | -6.54e+00 |
Pos logit contributions | |
genders | +3.503 |
empowerment | +3.323 |
blance | +3.294 |
aults | +3.255 |
equality | +3.244 |
Neg logit contributions | |
BY | -2.906 |
Decay | -2.848 |
than | -2.667 |
unfavorable | -2.570 |
orally | -2.522 |
Token | crisis |
Token ID | 4902 |
Feature activation | +5.42e+00 |
Pos logit contributions | |
genders | +5.250 |
empowerment | +4.948 |
aults | +4.886 |
blance | +4.879 |
wheelchair | +4.867 |
Neg logit contributions | |
BY | -4.339 |
Decay | -4.262 |
than | -4.009 |
unfavorable | -3.875 |
orally | -3.772 |
Token | caused |
Token ID | 4073 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
BY | +3.737 |
Decay | +3.652 |
unfavorable | +3.513 |
than | +3.460 |
Geological | +3.422 |
Neg logit contributions | |
genders | -4.248 |
blance | -4.142 |
aults | -4.027 |
rils | -4.007 |
rights | -3.935 |
Token | primarily |
Token ID | 7525 |
Feature activation | +2.83e+01 |
Pos logit contributions | |
BY | +4.969 |
Decay | +4.547 |
unfavorable | +4.547 |
orally | +4.376 |
periodic | +4.264 |
Neg logit contributions | |
genders | -10.562 |
blance | -10.329 |
aults | -10.001 |
rils | -10.000 |
rights | -9.780 |
Token | by |
Token ID | 416 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
BY | +12.310 |
unfavorable | +11.577 |
Geological | +11.156 |
orally | +11.033 |
by | +10.904 |
Neg logit contributions | |
genders | -20.715 |
blance | -20.296 |
rils | -19.719 |
aults | -19.196 |
CLS | -18.848 |
Token | climate |
Token ID | 4258 |
Feature activation | -2.99e+00 |
Pos logit contributions | |
BY | +6.844 |
Decay | +6.828 |
unfavorable | +6.760 |
periodic | +6.566 |
Geological | +6.410 |
Neg logit contributions | |
blance | -7.471 |
genders | -7.406 |
rils | -7.178 |
itans | -7.061 |
rights | -7.003 |
Token | changes |
Token ID | 2458 |
Feature activation | +6.46e+00 |
Pos logit contributions | |
genders | +1.705 |
empowerment | +1.561 |
blance | +1.557 |
aults | +1.556 |
mattered | +1.530 |
Neg logit contributions | |
BY | -2.776 |
Decay | -2.717 |
than | -2.590 |
unfavorable | -2.538 |
orally | -2.529 |
Token | . |
Token ID | 13 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
BY | +4.273 |
Decay | +4.109 |
unfavorable | +4.057 |
than | +3.983 |
Geological | +3.869 |
Neg logit contributions | |
genders | -5.163 |
blance | -5.079 |
rils | -4.904 |
aults | -4.852 |
empowerment | -4.808 |
Token | It |
Token ID | 632 |
Feature activation | -3.11e+00 |
Pos logit contributions | |
BY | +1.408 |
Decay | +1.382 |
than | +1.290 |
unfavorable | +1.278 |
Geological | +1.268 |
Neg logit contributions | |
genders | -1.647 |
blance | -1.588 |
aults | -1.539 |
empowerment | -1.534 |
rils | -1.529 |
Token | the |
Token ID | 262 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
genders | +1.608 |
blance | +1.532 |
aults | +1.502 |
empowerment | +1.493 |
rils | +1.483 |
Neg logit contributions | |
BY | -1.466 |
Decay | -1.438 |
than | -1.348 |
unfavorable | -1.331 |
Geological | -1.312 |
Token | campaign |
Token ID | 1923 |
Feature activation | +6.08e+00 |
Pos logit contributions | |
BY | +1.196 |
Decay | +1.168 |
unfavorable | +1.104 |
than | +1.100 |
Geological | +1.069 |
Neg logit contributions | |
genders | -1.300 |
blance | -1.265 |
aults | -1.224 |
rils | -1.215 |
rights | -1.205 |
Token | has |
Token ID | 468 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
BY | +4.005 |
Decay | +3.900 |
unfavorable | +3.720 |
than | +3.653 |
Geological | +3.604 |
Neg logit contributions | |
genders | -4.861 |
blance | -4.798 |
aults | -4.646 |
rils | -4.603 |
itans | -4.532 |
Token | further |
Token ID | 2252 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
BY | +7.577 |
Decay | +7.320 |
unfavorable | +7.271 |
orally | +7.126 |
periodic | +7.051 |
Neg logit contributions | |
blance | -8.333 |
genders | -8.156 |
itans | -7.955 |
aults | -7.819 |
rils | -7.818 |
Token | been |
Token ID | 587 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
BY | +8.411 |
Decay | +8.259 |
unfavorable | +8.202 |
orally | +7.894 |
than | +7.866 |
Neg logit contributions | |
blance | -8.347 |
genders | -8.105 |
itans | -7.874 |
aults | -7.786 |
rights | -7.736 |
Token | hampered |
Token ID | 42629 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
BY | +7.954 |
unfavorable | +7.616 |
Decay | +7.575 |
than | +7.436 |
periodic | +7.377 |
Neg logit contributions | |
blance | -7.816 |
genders | -7.615 |
rils | -7.282 |
aults | -7.229 |
itans | -7.218 |
Token | by |
Token ID | 416 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
BY | +13.743 |
orally | +13.030 |
unfavorable | +13.029 |
by | +12.540 |
administr | +12.412 |
Neg logit contributions | |
blance | -18.238 |
aults | -18.113 |
genders | -17.818 |
rils | -17.467 |
itans | -17.204 |
Token | the |
Token ID | 262 |
Feature activation | +9.95e+00 |
Pos logit contributions | |
unfavorable | +10.797 |
BY | +10.634 |
Decay | +10.468 |
periodic | +10.218 |
incomplete | +9.899 |
Neg logit contributions | |
blance | -10.589 |
genders | -10.480 |
itans | -9.869 |
aults | -9.823 |
rils | -9.810 |
Token | press |
Token ID | 1803 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
BY | +6.799 |
Decay | +6.761 |
unfavorable | +6.617 |
periodic | +6.326 |
than | +6.306 |
Neg logit contributions | |
blance | -7.466 |
genders | -7.289 |
aults | -7.002 |
rils | -6.987 |
rights | -6.945 |
Token | - |
Token ID | 12 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
BY | +10.162 |
unfavorable | +10.096 |
Decay | +10.018 |
periodic | +9.600 |
than | +9.511 |
Neg logit contributions | |
genders | -9.710 |
blance | -9.643 |
rils | -9.070 |
aults | -9.013 |
itans | -8.988 |
Token | sh |
Token ID | 1477 |
Feature activation | -2.42e+00 |
Pos logit contributions | |
BY | +0.750 |
Decay | +0.731 |
than | +0.690 |
unfavorable | +0.688 |
Geological | +0.669 |
Neg logit contributions | |
genders | -0.805 |
blance | -0.774 |
aults | -0.753 |
rils | -0.745 |
empowerment | -0.744 |
Token | , |
Token ID | 11 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
unfavorable | +11.258 |
BY | +10.899 |
orally | +10.819 |
incomplete | +10.415 |
Decay | +10.225 |
Neg logit contributions | |
blance | -12.770 |
genders | -12.745 |
rils | -12.440 |
itans | -12.269 |
empowerment | -12.261 |
Token | and |
Token ID | 290 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
BY | +6.959 |
Decay | +6.616 |
unfavorable | +6.602 |
than | +6.431 |
orally | +6.365 |
Neg logit contributions | |
blance | -7.653 |
genders | -7.562 |
rils | -7.284 |
aults | -7.280 |
itans | -7.204 |
Token | arguments |
Token ID | 7159 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
BY | +11.121 |
unfavorable | +10.886 |
orally | +10.422 |
Decay | +10.392 |
incomplete | +10.327 |
Neg logit contributions | |
blance | -10.208 |
genders | -9.673 |
rils | -9.652 |
aults | -9.601 |
itans | -9.549 |
Token | , |
Token ID | 11 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
unfavorable | +11.692 |
BY | +11.542 |
orally | +11.533 |
than | +10.762 |
Decay | +10.703 |
Neg logit contributions | |
genders | -13.437 |
rils | -13.296 |
blance | -13.165 |
empowerment | -12.931 |
aults | -12.901 |
Token | partly |
Token ID | 11476 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
BY | +11.685 |
unfavorable | +11.453 |
than | +11.169 |
Decay | +11.000 |
orally | +10.984 |
Neg logit contributions | |
genders | -11.655 |
blance | -11.594 |
rils | -11.382 |
aults | -11.140 |
itans | -11.124 |
Token | also |
Token ID | 635 |
Feature activation | +2.77e+01 |
Pos logit contributions | |
BY | +15.344 |
orally | +14.891 |
unfavorable | +14.503 |
incomplete | +14.012 |
periodic | +13.671 |
Neg logit contributions | |
blance | -16.738 |
genders | -16.638 |
rils | -16.519 |
rights | -16.211 |
OULD | -16.089 |
Token | because |
Token ID | 780 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
BY | +15.110 |
unfavorable | +14.718 |
orally | +14.614 |
incomplete | +13.852 |
periodic | +13.643 |
Neg logit contributions | |
genders | -16.124 |
blance | -15.902 |
rils | -15.874 |
OULD | -15.599 |
aults | -15.428 |
Token | those |
Token ID | 883 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
BY | +9.978 |
unfavorable | +9.757 |
orally | +9.583 |
Decay | +9.455 |
periodic | +9.125 |
Neg logit contributions | |
rils | -12.025 |
blance | -11.964 |
genders | -11.808 |
aults | -11.751 |
rights | -11.426 |
Token | things |
Token ID | 1243 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
BY | +11.508 |
unfavorable | +11.318 |
Decay | +11.175 |
orally | +11.021 |
periodic | +10.887 |
Neg logit contributions | |
blance | -4.457 |
genders | -4.212 |
rils | -4.117 |
itans | -3.909 |
aults | -3.880 |
Token | that |
Token ID | 326 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
unfavorable | +13.402 |
BY | +13.354 |
orally | +12.973 |
Decay | +12.785 |
than | +12.132 |
Neg logit contributions | |
blance | -12.380 |
genders | -12.290 |
rils | -12.007 |
aults | -11.855 |
itans | -11.724 |
Token | are |
Token ID | 389 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
BY | +9.268 |
unfavorable | +8.989 |
Decay | +8.957 |
orally | +8.711 |
Geological | +8.373 |
Neg logit contributions | |
blance | -10.311 |
genders | -10.178 |
rils | -10.071 |
aults | -10.057 |
itans | -9.720 |
Token | bad |
Token ID | 2089 |
Feature activation | +7.65e+00 |
Pos logit contributions | |
BY | +4.107 |
Decay | +3.924 |
unfavorable | +3.839 |
periodic | +3.746 |
than | +3.744 |
Neg logit contributions | |
genders | -4.569 |
blance | -4.497 |
rils | -4.428 |
aults | -4.372 |
rights | -4.272 |
Token | sign |
Token ID | 1051 |
Feature activation | +4.00e+00 |
Pos logit contributions | |
BY | +4.773 |
Decay | +4.436 |
unfavorable | +4.367 |
than | +4.264 |
periodic | +4.228 |
Neg logit contributions | |
genders | -6.535 |
blance | -6.461 |
rils | -6.337 |
aults | -6.319 |
rights | -6.163 |
Token | is |
Token ID | 318 |
Feature activation | +6.15e+00 |
Pos logit contributions | |
BY | +2.653 |
Decay | +2.566 |
unfavorable | +2.443 |
than | +2.430 |
Geological | +2.346 |
Neg logit contributions | |
genders | -3.295 |
blance | -3.195 |
aults | -3.114 |
rils | -3.078 |
empowerment | -3.055 |
Token | if |
Token ID | 611 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
BY | +4.359 |
Decay | +4.237 |
unfavorable | +4.117 |
than | +4.056 |
periodic | +3.998 |
Neg logit contributions | |
genders | -4.666 |
blance | -4.534 |
rils | -4.431 |
aults | -4.400 |
rights | -4.318 |
Token | a |
Token ID | 257 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
BY | +7.217 |
unfavorable | +6.874 |
Decay | +6.830 |
periodic | +6.800 |
than | +6.550 |
Neg logit contributions | |
blance | -8.584 |
genders | -8.529 |
rils | -8.350 |
aults | -8.137 |
rights | -8.083 |
Token | country |
Token ID | 1499 |
Feature activation | +2.77e+01 |
Pos logit contributions | |
BY | +7.082 |
Decay | +6.714 |
unfavorable | +6.693 |
periodic | +6.622 |
than | +6.582 |
Neg logit contributions | |
blance | -10.362 |
rils | -10.334 |
genders | -10.284 |
aults | -9.801 |
rights | -9.781 |
Token | � |
Token ID | 447 |
Feature activation | +5.08e+00 |
Pos logit contributions | |
unfavorable | +15.515 |
travels | +15.295 |
orally | +15.126 |
incomplete | +14.857 |
BY | +14.847 |
Neg logit contributions | |
blance | -16.239 |
rils | -16.031 |
itans | -14.225 |
empowerment | -14.202 |
rights | -14.095 |
Token | � |
Token ID | 247 |
Feature activation | +8.74e+00 |
Pos logit contributions | |
BY | +2.583 |
Decay | +2.532 |
unfavorable | +2.354 |
than | +2.352 |
periodic | +2.199 |
Neg logit contributions | |
genders | -4.916 |
blance | -4.682 |
empowerment | -4.642 |
aults | -4.620 |
rils | -4.594 |
Token | s |
Token ID | 82 |
Feature activation | +1.98e+01 |
Pos logit contributions | |
BY | +6.438 |
than | +6.197 |
Decay | +6.105 |
unfavorable | +5.958 |
periodic | +5.656 |
Neg logit contributions | |
genders | -6.213 |
blance | -6.106 |
empowerment | -5.865 |
rils | -5.840 |
wheelchair | -5.779 |
Token | economy |
Token ID | 3773 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
BY | +13.049 |
unfavorable | +12.818 |
periodic | +12.679 |
Decay | +12.622 |
than | +12.229 |
Neg logit contributions | |
blance | -12.172 |
rils | -11.776 |
genders | -11.631 |
rights | -11.395 |
itans | -11.278 |
Token | is |
Token ID | 318 |
Feature activation | +8.04e+00 |
Pos logit contributions | |
BY | +7.344 |
Decay | +7.171 |
unfavorable | +7.059 |
than | +6.811 |
periodic | +6.736 |
Neg logit contributions | |
blance | -8.591 |
genders | -8.410 |
rils | -8.275 |
rights | -8.065 |
empowerment | -7.972 |
Token | written |
Token ID | 3194 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
unfavorable | +13.839 |
orally | +13.225 |
BY | +12.885 |
incomplete | +12.550 |
favorable | +11.952 |
Neg logit contributions | |
blance | -13.483 |
rils | -13.076 |
genders | -12.910 |
itans | -12.741 |
rights | -12.552 |
Token | by |
Token ID | 416 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
orally | +11.833 |
unfavorable | +11.590 |
BY | +10.967 |
incomplete | +10.512 |
than | +10.248 |
Neg logit contributions | |
rils | -14.007 |
genders | -13.867 |
blance | -13.859 |
itans | -13.525 |
aults | -13.258 |
Token | other |
Token ID | 584 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
BY | +13.289 |
unfavorable | +12.917 |
orally | +12.803 |
Decay | +12.546 |
than | +12.098 |
Neg logit contributions | |
blance | -13.697 |
rils | -13.010 |
aults | -12.939 |
rights | -12.779 |
itans | -12.557 |
Token | authors |
Token ID | 7035 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
BY | +10.835 |
than | +10.236 |
Decay | +10.165 |
orally | +10.159 |
unfavorable | +10.123 |
Neg logit contributions | |
blance | -12.183 |
aults | -11.360 |
rils | -11.291 |
rights | -11.014 |
olver | -11.003 |
Token | , |
Token ID | 11 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
BY | +7.703 |
unfavorable | +7.519 |
than | +7.436 |
orally | +7.414 |
Decay | +7.372 |
Neg logit contributions | |
genders | -6.882 |
rils | -6.573 |
blance | -6.567 |
empowerment | -6.445 |
aults | -6.388 |
Token | partly |
Token ID | 11476 |
Feature activation | +2.73e+01 |
Pos logit contributions | |
BY | +9.100 |
unfavorable | +8.646 |
Decay | +8.613 |
than | +8.563 |
orally | +8.518 |
Neg logit contributions | |
genders | -6.309 |
blance | -6.222 |
rils | -6.073 |
aults | -5.891 |
empowerment | -5.861 |
Token | on |
Token ID | 319 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
BY | +16.055 |
unfavorable | +15.683 |
orally | +15.574 |
incomplete | +14.808 |
periodic | +14.159 |
Neg logit contributions | |
blance | -16.068 |
rils | -15.890 |
genders | -15.315 |
rights | -15.232 |
OULD | -15.011 |
Token | account |
Token ID | 1848 |
Feature activation | +9.15e+00 |
Pos logit contributions | |
BY | +10.690 |
unfavorable | +10.539 |
Decay | +10.083 |
orally | +9.968 |
than | +9.835 |
Neg logit contributions | |
rils | -11.436 |
blance | -11.434 |
genders | -11.278 |
aults | -11.160 |
itans | -11.074 |
Token | of |
Token ID | 286 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
BY | +5.121 |
unfavorable | +4.950 |
Decay | +4.839 |
than | +4.753 |
orally | +4.627 |
Neg logit contributions | |
blance | -7.875 |
genders | -7.853 |
rils | -7.606 |
aults | -7.460 |
empowerment | -7.457 |
Token | the |
Token ID | 262 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
unfavorable | +13.066 |
BY | +12.823 |
Decay | +12.308 |
orally | +12.199 |
incomplete | +12.154 |
Neg logit contributions | |
blance | -11.653 |
rils | -11.540 |
genders | -11.515 |
aults | -11.433 |
rights | -11.100 |
Token | multiplication |
Token ID | 48473 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
unfavorable | +15.561 |
BY | +14.831 |
Decay | +14.668 |
incomplete | +14.446 |
periodic | +14.399 |
Neg logit contributions | |
blance | -11.401 |
rils | -11.302 |
aults | -10.926 |
genders | -10.736 |
rights | -10.725 |
Token | and |
Token ID | 290 |
Feature activation | +7.92e-02 |
Pos logit contributions | |
BY | +3.491 |
Decay | +3.363 |
unfavorable | +3.199 |
than | +3.199 |
orally | +3.149 |
Neg logit contributions | |
genders | -4.215 |
blance | -4.118 |
aults | -3.984 |
rils | -3.977 |
empowerment | -3.924 |
Token | has |
Token ID | 468 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
BY | +0.054 |
Decay | +0.053 |
than | +0.049 |
unfavorable | +0.049 |
Geological | +0.048 |
Neg logit contributions | |
genders | -0.065 |
blance | -0.062 |
aults | -0.061 |
empowerment | -0.060 |
rils | -0.060 |
Token | been |
Token ID | 587 |
Feature activation | -2.79e+00 |
Pos logit contributions | |
genders | +0.335 |
blance | +0.320 |
aults | +0.313 |
empowerment | +0.311 |
mattered | +0.310 |
Neg logit contributions | |
BY | -0.301 |
Decay | -0.294 |
than | -0.275 |
unfavorable | -0.274 |
Geological | -0.267 |
Token | stunned |
Token ID | 19987 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
genders | +2.093 |
blance | +1.969 |
wheelchair | +1.949 |
empowerment | +1.947 |
aults | +1.940 |
Neg logit contributions | |
BY | -2.064 |
Decay | -2.037 |
than | -1.901 |
unfavorable | -1.876 |
Geological | -1.858 |
Token | and |
Token ID | 290 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
BY | +9.931 |
Decay | +8.967 |
orally | +8.842 |
unfavorable | +8.778 |
periodic | +8.637 |
Neg logit contributions | |
blance | -13.739 |
genders | -13.378 |
rils | -13.190 |
aults | -13.066 |
itans | -12.946 |
Token | saddened |
Token ID | 40434 |
Feature activation | +2.71e+01 |
Pos logit contributions | |
genders | +0.719 |
blance | +0.676 |
aults | +0.657 |
empowerment | +0.653 |
mattered | +0.650 |
Neg logit contributions | |
BY | -1.102 |
Decay | -1.084 |
than | -1.030 |
unfavorable | -1.022 |
Geological | -1.010 |
Token | to |
Token ID | 284 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
BY | +13.866 |
orally | +12.612 |
by | +12.390 |
periodic | +12.037 |
unfavorable | +11.962 |
Neg logit contributions | |
blance | -17.762 |
genders | -17.101 |
itans | -17.078 |
aults | -17.043 |
rils | -17.004 |
Token | see |
Token ID | 766 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
BY | +7.097 |
Decay | +6.463 |
than | +6.436 |
periodic | +6.368 |
unfavorable | +6.345 |
Neg logit contributions | |
genders | -13.210 |
blance | -13.196 |
aults | -12.877 |
rils | -12.748 |
mattered | -12.578 |
Token | the |
Token ID | 262 |
Feature activation | -3.88e+00 |
Pos logit contributions | |
genders | +1.462 |
blance | +1.383 |
aults | +1.354 |
empowerment | +1.348 |
rils | +1.339 |
Neg logit contributions | |
BY | -1.476 |
Decay | -1.451 |
than | -1.364 |
unfavorable | -1.346 |
Geological | -1.331 |
Token | huge |
Token ID | 3236 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
genders | +3.004 |
empowerment | +2.782 |
blance | +2.779 |
aults | +2.759 |
wheelchair | +2.746 |
Neg logit contributions | |
BY | -2.799 |
Decay | -2.715 |
than | -2.568 |
unfavorable | -2.507 |
Geological | -2.494 |
Token | tent |
Token ID | 11105 |
Feature activation | -3.97e+00 |
Pos logit contributions | |
genders | +1.219 |
blance | +1.149 |
aults | +1.134 |
empowerment | +1.133 |
mattered | +1.117 |
Neg logit contributions | |
BY | -1.270 |
Decay | -1.239 |
than | -1.171 |
unfavorable | -1.154 |
Geological | -1.137 |
Token | special |
Token ID | 2041 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
BY | +2.216 |
Decay | +2.110 |
periodic | +2.045 |
unfavorable | +2.028 |
than | +1.975 |
Neg logit contributions | |
genders | -4.597 |
blance | -4.544 |
itans | -4.435 |
rils | -4.391 |
aults | -4.381 |
Token | offers |
Token ID | 4394 |
Feature activation | +4.11e+00 |
Pos logit contributions | |
BY | +5.530 |
unfavorable | +5.290 |
periodic | +5.125 |
than | +4.838 |
installments | +4.685 |
Neg logit contributions | |
blance | -12.092 |
genders | -11.603 |
rils | -11.447 |
サーティワン | -11.267 |
itans | -11.205 |
Token | for |
Token ID | 329 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
BY | +2.950 |
Decay | +2.798 |
than | +2.720 |
unfavorable | +2.710 |
Geological | +2.604 |
Neg logit contributions | |
genders | -3.166 |
blance | -3.138 |
rils | -3.007 |
itans | -2.974 |
aults | -2.971 |
Token | The |
Token ID | 383 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
BY | +4.538 |
Decay | +4.118 |
than | +3.641 |
unfavorable | +3.585 |
Geological | +3.585 |
Neg logit contributions | |
genders | -12.128 |
blance | -11.992 |
rils | -11.868 |
itans | -11.709 |
mattered | -11.427 |
Token | New |
Token ID | 968 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
BY | +6.104 |
Decay | +5.574 |
Geological | +5.168 |
Organization | +4.970 |
Regular | +4.894 |
Neg logit contributions | |
blance | -18.022 |
rils | -17.661 |
genders | -17.555 |
eatures | -17.516 |
ailability | -17.349 |
Token | York |
Token ID | 1971 |
Feature activation | +2.69e+01 |
Pos logit contributions | |
BY | +8.077 |
Geological | +7.045 |
than | +6.940 |
Organization | +6.841 |
Decay | +6.275 |
Neg logit contributions | |
ailability | -23.012 |
eatures | -22.964 |
blance | -22.726 |
rils | -22.091 |
genders | -22.089 |
Token | Times |
Token ID | 3782 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
Times | +9.141 |
than | +8.711 |
BY | +8.704 |
Geological | +8.437 |
Decay | +8.168 |
Neg logit contributions | |
blance | -24.275 |
ailability | -23.881 |
eatures | -23.561 |
pione | -23.223 |
genders | -22.958 |
Token | 's |
Token ID | 338 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
BY | +4.691 |
Decay | +4.180 |
than | +3.951 |
unfavorable | +3.733 |
Organization | +3.695 |
Neg logit contributions | |
blance | -15.935 |
rils | -15.629 |
genders | -15.462 |
itans | -14.983 |
サーティワン | -14.934 |
Token | products |
Token ID | 3186 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
BY | +6.353 |
periodic | +6.293 |
Decay | +5.964 |
than | +5.751 |
unfavorable | +5.664 |
Neg logit contributions | |
rils | -17.875 |
blance | -17.469 |
サーティワン | -16.994 |
itans | -16.931 |
genders | -16.689 |
Token | and |
Token ID | 290 |
Feature activation | +2.88e+00 |
Pos logit contributions | |
BY | +2.194 |
Decay | +2.122 |
than | +2.032 |
unfavorable | +1.990 |
Geological | +1.967 |
Neg logit contributions | |
genders | -2.634 |
blance | -2.602 |
empowerment | -2.488 |
rils | -2.479 |
aults | -2.455 |
Token | services |
Token ID | 2594 |
Feature activation | +4.68e+00 |
Pos logit contributions | |
BY | +2.607 |
Decay | +2.512 |
unfavorable | +2.462 |
periodic | +2.405 |
than | +2.402 |
Neg logit contributions | |
blance | -1.666 |
genders | -1.666 |
rils | -1.555 |
itans | -1.544 |
aults | -1.536 |
Token |
|
Token ID | 198 |
Feature activation | +5.50e+00 |
Pos logit contributions | |
BY | +3.187 |
Decay | +3.086 |
unfavorable | +2.937 |
than | +2.934 |
Geological | +2.869 |
Neg logit contributions | |
genders | -3.724 |
blance | -3.601 |
aults | -3.490 |
rils | -3.473 |
rights | -3.450 |
Token |
|
Token ID | 198 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
BY | +3.830 |
Decay | +3.543 |
than | +3.528 |
Geological | +3.384 |
unfavorable | +3.302 |
Neg logit contributions | |
blance | -4.439 |
genders | -4.437 |
empowerment | -4.221 |
rils | -4.177 |
mattered | -4.166 |
Token | The |
Token ID | 464 |
Feature activation | +9.37e+00 |
Pos logit contributions | |
BY | +7.222 |
than | +6.499 |
Decay | +6.195 |
Geological | +5.932 |
unfavorable | +5.832 |
Neg logit contributions | |
genders | -9.112 |
blance | -8.605 |
mattered | -8.466 |
empowerment | -8.362 |
wheelchair | -8.303 |
Token | FIR |
Token ID | 23703 |
Feature activation | +6.72e+00 |
Pos logit contributions | |
BY | +6.498 |
Decay | +6.290 |
unfavorable | +6.092 |
than | +6.091 |
periodic | +6.020 |
Neg logit contributions | |
genders | -6.921 |
blance | -6.796 |
aults | -6.544 |
rils | -6.526 |
itans | -6.458 |
Token | further |
Token ID | 2252 |
Feature activation | +4.61e+00 |
Pos logit contributions | |
BY | +5.146 |
Decay | +4.819 |
unfavorable | +4.655 |
than | +4.623 |
orally | +4.620 |
Neg logit contributions | |
genders | -4.805 |
blance | -4.645 |
aults | -4.482 |
rils | -4.422 |
rights | -4.416 |
Token | quotes |
Token ID | 13386 |
Feature activation | +2.67e+01 |
Pos logit contributions | |
BY | +3.173 |
Decay | +2.985 |
than | +2.913 |
unfavorable | +2.908 |
orally | +2.854 |
Neg logit contributions | |
genders | -3.639 |
blance | -3.570 |
aults | -3.435 |
rils | -3.427 |
rights | -3.413 |
Token | the |
Token ID | 262 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
orally | +16.016 |
BY | +15.605 |
unfavorable | +15.238 |
than | +15.214 |
Geological | +15.202 |
Neg logit contributions | |
blance | -14.444 |
itans | -14.198 |
genders | -14.092 |
rils | -13.990 |
OULD | -13.758 |
Token | contents |
Token ID | 10154 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
BY | +12.523 |
than | +12.434 |
orally | +12.319 |
unfavorable | +12.198 |
Decay | +12.117 |
Neg logit contributions | |
blance | -12.000 |
rils | -11.532 |
genders | -11.438 |
aults | -11.221 |
OULD | -11.126 |
Token | of |
Token ID | 286 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
BY | +6.218 |
Decay | +5.892 |
orally | +5.815 |
unfavorable | +5.783 |
than | +5.768 |
Neg logit contributions | |
genders | -8.172 |
blance | -7.777 |
aults | -7.628 |
itans | -7.582 |
rils | -7.540 |
Token | the |
Token ID | 262 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
BY | +10.646 |
orally | +10.257 |
than | +10.062 |
Decay | +10.048 |
periodic | +9.988 |
Neg logit contributions | |
genders | -12.031 |
blance | -11.831 |
itans | -11.708 |
rils | -11.399 |
aults | -11.341 |
Token | audio |
Token ID | 6597 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
BY | +7.787 |
Decay | +7.408 |
than | +7.333 |
orally | +7.290 |
unfavorable | +7.249 |
Neg logit contributions | |
blance | -7.769 |
genders | -7.768 |
rils | -7.424 |
itans | -7.387 |
aults | -7.323 |
Token | has |
Token ID | 468 |
Feature activation | -6.11e+00 |
Pos logit contributions | |
genders | +3.535 |
mattered | +3.323 |
empowerment | +3.297 |
aults | +3.285 |
blance | +3.284 |
Neg logit contributions | |
BY | -3.139 |
Decay | -3.045 |
than | -2.908 |
unfavorable | -2.831 |
Geological | -2.773 |
Token | been |
Token ID | 587 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
genders | +4.388 |
mattered | +4.176 |
empowerment | +4.046 |
aults | +4.018 |
blance | +3.964 |
Neg logit contributions | |
BY | -4.666 |
Decay | -4.576 |
than | -4.354 |
Geological | -4.169 |
unfavorable | -4.149 |
Token | told |
Token ID | 1297 |
Feature activation | +1.59e+01 |
Pos logit contributions | |
BY | +11.100 |
Decay | +10.991 |
unfavorable | +10.965 |
orally | +10.956 |
periodic | +10.849 |
Neg logit contributions | |
blance | -12.184 |
genders | -11.567 |
rights | -11.271 |
aults | -11.160 |
itans | -11.128 |
Token | again |
Token ID | 757 |
Feature activation | +9.35e+00 |
Pos logit contributions | |
orally | +8.968 |
BY | +8.954 |
unfavorable | +8.882 |
periodic | +8.586 |
Decay | +8.505 |
Neg logit contributions | |
blance | -12.191 |
rils | -11.753 |
aults | -11.605 |
genders | -11.561 |
itans | -11.517 |
Token | and |
Token ID | 290 |
Feature activation | -4.15e-01 |
Pos logit contributions | |
BY | +5.759 |
Decay | +5.534 |
unfavorable | +5.393 |
than | +5.370 |
orally | +5.291 |
Neg logit contributions | |
genders | -7.593 |
blance | -7.459 |
itans | -7.214 |
rils | -7.197 |
empowerment | -7.190 |
Token | again |
Token ID | 757 |
Feature activation | +2.67e+01 |
Pos logit contributions | |
genders | +0.236 |
blance | +0.222 |
aults | +0.214 |
mattered | +0.212 |
rils | +0.211 |
Neg logit contributions | |
BY | -0.385 |
Decay | -0.379 |
than | -0.362 |
unfavorable | -0.359 |
Geological | -0.355 |
Token | over |
Token ID | 625 |
Feature activation | +5.15e-01 |
Pos logit contributions | |
orally | +13.788 |
BY | +13.637 |
unfavorable | +13.415 |
than | +12.847 |
periodic | +12.818 |
Neg logit contributions | |
blance | -16.735 |
rils | -16.240 |
CLS | -16.022 |
itans | -16.007 |
genders | -15.785 |
Token | the |
Token ID | 262 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
BY | +0.349 |
Decay | +0.340 |
than | +0.319 |
unfavorable | +0.318 |
Geological | +0.310 |
Neg logit contributions | |
genders | -0.423 |
blance | -0.407 |
aults | -0.397 |
empowerment | -0.393 |
rils | -0.393 |
Token | course |
Token ID | 1781 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
genders | +1.697 |
blance | +1.562 |
empowerment | +1.539 |
aults | +1.524 |
rights | +1.507 |
Neg logit contributions | |
BY | -2.420 |
Decay | -2.364 |
than | -2.258 |
unfavorable | -2.229 |
Geological | -2.199 |
Token | of |
Token ID | 286 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
genders | +2.342 |
blance | +2.223 |
aults | +2.181 |
rights | +2.149 |
rils | +2.145 |
Neg logit contributions | |
BY | -2.547 |
Decay | -2.498 |
unfavorable | -2.338 |
than | -2.338 |
periodic | -2.293 |
Token | the |
Token ID | 262 |
Feature activation | -3.65e-01 |
Pos logit contributions | |
BY | +2.347 |
Decay | +2.296 |
unfavorable | +2.174 |
than | +2.165 |
periodic | +2.119 |
Neg logit contributions | |
genders | -2.480 |
blance | -2.408 |
aults | -2.348 |
rils | -2.316 |
mattered | -2.294 |
Token | theory |
Token ID | 4583 |
Feature activation | +1.95e+01 |
Pos logit contributions | |
BY | +6.934 |
Decay | +6.861 |
periodic | +6.590 |
unfavorable | +6.552 |
than | +6.335 |
Neg logit contributions | |
blance | -7.060 |
genders | -6.901 |
rils | -6.889 |
itans | -6.623 |
aults | -6.609 |
Token | that |
Token ID | 326 |
Feature activation | +6.16e+00 |
Pos logit contributions | |
BY | +11.534 |
Decay | +11.133 |
unfavorable | +11.009 |
orally | +10.972 |
Geological | +10.522 |
Neg logit contributions | |
blance | -13.199 |
rils | -12.736 |
itans | -12.659 |
genders | -12.550 |
CLS | -12.550 |
Token | is |
Token ID | 318 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
BY | +3.991 |
Decay | +3.877 |
unfavorable | +3.741 |
periodic | +3.639 |
orally | +3.621 |
Neg logit contributions | |
blance | -5.011 |
genders | -4.954 |
rils | -4.785 |
aults | -4.733 |
rights | -4.717 |
Token | being |
Token ID | 852 |
Feature activation | +1.98e+01 |
Pos logit contributions | |
BY | +8.415 |
unfavorable | +8.262 |
Decay | +8.041 |
orally | +7.974 |
periodic | +7.817 |
Neg logit contributions | |
blance | -9.394 |
genders | -8.847 |
rils | -8.711 |
aults | -8.659 |
itans | -8.640 |
Token | put |
Token ID | 1234 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
orally | +12.024 |
BY | +11.504 |
unfavorable | +11.418 |
Decay | +11.276 |
promulg | +11.273 |
Neg logit contributions | |
blance | -13.993 |
itans | -13.070 |
aults | -12.866 |
rights | -12.803 |
genders | -12.679 |
Token | forward |
Token ID | 2651 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
orally | +8.530 |
BY | +8.214 |
unfavorable | +8.061 |
periodic | +7.695 |
incomplete | +7.535 |
Neg logit contributions | |
blance | -14.714 |
aults | -13.825 |
CLS | -13.823 |
itans | -13.768 |
genders | -13.681 |
Token | now |
Token ID | 783 |
Feature activation | +2.52e+01 |
Pos logit contributions | |
orally | +14.673 |
unfavorable | +13.616 |
BY | +13.560 |
periodic | +13.069 |
incomplete | +12.988 |
Neg logit contributions | |
blance | -17.474 |
itans | -16.249 |
CLS | -16.193 |
rils | -16.032 |
aults | -15.565 |
Token | by |
Token ID | 416 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
BY | +13.971 |
orally | +13.872 |
unfavorable | +13.432 |
than | +13.274 |
periodic | +12.643 |
Neg logit contributions | |
blance | -16.097 |
rils | -15.091 |
CLS | -15.060 |
itans | -14.815 |
genders | -14.725 |
Token | CNN |
Token ID | 8100 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
Decay | +10.004 |
BY | +9.941 |
unfavorable | +9.836 |
periodic | +9.626 |
Geological | +9.383 |
Neg logit contributions | |
blance | -12.334 |
itans | -11.531 |
genders | -11.454 |
rils | -11.395 |
aults | -11.314 |
Token | , |
Token ID | 11 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
Decay | +14.440 |
BY | +14.012 |
unfavorable | +13.861 |
Geological | +13.226 |
than | +13.196 |
Neg logit contributions | |
blance | -12.519 |
genders | -12.329 |
CLS | -11.831 |
rils | -11.523 |
mattered | -11.286 |
Token | by |
Token ID | 416 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
BY | +12.484 |
Decay | +12.225 |
unfavorable | +11.950 |
Geological | +11.656 |
periodic | +11.511 |
Neg logit contributions | |
blance | -10.484 |
genders | -9.797 |
itans | -9.452 |
サーティワン | -9.379 |
rils | -9.346 |
Token | special |
Token ID | 2041 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
BY | +2.086 |
Decay | +1.987 |
periodic | +1.912 |
unfavorable | +1.906 |
than | +1.856 |
Neg logit contributions | |
genders | -4.258 |
blance | -4.199 |
itans | -4.099 |
rils | -4.060 |
aults | -4.060 |
Token | offers |
Token ID | 4394 |
Feature activation | +3.75e+00 |
Pos logit contributions | |
BY | +5.374 |
unfavorable | +5.088 |
periodic | +4.900 |
than | +4.669 |
Decay | +4.527 |
Neg logit contributions | |
blance | -11.278 |
genders | -10.862 |
rils | -10.700 |
サーティワン | -10.478 |
itans | -10.459 |
Token | for |
Token ID | 329 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
BY | +2.714 |
Decay | +2.581 |
than | +2.502 |
unfavorable | +2.501 |
periodic | +2.403 |
Neg logit contributions | |
genders | -2.869 |
blance | -2.839 |
rils | -2.718 |
aults | -2.697 |
itans | -2.689 |
Token | The |
Token ID | 383 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
BY | +4.444 |
Decay | +4.064 |
than | +3.607 |
unfavorable | +3.573 |
Geological | +3.523 |
Neg logit contributions | |
genders | -11.498 |
blance | -11.339 |
rils | -11.203 |
itans | -11.091 |
mattered | -10.822 |
Token | New |
Token ID | 968 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
BY | +6.113 |
Decay | +5.514 |
Geological | +5.090 |
Regular | +4.857 |
Organization | +4.841 |
Neg logit contributions | |
blance | -17.843 |
rils | -17.516 |
genders | -17.447 |
eatures | -17.279 |
ailability | -17.110 |
Token | York |
Token ID | 1971 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
BY | +7.525 |
Geological | +6.442 |
than | +6.322 |
Organization | +6.110 |
Decay | +5.743 |
Neg logit contributions | |
eatures | -22.948 |
blance | -22.916 |
ailability | -22.900 |
genders | -22.393 |
rils | -22.372 |
Token | Times |
Token ID | 3782 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
Times | +8.759 |
BY | +8.444 |
than | +8.254 |
Geological | +8.065 |
Decay | +8.040 |
Neg logit contributions | |
blance | -24.264 |
ailability | -23.677 |
eatures | -23.231 |
genders | -23.069 |
aults | -22.796 |
Token | 's |
Token ID | 338 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
BY | +4.784 |
Decay | +4.249 |
than | +4.004 |
unfavorable | +3.862 |
Organization | +3.771 |
Neg logit contributions | |
blance | -15.764 |
rils | -15.493 |
genders | -15.320 |
itans | -14.881 |
サーティワン | -14.751 |
Token | products |
Token ID | 3186 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
BY | +6.355 |
periodic | +6.285 |
Decay | +5.948 |
than | +5.697 |
unfavorable | +5.672 |
Neg logit contributions | |
rils | -17.590 |
blance | -17.248 |
サーティワン | -16.756 |
itans | -16.725 |
genders | -16.532 |
Token | and |
Token ID | 290 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
BY | +1.229 |
Decay | +1.191 |
than | +1.135 |
unfavorable | +1.120 |
Geological | +1.101 |
Neg logit contributions | |
genders | -1.387 |
blance | -1.359 |
empowerment | -1.302 |
rils | -1.297 |
aults | -1.293 |
Token | services |
Token ID | 2594 |
Feature activation | +4.39e+00 |
Pos logit contributions | |
BY | +2.167 |
Decay | +2.090 |
unfavorable | +2.044 |
than | +2.002 |
periodic | +1.998 |
Neg logit contributions | |
genders | -1.362 |
blance | -1.354 |
rils | -1.265 |
aults | -1.255 |
itans | -1.255 |
Token | ability |
Token ID | 2694 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
BY | +2.452 |
Decay | +2.392 |
unfavorable | +2.255 |
than | +2.240 |
periodic | +2.199 |
Neg logit contributions | |
genders | -2.907 |
blance | -2.819 |
rils | -2.756 |
aults | -2.740 |
rights | -2.709 |
Token | can |
Token ID | 460 |
Feature activation | -6.40e+00 |
Pos logit contributions | |
BY | +0.014 |
Decay | +0.014 |
than | +0.013 |
unfavorable | +0.013 |
Geological | +0.013 |
Neg logit contributions | |
genders | -0.014 |
blance | -0.014 |
aults | -0.013 |
empowerment | -0.013 |
mattered | -0.013 |
Token | be |
Token ID | 307 |
Feature activation | +9.40e-01 |
Pos logit contributions | |
genders | +4.508 |
blance | +4.156 |
aults | +4.147 |
empowerment | +4.133 |
mattered | +4.131 |
Neg logit contributions | |
BY | -4.905 |
Decay | -4.821 |
than | -4.501 |
unfavorable | -4.434 |
Geological | -4.433 |
Token | strengthened |
Token ID | 27324 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
BY | +0.666 |
Decay | +0.650 |
than | +0.611 |
unfavorable | +0.610 |
Geological | +0.594 |
Neg logit contributions | |
genders | -0.741 |
blance | -0.713 |
aults | -0.695 |
rils | -0.688 |
empowerment | -0.686 |
Token | over |
Token ID | 625 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
BY | +10.493 |
orally | +10.382 |
unfavorable | +9.771 |
Decay | +9.495 |
than | +9.484 |
Neg logit contributions | |
rils | -14.768 |
blance | -14.745 |
genders | -14.571 |
itans | -14.141 |
CLS | -13.942 |
Token | time |
Token ID | 640 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
BY | +5.358 |
Decay | +5.129 |
unfavorable | +5.113 |
than | +4.938 |
periodic | +4.928 |
Neg logit contributions | |
blance | -13.407 |
genders | -13.322 |
rils | -13.279 |
itans | -13.192 |
aults | -13.126 |
Token | with |
Token ID | 351 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
BY | +13.440 |
orally | +13.117 |
unfavorable | +12.208 |
Decay | +12.141 |
than | +12.102 |
Neg logit contributions | |
rils | -17.401 |
blance | -17.347 |
genders | -16.954 |
CLS | -16.509 |
itans | -16.409 |
Token | practice |
Token ID | 3357 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
periodic | +13.394 |
unfavorable | +12.764 |
BY | +12.688 |
Decay | +12.649 |
orally | +12.549 |
Neg logit contributions | |
blance | -13.310 |
rils | -13.190 |
genders | -13.029 |
itans | -12.771 |
aults | -12.700 |
Token | . |
Token ID | 13 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
BY | +8.845 |
Decay | +8.270 |
orally | +8.142 |
unfavorable | +7.870 |
periodic | +7.859 |
Neg logit contributions | |
genders | -11.634 |
rils | -11.596 |
blance | -11.531 |
itans | -11.225 |
aults | -11.051 |
Token | But |
Token ID | 887 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
BY | +7.098 |
Decay | +7.050 |
Regular | +6.408 |
Geological | +6.304 |
than | +6.304 |
Neg logit contributions | |
genders | -9.862 |
blance | -9.702 |
rils | -9.507 |
empowerment | -9.263 |
rights | -9.210 |
Token | this |
Token ID | 428 |
Feature activation | +7.69e+00 |
Pos logit contributions | |
BY | +2.870 |
Decay | +2.804 |
unfavorable | +2.647 |
than | +2.632 |
periodic | +2.585 |
Neg logit contributions | |
genders | -3.184 |
blance | -3.075 |
rils | -2.996 |
aults | -2.995 |
rights | -2.947 |
Token | hear |
Token ID | 3285 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
genders | +1.026 |
blance | +0.985 |
aults | +0.957 |
empowerment | +0.953 |
mattered | +0.951 |
Neg logit contributions | |
BY | -0.910 |
Decay | -0.892 |
unfavorable | -0.831 |
than | -0.830 |
Geological | -0.810 |
Token | a |
Token ID | 257 |
Feature activation | +4.64e+00 |
Pos logit contributions | |
BY | +6.916 |
Decay | +6.788 |
unfavorable | +6.579 |
periodic | +6.488 |
than | +6.391 |
Neg logit contributions | |
blance | -8.833 |
genders | -8.664 |
aults | -8.370 |
rils | -8.330 |
CLS | -8.281 |
Token | lot |
Token ID | 1256 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
BY | +3.600 |
Decay | +3.525 |
than | +3.357 |
unfavorable | +3.349 |
periodic | +3.318 |
Neg logit contributions | |
genders | -3.275 |
blance | -3.195 |
rils | -3.086 |
aults | -3.079 |
rights | -3.026 |
Token | of |
Token ID | 286 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
BY | +11.603 |
Decay | +11.578 |
unfavorable | +11.360 |
orally | +11.233 |
than | +11.141 |
Neg logit contributions | |
blance | -14.522 |
genders | -14.239 |
rils | -14.057 |
CLS | -14.023 |
itans | -13.823 |
Token | different |
Token ID | 1180 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
BY | +7.464 |
Decay | +7.312 |
unfavorable | +7.240 |
than | +6.951 |
orally | +6.888 |
Neg logit contributions | |
blance | -8.577 |
genders | -8.305 |
rils | -8.191 |
rights | -8.020 |
aults | -7.963 |
Token | things |
Token ID | 1243 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
BY | +7.219 |
Decay | +6.872 |
than | +6.771 |
unfavorable | +6.765 |
Geological | +6.593 |
Neg logit contributions | |
blance | -7.921 |
genders | -7.572 |
rils | -7.570 |
aults | -7.380 |
rights | -7.351 |
Token | . |
Token ID | 13 |
Feature activation | +6.85e+00 |
Pos logit contributions | |
orally | +14.424 |
than | +14.128 |
BY | +14.116 |
Decay | +13.894 |
unfavorable | +13.840 |
Neg logit contributions | |
blance | -15.692 |
rils | -15.504 |
CLS | -15.079 |
genders | -14.736 |
wheelchair | -14.580 |
Token | The |
Token ID | 383 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
BY | +4.140 |
Decay | +4.113 |
Geological | +3.796 |
than | +3.785 |
unfavorable | +3.633 |
Neg logit contributions | |
genders | -6.002 |
blance | -5.837 |
rils | -5.645 |
aults | -5.636 |
empowerment | -5.627 |
Token | fundamental |
Token ID | 7531 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
BY | +1.125 |
Decay | +1.099 |
than | +1.036 |
unfavorable | +1.034 |
Geological | +1.010 |
Neg logit contributions | |
genders | -1.160 |
blance | -1.120 |
aults | -1.086 |
rils | -1.078 |
empowerment | -1.070 |
Token | issue |
Token ID | 2071 |
Feature activation | +7.60e+00 |
Pos logit contributions | |
genders | +1.696 |
blance | +1.597 |
empowerment | +1.569 |
aults | +1.569 |
mattered | +1.545 |
Neg logit contributions | |
BY | -1.825 |
Decay | -1.785 |
than | -1.687 |
unfavorable | -1.670 |
Geological | -1.642 |
Token | is |
Token ID | 318 |
Feature activation | -7.54e+00 |
Pos logit contributions | |
BY | +4.486 |
Decay | +4.341 |
unfavorable | +4.092 |
than | +4.086 |
Geological | +3.976 |
Neg logit contributions | |
genders | -6.500 |
blance | -6.406 |
rils | -6.228 |
aults | -6.200 |
itans | -6.075 |
Token | told |
Token ID | 1297 |
Feature activation | +8.87e+00 |
Pos logit contributions | |
BY | +4.576 |
Decay | +4.335 |
than | +4.189 |
unfavorable | +4.176 |
orally | +4.138 |
Neg logit contributions | |
genders | -5.174 |
blance | -5.109 |
rils | -4.882 |
rights | -4.853 |
empowerment | -4.814 |
Token | Congress |
Token ID | 3162 |
Feature activation | -2.94e-01 |
Pos logit contributions | |
BY | +5.608 |
Decay | +5.365 |
than | +5.022 |
unfavorable | +5.013 |
periodic | +4.971 |
Neg logit contributions | |
genders | -7.341 |
blance | -7.311 |
aults | -7.009 |
rils | -6.944 |
itans | -6.834 |
Token | that |
Token ID | 326 |
Feature activation | +8.65e+00 |
Pos logit contributions | |
genders | +0.230 |
blance | +0.221 |
aults | +0.216 |
rils | +0.214 |
empowerment | +0.213 |
Neg logit contributions | |
BY | -0.210 |
Decay | -0.205 |
than | -0.193 |
unfavorable | -0.192 |
Geological | -0.187 |
Token | after |
Token ID | 706 |
Feature activation | +8.49e+00 |
Pos logit contributions | |
BY | +5.626 |
Decay | +5.387 |
unfavorable | +5.235 |
periodic | +5.155 |
than | +5.096 |
Neg logit contributions | |
blance | -6.927 |
genders | -6.876 |
rils | -6.660 |
aults | -6.467 |
rights | -6.461 |
Token | months |
Token ID | 1933 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
BY | +6.170 |
Decay | +5.949 |
unfavorable | +5.839 |
periodic | +5.747 |
than | +5.707 |
Neg logit contributions | |
blance | -6.136 |
genders | -6.115 |
aults | -5.812 |
rils | -5.760 |
rights | -5.698 |
Token | of |
Token ID | 286 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
BY | +8.301 |
Decay | +8.080 |
unfavorable | +8.057 |
periodic | +7.854 |
than | +7.624 |
Neg logit contributions | |
genders | -12.486 |
blance | -12.016 |
rils | -12.003 |
itans | -11.947 |
rights | -11.821 |
Token | juggling |
Token ID | 48097 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
periodic | +15.800 |
unfavorable | +15.682 |
preparation | +15.590 |
BY | +14.836 |
incomplete | +14.757 |
Neg logit contributions | |
blance | -16.588 |
genders | -15.030 |
rils | -14.848 |
rights | -14.467 |
aults | -14.419 |
Token | spending |
Token ID | 4581 |
Feature activation | +9.70e+00 |
Pos logit contributions | |
BY | +9.181 |
unfavorable | +9.034 |
periodic | +8.829 |
Decay | +8.766 |
orally | +8.525 |
Neg logit contributions | |
blance | -10.368 |
rils | -10.089 |
genders | -9.932 |
itans | -9.922 |
aults | -9.893 |
Token | to |
Token ID | 284 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
BY | +6.299 |
Decay | +6.024 |
unfavorable | +5.900 |
than | +5.802 |
periodic | +5.753 |
Neg logit contributions | |
blance | -7.596 |
genders | -7.538 |
aults | -7.273 |
rils | -7.175 |
itans | -7.069 |
Token | meet |
Token ID | 1826 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
BY | +8.571 |
Decay | +8.291 |
unfavorable | +7.893 |
periodic | +7.745 |
than | +7.688 |
Neg logit contributions | |
blance | -9.509 |
genders | -9.453 |
aults | -9.171 |
rils | -9.029 |
rights | -9.012 |
Token | government |
Token ID | 1230 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
BY | +12.609 |
periodic | +12.511 |
unfavorable | +12.374 |
Decay | +12.129 |
than | +11.994 |
Neg logit contributions | |
blance | -12.506 |
genders | -11.898 |
rils | -11.827 |
itans | -11.615 |
aults | -11.489 |
Token | few |
Token ID | 1178 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
BY | +2.030 |
Decay | +1.979 |
than | +1.876 |
unfavorable | +1.860 |
Geological | +1.832 |
Neg logit contributions | |
genders | -2.108 |
blance | -2.045 |
aults | -1.989 |
rils | -1.972 |
rights | -1.954 |
Token | weird |
Token ID | 7650 |
Feature activation | +8.36e+00 |
Pos logit contributions | |
BY | +8.560 |
periodic | +8.326 |
Decay | +8.317 |
unfavorable | +8.302 |
than | +8.040 |
Neg logit contributions | |
blance | -9.138 |
rils | -8.738 |
rights | -8.632 |
itans | -8.570 |
genders | -8.566 |
Token | song |
Token ID | 3496 |
Feature activation | +6.18e+00 |
Pos logit contributions | |
BY | +5.973 |
Decay | +5.747 |
than | +5.509 |
periodic | +5.498 |
unfavorable | +5.476 |
Neg logit contributions | |
blance | -6.061 |
genders | -5.955 |
rights | -5.709 |
rils | -5.691 |
mattered | -5.686 |
Token | kind |
Token ID | 1611 |
Feature activation | -3.37e-01 |
Pos logit contributions | |
BY | +4.745 |
Decay | +4.616 |
than | +4.394 |
unfavorable | +4.357 |
periodic | +4.350 |
Neg logit contributions | |
genders | -4.287 |
blance | -4.237 |
aults | -4.021 |
mattered | -3.992 |
empowerment | -3.973 |
Token | of |
Token ID | 286 |
Feature activation | +4.44e+00 |
Pos logit contributions | |
genders | +0.254 |
blance | +0.244 |
aults | +0.237 |
rils | +0.235 |
empowerment | +0.235 |
Neg logit contributions | |
BY | -0.250 |
Decay | -0.244 |
than | -0.230 |
unfavorable | -0.230 |
Geological | -0.224 |
Token | things |
Token ID | 1243 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
BY | +3.290 |
Decay | +3.199 |
than | +3.038 |
unfavorable | +3.028 |
periodic | +3.002 |
Neg logit contributions | |
genders | -3.246 |
blance | -3.203 |
aults | -3.058 |
rights | -3.043 |
rils | -3.041 |
Token | . |
Token ID | 13 |
Feature activation | +4.72e+00 |
Pos logit contributions | |
Decay | +13.761 |
BY | +13.475 |
orally | +13.236 |
than | +12.866 |
periodic | +12.813 |
Neg logit contributions | |
blance | -17.207 |
rights | -15.621 |
genders | -15.601 |
サーティワン | -15.539 |
rils | -15.469 |
Token | Barry |
Token ID | 14488 |
Feature activation | +5.77e+00 |
Pos logit contributions | |
BY | +2.978 |
Decay | +2.959 |
than | +2.724 |
Geological | +2.681 |
unfavorable | +2.621 |
Neg logit contributions | |
genders | -4.072 |
blance | -3.989 |
empowerment | -3.847 |
aults | -3.838 |
rils | -3.821 |
Token | likes |
Token ID | 7832 |
Feature activation | +4.43e+00 |
Pos logit contributions | |
BY | +4.058 |
Decay | +3.970 |
than | +3.730 |
unfavorable | +3.690 |
Geological | +3.642 |
Neg logit contributions | |
genders | -4.480 |
blance | -4.389 |
rils | -4.214 |
aults | -4.210 |
rights | -4.167 |
Token | music |
Token ID | 2647 |
Feature activation | +5.84e+00 |
Pos logit contributions | |
BY | +3.093 |
Decay | +3.063 |
than | +2.865 |
unfavorable | +2.857 |
periodic | +2.810 |
Neg logit contributions | |
genders | -3.444 |
blance | -3.383 |
aults | -3.253 |
rights | -3.208 |
rils | -3.196 |
Token | , |
Token ID | 11 |
Feature activation | +8.63e-01 |
Pos logit contributions | |
BY | +3.859 |
Decay | +3.773 |
unfavorable | +3.564 |
than | +3.526 |
orally | +3.499 |
Neg logit contributions | |
blance | -4.643 |
genders | -4.637 |
aults | -4.417 |
itans | -4.400 |
rils | -4.390 |
Token | faded |
Token ID | 24887 |
Feature activation | -3.56e+00 |
Pos logit contributions | |
BY | +1.091 |
Decay | +1.064 |
than | +1.000 |
unfavorable | +0.999 |
Geological | +0.975 |
Neg logit contributions | |
genders | -1.226 |
blance | -1.182 |
aults | -1.150 |
rils | -1.139 |
empowerment | -1.137 |
Token | away |
Token ID | 1497 |
Feature activation | -5.44e+00 |
Pos logit contributions | |
genders | +2.755 |
blance | +2.579 |
empowerment | +2.548 |
mattered | +2.536 |
aults | +2.531 |
Neg logit contributions | |
BY | -2.570 |
Decay | -2.505 |
than | -2.361 |
unfavorable | -2.285 |
Geological | -2.258 |
Token | due |
Token ID | 2233 |
Feature activation | -7.40e-01 |
Pos logit contributions | |
genders | +4.029 |
blance | +3.758 |
mattered | +3.707 |
empowerment | +3.705 |
wheelchair | +3.684 |
Neg logit contributions | |
BY | -4.028 |
Decay | -3.934 |
than | -3.695 |
unfavorable | -3.569 |
Geological | -3.503 |
Token | to |
Token ID | 284 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
genders | +0.523 |
blance | +0.500 |
aults | +0.486 |
rils | +0.484 |
empowerment | +0.482 |
Neg logit contributions | |
BY | -0.586 |
Decay | -0.573 |
than | -0.543 |
unfavorable | -0.537 |
Geological | -0.526 |
Token | diversion |
Token ID | 34851 |
Feature activation | +3.82e+00 |
Pos logit contributions | |
unfavorable | +13.285 |
periodic | +13.068 |
incomplete | +12.163 |
Decay | +12.149 |
BY | +12.142 |
Neg logit contributions | |
blance | -13.326 |
genders | -12.434 |
rils | -12.399 |
itans | -12.030 |
aults | -11.983 |
Token | of |
Token ID | 286 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
BY | +2.590 |
Decay | +2.516 |
unfavorable | +2.426 |
than | +2.369 |
periodic | +2.331 |
Neg logit contributions | |
genders | -3.079 |
blance | -3.013 |
aults | -2.891 |
rils | -2.882 |
empowerment | -2.836 |
Token | water |
Token ID | 1660 |
Feature activation | +9.64e+00 |
Pos logit contributions | |
unfavorable | +15.378 |
periodic | +14.994 |
Geological | +14.372 |
Persian | +14.191 |
BY | +14.186 |
Neg logit contributions | |
blance | -17.432 |
aults | -15.360 |
rils | -15.313 |
genders | -14.746 |
itans | -14.665 |
Token | for |
Token ID | 329 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
BY | +6.225 |
unfavorable | +5.910 |
Decay | +5.838 |
periodic | +5.676 |
than | +5.641 |
Neg logit contributions | |
blance | -7.618 |
genders | -7.553 |
aults | -7.209 |
rils | -7.157 |
CLS | -7.122 |
Token | agriculture |
Token ID | 14510 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
periodic | +12.131 |
BY | +12.002 |
unfavorable | +11.884 |
than | +11.767 |
Geological | +11.551 |
Neg logit contributions | |
blance | -14.010 |
rils | -13.172 |
genders | -13.117 |
itans | -12.665 |
aults | -12.567 |
Token | from |
Token ID | 422 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
BY | +2.299 |
Decay | +2.246 |
unfavorable | +2.119 |
than | +2.111 |
Geological | +2.069 |
Neg logit contributions | |
genders | -2.485 |
blance | -2.416 |
aults | -2.324 |
rils | -2.305 |
empowerment | -2.292 |
Token | its |
Token ID | 663 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
unfavorable | +12.301 |
Persian | +11.918 |
Decay | +11.914 |
periodic | +11.883 |
BY | +11.778 |
Neg logit contributions | |
blance | -15.082 |
rils | -13.780 |
genders | -13.657 |
itans | -13.210 |
mattered | -13.203 |
Token | righteousness |
Token ID | 33738 |
Feature activation | -4.61e-01 |
Pos logit contributions | |
BY | +6.197 |
Decay | +5.851 |
unfavorable | +5.830 |
periodic | +5.771 |
than | +5.726 |
Neg logit contributions | |
blance | -5.941 |
genders | -5.772 |
aults | -5.672 |
rils | -5.576 |
itans | -5.453 |
Token | . |
Token ID | 13 |
Feature activation | -6.93e+00 |
Pos logit contributions | |
genders | +0.343 |
blance | +0.328 |
aults | +0.321 |
empowerment | +0.318 |
mattered | +0.318 |
Neg logit contributions | |
BY | -0.346 |
Decay | -0.338 |
than | -0.319 |
unfavorable | -0.318 |
Geological | -0.310 |
Token | But |
Token ID | 887 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
genders | +5.324 |
mattered | +4.988 |
aults | +4.981 |
itans | +4.968 |
CLS | +4.965 |
Neg logit contributions | |
BY | -4.553 |
unfavorable | -4.399 |
Decay | -4.387 |
periodic | -4.309 |
orally | -4.277 |
Token | that |
Token ID | 326 |
Feature activation | -6.93e+00 |
Pos logit contributions | |
genders | +7.491 |
equality | +7.001 |
empowerment | +6.969 |
mattered | +6.942 |
rights | +6.624 |
Neg logit contributions | |
BY | -7.045 |
Decay | -6.977 |
than | -6.545 |
unfavorable | -6.246 |
orally | -6.183 |
Token | has |
Token ID | 468 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
genders | +5.530 |
empowerment | +5.275 |
mattered | +5.259 |
equality | +5.185 |
blance | +5.063 |
Neg logit contributions | |
BY | -4.649 |
Decay | -4.628 |
than | -4.288 |
unfavorable | -4.092 |
orally | -4.076 |
Token | never |
Token ID | 1239 |
Feature activation | -3.55e+01 |
Pos logit contributions | |
genders | +10.347 |
mattered | +10.248 |
equality | +9.663 |
empowerment | +9.483 |
wheelchair | +9.327 |
Neg logit contributions | |
Decay | -10.392 |
BY | -10.029 |
than | -9.786 |
Reviewer | -9.393 |
iatus | -9.043 |
Token | been |
Token ID | 587 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
mattered | +20.400 |
genders | +17.356 |
bothered | +16.104 |
equality | +15.370 |
hood | +15.349 |
Neg logit contributions | |
Reviewer | -23.031 |
Decay | -21.643 |
BY | -20.213 |
estern | -19.343 |
ERAL | -19.278 |
Token | wholly |
Token ID | 18174 |
Feature activation | -5.45e+00 |
Pos logit contributions | |
genders | +8.868 |
mattered | +8.368 |
equality | +8.326 |
empowerment | +8.150 |
blance | +7.716 |
Neg logit contributions | |
Decay | -10.790 |
BY | -10.453 |
than | -9.933 |
iatus | -9.818 |
terness | -9.659 |
Token | true |
Token ID | 2081 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
genders | +3.540 |
empowerment | +3.227 |
mattered | +3.227 |
blance | +3.215 |
equality | +3.177 |
Neg logit contributions | |
Decay | -4.552 |
BY | -4.484 |
than | -4.222 |
Geological | -4.122 |
unfavorable | -4.120 |
Token | , |
Token ID | 11 |
Feature activation | -6.12e+00 |
Pos logit contributions | |
genders | +6.455 |
mattered | +6.069 |
blance | +5.977 |
equality | +5.857 |
empowerment | +5.827 |
Neg logit contributions | |
Decay | -7.966 |
BY | -7.954 |
than | -7.453 |
unfavorable | -7.286 |
periodic | -7.274 |
Token | and |
Token ID | 290 |
Feature activation | -3.82e+00 |
Pos logit contributions | |
genders | +4.572 |
mattered | +4.258 |
empowerment | +4.244 |
aults | +4.208 |
blance | +4.204 |
Neg logit contributions | |
BY | -4.524 |
Decay | -4.385 |
than | -4.124 |
unfavorable | -4.011 |
Geological | -3.946 |
Token | Nevertheless |
Token ID | 15933 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
genders | +3.574 |
blance | +3.426 |
aults | +3.368 |
mattered | +3.338 |
rights | +3.326 |
Neg logit contributions | |
BY | -2.974 |
Decay | -2.857 |
unfavorable | -2.794 |
periodic | -2.747 |
than | -2.731 |
Token | , |
Token ID | 11 |
Feature activation | +6.98e-01 |
Pos logit contributions | |
BY | +1.320 |
Decay | +1.287 |
than | +1.207 |
unfavorable | +1.206 |
Geological | +1.173 |
Neg logit contributions | |
genders | -1.534 |
blance | -1.479 |
aults | -1.442 |
rils | -1.428 |
empowerment | -1.423 |
Token | as |
Token ID | 355 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
BY | +0.489 |
Decay | +0.477 |
than | +0.448 |
unfavorable | +0.447 |
Geological | +0.435 |
Neg logit contributions | |
genders | -0.556 |
blance | -0.535 |
aults | -0.521 |
rils | -0.517 |
empowerment | -0.515 |
Token | feminist |
Token ID | 14314 |
Feature activation | -7.55e+00 |
Pos logit contributions | |
genders | +2.637 |
blance | +2.501 |
empowerment | +2.460 |
aults | +2.456 |
mattered | +2.454 |
Neg logit contributions | |
BY | -2.311 |
Decay | -2.235 |
than | -2.106 |
unfavorable | -2.067 |
Geological | -2.042 |
Token | debates |
Token ID | 15389 |
Feature activation | -8.58e+00 |
Pos logit contributions | |
genders | +6.652 |
empowerment | +6.333 |
equality | +6.180 |
mattered | +6.087 |
wheelchair | +6.041 |
Neg logit contributions | |
BY | -4.531 |
Decay | -4.304 |
unfavorable | -4.005 |
than | -3.979 |
Geological | -3.901 |
Token | on |
Token ID | 319 |
Feature activation | -3.10e+01 |
Pos logit contributions | |
genders | +6.840 |
mattered | +6.465 |
aults | +6.205 |
equality | +6.181 |
empowerment | +6.175 |
Neg logit contributions | |
BY | -5.990 |
Decay | -5.712 |
than | -5.209 |
Geological | -5.150 |
Reviewer | -5.062 |
Token | the |
Token ID | 262 |
Feature activation | -2.19e+01 |
Pos logit contributions | |
genders | +20.202 |
equality | +20.013 |
empowerment | +19.483 |
feminism | +18.415 |
sexes | +17.270 |
Neg logit contributions | |
earchers | -14.854 |
BY | -14.809 |
Decay | -14.712 |
terness | -14.546 |
than | -14.089 |
Token | topic |
Token ID | 7243 |
Feature activation | -8.21e+00 |
Pos logit contributions | |
genders | +16.186 |
empowerment | +15.381 |
equality | +15.304 |
sexes | +14.368 |
wheelchair | +14.086 |
Neg logit contributions | |
BY | -12.662 |
Decay | -11.419 |
earchers | -11.294 |
terness | -11.160 |
than | -11.106 |
Token | illustrate |
Token ID | 19418 |
Feature activation | -5.84e+00 |
Pos logit contributions | |
genders | +6.541 |
mattered | +6.172 |
equality | +5.939 |
blance | +5.938 |
aults | +5.908 |
Neg logit contributions | |
BY | -5.723 |
Decay | -5.501 |
Geological | -4.969 |
than | -4.957 |
unfavorable | -4.859 |
Token | this |
Token ID | 428 |
Feature activation | -7.46e+00 |
Pos logit contributions | |
genders | +4.176 |
blance | +3.866 |
empowerment | +3.859 |
equality | +3.806 |
mattered | +3.805 |
Neg logit contributions | |
BY | -4.430 |
Decay | -4.373 |
than | -4.090 |
unfavorable | -3.997 |
Geological | -3.991 |
Token | is |
Token ID | 318 |
Feature activation | -2.31e+00 |
Pos logit contributions | |
genders | +5.172 |
empowerment | +4.898 |
mattered | +4.823 |
equality | +4.809 |
blance | +4.673 |
Neg logit contributions | |
Decay | -5.755 |
BY | -5.744 |
than | -5.261 |
Geological | -5.216 |
unfavorable | -5.100 |
Token | relations |
Token ID | 2316 |
Feature activation | -9.35e-01 |
Pos logit contributions | |
genders | +4.595 |
empowerment | +4.454 |
rights | +4.370 |
wheelchair | +4.352 |
equality | +4.337 |
Neg logit contributions | |
BY | -4.504 |
Decay | -4.497 |
than | -4.205 |
unfavorable | -4.117 |
Geological | -4.048 |
Token | perspective |
Token ID | 6650 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
genders | +0.628 |
blance | +0.594 |
aults | +0.580 |
empowerment | +0.580 |
mattered | +0.572 |
Neg logit contributions | |
BY | -0.772 |
Decay | -0.754 |
than | -0.715 |
unfavorable | -0.712 |
Geological | -0.696 |
Token | , |
Token ID | 11 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
genders | +8.591 |
equality | +8.164 |
empowerment | +8.099 |
mattered | +8.065 |
blance | +8.049 |
Neg logit contributions | |
Decay | -9.424 |
BY | -9.320 |
than | -9.072 |
unfavorable | -8.627 |
orally | -8.543 |
Token | this |
Token ID | 428 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
genders | +9.194 |
equality | +8.742 |
empowerment | +8.655 |
wheelchair | +8.615 |
mattered | +8.600 |
Neg logit contributions | |
Decay | -7.798 |
BY | -7.756 |
than | -7.564 |
unfavorable | -7.016 |
Reviewer | -6.953 |
Token | hasn |
Token ID | 5818 |
Feature activation | -7.41e+00 |
Pos logit contributions | |
genders | +7.641 |
mattered | +7.323 |
empowerment | +7.322 |
equality | +7.188 |
wheelchair | +7.060 |
Neg logit contributions | |
Decay | -7.185 |
BY | -7.041 |
than | -6.588 |
risome | -6.270 |
Geological | -6.220 |
Token | 't |
Token ID | 470 |
Feature activation | -3.04e+01 |
Pos logit contributions | |
genders | +5.838 |
aults | +5.631 |
rights | +5.568 |
itans | +5.503 |
blance | +5.446 |
Neg logit contributions | |
Decay | -4.841 |
BY | -4.730 |
unfavorable | -4.512 |
periodic | -4.479 |
orally | -4.413 |
Token | played |
Token ID | 2826 |
Feature activation | -1.89e+01 |
Pos logit contributions | |
mattered | +18.418 |
genders | +16.038 |
wheelchair | +14.830 |
bothered | +14.588 |
blinded | +14.365 |
Neg logit contributions | |
Reviewer | -20.229 |
Decay | -19.373 |
earchers | -18.445 |
BY | -18.370 |
estern | -18.225 |
Token | well |
Token ID | 880 |
Feature activation | -4.13e-02 |
Pos logit contributions | |
genders | +11.406 |
mattered | +10.735 |
empowerment | +10.497 |
wheelchair | +10.434 |
equality | +10.426 |
Neg logit contributions | |
Decay | -13.242 |
BY | -12.934 |
than | -12.865 |
earchers | -12.078 |
terness | -11.848 |
Token | with |
Token ID | 351 |
Feature activation | -3.09e+00 |
Pos logit contributions | |
genders | +0.032 |
blance | +0.031 |
aults | +0.030 |
empowerment | +0.030 |
rils | +0.030 |
Neg logit contributions | |
BY | -0.029 |
Decay | -0.029 |
than | -0.027 |
unfavorable | -0.027 |
Geological | -0.026 |
Token | London |
Token ID | 3576 |
Feature activation | -2.68e-01 |
Pos logit contributions | |
genders | +2.519 |
blance | +2.380 |
empowerment | +2.330 |
aults | +2.328 |
wheelchair | +2.318 |
Neg logit contributions | |
BY | -2.086 |
Decay | -2.055 |
than | -1.932 |
unfavorable | -1.898 |
orally | -1.849 |
Token | ers |
Token ID | 364 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
genders | +0.224 |
blance | +0.215 |
aults | +0.211 |
rils | +0.209 |
empowerment | +0.208 |
Neg logit contributions | |
BY | -0.177 |
Decay | -0.173 |
than | -0.162 |
unfavorable | -0.162 |
Geological | -0.157 |
Token |
|
Token ID | 198 |
Feature activation | -4.40e+00 |
Pos logit contributions | |
genders | +6.574 |
blance | +6.257 |
CLS | +6.175 |
mattered | +6.164 |
aults | +6.156 |
Neg logit contributions | |
BY | -5.769 |
unfavorable | -5.511 |
Decay | -5.503 |
periodic | -5.378 |
orally | -5.329 |
Token |
|
Token ID | 198 |
Feature activation | -7.40e+00 |
Pos logit contributions | |
genders | +2.674 |
aults | +2.495 |
blance | +2.481 |
rights | +2.453 |
rils | +2.415 |
Neg logit contributions | |
Decay | -3.734 |
BY | -3.721 |
unfavorable | -3.570 |
periodic | -3.534 |
orally | -3.490 |
Token | I |
Token ID | 40 |
Feature activation | -8.88e+00 |
Pos logit contributions | |
genders | +5.657 |
blance | +5.552 |
rights | +5.492 |
aults | +5.444 |
rils | +5.357 |
Neg logit contributions | |
Decay | -4.879 |
unfavorable | -4.642 |
BY | -4.627 |
orally | -4.566 |
periodic | -4.537 |
Token | don |
Token ID | 836 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
genders | +6.624 |
blance | +6.267 |
mattered | +6.201 |
empowerment | +6.124 |
rils | +6.080 |
Neg logit contributions | |
BY | -6.033 |
Decay | -5.985 |
unfavorable | -5.563 |
Geological | -5.479 |
than | -5.417 |
Token | 't |
Token ID | 470 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
genders | +7.440 |
aults | +7.252 |
rights | +7.111 |
itans | +7.095 |
blance | +6.865 |
Neg logit contributions | |
Decay | -7.236 |
BY | -6.948 |
periodic | -6.900 |
unfavorable | -6.812 |
orally | -6.685 |
Token | see |
Token ID | 766 |
Feature activation | -2.99e+01 |
Pos logit contributions | |
genders | +12.029 |
wheelchair | +11.433 |
mattered | +11.164 |
empowerment | +10.986 |
equality | +10.983 |
Neg logit contributions | |
BY | -15.128 |
Decay | -14.957 |
Reviewer | -14.497 |
terness | -13.806 |
Geological | -13.640 |
Token | this |
Token ID | 428 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
genders | +16.773 |
equality | +16.616 |
barriers | +16.131 |
empowerment | +15.998 |
mattered | +15.778 |
Neg logit contributions | |
BY | -15.491 |
terness | -14.373 |
hyde | -14.355 |
than | -14.043 |
risome | -13.944 |
Token | as |
Token ID | 355 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
genders | +8.736 |
mattered | +8.482 |
empowerment | +8.358 |
equality | +8.328 |
wheelchair | +8.125 |
Neg logit contributions | |
BY | -7.644 |
Decay | -7.443 |
than | -6.977 |
Geological | -6.755 |
Reviewer | -6.728 |
Token | too |
Token ID | 1165 |
Feature activation | -7.92e+00 |
Pos logit contributions | |
genders | +8.427 |
empowerment | +8.174 |
equality | +8.074 |
mattered | +8.009 |
blance | +7.881 |
Neg logit contributions | |
BY | -8.099 |
Decay | -7.888 |
than | -7.261 |
Geological | -7.184 |
orally | -6.982 |
Token | big |
Token ID | 1263 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
genders | +5.940 |
empowerment | +5.607 |
mattered | +5.595 |
blance | +5.569 |
aults | +5.439 |
Neg logit contributions | |
BY | -5.721 |
Decay | -5.574 |
than | -5.101 |
Geological | -5.016 |
orally | -4.940 |
Token | of |
Token ID | 286 |
Feature activation | -5.35e+00 |
Pos logit contributions | |
genders | +3.284 |
blance | +3.114 |
mattered | +3.063 |
empowerment | +3.061 |
aults | +3.040 |
Neg logit contributions | |
BY | -3.208 |
Decay | -3.128 |
than | -2.916 |
unfavorable | -2.872 |
Geological | -2.870 |
Token | in |
Token ID | 287 |
Feature activation | -8.09e+00 |
Pos logit contributions | |
genders | +14.043 |
aults | +13.577 |
wheelchair | +13.398 |
mattered | +13.313 |
empowerment | +13.236 |
Neg logit contributions | |
Decay | -11.310 |
BY | -11.200 |
than | -10.461 |
unfavorable | -10.446 |
risome | -10.352 |
Token | a |
Token ID | 257 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
genders | +6.085 |
wheelchair | +5.757 |
aults | +5.631 |
empowerment | +5.619 |
blance | +5.533 |
Neg logit contributions | |
BY | -5.667 |
Decay | -5.527 |
than | -5.219 |
unfavorable | -5.197 |
Geological | -5.037 |
Token | race |
Token ID | 3234 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
wheelchair | +8.784 |
genders | +8.778 |
aults | +8.236 |
empowerment | +8.168 |
CLS | +8.138 |
Neg logit contributions | |
BY | -7.620 |
Decay | -7.604 |
unfavorable | -7.125 |
than | -6.980 |
Reviewer | -6.785 |
Token | of |
Token ID | 286 |
Feature activation | -9.81e+00 |
Pos logit contributions | |
genders | +11.831 |
wheelchair | +11.658 |
blance | +11.385 |
rights | +11.330 |
equality | +11.193 |
Neg logit contributions | |
Decay | -11.580 |
BY | -11.522 |
than | -11.042 |
unfavorable | -10.923 |
Geological | -10.480 |
Token | remote |
Token ID | 6569 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
genders | +7.404 |
wheelchair | +6.988 |
empowerment | +6.967 |
aults | +6.896 |
blance | +6.838 |
Neg logit contributions | |
BY | -6.584 |
Decay | -6.425 |
than | -6.147 |
unfavorable | -6.103 |
Geological | -5.879 |
Token | control |
Token ID | 1630 |
Feature activation | -2.95e+01 |
Pos logit contributions | |
genders | +8.401 |
empowerment | +7.990 |
wheelchair | +7.951 |
mattered | +7.742 |
aults | +7.509 |
Neg logit contributions | |
BY | -12.312 |
Decay | -12.251 |
than | -11.942 |
unfavorable | -11.542 |
Geological | -11.298 |
Token | cars |
Token ID | 5006 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
genders | +17.460 |
wheelchair | +17.319 |
empowerment | +16.933 |
aults | +16.755 |
mattered | +16.399 |
Neg logit contributions | |
BY | -14.368 |
risome | -13.998 |
Decay | -13.807 |
than | -13.732 |
unfavorable | -13.731 |
Token | 1993 |
Token ID | 9656 |
Feature activation | -8.80e-01 |
Pos logit contributions | |
genders | +13.794 |
mattered | +13.340 |
aults | +13.260 |
wheelchair | +13.020 |
ault | +12.845 |
Neg logit contributions | |
BY | -12.552 |
Decay | -12.206 |
unfavorable | -11.604 |
than | -11.503 |
risome | -11.457 |
Token | : |
Token ID | 25 |
Feature activation | -4.99e-01 |
Pos logit contributions | |
genders | +0.794 |
blance | +0.766 |
aults | +0.753 |
rils | +0.746 |
empowerment | +0.744 |
Neg logit contributions | |
BY | -0.520 |
Decay | -0.506 |
unfavorable | -0.473 |
than | -0.471 |
Geological | -0.452 |
Token | Father |
Token ID | 9190 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
genders | +0.411 |
blance | +0.396 |
aults | +0.387 |
rils | +0.382 |
empowerment | +0.382 |
Neg logit contributions | |
BY | -0.336 |
Decay | -0.327 |
unfavorable | -0.307 |
than | -0.306 |
Geological | -0.297 |
Token | buys |
Token ID | 24779 |
Feature activation | -4.74e+00 |
Pos logit contributions | |
genders | +8.370 |
mattered | +7.887 |
empowerment | +7.876 |
aults | +7.834 |
blance | +7.759 |
Neg logit contributions | |
BY | -8.211 |
Decay | -7.872 |
unfavorable | -7.405 |
than | -7.243 |
Geological | -7.096 |
Token | Of |
Token ID | 5189 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
genders | +1.976 |
blance | +1.924 |
aults | +1.893 |
rights | +1.887 |
rils | +1.858 |
Neg logit contributions | |
Decay | -1.619 |
BY | -1.581 |
unfavorable | -1.521 |
periodic | -1.493 |
orally | -1.488 |
Token | course |
Token ID | 1781 |
Feature activation | -4.44e+00 |
Pos logit contributions | |
genders | +6.304 |
blance | +5.838 |
aults | +5.798 |
rights | +5.702 |
empowerment | +5.646 |
Neg logit contributions | |
BY | -8.472 |
Decay | -8.363 |
unfavorable | -7.972 |
Geological | -7.968 |
orally | -7.947 |
Token | , |
Token ID | 11 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
genders | +3.227 |
blance | +3.033 |
empowerment | +3.028 |
mattered | +2.975 |
aults | +2.973 |
Neg logit contributions | |
BY | -3.300 |
Decay | -3.243 |
than | -3.081 |
unfavorable | -3.012 |
Geological | -3.009 |
Token | that |
Token ID | 326 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
genders | +0.958 |
blance | +0.914 |
aults | +0.892 |
empowerment | +0.889 |
mattered | +0.881 |
Neg logit contributions | |
BY | -0.886 |
Decay | -0.865 |
than | -0.815 |
unfavorable | -0.807 |
Geological | -0.793 |
Token | doesn |
Token ID | 1595 |
Feature activation | -7.59e+00 |
Pos logit contributions | |
genders | +1.456 |
blance | +1.379 |
empowerment | +1.369 |
mattered | +1.360 |
aults | +1.358 |
Neg logit contributions | |
BY | -1.148 |
Decay | -1.124 |
than | -1.052 |
unfavorable | -1.031 |
Geological | -1.012 |
Token | 't |
Token ID | 470 |
Feature activation | -2.90e+01 |
Pos logit contributions | |
genders | +5.758 |
aults | +5.579 |
rights | +5.492 |
itans | +5.428 |
blance | +5.334 |
Neg logit contributions | |
Decay | -5.101 |
BY | -4.889 |
periodic | -4.835 |
unfavorable | -4.812 |
orally | -4.719 |
Token | always |
Token ID | 1464 |
Feature activation | -2.03e+01 |
Pos logit contributions | |
genders | +13.183 |
mattered | +13.056 |
equality | +13.038 |
mean | +12.620 |
entitle | +12.477 |
Neg logit contributions | |
Decay | -19.981 |
Reviewer | -19.605 |
estern | -19.387 |
BY | -19.246 |
WithNo | -19.016 |
Token | happen |
Token ID | 1645 |
Feature activation | -5.97e+00 |
Pos logit contributions | |
genders | +12.251 |
mattered | +12.015 |
equality | +11.703 |
wheelchair | +11.295 |
empowerment | +11.200 |
Neg logit contributions | |
Decay | -13.887 |
Reviewer | -13.851 |
BY | -13.313 |
estern | -12.560 |
WithNo | -12.370 |
Token | . |
Token ID | 13 |
Feature activation | +6.06e+00 |
Pos logit contributions | |
genders | +4.150 |
mattered | +3.805 |
blance | +3.799 |
empowerment | +3.789 |
equality | +3.755 |
Neg logit contributions | |
Decay | -4.704 |
BY | -4.634 |
than | -4.338 |
Geological | -4.272 |
unfavorable | -4.241 |
Token | Mer |
Token ID | 4638 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
BY | +3.692 |
Decay | +3.664 |
than | +3.329 |
Geological | +3.296 |
unfavorable | +3.171 |
Neg logit contributions | |
genders | -5.415 |
blance | -5.275 |
empowerment | -5.124 |
rils | -5.121 |
aults | -5.061 |
Token | ri |
Token ID | 380 |
Feature activation | -2.13e+00 |
Pos logit contributions | |
BY | +3.072 |
Decay | +2.946 |
than | +2.876 |
unfavorable | +2.754 |
periodic | +2.704 |
Neg logit contributions | |
genders | -3.102 |
blance | -2.939 |
empowerment | -2.888 |
mattered | -2.850 |
aults | -2.817 |
Token | either |
Token ID | 2035 |
Feature activation | +2.84e+00 |
Pos logit contributions | |
genders | +4.559 |
empowerment | +4.162 |
blance | +4.150 |
equality | +4.134 |
rights | +4.112 |
Neg logit contributions | |
BY | -4.286 |
Decay | -4.231 |
than | -3.902 |
Geological | -3.761 |
unfavorable | -3.741 |
Token | camp |
Token ID | 1413 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
BY | +1.908 |
Decay | +1.847 |
unfavorable | +1.770 |
than | +1.748 |
periodic | +1.702 |
Neg logit contributions | |
genders | -2.283 |
blance | -2.251 |
aults | -2.189 |
rils | -2.182 |
itans | -2.137 |
Token | of |
Token ID | 286 |
Feature activation | -5.63e+00 |
Pos logit contributions | |
BY | +0.132 |
Decay | +0.129 |
than | +0.121 |
unfavorable | +0.121 |
Geological | +0.118 |
Neg logit contributions | |
genders | -0.141 |
blance | -0.136 |
aults | -0.132 |
rils | -0.131 |
empowerment | -0.131 |
Token | the |
Token ID | 262 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
genders | +4.502 |
empowerment | +4.149 |
equality | +4.109 |
blance | +4.070 |
mattered | +4.059 |
Neg logit contributions | |
BY | -3.951 |
Decay | -3.929 |
than | -3.581 |
Geological | -3.507 |
unfavorable | -3.465 |
Token | debate |
Token ID | 4384 |
Feature activation | -2.24e+00 |
Pos logit contributions | |
genders | +8.451 |
equality | +7.722 |
empowerment | +7.670 |
wheelchair | +7.522 |
rights | +7.401 |
Neg logit contributions | |
BY | -7.484 |
Decay | -7.286 |
than | -6.826 |
Geological | -6.534 |
orally | -6.443 |
Token | about |
Token ID | 546 |
Feature activation | -2.89e+01 |
Pos logit contributions | |
genders | +1.716 |
blance | +1.616 |
mattered | +1.584 |
aults | +1.583 |
empowerment | +1.581 |
Neg logit contributions | |
BY | -1.648 |
Decay | -1.619 |
than | -1.501 |
unfavorable | -1.482 |
Geological | -1.473 |
Token | the |
Token ID | 262 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
equality | +18.786 |
genders | +18.481 |
empowerment | +17.274 |
feminism | +16.621 |
mattered | +16.065 |
Neg logit contributions | |
Decay | -15.712 |
BY | -15.694 |
Reviewer | -14.701 |
terness | -14.597 |
ngth | -14.333 |
Token | viability |
Token ID | 32141 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
genders | +11.379 |
equality | +10.921 |
empowerment | +10.595 |
mattered | +10.029 |
wheelchair | +9.990 |
Neg logit contributions | |
BY | -10.367 |
Decay | -9.976 |
than | -9.148 |
Geological | -9.033 |
terness | -9.003 |
Token | of |
Token ID | 286 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
genders | +6.912 |
blance | +6.570 |
equality | +6.477 |
mattered | +6.437 |
empowerment | +6.424 |
Neg logit contributions | |
BY | -9.483 |
Decay | -9.282 |
than | -8.705 |
Geological | -8.652 |
unfavorable | -8.507 |
Token | Hume |
Token ID | 45485 |
Feature activation | +3.80e+00 |
Pos logit contributions | |
genders | +11.995 |
equality | +11.668 |
empowerment | +11.012 |
feminism | +10.393 |
mattered | +10.340 |
Neg logit contributions | |
Decay | -11.188 |
BY | -11.073 |
Reviewer | -10.118 |
than | -10.068 |
terness | -9.987 |
Token | 's |
Token ID | 338 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
BY | +2.030 |
Decay | +1.967 |
than | +1.833 |
unfavorable | +1.811 |
periodic | +1.739 |
Neg logit contributions | |
genders | -3.629 |
blance | -3.526 |
aults | -3.448 |
rils | -3.433 |
empowerment | -3.393 |
Token | is |
Token ID | 318 |
Feature activation | +3.81e+00 |
Pos logit contributions | |
genders | +5.888 |
mattered | +5.545 |
aults | +5.420 |
blance | +5.379 |
equality | +5.368 |
Neg logit contributions | |
BY | -5.301 |
Decay | -5.236 |
than | -4.900 |
unfavorable | -4.759 |
periodic | -4.704 |
Token | the |
Token ID | 262 |
Feature activation | -3.18e+00 |
Pos logit contributions | |
BY | +2.557 |
Decay | +2.478 |
unfavorable | +2.349 |
than | +2.313 |
periodic | +2.259 |
Neg logit contributions | |
genders | -3.126 |
blance | -3.045 |
aults | -2.947 |
rils | -2.936 |
rights | -2.898 |
Token | first |
Token ID | 717 |
Feature activation | -2.38e+00 |
Pos logit contributions | |
genders | +2.304 |
blance | +2.138 |
empowerment | +2.131 |
aults | +2.109 |
mattered | +2.083 |
Neg logit contributions | |
BY | -2.449 |
Decay | -2.384 |
than | -2.260 |
unfavorable | -2.218 |
Geological | -2.201 |
Token | national |
Token ID | 2260 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
genders | +1.915 |
blance | +1.809 |
empowerment | +1.779 |
aults | +1.777 |
mattered | +1.767 |
Neg logit contributions | |
BY | -1.644 |
Decay | -1.604 |
than | -1.510 |
unfavorable | -1.479 |
Geological | -1.453 |
Token | survey |
Token ID | 5526 |
Feature activation | -6.53e-01 |
Pos logit contributions | |
BY | +0.727 |
Decay | +0.706 |
unfavorable | +0.658 |
than | +0.656 |
Geological | +0.637 |
Neg logit contributions | |
genders | -1.036 |
blance | -1.006 |
aults | -0.982 |
rils | -0.975 |
empowerment | -0.967 |
Token | on |
Token ID | 319 |
Feature activation | -2.88e+01 |
Pos logit contributions | |
genders | +0.521 |
blance | +0.500 |
aults | +0.486 |
empowerment | +0.484 |
rils | +0.482 |
Neg logit contributions | |
BY | -0.457 |
Decay | -0.446 |
than | -0.420 |
unfavorable | -0.416 |
Geological | -0.407 |
Token | the |
Token ID | 262 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
genders | +19.356 |
equality | +18.929 |
empowerment | +18.696 |
wheelchair | +17.405 |
barriers | +17.120 |
Neg logit contributions | |
Decay | -13.034 |
terness | -12.931 |
BY | -12.586 |
earchers | -12.319 |
than | -12.117 |
Token | pending |
Token ID | 13310 |
Feature activation | -7.76e+00 |
Pos logit contributions | |
genders | +15.058 |
empowerment | +14.283 |
equality | +14.103 |
wheelchair | +13.403 |
barriers | +13.279 |
Neg logit contributions | |
BY | -11.036 |
Decay | -10.383 |
terness | -10.363 |
Reviewer | -10.056 |
earchers | -9.981 |
Token | proposal |
Token ID | 6961 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
genders | +6.321 |
empowerment | +5.935 |
equality | +5.832 |
aults | +5.750 |
wheelchair | +5.737 |
Neg logit contributions | |
BY | -4.984 |
Decay | -4.789 |
than | -4.576 |
orally | -4.489 |
Geological | -4.401 |
Token | . |
Token ID | 13 |
Feature activation | -7.15e+00 |
Pos logit contributions | |
genders | +0.176 |
blance | +0.169 |
aults | +0.165 |
empowerment | +0.163 |
rils | +0.163 |
Neg logit contributions | |
BY | -0.155 |
Decay | -0.151 |
than | -0.142 |
unfavorable | -0.141 |
Geological | -0.138 |
Token |
|
Token ID | 198 |
Feature activation | -5.06e+00 |
Pos logit contributions | |
genders | +5.368 |
blance | +5.153 |
aults | +5.066 |
CLS | +5.039 |
mattered | +5.000 |
Neg logit contributions | |
BY | -4.723 |
Decay | -4.644 |
unfavorable | -4.550 |
periodic | -4.540 |
orally | -4.424 |
Token | � |
Token ID | 246 |
Feature activation | +5.29e+00 |
Pos logit contributions | |
genders | +2.795 |
blance | +2.728 |
aults | +2.654 |
rils | +2.638 |
rights | +2.622 |
Neg logit contributions | |
BY | -2.088 |
Decay | -2.037 |
than | -1.908 |
unfavorable | -1.893 |
orally | -1.827 |
Token | Far |
Token ID | 21428 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
BY | +3.485 |
Decay | +3.325 |
than | +3.180 |
unfavorable | +3.047 |
Geological | +3.009 |
Neg logit contributions | |
genders | -4.467 |
blance | -4.268 |
aults | -4.139 |
mattered | -4.138 |
empowerment | -4.133 |
Token | Away |
Token ID | 21986 |
Feature activation | +6.83e+00 |
Pos logit contributions | |
BY | +1.266 |
Decay | +1.237 |
than | +1.161 |
unfavorable | +1.146 |
Geological | +1.118 |
Neg logit contributions | |
genders | -1.638 |
blance | -1.575 |
aults | -1.536 |
empowerment | -1.522 |
rils | -1.519 |
Token | � |
Token ID | 447 |
Feature activation | -4.95e+00 |
Pos logit contributions | |
Decay | +4.440 |
BY | +4.414 |
than | +4.035 |
Geological | +4.013 |
unfavorable | +3.964 |
Neg logit contributions | |
genders | -5.592 |
blance | -5.439 |
aults | -5.271 |
rils | -5.206 |
rights | -5.187 |
Token | � |
Token ID | 247 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
genders | +3.552 |
blance | +3.411 |
aults | +3.317 |
rils | +3.311 |
empowerment | +3.276 |
Neg logit contributions | |
BY | -3.832 |
Decay | -3.662 |
than | -3.542 |
unfavorable | -3.494 |
orally | -3.429 |
Token | that |
Token ID | 326 |
Feature activation | -2.87e+01 |
Pos logit contributions | |
genders | +1.841 |
blance | +1.786 |
aults | +1.735 |
empowerment | +1.729 |
mattered | +1.715 |
Neg logit contributions | |
BY | -1.573 |
Decay | -1.527 |
unfavorable | -1.430 |
than | -1.424 |
Geological | -1.391 |
Token | stuck |
Token ID | 7819 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
mattered | +18.007 |
genders | +15.840 |
wheelchair | +15.067 |
empowerment | +14.689 |
equality | +14.524 |
Neg logit contributions | |
BY | -14.838 |
Decay | -14.761 |
than | -14.640 |
terness | -13.630 |
unfavorable | -13.560 |
Token | in |
Token ID | 287 |
Feature activation | -3.50e+00 |
Pos logit contributions | |
genders | +8.354 |
mattered | +7.947 |
empowerment | +7.753 |
blance | +7.700 |
aults | +7.633 |
Neg logit contributions | |
BY | -8.788 |
Decay | -8.463 |
than | -8.098 |
unfavorable | -7.945 |
Geological | -7.796 |
Token | the |
Token ID | 262 |
Feature activation | -7.43e+00 |
Pos logit contributions | |
genders | +2.730 |
blance | +2.626 |
aults | +2.564 |
mattered | +2.555 |
empowerment | +2.546 |
Neg logit contributions | |
BY | -2.451 |
Decay | -2.376 |
than | -2.246 |
unfavorable | -2.230 |
Geological | -2.183 |
Token | mind |
Token ID | 2000 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
genders | +4.974 |
aults | +4.711 |
blance | +4.663 |
empowerment | +4.611 |
mattered | +4.593 |
Neg logit contributions | |
BY | -5.797 |
Decay | -5.717 |
than | -5.408 |
unfavorable | -5.314 |
Geological | -5.228 |
Token | long |
Token ID | 890 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
genders | +7.865 |
blance | +7.699 |
aults | +7.648 |
mattered | +7.542 |
rils | +7.418 |
Neg logit contributions | |
BY | -9.174 |
Decay | -8.643 |
unfavorable | -8.303 |
than | -8.273 |
Geological | -8.127 |
Token | have |
Token ID | 423 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
genders | +8.319 |
mattered | +7.753 |
blance | +7.741 |
empowerment | +7.714 |
rights | +7.629 |
Neg logit contributions | |
Decay | -9.720 |
BY | -9.685 |
periodic | -8.858 |
unfavorable | -8.784 |
Geological | -8.762 |
Token | any |
Token ID | 597 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
genders | +9.245 |
empowerment | +8.455 |
equality | +8.436 |
rights | +8.173 |
blance | +8.108 |
Neg logit contributions | |
Decay | -12.481 |
BY | -12.412 |
than | -11.682 |
Geological | -11.353 |
hyde | -11.173 |
Token | room |
Token ID | 2119 |
Feature activation | -3.83e+00 |
Pos logit contributions | |
genders | +9.188 |
empowerment | +8.504 |
equality | +8.379 |
mattered | +8.178 |
blance | +8.159 |
Neg logit contributions | |
BY | -8.165 |
Decay | -8.039 |
than | -7.406 |
risome | -7.179 |
Geological | -7.135 |
Token | to |
Token ID | 284 |
Feature activation | -3.09e+00 |
Pos logit contributions | |
genders | +2.533 |
blance | +2.402 |
aults | +2.301 |
rights | +2.301 |
mattered | +2.299 |
Neg logit contributions | |
BY | -3.151 |
Decay | -3.140 |
than | -2.932 |
unfavorable | -2.906 |
Geological | -2.894 |
Token | speak |
Token ID | 2740 |
Feature activation | -6.70e+00 |
Pos logit contributions | |
genders | +2.509 |
blance | +2.375 |
empowerment | +2.336 |
aults | +2.317 |
mattered | +2.305 |
Neg logit contributions | |
BY | -2.113 |
Decay | -2.073 |
than | -1.911 |
unfavorable | -1.903 |
Geological | -1.862 |
Token | about |
Token ID | 546 |
Feature activation | -2.83e+01 |
Pos logit contributions | |
genders | +5.141 |
blance | +4.755 |
empowerment | +4.744 |
equality | +4.741 |
mattered | +4.694 |
Neg logit contributions | |
BY | -4.838 |
Decay | -4.690 |
than | -4.386 |
Geological | -4.256 |
periodic | -4.238 |
Token | how |
Token ID | 703 |
Feature activation | -2.40e+01 |
Pos logit contributions | |
genders | +17.777 |
equality | +17.148 |
empowerment | +16.367 |
feminism | +15.981 |
sexism | +15.075 |
Neg logit contributions | |
BY | -15.408 |
earchers | -15.232 |
terness | -14.682 |
Decay | -14.674 |
ngth | -14.153 |
Token | anybody |
Token ID | 9599 |
Feature activation | -5.03e+00 |
Pos logit contributions | |
genders | +16.808 |
equality | +15.534 |
empowerment | +15.328 |
mattered | +14.648 |
feminism | +14.519 |
Neg logit contributions | |
BY | -13.753 |
Decay | -13.139 |
hyde | -12.723 |
earchers | -12.544 |
than | -12.366 |
Token | on |
Token ID | 319 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
genders | +3.874 |
blance | +3.599 |
mattered | +3.584 |
empowerment | +3.525 |
aults | +3.505 |
Neg logit contributions | |
BY | -3.723 |
Decay | -3.643 |
than | -3.349 |
Geological | -3.287 |
unfavorable | -3.253 |
Token | the |
Token ID | 262 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
genders | +8.645 |
equality | +8.057 |
empowerment | +7.911 |
blance | +7.709 |
rights | +7.615 |
Neg logit contributions | |
BY | -9.562 |
Decay | -9.518 |
orally | -8.902 |
than | -8.870 |
Geological | -8.750 |
Token | left |
Token ID | 1364 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
genders | +11.045 |
equality | +9.925 |
empowerment | +9.639 |
wheelchair | +9.571 |
sexes | +8.891 |
Neg logit contributions | |
BY | -14.955 |
Decay | -14.594 |
terness | -13.829 |
than | -13.746 |
orally | -13.535 |
Token | EPA |
Token ID | 10193 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
BY | +0.670 |
Decay | +0.652 |
than | +0.610 |
unfavorable | +0.608 |
Geological | +0.591 |
Neg logit contributions | |
genders | -0.866 |
blance | -0.834 |
aults | -0.814 |
empowerment | -0.808 |
rils | -0.807 |
Token | � |
Token ID | 447 |
Feature activation | -4.85e+00 |
Pos logit contributions | |
BY | +6.592 |
Decay | +6.296 |
unfavorable | +5.972 |
periodic | +5.894 |
orally | +5.891 |
Neg logit contributions | |
genders | -7.994 |
blance | -7.894 |
aults | -7.651 |
rils | -7.645 |
itans | -7.575 |
Token | � |
Token ID | 247 |
Feature activation | +5.71e-01 |
Pos logit contributions | |
genders | +3.533 |
blance | +3.400 |
aults | +3.334 |
rils | +3.280 |
empowerment | +3.247 |
Neg logit contributions | |
BY | -3.672 |
Decay | -3.565 |
than | -3.369 |
unfavorable | -3.364 |
orally | -3.320 |
Token | s |
Token ID | 82 |
Feature activation | +9.51e-01 |
Pos logit contributions | |
BY | +0.373 |
Decay | +0.364 |
than | +0.340 |
unfavorable | +0.339 |
Geological | +0.329 |
Neg logit contributions | |
genders | -0.481 |
blance | -0.464 |
aults | -0.453 |
rils | -0.449 |
empowerment | -0.448 |
Token | civil |
Token ID | 3026 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
BY | +0.712 |
Decay | +0.696 |
than | +0.656 |
unfavorable | +0.654 |
Geological | +0.639 |
Neg logit contributions | |
genders | -0.712 |
blance | -0.683 |
aults | -0.665 |
empowerment | -0.658 |
rils | -0.658 |
Token | - |
Token ID | 12 |
Feature activation | -2.80e+01 |
Pos logit contributions | |
equality | +10.768 |
genders | +10.526 |
rights | +10.522 |
empowerment | +10.034 |
barriers | +8.838 |
Neg logit contributions | |
Decay | -19.318 |
BY | -18.021 |
risome | -17.318 |
earchers | -17.045 |
terness | -17.006 |
Token | rights |
Token ID | 28046 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
rights | +15.292 |
equality | +10.084 |
genders | +9.367 |
aults | +9.105 |
rils | +8.735 |
Neg logit contributions | |
Decay | -25.072 |
Expedition | -22.353 |
Nanto | -22.070 |
Disciple | -22.042 |
Geological | -21.967 |
Token | office |
Token ID | 2607 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
genders | +1.014 |
blance | +0.971 |
empowerment | +0.958 |
aults | +0.956 |
rils | +0.943 |
Neg logit contributions | |
BY | -0.782 |
Decay | -0.765 |
than | -0.712 |
unfavorable | -0.704 |
Geological | -0.690 |
Token | has |
Token ID | 468 |
Feature activation | +4.97e+00 |
Pos logit contributions | |
BY | +1.339 |
Decay | +1.302 |
than | +1.222 |
unfavorable | +1.220 |
Geological | +1.186 |
Neg logit contributions | |
genders | -1.682 |
blance | -1.628 |
aults | -1.587 |
rils | -1.574 |
empowerment | -1.565 |
Token | long |
Token ID | 890 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
BY | +3.306 |
Decay | +3.208 |
unfavorable | +3.086 |
than | +3.054 |
periodic | +3.030 |
Neg logit contributions | |
genders | -4.000 |
blance | -3.933 |
aults | -3.781 |
rils | -3.756 |
itans | -3.744 |
Token | been |
Token ID | 587 |
Feature activation | +4.59e+00 |
Pos logit contributions | |
BY | +1.657 |
Decay | +1.611 |
unfavorable | +1.534 |
than | +1.531 |
orally | +1.492 |
Neg logit contributions | |
genders | -1.680 |
blance | -1.629 |
aults | -1.573 |
rils | -1.557 |
empowerment | -1.553 |
Token | global |
Token ID | 3298 |
Feature activation | -8.70e+00 |
Pos logit contributions | |
genders | +7.984 |
empowerment | +7.631 |
equality | +7.518 |
mattered | +7.277 |
wheelchair | +7.186 |
Neg logit contributions | |
BY | -7.269 |
Decay | -7.192 |
than | -6.664 |
Reviewer | -6.522 |
unfavorable | -6.390 |
Token | isation |
Token ID | 5612 |
Feature activation | -2.52e+00 |
Pos logit contributions | |
genders | +5.874 |
empowerment | +5.687 |
equality | +5.496 |
mattered | +5.436 |
aults | +5.319 |
Neg logit contributions | |
BY | -6.800 |
Decay | -6.672 |
than | -6.237 |
Geological | -6.123 |
unfavorable | -6.073 |
Token | or |
Token ID | 393 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
genders | +2.044 |
blance | +1.934 |
empowerment | +1.915 |
mattered | +1.912 |
aults | +1.898 |
Neg logit contributions | |
BY | -1.722 |
Decay | -1.687 |
than | -1.575 |
unfavorable | -1.553 |
Geological | -1.527 |
Token | immigration |
Token ID | 6272 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
genders | +8.986 |
empowerment | +8.761 |
equality | +8.621 |
mattered | +8.240 |
wheelchair | +8.166 |
Neg logit contributions | |
BY | -8.000 |
Decay | -7.884 |
than | -7.396 |
Reviewer | -7.142 |
risome | -7.058 |
Token | that |
Token ID | 326 |
Feature activation | -1.69e+01 |
Pos logit contributions | |
genders | +8.113 |
empowerment | +7.870 |
mattered | +7.796 |
equality | +7.757 |
rights | +7.403 |
Neg logit contributions | |
BY | -8.586 |
Decay | -8.376 |
than | -7.777 |
Geological | -7.572 |
risome | -7.485 |
Token | has |
Token ID | 468 |
Feature activation | -2.78e+01 |
Pos logit contributions | |
mattered | +11.121 |
genders | +11.068 |
empowerment | +10.488 |
equality | +10.168 |
wheelchair | +10.044 |
Neg logit contributions | |
BY | -11.227 |
Decay | -11.042 |
than | -10.637 |
Reviewer | -10.426 |
terness | -9.939 |
Token | been |
Token ID | 587 |
Feature activation | -9.79e+00 |
Pos logit contributions | |
mattered | +17.060 |
genders | +15.408 |
empowerment | +14.690 |
equality | +14.455 |
wheelchair | +14.450 |
Neg logit contributions | |
Decay | -16.656 |
BY | -16.376 |
Reviewer | -16.320 |
than | -15.814 |
terness | -15.282 |
Token | creating |
Token ID | 4441 |
Feature activation | -2.22e+01 |
Pos logit contributions | |
genders | +6.825 |
mattered | +6.647 |
empowerment | +6.506 |
wheelchair | +6.340 |
blance | +6.305 |
Neg logit contributions | |
BY | -7.126 |
Decay | -7.091 |
than | -6.715 |
Geological | -6.484 |
periodic | -6.271 |
Token | a |
Token ID | 257 |
Feature activation | -2.03e+01 |
Pos logit contributions | |
barriers | +13.902 |
genders | +13.609 |
equality | +13.567 |
empowerment | +13.431 |
wheelchair | +12.790 |
Neg logit contributions | |
BY | -13.904 |
Decay | -13.422 |
Plot | -12.960 |
terness | -12.879 |
Reviewer | -12.842 |
Token | disp |
Token ID | 4596 |
Feature activation | -8.60e+00 |
Pos logit contributions | |
wheelchair | +12.799 |
empowerment | +12.717 |
genders | +12.690 |
equality | +12.287 |
mattered | +12.182 |
Neg logit contributions | |
BY | -12.698 |
Decay | -12.063 |
terness | -11.623 |
Plot | -11.411 |
earchers | -11.396 |
Token | oss |
Token ID | 793 |
Feature activation | -2.62e+00 |
Pos logit contributions | |
genders | +4.579 |
blance | +4.531 |
aults | +4.463 |
rils | +4.410 |
itans | +4.333 |
Neg logit contributions | |
Decay | -7.816 |
BY | -7.717 |
unfavorable | -7.212 |
Geological | -7.165 |
orally | -7.126 |
Token | but |
Token ID | 475 |
Feature activation | -4.11e+00 |
Pos logit contributions | |
genders | +6.436 |
blance | +6.016 |
empowerment | +5.981 |
aults | +5.928 |
mattered | +5.878 |
Neg logit contributions | |
BY | -5.986 |
Decay | -5.734 |
than | -5.438 |
unfavorable | -5.301 |
Geological | -5.219 |
Token | that |
Token ID | 326 |
Feature activation | -7.17e+00 |
Pos logit contributions | |
genders | +3.171 |
blance | +3.013 |
aults | +2.955 |
mattered | +2.943 |
empowerment | +2.941 |
Neg logit contributions | |
BY | -2.952 |
Decay | -2.837 |
than | -2.712 |
unfavorable | -2.653 |
Geological | -2.601 |
Token | didn |
Token ID | 1422 |
Feature activation | -8.58e+00 |
Pos logit contributions | |
genders | +4.938 |
mattered | +4.738 |
blance | +4.715 |
aults | +4.585 |
empowerment | +4.566 |
Neg logit contributions | |
BY | -5.473 |
Decay | -5.385 |
than | -5.096 |
unfavorable | -5.044 |
periodic | -4.914 |
Token | � |
Token ID | 447 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
genders | +6.128 |
aults | +5.995 |
rights | +5.830 |
itans | +5.821 |
OULD | +5.806 |
Neg logit contributions | |
Decay | -6.042 |
BY | -5.834 |
periodic | -5.794 |
unfavorable | -5.679 |
orally | -5.608 |
Token | � |
Token ID | 247 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
genders | +7.170 |
blance | +6.950 |
aults | +6.942 |
rils | +6.901 |
OULD | +6.730 |
Neg logit contributions | |
BY | -11.325 |
Decay | -10.920 |
than | -10.633 |
unfavorable | -10.475 |
orally | -10.451 |
Token | t |
Token ID | 83 |
Feature activation | -2.77e+01 |
Pos logit contributions | |
genders | +9.162 |
rils | +8.875 |
aults | +8.815 |
itans | +8.729 |
blance | +8.719 |
Neg logit contributions | |
BY | -6.832 |
Decay | -6.726 |
unfavorable | -6.087 |
orally | -6.077 |
periodic | -6.008 |
Token | cut |
Token ID | 2005 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
mattered | +14.905 |
genders | +14.489 |
equality | +13.972 |
wheelchair | +13.493 |
aults | +13.083 |
Neg logit contributions | |
Reviewer | -16.944 |
BY | -16.775 |
Decay | -16.655 |
terness | -15.221 |
estern | -15.193 |
Token | it |
Token ID | 340 |
Feature activation | -9.30e+00 |
Pos logit contributions | |
genders | +7.767 |
blance | +7.258 |
empowerment | +7.218 |
mattered | +7.167 |
equality | +7.147 |
Neg logit contributions | |
BY | -8.699 |
Decay | -8.286 |
than | -7.913 |
orally | -7.727 |
Geological | -7.688 |
Token | . |
Token ID | 13 |
Feature activation | -5.73e+00 |
Pos logit contributions | |
genders | +6.430 |
blance | +6.040 |
mattered | +6.028 |
aults | +6.012 |
empowerment | +5.842 |
Neg logit contributions | |
BY | -6.876 |
Decay | -6.690 |
than | -6.390 |
unfavorable | -6.240 |
periodic | -6.200 |
Token |
|
Token ID | 198 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
genders | +4.635 |
blance | +4.438 |
aults | +4.380 |
mattered | +4.346 |
rils | +4.307 |
Neg logit contributions | |
BY | -3.698 |
Decay | -3.469 |
unfavorable | -3.429 |
than | -3.365 |
periodic | -3.353 |
Token |
|
Token ID | 198 |
Feature activation | -6.49e+00 |
Pos logit contributions | |
genders | +1.072 |
blance | +1.018 |
aults | +0.997 |
rils | +0.981 |
rights | +0.979 |
Neg logit contributions | |
BY | -1.295 |
Decay | -1.274 |
unfavorable | -1.208 |
than | -1.200 |
periodic | -1.181 |
Token | but |
Token ID | 475 |
Feature activation | +3.13e+00 |
Pos logit contributions | |
BY | +3.228 |
Decay | +3.107 |
than | +2.976 |
unfavorable | +2.904 |
Geological | +2.868 |
Neg logit contributions | |
genders | -3.819 |
blance | -3.697 |
rils | -3.589 |
aults | -3.573 |
empowerment | -3.547 |
Token | it |
Token ID | 340 |
Feature activation | -4.99e+00 |
Pos logit contributions | |
BY | +2.177 |
Decay | +2.128 |
than | +2.004 |
unfavorable | +1.989 |
periodic | +1.938 |
Neg logit contributions | |
genders | -2.485 |
blance | -2.405 |
aults | -2.337 |
rils | -2.329 |
rights | -2.296 |
Token | hasn |
Token ID | 5818 |
Feature activation | -6.15e+00 |
Pos logit contributions | |
genders | +3.942 |
mattered | +3.784 |
blance | +3.737 |
aults | +3.698 |
empowerment | +3.612 |
Neg logit contributions | |
BY | -3.444 |
Decay | -3.406 |
unfavorable | -3.151 |
than | -3.130 |
periodic | -3.064 |
Token | � |
Token ID | 447 |
Feature activation | -8.30e+00 |
Pos logit contributions | |
genders | +4.799 |
aults | +4.634 |
blance | +4.566 |
rights | +4.539 |
itans | +4.494 |
Neg logit contributions | |
Decay | -4.105 |
BY | -4.063 |
unfavorable | -3.862 |
periodic | -3.859 |
orally | -3.763 |
Token | � |
Token ID | 247 |
Feature activation | -6.66e+00 |
Pos logit contributions | |
genders | +5.740 |
blance | +5.550 |
aults | +5.436 |
rils | +5.405 |
rights | +5.290 |
Neg logit contributions | |
BY | -6.404 |
Decay | -6.085 |
than | -5.912 |
unfavorable | -5.797 |
orally | -5.763 |
Token | t |
Token ID | 83 |
Feature activation | -2.73e+01 |
Pos logit contributions | |
genders | +6.067 |
aults | +5.891 |
mattered | +5.826 |
rils | +5.800 |
blance | +5.791 |
Neg logit contributions | |
BY | -3.704 |
Decay | -3.551 |
unfavorable | -3.248 |
than | -3.200 |
Geological | -3.166 |
Token | always |
Token ID | 1464 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
mattered | +16.890 |
genders | +15.269 |
wheelchair | +14.202 |
hood | +13.647 |
equality | +13.612 |
Neg logit contributions | |
Decay | -16.652 |
Reviewer | -16.535 |
BY | -16.438 |
than | -15.107 |
earchers | -14.789 |
Token | been |
Token ID | 587 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
mattered | +15.318 |
genders | +12.923 |
equality | +11.649 |
wheelchair | +11.393 |
aults | +11.315 |
Neg logit contributions | |
Decay | -17.528 |
BY | -17.331 |
Reviewer | -17.200 |
than | -16.417 |
iatus | -15.776 |
Token | like |
Token ID | 588 |
Feature activation | -5.23e+00 |
Pos logit contributions | |
genders | +7.042 |
mattered | +6.787 |
equality | +6.731 |
empowerment | +6.730 |
blance | +6.555 |
Neg logit contributions | |
BY | -7.397 |
Decay | -7.370 |
than | -6.703 |
orally | -6.650 |
unfavorable | -6.612 |
Token | that |
Token ID | 326 |
Feature activation | -8.15e+00 |
Pos logit contributions | |
genders | +3.975 |
empowerment | +3.760 |
blance | +3.745 |
mattered | +3.731 |
equality | +3.692 |
Neg logit contributions | |
BY | -3.727 |
Decay | -3.609 |
unfavorable | -3.420 |
than | -3.406 |
orally | -3.334 |
Token | . |
Token ID | 13 |
Feature activation | +7.98e-01 |
Pos logit contributions | |
genders | +5.498 |
mattered | +5.164 |
blance | +5.100 |
empowerment | +5.063 |
aults | +5.052 |
Neg logit contributions | |
BY | -6.281 |
Decay | -6.146 |
than | -5.850 |
unfavorable | -5.822 |
periodic | -5.688 |
Token | I |
Token ID | 314 |
Feature activation | -5.53e+00 |
Pos logit contributions | |
genders | +0.520 |
blance | +0.501 |
aults | +0.489 |
rils | +0.483 |
empowerment | +0.483 |
Neg logit contributions | |
BY | -0.442 |
Decay | -0.430 |
unfavorable | -0.407 |
than | -0.405 |
periodic | -0.395 |
Token | don |
Token ID | 836 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
genders | +4.271 |
mattered | +4.088 |
blance | +4.035 |
empowerment | +3.977 |
rils | +3.923 |
Neg logit contributions | |
BY | -3.847 |
Decay | -3.793 |
unfavorable | -3.536 |
than | -3.511 |
periodic | -3.451 |
Token | � |
Token ID | 447 |
Feature activation | -9.41e+00 |
Pos logit contributions | |
genders | +7.201 |
aults | +7.011 |
rights | +6.880 |
itans | +6.839 |
OULD | +6.798 |
Neg logit contributions | |
Decay | -7.912 |
periodic | -7.674 |
BY | -7.540 |
unfavorable | -7.473 |
orally | -7.361 |
Token | � |
Token ID | 247 |
Feature activation | -9.37e+00 |
Pos logit contributions | |
genders | +6.444 |
blance | +6.267 |
rils | +6.187 |
aults | +6.167 |
rights | +6.016 |
Neg logit contributions | |
BY | -7.029 |
Decay | -6.819 |
unfavorable | -6.451 |
than | -6.440 |
orally | -6.423 |
Token | t |
Token ID | 83 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
genders | +7.892 |
blance | +7.521 |
rils | +7.481 |
aults | +7.471 |
mattered | +7.401 |
Neg logit contributions | |
BY | -5.516 |
Decay | -5.440 |
unfavorable | -4.942 |
Geological | -4.893 |
orally | -4.791 |
Token | know |
Token ID | 760 |
Feature activation | -2.73e+01 |
Pos logit contributions | |
genders | +9.977 |
mattered | +9.511 |
wheelchair | +9.354 |
empowerment | +9.255 |
equality | +9.008 |
Neg logit contributions | |
BY | -12.570 |
Decay | -12.471 |
Reviewer | -11.794 |
earchers | -11.461 |
unfavorable | -11.411 |
Token | how |
Token ID | 703 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
genders | +13.367 |
who | +12.612 |
mattered | +12.420 |
empowerment | +12.340 |
equality | +12.108 |
Neg logit contributions | |
BY | -17.124 |
Decay | -16.902 |
earchers | -16.580 |
than | -16.455 |
risome | -16.307 |
Token | , |
Token ID | 11 |
Feature activation | -7.81e+00 |
Pos logit contributions | |
genders | +8.074 |
mattered | +7.568 |
empowerment | +7.486 |
blance | +7.357 |
wheelchair | +7.257 |
Neg logit contributions | |
BY | -8.991 |
Decay | -8.846 |
than | -8.420 |
Geological | -8.107 |
periodic | -8.000 |
Token | but |
Token ID | 475 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
genders | +6.009 |
mattered | +5.623 |
blance | +5.601 |
empowerment | +5.543 |
rils | +5.518 |
Neg logit contributions | |
BY | -5.324 |
Decay | -5.223 |
than | -4.870 |
unfavorable | -4.844 |
Geological | -4.777 |
Token | this |
Token ID | 428 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
BY | +0.891 |
Decay | +0.868 |
than | +0.815 |
unfavorable | +0.814 |
Geological | +0.792 |
Neg logit contributions | |
genders | -1.031 |
blance | -0.995 |
aults | -0.969 |
rils | -0.959 |
empowerment | -0.956 |
Token | is |
Token ID | 318 |
Feature activation | +6.08e-01 |
Pos logit contributions | |
genders | +1.243 |
blance | +1.194 |
empowerment | +1.172 |
mattered | +1.171 |
aults | +1.163 |
Neg logit contributions | |
BY | -0.982 |
Decay | -0.963 |
than | -0.896 |
unfavorable | -0.887 |
Geological | -0.866 |
Token | , |
Token ID | 11 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
genders | +1.633 |
blance | +1.543 |
empowerment | +1.514 |
mattered | +1.509 |
aults | +1.506 |
Neg logit contributions | |
BY | -1.616 |
Decay | -1.584 |
than | -1.490 |
unfavorable | -1.455 |
Geological | -1.445 |
Token | this |
Token ID | 428 |
Feature activation | -7.77e+00 |
Pos logit contributions | |
genders | +0.899 |
blance | +0.856 |
aults | +0.836 |
empowerment | +0.830 |
mattered | +0.825 |
Neg logit contributions | |
BY | -0.898 |
Decay | -0.875 |
than | -0.825 |
unfavorable | -0.816 |
Geological | -0.802 |
Token | arrangement |
Token ID | 13888 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
genders | +5.865 |
mattered | +5.660 |
empowerment | +5.554 |
equality | +5.467 |
wheelchair | +5.423 |
Neg logit contributions | |
BY | -5.482 |
Decay | -5.380 |
than | -4.951 |
Geological | -4.817 |
unfavorable | -4.687 |
Token | would |
Token ID | 561 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
genders | +7.544 |
mattered | +7.427 |
wheelchair | +6.754 |
equality | +6.721 |
empowerment | +6.618 |
Neg logit contributions | |
Decay | -8.987 |
BY | -8.824 |
than | -8.080 |
Reviewer | -8.002 |
Geological | -7.915 |
Token | not |
Token ID | 407 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
genders | +7.975 |
mattered | +7.489 |
equality | +7.391 |
wheelchair | +7.365 |
blance | +7.292 |
Neg logit contributions | |
BY | -7.641 |
Decay | -7.526 |
than | -6.821 |
Geological | -6.705 |
Reviewer | -6.579 |
Token | have |
Token ID | 423 |
Feature activation | -2.72e+01 |
Pos logit contributions | |
genders | +12.940 |
mattered | +12.197 |
equality | +12.168 |
wheelchair | +12.038 |
aults | +11.626 |
Neg logit contributions | |
Decay | -13.358 |
BY | -13.230 |
Reviewer | -12.048 |
estern | -11.877 |
than | -11.757 |
Token | function |
Token ID | 2163 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
mattered | +17.308 |
genders | +15.873 |
equality | +14.383 |
wheelchair | +14.250 |
barriers | +13.471 |
Neg logit contributions | |
Decay | -16.877 |
BY | -16.300 |
Reviewer | -15.787 |
terness | -15.293 |
than | -15.239 |
Token | ed |
Token ID | 276 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
genders | +8.087 |
mattered | +7.750 |
blance | +7.608 |
aults | +7.546 |
equality | +7.376 |
Neg logit contributions | |
Decay | -9.382 |
BY | -9.248 |
than | -8.525 |
Geological | -8.380 |
unfavorable | -8.074 |
Token | well |
Token ID | 880 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
genders | +8.481 |
mattered | +7.938 |
equality | +7.693 |
wheelchair | +7.687 |
aults | +7.664 |
Neg logit contributions | |
Decay | -8.872 |
BY | -8.675 |
than | -7.879 |
Geological | -7.778 |
risome | -7.681 |
Token | in |
Token ID | 287 |
Feature activation | +8.00e-01 |
Pos logit contributions | |
BY | +0.746 |
Decay | +0.725 |
than | +0.684 |
unfavorable | +0.684 |
orally | +0.664 |
Neg logit contributions | |
genders | -0.846 |
blance | -0.817 |
aults | -0.795 |
rils | -0.789 |
empowerment | -0.787 |
Token | a |
Token ID | 257 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
BY | +0.549 |
Decay | +0.535 |
than | +0.503 |
unfavorable | +0.502 |
Geological | +0.488 |
Neg logit contributions | |
genders | -0.647 |
blance | -0.625 |
aults | -0.608 |
rils | -0.604 |
empowerment | -0.601 |
Token | Lee |
Token ID | 5741 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
BY | +0.121 |
Decay | +0.118 |
than | +0.111 |
unfavorable | +0.111 |
Geological | +0.108 |
Neg logit contributions | |
genders | -0.140 |
blance | -0.134 |
aults | -0.131 |
empowerment | -0.130 |
rils | -0.130 |
Token | didn |
Token ID | 1422 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
BY | +1.568 |
Decay | +1.524 |
than | +1.437 |
unfavorable | +1.428 |
Geological | +1.397 |
Neg logit contributions | |
genders | -1.762 |
blance | -1.703 |
aults | -1.656 |
rils | -1.642 |
empowerment | -1.637 |
Token | � |
Token ID | 447 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
genders | +2.000 |
blance | +1.926 |
aults | +1.904 |
rils | +1.877 |
rights | +1.875 |
Neg logit contributions | |
BY | -1.302 |
Decay | -1.286 |
unfavorable | -1.190 |
than | -1.166 |
periodic | -1.161 |
Token | � |
Token ID | 247 |
Feature activation | -2.73e+00 |
Pos logit contributions | |
genders | +1.322 |
blance | +1.283 |
aults | +1.247 |
rils | +1.238 |
empowerment | +1.232 |
Neg logit contributions | |
BY | -1.064 |
Decay | -1.035 |
than | -0.971 |
unfavorable | -0.966 |
Geological | -0.941 |
Token | t |
Token ID | 83 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
genders | +2.612 |
blance | +2.523 |
aults | +2.480 |
rils | +2.466 |
mattered | +2.447 |
Neg logit contributions | |
BY | -1.458 |
Decay | -1.441 |
unfavorable | -1.281 |
than | -1.267 |
Geological | -1.260 |
Token | seem |
Token ID | 1283 |
Feature activation | -2.72e+01 |
Pos logit contributions | |
genders | +10.163 |
mattered | +9.598 |
wheelchair | +9.401 |
blance | +9.314 |
empowerment | +9.187 |
Neg logit contributions | |
BY | -10.366 |
Decay | -10.282 |
Reviewer | -9.456 |
unfavorable | -9.137 |
than | -9.018 |
Token | f |
Token ID | 277 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
genders | +14.979 |
mattered | +14.288 |
bothered | +14.222 |
empowerment | +14.073 |
wheelchair | +13.946 |
Neg logit contributions | |
Decay | -17.072 |
BY | -16.015 |
Reviewer | -14.523 |
risome | -14.332 |
Geological | -14.140 |
Token | azed |
Token ID | 13865 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
genders | +4.505 |
aults | +4.136 |
blance | +4.126 |
rights | +4.017 |
itans | +3.951 |
Neg logit contributions | |
Decay | -12.538 |
BY | -12.463 |
unfavorable | -11.740 |
periodic | -11.483 |
Geological | -11.457 |
Token | . |
Token ID | 13 |
Feature activation | -3.65e+00 |
Pos logit contributions | |
BY | +6.620 |
Decay | +6.275 |
orally | +5.982 |
unfavorable | +5.944 |
than | +5.886 |
Neg logit contributions | |
genders | -9.264 |
blance | -9.101 |
aults | -8.923 |
rils | -8.885 |
itans | -8.801 |
Token |
|
Token ID | 198 |
Feature activation | +5.16e-01 |
Pos logit contributions | |
genders | +2.788 |
blance | +2.689 |
aults | +2.618 |
rils | +2.595 |
mattered | +2.593 |
Neg logit contributions | |
BY | -2.574 |
Decay | -2.491 |
unfavorable | -2.410 |
than | -2.368 |
periodic | -2.360 |
Token |
|
Token ID | 198 |
Feature activation | -3.24e+00 |
Pos logit contributions | |
BY | +0.403 |
Decay | +0.391 |
than | +0.374 |
unfavorable | +0.368 |
Geological | +0.363 |
Neg logit contributions | |
genders | -0.374 |
blance | -0.361 |
aults | -0.347 |
empowerment | -0.346 |
rils | -0.345 |
Token | wich |
Token ID | 11451 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
itans | +9.865 |
mattered | +9.821 |
genders | +9.763 |
rils | +9.624 |
blance | +9.561 |
Neg logit contributions | |
Decay | -11.909 |
BY | -11.861 |
unfavorable | -11.327 |
periodic | -11.267 |
orally | -10.845 |
Token | Albion |
Token ID | 47995 |
Feature activation | -1.89e+01 |
Pos logit contributions | |
genders | +4.997 |
itans | +4.955 |
aults | +4.853 |
mattered | +4.770 |
rights | +4.731 |
Neg logit contributions | |
Decay | -9.927 |
BY | -9.565 |
unfavorable | -9.411 |
periodic | -9.276 |
orally | -9.229 |
Token | at |
Token ID | 379 |
Feature activation | -7.27e+00 |
Pos logit contributions | |
mattered | +10.161 |
genders | +10.108 |
equality | +9.761 |
itans | +9.755 |
rils | +9.483 |
Neg logit contributions | |
Decay | -13.152 |
BY | -13.054 |
unfavorable | -12.424 |
periodic | -12.405 |
Reviewer | -12.063 |
Token | Anfield |
Token ID | 44303 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
genders | +5.181 |
aults | +4.821 |
blance | +4.809 |
empowerment | +4.782 |
wheelchair | +4.774 |
Neg logit contributions | |
Decay | -5.341 |
BY | -5.266 |
unfavorable | -5.066 |
than | -4.890 |
orally | -4.832 |
Token | in |
Token ID | 287 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
genders | +11.318 |
mattered | +11.065 |
equality | +11.019 |
itans | +10.770 |
empowerment | +10.658 |
Neg logit contributions | |
Decay | -14.281 |
BY | -13.924 |
unfavorable | -13.315 |
Reviewer | -13.128 |
periodic | -12.919 |
Token | October |
Token ID | 3267 |
Feature activation | -2.71e+01 |
Pos logit contributions | |
genders | +9.738 |
equality | +9.358 |
empowerment | +8.943 |
wheelchair | +8.856 |
itans | +8.511 |
Neg logit contributions | |
Decay | -13.981 |
Reviewer | -13.924 |
BY | -13.870 |
hyde | -13.154 |
terness | -13.125 |
Token | . |
Token ID | 13 |
Feature activation | -8.78e+00 |
Pos logit contributions | |
genders | +12.450 |
mattered | +12.178 |
equality | +11.912 |
2012 | +11.641 |
1992 | +11.625 |
Neg logit contributions | |
BY | -17.849 |
Decay | -17.692 |
earchers | -17.240 |
hyde | -17.021 |
Reviewer | -16.970 |
Token | Photograph |
Token ID | 18903 |
Feature activation | +9.19e+00 |
Pos logit contributions | |
genders | +4.712 |
blance | +4.570 |
itans | +4.550 |
rils | +4.413 |
aults | +4.406 |
Neg logit contributions | |
BY | -7.461 |
unfavorable | -7.319 |
Decay | -7.258 |
periodic | -7.189 |
orally | -7.032 |
Token | : |
Token ID | 25 |
Feature activation | -5.29e+00 |
Pos logit contributions | |
BY | +3.614 |
Decay | +3.264 |
than | +3.260 |
Geological | +3.096 |
unfavorable | +2.719 |
Neg logit contributions | |
blance | -9.712 |
genders | -9.699 |
empowerment | -9.451 |
rights | -9.261 |
rils | -9.203 |
Token | Clive |
Token ID | 47722 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
genders | +3.494 |
blance | +3.313 |
aults | +3.291 |
itans | +3.237 |
mattered | +3.229 |
Neg logit contributions | |
BY | -4.161 |
Decay | -4.116 |
unfavorable | -3.982 |
periodic | -3.861 |
than | -3.846 |
Token | Brun |
Token ID | 15700 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
genders | +0.823 |
blance | +0.789 |
aults | +0.769 |
empowerment | +0.760 |
rils | +0.759 |
Neg logit contributions | |
BY | -0.810 |
Decay | -0.791 |
unfavorable | -0.746 |
than | -0.746 |
Geological | -0.726 |
Token | EPA |
Token ID | 10193 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
BY | +1.074 |
Decay | +1.047 |
than | +0.981 |
unfavorable | +0.979 |
Geological | +0.954 |
Neg logit contributions | |
genders | -1.300 |
blance | -1.256 |
aults | -1.224 |
rils | -1.212 |
empowerment | -1.205 |
Token | � |
Token ID | 447 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
BY | +7.294 |
Decay | +6.901 |
than | +6.533 |
Geological | +6.494 |
periodic | +6.482 |
Neg logit contributions | |
genders | -10.196 |
blance | -10.101 |
aults | -9.888 |
itans | -9.768 |
rils | -9.661 |
Token | � |
Token ID | 247 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
genders | +1.052 |
blance | +1.014 |
aults | +0.988 |
rils | +0.978 |
empowerment | +0.975 |
Neg logit contributions | |
BY | -0.949 |
Decay | -0.924 |
than | -0.869 |
unfavorable | -0.867 |
Geological | -0.844 |
Token | s |
Token ID | 82 |
Feature activation | +2.74e+00 |
Pos logit contributions | |
BY | +1.204 |
Decay | +1.167 |
than | +1.104 |
unfavorable | +1.089 |
Geological | +1.062 |
Neg logit contributions | |
genders | -1.653 |
blance | -1.603 |
aults | -1.553 |
rils | -1.546 |
empowerment | -1.545 |
Token | civil |
Token ID | 3026 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
BY | +2.096 |
Decay | +2.048 |
than | +1.943 |
unfavorable | +1.939 |
periodic | +1.900 |
Neg logit contributions | |
genders | -1.993 |
blance | -1.926 |
aults | -1.866 |
rils | -1.843 |
rights | -1.835 |
Token | - |
Token ID | 12 |
Feature activation | -2.71e+01 |
Pos logit contributions | |
equality | +9.637 |
genders | +9.545 |
rights | +9.517 |
empowerment | +9.206 |
wheelchair | +8.040 |
Neg logit contributions | |
Decay | -16.611 |
BY | -15.619 |
risome | -14.635 |
than | -14.505 |
Geological | -14.471 |
Token | rights |
Token ID | 28046 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
rights | +14.454 |
equality | +9.494 |
genders | +8.796 |
aults | +8.410 |
rils | +8.057 |
Neg logit contributions | |
Decay | -25.349 |
Expedition | -22.511 |
Geological | -22.182 |
Disciple | -22.175 |
orally | -22.119 |
Token | office |
Token ID | 2607 |
Feature activation | +6.71e+00 |
Pos logit contributions | |
genders | +0.113 |
blance | +0.109 |
aults | +0.107 |
empowerment | +0.107 |
rils | +0.106 |
Neg logit contributions | |
BY | -0.085 |
Decay | -0.083 |
than | -0.077 |
unfavorable | -0.077 |
Geological | -0.075 |
Token | : |
Token ID | 25 |
Feature activation | +7.99e+00 |
Pos logit contributions | |
BY | +4.112 |
Decay | +3.952 |
than | +3.767 |
unfavorable | +3.690 |
periodic | +3.645 |
Neg logit contributions | |
genders | -5.750 |
blance | -5.585 |
aults | -5.495 |
rils | -5.398 |
rights | -5.390 |
Token | develop |
Token ID | 1205 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
BY | +5.611 |
Decay | +5.471 |
periodic | +5.180 |
unfavorable | +5.171 |
than | +5.141 |
Neg logit contributions | |
genders | -6.040 |
blance | -5.891 |
aults | -5.754 |
rights | -5.602 |
rils | -5.598 |
Token | a |
Token ID | 257 |
Feature activation | -5.85e+00 |
Pos logit contributions | |
genders | +1.669 |
blance | +1.586 |
empowerment | +1.564 |
aults | +1.560 |
rils | +1.543 |
Neg logit contributions | |
BY | -1.493 |
Decay | -1.469 |
than | -1.364 |
unfavorable | -1.358 |
Geological | -1.338 |
Token | University |
Token ID | 2059 |
Feature activation | -1.00e+01 |
Pos logit contributions | |
genders | +1.108 |
blance | +1.069 |
aults | +1.049 |
rils | +1.043 |
empowerment | +1.043 |
Neg logit contributions | |
BY | -0.715 |
Decay | -0.687 |
unfavorable | -0.649 |
than | -0.644 |
orally | -0.619 |
Token | , |
Token ID | 11 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
genders | +6.724 |
empowerment | +6.376 |
blance | +6.254 |
rils | +6.138 |
equality | +6.097 |
Neg logit contributions | |
BY | -7.455 |
Decay | -7.189 |
unfavorable | -7.099 |
than | -6.732 |
orally | -6.690 |
Token | he |
Token ID | 339 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
genders | +8.025 |
empowerment | +7.460 |
CLS | +7.433 |
aults | +7.391 |
blance | +7.367 |
Neg logit contributions | |
BY | -8.802 |
Decay | -8.352 |
unfavorable | -8.059 |
than | -8.038 |
orally | -7.919 |
Token | continues |
Token ID | 4477 |
Feature activation | +5.76e+00 |
Pos logit contributions | |
genders | +1.917 |
blance | +1.797 |
aults | +1.790 |
mattered | +1.776 |
empowerment | +1.762 |
Neg logit contributions | |
BY | -1.615 |
Decay | -1.574 |
unfavorable | -1.464 |
than | -1.463 |
Geological | -1.409 |
Token | to |
Token ID | 284 |
Feature activation | +5.87e+00 |
Pos logit contributions | |
BY | +4.138 |
Decay | +4.026 |
than | +3.818 |
unfavorable | +3.796 |
periodic | +3.760 |
Neg logit contributions | |
genders | -4.384 |
blance | -4.235 |
aults | -4.108 |
itans | -4.012 |
mattered | -3.998 |
Token | investigate |
Token ID | 9161 |
Feature activation | -2.71e+01 |
Pos logit contributions | |
BY | +3.928 |
Decay | +3.837 |
orally | +3.676 |
than | +3.656 |
unfavorable | +3.643 |
Neg logit contributions | |
genders | -4.634 |
blance | -4.578 |
aults | -4.439 |
rights | -4.346 |
rils | -4.310 |
Token | the |
Token ID | 262 |
Feature activation | -2.00e+01 |
Pos logit contributions | |
genders | +16.145 |
empowerment | +16.116 |
equality | +16.004 |
barriers | +15.738 |
mattered | +14.975 |
Neg logit contributions | |
BY | -14.380 |
Decay | -14.238 |
terness | -14.051 |
iatus | -13.171 |
Reviewer | -12.934 |
Token | intriguing |
Token ID | 19827 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
genders | +14.051 |
empowerment | +13.989 |
equality | +13.395 |
barriers | +13.301 |
wheelchair | +12.868 |
Neg logit contributions | |
BY | -11.691 |
terness | -10.699 |
Decay | -10.675 |
Reviewer | -10.537 |
than | -10.006 |
Token | and |
Token ID | 290 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
genders | +8.225 |
empowerment | +7.771 |
equality | +7.597 |
aults | +7.311 |
mattered | +7.304 |
Neg logit contributions | |
BY | -8.569 |
Decay | -8.354 |
than | -7.805 |
unfavorable | -7.741 |
terness | -7.618 |
Token | often |
Token ID | 1690 |
Feature activation | +3.59e+00 |
Pos logit contributions | |
genders | +1.358 |
blance | +1.296 |
empowerment | +1.270 |
aults | +1.269 |
rils | +1.261 |
Neg logit contributions | |
BY | -1.098 |
Decay | -1.075 |
than | -0.999 |
unfavorable | -0.989 |
Geological | -0.973 |
Token | terrifying |
Token ID | 17623 |
Feature activation | -9.45e+00 |
Pos logit contributions | |
BY | +2.442 |
Decay | +2.324 |
unfavorable | +2.269 |
than | +2.225 |
periodic | +2.188 |
Neg logit contributions | |
genders | -2.894 |
blance | -2.861 |
aults | -2.760 |
rils | -2.723 |
rights | -2.718 |
Token | � |
Token ID | 250 |
Feature activation | +5.98e+00 |
Pos logit contributions | |
BY | +6.330 |
Decay | +6.202 |
unfavorable | +5.805 |
than | +5.755 |
periodic | +5.551 |
Neg logit contributions | |
genders | -8.206 |
blance | -7.644 |
empowerment | -7.599 |
aults | -7.527 |
wheelchair | -7.501 |
Token | Better |
Token ID | 28971 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
BY | +4.203 |
Decay | +3.968 |
than | +3.908 |
unfavorable | +3.715 |
Geological | +3.619 |
Neg logit contributions | |
genders | -4.756 |
blance | -4.574 |
rils | -4.415 |
aults | -4.384 |
empowerment | -4.384 |
Token | to |
Token ID | 284 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
BY | +9.295 |
than | +8.797 |
Decay | +8.591 |
unfavorable | +8.339 |
Geological | +8.315 |
Neg logit contributions | |
genders | -9.725 |
blance | -9.433 |
aults | -9.190 |
rights | -9.017 |
rils | -9.008 |
Token | remain |
Token ID | 3520 |
Feature activation | +7.59e+00 |
Pos logit contributions | |
BY | +7.827 |
Decay | +7.711 |
than | +7.522 |
unfavorable | +7.254 |
Geological | +7.160 |
Neg logit contributions | |
blance | -8.694 |
genders | -8.678 |
aults | -8.319 |
rils | -8.279 |
rights | -8.136 |
Token | silent |
Token ID | 10574 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
BY | +5.234 |
Decay | +5.107 |
unfavorable | +4.929 |
than | +4.920 |
orally | +4.757 |
Neg logit contributions | |
genders | -5.832 |
blance | -5.701 |
rils | -5.548 |
aults | -5.480 |
rights | -5.430 |
Token | and |
Token ID | 290 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
than | +7.881 |
BY | +7.871 |
Decay | +7.826 |
unfavorable | +7.428 |
orally | +7.340 |
Neg logit contributions | |
blance | -10.403 |
genders | -10.388 |
rils | -9.928 |
empowerment | -9.755 |
CLS | -9.737 |
Token | be |
Token ID | 307 |
Feature activation | +7.16e+00 |
Pos logit contributions | |
unfavorable | +10.487 |
BY | +10.331 |
Decay | +10.305 |
than | +10.126 |
orally | +10.045 |
Neg logit contributions | |
blance | -11.551 |
genders | -11.203 |
aults | -10.959 |
rils | -10.794 |
itans | -10.643 |
Token | thought |
Token ID | 1807 |
Feature activation | +6.67e+00 |
Pos logit contributions | |
BY | +5.347 |
Decay | +5.166 |
unfavorable | +5.065 |
than | +5.023 |
periodic | +4.855 |
Neg logit contributions | |
genders | -5.145 |
blance | -5.050 |
rils | -4.824 |
aults | -4.784 |
rights | -4.711 |
Token | a |
Token ID | 257 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
BY | +4.586 |
Decay | +4.426 |
unfavorable | +4.385 |
than | +4.266 |
orally | +4.181 |
Neg logit contributions | |
genders | -5.193 |
blance | -5.020 |
rils | -4.845 |
empowerment | -4.784 |
aults | -4.767 |
Token | fool |
Token ID | 9192 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
BY | +7.916 |
Decay | +7.842 |
unfavorable | +7.414 |
than | +7.394 |
periodic | +7.280 |
Neg logit contributions | |
genders | -8.399 |
blance | -8.289 |
rils | -8.034 |
aults | -7.716 |
empowerment | -7.470 |
Token | , |
Token ID | 11 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
than | +11.412 |
BY | +11.410 |
Decay | +11.092 |
unfavorable | +10.614 |
orally | +10.329 |
Neg logit contributions | |
genders | -10.933 |
blance | -10.547 |
rils | -10.240 |
CLS | -10.107 |
wheelchair | -10.052 |
Token | rast |
Token ID | 5685 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
genders | +1.121 |
blance | +1.041 |
aults | +1.015 |
rils | +0.996 |
rights | +0.980 |
Neg logit contributions | |
BY | -2.431 |
Decay | -2.403 |
unfavorable | -2.297 |
than | -2.289 |
Geological | -2.249 |
Token | inated |
Token ID | 3898 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
genders | +1.509 |
blance | +1.455 |
aults | +1.420 |
rils | +1.406 |
empowerment | +1.401 |
Neg logit contributions | |
BY | -1.229 |
Decay | -1.199 |
than | -1.121 |
unfavorable | -1.120 |
Geological | -1.088 |
Token | in |
Token ID | 287 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
BY | +8.402 |
orally | +8.302 |
unfavorable | +8.105 |
periodic | +8.052 |
than | +7.965 |
Neg logit contributions | |
blance | -11.724 |
itans | -11.441 |
rils | -11.398 |
aults | -11.286 |
genders | -11.205 |
Token | writing |
Token ID | 3597 |
Feature activation | +9.23e+00 |
Pos logit contributions | |
BY | +6.490 |
Decay | +6.268 |
unfavorable | +6.156 |
periodic | +6.004 |
than | +5.924 |
Neg logit contributions | |
blance | -8.300 |
genders | -8.246 |
aults | -7.974 |
rils | -7.892 |
itans | -7.808 |
Token | them |
Token ID | 606 |
Feature activation | +5.94e+00 |
Pos logit contributions | |
BY | +5.842 |
Decay | +5.790 |
unfavorable | +5.593 |
periodic | +5.500 |
orally | +5.422 |
Neg logit contributions | |
blance | -7.274 |
genders | -7.206 |
rils | -7.024 |
itans | -6.946 |
aults | -6.939 |
Token | , |
Token ID | 11 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
BY | +3.907 |
Decay | +3.801 |
unfavorable | +3.662 |
orally | +3.627 |
than | +3.602 |
Neg logit contributions | |
genders | -4.786 |
blance | -4.725 |
rils | -4.555 |
aults | -4.518 |
itans | -4.500 |
Token | often |
Token ID | 1690 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
BY | +8.889 |
Decay | +8.791 |
unfavorable | +8.512 |
periodic | +8.468 |
orally | +8.447 |
Neg logit contributions | |
blance | -10.050 |
genders | -9.738 |
rils | -9.663 |
itans | -9.644 |
aults | -9.478 |
Token | changing |
Token ID | 5609 |
Feature activation | +5.49e+00 |
Pos logit contributions | |
BY | +9.177 |
orally | +9.043 |
unfavorable | +8.926 |
periodic | +8.749 |
Decay | +8.601 |
Neg logit contributions | |
blance | -10.943 |
rils | -10.696 |
itans | -10.444 |
rights | -10.282 |
genders | -10.256 |
Token | the |
Token ID | 262 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
BY | +3.526 |
Decay | +3.448 |
unfavorable | +3.315 |
than | +3.219 |
periodic | +3.203 |
Neg logit contributions | |
blance | -4.434 |
genders | -4.401 |
rils | -4.315 |
aults | -4.286 |
rights | -4.271 |
Token | content |
Token ID | 2695 |
Feature activation | +7.10e+00 |
Pos logit contributions | |
BY | +1.687 |
Decay | +1.652 |
unfavorable | +1.563 |
than | +1.561 |
periodic | +1.522 |
Neg logit contributions | |
genders | -1.856 |
blance | -1.829 |
aults | -1.772 |
rils | -1.769 |
rights | -1.753 |
Token | and |
Token ID | 290 |
Feature activation | +7.75e+00 |
Pos logit contributions | |
Decay | +4.579 |
BY | +4.578 |
unfavorable | +4.358 |
orally | +4.306 |
periodic | +4.238 |
Neg logit contributions | |
genders | -5.562 |
blance | -5.554 |
itans | -5.404 |
aults | -5.368 |
rils | -5.324 |
Token | . |
Token ID | 13 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
genders | +2.441 |
aults | +2.280 |
blance | +2.275 |
rights | +2.237 |
empowerment | +2.237 |
Neg logit contributions | |
BY | -2.674 |
Decay | -2.631 |
than | -2.475 |
unfavorable | -2.440 |
Geological | -2.377 |
Token |
|
Token ID | 198 |
Feature activation | +5.97e+00 |
Pos logit contributions | |
BY | +0.956 |
Decay | +0.934 |
unfavorable | +0.887 |
than | +0.886 |
Geological | +0.861 |
Neg logit contributions | |
genders | -0.835 |
blance | -0.799 |
aults | -0.777 |
rils | -0.767 |
empowerment | -0.767 |
Token |
|
Token ID | 198 |
Feature activation | +8.54e+00 |
Pos logit contributions | |
BY | +4.041 |
than | +3.752 |
Decay | +3.731 |
Geological | +3.568 |
unfavorable | +3.452 |
Neg logit contributions | |
genders | -4.937 |
blance | -4.921 |
empowerment | -4.699 |
mattered | -4.635 |
rils | -4.627 |
Token | D |
Token ID | 35 |
Feature activation | +5.92e-01 |
Pos logit contributions | |
BY | +5.595 |
Decay | +5.000 |
than | +4.996 |
Geological | +4.616 |
unfavorable | +4.578 |
Neg logit contributions | |
genders | -7.434 |
blance | -7.040 |
mattered | -6.880 |
aults | -6.810 |
rils | -6.786 |
Token | uke |
Token ID | 4649 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
BY | +0.442 |
Decay | +0.433 |
unfavorable | +0.407 |
than | +0.406 |
Geological | +0.397 |
Neg logit contributions | |
genders | -0.443 |
blance | -0.426 |
aults | -0.416 |
rils | -0.410 |
empowerment | -0.409 |
Token | Energy |
Token ID | 6682 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
Decay | +9.333 |
BY | +9.281 |
Geological | +8.918 |
than | +8.439 |
unfavorable | +8.395 |
Neg logit contributions | |
genders | -12.860 |
blance | -12.775 |
rils | -12.294 |
aults | -12.163 |
itans | -12.027 |
Token | � |
Token ID | 447 |
Feature activation | -6.43e+00 |
Pos logit contributions | |
BY | +10.687 |
Decay | +10.659 |
Geological | +10.266 |
periodic | +10.030 |
unfavorable | +9.962 |
Neg logit contributions | |
blance | -12.371 |
genders | -12.245 |
rils | -11.750 |
itans | -11.595 |
aults | -11.492 |
Token | � |
Token ID | 247 |
Feature activation | +4.25e+00 |
Pos logit contributions | |
genders | +4.487 |
blance | +4.344 |
aults | +4.282 |
rils | +4.217 |
rights | +4.124 |
Neg logit contributions | |
BY | -5.053 |
Decay | -4.834 |
than | -4.648 |
unfavorable | -4.626 |
orally | -4.554 |
Token | s |
Token ID | 82 |
Feature activation | +6.38e+00 |
Pos logit contributions | |
BY | +2.637 |
Decay | +2.567 |
than | +2.410 |
unfavorable | +2.391 |
Geological | +2.334 |
Neg logit contributions | |
genders | -3.682 |
blance | -3.576 |
aults | -3.466 |
rils | -3.450 |
empowerment | -3.436 |
Token | considered |
Token ID | 3177 |
Feature activation | -8.47e-01 |
Pos logit contributions | |
BY | +4.382 |
Decay | +4.321 |
unfavorable | +4.070 |
than | +4.030 |
periodic | +3.995 |
Neg logit contributions | |
genders | -5.030 |
blance | -4.893 |
rils | -4.717 |
aults | -4.709 |
rights | -4.664 |
Token | retirement |
Token ID | 10737 |
Feature activation | -2.61e+00 |
Pos logit contributions | |
genders | +0.684 |
blance | +0.658 |
aults | +0.645 |
empowerment | +0.638 |
rights | +0.634 |
Neg logit contributions | |
BY | -0.582 |
Decay | -0.566 |
than | -0.530 |
unfavorable | -0.524 |
Geological | -0.514 |
Token | , |
Token ID | 11 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
BY | +2.240 |
Decay | +2.177 |
unfavorable | +2.059 |
than | +2.049 |
periodic | +2.008 |
Neg logit contributions | |
genders | -2.586 |
blance | -2.529 |
aults | -2.469 |
rils | -2.452 |
rights | -2.420 |
Token | al |
Token ID | 435 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
BY | +3.316 |
Decay | +3.219 |
unfavorable | +3.072 |
than | +3.040 |
periodic | +3.027 |
Neg logit contributions | |
genders | -3.576 |
blance | -3.563 |
aults | -3.456 |
rils | -3.455 |
rights | -3.363 |
Token | - |
Token ID | 12 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
BY | +1.247 |
Decay | +1.210 |
than | +1.151 |
unfavorable | +1.137 |
Geological | +1.120 |
Neg logit contributions | |
genders | -1.312 |
blance | -1.284 |
aults | -1.230 |
rils | -1.227 |
mattered | -1.216 |
Token | Sh |
Token ID | 2484 |
Feature activation | +3.85e+00 |
Pos logit contributions | |
BY | +5.782 |
Decay | +5.388 |
than | +5.165 |
periodic | +4.861 |
unfavorable | +4.841 |
Neg logit contributions | |
genders | -9.156 |
blance | -8.953 |
aults | -8.596 |
rils | -8.547 |
mattered | -8.474 |
Token | ab |
Token ID | 397 |
Feature activation | +6.29e+00 |
Pos logit contributions | |
BY | +2.438 |
Decay | +2.308 |
than | +2.250 |
unfavorable | +2.158 |
Geological | +2.110 |
Neg logit contributions | |
genders | -3.345 |
blance | -3.170 |
CLS | -3.111 |
empowerment | -3.097 |
mattered | -3.082 |
Token | ab |
Token ID | 397 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
BY | +3.722 |
Decay | +3.469 |
than | +3.455 |
unfavorable | +3.294 |
periodic | +3.188 |
Neg logit contributions | |
genders | -5.646 |
blance | -5.334 |
CLS | -5.333 |
empowerment | -5.203 |
mattered | -5.179 |
Token | has |
Token ID | 468 |
Feature activation | +8.79e+00 |
Pos logit contributions | |
BY | +11.691 |
periodic | +11.606 |
orally | +11.356 |
Decay | +11.294 |
than | +11.101 |
Neg logit contributions | |
blance | -13.577 |
rils | -12.327 |
CLS | -12.157 |
genders | -12.062 |
aults | -12.057 |
Token | increasingly |
Token ID | 6481 |
Feature activation | +6.81e+00 |
Pos logit contributions | |
BY | +6.199 |
Decay | +6.011 |
orally | +5.920 |
unfavorable | +5.867 |
periodic | +5.826 |
Neg logit contributions | |
blance | -6.426 |
genders | -6.218 |
aults | -5.970 |
rils | -5.960 |
rights | -5.928 |
Token | been |
Token ID | 587 |
Feature activation | +8.20e+00 |
Pos logit contributions | |
BY | +4.922 |
Decay | +4.743 |
unfavorable | +4.672 |
orally | +4.627 |
than | +4.612 |
Neg logit contributions | |
blance | -4.961 |
genders | -4.847 |
aults | -4.700 |
rils | -4.655 |
rights | -4.641 |
Token | forcibly |
Token ID | 30522 |
Feature activation | +5.00e+00 |
Pos logit contributions | |
BY | +5.915 |
Decay | +5.633 |
unfavorable | +5.565 |
than | +5.499 |
periodic | +5.488 |
Neg logit contributions | |
blance | -5.994 |
genders | -5.877 |
rils | -5.673 |
aults | -5.628 |
rights | -5.542 |
Token | abduct |
Token ID | 24827 |
Feature activation | -3.20e+00 |
Pos logit contributions | |
BY | +3.435 |
Decay | +3.289 |
unfavorable | +3.179 |
than | +3.150 |
orally | +3.130 |
Neg logit contributions | |
blance | -3.930 |
genders | -3.896 |
rils | -3.763 |
aults | -3.721 |
rights | -3.676 |
Token | ] |
Token ID | 2361 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
BY | +1.380 |
Decay | +1.347 |
than | +1.257 |
unfavorable | +1.252 |
Geological | +1.218 |
Neg logit contributions | |
genders | -1.834 |
blance | -1.777 |
aults | -1.733 |
rils | -1.719 |
empowerment | -1.711 |
Token | due |
Token ID | 2233 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
Decay | +9.875 |
BY | +9.569 |
than | +9.414 |
unfavorable | +8.970 |
periodic | +8.961 |
Neg logit contributions | |
blance | -11.868 |
genders | -11.671 |
rils | -11.415 |
aults | -11.396 |
wheelchair | -11.119 |
Token | to |
Token ID | 284 |
Feature activation | +1.57e+01 |
Pos logit contributions | |
BY | +1.018 |
Decay | +0.996 |
unfavorable | +0.941 |
than | +0.941 |
Geological | +0.919 |
Neg logit contributions | |
genders | -0.946 |
blance | -0.908 |
aults | -0.883 |
rils | -0.870 |
empowerment | -0.869 |
Token | fertil |
Token ID | 19078 |
Feature activation | +5.13e+00 |
Pos logit contributions | |
Decay | +10.483 |
unfavorable | +10.440 |
periodic | +10.340 |
BY | +10.085 |
than | +9.681 |
Neg logit contributions | |
blance | -10.699 |
genders | -10.350 |
rils | -10.277 |
aults | -10.187 |
rights | -10.068 |
Token | ization |
Token ID | 1634 |
Feature activation | +9.41e+00 |
Pos logit contributions | |
BY | +3.711 |
Decay | +3.683 |
than | +3.455 |
unfavorable | +3.436 |
Geological | +3.377 |
Neg logit contributions | |
genders | -3.846 |
blance | -3.719 |
rils | -3.575 |
mattered | -3.566 |
wheelchair | -3.529 |
Token | of |
Token ID | 286 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
Decay | +5.926 |
BY | +5.868 |
unfavorable | +5.614 |
periodic | +5.490 |
than | +5.452 |
Neg logit contributions | |
blance | -7.490 |
genders | -7.448 |
rils | -7.199 |
aults | -7.098 |
itans | -7.010 |
Token | the |
Token ID | 262 |
Feature activation | +9.81e+00 |
Pos logit contributions | |
unfavorable | +9.763 |
Decay | +9.721 |
BY | +9.622 |
periodic | +9.400 |
than | +9.222 |
Neg logit contributions | |
blance | -12.173 |
genders | -11.283 |
itans | -11.061 |
aults | -10.983 |
rils | -10.977 |
Token | air |
Token ID | 1633 |
Feature activation | +5.97e+00 |
Pos logit contributions | |
Decay | +6.287 |
BY | +6.203 |
unfavorable | +6.110 |
periodic | +6.027 |
than | +5.902 |
Neg logit contributions | |
blance | -7.888 |
genders | -7.491 |
aults | -7.317 |
rils | -7.270 |
rights | -7.205 |
Token | by |
Token ID | 416 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
BY | +3.991 |
Decay | +3.917 |
unfavorable | +3.718 |
than | +3.691 |
periodic | +3.613 |
Neg logit contributions | |
genders | -4.754 |
blance | -4.698 |
aults | -4.484 |
empowerment | -4.466 |
rils | -4.415 |
Token | CO |
Token ID | 7375 |
Feature activation | +2.56e+00 |
Pos logit contributions | |
Decay | +11.243 |
periodic | +11.122 |
unfavorable | +11.095 |
BY | +10.943 |
than | +10.674 |
Neg logit contributions | |
blance | -12.659 |
aults | -11.588 |
genders | -11.562 |
itans | -11.448 |
rights | -11.384 |
Token | 2 |
Token ID | 362 |
Feature activation | +4.87e+00 |
Pos logit contributions | |
BY | +1.975 |
Decay | +1.930 |
than | +1.824 |
unfavorable | +1.819 |
Geological | +1.775 |
Neg logit contributions | |
genders | -1.846 |
blance | -1.786 |
aults | -1.729 |
rils | -1.707 |
empowerment | -1.703 |
Token | fall |
Token ID | 2121 |
Feature activation | -5.57e+00 |
Pos logit contributions | |
genders | +0.509 |
blance | +0.487 |
aults | +0.476 |
rils | +0.473 |
empowerment | +0.471 |
Neg logit contributions | |
BY | -0.464 |
Decay | -0.452 |
than | -0.424 |
unfavorable | -0.423 |
Geological | -0.413 |
Token | shortly |
Token ID | 8972 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
genders | +4.038 |
blance | +3.784 |
aults | +3.764 |
mattered | +3.751 |
rils | +3.731 |
Neg logit contributions | |
BY | -4.162 |
Decay | -4.097 |
than | -3.839 |
unfavorable | -3.750 |
Geological | -3.683 |
Token | after |
Token ID | 706 |
Feature activation | +4.09e+00 |
Pos logit contributions | |
BY | +2.153 |
Decay | +2.063 |
than | +1.929 |
unfavorable | +1.926 |
orally | +1.863 |
Neg logit contributions | |
genders | -3.367 |
blance | -3.281 |
aults | -3.183 |
rils | -3.170 |
empowerment | -3.161 |
Token | he |
Token ID | 339 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
BY | +2.932 |
Decay | +2.833 |
than | +2.685 |
unfavorable | +2.668 |
orally | +2.608 |
Neg logit contributions | |
genders | -3.161 |
blance | -3.083 |
aults | -2.980 |
rights | -2.934 |
rils | -2.932 |
Token | left |
Token ID | 1364 |
Feature activation | -3.89e+00 |
Pos logit contributions | |
genders | +1.071 |
blance | +1.016 |
aults | +0.991 |
rils | +0.977 |
mattered | +0.976 |
Neg logit contributions | |
BY | -1.341 |
Decay | -1.316 |
than | -1.245 |
unfavorable | -1.243 |
Geological | -1.218 |
Token | the |
Token ID | 262 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
genders | +2.667 |
blance | +2.503 |
empowerment | +2.470 |
aults | +2.466 |
rils | +2.461 |
Neg logit contributions | |
BY | -3.079 |
Decay | -3.001 |
than | -2.833 |
unfavorable | -2.825 |
periodic | -2.772 |
Token | palace |
Token ID | 20562 |
Feature activation | -8.56e+00 |
Pos logit contributions | |
BY | +1.928 |
Decay | +1.886 |
unfavorable | +1.793 |
than | +1.791 |
Geological | +1.756 |
Neg logit contributions | |
genders | -1.514 |
blance | -1.458 |
aults | -1.399 |
rils | -1.385 |
rights | -1.382 |
Token |
|
Token ID | 198 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
genders | +5.428 |
aults | +5.145 |
blance | +5.070 |
rils | +5.050 |
wheelchair | +5.018 |
Neg logit contributions | |
BY | -6.835 |
Decay | -6.743 |
than | -6.341 |
unfavorable | -6.294 |
periodic | -6.204 |
Token |
|
Token ID | 198 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
BY | +0.134 |
Decay | +0.130 |
than | +0.124 |
unfavorable | +0.123 |
Geological | +0.120 |
Neg logit contributions | |
genders | -0.122 |
blance | -0.117 |
aults | -0.113 |
empowerment | -0.112 |
rils | -0.112 |
Token | he |
Token ID | 258 |
Feature activation | +3.31e+00 |
Pos logit contributions | |
BY | +1.069 |
Decay | +1.036 |
than | +0.977 |
unfavorable | +0.967 |
Geological | +0.940 |
Neg logit contributions | |
genders | -1.338 |
blance | -1.289 |
aults | -1.257 |
empowerment | -1.245 |
rils | -1.244 |
Token | was |
Token ID | 373 |
Feature activation | -2.62e+00 |
Pos logit contributions | |
BY | +2.542 |
Decay | +2.469 |
than | +2.367 |
unfavorable | +2.356 |
orally | +2.310 |
Neg logit contributions | |
genders | -2.356 |
blance | -2.302 |
empowerment | -2.209 |
aults | -2.197 |
rils | -2.194 |
Token | . |
Token ID | 13 |
Feature activation | -5.89e+00 |
Pos logit contributions | |
genders | +3.871 |
aults | +3.655 |
blance | +3.574 |
rights | +3.551 |
rils | +3.486 |
Neg logit contributions | |
BY | -4.855 |
Decay | -4.853 |
unfavorable | -4.654 |
periodic | -4.628 |
orally | -4.557 |
Token | We |
Token ID | 775 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
genders | +4.824 |
aults | +4.565 |
blance | +4.548 |
mattered | +4.493 |
rights | +4.464 |
Neg logit contributions | |
BY | -3.742 |
Decay | -3.641 |
unfavorable | -3.507 |
periodic | -3.462 |
than | -3.443 |
Token | � |
Token ID | 447 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
genders | +2.853 |
blance | +2.712 |
aults | +2.669 |
mattered | +2.657 |
rights | +2.655 |
Neg logit contributions | |
BY | -2.553 |
Decay | -2.531 |
unfavorable | -2.362 |
than | -2.335 |
Geological | -2.277 |
Token | � |
Token ID | 247 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
genders | +7.988 |
aults | +7.685 |
blance | +7.614 |
OULD | +7.489 |
rights | +7.439 |
Neg logit contributions | |
BY | -12.928 |
Decay | -12.452 |
unfavorable | -11.960 |
orally | -11.934 |
periodic | -11.921 |
Token | ll |
Token ID | 297 |
Feature activation | +3.75e+00 |
Pos logit contributions | |
genders | +5.887 |
aults | +5.385 |
mattered | +5.194 |
rights | +5.179 |
blance | +5.022 |
Neg logit contributions | |
BY | -11.794 |
Decay | -11.728 |
periodic | -11.121 |
unfavorable | -11.046 |
than | -10.852 |
Token | announce |
Token ID | 5453 |
Feature activation | +7.59e+00 |
Pos logit contributions | |
BY | +0.884 |
Decay | +0.819 |
than | +0.684 |
unfavorable | +0.671 |
orally | +0.614 |
Neg logit contributions | |
genders | -4.654 |
blance | -4.598 |
aults | -4.490 |
rils | -4.466 |
rights | -4.452 |
Token | the |
Token ID | 262 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
BY | +4.069 |
Decay | +3.912 |
than | +3.662 |
unfavorable | +3.587 |
Geological | +3.514 |
Neg logit contributions | |
blance | -7.099 |
genders | -7.018 |
rils | -6.761 |
mattered | -6.705 |
aults | -6.696 |
Token | hilarious |
Token ID | 20105 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
genders | +0.011 |
blance | +0.011 |
aults | +0.010 |
empowerment | +0.010 |
rils | +0.010 |
Neg logit contributions | |
BY | -0.008 |
Decay | -0.007 |
than | -0.007 |
unfavorable | -0.007 |
Geological | -0.007 |
Token | results |
Token ID | 2482 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
genders | +0.135 |
blance | +0.129 |
aults | +0.126 |
empowerment | +0.125 |
rils | +0.125 |
Neg logit contributions | |
BY | -0.111 |
Decay | -0.109 |
than | -0.102 |
unfavorable | -0.101 |
Geological | -0.099 |
Token | in |
Token ID | 287 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
genders | +1.273 |
blance | +1.213 |
aults | +1.185 |
rils | +1.170 |
empowerment | +1.168 |
Neg logit contributions | |
BY | -1.409 |
Decay | -1.381 |
unfavorable | -1.300 |
than | -1.300 |
Geological | -1.271 |
Token | next |
Token ID | 1306 |
Feature activation | +5.98e+00 |
Pos logit contributions | |
genders | +0.157 |
blance | +0.149 |
aults | +0.144 |
empowerment | +0.142 |
rils | +0.142 |
Neg logit contributions | |
BY | -0.237 |
Decay | -0.232 |
unfavorable | -0.221 |
than | -0.221 |
Geological | -0.216 |
Token | from |
Token ID | 422 |
Feature activation | +2.47e+00 |
Pos logit contributions | |
genders | +9.845 |
empowerment | +9.632 |
rights | +9.131 |
blance | +9.090 |
equality | +9.069 |
Neg logit contributions | |
BY | -10.776 |
Decay | -10.427 |
than | -9.950 |
unfavorable | -9.811 |
risome | -9.606 |
Token | Yale |
Token ID | 19681 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
BY | +1.715 |
Decay | +1.666 |
than | +1.562 |
unfavorable | +1.552 |
Geological | +1.528 |
Neg logit contributions | |
genders | -1.983 |
blance | -1.922 |
aults | -1.865 |
rils | -1.858 |
empowerment | -1.838 |
Token | . |
Token ID | 13 |
Feature activation | -6.09e+00 |
Pos logit contributions | |
genders | +1.857 |
blance | +1.780 |
aults | +1.739 |
empowerment | +1.739 |
rights | +1.721 |
Neg logit contributions | |
BY | -1.547 |
Decay | -1.510 |
unfavorable | -1.430 |
than | -1.413 |
periodic | -1.375 |
Token | � |
Token ID | 564 |
Feature activation | +9.46e+00 |
Pos logit contributions | |
genders | +4.362 |
blance | +4.207 |
aults | +4.112 |
CLS | +4.080 |
mattered | +4.063 |
Neg logit contributions | |
BY | -4.366 |
Decay | -4.223 |
unfavorable | -4.190 |
periodic | -4.068 |
than | -4.024 |
Token | � |
Token ID | 250 |
Feature activation | +2.28e+00 |
Pos logit contributions | |
BY | +4.952 |
Decay | +4.876 |
than | +4.460 |
unfavorable | +4.428 |
periodic | +4.247 |
Neg logit contributions | |
genders | -8.689 |
blance | -8.211 |
aults | -8.155 |
empowerment | -8.113 |
wheelchair | -8.063 |
Token | There |
Token ID | 1858 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
BY | +1.486 |
Decay | +1.416 |
than | +1.349 |
unfavorable | +1.310 |
Geological | +1.289 |
Neg logit contributions | |
genders | -1.959 |
blance | -1.884 |
aults | -1.835 |
rils | -1.822 |
empowerment | -1.818 |
Token | is |
Token ID | 318 |
Feature activation | -5.86e+00 |
Pos logit contributions | |
BY | +2.501 |
Decay | +2.402 |
than | +2.280 |
unfavorable | +2.241 |
Geological | +2.174 |
Neg logit contributions | |
genders | -3.708 |
blance | -3.587 |
aults | -3.512 |
rils | -3.473 |
empowerment | -3.461 |
Token | that |
Token ID | 326 |
Feature activation | -7.18e+00 |
Pos logit contributions | |
genders | +4.309 |
empowerment | +4.215 |
blance | +4.200 |
equality | +4.066 |
mattered | +4.038 |
Neg logit contributions | |
BY | -4.193 |
Decay | -4.127 |
than | -3.845 |
unfavorable | -3.837 |
orally | -3.794 |
Token | same |
Token ID | 976 |
Feature activation | -9.13e+00 |
Pos logit contributions | |
genders | +5.269 |
empowerment | +5.164 |
blance | +5.140 |
mattered | +5.003 |
equality | +4.967 |
Neg logit contributions | |
BY | -5.055 |
Decay | -5.004 |
than | -4.731 |
unfavorable | -4.563 |
orally | -4.511 |
Token | aspect |
Token ID | 4843 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
genders | +6.240 |
empowerment | +6.217 |
blance | +6.084 |
equality | +5.933 |
mattered | +5.881 |
Neg logit contributions | |
Decay | -6.710 |
BY | -6.650 |
than | -6.173 |
orally | -5.983 |
unfavorable | -5.976 |
Token | of |
Token ID | 286 |
Feature activation | -5.89e+00 |
Pos logit contributions | |
genders | +1.417 |
blance | +1.370 |
aults | +1.319 |
empowerment | +1.319 |
rils | +1.306 |
Neg logit contributions | |
BY | -1.482 |
Decay | -1.446 |
than | -1.363 |
unfavorable | -1.352 |
Geological | -1.328 |
Token | he |
Token ID | 339 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
genders | +0.638 |
blance | +0.610 |
aults | +0.596 |
empowerment | +0.595 |
mattered | +0.592 |
Neg logit contributions | |
BY | -0.539 |
Decay | -0.526 |
than | -0.495 |
unfavorable | -0.490 |
Geological | -0.481 |
Token | was |
Token ID | 373 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
genders | +0.118 |
blance | +0.112 |
aults | +0.109 |
empowerment | +0.108 |
rils | +0.108 |
Neg logit contributions | |
BY | -0.135 |
Decay | -0.132 |
than | -0.125 |
unfavorable | -0.125 |
Geological | -0.122 |
Token | the |
Token ID | 262 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
genders | +0.986 |
blance | +0.943 |
aults | +0.923 |
empowerment | +0.920 |
mattered | +0.917 |
Neg logit contributions | |
BY | -0.776 |
Decay | -0.760 |
than | -0.708 |
unfavorable | -0.702 |
Geological | -0.688 |
Token | only |
Token ID | 691 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
BY | +0.859 |
Decay | +0.839 |
unfavorable | +0.791 |
than | +0.788 |
Geological | +0.770 |
Neg logit contributions | |
genders | -0.899 |
blance | -0.874 |
aults | -0.846 |
rils | -0.840 |
rights | -0.828 |
Token | realistic |
Token ID | 12653 |
Feature activation | -3.80e-01 |
Pos logit contributions | |
BY | +1.397 |
Decay | +1.353 |
unfavorable | +1.270 |
than | +1.264 |
periodic | +1.226 |
Neg logit contributions | |
genders | -1.867 |
blance | -1.824 |
aults | -1.773 |
rils | -1.763 |
rights | -1.740 |
Token | option |
Token ID | 3038 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
genders | +0.288 |
blance | +0.274 |
aults | +0.267 |
empowerment | +0.266 |
rils | +0.264 |
Neg logit contributions | |
BY | -0.281 |
Decay | -0.275 |
than | -0.259 |
unfavorable | -0.258 |
Geological | -0.252 |
Token | as |
Token ID | 355 |
Feature activation | -9.47e-01 |
Pos logit contributions | |
BY | +1.797 |
Decay | +1.744 |
unfavorable | +1.666 |
than | +1.657 |
orally | +1.614 |
Neg logit contributions | |
genders | -1.750 |
blance | -1.692 |
aults | -1.644 |
rils | -1.632 |
empowerment | -1.613 |
Token | Kenya |
Token ID | 21506 |
Feature activation | +8.94e+00 |
Pos logit contributions | |
genders | +0.775 |
blance | +0.740 |
aults | +0.725 |
empowerment | +0.723 |
rils | +0.720 |
Neg logit contributions | |
BY | -0.643 |
Decay | -0.627 |
than | -0.588 |
unfavorable | -0.583 |
Geological | -0.571 |
Token | 's |
Token ID | 338 |
Feature activation | +8.51e+00 |
Pos logit contributions | |
BY | +6.279 |
Decay | +6.233 |
unfavorable | +5.917 |
than | +5.861 |
orally | +5.796 |
Neg logit contributions | |
blance | -6.535 |
genders | -6.430 |
aults | -6.254 |
rils | -6.205 |
rights | -6.049 |
Token | future |
Token ID | 2003 |
Feature activation | -6.26e+00 |
Pos logit contributions | |
BY | +5.705 |
Decay | +5.668 |
unfavorable | +5.413 |
periodic | +5.313 |
Geological | +5.228 |
Neg logit contributions | |
blance | -6.656 |
genders | -6.396 |
aults | -6.237 |
rils | -6.215 |
itans | -6.205 |
Token | leader |
Token ID | 3554 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
genders | +4.848 |
mattered | +4.649 |
empowerment | +4.548 |
equality | +4.460 |
blance | +4.431 |
Neg logit contributions | |
Decay | -4.376 |
BY | -4.369 |
than | -4.114 |
unfavorable | -3.957 |
Geological | -3.846 |
Token | at |
Token ID | 379 |
Feature activation | -4.46e-01 |
Pos logit contributions | |
genders | +3.023 |
blance | +2.894 |
aults | +2.853 |
mattered | +2.850 |
rils | +2.799 |
Neg logit contributions | |
BY | -3.029 |
Decay | -3.014 |
unfavorable | -2.797 |
than | -2.755 |
Geological | -2.733 |
Token | IM |
Token ID | 8959 |
Feature activation | +2.36e+00 |
Pos logit contributions | |
genders | +0.357 |
blance | +0.343 |
aults | +0.335 |
empowerment | +0.332 |
rils | +0.330 |
Neg logit contributions | |
BY | -0.309 |
Decay | -0.302 |
unfavorable | -0.283 |
than | -0.283 |
Geological | -0.275 |
Token | G |
Token ID | 38 |
Feature activation | -7.66e+00 |
Pos logit contributions | |
BY | +1.481 |
Decay | +1.422 |
than | +1.324 |
unfavorable | +1.316 |
Geological | +1.287 |
Neg logit contributions | |
genders | -2.056 |
blance | -1.993 |
aults | -1.954 |
rils | -1.934 |
empowerment | -1.928 |
Token | handled |
Token ID | 12118 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
genders | +6.198 |
mattered | +5.932 |
blance | +5.863 |
rights | +5.844 |
empowerment | +5.808 |
Neg logit contributions | |
Decay | -4.823 |
BY | -4.749 |
unfavorable | -4.481 |
than | -4.472 |
periodic | -4.358 |
Token | the |
Token ID | 262 |
Feature activation | +3.79e+00 |
Pos logit contributions | |
BY | +1.356 |
Decay | +1.318 |
unfavorable | +1.241 |
than | +1.238 |
periodic | +1.200 |
Neg logit contributions | |
genders | -1.675 |
blance | -1.614 |
aults | -1.575 |
rils | -1.563 |
empowerment | -1.554 |
Token | deal |
Token ID | 1730 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
BY | +2.740 |
Decay | +2.648 |
unfavorable | +2.548 |
than | +2.507 |
periodic | +2.457 |
Neg logit contributions | |
genders | -2.896 |
blance | -2.825 |
rils | -2.739 |
aults | -2.734 |
empowerment | -2.665 |
Token | . |
Token ID | 13 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
BY | +0.771 |
Decay | +0.753 |
than | +0.709 |
unfavorable | +0.708 |
Geological | +0.690 |
Neg logit contributions | |
genders | -0.806 |
blance | -0.775 |
aults | -0.754 |
rils | -0.747 |
empowerment | -0.746 |
Token | After |
Token ID | 3260 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
BY | +1.702 |
Decay | +1.641 |
than | +1.535 |
unfavorable | +1.504 |
Geological | +1.483 |
Neg logit contributions | |
genders | -2.368 |
blance | -2.283 |
empowerment | -2.222 |
aults | -2.220 |
rils | -2.213 |
Token | a |
Token ID | 257 |
Feature activation | +5.02e+00 |
Pos logit contributions | |
BY | +0.876 |
Decay | +0.853 |
than | +0.800 |
unfavorable | +0.799 |
Geological | +0.774 |
Neg logit contributions | |
genders | -1.071 |
blance | -1.034 |
aults | -1.007 |
rils | -0.999 |
empowerment | -0.995 |
Token | fruitful |
Token ID | 44474 |
Feature activation | +9.04e+00 |
Pos logit contributions | |
BY | +3.250 |
Decay | +3.098 |
unfavorable | +2.955 |
than | +2.940 |
periodic | +2.869 |
Neg logit contributions | |
genders | -4.261 |
blance | -4.108 |
rils | -4.049 |
aults | -4.016 |
empowerment | -3.944 |
Token | 2010 |
Token ID | 3050 |
Feature activation | +6.46e+00 |
Pos logit contributions | |
BY | +6.441 |
Decay | +6.099 |
unfavorable | +5.898 |
than | +5.868 |
periodic | +5.854 |
Neg logit contributions | |
genders | -6.625 |
blance | -6.547 |
rils | -6.447 |
aults | -6.370 |
itans | -6.216 |
Token | failed |
Token ID | 4054 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
BY | +5.758 |
Decay | +5.596 |
unfavorable | +5.541 |
periodic | +5.444 |
than | +5.289 |
Neg logit contributions | |
genders | -6.066 |
blance | -6.040 |
rils | -5.868 |
aults | -5.802 |
itans | -5.745 |
Token | promises |
Token ID | 10497 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
BY | +1.198 |
Decay | +1.166 |
unfavorable | +1.094 |
than | +1.093 |
periodic | +1.067 |
Neg logit contributions | |
genders | -1.420 |
blance | -1.374 |
aults | -1.339 |
rils | -1.329 |
mattered | -1.315 |
Token | of |
Token ID | 286 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
BY | +2.574 |
Decay | +2.490 |
unfavorable | +2.382 |
than | +2.367 |
orally | +2.317 |
Neg logit contributions | |
genders | -2.719 |
blance | -2.614 |
aults | -2.561 |
rils | -2.535 |
empowerment | -2.510 |
Token | a |
Token ID | 257 |
Feature activation | -6.17e+00 |
Pos logit contributions | |
genders | +0.853 |
blance | +0.813 |
empowerment | +0.797 |
aults | +0.792 |
rights | +0.786 |
Neg logit contributions | |
BY | -0.781 |
Decay | -0.765 |
than | -0.719 |
unfavorable | -0.711 |
Geological | -0.698 |
Token | dialogue |
Token ID | 10721 |
Feature activation | -2.66e-01 |
Pos logit contributions | |
genders | +4.737 |
empowerment | +4.449 |
equality | +4.420 |
blance | +4.418 |
wheelchair | +4.380 |
Neg logit contributions | |
Decay | -4.371 |
BY | -4.300 |
than | -3.998 |
unfavorable | -3.921 |
Geological | -3.852 |
Token | . |
Token ID | 13 |
Feature activation | -2.63e+00 |
Pos logit contributions | |
genders | +0.211 |
blance | +0.202 |
aults | +0.197 |
empowerment | +0.196 |
rils | +0.195 |
Neg logit contributions | |
BY | -0.188 |
Decay | -0.184 |
than | -0.172 |
unfavorable | -0.171 |
Geological | -0.167 |
Token | They |
Token ID | 1119 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
genders | +1.755 |
blance | +1.685 |
aults | +1.634 |
rights | +1.623 |
rils | +1.601 |
Neg logit contributions | |
BY | -2.128 |
Decay | -2.086 |
unfavorable | -2.002 |
than | -1.988 |
periodic | -1.941 |
Token | believe |
Token ID | 1975 |
Feature activation | +3.42e+00 |
Pos logit contributions | |
genders | +2.391 |
blance | +2.279 |
aults | +2.233 |
mattered | +2.224 |
empowerment | +2.203 |
Neg logit contributions | |
BY | -2.063 |
Decay | -2.027 |
than | -1.880 |
unfavorable | -1.875 |
Geological | -1.830 |
Token | the |
Token ID | 262 |
Feature activation | +5.36e+00 |
Pos logit contributions | |
BY | +2.297 |
Decay | +2.223 |
unfavorable | +2.108 |
than | +2.088 |
periodic | +2.056 |
Neg logit contributions | |
genders | -2.798 |
blance | -2.712 |
aults | -2.627 |
rils | -2.617 |
empowerment | -2.583 |
Token | least |
Token ID | 1551 |
Feature activation | +4.79e+00 |
Pos logit contributions | |
BY | +3.672 |
Decay | +3.552 |
unfavorable | +3.425 |
periodic | +3.343 |
than | +3.340 |
Neg logit contributions | |
genders | -4.215 |
blance | -4.162 |
aults | -4.009 |
rils | -3.978 |
itans | -3.919 |
Token | the |
Token ID | 262 |
Feature activation | +7.31e+00 |
Pos logit contributions | |
BY | +3.294 |
Decay | +3.154 |
unfavorable | +3.088 |
than | +3.046 |
periodic | +2.959 |
Neg logit contributions | |
genders | -3.785 |
blance | -3.660 |
aults | -3.600 |
rils | -3.584 |
itans | -3.505 |
Token | them |
Token ID | 606 |
Feature activation | -8.09e-01 |
Pos logit contributions | |
BY | +2.355 |
Decay | +2.321 |
unfavorable | +2.198 |
than | +2.169 |
periodic | +2.120 |
Neg logit contributions | |
genders | -2.883 |
blance | -2.816 |
aults | -2.699 |
rils | -2.693 |
rights | -2.678 |
Token | a |
Token ID | 257 |
Feature activation | -7.03e+00 |
Pos logit contributions | |
genders | +0.678 |
blance | +0.649 |
aults | +0.636 |
empowerment | +0.634 |
mattered | +0.629 |
Neg logit contributions | |
BY | -0.531 |
Decay | -0.519 |
than | -0.485 |
unfavorable | -0.477 |
Geological | -0.470 |
Token | questionable |
Token ID | 18269 |
Feature activation | -3.45e+00 |
Pos logit contributions | |
genders | +5.138 |
empowerment | +4.916 |
wheelchair | +4.902 |
mattered | +4.891 |
aults | +4.814 |
Neg logit contributions | |
BY | -4.961 |
Decay | -4.863 |
than | -4.550 |
Geological | -4.522 |
orally | -4.476 |
Token | choice |
Token ID | 3572 |
Feature activation | -4.02e+00 |
Pos logit contributions | |
genders | +2.342 |
empowerment | +2.184 |
blance | +2.167 |
aults | +2.160 |
mattered | +2.146 |
Neg logit contributions | |
BY | -2.771 |
Decay | -2.709 |
than | -2.597 |
unfavorable | -2.529 |
orally | -2.496 |
Token | against |
Token ID | 1028 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
genders | +2.774 |
blance | +2.612 |
aults | +2.571 |
mattered | +2.557 |
empowerment | +2.551 |
Neg logit contributions | |
BY | -3.204 |
Decay | -3.145 |
than | -2.940 |
Geological | -2.897 |
unfavorable | -2.878 |
Token | rocket |
Token ID | 10701 |
Feature activation | -8.17e+00 |
Pos logit contributions | |
BY | +1.340 |
Decay | +1.312 |
unfavorable | +1.236 |
than | +1.232 |
periodic | +1.196 |
Neg logit contributions | |
genders | -1.574 |
blance | -1.529 |
aults | -1.478 |
rils | -1.466 |
rights | -1.461 |
Token | launchers |
Token ID | 41065 |
Feature activation | -9.73e+00 |
Pos logit contributions | |
genders | +5.670 |
aults | +5.271 |
empowerment | +5.257 |
mattered | +5.175 |
blance | +5.143 |
Neg logit contributions | |
BY | -6.245 |
Decay | -6.075 |
than | -5.810 |
unfavorable | -5.684 |
orally | -5.664 |
Token | and |
Token ID | 290 |
Feature activation | -4.00e+00 |
Pos logit contributions | |
genders | +6.235 |
aults | +5.950 |
mattered | +5.864 |
blance | +5.766 |
empowerment | +5.745 |
Neg logit contributions | |
BY | -7.664 |
Decay | -7.507 |
than | -6.977 |
Geological | -6.857 |
unfavorable | -6.773 |
Token | grenades |
Token ID | 28850 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
genders | +3.156 |
blance | +2.955 |
empowerment | +2.953 |
aults | +2.950 |
mattered | +2.928 |
Neg logit contributions | |
BY | -2.769 |
Decay | -2.662 |
than | -2.529 |
unfavorable | -2.467 |
orally | -2.455 |
Token | . |
Token ID | 13 |
Feature activation | -4.19e+00 |
Pos logit contributions | |
genders | +6.981 |
aults | +6.703 |
mattered | +6.600 |
empowerment | +6.424 |
blance | +6.374 |
Neg logit contributions | |
BY | -9.148 |
Decay | -8.856 |
than | -8.308 |
Geological | -8.187 |
terness | -8.065 |
Token |
|
Token ID | 198 |
Feature activation | -3.49e+00 |
Pos logit contributions | |
genders | +2.949 |
blance | +2.797 |
aults | +2.795 |
mattered | +2.731 |
rils | +2.720 |
Neg logit contributions | |
BY | -3.161 |
Decay | -3.031 |
unfavorable | -2.951 |
than | -2.914 |
periodic | -2.903 |
Token | revolution |
Token ID | 5854 |
Feature activation | -1.45e+01 |
Pos logit contributions | |
empowerment | +9.918 |
genders | +9.892 |
equality | +9.744 |
mattered | +9.207 |
wheelchair | +9.097 |
Neg logit contributions | |
BY | -9.529 |
Decay | -9.174 |
than | -8.897 |
unfavorable | -8.564 |
Geological | -8.562 |
Token | - |
Token ID | 532 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
mattered | +9.680 |
genders | +9.528 |
empowerment | +9.050 |
equality | +8.854 |
wheelchair | +8.632 |
Neg logit contributions | |
Decay | -10.338 |
BY | -10.302 |
than | -9.317 |
unfavorable | -9.314 |
risome | -9.237 |
Token | with |
Token ID | 351 |
Feature activation | -9.37e+00 |
Pos logit contributions | |
genders | +10.325 |
equality | +10.038 |
empowerment | +10.034 |
wheelchair | +9.815 |
blance | +9.795 |
Neg logit contributions | |
BY | -8.854 |
Decay | -8.785 |
than | -8.030 |
Geological | -7.984 |
unfavorable | -7.950 |
Token | the |
Token ID | 262 |
Feature activation | -8.09e+00 |
Pos logit contributions | |
genders | +7.109 |
empowerment | +6.711 |
equality | +6.683 |
wheelchair | +6.498 |
mattered | +6.412 |
Neg logit contributions | |
BY | -6.564 |
Decay | -6.353 |
than | -5.971 |
Geological | -5.843 |
unfavorable | -5.763 |
Token | impact |
Token ID | 2928 |
Feature activation | -5.22e+00 |
Pos logit contributions | |
genders | +6.362 |
empowerment | +6.108 |
equality | +5.899 |
wheelchair | +5.816 |
blance | +5.771 |
Neg logit contributions | |
BY | -5.535 |
Decay | -5.325 |
than | -5.075 |
unfavorable | -4.862 |
orally | -4.857 |
Token | of |
Token ID | 286 |
Feature activation | -8.15e+00 |
Pos logit contributions | |
genders | +3.911 |
blance | +3.695 |
mattered | +3.662 |
empowerment | +3.656 |
wheelchair | +3.586 |
Neg logit contributions | |
BY | -3.855 |
Decay | -3.783 |
than | -3.516 |
unfavorable | -3.422 |
Geological | -3.402 |
Token | automation |
Token ID | 22771 |
Feature activation | -7.22e+00 |
Pos logit contributions | |
genders | +5.870 |
empowerment | +5.576 |
equality | +5.498 |
wheelchair | +5.378 |
blance | +5.361 |
Neg logit contributions | |
BY | -6.075 |
Decay | -5.908 |
than | -5.591 |
unfavorable | -5.411 |
Geological | -5.394 |
Token | and |
Token ID | 290 |
Feature activation | -6.39e+00 |
Pos logit contributions | |
genders | +5.313 |
empowerment | +4.977 |
mattered | +4.938 |
blance | +4.868 |
equality | +4.852 |
Neg logit contributions | |
BY | -5.328 |
Decay | -5.208 |
than | -4.810 |
unfavorable | -4.739 |
Geological | -4.695 |
Token | ' |
Token ID | 705 |
Feature activation | -2.21e+00 |
Pos logit contributions | |
genders | +4.718 |
empowerment | +4.502 |
equality | +4.413 |
mattered | +4.352 |
wheelchair | +4.352 |
Neg logit contributions | |
BY | -4.772 |
Decay | -4.646 |
than | -4.352 |
unfavorable | -4.223 |
Geological | -4.212 |
Token | cy |
Token ID | 948 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
genders | +1.654 |
blance | +1.598 |
rights | +1.561 |
aults | +1.559 |
empowerment | +1.546 |
Neg logit contributions | |
BY | -1.625 |
Decay | -1.609 |
unfavorable | -1.512 |
than | -1.486 |
Geological | -1.485 |
Token | ber |
Token ID | 527 |
Feature activation | -8.09e+00 |
Pos logit contributions | |
genders | +1.574 |
blance | +1.521 |
aults | +1.467 |
rils | +1.467 |
empowerment | +1.463 |
Neg logit contributions | |
BY | -1.452 |
Decay | -1.434 |
unfavorable | -1.345 |
than | -1.332 |
Geological | -1.312 |
Token | low |
Token ID | 1877 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
BY | +2.985 |
Decay | +2.903 |
unfavorable | +2.802 |
than | +2.728 |
periodic | +2.670 |
Neg logit contributions | |
genders | -3.553 |
blance | -3.512 |
rils | -3.372 |
aults | -3.362 |
rights | -3.324 |
Token | risk |
Token ID | 2526 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
BY | +0.271 |
Decay | +0.265 |
than | +0.250 |
unfavorable | +0.248 |
Geological | +0.243 |
Neg logit contributions | |
genders | -0.273 |
blance | -0.261 |
aults | -0.254 |
empowerment | -0.252 |
rils | -0.251 |
Token | for |
Token ID | 329 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
BY | +1.579 |
Decay | +1.541 |
unfavorable | +1.453 |
than | +1.447 |
Geological | +1.405 |
Neg logit contributions | |
genders | -1.761 |
blance | -1.711 |
aults | -1.653 |
rils | -1.645 |
rights | -1.630 |
Token | the |
Token ID | 262 |
Feature activation | -8.96e-01 |
Pos logit contributions | |
genders | +3.452 |
blance | +3.227 |
empowerment | +3.202 |
aults | +3.200 |
wheelchair | +3.157 |
Neg logit contributions | |
BY | -3.105 |
Decay | -2.971 |
than | -2.844 |
unfavorable | -2.783 |
Geological | -2.746 |
Token | students |
Token ID | 2444 |
Feature activation | -6.30e+00 |
Pos logit contributions | |
genders | +0.720 |
blance | +0.685 |
aults | +0.672 |
empowerment | +0.668 |
rils | +0.663 |
Neg logit contributions | |
BY | -0.624 |
Decay | -0.606 |
than | -0.570 |
unfavorable | -0.566 |
Geological | -0.551 |
Token | , |
Token ID | 11 |
Feature activation | -8.19e+00 |
Pos logit contributions | |
genders | +4.566 |
mattered | +4.206 |
blance | +4.203 |
aults | +4.179 |
empowerment | +4.162 |
Neg logit contributions | |
BY | -4.724 |
Decay | -4.699 |
than | -4.310 |
unfavorable | -4.282 |
Geological | -4.236 |
Token | so |
Token ID | 523 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
genders | +6.090 |
wheelchair | +5.550 |
mattered | +5.550 |
empowerment | +5.539 |
blance | +5.520 |
Neg logit contributions | |
BY | -5.912 |
Decay | -5.784 |
than | -5.428 |
unfavorable | -5.256 |
Geological | -5.179 |
Token | they |
Token ID | 484 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
genders | +3.648 |
blance | +3.456 |
empowerment | +3.382 |
mattered | +3.379 |
aults | +3.370 |
Neg logit contributions | |
BY | -3.367 |
Decay | -3.296 |
than | -3.137 |
unfavorable | -3.057 |
Geological | -3.019 |
Token | approached |
Token ID | 10448 |
Feature activation | -4.73e-01 |
Pos logit contributions | |
genders | +0.096 |
blance | +0.092 |
aults | +0.089 |
rils | +0.088 |
empowerment | +0.088 |
Neg logit contributions | |
BY | -0.097 |
Decay | -0.095 |
than | -0.089 |
unfavorable | -0.089 |
Geological | -0.087 |
Token | assignments |
Token ID | 25815 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
genders | +0.384 |
blance | +0.368 |
aults | +0.360 |
empowerment | +0.357 |
rils | +0.356 |
Neg logit contributions | |
BY | -0.325 |
Decay | -0.316 |
than | -0.298 |
unfavorable | -0.296 |
Geological | -0.288 |
Token | more |
Token ID | 517 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
BY | +1.081 |
Decay | +1.054 |
unfavorable | +0.995 |
than | +0.989 |
orally | +0.966 |
Neg logit contributions | |
genders | -1.274 |
blance | -1.237 |
aults | -1.199 |
rils | -1.194 |
empowerment | -1.183 |
Token | ashi |
Token ID | 12144 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
BY | +1.834 |
Decay | +1.707 |
than | +1.694 |
unfavorable | +1.566 |
Geological | +1.522 |
Neg logit contributions | |
genders | -3.732 |
blance | -3.644 |
empowerment | -3.562 |
mattered | -3.504 |
aults | -3.493 |
Token | � |
Token ID | 447 |
Feature activation | +2.41e+00 |
Pos logit contributions | |
BY | +1.432 |
Decay | +1.395 |
than | +1.325 |
unfavorable | +1.324 |
Geological | +1.294 |
Neg logit contributions | |
genders | -1.269 |
blance | -1.223 |
aults | -1.182 |
rils | -1.172 |
empowerment | -1.167 |
Token | � |
Token ID | 247 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
BY | +1.682 |
Decay | +1.655 |
unfavorable | +1.549 |
than | +1.545 |
Geological | +1.501 |
Neg logit contributions | |
genders | -1.911 |
blance | -1.826 |
aults | -1.784 |
empowerment | -1.774 |
rils | -1.761 |
Token | s |
Token ID | 82 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
genders | +2.943 |
blance | +2.810 |
aults | +2.780 |
mattered | +2.744 |
rils | +2.731 |
Neg logit contributions | |
Decay | -2.886 |
BY | -2.875 |
unfavorable | -2.666 |
than | -2.627 |
Geological | -2.614 |
Token | personal |
Token ID | 2614 |
Feature activation | -6.96e+00 |
Pos logit contributions | |
BY | +2.100 |
Decay | +2.037 |
unfavorable | +1.930 |
than | +1.928 |
Geological | +1.876 |
Neg logit contributions | |
genders | -2.238 |
blance | -2.169 |
aults | -2.109 |
rils | -2.091 |
empowerment | -2.067 |
Token | manager |
Token ID | 4706 |
Feature activation | -6.28e+00 |
Pos logit contributions | |
genders | +5.134 |
wheelchair | +4.933 |
blance | +4.889 |
empowerment | +4.860 |
aults | +4.795 |
Neg logit contributions | |
Decay | -4.965 |
BY | -4.899 |
than | -4.584 |
unfavorable | -4.518 |
orally | -4.415 |
Token | — |
Token ID | 851 |
Feature activation | -6.97e+00 |
Pos logit contributions | |
genders | +4.594 |
blance | +4.368 |
mattered | +4.342 |
aults | +4.264 |
empowerment | +4.260 |
Neg logit contributions | |
Decay | -4.510 |
BY | -4.505 |
unfavorable | -4.168 |
than | -4.161 |
Geological | -4.065 |
Token | and |
Token ID | 290 |
Feature activation | +4.45e+00 |
Pos logit contributions | |
genders | +5.087 |
blance | +4.850 |
wheelchair | +4.740 |
empowerment | +4.728 |
aults | +4.720 |
Neg logit contributions | |
BY | -5.023 |
Decay | -4.960 |
unfavorable | -4.587 |
than | -4.560 |
Geological | -4.498 |
Token | girlfriend |
Token ID | 11077 |
Feature activation | -6.32e+00 |
Pos logit contributions | |
BY | +2.994 |
Decay | +2.884 |
unfavorable | +2.734 |
than | +2.724 |
periodic | +2.661 |
Neg logit contributions | |
genders | -3.634 |
blance | -3.524 |
aults | -3.459 |
rils | -3.426 |
rights | -3.366 |
Token | — |
Token ID | 851 |
Feature activation | -9.70e+00 |
Pos logit contributions | |
genders | +4.886 |
blance | +4.646 |
empowerment | +4.601 |
mattered | +4.556 |
aults | +4.511 |
Neg logit contributions | |
BY | -4.349 |
Decay | -4.227 |
unfavorable | -3.952 |
than | -3.946 |
Geological | -3.870 |
Token | sent |
Token ID | 1908 |
Feature activation | +5.79e+00 |
Pos logit contributions | |
genders | +7.178 |
mattered | +6.781 |
blance | +6.704 |
empowerment | +6.641 |
wheelchair | +6.552 |
Neg logit contributions | |
BY | -6.515 |
Decay | -6.457 |
unfavorable | -6.044 |
than | -5.893 |
Geological | -5.871 |
Token | we |
Token ID | 356 |
Feature activation | +9.44e+00 |
Pos logit contributions | |
BY | +1.500 |
Decay | +1.460 |
unfavorable | +1.375 |
than | +1.368 |
Geological | +1.335 |
Neg logit contributions | |
genders | -1.767 |
blance | -1.707 |
aults | -1.662 |
rils | -1.650 |
empowerment | -1.639 |
Token | don |
Token ID | 836 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
BY | +5.302 |
Decay | +4.931 |
unfavorable | +4.886 |
orally | +4.841 |
than | +4.617 |
Neg logit contributions | |
blance | -8.257 |
genders | -8.243 |
aults | -8.135 |
rils | -8.068 |
empowerment | -7.795 |
Token | � |
Token ID | 447 |
Feature activation | -9.68e+00 |
Pos logit contributions | |
genders | +4.196 |
aults | +4.020 |
blance | +4.001 |
rights | +3.969 |
itans | +3.948 |
Neg logit contributions | |
Decay | -3.280 |
BY | -3.240 |
periodic | -3.076 |
unfavorable | -3.064 |
orally | -2.962 |
Token | � |
Token ID | 247 |
Feature activation | -7.35e+00 |
Pos logit contributions | |
genders | +6.474 |
blance | +6.280 |
rils | +6.165 |
aults | +6.152 |
rights | +6.003 |
Neg logit contributions | |
BY | -7.475 |
Decay | -7.105 |
than | -6.848 |
unfavorable | -6.741 |
periodic | -6.734 |
Token | t |
Token ID | 83 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
genders | +6.579 |
aults | +6.321 |
blance | +6.291 |
rils | +6.290 |
rights | +6.162 |
Neg logit contributions | |
Decay | -4.161 |
BY | -4.125 |
unfavorable | -3.705 |
periodic | -3.670 |
orally | -3.623 |
Token | know |
Token ID | 760 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
genders | +6.944 |
mattered | +6.442 |
wheelchair | +6.396 |
itans | +6.241 |
blance | +6.241 |
Neg logit contributions | |
Decay | -8.588 |
BY | -8.278 |
than | -7.653 |
unfavorable | -7.619 |
Geological | -7.547 |
Token | why |
Token ID | 1521 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
genders | +11.195 |
who | +10.118 |
mattered | +10.039 |
equality | +10.010 |
wheelchair | +9.941 |
Neg logit contributions | |
Decay | -13.905 |
BY | -13.644 |
terness | -13.076 |
than | -13.062 |
risome | -12.832 |
Token | and |
Token ID | 290 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
BY | +1.474 |
Decay | +1.435 |
unfavorable | +1.352 |
than | +1.348 |
Geological | +1.315 |
Neg logit contributions | |
genders | -1.678 |
blance | -1.622 |
aults | -1.576 |
rils | -1.562 |
empowerment | -1.556 |
Token | therefore |
Token ID | 4361 |
Feature activation | +4.90e+00 |
Pos logit contributions | |
genders | +1.774 |
blance | +1.677 |
empowerment | +1.628 |
rights | +1.621 |
mattered | +1.620 |
Neg logit contributions | |
BY | -2.036 |
Decay | -1.992 |
than | -1.878 |
unfavorable | -1.854 |
Geological | -1.822 |
Token | should |
Token ID | 815 |
Feature activation | +6.04e+00 |
Pos logit contributions | |
BY | +3.212 |
Decay | +3.127 |
unfavorable | +3.008 |
than | +2.937 |
Geological | +2.892 |
Neg logit contributions | |
genders | -4.028 |
blance | -3.923 |
rils | -3.827 |
aults | -3.826 |
rights | -3.746 |
Token | be |
Token ID | 307 |
Feature activation | +4.39e+00 |
Pos logit contributions | |
BY | +3.137 |
Decay | +3.014 |
unfavorable | +2.887 |
than | +2.807 |
orally | +2.743 |
Neg logit contributions | |
genders | -5.767 |
blance | -5.590 |
aults | -5.456 |
rils | -5.440 |
empowerment | -5.406 |
Token | filtering |
Token ID | 25431 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
genders | +12.466 |
empowerment | +12.332 |
equality | +12.260 |
mattered | +11.568 |
aults | +11.568 |
Neg logit contributions | |
Decay | -11.604 |
BY | -11.127 |
than | -10.630 |
Geological | -10.476 |
terness | -10.215 |
Token | systems |
Token ID | 3341 |
Feature activation | -9.47e+00 |
Pos logit contributions | |
genders | +11.446 |
empowerment | +10.826 |
equality | +10.823 |
mattered | +10.801 |
rights | +10.494 |
Neg logit contributions | |
Decay | -10.187 |
BY | -9.803 |
than | -9.216 |
terness | -9.045 |
Geological | -8.814 |
Token | did |
Token ID | 750 |
Feature activation | -6.26e+00 |
Pos logit contributions | |
genders | +7.182 |
mattered | +6.855 |
empowerment | +6.689 |
blance | +6.640 |
aults | +6.625 |
Neg logit contributions | |
BY | -6.570 |
Decay | -6.442 |
than | -5.939 |
Geological | -5.739 |
unfavorable | -5.655 |
Token | little |
Token ID | 1310 |
Feature activation | +4.28e-01 |
Pos logit contributions | |
genders | +5.156 |
blance | +4.967 |
empowerment | +4.921 |
aults | +4.881 |
mattered | +4.868 |
Neg logit contributions | |
BY | -3.976 |
Decay | -3.916 |
than | -3.607 |
unfavorable | -3.558 |
Geological | -3.526 |
Token | to |
Token ID | 284 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
BY | +0.329 |
Decay | +0.322 |
than | +0.304 |
unfavorable | +0.303 |
Geological | +0.296 |
Neg logit contributions | |
genders | -0.311 |
blance | -0.298 |
aults | -0.290 |
rils | -0.287 |
empowerment | -0.286 |
Token | curb |
Token ID | 20799 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
genders | +8.551 |
equality | +8.249 |
empowerment | +8.247 |
mattered | +7.858 |
wheelchair | +7.726 |
Neg logit contributions | |
BY | -10.744 |
Decay | -10.600 |
than | -9.806 |
terness | -9.686 |
Reviewer | -9.680 |
Token | the |
Token ID | 262 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
genders | +13.023 |
equality | +12.457 |
empowerment | +12.404 |
wheelchair | +11.837 |
rights | +11.487 |
Neg logit contributions | |
Decay | -12.700 |
BY | -12.353 |
terness | -11.780 |
Geological | -11.608 |
than | -11.265 |
Token | trade |
Token ID | 3292 |
Feature activation | -8.34e+00 |
Pos logit contributions | |
genders | +8.309 |
empowerment | +8.007 |
equality | +7.692 |
wheelchair | +7.472 |
rights | +7.371 |
Neg logit contributions | |
BY | -7.626 |
Decay | -7.358 |
than | -6.751 |
Geological | -6.721 |
orally | -6.531 |
Token | of |
Token ID | 286 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
genders | +5.525 |
empowerment | +5.317 |
rights | +5.191 |
aults | +5.170 |
equality | +5.165 |
Neg logit contributions | |
BY | -6.652 |
Decay | -6.558 |
Geological | -6.063 |
than | -5.997 |
periodic | -5.794 |
Token | child |
Token ID | 1200 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
genders | +7.734 |
empowerment | +7.250 |
equality | +7.084 |
wheelchair | +6.891 |
rights | +6.801 |
Neg logit contributions | |
Decay | -8.010 |
BY | -7.936 |
than | -7.400 |
Geological | -7.309 |
terness | -7.301 |
Token | pornography |
Token ID | 18384 |
Feature activation | -5.27e+00 |
Pos logit contributions | |
genders | +5.780 |
empowerment | +5.343 |
equality | +5.052 |
rights | +4.966 |
aults | +4.850 |
Neg logit contributions | |
BY | -10.908 |
Decay | -10.826 |
than | -10.543 |
Geological | -10.231 |
unfavorable | -10.067 |
Token | but |
Token ID | 475 |
Feature activation | -8.21e-01 |
Pos logit contributions | |
genders | +9.574 |
empowerment | +8.891 |
equality | +8.874 |
CLS | +8.674 |
rights | +8.637 |
Neg logit contributions | |
Decay | -11.328 |
BY | -11.268 |
Reviewer | -10.568 |
Geological | -10.506 |
than | -10.476 |
Token | again |
Token ID | 757 |
Feature activation | +4.31e-01 |
Pos logit contributions | |
genders | +0.651 |
blance | +0.624 |
aults | +0.610 |
empowerment | +0.604 |
rils | +0.603 |
Neg logit contributions | |
BY | -0.577 |
Decay | -0.563 |
than | -0.528 |
unfavorable | -0.526 |
Geological | -0.514 |
Token | , |
Token ID | 11 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
BY | +0.303 |
Decay | +0.296 |
than | +0.278 |
unfavorable | +0.277 |
Geological | +0.270 |
Neg logit contributions | |
genders | -0.341 |
blance | -0.328 |
aults | -0.320 |
rils | -0.317 |
empowerment | -0.317 |
Token | that |
Token ID | 326 |
Feature activation | +7.17e+00 |
Pos logit contributions | |
genders | +2.326 |
blance | +2.205 |
aults | +2.169 |
empowerment | +2.150 |
mattered | +2.139 |
Neg logit contributions | |
BY | -2.113 |
Decay | -2.068 |
than | -1.938 |
unfavorable | -1.918 |
Geological | -1.881 |
Token | has |
Token ID | 468 |
Feature activation | -5.29e+00 |
Pos logit contributions | |
BY | +4.162 |
Decay | +4.057 |
unfavorable | +3.889 |
than | +3.758 |
periodic | +3.736 |
Neg logit contributions | |
genders | -6.242 |
blance | -6.238 |
rils | -6.030 |
aults | -6.014 |
rights | -5.883 |
Token | not |
Token ID | 407 |
Feature activation | -2.50e+01 |
Pos logit contributions | |
genders | +4.133 |
blance | +3.866 |
mattered | +3.865 |
aults | +3.833 |
rils | +3.823 |
Neg logit contributions | |
BY | -3.666 |
Decay | -3.625 |
than | -3.409 |
unfavorable | -3.314 |
orally | -3.275 |
Token | been |
Token ID | 587 |
Feature activation | -4.31e+00 |
Pos logit contributions | |
mattered | +13.836 |
genders | +13.062 |
wheelchair | +11.995 |
rils | +11.430 |
equality | +11.257 |
Neg logit contributions | |
Decay | -17.181 |
Reviewer | -16.936 |
ngth | -16.551 |
BY | -16.435 |
earchers | -15.938 |
Token | confirmed |
Token ID | 4999 |
Feature activation | +2.17e+00 |
Pos logit contributions | |
genders | +3.537 |
mattered | +3.323 |
blance | +3.319 |
aults | +3.281 |
empowerment | +3.260 |
Neg logit contributions | |
BY | -2.859 |
Decay | -2.802 |
than | -2.603 |
unfavorable | -2.536 |
Geological | -2.514 |
Token | just |
Token ID | 655 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
BY | +1.481 |
Decay | +1.432 |
unfavorable | +1.352 |
than | +1.349 |
orally | +1.313 |
Neg logit contributions | |
genders | -1.767 |
blance | -1.720 |
aults | -1.667 |
rils | -1.655 |
empowerment | -1.648 |
Token | yet |
Token ID | 1865 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
BY | +1.966 |
Decay | +1.914 |
unfavorable | +1.806 |
than | +1.806 |
orally | +1.758 |
Neg logit contributions | |
genders | -2.184 |
blance | -2.133 |
aults | -2.051 |
rils | -2.039 |
empowerment | -2.039 |
Token | . |
Token ID | 13 |
Feature activation | -6.57e+00 |
Pos logit contributions | |
BY | +7.658 |
Decay | +7.056 |
than | +6.750 |
unfavorable | +6.706 |
orally | +6.676 |
Neg logit contributions | |
genders | -10.655 |
blance | -10.526 |
aults | -10.154 |
rils | -10.133 |
empowerment | -10.127 |
Token |
|
Token ID | 198 |
Feature activation | -6.54e+00 |
Pos logit contributions | |
CLS | +11.091 |
genders | +10.944 |
aults | +10.606 |
itans | +10.575 |
mattered | +10.362 |
Neg logit contributions | |
periodic | -13.112 |
unfavorable | -13.010 |
orally | -12.717 |
BY | -12.643 |
earchers | -12.449 |
Token |
|
Token ID | 198 |
Feature activation | -1.87e+01 |
Pos logit contributions | |
genders | +3.641 |
aults | +3.408 |
rights | +3.338 |
blance | +3.279 |
itans | +3.265 |
Neg logit contributions | |
Decay | -5.805 |
BY | -5.708 |
unfavorable | -5.581 |
periodic | -5.539 |
orally | -5.434 |
Token | But |
Token ID | 1537 |
Feature activation | -1.84e+01 |
Pos logit contributions | |
STEM | +11.920 |
OULD | +11.768 |
rights | +11.735 |
aults | +11.369 |
blance | +11.088 |
Neg logit contributions | |
Decay | -12.397 |
periodic | -12.302 |
orally | -12.027 |
unfavorable | -11.901 |
terness | -11.385 |
Token | this |
Token ID | 428 |
Feature activation | -8.13e+00 |
Pos logit contributions | |
genders | +12.231 |
equality | +12.025 |
empowerment | +11.951 |
mattered | +11.520 |
wheelchair | +11.413 |
Neg logit contributions | |
BY | -11.635 |
Decay | -11.287 |
Reviewer | -10.571 |
than | -10.370 |
Plot | -10.248 |
Token | isn |
Token ID | 2125 |
Feature activation | -3.30e+00 |
Pos logit contributions | |
genders | +6.355 |
empowerment | +6.095 |
mattered | +6.012 |
equality | +5.949 |
wheelchair | +5.851 |
Neg logit contributions | |
BY | -5.587 |
Decay | -5.463 |
than | -5.058 |
Geological | -4.826 |
unfavorable | -4.802 |
Token | 't |
Token ID | 470 |
Feature activation | -2.00e+01 |
Pos logit contributions | |
genders | +2.879 |
blance | +2.758 |
aults | +2.756 |
rights | +2.714 |
itans | +2.695 |
Neg logit contributions | |
BY | -1.971 |
Decay | -1.969 |
unfavorable | -1.832 |
periodic | -1.807 |
orally | -1.771 |
Token | a |
Token ID | 257 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
genders | +12.463 |
equality | +12.404 |
empowerment | +12.387 |
mattered | +12.013 |
wheelchair | +11.923 |
Neg logit contributions | |
Decay | -13.008 |
Reviewer | -12.542 |
BY | -12.410 |
than | -11.973 |
terness | -11.792 |
Token | new |
Token ID | 649 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
genders | +7.799 |
empowerment | +7.457 |
wheelchair | +7.359 |
equality | +7.301 |
mattered | +7.280 |
Neg logit contributions | |
BY | -7.138 |
Decay | -7.076 |
than | -6.598 |
orally | -6.312 |
unfavorable | -6.305 |
Token | issue |
Token ID | 2071 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
genders | +2.785 |
empowerment | +2.629 |
blance | +2.590 |
mattered | +2.550 |
equality | +2.537 |
Neg logit contributions | |
BY | -3.322 |
Decay | -3.273 |
than | -3.081 |
unfavorable | -3.033 |
orally | -3.000 |
Token | . |
Token ID | 13 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
genders | +3.534 |
blance | +3.345 |
mattered | +3.270 |
empowerment | +3.270 |
aults | +3.259 |
Neg logit contributions | |
BY | -3.827 |
Decay | -3.766 |
than | -3.519 |
unfavorable | -3.490 |
periodic | -3.427 |
Token | Indeed |
Token ID | 9676 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
genders | +11.091 |
CLS | +10.984 |
mattered | +10.596 |
aults | +10.549 |
itans | +10.368 |
Neg logit contributions | |
BY | -10.253 |
unfavorable | -10.131 |
orally | -9.538 |
terness | -9.466 |
periodic | -9.445 |
Token | This |
Token ID | 770 |
Feature activation | +8.87e-01 |
Pos logit contributions | |
genders | +2.235 |
blance | +2.138 |
aults | +2.097 |
rils | +2.076 |
empowerment | +2.075 |
Neg logit contributions | |
BY | -1.758 |
Decay | -1.705 |
unfavorable | -1.636 |
than | -1.608 |
periodic | -1.583 |
Token | is |
Token ID | 318 |
Feature activation | -2.31e+00 |
Pos logit contributions | |
BY | +0.541 |
Decay | +0.525 |
than | +0.489 |
unfavorable | +0.487 |
Geological | +0.473 |
Neg logit contributions | |
genders | -0.787 |
blance | -0.761 |
aults | -0.744 |
rils | -0.737 |
empowerment | -0.736 |
Token | a |
Token ID | 257 |
Feature activation | -4.94e+00 |
Pos logit contributions | |
genders | +1.859 |
blance | +1.767 |
empowerment | +1.738 |
aults | +1.724 |
mattered | +1.715 |
Neg logit contributions | |
BY | -1.586 |
Decay | -1.551 |
than | -1.458 |
unfavorable | -1.446 |
Geological | -1.410 |
Token | guy |
Token ID | 3516 |
Feature activation | +2.57e-02 |
Pos logit contributions | |
genders | +3.799 |
empowerment | +3.545 |
wheelchair | +3.537 |
blance | +3.532 |
mattered | +3.503 |
Neg logit contributions | |
BY | -3.495 |
Decay | -3.433 |
unfavorable | -3.235 |
than | -3.229 |
orally | -3.104 |
Token | who |
Token ID | 508 |
Feature activation | -6.19e-01 |
Pos logit contributions | |
BY | +0.024 |
Decay | +0.024 |
than | +0.023 |
unfavorable | +0.023 |
Geological | +0.022 |
Neg logit contributions | |
genders | -0.014 |
blance | -0.013 |
aults | -0.013 |
empowerment | -0.013 |
rils | -0.013 |
Token | developed |
Token ID | 4166 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
genders | +0.515 |
blance | +0.493 |
aults | +0.483 |
empowerment | +0.478 |
mattered | +0.477 |
Neg logit contributions | |
BY | -0.413 |
Decay | -0.403 |
than | -0.377 |
unfavorable | -0.375 |
Geological | -0.365 |
Token | games |
Token ID | 1830 |
Feature activation | -9.40e+00 |
Pos logit contributions | |
genders | +13.792 |
wheelchair | +13.212 |
equality | +12.986 |
empowerment | +12.735 |
barriers | +12.295 |
Neg logit contributions | |
BY | -12.675 |
terness | -12.400 |
Decay | -12.069 |
iatus | -11.884 |
than | -11.584 |
Token | for |
Token ID | 329 |
Feature activation | -4.40e+00 |
Pos logit contributions | |
genders | +6.876 |
aults | +6.364 |
rights | +6.298 |
empowerment | +6.296 |
blance | +6.287 |
Neg logit contributions | |
BY | -6.790 |
Decay | -6.527 |
than | -6.272 |
unfavorable | -6.210 |
Geological | -6.048 |
Token | Play |
Token ID | 3811 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
genders | +3.396 |
empowerment | +3.142 |
wheelchair | +3.117 |
aults | +3.092 |
blance | +3.085 |
Neg logit contributions | |
BY | -3.172 |
Decay | -3.077 |
than | -2.923 |
unfavorable | -2.890 |
Geological | -2.812 |
Token | St |
Token ID | 1273 |
Feature activation | -8.92e+00 |
Pos logit contributions | |
genders | +1.308 |
blance | +1.256 |
aults | +1.226 |
rights | +1.223 |
rils | +1.213 |
Neg logit contributions | |
BY | -1.157 |
Decay | -1.130 |
unfavorable | -1.073 |
than | -1.068 |
orally | -1.041 |
Token | ations |
Token ID | 602 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
genders | +4.826 |
rils | +4.539 |
blance | +4.535 |
aults | +4.471 |
rights | +4.447 |
Neg logit contributions | |
Decay | -7.856 |
BY | -7.716 |
orally | -7.573 |
unfavorable | -7.539 |
than | -7.507 |