Token | < |
Token ID | 1279 |
Feature activation | -2.89e-01 |
Pos logit contributions | |
augmented | +0.454 |
asses | +0.442 |
offending | +0.431 |
ingle | +0.413 |
routed | +0.410 |
Neg logit contributions | |
ulia | -0.816 |
cott | -0.810 |
icas | -0.748 |
tsky | -0.740 |
kamp | -0.722 |
Token | li |
Token ID | 4528 |
Feature activation | -5.29e-02 |
Pos logit contributions | |
ulia | +0.882 |
cott | +0.867 |
icas | +0.793 |
tsky | +0.775 |
kamp | +0.760 |
Neg logit contributions | |
augmented | -0.613 |
asses | -0.606 |
offending | -0.591 |
ingle | -0.574 |
routed | -0.566 |
Token | ng |
Token ID | 23370 |
Feature activation | +5.51e-01 |
Pos logit contributions | |
ulia | +0.177 |
cott | +0.175 |
icas | +0.161 |
tsky | +0.158 |
kamp | +0.155 |
Neg logit contributions | |
augmented | -0.096 |
asses | -0.094 |
offending | -0.093 |
ingle | -0.089 |
routed | -0.088 |
Token | - |
Token ID | 12 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
augmented | +1.175 |
asses | +1.151 |
offending | +1.129 |
ingle | +1.093 |
routed | +1.084 |
Neg logit contributions | |
ulia | -1.674 |
cott | -1.651 |
icas | -1.512 |
tsky | -1.472 |
kamp | -1.441 |
Token | repeat |
Token ID | 44754 |
Feature activation | +5.20e-01 |
Pos logit contributions | |
augmented | +0.596 |
asses | +0.591 |
offending | +0.574 |
ingle | +0.557 |
routed | +0.551 |
Neg logit contributions | |
ulia | -0.864 |
cott | -0.850 |
icas | -0.778 |
tsky | -0.761 |
kamp | -0.743 |
Token | =" |
Token ID | 2625 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
augmented | +0.656 |
asses | +0.626 |
offending | +0.609 |
routed | +0.570 |
ingle | +0.568 |
Neg logit contributions | |
ulia | -2.036 |
cott | -2.020 |
icas | -1.881 |
tsky | -1.851 |
kamp | -1.822 |
Token | phone |
Token ID | 4862 |
Feature activation | +2.99e-01 |
Pos logit contributions | |
augmented | +4.301 |
asses | +4.279 |
ingle | +4.102 |
offending | +4.085 |
routed | +3.984 |
Neg logit contributions | |
ulia | -4.558 |
cott | -4.483 |
icas | -4.091 |
tsky | -4.088 |
doms | -3.910 |
Token | in |
Token ID | 287 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
augmented | +0.748 |
asses | +0.735 |
offending | +0.724 |
ingle | +0.708 |
routed | +0.701 |
Neg logit contributions | |
ulia | -0.802 |
cott | -0.788 |
icas | -0.712 |
tsky | -0.694 |
kamp | -0.674 |
Token | phones |
Token ID | 9512 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
augmented | +0.316 |
asses | +0.310 |
offending | +0.304 |
ingle | +0.294 |
routed | +0.291 |
Neg logit contributions | |
ulia | -0.457 |
cott | -0.451 |
icas | -0.412 |
tsky | -0.402 |
kamp | -0.394 |
Token | "> |
Token ID | 5320 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
augmented | +0.409 |
asses | +0.401 |
offending | +0.394 |
ingle | +0.382 |
routed | +0.377 |
Neg logit contributions | |
ulia | -0.595 |
cott | -0.587 |
icas | -0.538 |
tsky | -0.524 |
kamp | -0.514 |
Token | {{ |
Token ID | 22935 |
Feature activation | -3.95e-02 |
Pos logit contributions | |
ulia | +0.055 |
cott | +0.054 |
icas | +0.050 |
tsky | +0.049 |
kamp | +0.048 |
Neg logit contributions | |
augmented | -0.034 |
asses | -0.034 |
offending | -0.033 |
ingle | -0.032 |
routed | -0.031 |
Token | < |
Token ID | 1279 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
augmented | +0.575 |
asses | +0.555 |
offending | +0.544 |
ingle | +0.521 |
routed | +0.517 |
Neg logit contributions | |
ulia | -1.062 |
cott | -1.061 |
icas | -0.973 |
tsky | -0.964 |
kamp | -0.941 |
Token | li |
Token ID | 4528 |
Feature activation | -3.78e-02 |
Pos logit contributions | |
ulia | +0.824 |
cott | +0.811 |
icas | +0.743 |
tsky | +0.727 |
kamp | +0.712 |
Neg logit contributions | |
augmented | -0.557 |
asses | -0.553 |
offending | -0.537 |
ingle | -0.522 |
routed | -0.514 |
Token | ng |
Token ID | 23370 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
ulia | +0.117 |
cott | +0.116 |
icas | +0.106 |
tsky | +0.104 |
kamp | +0.101 |
Neg logit contributions | |
augmented | -0.078 |
asses | -0.077 |
offending | -0.075 |
ingle | -0.073 |
routed | -0.072 |
Token | - |
Token ID | 12 |
Feature activation | +2.95e-01 |
Pos logit contributions | |
augmented | +1.064 |
offending | +1.050 |
asses | +1.049 |
disse | +1.000 |
ingle | +0.998 |
Neg logit contributions | |
ulia | -1.382 |
cott | -1.366 |
icas | -1.238 |
tsky | -1.202 |
kamp | -1.186 |
Token | repeat |
Token ID | 44754 |
Feature activation | +4.85e-01 |
Pos logit contributions | |
augmented | +0.926 |
asses | +0.921 |
offending | +0.902 |
ingle | +0.887 |
routed | +0.879 |
Neg logit contributions | |
ulia | -0.600 |
cott | -0.586 |
icas | -0.511 |
tsky | -0.493 |
kamp | -0.472 |
Token | =" |
Token ID | 2625 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
augmented | +0.645 |
asses | +0.630 |
offending | +0.618 |
ingle | +0.578 |
routed | +0.568 |
Neg logit contributions | |
ulia | -1.862 |
cott | -1.842 |
icas | -1.715 |
tsky | -1.679 |
kamp | -1.655 |
Token | phone |
Token ID | 4862 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
asses | +2.750 |
augmented | +2.693 |
ingle | +2.545 |
offending | +2.496 |
routed | +2.407 |
Neg logit contributions | |
ulia | -5.867 |
cott | -5.763 |
tsky | -5.411 |
icas | -5.381 |
doms | -5.241 |
Token | in |
Token ID | 287 |
Feature activation | +9.78e-02 |
Pos logit contributions | |
augmented | +0.502 |
asses | +0.491 |
offending | +0.486 |
ingle | +0.472 |
routed | +0.469 |
Neg logit contributions | |
ulia | -0.575 |
cott | -0.567 |
icas | -0.513 |
tsky | -0.501 |
kamp | -0.489 |
Token | phones |
Token ID | 9512 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
augmented | +0.127 |
asses | +0.123 |
offending | +0.119 |
ingle | +0.112 |
routed | +0.111 |
Neg logit contributions | |
ulia | -0.380 |
cott | -0.376 |
icas | -0.350 |
tsky | -0.344 |
kamp | -0.339 |
Token | "> |
Token ID | 5320 |
Feature activation | -5.48e-02 |
Pos logit contributions | |
augmented | +0.175 |
asses | +0.170 |
offending | +0.165 |
ingle | +0.158 |
routed | +0.155 |
Neg logit contributions | |
ulia | -0.462 |
cott | -0.458 |
icas | -0.425 |
tsky | -0.417 |
kamp | -0.411 |
Token | < |
Token ID | 1279 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
ulia | +0.186 |
cott | +0.186 |
icas | +0.171 |
tsky | +0.169 |
kamp | +0.165 |
Neg logit contributions | |
augmented | -0.097 |
asses | -0.094 |
offending | -0.092 |
ingle | -0.089 |
routed | -0.087 |
Token | mentioned |
Token ID | 4750 |
Feature activation | +3.27e-01 |
Pos logit contributions | |
ulia | +0.375 |
cott | +0.370 |
icas | +0.339 |
tsky | +0.329 |
kamp | +0.324 |
Neg logit contributions | |
augmented | -0.259 |
asses | -0.256 |
offending | -0.252 |
ingle | -0.244 |
routed | -0.239 |
Token | . |
Token ID | 13 |
Feature activation | +7.12e-02 |
Pos logit contributions | |
augmented | +0.785 |
asses | +0.769 |
offending | +0.757 |
routed | +0.728 |
ingle | +0.727 |
Neg logit contributions | |
ulia | -0.913 |
cott | -0.902 |
icas | -0.819 |
tsky | -0.797 |
doms | -0.777 |
Token |
|
Token ID | 198 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
augmented | +0.188 |
asses | +0.186 |
offending | +0.182 |
ingle | +0.178 |
routed | +0.176 |
Neg logit contributions | |
ulia | -0.180 |
cott | -0.177 |
icas | -0.159 |
tsky | -0.154 |
kamp | -0.149 |
Token |
|
Token ID | 198 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
augmented | +0.296 |
asses | +0.292 |
offending | +0.292 |
ingle | +0.281 |
routed | +0.281 |
Neg logit contributions | |
ulia | -0.259 |
cott | -0.256 |
icas | -0.227 |
tsky | -0.219 |
kamp | -0.215 |
Token | No |
Token ID | 2949 |
Feature activation | +3.62e-01 |
Pos logit contributions | |
augmented | +0.399 |
asses | +0.394 |
offending | +0.386 |
ingle | +0.378 |
routed | +0.372 |
Neg logit contributions | |
ulia | -0.407 |
cott | -0.399 |
icas | -0.360 |
tsky | -0.349 |
kamp | -0.340 |
Token | word |
Token ID | 1573 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
augmented | +0.755 |
asses | +0.735 |
offending | +0.729 |
ingle | +0.697 |
routed | +0.687 |
Neg logit contributions | |
ulia | -1.123 |
cott | -1.109 |
icas | -1.012 |
tsky | -0.985 |
doms | -0.965 |
Token | if |
Token ID | 611 |
Feature activation | +7.06e-01 |
Pos logit contributions | |
augmented | +3.279 |
asses | +3.152 |
offending | +3.128 |
routed | +2.972 |
ingle | +2.939 |
Neg logit contributions | |
ulia | -5.380 |
cott | -5.239 |
icas | -4.830 |
tsky | -4.781 |
doms | -4.612 |
Token | the |
Token ID | 262 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
augmented | +1.643 |
asses | +1.592 |
offending | +1.577 |
routed | +1.503 |
ingle | +1.501 |
Neg logit contributions | |
ulia | -2.010 |
cott | -1.983 |
icas | -1.803 |
tsky | -1.757 |
doms | -1.713 |
Token | Str |
Token ID | 4285 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
augmented | +0.027 |
asses | +0.026 |
offending | +0.026 |
ingle | +0.025 |
routed | +0.025 |
Neg logit contributions | |
ulia | -0.036 |
cott | -0.035 |
icas | -0.032 |
tsky | -0.031 |
kamp | -0.031 |
Token | and |
Token ID | 392 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
augmented | +1.060 |
offending | +1.021 |
asses | +1.021 |
routed | +0.965 |
ingle | +0.962 |
Neg logit contributions | |
ulia | -1.945 |
cott | -1.926 |
icas | -1.775 |
tsky | -1.725 |
kamp | -1.700 |
Token | Craft |
Token ID | 15745 |
Feature activation | +3.81e-01 |
Pos logit contributions | |
augmented | +0.510 |
asses | +0.502 |
offending | +0.496 |
ingle | +0.482 |
routed | +0.476 |
Neg logit contributions | |
ulia | -0.499 |
cott | -0.489 |
icas | -0.438 |
tsky | -0.425 |
doms | -0.413 |
Token | < |
Token ID | 27 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
augmented | +0.604 |
asses | +0.597 |
offending | +0.584 |
ingle | +0.571 |
routed | +0.563 |
Neg logit contributions | |
ulia | -0.633 |
cott | -0.621 |
icas | -0.562 |
tsky | -0.548 |
kamp | -0.533 |
Token | body |
Token ID | 2618 |
Feature activation | +4.89e-01 |
Pos logit contributions | |
augmented | +0.298 |
asses | +0.294 |
offending | +0.289 |
ingle | +0.280 |
routed | +0.278 |
Neg logit contributions | |
ulia | -0.357 |
cott | -0.352 |
icas | -0.318 |
tsky | -0.311 |
kamp | -0.304 |
Token | ng |
Token ID | 23370 |
Feature activation | +8.82e-01 |
Pos logit contributions | |
augmented | +0.847 |
asses | +0.818 |
offending | +0.802 |
routed | +0.766 |
ingle | +0.765 |
Neg logit contributions | |
ulia | -1.691 |
cott | -1.677 |
icas | -1.539 |
tsky | -1.513 |
kamp | -1.488 |
Token | - |
Token ID | 12 |
Feature activation | +2.99e-01 |
Pos logit contributions | |
augmented | +1.811 |
asses | +1.758 |
offending | +1.721 |
routed | +1.700 |
ingle | +1.656 |
Neg logit contributions | |
ulia | -2.776 |
cott | -2.729 |
icas | -2.512 |
tsky | -2.488 |
kamp | -2.394 |
Token | controller |
Token ID | 36500 |
Feature activation | +6.22e-01 |
Pos logit contributions | |
augmented | +0.637 |
asses | +0.626 |
offending | +0.617 |
ingle | +0.596 |
routed | +0.587 |
Neg logit contributions | |
ulia | -0.905 |
cott | -0.894 |
icas | -0.816 |
tsky | -0.791 |
kamp | -0.779 |
Token | =" |
Token ID | 2625 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
augmented | +1.250 |
asses | +1.218 |
offending | +1.205 |
routed | +1.158 |
ingle | +1.156 |
Neg logit contributions | |
ulia | -1.977 |
cott | -1.952 |
icas | -1.783 |
tsky | -1.748 |
kamp | -1.710 |
Token | Phone |
Token ID | 6132 |
Feature activation | -2.46e-01 |
Pos logit contributions | |
asses | +4.139 |
augmented | +4.092 |
offending | +3.949 |
ingle | +3.937 |
routed | +3.833 |
Neg logit contributions | |
ulia | -4.245 |
cott | -4.081 |
tsky | -3.754 |
icas | -3.736 |
kamp | -3.606 |
Token | List |
Token ID | 8053 |
Feature activation | +3.80e-02 |
Pos logit contributions | |
ulia | +0.739 |
cott | +0.730 |
icas | +0.666 |
tsky | +0.647 |
kamp | +0.636 |
Neg logit contributions | |
augmented | -0.531 |
asses | -0.523 |
offending | -0.514 |
ingle | -0.497 |
routed | -0.491 |
Token | Ctrl |
Token ID | 40069 |
Feature activation | +6.53e-01 |
Pos logit contributions | |
augmented | +0.072 |
asses | +0.070 |
offending | +0.069 |
ingle | +0.066 |
routed | +0.065 |
Neg logit contributions | |
ulia | -0.125 |
cott | -0.123 |
icas | -0.114 |
tsky | -0.111 |
kamp | -0.109 |
Token | "> |
Token ID | 5320 |
Feature activation | +6.97e-02 |
Pos logit contributions | |
augmented | +1.168 |
asses | +1.130 |
offending | +1.113 |
ingle | +1.076 |
routed | +1.064 |
Neg logit contributions | |
ulia | -2.214 |
cott | -2.196 |
icas | -2.025 |
tsky | -1.981 |
kamp | -1.943 |
Token | < |
Token ID | 1279 |
Feature activation | -4.18e-01 |
Pos logit contributions | |
augmented | +0.136 |
asses | +0.133 |
offending | +0.130 |
ingle | +0.125 |
routed | +0.124 |
Neg logit contributions | |
ulia | -0.225 |
cott | -0.223 |
icas | -0.205 |
tsky | -0.201 |
kamp | -0.196 |
Token | < |
Token ID | 27 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
augmented | +0.636 |
asses | +0.629 |
offending | +0.610 |
ingle | +0.595 |
routed | +0.582 |
Neg logit contributions | |
ulia | -1.042 |
cott | -1.025 |
icas | -0.943 |
tsky | -0.927 |
kamp | -0.906 |
Token | body |
Token ID | 2618 |
Feature activation | +4.60e-01 |
Pos logit contributions | |
augmented | +0.329 |
asses | +0.326 |
offending | +0.320 |
ingle | +0.312 |
routed | +0.309 |
Neg logit contributions | |
ulia | -0.342 |
cott | -0.336 |
icas | -0.301 |
tsky | -0.295 |
kamp | -0.287 |
Token | ng |
Token ID | 23370 |
Feature activation | +7.04e-01 |
Pos logit contributions | |
augmented | +0.930 |
asses | +0.907 |
offending | +0.893 |
ingle | +0.857 |
routed | +0.856 |
Neg logit contributions | |
ulia | -1.452 |
cott | -1.441 |
icas | -1.312 |
tsky | -1.287 |
kamp | -1.261 |
Token | - |
Token ID | 12 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
augmented | +1.542 |
asses | +1.519 |
offending | +1.501 |
ingle | +1.445 |
routed | +1.427 |
Neg logit contributions | |
ulia | -2.098 |
cott | -2.070 |
icas | -1.888 |
tsky | -1.832 |
kamp | -1.801 |
Token | controller |
Token ID | 36500 |
Feature activation | +5.63e-01 |
Pos logit contributions | |
augmented | +0.579 |
asses | +0.574 |
offending | +0.554 |
ingle | +0.535 |
routed | +0.527 |
Neg logit contributions | |
ulia | -1.153 |
cott | -1.135 |
icas | -1.047 |
tsky | -1.029 |
kamp | -1.004 |
Token | =" |
Token ID | 2625 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
augmented | +0.677 |
asses | +0.645 |
offending | +0.628 |
ingle | +0.596 |
routed | +0.595 |
Neg logit contributions | |
ulia | -2.234 |
cott | -2.221 |
icas | -2.064 |
tsky | -2.039 |
kamp | -1.997 |
Token | Phone |
Token ID | 6132 |
Feature activation | -3.90e-01 |
Pos logit contributions | |
asses | +2.708 |
augmented | +2.690 |
ingle | +2.538 |
offending | +2.452 |
routed | +2.394 |
Neg logit contributions | |
ulia | -5.536 |
cott | -5.407 |
tsky | -5.097 |
icas | -5.064 |
doms | -4.885 |
Token | List |
Token ID | 8053 |
Feature activation | +5.52e-02 |
Pos logit contributions | |
ulia | +0.963 |
cott | +0.947 |
icas | +0.847 |
tsky | +0.816 |
kamp | +0.798 |
Neg logit contributions | |
augmented | -1.050 |
asses | -1.036 |
offending | -1.024 |
ingle | -0.994 |
routed | -0.985 |
Token | Ctrl |
Token ID | 40069 |
Feature activation | +7.26e-01 |
Pos logit contributions | |
augmented | +0.113 |
asses | +0.111 |
offending | +0.109 |
ingle | +0.105 |
routed | +0.104 |
Neg logit contributions | |
ulia | -0.173 |
cott | -0.171 |
icas | -0.156 |
tsky | -0.153 |
kamp | -0.150 |
Token | "> |
Token ID | 5320 |
Feature activation | +9.22e-02 |
Pos logit contributions | |
augmented | +0.986 |
asses | +0.944 |
offending | +0.923 |
ingle | +0.878 |
routed | +0.874 |
Neg logit contributions | |
ulia | -2.772 |
cott | -2.756 |
icas | -2.562 |
tsky | -2.530 |
kamp | -2.480 |
Token | < |
Token ID | 1279 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
augmented | +0.172 |
asses | +0.167 |
offending | +0.163 |
ingle | +0.157 |
routed | +0.155 |
Neg logit contributions | |
ulia | -0.306 |
cott | -0.304 |
icas | -0.279 |
tsky | -0.275 |
kamp | -0.268 |
Token | the |
Token ID | 262 |
Feature activation | +3.08e-02 |
Pos logit contributions | |
augmented | +0.522 |
asses | +0.511 |
offending | +0.504 |
ingle | +0.486 |
routed | +0.484 |
Neg logit contributions | |
ulia | -0.593 |
cott | -0.583 |
icas | -0.525 |
tsky | -0.514 |
kamp | -0.503 |
Token | Nexus |
Token ID | 16756 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
augmented | +0.075 |
asses | +0.074 |
offending | +0.073 |
ingle | +0.071 |
routed | +0.070 |
Neg logit contributions | |
ulia | -0.084 |
cott | -0.083 |
icas | -0.075 |
tsky | -0.073 |
kamp | -0.071 |
Token | 6 |
Token ID | 718 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
augmented | +0.706 |
asses | +0.681 |
offending | +0.672 |
ingle | +0.635 |
routed | +0.626 |
Neg logit contributions | |
ulia | -1.685 |
cott | -1.669 |
icas | -1.546 |
tsky | -1.520 |
kamp | -1.495 |
Token | . |
Token ID | 13 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
augmented | +0.647 |
asses | +0.635 |
offending | +0.627 |
ingle | +0.606 |
routed | +0.601 |
Neg logit contributions | |
ulia | -0.778 |
cott | -0.767 |
icas | -0.695 |
tsky | -0.676 |
kamp | -0.661 |
Token | No |
Token ID | 1400 |
Feature activation | +2.94e-01 |
Pos logit contributions | |
augmented | +0.390 |
asses | +0.384 |
offending | +0.378 |
ingle | +0.369 |
routed | +0.364 |
Neg logit contributions | |
ulia | -0.383 |
cott | -0.376 |
icas | -0.339 |
tsky | -0.327 |
kamp | -0.319 |
Token | word |
Token ID | 1573 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
augmented | +0.631 |
asses | +0.615 |
offending | +0.611 |
ingle | +0.584 |
routed | +0.579 |
Neg logit contributions | |
ulia | -0.893 |
cott | -0.882 |
icas | -0.804 |
tsky | -0.784 |
kamp | -0.767 |
Token | on |
Token ID | 319 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
augmented | +3.099 |
asses | +3.002 |
offending | +2.960 |
routed | +2.813 |
ingle | +2.811 |
Neg logit contributions | |
ulia | -5.161 |
cott | -5.022 |
icas | -4.629 |
tsky | -4.589 |
doms | -4.416 |
Token | if |
Token ID | 611 |
Feature activation | +6.13e-01 |
Pos logit contributions | |
augmented | +1.024 |
asses | +0.986 |
offending | +0.985 |
ingle | +0.941 |
routed | +0.937 |
Neg logit contributions | |
ulia | -1.400 |
cott | -1.378 |
icas | -1.260 |
tsky | -1.233 |
kamp | -1.203 |
Token | there |
Token ID | 612 |
Feature activation | -6.82e-02 |
Pos logit contributions | |
augmented | +1.397 |
asses | +1.353 |
offending | +1.340 |
routed | +1.284 |
ingle | +1.273 |
Neg logit contributions | |
ulia | -1.781 |
cott | -1.757 |
icas | -1.599 |
tsky | -1.564 |
kamp | -1.535 |
Token | will |
Token ID | 481 |
Feature activation | -4.28e-01 |
Pos logit contributions | |
ulia | +0.208 |
cott | +0.205 |
icas | +0.188 |
tsky | +0.184 |
kamp | +0.179 |
Neg logit contributions | |
augmented | -0.145 |
asses | -0.142 |
offending | -0.140 |
ingle | -0.135 |
routed | -0.134 |
Token | be |
Token ID | 307 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
ulia | +1.193 |
cott | +1.177 |
icas | +1.065 |
tsky | +1.035 |
kamp | +1.011 |
Neg logit contributions | |
augmented | -1.022 |
asses | -1.003 |
offending | -0.991 |
ingle | -0.962 |
routed | -0.950 |
Token | Legends |
Token ID | 14270 |
Feature activation | -9.23e-02 |
Pos logit contributions | |
ulia | +0.442 |
cott | +0.436 |
icas | +0.396 |
tsky | +0.384 |
kamp | +0.377 |
Neg logit contributions | |
augmented | -0.356 |
asses | -0.352 |
offending | -0.346 |
ingle | -0.336 |
routed | -0.332 |
Token | of |
Token ID | 286 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
ulia | +0.284 |
cott | +0.276 |
icas | +0.254 |
tsky | +0.249 |
kamp | +0.241 |
Neg logit contributions | |
augmented | -0.198 |
asses | -0.192 |
offending | -0.191 |
ingle | -0.183 |
routed | -0.181 |
Token | Tomorrow |
Token ID | 25939 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
ulia | +0.292 |
cott | +0.287 |
icas | +0.255 |
tsky | +0.247 |
kamp | +0.240 |
Neg logit contributions | |
augmented | -0.351 |
asses | -0.346 |
offending | -0.341 |
ingle | -0.335 |
routed | -0.330 |
Token | . |
Token ID | 13 |
Feature activation | +8.22e-02 |
Pos logit contributions | |
augmented | +0.258 |
asses | +0.252 |
offending | +0.249 |
ingle | +0.240 |
routed | +0.238 |
Neg logit contributions | |
ulia | -0.308 |
cott | -0.303 |
icas | -0.275 |
tsky | -0.267 |
kamp | -0.260 |
Token | No |
Token ID | 1400 |
Feature activation | +5.96e-02 |
Pos logit contributions | |
augmented | +0.217 |
asses | +0.214 |
offending | +0.211 |
ingle | +0.205 |
routed | +0.203 |
Neg logit contributions | |
ulia | -0.208 |
cott | -0.205 |
icas | -0.184 |
tsky | -0.178 |
kamp | -0.173 |
Token | word |
Token ID | 1573 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
augmented | +0.132 |
asses | +0.129 |
offending | +0.128 |
ingle | +0.123 |
routed | +0.122 |
Neg logit contributions | |
ulia | -0.177 |
cott | -0.174 |
icas | -0.159 |
tsky | -0.155 |
kamp | -0.151 |
Token | on |
Token ID | 319 |
Feature activation | +3.85e-01 |
Pos logit contributions | |
augmented | +3.052 |
asses | +2.978 |
offending | +2.915 |
routed | +2.779 |
ingle | +2.764 |
Neg logit contributions | |
ulia | -5.025 |
cott | -4.886 |
icas | -4.521 |
tsky | -4.506 |
doms | -4.310 |
Token | what |
Token ID | 644 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
augmented | +0.807 |
asses | +0.782 |
offending | +0.781 |
ingle | +0.746 |
routed | +0.738 |
Neg logit contributions | |
ulia | -1.187 |
cott | -1.170 |
icas | -1.074 |
tsky | -1.049 |
kamp | -1.021 |
Token | this |
Token ID | 428 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
augmented | +0.256 |
asses | +0.252 |
offending | +0.248 |
ingle | +0.240 |
routed | +0.237 |
Neg logit contributions | |
ulia | -0.346 |
cott | -0.341 |
icas | -0.311 |
tsky | -0.302 |
kamp | -0.296 |
Token | collaboration |
Token ID | 12438 |
Feature activation | +5.62e-01 |
Pos logit contributions | |
ulia | +0.664 |
cott | +0.657 |
icas | +0.602 |
tsky | +0.586 |
kamp | +0.577 |
Neg logit contributions | |
augmented | -0.416 |
asses | -0.410 |
offending | -0.401 |
ingle | -0.388 |
routed | -0.383 |
Token | will |
Token ID | 481 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
augmented | +1.220 |
asses | +1.189 |
offending | +1.170 |
ingle | +1.126 |
routed | +1.113 |
Neg logit contributions | |
ulia | -1.714 |
cott | -1.680 |
icas | -1.533 |
tsky | -1.491 |
kamp | -1.449 |
Token | ADVERTISEMENT |
Token ID | 19053 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
augmented | +0.120 |
asses | +0.119 |
offending | +0.117 |
ingle | +0.114 |
routed | +0.112 |
Neg logit contributions | |
ulia | -0.122 |
cott | -0.119 |
icas | -0.108 |
tsky | -0.104 |
kamp | -0.102 |
Token |
|
Token ID | 198 |
Feature activation | -2.18e-01 |
Pos logit contributions | |
augmented | +0.657 |
asses | +0.650 |
offending | +0.637 |
ingle | +0.634 |
routed | +0.617 |
Neg logit contributions | |
ulia | -0.710 |
cott | -0.697 |
icas | -0.631 |
tsky | -0.605 |
doms | -0.599 |
Token |
|
Token ID | 198 |
Feature activation | +6.42e-03 |
Pos logit contributions | |
ulia | +0.499 |
cott | +0.493 |
icas | +0.429 |
tsky | +0.412 |
kamp | +0.409 |
Neg logit contributions | |
augmented | -0.629 |
offending | -0.629 |
asses | -0.618 |
disse | -0.609 |
routed | -0.601 |
Token | How |
Token ID | 2437 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
augmented | +0.016 |
asses | +0.016 |
offending | +0.016 |
ingle | +0.015 |
routed | +0.015 |
Neg logit contributions | |
ulia | -0.017 |
cott | -0.017 |
icas | -0.015 |
tsky | -0.015 |
kamp | -0.014 |
Token | a |
Token ID | 257 |
Feature activation | +7.53e-02 |
Pos logit contributions | |
ulia | +0.885 |
cott | +0.872 |
icas | +0.790 |
tsky | +0.766 |
kamp | +0.749 |
Neg logit contributions | |
augmented | -0.766 |
asses | -0.754 |
offending | -0.743 |
ingle | -0.721 |
routed | -0.713 |
Token | pro |
Token ID | 1676 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
augmented | +0.158 |
asses | +0.154 |
offending | +0.153 |
routed | +0.146 |
ingle | +0.146 |
Neg logit contributions | |
ulia | -0.233 |
cott | -0.228 |
icas | -0.210 |
tsky | -0.204 |
kamp | -0.200 |
Token | pos |
Token ID | 1930 |
Feature activation | +3.38e-01 |
Pos logit contributions | |
asses | +3.161 |
offending | +3.114 |
augmented | +3.078 |
ingle | +2.940 |
routed | +2.899 |
Neg logit contributions | |
ulia | -4.593 |
cott | -4.478 |
icas | -4.172 |
kamp | -3.940 |
tsky | -3.918 |
Token | that |
Token ID | 326 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
augmented | +0.758 |
asses | +0.740 |
offending | +0.735 |
ingle | +0.704 |
routed | +0.698 |
Neg logit contributions | |
ulia | -0.993 |
cott | -0.974 |
icas | -0.892 |
tsky | -0.863 |
kamp | -0.851 |
Token | this |
Token ID | 428 |
Feature activation | -6.49e-02 |
Pos logit contributions | |
augmented | +0.509 |
asses | +0.498 |
offending | +0.495 |
ingle | +0.475 |
routed | +0.472 |
Neg logit contributions | |
ulia | -0.628 |
cott | -0.618 |
icas | -0.564 |
tsky | -0.545 |
kamp | -0.537 |
Token | famous |
Token ID | 5863 |
Feature activation | +4.28e-01 |
Pos logit contributions | |
ulia | +0.186 |
cott | +0.183 |
icas | +0.167 |
tsky | +0.162 |
kamp | +0.159 |
Neg logit contributions | |
augmented | -0.150 |
asses | -0.147 |
offending | -0.145 |
ingle | -0.140 |
routed | -0.139 |
Token | and |
Token ID | 290 |
Feature activation | +4.21e-01 |
Pos logit contributions | |
augmented | +0.930 |
offending | +0.907 |
asses | +0.902 |
ingle | +0.860 |
routed | +0.858 |
Neg logit contributions | |
ulia | -1.306 |
cott | -1.272 |
icas | -1.168 |
tsky | -1.122 |
doms | -1.111 |
Token | / |
Token ID | 14 |
Feature activation | -5.97e-02 |
Pos logit contributions | |
ulia | +0.020 |
cott | +0.019 |
icas | +0.018 |
tsky | +0.017 |
kamp | +0.017 |
Neg logit contributions | |
augmented | -0.012 |
asses | -0.012 |
offending | -0.012 |
ingle | -0.011 |
routed | -0.011 |
Token | communication |
Token ID | 32560 |
Feature activation | +2.26e-01 |
Pos logit contributions | |
ulia | +0.160 |
cott | +0.157 |
icas | +0.143 |
tsky | +0.139 |
kamp | +0.134 |
Neg logit contributions | |
augmented | -0.149 |
asses | -0.147 |
offending | -0.145 |
ingle | -0.141 |
routed | -0.139 |
Token | preference |
Token ID | 12741 |
Feature activation | -9.08e-02 |
Pos logit contributions | |
augmented | +0.478 |
asses | +0.468 |
offending | +0.461 |
ingle | +0.443 |
routed | +0.441 |
Neg logit contributions | |
ulia | -0.693 |
cott | -0.684 |
icas | -0.624 |
tsky | -0.608 |
kamp | -0.596 |
Token | , |
Token ID | 11 |
Feature activation | +8.50e-02 |
Pos logit contributions | |
ulia | +0.257 |
cott | +0.253 |
icas | +0.230 |
tsky | +0.223 |
kamp | +0.218 |
Neg logit contributions | |
augmented | -0.213 |
asses | -0.210 |
offending | -0.207 |
ingle | -0.200 |
routed | -0.198 |
Token | any |
Token ID | 597 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
augmented | +0.189 |
asses | +0.184 |
offending | +0.182 |
ingle | +0.176 |
routed | +0.174 |
Neg logit contributions | |
ulia | -0.253 |
cott | -0.248 |
icas | -0.227 |
tsky | -0.221 |
kamp | -0.217 |
Token | word |
Token ID | 1573 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
augmented | +0.490 |
asses | +0.476 |
offending | +0.473 |
ingle | +0.451 |
routed | +0.447 |
Neg logit contributions | |
ulia | -0.732 |
cott | -0.716 |
icas | -0.658 |
tsky | -0.641 |
kamp | -0.629 |
Token | of |
Token ID | 286 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
augmented | +3.102 |
offending | +3.021 |
asses | +2.998 |
routed | +2.873 |
ingle | +2.834 |
Neg logit contributions | |
ulia | -4.550 |
cott | -4.352 |
icas | -4.145 |
tsky | -4.027 |
doms | -3.890 |
Token | mouth |
Token ID | 5422 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
augmented | +1.073 |
offending | +1.042 |
asses | +1.032 |
ingle | +0.987 |
routed | +0.983 |
Neg logit contributions | |
ulia | -1.352 |
cott | -1.301 |
icas | -1.207 |
tsky | -1.178 |
doms | -1.148 |
Token | you |
Token ID | 345 |
Feature activation | +1.57e-01 |
Pos logit contributions | |
augmented | +0.826 |
offending | +0.801 |
asses | +0.800 |
ingle | +0.767 |
routed | +0.764 |
Neg logit contributions | |
ulia | -1.089 |
cott | -1.068 |
icas | -0.981 |
tsky | -0.954 |
kamp | -0.930 |
Token | can |
Token ID | 460 |
Feature activation | -8.75e-02 |
Pos logit contributions | |
augmented | +0.352 |
asses | +0.346 |
offending | +0.341 |
ingle | +0.330 |
routed | +0.326 |
Neg logit contributions | |
ulia | -0.461 |
cott | -0.455 |
icas | -0.414 |
tsky | -0.403 |
kamp | -0.394 |
Token | help |
Token ID | 1037 |
Feature activation | +1.49e-02 |
Pos logit contributions | |
ulia | +0.267 |
cott | +0.262 |
icas | +0.240 |
tsky | +0.233 |
kamp | +0.229 |
Neg logit contributions | |
augmented | -0.185 |
asses | -0.182 |
offending | -0.179 |
ingle | -0.173 |
routed | -0.171 |
Token |
|
Token ID | 198 |
Feature activation | -3.03e-02 |
Pos logit contributions | |
ulia | +0.065 |
cott | +0.064 |
icas | +0.057 |
tsky | +0.056 |
kamp | +0.054 |
Neg logit contributions | |
augmented | -0.065 |
asses | -0.065 |
offending | -0.063 |
ingle | -0.061 |
routed | -0.061 |
Token |
|
Token ID | 198 |
Feature activation | +3.13e-02 |
Pos logit contributions | |
ulia | +0.071 |
cott | +0.070 |
icas | +0.062 |
tsky | +0.059 |
kamp | +0.059 |
Neg logit contributions | |
augmented | -0.085 |
offending | -0.085 |
asses | -0.084 |
disse | -0.081 |
routed | -0.081 |
Token | No |
Token ID | 2949 |
Feature activation | +2.76e-01 |
Pos logit contributions | |
augmented | +0.078 |
asses | +0.078 |
offending | +0.075 |
ingle | +0.074 |
routed | +0.073 |
Neg logit contributions | |
ulia | -0.083 |
cott | -0.082 |
icas | -0.074 |
tsky | -0.072 |
kamp | -0.070 |
Token | one |
Token ID | 530 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
augmented | +0.549 |
asses | +0.537 |
offending | +0.530 |
ingle | +0.504 |
disse | +0.499 |
Neg logit contributions | |
ulia | -0.877 |
cott | -0.866 |
icas | -0.794 |
tsky | -0.775 |
kamp | -0.759 |
Token | knows |
Token ID | 4206 |
Feature activation | +7.41e-01 |
Pos logit contributions | |
ulia | +0.305 |
cott | +0.301 |
icas | +0.271 |
tsky | +0.263 |
kamp | +0.257 |
Neg logit contributions | |
augmented | -0.273 |
asses | -0.270 |
offending | -0.265 |
ingle | -0.259 |
routed | -0.255 |
Token | exactly |
Token ID | 3446 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
augmented | +1.330 |
asses | +1.275 |
offending | +1.273 |
ingle | +1.191 |
routed | +1.187 |
Neg logit contributions | |
ulia | -2.524 |
cott | -2.476 |
icas | -2.311 |
tsky | -2.254 |
kamp | -2.192 |
Token | how |
Token ID | 703 |
Feature activation | +5.69e-01 |
Pos logit contributions | |
augmented | +2.227 |
asses | +2.054 |
offending | +2.053 |
routed | +1.927 |
ingle | +1.896 |
Neg logit contributions | |
ulia | -5.318 |
cott | -5.245 |
icas | -4.903 |
tsky | -4.835 |
doms | -4.712 |
Token | they |
Token ID | 484 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
augmented | +1.259 |
asses | +1.222 |
offending | +1.209 |
routed | +1.158 |
disse | +1.140 |
Neg logit contributions | |
ulia | -1.692 |
cott | -1.672 |
icas | -1.540 |
tsky | -1.506 |
kamp | -1.471 |
Token | were |
Token ID | 547 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
augmented | +0.410 |
asses | +0.403 |
offending | +0.397 |
ingle | +0.385 |
routed | +0.382 |
Neg logit contributions | |
ulia | -0.480 |
cott | -0.473 |
icas | -0.429 |
tsky | -0.416 |
kamp | -0.408 |
Token | made |
Token ID | 925 |
Feature activation | -2.73e-02 |
Pos logit contributions | |
augmented | +0.616 |
asses | +0.599 |
offending | +0.591 |
routed | +0.566 |
ingle | +0.566 |
Neg logit contributions | |
ulia | -0.927 |
cott | -0.913 |
icas | -0.836 |
tsky | -0.815 |
kamp | -0.800 |
Token | — |
Token ID | 851 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
ulia | +0.077 |
cott | +0.075 |
icas | +0.068 |
tsky | +0.066 |
kamp | +0.065 |
Neg logit contributions | |
augmented | -0.065 |
asses | -0.064 |
offending | -0.063 |
ingle | -0.061 |
routed | -0.060 |
Token | activists |
Token ID | 7941 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
augmented | +0.115 |
asses | +0.113 |
offending | +0.111 |
ingle | +0.107 |
routed | +0.106 |
Neg logit contributions | |
ulia | -0.175 |
cott | -0.172 |
icas | -0.158 |
tsky | -0.154 |
kamp | -0.151 |
Token | on |
Token ID | 319 |
Feature activation | -9.49e-02 |
Pos logit contributions | |
augmented | +0.584 |
asses | +0.573 |
offending | +0.570 |
ingle | +0.546 |
routed | +0.543 |
Neg logit contributions | |
ulia | -0.761 |
cott | -0.745 |
icas | -0.686 |
tsky | -0.659 |
kamp | -0.647 |
Token | even |
Token ID | 772 |
Feature activation | -4.41e-02 |
Pos logit contributions | |
ulia | +0.280 |
cott | +0.276 |
icas | +0.251 |
tsky | +0.244 |
kamp | +0.239 |
Neg logit contributions | |
augmented | -0.212 |
asses | -0.208 |
offending | -0.205 |
ingle | -0.198 |
routed | -0.196 |
Token | that |
Token ID | 326 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
ulia | +0.128 |
cott | +0.126 |
icas | +0.114 |
tsky | +0.111 |
kamp | +0.109 |
Neg logit contributions | |
augmented | -0.101 |
asses | -0.099 |
offending | -0.098 |
ingle | -0.094 |
routed | -0.093 |
Token | single |
Token ID | 2060 |
Feature activation | +3.96e-01 |
Pos logit contributions | |
augmented | +0.310 |
asses | +0.303 |
offending | +0.300 |
ingle | +0.288 |
routed | +0.286 |
Neg logit contributions | |
ulia | -0.456 |
cott | -0.449 |
icas | -0.412 |
tsky | -0.398 |
kamp | -0.393 |
Token | word |
Token ID | 1573 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
augmented | +0.731 |
asses | +0.709 |
offending | +0.707 |
ingle | +0.670 |
routed | +0.663 |
Neg logit contributions | |
ulia | -1.325 |
cott | -1.306 |
icas | -1.208 |
tsky | -1.169 |
kamp | -1.156 |
Token | hurts |
Token ID | 20406 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
augmented | +3.297 |
asses | +3.249 |
offending | +3.232 |
routed | +3.054 |
ingle | +3.024 |
Neg logit contributions | |
ulia | -4.048 |
cott | -3.937 |
icas | -3.685 |
tsky | -3.510 |
doms | -3.433 |
Token | women |
Token ID | 1466 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
augmented | +0.702 |
asses | +0.690 |
offending | +0.688 |
ingle | +0.645 |
routed | +0.643 |
Neg logit contributions | |
ulia | -1.106 |
cott | -1.090 |
icas | -1.002 |
tsky | -0.973 |
kamp | -0.956 |
Token | and |
Token ID | 290 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
augmented | +0.586 |
asses | +0.583 |
offending | +0.575 |
ingle | +0.549 |
routed | +0.547 |
Neg logit contributions | |
ulia | -0.683 |
cott | -0.669 |
icas | -0.606 |
tsky | -0.585 |
kamp | -0.574 |
Token | the |
Token ID | 262 |
Feature activation | +1.28e-01 |
Pos logit contributions | |
augmented | +0.729 |
asses | +0.716 |
offending | +0.709 |
ingle | +0.676 |
routed | +0.671 |
Neg logit contributions | |
ulia | -1.040 |
cott | -1.022 |
icas | -0.935 |
tsky | -0.906 |
kamp | -0.891 |
Token | cause |
Token ID | 2728 |
Feature activation | +3.27e-01 |
Pos logit contributions | |
augmented | +0.250 |
asses | +0.246 |
offending | +0.242 |
ingle | +0.230 |
routed | +0.229 |
Neg logit contributions | |
ulia | -0.416 |
cott | -0.410 |
icas | -0.376 |
tsky | -0.367 |
kamp | -0.361 |
Token | the |
Token ID | 262 |
Feature activation | -7.28e-02 |
Pos logit contributions | |
ulia | +1.817 |
cott | +1.794 |
icas | +1.617 |
tsky | +1.567 |
kamp | +1.539 |
Neg logit contributions | |
augmented | -1.697 |
asses | -1.679 |
offending | -1.652 |
ingle | -1.604 |
routed | -1.594 |
Token | day |
Token ID | 1110 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
ulia | +0.226 |
cott | +0.223 |
icas | +0.204 |
tsky | +0.198 |
kamp | +0.194 |
Neg logit contributions | |
augmented | -0.152 |
asses | -0.149 |
offending | -0.147 |
ingle | -0.141 |
routed | -0.139 |
Token | after |
Token ID | 706 |
Feature activation | +3.63e-02 |
Pos logit contributions | |
ulia | +0.311 |
cott | +0.307 |
icas | +0.279 |
tsky | +0.270 |
kamp | +0.265 |
Neg logit contributions | |
augmented | -0.246 |
asses | -0.241 |
offending | -0.238 |
ingle | -0.230 |
routed | -0.227 |
Token | the |
Token ID | 262 |
Feature activation | +3.72e-01 |
Pos logit contributions | |
augmented | +0.090 |
asses | +0.088 |
offending | +0.087 |
ingle | +0.084 |
routed | +0.083 |
Neg logit contributions | |
ulia | -0.099 |
cott | -0.097 |
icas | -0.088 |
tsky | -0.085 |
kamp | -0.083 |
Token | final |
Token ID | 2457 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
augmented | +0.780 |
asses | +0.757 |
offending | +0.756 |
ingle | +0.719 |
routed | +0.710 |
Neg logit contributions | |
ulia | -1.157 |
cott | -1.134 |
icas | -1.040 |
tsky | -1.016 |
doms | -0.991 |
Token | Force |
Token ID | 5221 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
augmented | +0.685 |
asses | +0.667 |
offending | +0.664 |
ingle | +0.635 |
routed | +0.629 |
Neg logit contributions | |
ulia | -1.029 |
cott | -1.013 |
icas | -0.928 |
tsky | -0.902 |
kamp | -0.885 |
Token | Awakens |
Token ID | 39613 |
Feature activation | +7.71e-01 |
Pos logit contributions | |
augmented | +3.072 |
asses | +2.990 |
offending | +2.970 |
ingle | +2.892 |
routed | +2.836 |
Neg logit contributions | |
ulia | -4.347 |
cott | -4.215 |
icas | -3.878 |
tsky | -3.775 |
doms | -3.632 |
Token | trailer |
Token ID | 12268 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
augmented | +1.713 |
offending | +1.656 |
asses | +1.635 |
ingle | +1.586 |
routed | +1.586 |
Neg logit contributions | |
ulia | -2.314 |
cott | -2.239 |
icas | -2.076 |
tsky | -2.012 |
kamp | -1.947 |
Token | premiered |
Token ID | 44119 |
Feature activation | +3.33e-01 |
Pos logit contributions | |
augmented | +0.707 |
asses | +0.688 |
offending | +0.684 |
ingle | +0.661 |
routed | +0.659 |
Neg logit contributions | |
ulia | -0.853 |
cott | -0.836 |
icas | -0.765 |
tsky | -0.745 |
kamp | -0.725 |
Token | ( |
Token ID | 357 |
Feature activation | -3.68e-01 |
Pos logit contributions | |
augmented | +0.770 |
asses | +0.744 |
offending | +0.742 |
ingle | +0.716 |
routed | +0.713 |
Neg logit contributions | |
ulia | -0.958 |
cott | -0.944 |
icas | -0.863 |
tsky | -0.838 |
kamp | -0.816 |
Token | along |
Token ID | 24176 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
ulia | +1.048 |
cott | +1.036 |
icas | +0.939 |
tsky | +0.909 |
kamp | +0.894 |
Neg logit contributions | |
augmented | -0.851 |
asses | -0.837 |
offending | -0.826 |
ingle | -0.799 |
routed | -0.791 |
Token | Sign |
Token ID | 5865 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
augmented | +1.416 |
asses | +1.398 |
offending | +1.387 |
ingle | +1.364 |
routed | +1.351 |
Neg logit contributions | |
ulia | -0.502 |
cott | -0.483 |
icas | -0.392 |
tsky | -0.361 |
doms | -0.339 |
Token | up |
Token ID | 510 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
augmented | +0.785 |
asses | +0.776 |
offending | +0.764 |
ingle | +0.740 |
routed | +0.734 |
Neg logit contributions | |
ulia | -0.911 |
cott | -0.898 |
icas | -0.813 |
tsky | -0.789 |
kamp | -0.773 |
Token | for |
Token ID | 329 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
augmented | +0.562 |
asses | +0.558 |
offending | +0.549 |
ingle | +0.526 |
disse | +0.524 |
Neg logit contributions | |
ulia | -0.909 |
cott | -0.901 |
icas | -0.816 |
tsky | -0.800 |
kamp | -0.794 |
Token | Take |
Token ID | 7214 |
Feature activation | +7.25e-01 |
Pos logit contributions | |
ulia | +0.047 |
cott | +0.046 |
icas | +0.042 |
tsky | +0.041 |
kamp | +0.040 |
Neg logit contributions | |
augmented | -0.036 |
asses | -0.036 |
offending | -0.035 |
routed | -0.034 |
ingle | -0.034 |
Token | Action |
Token ID | 7561 |
Feature activation | +9.54e-01 |
Pos logit contributions | |
augmented | +1.216 |
asses | +1.207 |
offending | +1.153 |
ingle | +1.124 |
routed | +1.082 |
Neg logit contributions | |
ulia | -2.535 |
cott | -2.489 |
icas | -2.309 |
tsky | -2.254 |
doms | -2.212 |
Token | Now |
Token ID | 2735 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
augmented | +2.110 |
asses | +2.106 |
offending | +2.035 |
ingle | +2.028 |
routed | +1.953 |
Neg logit contributions | |
ulia | -2.761 |
cott | -2.678 |
icas | -2.473 |
tsky | -2.383 |
doms | -2.334 |
Token | and |
Token ID | 290 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
augmented | +3.514 |
asses | +3.410 |
offending | +3.346 |
ingle | +3.300 |
routed | +3.217 |
Neg logit contributions | |
ulia | -3.847 |
cott | -3.760 |
icas | -3.444 |
tsky | -3.276 |
doms | -3.237 |
Token | we |
Token ID | 356 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
augmented | +0.547 |
asses | +0.545 |
offending | +0.536 |
disse | +0.514 |
ingle | +0.513 |
Neg logit contributions | |
ulia | -0.722 |
cott | -0.717 |
icas | -0.649 |
tsky | -0.632 |
kamp | -0.620 |
Token | � |
Token ID | 447 |
Feature activation | +3.55e-01 |
Pos logit contributions | |
augmented | +0.357 |
asses | +0.352 |
offending | +0.348 |
ingle | +0.338 |
routed | +0.335 |
Neg logit contributions | |
ulia | -0.352 |
cott | -0.347 |
icas | -0.311 |
tsky | -0.301 |
kamp | -0.294 |
Token | � |
Token ID | 247 |
Feature activation | +3.59e-01 |
Pos logit contributions | |
augmented | +0.729 |
asses | +0.716 |
offending | +0.705 |
ingle | +0.678 |
routed | +0.670 |
Neg logit contributions | |
ulia | -1.107 |
cott | -1.090 |
icas | -0.999 |
tsky | -0.972 |
kamp | -0.957 |
Token | ll |
Token ID | 297 |
Feature activation | -1.40e-02 |
Pos logit contributions | |
augmented | +1.034 |
asses | +1.023 |
offending | +1.007 |
ingle | +0.992 |
routed | +0.975 |
Neg logit contributions | |
ulia | -0.813 |
cott | -0.798 |
icas | -0.711 |
tsky | -0.683 |
doms | -0.661 |
Token | Sign |
Token ID | 5865 |
Feature activation | +3.55e-01 |
Pos logit contributions | |
augmented | +1.634 |
asses | +1.620 |
offending | +1.598 |
ingle | +1.580 |
routed | +1.563 |
Neg logit contributions | |
ulia | -0.563 |
cott | -0.545 |
icas | -0.437 |
tsky | -0.401 |
kamp | -0.381 |
Token | up |
Token ID | 510 |
Feature activation | -6.14e-02 |
Pos logit contributions | |
augmented | +0.817 |
asses | +0.800 |
offending | +0.785 |
ingle | +0.766 |
routed | +0.749 |
Neg logit contributions | |
ulia | -1.028 |
cott | -1.006 |
icas | -0.918 |
tsky | -0.892 |
doms | -0.871 |
Token | for |
Token ID | 329 |
Feature activation | +7.01e-02 |
Pos logit contributions | |
ulia | +0.195 |
cott | +0.192 |
icas | +0.175 |
tsky | +0.172 |
kamp | +0.170 |
Neg logit contributions | |
augmented | -0.122 |
asses | -0.120 |
offending | -0.118 |
ingle | -0.114 |
disse | -0.112 |
Token | Take |
Token ID | 7214 |
Feature activation | +6.51e-01 |
Pos logit contributions | |
asses | +0.164 |
offending | +0.163 |
augmented | +0.161 |
routed | +0.154 |
ingle | +0.153 |
Neg logit contributions | |
ulia | -0.193 |
cott | -0.193 |
icas | -0.174 |
tsky | -0.172 |
kamp | -0.167 |
Token | Action |
Token ID | 7561 |
Feature activation | +9.22e-01 |
Pos logit contributions | |
augmented | +1.033 |
asses | +1.028 |
offending | +0.959 |
ingle | +0.947 |
routed | +0.901 |
Neg logit contributions | |
ulia | -2.343 |
cott | -2.291 |
icas | -2.121 |
tsky | -2.082 |
kamp | -2.044 |
Token | Now |
Token ID | 2735 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
augmented | +2.117 |
asses | +2.097 |
offending | +2.063 |
ingle | +2.020 |
routed | +1.969 |
Neg logit contributions | |
ulia | -2.632 |
cott | -2.552 |
icas | -2.330 |
tsky | -2.245 |
kamp | -2.209 |
Token | and |
Token ID | 290 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
augmented | +3.384 |
asses | +3.317 |
ingle | +3.281 |
offending | +3.250 |
routed | +3.170 |
Neg logit contributions | |
ulia | -3.982 |
cott | -3.835 |
icas | -3.525 |
tsky | -3.361 |
kamp | -3.272 |
Token | we |
Token ID | 356 |
Feature activation | +8.68e-02 |
Pos logit contributions | |
augmented | +0.423 |
asses | +0.418 |
offending | +0.408 |
ingle | +0.394 |
routed | +0.389 |
Neg logit contributions | |
ulia | -0.617 |
cott | -0.609 |
icas | -0.558 |
tsky | -0.542 |
kamp | -0.533 |
Token | � |
Token ID | 447 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
augmented | +0.162 |
asses | +0.159 |
offending | +0.156 |
ingle | +0.148 |
routed | +0.146 |
Neg logit contributions | |
ulia | -0.288 |
cott | -0.283 |
icas | -0.262 |
tsky | -0.255 |
kamp | -0.251 |
Token | � |
Token ID | 247 |
Feature activation | +3.33e-01 |
Pos logit contributions | |
augmented | +0.502 |
asses | +0.495 |
offending | +0.488 |
ingle | +0.468 |
disse | +0.466 |
Neg logit contributions | |
ulia | -0.689 |
cott | -0.677 |
icas | -0.619 |
tsky | -0.602 |
kamp | -0.595 |
Token | ll |
Token ID | 297 |
Feature activation | +6.15e-02 |
Pos logit contributions | |
augmented | +0.646 |
asses | +0.634 |
offending | +0.622 |
ingle | +0.600 |
routed | +0.591 |
Neg logit contributions | |
ulia | -1.073 |
cott | -1.059 |
icas | -0.975 |
tsky | -0.950 |
kamp | -0.932 |
Token | Sign |
Token ID | 5865 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
augmented | +0.457 |
asses | +0.449 |
offending | +0.448 |
ingle | +0.438 |
routed | +0.432 |
Neg logit contributions | |
ulia | -0.253 |
cott | -0.250 |
icas | -0.220 |
tsky | -0.206 |
doms | -0.201 |
Token | up |
Token ID | 510 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
augmented | +0.781 |
offending | +0.758 |
asses | +0.749 |
ingle | +0.731 |
routed | +0.700 |
Neg logit contributions | |
ulia | -1.072 |
cott | -1.053 |
icas | -0.963 |
tsky | -0.940 |
doms | -0.911 |
Token | for |
Token ID | 329 |
Feature activation | -9.30e-02 |
Pos logit contributions | |
augmented | +0.258 |
asses | +0.252 |
offending | +0.251 |
ingle | +0.239 |
routed | +0.237 |
Neg logit contributions | |
ulia | -0.464 |
cott | -0.461 |
icas | -0.426 |
tsky | -0.412 |
doms | -0.404 |
Token | Take |
Token ID | 7214 |
Feature activation | +7.36e-01 |
Pos logit contributions | |
ulia | +0.287 |
cott | +0.283 |
icas | +0.259 |
tsky | +0.253 |
kamp | +0.247 |
Neg logit contributions | |
augmented | -0.194 |
asses | -0.191 |
offending | -0.188 |
ingle | -0.182 |
routed | -0.178 |
Token | Action |
Token ID | 7561 |
Feature activation | +8.69e-01 |
Pos logit contributions | |
augmented | +1.231 |
asses | +1.222 |
offending | +1.166 |
ingle | +1.137 |
routed | +1.093 |
Neg logit contributions | |
ulia | -2.573 |
cott | -2.529 |
icas | -2.341 |
tsky | -2.291 |
kamp | -2.251 |
Token | Now |
Token ID | 2735 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
augmented | +1.961 |
asses | +1.940 |
offending | +1.913 |
ingle | +1.870 |
routed | +1.828 |
Neg logit contributions | |
ulia | -2.502 |
cott | -2.437 |
icas | -2.225 |
tsky | -2.157 |
doms | -2.107 |
Token | and |
Token ID | 290 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
augmented | +3.237 |
offending | +3.190 |
asses | +3.186 |
ingle | +3.138 |
routed | +3.022 |
Neg logit contributions | |
ulia | -4.033 |
cott | -3.899 |
icas | -3.619 |
tsky | -3.456 |
doms | -3.373 |
Token | get |
Token ID | 651 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
augmented | +0.573 |
asses | +0.566 |
offending | +0.554 |
ingle | +0.533 |
routed | +0.526 |
Neg logit contributions | |
ulia | -0.877 |
cott | -0.865 |
icas | -0.793 |
tsky | -0.770 |
kamp | -0.757 |
Token | three |
Token ID | 1115 |
Feature activation | +4.79e-03 |
Pos logit contributions | |
augmented | +0.293 |
asses | +0.285 |
offending | +0.280 |
ingle | +0.266 |
routed | +0.262 |
Neg logit contributions | |
ulia | -0.676 |
cott | -0.668 |
icas | -0.620 |
tsky | -0.606 |
kamp | -0.597 |
Token | actions |
Token ID | 4028 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
augmented | +0.010 |
asses | +0.010 |
offending | +0.010 |
ingle | +0.009 |
routed | +0.009 |
Neg logit contributions | |
ulia | -0.015 |
cott | -0.015 |
icas | -0.013 |
tsky | -0.013 |
kamp | -0.013 |
Token | in |
Token ID | 287 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
augmented | +0.610 |
asses | +0.606 |
offending | +0.598 |
ingle | +0.577 |
routed | +0.573 |
Neg logit contributions | |
ulia | -0.625 |
cott | -0.615 |
icas | -0.552 |
tsky | -0.534 |
kamp | -0.523 |
Token | � |
Token ID | 447 |
Feature activation | +4.59e-01 |
Pos logit contributions | |
augmented | +0.394 |
asses | +0.384 |
offending | +0.383 |
ingle | +0.370 |
routed | +0.367 |
Neg logit contributions | |
ulia | -0.435 |
cott | -0.422 |
icas | -0.387 |
tsky | -0.371 |
kamp | -0.365 |
Token | � |
Token ID | 247 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
augmented | +0.906 |
asses | +0.887 |
offending | +0.871 |
ingle | +0.843 |
routed | +0.832 |
Neg logit contributions | |
ulia | -1.464 |
cott | -1.449 |
icas | -1.328 |
tsky | -1.298 |
kamp | -1.268 |
Token | s |
Token ID | 82 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
augmented | +0.497 |
asses | +0.492 |
offending | +0.486 |
ingle | +0.474 |
routed | +0.462 |
Neg logit contributions | |
ulia | -0.563 |
cott | -0.544 |
icas | -0.502 |
tsky | -0.481 |
doms | -0.473 |
Token | US |
Token ID | 1294 |
Feature activation | -4.37e-01 |
Pos logit contributions | |
augmented | +0.325 |
offending | +0.317 |
asses | +0.316 |
ingle | +0.301 |
routed | +0.300 |
Neg logit contributions | |
ulia | -0.418 |
cott | -0.407 |
icas | -0.374 |
tsky | -0.363 |
doms | -0.356 |
Token | Cons |
Token ID | 3515 |
Feature activation | -1.48e-01 |
Pos logit contributions | |
ulia | +1.294 |
cott | +1.270 |
icas | +1.160 |
tsky | +1.129 |
kamp | +1.105 |
Neg logit contributions | |
augmented | -0.972 |
asses | -0.955 |
offending | -0.942 |
ingle | -0.909 |
routed | -0.900 |
Token | ulate |
Token ID | 5039 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
ulia | +0.436 |
cott | +0.420 |
icas | +0.391 |
tsky | +0.383 |
doms | +0.375 |
Neg logit contributions | |
asses | -0.325 |
augmented | -0.324 |
offending | -0.310 |
ingle | -0.307 |
routed | -0.297 |
Token | to |
Token ID | 284 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
augmented | +3.093 |
offending | +2.988 |
asses | +2.956 |
ingle | +2.858 |
routed | +2.820 |
Neg logit contributions | |
ulia | -4.191 |
cott | -4.017 |
icas | -3.791 |
doms | -3.580 |
tsky | -3.563 |
Token | protest |
Token ID | 5402 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
ulia | +0.326 |
cott | +0.322 |
icas | +0.291 |
tsky | +0.282 |
kamp | +0.276 |
Neg logit contributions | |
augmented | -0.286 |
asses | -0.282 |
offending | -0.278 |
ingle | -0.270 |
routed | -0.267 |
Token | Trump |
Token ID | 1301 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
augmented | +0.347 |
asses | +0.340 |
offending | +0.338 |
ingle | +0.326 |
routed | +0.322 |
Neg logit contributions | |
ulia | -0.398 |
cott | -0.390 |
icas | -0.355 |
tsky | -0.343 |
kamp | -0.335 |
Token | � |
Token ID | 447 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
augmented | +0.439 |
asses | +0.433 |
offending | +0.430 |
ingle | +0.412 |
routed | +0.409 |
Neg logit contributions | |
ulia | -0.486 |
cott | -0.471 |
icas | -0.430 |
tsky | -0.417 |
kamp | -0.404 |
Token | � |
Token ID | 247 |
Feature activation | +5.13e-02 |
Pos logit contributions | |
augmented | +0.367 |
asses | +0.361 |
offending | +0.355 |
ingle | +0.342 |
routed | +0.337 |
Neg logit contributions | |
ulia | -0.548 |
cott | -0.541 |
icas | -0.495 |
tsky | -0.481 |
kamp | -0.474 |
Token | supreme |
Token ID | 17700 |
Feature activation | +5.11e-02 |
Pos logit contributions | |
ulia | +0.382 |
cott | +0.376 |
icas | +0.344 |
tsky | +0.334 |
kamp | +0.328 |
Neg logit contributions | |
augmented | -0.256 |
asses | -0.251 |
offending | -0.248 |
ingle | -0.237 |
routed | -0.235 |
Token | leader |
Token ID | 3554 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
augmented | +0.089 |
asses | +0.086 |
offending | +0.085 |
ingle | +0.081 |
routed | +0.080 |
Neg logit contributions | |
ulia | -0.178 |
cott | -0.175 |
icas | -0.161 |
tsky | -0.157 |
kamp | -0.155 |
Token | of |
Token ID | 286 |
Feature activation | +3.56e-02 |
Pos logit contributions | |
ulia | +0.363 |
cott | +0.355 |
icas | +0.324 |
tsky | +0.314 |
kamp | +0.308 |
Neg logit contributions | |
augmented | -0.255 |
asses | -0.250 |
offending | -0.247 |
ingle | -0.236 |
routed | -0.235 |
Token | North |
Token ID | 2258 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
augmented | +0.090 |
asses | +0.089 |
offending | +0.088 |
ingle | +0.084 |
routed | +0.084 |
Neg logit contributions | |
ulia | -0.095 |
cott | -0.093 |
icas | -0.084 |
tsky | -0.081 |
kamp | -0.079 |
Token | Korean |
Token ID | 6983 |
Feature activation | +2.73e-02 |
Pos logit contributions | |
ulia | +0.296 |
cott | +0.289 |
icas | +0.260 |
tsky | +0.253 |
doms | +0.245 |
Neg logit contributions | |
augmented | -0.289 |
asses | -0.286 |
offending | -0.283 |
ingle | -0.272 |
routed | -0.270 |
Token | albeit |
Token ID | 18244 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
augmented | +0.053 |
asses | +0.052 |
offending | +0.051 |
ingle | +0.049 |
routed | +0.049 |
Neg logit contributions | |
ulia | -0.089 |
cott | -0.087 |
icas | -0.080 |
tsky | -0.078 |
kamp | -0.077 |
Token | in |
Token ID | 287 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
augmented | +3.068 |
offending | +2.957 |
asses | +2.950 |
routed | +2.817 |
ingle | +2.770 |
Neg logit contributions | |
ulia | -4.207 |
cott | -4.081 |
icas | -3.700 |
tsky | -3.560 |
kamp | -3.545 |
Token | a |
Token ID | 257 |
Feature activation | +3.26e-02 |
Pos logit contributions | |
ulia | +0.472 |
cott | +0.464 |
icas | +0.420 |
tsky | +0.407 |
kamp | +0.399 |
Neg logit contributions | |
augmented | -0.408 |
asses | -0.402 |
offending | -0.396 |
ingle | -0.384 |
routed | -0.380 |
Token | particularly |
Token ID | 3573 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
augmented | +0.062 |
asses | +0.060 |
offending | +0.059 |
routed | +0.056 |
ingle | +0.056 |
Neg logit contributions | |
ulia | -0.108 |
cott | -0.106 |
icas | -0.097 |
tsky | -0.095 |
kamp | -0.093 |
Token | gore |
Token ID | 46835 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
ulia | +0.713 |
cott | +0.703 |
icas | +0.645 |
tsky | +0.628 |
kamp | +0.616 |
Neg logit contributions | |
augmented | -0.460 |
asses | -0.452 |
offending | -0.445 |
ingle | -0.428 |
routed | -0.423 |
Token | filled |
Token ID | 5901 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
augmented | +0.723 |
offending | +0.700 |
asses | +0.700 |
routed | +0.658 |
ingle | +0.655 |
Neg logit contributions | |
ulia | -1.032 |
cott | -1.006 |
icas | -0.932 |
tsky | -0.896 |
doms | -0.885 |
Token | a |
Token ID | 257 |
Feature activation | -3.70e-02 |
Pos logit contributions | |
ulia | +0.272 |
cott | +0.269 |
icas | +0.240 |
tsky | +0.232 |
kamp | +0.228 |
Neg logit contributions | |
asses | -0.301 |
augmented | -0.298 |
offending | -0.293 |
ingle | -0.288 |
disse | -0.286 |
Token | robot |
Token ID | 9379 |
Feature activation | -9.55e-02 |
Pos logit contributions | |
ulia | +0.117 |
cott | +0.116 |
icas | +0.106 |
tsky | +0.104 |
kamp | +0.102 |
Neg logit contributions | |
augmented | -0.072 |
asses | -0.072 |
offending | -0.070 |
ingle | -0.069 |
routed | -0.067 |
Token | by |
Token ID | 416 |
Feature activation | +2.93e-01 |
Pos logit contributions | |
ulia | +0.206 |
cott | +0.201 |
icas | +0.177 |
tsky | +0.170 |
kamp | +0.169 |
Neg logit contributions | |
asses | -0.283 |
augmented | -0.283 |
offending | -0.281 |
ingle | -0.274 |
disse | -0.270 |
Token | clicking |
Token ID | 12264 |
Feature activation | -5.12e-02 |
Pos logit contributions | |
augmented | +0.986 |
asses | +0.978 |
offending | +0.971 |
ingle | +0.948 |
routed | +0.948 |
Neg logit contributions | |
ulia | -0.521 |
cott | -0.501 |
icas | -0.425 |
tsky | -0.411 |
kamp | -0.393 |
Token | the |
Token ID | 262 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
ulia | +0.118 |
cott | +0.116 |
icas | +0.103 |
tsky | +0.099 |
kamp | +0.096 |
Neg logit contributions | |
augmented | -0.146 |
asses | -0.144 |
offending | -0.143 |
ingle | -0.139 |
routed | -0.138 |
Token | box |
Token ID | 3091 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
augmented | +0.430 |
asses | +0.428 |
offending | +0.417 |
routed | +0.403 |
ingle | +0.400 |
Neg logit contributions | |
ulia | -0.860 |
cott | -0.853 |
icas | -0.782 |
tsky | -0.773 |
kamp | -0.752 |
Token | . |
Token ID | 13 |
Feature activation | +5.12e-01 |
Pos logit contributions | |
augmented | +3.234 |
asses | +3.186 |
offending | +3.077 |
ingle | +3.042 |
routed | +2.964 |
Neg logit contributions | |
ulia | -3.909 |
cott | -3.833 |
icas | -3.525 |
tsky | -3.384 |
doms | -3.343 |
Token | Invalid |
Token ID | 17665 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
augmented | +1.275 |
asses | +1.251 |
offending | +1.249 |
ingle | +1.205 |
routed | +1.201 |
Neg logit contributions | |
ulia | -1.368 |
cott | -1.357 |
icas | -1.218 |
tsky | -1.180 |
kamp | -1.155 |
Token | email |
Token ID | 3053 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
augmented | +0.382 |
asses | +0.380 |
offending | +0.373 |
ingle | +0.365 |
routed | +0.361 |
Neg logit contributions | |
ulia | -0.402 |
cott | -0.393 |
icas | -0.355 |
tsky | -0.341 |
kamp | -0.335 |
Token | address |
Token ID | 2209 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
augmented | +0.497 |
asses | +0.489 |
offending | +0.477 |
ingle | +0.456 |
routed | +0.448 |
Neg logit contributions | |
ulia | -1.142 |
cott | -1.127 |
icas | -1.046 |
tsky | -1.021 |
kamp | -1.007 |
Token | . |
Token ID | 13 |
Feature activation | +6.81e-01 |
Pos logit contributions | |
augmented | +0.386 |
asses | +0.380 |
offending | +0.379 |
ingle | +0.364 |
disse | +0.363 |
Neg logit contributions | |
ulia | -0.382 |
cott | -0.377 |
icas | -0.337 |
tsky | -0.326 |
kamp | -0.321 |
Token | a |
Token ID | 257 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
ulia | +0.373 |
cott | +0.369 |
icas | +0.328 |
tsky | +0.319 |
kamp | +0.313 |
Neg logit contributions | |
asses | -0.421 |
augmented | -0.417 |
offending | -0.410 |
ingle | -0.403 |
disse | -0.401 |
Token | robot |
Token ID | 9379 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
ulia | +0.316 |
cott | +0.313 |
icas | +0.286 |
tsky | +0.283 |
kamp | +0.276 |
Neg logit contributions | |
asses | -0.201 |
augmented | -0.200 |
offending | -0.195 |
ingle | -0.191 |
routed | -0.188 |
Token | by |
Token ID | 416 |
Feature activation | +2.92e-01 |
Pos logit contributions | |
ulia | +0.326 |
cott | +0.318 |
icas | +0.280 |
tsky | +0.269 |
kamp | +0.268 |
Neg logit contributions | |
asses | -0.450 |
augmented | -0.448 |
offending | -0.446 |
ingle | -0.434 |
disse | -0.429 |
Token | clicking |
Token ID | 12264 |
Feature activation | -9.74e-02 |
Pos logit contributions | |
augmented | +0.983 |
asses | +0.975 |
offending | +0.968 |
ingle | +0.946 |
routed | +0.945 |
Neg logit contributions | |
ulia | -0.518 |
cott | -0.497 |
icas | -0.423 |
tsky | -0.408 |
kamp | -0.389 |
Token | the |
Token ID | 262 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
ulia | +0.223 |
cott | +0.220 |
icas | +0.194 |
tsky | +0.187 |
kamp | +0.181 |
Neg logit contributions | |
augmented | -0.279 |
asses | -0.276 |
offending | -0.274 |
ingle | -0.266 |
routed | -0.265 |
Token | box |
Token ID | 3091 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
augmented | +0.338 |
asses | +0.335 |
offending | +0.327 |
routed | +0.315 |
ingle | +0.314 |
Neg logit contributions | |
ulia | -0.682 |
cott | -0.676 |
icas | -0.621 |
tsky | -0.613 |
kamp | -0.597 |
Token | . |
Token ID | 13 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
augmented | +3.208 |
asses | +3.155 |
offending | +3.052 |
ingle | +3.015 |
routed | +2.942 |
Neg logit contributions | |
ulia | -3.870 |
cott | -3.795 |
icas | -3.491 |
tsky | -3.350 |
doms | -3.312 |
Token | Invalid |
Token ID | 17665 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
augmented | +1.075 |
asses | +1.056 |
offending | +1.051 |
ingle | +1.015 |
routed | +1.010 |
Neg logit contributions | |
ulia | -1.167 |
cott | -1.157 |
icas | -1.039 |
tsky | -1.007 |
kamp | -0.986 |
Token | email |
Token ID | 3053 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
augmented | +0.342 |
asses | +0.341 |
offending | +0.335 |
ingle | +0.327 |
routed | +0.325 |
Neg logit contributions | |
ulia | -0.357 |
cott | -0.349 |
icas | -0.315 |
tsky | -0.303 |
kamp | -0.297 |
Token | address |
Token ID | 2209 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
augmented | +0.397 |
asses | +0.391 |
offending | +0.382 |
ingle | +0.364 |
routed | +0.358 |
Neg logit contributions | |
ulia | -0.904 |
cott | -0.892 |
icas | -0.828 |
tsky | -0.807 |
kamp | -0.797 |
Token | . |
Token ID | 13 |
Feature activation | +6.13e-01 |
Pos logit contributions | |
augmented | +0.291 |
offending | +0.286 |
asses | +0.286 |
disse | +0.274 |
ingle | +0.274 |
Neg logit contributions | |
ulia | -0.284 |
cott | -0.279 |
icas | -0.249 |
tsky | -0.242 |
kamp | -0.238 |
Token | a |
Token ID | 257 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
ulia | +0.398 |
cott | +0.393 |
icas | +0.351 |
tsky | +0.339 |
kamp | +0.333 |
Neg logit contributions | |
asses | -0.447 |
augmented | -0.443 |
offending | -0.436 |
ingle | -0.427 |
disse | -0.425 |
Token | robot |
Token ID | 9379 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
ulia | +0.411 |
cott | +0.407 |
icas | +0.372 |
tsky | +0.367 |
kamp | +0.359 |
Neg logit contributions | |
asses | -0.261 |
augmented | -0.261 |
offending | -0.254 |
ingle | -0.248 |
routed | -0.244 |
Token | by |
Token ID | 416 |
Feature activation | +2.56e-01 |
Pos logit contributions | |
ulia | +0.471 |
cott | +0.458 |
icas | +0.404 |
kamp | +0.388 |
tsky | +0.387 |
Neg logit contributions | |
asses | -0.666 |
augmented | -0.663 |
offending | -0.660 |
ingle | -0.643 |
disse | -0.635 |
Token | clicking |
Token ID | 12264 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
augmented | +0.863 |
asses | +0.857 |
offending | +0.851 |
routed | +0.831 |
ingle | +0.831 |
Neg logit contributions | |
ulia | -0.451 |
cott | -0.434 |
icas | -0.368 |
tsky | -0.357 |
kamp | -0.339 |
Token | the |
Token ID | 262 |
Feature activation | +2.05e-01 |
Pos logit contributions | |
ulia | +0.024 |
cott | +0.024 |
icas | +0.021 |
tsky | +0.020 |
kamp | +0.020 |
Neg logit contributions | |
augmented | -0.030 |
asses | -0.030 |
offending | -0.029 |
ingle | -0.029 |
routed | -0.028 |
Token | box |
Token ID | 3091 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
augmented | +0.352 |
asses | +0.351 |
offending | +0.342 |
routed | +0.331 |
ingle | +0.328 |
Neg logit contributions | |
ulia | -0.697 |
cott | -0.691 |
icas | -0.635 |
tsky | -0.627 |
kamp | -0.610 |
Token | . |
Token ID | 13 |
Feature activation | +4.78e-01 |
Pos logit contributions | |
augmented | +3.192 |
asses | +3.141 |
offending | +3.042 |
ingle | +3.003 |
routed | +2.928 |
Neg logit contributions | |
ulia | -3.816 |
cott | -3.741 |
icas | -3.437 |
tsky | -3.304 |
doms | -3.256 |
Token | Invalid |
Token ID | 17665 |
Feature activation | +2.02e-01 |
Pos logit contributions | |
augmented | +1.203 |
asses | +1.183 |
offending | +1.180 |
ingle | +1.139 |
routed | +1.136 |
Neg logit contributions | |
ulia | -1.262 |
cott | -1.255 |
icas | -1.123 |
tsky | -1.088 |
kamp | -1.065 |
Token | email |
Token ID | 3053 |
Feature activation | +3.33e-01 |
Pos logit contributions | |
augmented | +0.505 |
asses | +0.503 |
offending | +0.495 |
ingle | +0.482 |
routed | +0.478 |
Neg logit contributions | |
ulia | -0.532 |
cott | -0.521 |
icas | -0.470 |
tsky | -0.452 |
kamp | -0.444 |
Token | address |
Token ID | 2209 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
augmented | +0.524 |
asses | +0.516 |
offending | +0.503 |
ingle | +0.480 |
routed | +0.473 |
Neg logit contributions | |
ulia | -1.195 |
cott | -1.180 |
icas | -1.095 |
tsky | -1.068 |
kamp | -1.054 |
Token | . |
Token ID | 13 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
augmented | +0.342 |
offending | +0.337 |
asses | +0.336 |
disse | +0.322 |
ingle | +0.322 |
Neg logit contributions | |
ulia | -0.335 |
cott | -0.331 |
icas | -0.295 |
tsky | -0.286 |
kamp | -0.281 |
Token | 2012 |
Token ID | 2321 |
Feature activation | +6.95e-01 |
Pos logit contributions | |
augmented | +1.178 |
asses | +1.155 |
offending | +1.124 |
ingle | +1.083 |
routed | +1.061 |
Neg logit contributions | |
ulia | -2.215 |
cott | -2.190 |
icas | -2.024 |
tsky | -1.976 |
kamp | -1.934 |
Token | United |
Token ID | 1578 |
Feature activation | -2.75e-01 |
Pos logit contributions | |
augmented | +1.593 |
asses | +1.567 |
offending | +1.532 |
ingle | +1.498 |
routed | +1.473 |
Neg logit contributions | |
ulia | -1.994 |
cott | -1.961 |
icas | -1.791 |
tsky | -1.732 |
doms | -1.701 |
Token | States |
Token ID | 1829 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
ulia | +0.628 |
cott | +0.616 |
icas | +0.543 |
tsky | +0.527 |
kamp | +0.508 |
Neg logit contributions | |
augmented | -0.798 |
asses | -0.785 |
offending | -0.775 |
ingle | -0.757 |
routed | -0.753 |
Token | 3 |
Token ID | 513 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
augmented | +0.030 |
asses | +0.029 |
offending | +0.029 |
ingle | +0.028 |
routed | +0.027 |
Neg logit contributions | |
ulia | -0.053 |
cott | -0.052 |
icas | -0.048 |
tsky | -0.047 |
kamp | -0.046 |
Token | 240 |
Token ID | 16102 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
augmented | +0.557 |
asses | +0.543 |
offending | +0.533 |
ingle | +0.512 |
routed | +0.503 |
Neg logit contributions | |
ulia | -1.073 |
cott | -1.059 |
icas | -0.978 |
tsky | -0.957 |
kamp | -0.936 |
Token | Posts |
Token ID | 12043 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
augmented | +0.798 |
asses | +0.782 |
offending | +0.774 |
ingle | +0.734 |
routed | +0.729 |
Neg logit contributions | |
ulia | -1.506 |
cott | -1.485 |
icas | -1.369 |
tsky | -1.330 |
kamp | -1.323 |
Token | # |
Token ID | 1303 |
Feature activation | -9.07e-01 |
Pos logit contributions | |
ulia | +3.117 |
cott | +3.058 |
icas | +2.606 |
tsky | +2.456 |
kamp | +2.423 |
Neg logit contributions | |
augmented | -5.439 |
asses | -5.426 |
offending | -5.330 |
ingle | -5.259 |
routed | -5.172 |
Token | 10 |
Token ID | 940 |
Feature activation | +7.58e-01 |
Pos logit contributions | |
ulia | +2.929 |
cott | +2.920 |
icas | +2.653 |
tsky | +2.581 |
kamp | +2.567 |
Neg logit contributions | |
offending | -1.716 |
augmented | -1.715 |
asses | -1.695 |
disse | -1.623 |
routed | -1.602 |
Token | Happy |
Token ID | 14628 |
Feature activation | +7.73e-01 |
Pos logit contributions | |
augmented | +1.852 |
asses | +1.812 |
offending | +1.793 |
routed | +1.735 |
ingle | +1.731 |
Neg logit contributions | |
ulia | -2.046 |
cott | -2.007 |
icas | -1.847 |
tsky | -1.770 |
doms | -1.735 |
Token | it |
Token ID | 340 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
augmented | +1.770 |
asses | +1.737 |
offending | +1.731 |
ingle | +1.662 |
routed | +1.654 |
Neg logit contributions | |
ulia | -2.235 |
cott | -2.187 |
icas | -1.992 |
tsky | -1.924 |
kamp | -1.896 |
Token | worked |
Token ID | 3111 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
augmented | +0.294 |
asses | +0.290 |
offending | +0.286 |
ingle | +0.278 |
routed | +0.276 |
Neg logit contributions | |
ulia | -0.316 |
cott | -0.310 |
icas | -0.281 |
tsky | -0.272 |
kamp | -0.265 |
Token | 2012 |
Token ID | 2321 |
Feature activation | +6.34e-01 |
Pos logit contributions | |
augmented | +0.854 |
asses | +0.835 |
offending | +0.828 |
ingle | +0.790 |
routed | +0.786 |
Neg logit contributions | |
ulia | -1.489 |
cott | -1.469 |
icas | -1.348 |
tsky | -1.313 |
kamp | -1.303 |
Token | United |
Token ID | 1578 |
Feature activation | -3.07e-01 |
Pos logit contributions | |
augmented | +1.476 |
asses | +1.453 |
offending | +1.422 |
ingle | +1.388 |
routed | +1.367 |
Neg logit contributions | |
ulia | -1.798 |
cott | -1.768 |
icas | -1.612 |
tsky | -1.564 |
doms | -1.531 |
Token | States |
Token ID | 1829 |
Feature activation | -9.19e-02 |
Pos logit contributions | |
ulia | +0.703 |
cott | +0.689 |
icas | +0.607 |
tsky | +0.592 |
kamp | +0.570 |
Neg logit contributions | |
augmented | -0.887 |
asses | -0.876 |
offending | -0.864 |
ingle | -0.844 |
routed | -0.837 |
Token | 5 |
Token ID | 642 |
Feature activation | +3.43e-01 |
Pos logit contributions | |
ulia | +0.299 |
cott | +0.296 |
icas | +0.272 |
tsky | +0.265 |
kamp | +0.261 |
Neg logit contributions | |
augmented | -0.175 |
asses | -0.173 |
offending | -0.170 |
ingle | -0.163 |
routed | -0.161 |
Token | 667 |
Token ID | 28933 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
augmented | +0.679 |
asses | +0.666 |
offending | +0.652 |
ingle | +0.632 |
routed | +0.620 |
Neg logit contributions | |
ulia | -1.092 |
cott | -1.077 |
icas | -0.991 |
tsky | -0.967 |
kamp | -0.945 |
Token | Posts |
Token ID | 12043 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
augmented | +0.288 |
offending | +0.284 |
asses | +0.283 |
ingle | +0.268 |
routed | +0.266 |
Neg logit contributions | |
ulia | -0.511 |
cott | -0.506 |
icas | -0.464 |
tsky | -0.451 |
kamp | -0.451 |
Token | # |
Token ID | 1303 |
Feature activation | -7.99e-01 |
Pos logit contributions | |
ulia | +3.030 |
cott | +2.964 |
icas | +2.558 |
tsky | +2.410 |
kamp | +2.361 |
Neg logit contributions | |
augmented | -5.062 |
asses | -5.047 |
offending | -4.956 |
ingle | -4.879 |
routed | -4.804 |
Token | 12 |
Token ID | 1065 |
Feature activation | +6.90e-01 |
Pos logit contributions | |
ulia | +2.539 |
cott | +2.510 |
icas | +2.282 |
tsky | +2.235 |
kamp | +2.221 |
Neg logit contributions | |
offending | -1.559 |
augmented | -1.558 |
asses | -1.499 |
disse | -1.490 |
routed | -1.454 |
Token | I |
Token ID | 314 |
Feature activation | -9.64e-02 |
Pos logit contributions | |
augmented | +1.670 |
asses | +1.609 |
offending | +1.607 |
routed | +1.557 |
ingle | +1.547 |
Neg logit contributions | |
ulia | -1.899 |
cott | -1.873 |
icas | -1.715 |
tsky | -1.649 |
kamp | -1.626 |
Token | 'm |
Token ID | 1101 |
Feature activation | -7.60e-02 |
Pos logit contributions | |
ulia | +0.275 |
cott | +0.271 |
icas | +0.246 |
tsky | +0.239 |
kamp | +0.234 |
Neg logit contributions | |
augmented | -0.223 |
asses | -0.220 |
offending | -0.216 |
ingle | -0.210 |
routed | -0.207 |
Token | glad |
Token ID | 9675 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
ulia | +0.221 |
cott | +0.218 |
icas | +0.198 |
tsky | +0.193 |
kamp | +0.189 |
Neg logit contributions | |
augmented | -0.172 |
asses | -0.169 |
offending | -0.167 |
ingle | -0.161 |
routed | -0.160 |
Token | 2002 |
Token ID | 6244 |
Feature activation | +5.85e-01 |
Pos logit contributions | |
augmented | +0.895 |
asses | +0.877 |
offending | +0.872 |
ingle | +0.836 |
routed | +0.828 |
Neg logit contributions | |
ulia | -1.531 |
cott | -1.513 |
icas | -1.383 |
tsky | -1.344 |
kamp | -1.338 |
Token | United |
Token ID | 1578 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
augmented | +1.374 |
asses | +1.354 |
offending | +1.326 |
ingle | +1.291 |
routed | +1.276 |
Neg logit contributions | |
ulia | -1.645 |
cott | -1.621 |
icas | -1.477 |
tsky | -1.431 |
doms | -1.400 |
Token | States |
Token ID | 1829 |
Feature activation | -2.31e-02 |
Pos logit contributions | |
ulia | +0.548 |
cott | +0.539 |
icas | +0.474 |
tsky | +0.462 |
kamp | +0.444 |
Neg logit contributions | |
augmented | -0.697 |
asses | -0.688 |
offending | -0.679 |
ingle | -0.662 |
routed | -0.658 |
Token | 3 |
Token ID | 513 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
ulia | +0.075 |
cott | +0.074 |
icas | +0.068 |
tsky | +0.066 |
kamp | +0.065 |
Neg logit contributions | |
augmented | -0.044 |
asses | -0.044 |
offending | -0.043 |
ingle | -0.041 |
routed | -0.041 |
Token | 472 |
Token ID | 37856 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
augmented | +0.277 |
asses | +0.272 |
offending | +0.267 |
ingle | +0.257 |
routed | +0.254 |
Neg logit contributions | |
ulia | -0.437 |
cott | -0.431 |
icas | -0.396 |
tsky | -0.386 |
kamp | -0.378 |
Token | Posts |
Token ID | 12043 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
augmented | +0.439 |
offending | +0.435 |
asses | +0.428 |
routed | +0.408 |
ingle | +0.408 |
Neg logit contributions | |
ulia | -0.768 |
cott | -0.754 |
icas | -0.694 |
tsky | -0.674 |
kamp | -0.673 |
Token | # |
Token ID | 1303 |
Feature activation | -7.75e-01 |
Pos logit contributions | |
ulia | +3.014 |
cott | +2.943 |
icas | +2.537 |
tsky | +2.400 |
kamp | +2.349 |
Neg logit contributions | |
augmented | -5.052 |
asses | -5.049 |
offending | -4.945 |
ingle | -4.880 |
routed | -4.800 |
Token | 11 |
Token ID | 1157 |
Feature activation | +7.59e-01 |
Pos logit contributions | |
cott | +2.454 |
ulia | +2.380 |
icas | +2.184 |
tsky | +2.166 |
kamp | +2.112 |
Neg logit contributions | |
disse | -1.562 |
offending | -1.541 |
augmented | -1.523 |
routed | -1.448 |
asses | -1.420 |
Token | On |
Token ID | 1550 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
augmented | +1.872 |
asses | +1.811 |
offending | +1.805 |
routed | +1.753 |
ingle | +1.748 |
Neg logit contributions | |
ulia | -2.049 |
cott | -2.011 |
icas | -1.842 |
tsky | -1.768 |
kamp | -1.742 |
Token | September |
Token ID | 2693 |
Feature activation | +5.68e-01 |
Pos logit contributions | |
ulia | +0.268 |
cott | +0.266 |
icas | +0.232 |
tsky | +0.223 |
kamp | +0.216 |
Neg logit contributions | |
augmented | -0.389 |
asses | -0.382 |
offending | -0.380 |
ingle | -0.368 |
routed | -0.367 |
Token | 20 |
Token ID | 1160 |
Feature activation | +3.98e-01 |
Pos logit contributions | |
augmented | +0.957 |
asses | +0.936 |
offending | +0.922 |
ingle | +0.880 |
routed | +0.866 |
Neg logit contributions | |
ulia | -1.980 |
cott | -1.957 |
icas | -1.810 |
tsky | -1.769 |
kamp | -1.742 |
Token | pak |
Token ID | 41091 |
Feature activation | -5.79e-02 |
Pos logit contributions | |
ulia | +1.326 |
cott | +1.313 |
icas | +1.227 |
tsky | +1.202 |
kamp | +1.185 |
Neg logit contributions | |
augmented | -0.398 |
asses | -0.386 |
offending | -0.375 |
ingle | -0.352 |
routed | -0.343 |
Token | 's |
Token ID | 338 |
Feature activation | -4.02e-02 |
Pos logit contributions | |
ulia | +0.158 |
cott | +0.155 |
icas | +0.141 |
tsky | +0.136 |
kamp | +0.134 |
Neg logit contributions | |
augmented | -0.141 |
asses | -0.139 |
offending | -0.137 |
ingle | -0.133 |
routed | -0.132 |
Token | website |
Token ID | 3052 |
Feature activation | +4.67e-02 |
Pos logit contributions | |
ulia | +0.127 |
cott | +0.125 |
icas | +0.115 |
tsky | +0.112 |
kamp | +0.110 |
Neg logit contributions | |
augmented | -0.080 |
asses | -0.080 |
offending | -0.078 |
ingle | -0.075 |
routed | -0.074 |
Token | offers |
Token ID | 4394 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
augmented | +0.113 |
asses | +0.111 |
offending | +0.109 |
ingle | +0.106 |
routed | +0.105 |
Neg logit contributions | |
ulia | -0.129 |
cott | -0.127 |
icas | -0.115 |
tsky | -0.111 |
kamp | -0.109 |
Token | the |
Token ID | 262 |
Feature activation | -4.16e-01 |
Pos logit contributions | |
ulia | +0.568 |
cott | +0.560 |
icas | +0.509 |
tsky | +0.493 |
kamp | +0.482 |
Neg logit contributions | |
augmented | -0.471 |
asses | -0.465 |
offending | -0.458 |
ingle | -0.444 |
routed | -0.439 |
Token | following |
Token ID | 1708 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
ulia | +1.258 |
cott | +1.245 |
icas | +1.136 |
tsky | +1.102 |
kamp | +1.082 |
Neg logit contributions | |
asses | -0.872 |
augmented | -0.869 |
offending | -0.841 |
ingle | -0.826 |
routed | -0.808 |
Token | description |
Token ID | 6764 |
Feature activation | -1.91e-01 |
Pos logit contributions | |
ulia | +4.443 |
cott | +4.431 |
icas | +4.068 |
tsky | +3.952 |
kamp | +3.808 |
Neg logit contributions | |
asses | -3.243 |
augmented | -3.109 |
offending | -3.072 |
ingle | -3.042 |
routed | -2.927 |
Token | of |
Token ID | 286 |
Feature activation | -6.33e-02 |
Pos logit contributions | |
ulia | +0.544 |
cott | +0.536 |
icas | +0.487 |
tsky | +0.472 |
kamp | +0.463 |
Neg logit contributions | |
augmented | -0.447 |
asses | -0.439 |
offending | -0.433 |
ingle | -0.420 |
routed | -0.415 |
Token | their |
Token ID | 511 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
ulia | +0.184 |
cott | +0.181 |
icas | +0.165 |
tsky | +0.160 |
kamp | +0.157 |
Neg logit contributions | |
augmented | -0.144 |
asses | -0.141 |
offending | -0.139 |
ingle | -0.135 |
routed | -0.133 |
Token | competing |
Token ID | 11780 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
ulia | +0.553 |
cott | +0.548 |
icas | +0.505 |
tsky | +0.490 |
kamp | +0.484 |
Neg logit contributions | |
asses | -0.315 |
augmented | -0.314 |
offending | -0.304 |
ingle | -0.297 |
routed | -0.290 |
Token | technology |
Token ID | 3037 |
Feature activation | -2.88e-02 |
Pos logit contributions | |
augmented | +0.332 |
asses | +0.326 |
offending | +0.320 |
ingle | +0.308 |
routed | +0.304 |
Neg logit contributions | |
ulia | -0.558 |
cott | -0.552 |
icas | -0.507 |
tsky | -0.494 |
kamp | -0.486 |
Token | 2010 |
Token ID | 3050 |
Feature activation | +7.32e-01 |
Pos logit contributions | |
augmented | +1.014 |
asses | +0.994 |
offending | +0.977 |
ingle | +0.938 |
routed | +0.925 |
Neg logit contributions | |
ulia | -1.813 |
cott | -1.792 |
icas | -1.650 |
tsky | -1.609 |
kamp | -1.582 |
Token | United |
Token ID | 1578 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
augmented | +1.684 |
asses | +1.657 |
offending | +1.616 |
ingle | +1.575 |
routed | +1.553 |
Neg logit contributions | |
ulia | -2.095 |
cott | -2.060 |
icas | -1.880 |
tsky | -1.823 |
doms | -1.792 |
Token | States |
Token ID | 1829 |
Feature activation | -5.61e-02 |
Pos logit contributions | |
ulia | +0.639 |
cott | +0.629 |
icas | +0.553 |
tsky | +0.537 |
kamp | +0.519 |
Neg logit contributions | |
augmented | -0.802 |
asses | -0.792 |
offending | -0.780 |
ingle | -0.763 |
routed | -0.756 |
Token | 10 |
Token ID | 838 |
Feature activation | +3.27e-01 |
Pos logit contributions | |
ulia | +0.183 |
cott | +0.181 |
icas | +0.166 |
tsky | +0.162 |
kamp | +0.160 |
Neg logit contributions | |
augmented | -0.107 |
asses | -0.105 |
offending | -0.103 |
ingle | -0.099 |
routed | -0.098 |
Token | 53 |
Token ID | 4310 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
augmented | +0.667 |
asses | +0.655 |
offending | +0.642 |
ingle | +0.621 |
routed | +0.612 |
Neg logit contributions | |
ulia | -1.023 |
cott | -1.010 |
icas | -0.927 |
tsky | -0.903 |
kamp | -0.884 |
Token | Posts |
Token ID | 12043 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
augmented | +0.220 |
offending | +0.215 |
asses | +0.213 |
routed | +0.202 |
ingle | +0.202 |
Neg logit contributions | |
ulia | -0.402 |
cott | -0.398 |
icas | -0.367 |
tsky | -0.357 |
kamp | -0.354 |
Token | # |
Token ID | 1303 |
Feature activation | -8.81e-01 |
Pos logit contributions | |
ulia | +2.876 |
cott | +2.812 |
icas | +2.438 |
tsky | +2.307 |
kamp | +2.254 |
Neg logit contributions | |
augmented | -4.684 |
asses | -4.655 |
offending | -4.582 |
ingle | -4.502 |
routed | -4.442 |
Token | 15 |
Token ID | 1314 |
Feature activation | +5.37e-01 |
Pos logit contributions | |
cott | +2.395 |
ulia | +2.320 |
icas | +2.062 |
tsky | +2.014 |
jar | +1.981 |
Neg logit contributions | |
disse | -2.185 |
offending | -2.183 |
augmented | -2.148 |
��� | -2.146 |
routed | -2.103 |
Token | honestly |
Token ID | 12698 |
Feature activation | -3.08e-01 |
Pos logit contributions | |
augmented | +1.295 |
asses | +1.260 |
offending | +1.250 |
routed | +1.207 |
ingle | +1.206 |
Neg logit contributions | |
ulia | -1.484 |
cott | -1.459 |
icas | -1.333 |
tsky | -1.285 |
kamp | -1.265 |
Token | if |
Token ID | 611 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
ulia | +0.871 |
cott | +0.857 |
icas | +0.779 |
tsky | +0.755 |
kamp | +0.740 |
Neg logit contributions | |
augmented | -0.725 |
asses | -0.713 |
offending | -0.703 |
ingle | -0.680 |
routed | -0.674 |
Token | we |
Token ID | 356 |
Feature activation | -9.63e-02 |
Pos logit contributions | |
ulia | +0.062 |
cott | +0.062 |
icas | +0.056 |
tsky | +0.054 |
kamp | +0.053 |
Neg logit contributions | |
augmented | -0.048 |
asses | -0.047 |
offending | -0.046 |
ingle | -0.044 |
routed | -0.044 |
Token | ( |
Token ID | 357 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
augmented | +0.415 |
asses | +0.403 |
offending | +0.397 |
routed | +0.388 |
ingle | +0.385 |
Neg logit contributions | |
ulia | -0.450 |
cott | -0.432 |
icas | -0.396 |
tsky | -0.382 |
doms | -0.371 |
Token | R |
Token ID | 49 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
ulia | +0.061 |
cott | +0.059 |
icas | +0.053 |
tsky | +0.051 |
kamp | +0.050 |
Neg logit contributions | |
augmented | -0.068 |
asses | -0.067 |
offending | -0.066 |
ingle | -0.065 |
routed | -0.064 |
Token | ) |
Token ID | 8 |
Feature activation | -4.14e-02 |
Pos logit contributions | |
augmented | +0.257 |
asses | +0.253 |
offending | +0.249 |
ingle | +0.243 |
routed | +0.240 |
Neg logit contributions | |
ulia | -0.292 |
cott | -0.288 |
icas | -0.261 |
tsky | -0.254 |
kamp | -0.247 |
Token | took |
Token ID | 1718 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
ulia | +0.114 |
cott | +0.111 |
icas | +0.101 |
tsky | +0.098 |
kamp | +0.095 |
Neg logit contributions | |
augmented | -0.102 |
asses | -0.099 |
offending | -0.098 |
routed | -0.095 |
ingle | -0.095 |
Token | fl |
Token ID | 781 |
Feature activation | -3.86e-02 |
Pos logit contributions | |
augmented | +0.273 |
offending | +0.265 |
asses | +0.265 |
ingle | +0.253 |
routed | +0.253 |
Neg logit contributions | |
ulia | -0.347 |
cott | -0.341 |
icas | -0.312 |
tsky | -0.303 |
kamp | -0.297 |
Token | ak |
Token ID | 461 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
ulia | +0.120 |
cott | +0.118 |
icas | +0.109 |
tsky | +0.106 |
kamp | +0.104 |
Neg logit contributions | |
augmented | -0.079 |
asses | -0.078 |
offending | -0.076 |
ingle | -0.074 |
routed | -0.072 |
Token | from |
Token ID | 422 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
ulia | +4.281 |
cott | +4.267 |
icas | +3.843 |
kamp | +3.757 |
tsky | +3.707 |
Neg logit contributions | |
augmented | -3.085 |
asses | -3.068 |
offending | -2.986 |
ingle | -2.933 |
disse | -2.885 |
Token | both |
Token ID | 1111 |
Feature activation | +3.87e-02 |
Pos logit contributions | |
augmented | +0.453 |
asses | +0.444 |
offending | +0.438 |
ingle | +0.421 |
routed | +0.417 |
Neg logit contributions | |
ulia | -0.673 |
cott | -0.664 |
icas | -0.609 |
tsky | -0.592 |
kamp | -0.581 |
Token | the |
Token ID | 262 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
augmented | +0.087 |
asses | +0.086 |
offending | +0.084 |
ingle | +0.082 |
routed | +0.081 |
Neg logit contributions | |
ulia | -0.113 |
cott | -0.111 |
icas | -0.102 |
tsky | -0.099 |
kamp | -0.097 |
Token | left |
Token ID | 1364 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
ulia | +0.495 |
cott | +0.490 |
icas | +0.450 |
tsky | +0.439 |
kamp | +0.432 |
Neg logit contributions | |
augmented | -0.283 |
asses | -0.278 |
offending | -0.272 |
ingle | -0.263 |
routed | -0.258 |
Token | and |
Token ID | 290 |
Feature activation | -3.79e-02 |
Pos logit contributions | |
augmented | +0.279 |
asses | +0.273 |
offending | +0.269 |
ingle | +0.262 |
routed | +0.260 |
Neg logit contributions | |
ulia | -0.280 |
cott | -0.273 |
icas | -0.249 |
tsky | -0.238 |
doms | -0.233 |
Token | also |
Token ID | 635 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
ulia | +1.087 |
cott | +1.074 |
icas | +0.971 |
tsky | +0.940 |
kamp | +0.921 |
Neg logit contributions | |
augmented | -0.966 |
asses | -0.952 |
offending | -0.942 |
ingle | -0.913 |
routed | -0.902 |
Token | directly |
Token ID | 3264 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
ulia | +0.654 |
cott | +0.649 |
icas | +0.589 |
tsky | +0.573 |
kamp | +0.561 |
Neg logit contributions | |
augmented | -0.514 |
asses | -0.508 |
offending | -0.501 |
ingle | -0.487 |
routed | -0.479 |
Token | admin |
Token ID | 13169 |
Feature activation | -3.33e-01 |
Pos logit contributions | |
augmented | +0.501 |
asses | +0.491 |
offending | +0.483 |
ingle | +0.461 |
routed | +0.460 |
Neg logit contributions | |
ulia | -0.728 |
cott | -0.709 |
icas | -0.652 |
tsky | -0.636 |
kamp | -0.622 |
Token | isters |
Token ID | 6223 |
Feature activation | +9.77e-02 |
Pos logit contributions | |
ulia | +0.855 |
cott | +0.840 |
icas | +0.760 |
tsky | +0.727 |
kamp | +0.713 |
Neg logit contributions | |
augmented | -0.867 |
offending | -0.849 |
asses | -0.840 |
routed | -0.818 |
ingle | -0.817 |
Token | the |
Token ID | 262 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
augmented | +0.223 |
asses | +0.217 |
offending | +0.215 |
ingle | +0.207 |
routed | +0.205 |
Neg logit contributions | |
ulia | -0.285 |
cott | -0.280 |
icas | -0.256 |
tsky | -0.249 |
kamp | -0.243 |
Token | following |
Token ID | 1708 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
ulia | +0.460 |
cott | +0.454 |
icas | +0.414 |
tsky | +0.402 |
kamp | +0.395 |
Neg logit contributions | |
augmented | -0.334 |
asses | -0.330 |
offending | -0.324 |
ingle | -0.314 |
routed | -0.310 |
Token | external |
Token ID | 7097 |
Feature activation | -1.63e-02 |
Pos logit contributions | |
cott | +4.187 |
ulia | +4.146 |
icas | +3.817 |
doms | +3.684 |
tsky | +3.667 |
Neg logit contributions | |
asses | -3.030 |
augmented | -2.971 |
ingle | -2.950 |
offending | -2.886 |
routed | -2.818 |
Token | territories |
Token ID | 16771 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
ulia | +0.054 |
cott | +0.053 |
icas | +0.049 |
tsky | +0.048 |
kamp | +0.047 |
Neg logit contributions | |
augmented | -0.031 |
asses | -0.030 |
offending | -0.030 |
ingle | -0.028 |
routed | -0.028 |
Token | : |
Token ID | 25 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
augmented | +0.407 |
asses | +0.398 |
offending | +0.395 |
ingle | +0.382 |
routed | +0.380 |
Neg logit contributions | |
ulia | -0.379 |
cott | -0.372 |
icas | -0.334 |
tsky | -0.323 |
kamp | -0.314 |
Token | Ash |
Token ID | 7844 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
ulia | +0.527 |
cott | +0.518 |
icas | +0.469 |
tsky | +0.455 |
kamp | +0.445 |
Neg logit contributions | |
augmented | -0.486 |
asses | -0.475 |
offending | -0.471 |
ingle | -0.457 |
routed | -0.451 |
Token | more |
Token ID | 3549 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
augmented | +0.354 |
asses | +0.352 |
offending | +0.348 |
ingle | +0.338 |
routed | +0.332 |
Neg logit contributions | |
ulia | -0.417 |
cott | -0.415 |
icas | -0.379 |
tsky | -0.374 |
kamp | -0.360 |
Token | things |
Token ID | 1243 |
Feature activation | +7.94e-02 |
Pos logit contributions | |
cott | +1.624 |
ulia | +1.603 |
icas | +1.446 |
doms | +1.354 |
tsky | +1.340 |
Neg logit contributions | |
augmented | -2.232 |
asses | -2.208 |
offending | -2.201 |
ingle | -2.189 |
disse | -2.181 |
Token | are |
Token ID | 389 |
Feature activation | -2.20e-01 |
Pos logit contributions | |
asses | +0.233 |
augmented | +0.231 |
offending | +0.230 |
disse | +0.223 |
ingle | +0.221 |
Neg logit contributions | |
ulia | -0.176 |
cott | -0.173 |
icas | -0.152 |
tsky | -0.144 |
kamp | -0.141 |
Token | moving |
Token ID | 3867 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
ulia | +0.523 |
cott | +0.513 |
icas | +0.455 |
tsky | +0.443 |
kamp | +0.430 |
Neg logit contributions | |
augmented | -0.597 |
asses | -0.593 |
offending | -0.583 |
ingle | -0.574 |
disse | -0.571 |
Token | along |
Token ID | 1863 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
asses | +0.265 |
augmented | +0.264 |
offending | +0.260 |
ingle | +0.252 |
disse | +0.251 |
Neg logit contributions | |
ulia | -0.445 |
cott | -0.443 |
icas | -0.401 |
tsky | -0.400 |
kamp | -0.388 |
Token | . |
Token ID | 13 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
augmented | +1.181 |
asses | +1.164 |
offending | +1.148 |
ingle | +1.115 |
routed | +1.103 |
Neg logit contributions | |
ulia | -1.267 |
cott | -1.248 |
icas | -1.127 |
tsky | -1.091 |
kamp | -1.067 |
Token | @ |
Token ID | 2488 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
ulia | +0.380 |
cott | +0.375 |
icas | +0.337 |
tsky | +0.326 |
kamp | +0.318 |
Neg logit contributions | |
augmented | -0.391 |
asses | -0.385 |
offending | -0.381 |
ingle | -0.369 |
routed | -0.367 |
Token | Master |
Token ID | 18254 |
Feature activation | -3.91e-01 |
Pos logit contributions | |
ulia | +3.648 |
cott | +3.611 |
icas | +3.242 |
tsky | +3.151 |
kamp | +3.084 |
Neg logit contributions | |
augmented | -3.514 |
asses | -3.432 |
offending | -3.423 |
ingle | -3.312 |
routed | -3.295 |
Token | D |
Token ID | 35 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
ulia | +1.090 |
cott | +1.069 |
icas | +0.968 |
tsky | +0.940 |
kamp | +0.918 |
Neg logit contributions | |
augmented | -0.936 |
asses | -0.926 |
offending | -0.906 |
ingle | -0.890 |
routed | -0.869 |
Token | al |
Token ID | 282 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
ulia | +1.071 |
cott | +1.056 |
icas | +0.952 |
tsky | +0.923 |
kamp | +0.902 |
Neg logit contributions | |
augmented | -0.997 |
asses | -0.984 |
offending | -0.969 |
ingle | -0.943 |
routed | -0.931 |
Token | K |
Token ID | 42 |
Feature activation | -7.05e-01 |
Pos logit contributions | |
ulia | +0.829 |
cott | +0.809 |
icas | +0.714 |
tsky | +0.691 |
doms | +0.667 |
Neg logit contributions | |
augmented | -1.081 |
asses | -1.076 |
offending | -1.054 |
ingle | -1.036 |
routed | -1.024 |
Token | | |
Token ID | 930 |
Feature activation | -7.12e-01 |
Pos logit contributions | |
ulia | +1.891 |
cott | +1.863 |
icas | +1.682 |
tsky | +1.629 |
kamp | +1.592 |
Neg logit contributions | |
augmented | -1.754 |
asses | -1.728 |
offending | -1.704 |
ingle | -1.655 |
routed | -1.637 |
Token | TL |
Token ID | 24811 |
Feature activation | -5.39e-01 |
Pos logit contributions | |
augmented | +1.532 |
asses | +1.515 |
offending | +1.470 |
ingle | +1.434 |
routed | +1.412 |
Neg logit contributions | |
ulia | -1.896 |
cott | -1.869 |
icas | -1.704 |
tsky | -1.653 |
doms | -1.630 |
Token | AD |
Token ID | 2885 |
Feature activation | -9.09e-03 |
Pos logit contributions | |
ulia | +1.485 |
cott | +1.468 |
icas | +1.326 |
tsky | +1.282 |
kamp | +1.256 |
Neg logit contributions | |
augmented | -1.289 |
asses | -1.270 |
offending | -1.255 |
ingle | -1.217 |
routed | -1.202 |
Token | T |
Token ID | 51 |
Feature activation | -2.26e-01 |
Pos logit contributions | |
ulia | +0.020 |
cott | +0.020 |
icas | +0.017 |
tsky | +0.017 |
kamp | +0.016 |
Neg logit contributions | |
augmented | -0.027 |
asses | -0.027 |
offending | -0.026 |
ingle | -0.026 |
routed | -0.026 |
Token | 235 |
Token ID | 28878 |
Feature activation | +5.15e-02 |
Pos logit contributions | |
ulia | +0.699 |
cott | +0.691 |
icas | +0.632 |
tsky | +0.615 |
kamp | +0.604 |
Neg logit contributions | |
augmented | -0.467 |
asses | -0.458 |
offending | -0.451 |
ingle | -0.435 |
routed | -0.429 |
Token | 21 |
Token ID | 2481 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
augmented | +0.101 |
asses | +0.099 |
offending | +0.097 |
ingle | +0.094 |
routed | +0.093 |
Neg logit contributions | |
ulia | -0.165 |
cott | -0.163 |
icas | -0.150 |
tsky | -0.146 |
kamp | -0.143 |
Token | Posts |
Token ID | 12043 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
augmented | +0.635 |
offending | +0.617 |
asses | +0.617 |
ingle | +0.582 |
routed | +0.579 |
Neg logit contributions | |
ulia | -1.217 |
cott | -1.205 |
icas | -1.109 |
tsky | -1.081 |
kamp | -1.068 |
Token | # |
Token ID | 1303 |
Feature activation | -8.20e-01 |
Pos logit contributions | |
ulia | +2.746 |
cott | +2.685 |
icas | +2.327 |
tsky | +2.206 |
kamp | +2.154 |
Neg logit contributions | |
augmented | -4.407 |
asses | -4.379 |
offending | -4.311 |
ingle | -4.236 |
routed | -4.177 |
Token | 18 |
Token ID | 1507 |
Feature activation | +3.96e-01 |
Pos logit contributions | |
ulia | +2.653 |
cott | +2.546 |
icas | +2.311 |
kamp | +2.271 |
tsky | +2.237 |
Neg logit contributions | |
offending | -1.632 |
augmented | -1.594 |
asses | -1.583 |
disse | -1.519 |
routed | -1.509 |
Token | Good |
Token ID | 4599 |
Feature activation | +4.07e-01 |
Pos logit contributions | |
augmented | +0.976 |
asses | +0.948 |
offending | +0.942 |
ingle | +0.914 |
routed | +0.913 |
Neg logit contributions | |
ulia | -1.076 |
cott | -1.058 |
icas | -0.966 |
tsky | -0.931 |
kamp | -0.918 |
Token | stuff |
Token ID | 3404 |
Feature activation | +8.52e-02 |
Pos logit contributions | |
augmented | +0.778 |
asses | +0.764 |
offending | +0.748 |
ingle | +0.719 |
routed | +0.715 |
Neg logit contributions | |
ulia | -1.329 |
cott | -1.306 |
icas | -1.210 |
tsky | -1.175 |
kamp | -1.154 |
Token | ! |
Token ID | 0 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
augmented | +0.195 |
asses | +0.191 |
offending | +0.189 |
ingle | +0.182 |
routed | +0.182 |
Neg logit contributions | |
ulia | -0.247 |
cott | -0.243 |
icas | -0.221 |
tsky | -0.215 |
kamp | -0.210 |
Token | 2011 |
Token ID | 2813 |
Feature activation | +7.45e-01 |
Pos logit contributions | |
augmented | +1.206 |
asses | +1.181 |
offending | +1.161 |
ingle | +1.113 |
routed | +1.098 |
Neg logit contributions | |
ulia | -2.207 |
cott | -2.180 |
icas | -2.009 |
tsky | -1.959 |
kamp | -1.929 |
Token | United |
Token ID | 1578 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
augmented | +1.705 |
asses | +1.678 |
offending | +1.638 |
ingle | +1.600 |
routed | +1.575 |
Neg logit contributions | |
ulia | -2.132 |
cott | -2.097 |
icas | -1.919 |
tsky | -1.863 |
doms | -1.827 |
Token | States |
Token ID | 1829 |
Feature activation | -6.24e-02 |
Pos logit contributions | |
ulia | +0.595 |
cott | +0.585 |
icas | +0.515 |
tsky | +0.501 |
kamp | +0.483 |
Neg logit contributions | |
augmented | -0.744 |
asses | -0.736 |
offending | -0.725 |
ingle | -0.707 |
routed | -0.702 |
Token | 228 |
Token ID | 29041 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
ulia | +0.203 |
cott | +0.201 |
icas | +0.184 |
tsky | +0.179 |
kamp | +0.177 |
Neg logit contributions | |
augmented | -0.119 |
asses | -0.118 |
offending | -0.116 |
ingle | -0.111 |
routed | -0.109 |
Token | 65 |
Token ID | 2996 |
Feature activation | +4.68e-02 |
Pos logit contributions | |
augmented | +0.546 |
asses | +0.535 |
offending | +0.525 |
ingle | +0.505 |
routed | +0.498 |
Neg logit contributions | |
ulia | -0.953 |
cott | -0.941 |
icas | -0.866 |
tsky | -0.845 |
kamp | -0.828 |
Token | Posts |
Token ID | 12043 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
augmented | +0.089 |
offending | +0.088 |
asses | +0.086 |
routed | +0.083 |
disse | +0.083 |
Neg logit contributions | |
ulia | -0.153 |
cott | -0.151 |
icas | -0.139 |
kamp | -0.135 |
tsky | -0.134 |
Token | # |
Token ID | 1303 |
Feature activation | -8.04e-01 |
Pos logit contributions | |
ulia | +2.728 |
cott | +2.666 |
icas | +2.313 |
tsky | +2.196 |
kamp | +2.141 |
Neg logit contributions | |
augmented | -4.381 |
asses | -4.355 |
offending | -4.284 |
ingle | -4.210 |
routed | -4.153 |
Token | 13 |
Token ID | 1485 |
Feature activation | +6.31e-01 |
Pos logit contributions | |
cott | +2.364 |
ulia | +2.318 |
icas | +2.091 |
jar | +2.055 |
tsky | +2.037 |
Neg logit contributions | |
offending | -1.766 |
disse | -1.736 |
augmented | -1.722 |
��� | -1.695 |
routed | -1.679 |
Token | On |
Token ID | 1550 |
Feature activation | -4.20e-02 |
Pos logit contributions | |
augmented | +1.537 |
asses | +1.486 |
offending | +1.485 |
routed | +1.435 |
ingle | +1.429 |
Neg logit contributions | |
ulia | -1.728 |
cott | -1.698 |
icas | -1.554 |
tsky | -1.495 |
kamp | -1.475 |
Token | September |
Token ID | 2693 |
Feature activation | +6.20e-01 |
Pos logit contributions | |
ulia | +0.092 |
cott | +0.091 |
icas | +0.080 |
tsky | +0.077 |
kamp | +0.074 |
Neg logit contributions | |
augmented | -0.125 |
asses | -0.124 |
offending | -0.122 |
ingle | -0.119 |
routed | -0.118 |
Token | 20 |
Token ID | 1160 |
Feature activation | +4.00e-01 |
Pos logit contributions | |
augmented | +1.149 |
asses | +1.122 |
offending | +1.081 |
ingle | +1.034 |
routed | +1.030 |
Neg logit contributions | |
ulia | -2.070 |
cott | -2.062 |
icas | -1.881 |
tsky | -1.822 |
doms | -1.801 |
Token | am |
Token ID | 321 |
Feature activation | -5.82e-01 |
Pos logit contributions | |
augmented | +0.050 |
asses | +0.050 |
offending | +0.048 |
ingle | +0.048 |
routed | +0.047 |
Neg logit contributions | |
ulia | -0.059 |
cott | -0.058 |
icas | -0.053 |
tsky | -0.051 |
kamp | -0.050 |
Token | , |
Token ID | 11 |
Feature activation | +7.47e-02 |
Pos logit contributions | |
ulia | +1.568 |
cott | +1.544 |
icas | +1.395 |
tsky | +1.352 |
kamp | +1.322 |
Neg logit contributions | |
augmented | -1.441 |
asses | -1.421 |
offending | -1.401 |
ingle | -1.361 |
routed | -1.344 |
Token | Holland |
Token ID | 16070 |
Feature activation | +7.13e-02 |
Pos logit contributions | |
augmented | +0.183 |
asses | +0.180 |
offending | +0.177 |
ingle | +0.173 |
routed | +0.170 |
Neg logit contributions | |
ulia | -0.203 |
cott | -0.199 |
icas | -0.180 |
tsky | -0.175 |
doms | -0.170 |
Token | ( |
Token ID | 357 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
augmented | +0.172 |
asses | +0.168 |
offending | +0.167 |
ingle | +0.161 |
routed | +0.159 |
Neg logit contributions | |
ulia | -0.197 |
cott | -0.193 |
icas | -0.176 |
tsky | -0.172 |
doms | -0.167 |
Token | Bern |
Token ID | 23927 |
Feature activation | -7.27e-01 |
Pos logit contributions | |
augmented | +0.531 |
asses | +0.528 |
offending | +0.517 |
ingle | +0.508 |
routed | +0.499 |
Neg logit contributions | |
ulia | -0.506 |
cott | -0.492 |
icas | -0.445 |
tsky | -0.434 |
kamp | -0.416 |
Token | ard |
Token ID | 446 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
ulia | +1.910 |
cott | +1.885 |
icas | +1.699 |
tsky | +1.636 |
kamp | +1.608 |
Neg logit contributions | |
augmented | -1.849 |
asses | -1.812 |
offending | -1.805 |
ingle | -1.739 |
routed | -1.734 |
Token | 80 |
Token ID | 4019 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
ulia | +4.058 |
cott | +4.019 |
icas | +3.670 |
kamp | +3.523 |
tsky | +3.521 |
Neg logit contributions | |
augmented | -3.006 |
asses | -2.954 |
offending | -2.933 |
ingle | -2.802 |
routed | -2.778 |
Token | ), |
Token ID | 828 |
Feature activation | +4.01e-02 |
Pos logit contributions | |
augmented | +0.254 |
asses | +0.250 |
offending | +0.246 |
ingle | +0.239 |
routed | +0.236 |
Neg logit contributions | |
ulia | -0.275 |
cott | -0.271 |
icas | -0.245 |
tsky | -0.238 |
kamp | -0.231 |
Token | Ben |
Token ID | 3932 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
augmented | +0.099 |
asses | +0.098 |
offending | +0.096 |
ingle | +0.094 |
routed | +0.092 |
Neg logit contributions | |
ulia | -0.108 |
cott | -0.106 |
icas | -0.096 |
tsky | -0.093 |
doms | -0.090 |
Token | rou |
Token ID | 472 |
Feature activation | -2.44e-01 |
Pos logit contributions | |
ulia | +0.611 |
cott | +0.600 |
icas | +0.542 |
tsky | +0.527 |
kamp | +0.514 |
Neg logit contributions | |
augmented | -0.559 |
asses | -0.554 |
offending | -0.545 |
ingle | -0.531 |
routed | -0.522 |
Token | gg |
Token ID | 1130 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
ulia | +0.674 |
cott | +0.660 |
icas | +0.601 |
tsky | +0.580 |
kamp | +0.567 |
Neg logit contributions | |
augmented | -0.584 |
asses | -0.579 |
offending | -0.568 |
ingle | -0.555 |
routed | -0.546 |
Token | 2010 |
Token ID | 3050 |
Feature activation | +5.53e-01 |
Pos logit contributions | |
augmented | +0.848 |
asses | +0.832 |
offending | +0.826 |
ingle | +0.788 |
routed | +0.783 |
Neg logit contributions | |
ulia | -1.429 |
cott | -1.412 |
icas | -1.292 |
tsky | -1.258 |
kamp | -1.249 |
Token | United |
Token ID | 1578 |
Feature activation | -2.55e-01 |
Pos logit contributions | |
augmented | +1.282 |
asses | +1.266 |
offending | +1.233 |
ingle | +1.201 |
routed | +1.184 |
Neg logit contributions | |
ulia | -1.572 |
cott | -1.547 |
icas | -1.410 |
tsky | -1.368 |
doms | -1.345 |
Token | States |
Token ID | 1829 |
Feature activation | -5.41e-02 |
Pos logit contributions | |
ulia | +0.586 |
cott | +0.576 |
icas | +0.506 |
tsky | +0.492 |
kamp | +0.475 |
Neg logit contributions | |
augmented | -0.735 |
asses | -0.727 |
offending | -0.716 |
ingle | -0.700 |
routed | -0.694 |
Token | 21 |
Token ID | 2310 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
ulia | +0.176 |
cott | +0.175 |
icas | +0.160 |
tsky | +0.156 |
kamp | +0.154 |
Neg logit contributions | |
augmented | -0.102 |
asses | -0.101 |
offending | -0.099 |
ingle | -0.095 |
routed | -0.094 |
Token | 50 |
Token ID | 1120 |
Feature activation | -9.81e-02 |
Pos logit contributions | |
augmented | +0.627 |
asses | +0.619 |
offending | +0.603 |
ingle | +0.584 |
routed | +0.572 |
Neg logit contributions | |
ulia | -1.142 |
cott | -1.126 |
icas | -1.038 |
tsky | -1.018 |
kamp | -0.992 |
Token | Posts |
Token ID | 12043 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
ulia | +0.320 |
cott | +0.319 |
icas | +0.292 |
kamp | +0.284 |
tsky | +0.283 |
Neg logit contributions | |
augmented | -0.185 |
offending | -0.183 |
asses | -0.180 |
disse | -0.172 |
ingle | -0.171 |
Token | # |
Token ID | 1303 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
ulia | +2.717 |
cott | +2.658 |
icas | +2.308 |
tsky | +2.189 |
kamp | +2.135 |
Neg logit contributions | |
augmented | -4.333 |
asses | -4.303 |
offending | -4.236 |
ingle | -4.163 |
routed | -4.106 |
Token | 16 |
Token ID | 1433 |
Feature activation | +4.27e-01 |
Pos logit contributions | |
ulia | +2.521 |
cott | +2.502 |
icas | +2.228 |
tsky | +2.191 |
doms | +2.161 |
Neg logit contributions | |
augmented | -1.627 |
offending | -1.603 |
asses | -1.567 |
disse | -1.558 |
routed | -1.515 |
Token | Glad |
Token ID | 28442 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
augmented | +1.024 |
asses | +0.998 |
offending | +0.989 |
routed | +0.954 |
ingle | +0.953 |
Neg logit contributions | |
ulia | -1.188 |
cott | -1.171 |
icas | -1.069 |
tsky | -1.031 |
kamp | -1.018 |
Token | to |
Token ID | 284 |
Feature activation | -3.77e-02 |
Pos logit contributions | |
augmented | +0.419 |
asses | +0.413 |
offending | +0.406 |
ingle | +0.390 |
routed | +0.390 |
Neg logit contributions | |
ulia | -0.549 |
cott | -0.541 |
icas | -0.494 |
tsky | -0.479 |
kamp | -0.471 |
Token | hear |
Token ID | 3285 |
Feature activation | +6.17e-01 |
Pos logit contributions | |
ulia | +0.108 |
cott | +0.107 |
icas | +0.097 |
tsky | +0.094 |
kamp | +0.092 |
Neg logit contributions | |
augmented | -0.087 |
asses | -0.085 |
offending | -0.084 |
ingle | -0.081 |
routed | -0.081 |
Token | without |
Token ID | 19419 |
Feature activation | -4.86e-01 |
Pos logit contributions | |
ulia | +0.469 |
cott | +0.463 |
icas | +0.421 |
tsky | +0.408 |
kamp | +0.400 |
Neg logit contributions | |
augmented | -0.381 |
asses | -0.375 |
offending | -0.369 |
ingle | -0.358 |
routed | -0.353 |
Token | religion |
Token ID | 5737 |
Feature activation | +8.11e-02 |
Pos logit contributions | |
ulia | +1.451 |
cott | +1.432 |
icas | +1.307 |
tsky | +1.270 |
kamp | +1.246 |
Neg logit contributions | |
augmented | -1.061 |
asses | -1.044 |
offending | -1.026 |
ingle | -0.994 |
routed | -0.982 |
Token | � |
Token ID | 447 |
Feature activation | -3.93e-04 |
Pos logit contributions | |
augmented | +0.223 |
asses | +0.220 |
offending | +0.218 |
ingle | +0.211 |
routed | +0.210 |
Neg logit contributions | |
ulia | -0.197 |
cott | -0.193 |
icas | -0.172 |
tsky | -0.166 |
kamp | -0.162 |
Token | � |
Token ID | 251 |
Feature activation | +3.34e-02 |
Pos logit contributions | |
ulia | +0.001 |
cott | +0.001 |
icas | +0.001 |
tsky | +0.001 |
kamp | +0.001 |
Neg logit contributions | |
augmented | -0.001 |
asses | -0.001 |
offending | -0.001 |
ingle | -0.001 |
routed | -0.001 |
Token | fl |
Token ID | 781 |
Feature activation | -8.16e-02 |
Pos logit contributions | |
augmented | +0.081 |
asses | +0.080 |
offending | +0.079 |
ingle | +0.077 |
routed | +0.076 |
Neg logit contributions | |
ulia | -0.091 |
cott | -0.090 |
icas | -0.082 |
tsky | -0.079 |
kamp | -0.077 |
Token | it |
Token ID | 270 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
ulia | +0.225 |
cott | +0.222 |
icas | +0.200 |
tsky | +0.195 |
kamp | +0.190 |
Neg logit contributions | |
augmented | -0.196 |
asses | -0.195 |
offending | -0.190 |
ingle | -0.187 |
routed | -0.183 |
Token | between |
Token ID | 1022 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
ulia | +4.017 |
cott | +3.953 |
icas | +3.539 |
tsky | +3.521 |
doms | +3.450 |
Neg logit contributions | |
augmented | -2.952 |
asses | -2.925 |
offending | -2.837 |
disse | -2.770 |
ingle | -2.767 |
Token | Pent |
Token ID | 9696 |
Feature activation | +5.35e-02 |
Pos logit contributions | |
augmented | +0.543 |
offending | +0.529 |
asses | +0.529 |
ingle | +0.504 |
routed | +0.503 |
Neg logit contributions | |
ulia | -0.650 |
cott | -0.641 |
icas | -0.581 |
tsky | -0.563 |
kamp | -0.555 |
Token | ec |
Token ID | 721 |
Feature activation | -9.01e-02 |
Pos logit contributions | |
augmented | +0.173 |
asses | +0.172 |
offending | +0.169 |
ingle | +0.167 |
routed | +0.164 |
Neg logit contributions | |
ulia | -0.102 |
cott | -0.100 |
icas | -0.086 |
tsky | -0.083 |
kamp | -0.080 |
Token | ost |
Token ID | 455 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
ulia | +0.279 |
cott | +0.276 |
icas | +0.252 |
tsky | +0.245 |
kamp | +0.240 |
Neg logit contributions | |
augmented | -0.189 |
offending | -0.182 |
asses | -0.182 |
routed | -0.174 |
ingle | -0.173 |
Token | al |
Token ID | 282 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
augmented | +0.269 |
asses | +0.267 |
offending | +0.259 |
ingle | +0.253 |
routed | +0.247 |
Neg logit contributions | |
ulia | -0.357 |
cott | -0.353 |
icas | -0.319 |
tsky | -0.314 |
kamp | -0.308 |
Token | � |
Token ID | 447 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
augmented | +0.495 |
asses | +0.477 |
offending | +0.470 |
routed | +0.457 |
ingle | +0.457 |
Neg logit contributions | |
ulia | -0.622 |
cott | -0.614 |
icas | -0.563 |
tsky | -0.541 |
doms | -0.529 |
Token | � |
Token ID | 251 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
ulia | +0.332 |
cott | +0.326 |
icas | +0.297 |
tsky | +0.288 |
kamp | +0.286 |
Neg logit contributions | |
augmented | -0.242 |
asses | -0.240 |
offending | -0.237 |
disse | -0.227 |
ingle | -0.225 |
Token | – |
Token ID | 784 |
Feature activation | -5.66e-02 |
Pos logit contributions | |
ulia | +0.283 |
cott | +0.279 |
icas | +0.254 |
tsky | +0.246 |
kamp | +0.240 |
Neg logit contributions | |
augmented | -0.238 |
asses | -0.234 |
offending | -0.230 |
ingle | -0.223 |
routed | -0.221 |
Token | is |
Token ID | 318 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
ulia | +0.159 |
cott | +0.157 |
icas | +0.143 |
tsky | +0.138 |
kamp | +0.135 |
Neg logit contributions | |
augmented | -0.134 |
asses | -0.131 |
offending | -0.130 |
ingle | -0.125 |
routed | -0.125 |
Token | at |
Token ID | 379 |
Feature activation | -8.57e-02 |
Pos logit contributions | |
ulia | +1.477 |
cott | +1.461 |
icas | +1.327 |
tsky | +1.287 |
kamp | +1.266 |
Neg logit contributions | |
augmented | -1.179 |
asses | -1.171 |
offending | -1.149 |
ingle | -1.121 |
routed | -1.098 |
Token | once |
Token ID | 1752 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
ulia | +0.224 |
cott | +0.220 |
icas | +0.198 |
tsky | +0.192 |
kamp | +0.187 |
Neg logit contributions | |
augmented | -0.220 |
asses | -0.217 |
offending | -0.214 |
ingle | -0.209 |
routed | -0.205 |
Token | relentlessly |
Token ID | 37952 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
cott | +3.925 |
ulia | +3.907 |
icas | +3.563 |
tsky | +3.464 |
kamp | +3.423 |
Neg logit contributions | |
asses | -2.812 |
augmented | -2.775 |
offending | -2.706 |
ingle | -2.703 |
routed | -2.583 |
Token | cynical |
Token ID | 28858 |
Feature activation | -4.21e-01 |
Pos logit contributions | |
ulia | +0.736 |
cott | +0.728 |
icas | +0.666 |
tsky | +0.648 |
kamp | +0.636 |
Neg logit contributions | |
augmented | -0.496 |
asses | -0.488 |
offending | -0.479 |
ingle | -0.464 |
routed | -0.457 |
Token | and |
Token ID | 290 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
ulia | +1.097 |
cott | +1.080 |
icas | +0.972 |
tsky | +0.940 |
kamp | +0.918 |
Neg logit contributions | |
augmented | -1.080 |
asses | -1.065 |
offending | -1.051 |
ingle | -1.021 |
routed | -1.011 |
Token | outward |
Token ID | 23537 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
augmented | +0.037 |
asses | +0.036 |
offending | +0.036 |
routed | +0.034 |
ingle | +0.034 |
Neg logit contributions | |
ulia | -0.058 |
cott | -0.057 |
icas | -0.052 |
tsky | -0.051 |
kamp | -0.050 |
Token | ly |
Token ID | 306 |
Feature activation | -6.21e-01 |
Pos logit contributions | |
ulia | +0.558 |
cott | +0.544 |
icas | +0.494 |
tsky | +0.480 |
kamp | +0.468 |
Neg logit contributions | |
augmented | -0.487 |
asses | -0.474 |
offending | -0.473 |
ingle | -0.454 |
routed | -0.453 |
Token | bullying |
Token ID | 20714 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
ulia | +0.847 |
cott | +0.835 |
icas | +0.761 |
tsky | +0.740 |
kamp | +0.724 |
Neg logit contributions | |
augmented | -0.632 |
asses | -0.619 |
offending | -0.614 |
ingle | -0.589 |
routed | -0.584 |
Token | , |
Token ID | 11 |
Feature activation | -6.80e-02 |
Pos logit contributions | |
ulia | +1.019 |
cott | +1.003 |
icas | +0.910 |
tsky | +0.883 |
kamp | +0.863 |
Neg logit contributions | |
augmented | -0.837 |
asses | -0.822 |
offending | -0.817 |
ingle | -0.784 |
routed | -0.778 |
Token | dominance |
Token ID | 18648 |
Feature activation | -4.77e-01 |
Pos logit contributions | |
ulia | +0.199 |
cott | +0.196 |
icas | +0.178 |
tsky | +0.173 |
kamp | +0.169 |
Neg logit contributions | |
augmented | -0.155 |
offending | -0.152 |
asses | -0.151 |
routed | -0.144 |
ingle | -0.143 |
Token | , |
Token ID | 11 |
Feature activation | +3.13e-02 |
Pos logit contributions | |
ulia | +1.311 |
cott | +1.295 |
icas | +1.168 |
tsky | +1.131 |
kamp | +1.103 |
Neg logit contributions | |
augmented | -1.166 |
asses | -1.143 |
offending | -1.134 |
ingle | -1.092 |
routed | -1.085 |
Token | and |
Token ID | 290 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
augmented | +0.081 |
offending | +0.080 |
asses | +0.079 |
routed | +0.075 |
ingle | +0.075 |
Neg logit contributions | |
ulia | -0.082 |
cott | -0.081 |
icas | -0.072 |
tsky | -0.070 |
kamp | -0.068 |
Token | victim |
Token ID | 3117 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
ulia | +0.840 |
cott | +0.828 |
icas | +0.755 |
tsky | +0.734 |
kamp | +0.719 |
Neg logit contributions | |
augmented | -0.621 |
asses | -0.609 |
offending | -0.602 |
ingle | -0.580 |
routed | -0.574 |
Token | ization |
Token ID | 1634 |
Feature activation | -6.00e-01 |
Pos logit contributions | |
ulia | +3.419 |
cott | +3.368 |
icas | +3.027 |
tsky | +2.922 |
kamp | +2.888 |
Neg logit contributions | |
augmented | -3.423 |
asses | -3.406 |
offending | -3.275 |
ingle | -3.258 |
routed | -3.199 |
Token | during |
Token ID | 1141 |
Feature activation | -7.93e-01 |
Pos logit contributions | |
ulia | +1.613 |
cott | +1.589 |
icas | +1.435 |
tsky | +1.390 |
kamp | +1.360 |
Neg logit contributions | |
augmented | -1.487 |
asses | -1.466 |
offending | -1.443 |
ingle | -1.404 |
routed | -1.388 |
Token | the |
Token ID | 262 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
ulia | +2.413 |
cott | +2.386 |
icas | +2.182 |
tsky | +2.120 |
kamp | +2.088 |
Neg logit contributions | |
augmented | -1.652 |
asses | -1.645 |
offending | -1.586 |
ingle | -1.559 |
routed | -1.532 |
Token | transition |
Token ID | 6801 |
Feature activation | -3.23e-01 |
Pos logit contributions | |
ulia | +0.570 |
cott | +0.563 |
icas | +0.516 |
tsky | +0.502 |
kamp | +0.494 |
Neg logit contributions | |
augmented | -0.362 |
asses | -0.358 |
offending | -0.348 |
ingle | -0.339 |
routed | -0.334 |
Token | from |
Token ID | 422 |
Feature activation | -2.45e-01 |
Pos logit contributions | |
ulia | +1.008 |
cott | +0.998 |
icas | +0.916 |
tsky | +0.889 |
kamp | +0.875 |
Neg logit contributions | |
augmented | -0.666 |
asses | -0.653 |
offending | -0.646 |
ingle | -0.621 |
routed | -0.612 |
Token |
|
Token ID | 198 |
Feature activation | -9.94e-02 |
Pos logit contributions | |
ulia | +0.667 |
cott | +0.663 |
icas | +0.598 |
tsky | +0.579 |
kamp | +0.565 |
Neg logit contributions | |
augmented | -0.638 |
asses | -0.630 |
offending | -0.615 |
ingle | -0.602 |
routed | -0.595 |
Token |
|
Token ID | 198 |
Feature activation | -4.57e-02 |
Pos logit contributions | |
ulia | +0.231 |
cott | +0.228 |
icas | +0.200 |
tsky | +0.192 |
kamp | +0.190 |
Neg logit contributions | |
augmented | -0.282 |
offending | -0.281 |
asses | -0.278 |
disse | -0.271 |
routed | -0.269 |
Token | For |
Token ID | 1890 |
Feature activation | -6.05e-02 |
Pos logit contributions | |
ulia | +0.120 |
cott | +0.118 |
icas | +0.107 |
tsky | +0.104 |
kamp | +0.101 |
Neg logit contributions | |
augmented | -0.116 |
asses | -0.115 |
offending | -0.112 |
ingle | -0.110 |
routed | -0.108 |
Token | the |
Token ID | 262 |
Feature activation | +6.46e-02 |
Pos logit contributions | |
ulia | +0.173 |
cott | +0.171 |
icas | +0.155 |
tsky | +0.150 |
kamp | +0.147 |
Neg logit contributions | |
augmented | -0.140 |
asses | -0.138 |
offending | -0.136 |
ingle | -0.131 |
routed | -0.130 |
Token | most |
Token ID | 749 |
Feature activation | +3.26e-02 |
Pos logit contributions | |
augmented | +0.145 |
asses | +0.142 |
offending | +0.141 |
ingle | +0.135 |
routed | +0.134 |
Neg logit contributions | |
ulia | -0.189 |
cott | -0.187 |
icas | -0.170 |
tsky | -0.166 |
kamp | -0.162 |
Token | part |
Token ID | 636 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
augmented | +0.055 |
asses | +0.055 |
offending | +0.053 |
ingle | +0.051 |
disse | +0.050 |
Neg logit contributions | |
ulia | -0.113 |
cott | -0.112 |
icas | -0.103 |
tsky | -0.101 |
kamp | -0.099 |
Token | , |
Token ID | 11 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
ulia | +3.581 |
cott | +3.515 |
icas | +3.176 |
tsky | +3.067 |
kamp | +3.009 |
Neg logit contributions | |
augmented | -3.273 |
asses | -3.228 |
offending | -3.179 |
ingle | -3.112 |
routed | -3.053 |
Token | Fowler |
Token ID | 33693 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
ulia | +0.666 |
cott | +0.657 |
icas | +0.590 |
tsky | +0.571 |
kamp | +0.558 |
Neg logit contributions | |
augmented | -0.676 |
asses | -0.664 |
offending | -0.657 |
ingle | -0.636 |
routed | -0.633 |
Token | has |
Token ID | 468 |
Feature activation | -6.59e-03 |
Pos logit contributions | |
augmented | +0.388 |
asses | +0.378 |
offending | +0.374 |
routed | +0.361 |
ingle | +0.360 |
Neg logit contributions | |
ulia | -0.447 |
cott | -0.437 |
icas | -0.399 |
tsky | -0.383 |
doms | -0.377 |
Token | kept |
Token ID | 4030 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
ulia | +0.018 |
cott | +0.018 |
icas | +0.016 |
tsky | +0.016 |
kamp | +0.015 |
Neg logit contributions | |
augmented | -0.016 |
asses | -0.015 |
offending | -0.015 |
routed | -0.015 |
ingle | -0.015 |
Token | the |
Token ID | 262 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
augmented | +0.304 |
offending | +0.295 |
asses | +0.293 |
routed | +0.282 |
ingle | +0.278 |
Neg logit contributions | |
ulia | -0.399 |
cott | -0.391 |
icas | -0.357 |
tsky | -0.348 |
kamp | -0.342 |
Token | June |
Token ID | 2795 |
Feature activation | +6.90e-01 |
Pos logit contributions | |
ulia | +1.299 |
cott | +1.279 |
icas | +1.114 |
tsky | +1.063 |
kamp | +1.038 |
Neg logit contributions | |
augmented | -1.922 |
asses | -1.911 |
offending | -1.893 |
ingle | -1.856 |
routed | -1.829 |
Token | 2012 |
Token ID | 2321 |
Feature activation | +6.82e-01 |
Pos logit contributions | |
augmented | +1.274 |
asses | +1.247 |
offending | +1.230 |
ingle | +1.179 |
routed | +1.164 |
Neg logit contributions | |
ulia | -2.295 |
cott | -2.268 |
icas | -2.086 |
tsky | -2.035 |
kamp | -2.006 |
Token | Canada |
Token ID | 3340 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
augmented | +1.586 |
asses | +1.562 |
offending | +1.527 |
ingle | +1.490 |
routed | +1.469 |
Neg logit contributions | |
ulia | -1.941 |
cott | -1.907 |
icas | -1.737 |
tsky | -1.684 |
doms | -1.653 |
Token | 16 |
Token ID | 1467 |
Feature activation | +3.98e-01 |
Pos logit contributions | |
augmented | +0.207 |
asses | +0.204 |
offending | +0.202 |
ingle | +0.194 |
routed | +0.191 |
Neg logit contributions | |
ulia | -0.337 |
cott | -0.334 |
icas | -0.306 |
tsky | -0.297 |
kamp | -0.295 |
Token | 10 |
Token ID | 940 |
Feature activation | +2.64e-01 |
Pos logit contributions | |
augmented | +0.787 |
asses | +0.770 |
offending | +0.755 |
ingle | +0.731 |
routed | +0.719 |
Neg logit contributions | |
ulia | -1.270 |
cott | -1.253 |
icas | -1.153 |
tsky | -1.124 |
kamp | -1.099 |
Token | Posts |
Token ID | 12043 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
augmented | +0.490 |
offending | +0.479 |
asses | +0.477 |
ingle | +0.455 |
disse | +0.450 |
Neg logit contributions | |
ulia | -0.874 |
cott | -0.869 |
icas | -0.796 |
tsky | -0.774 |
kamp | -0.772 |
Token | # |
Token ID | 1303 |
Feature activation | -8.42e-01 |
Pos logit contributions | |
ulia | +2.625 |
cott | +2.570 |
icas | +2.229 |
tsky | +2.117 |
kamp | +2.065 |
Neg logit contributions | |
augmented | -4.201 |
asses | -4.174 |
offending | -4.107 |
ingle | -4.035 |
routed | -3.982 |
Token | 14 |
Token ID | 1415 |
Feature activation | +5.33e-01 |
Pos logit contributions | |
ulia | +2.449 |
cott | +2.418 |
icas | +2.151 |
jar | +2.129 |
kamp | +2.101 |
Neg logit contributions | |
offending | -1.865 |
augmented | -1.823 |
��� | -1.807 |
disse | -1.805 |
routed | -1.749 |
Token | On |
Token ID | 1550 |
Feature activation | -3.12e-02 |
Pos logit contributions | |
augmented | +1.289 |
asses | +1.251 |
offending | +1.244 |
routed | +1.202 |
ingle | +1.202 |
Neg logit contributions | |
ulia | -1.470 |
cott | -1.444 |
icas | -1.321 |
tsky | -1.272 |
kamp | -1.254 |
Token | September |
Token ID | 2693 |
Feature activation | +5.75e-01 |
Pos logit contributions | |
ulia | +0.067 |
cott | +0.066 |
icas | +0.058 |
tsky | +0.056 |
kamp | +0.054 |
Neg logit contributions | |
augmented | -0.094 |
asses | -0.093 |
offending | -0.092 |
ingle | -0.090 |
routed | -0.089 |
Token | 20 |
Token ID | 1160 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
augmented | +1.082 |
asses | +1.063 |
offending | +1.024 |
ingle | +0.978 |
routed | +0.976 |
Neg logit contributions | |
ulia | -1.904 |
cott | -1.898 |
icas | -1.724 |
tsky | -1.672 |
doms | -1.653 |
Token | credit |
Token ID | 3884 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
augmented | +0.106 |
asses | +0.103 |
offending | +0.103 |
ingle | +0.098 |
routed | +0.097 |
Neg logit contributions | |
ulia | -0.152 |
cott | -0.150 |
icas | -0.137 |
tsky | -0.133 |
kamp | -0.131 |
Token | card |
Token ID | 2657 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
augmented | +0.320 |
asses | +0.312 |
offending | +0.311 |
ingle | +0.299 |
routed | +0.294 |
Neg logit contributions | |
ulia | -0.469 |
cott | -0.465 |
icas | -0.426 |
tsky | -0.414 |
kamp | -0.406 |
Token | report |
Token ID | 989 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
ulia | +0.480 |
cott | +0.474 |
icas | +0.434 |
tsky | +0.423 |
kamp | +0.415 |
Neg logit contributions | |
augmented | -0.308 |
asses | -0.302 |
offending | -0.297 |
ingle | -0.286 |
routed | -0.283 |
Token | can |
Token ID | 460 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
ulia | +1.613 |
cott | +1.588 |
icas | +1.443 |
tsky | +1.401 |
kamp | +1.375 |
Neg logit contributions | |
augmented | -1.261 |
asses | -1.248 |
offending | -1.221 |
ingle | -1.189 |
routed | -1.169 |
Token | be |
Token ID | 307 |
Feature activation | -9.68e-02 |
Pos logit contributions | |
augmented | +0.057 |
asses | +0.056 |
offending | +0.055 |
ingle | +0.053 |
routed | +0.053 |
Neg logit contributions | |
ulia | -0.079 |
cott | -0.078 |
icas | -0.071 |
tsky | -0.069 |
kamp | -0.068 |
Token | found |
Token ID | 1043 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
ulia | +0.286 |
cott | +0.282 |
icas | +0.257 |
tsky | +0.250 |
kamp | +0.245 |
Neg logit contributions | |
augmented | -0.214 |
asses | -0.211 |
offending | -0.207 |
ingle | -0.201 |
routed | -0.198 |
Token | at |
Token ID | 379 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
ulia | +3.893 |
cott | +3.835 |
icas | +3.487 |
tsky | +3.370 |
kamp | +3.333 |
Neg logit contributions | |
asses | -2.858 |
augmented | -2.808 |
offending | -2.731 |
ingle | -2.671 |
disse | -2.639 |
Token | bit |
Token ID | 1643 |
Feature activation | +1.46e-01 |
Pos logit contributions | |
ulia | +0.644 |
cott | +0.632 |
icas | +0.568 |
tsky | +0.548 |
kamp | +0.538 |
Neg logit contributions | |
augmented | -0.689 |
asses | -0.677 |
offending | -0.670 |
ingle | -0.650 |
routed | -0.644 |
Token | . |
Token ID | 13 |
Feature activation | -2.60e-01 |
Pos logit contributions | |
augmented | +0.364 |
asses | +0.361 |
offending | +0.352 |
ingle | +0.346 |
routed | +0.336 |
Neg logit contributions | |
ulia | -0.386 |
cott | -0.381 |
icas | -0.346 |
tsky | -0.336 |
kamp | -0.326 |
Token | ly |
Token ID | 306 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
ulia | +0.698 |
cott | +0.688 |
icas | +0.621 |
tsky | +0.602 |
kamp | +0.588 |
Neg logit contributions | |
augmented | -0.648 |
asses | -0.639 |
offending | -0.630 |
ingle | -0.612 |
routed | -0.605 |
Token | / |
Token ID | 14 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
ulia | +0.639 |
cott | +0.629 |
icas | +0.567 |
tsky | +0.550 |
kamp | +0.538 |
Neg logit contributions | |
augmented | -0.593 |
asses | -0.584 |
offending | -0.576 |
ingle | -0.559 |
routed | -0.553 |
Token | � |
Token ID | 447 |
Feature activation | +6.83e-02 |
Pos logit contributions | |
ulia | +0.204 |
cott | +0.202 |
icas | +0.182 |
tsky | +0.176 |
kamp | +0.172 |
Neg logit contributions | |
augmented | -0.192 |
asses | -0.187 |
offending | -0.186 |
ingle | -0.179 |
routed | -0.178 |
Token | � |
Token ID | 251 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
augmented | +0.135 |
asses | +0.132 |
offending | +0.130 |
ingle | +0.125 |
routed | +0.123 |
Neg logit contributions | |
ulia | -0.218 |
cott | -0.216 |
icas | -0.198 |
tsky | -0.193 |
kamp | -0.189 |
Token | he |
Token ID | 339 |
Feature activation | -2.33e-01 |
Pos logit contributions | |
ulia | +0.379 |
cott | +0.375 |
icas | +0.338 |
tsky | +0.327 |
doms | +0.320 |
Neg logit contributions | |
augmented | -0.349 |
asses | -0.340 |
offending | -0.338 |
ingle | -0.325 |
routed | -0.322 |
Token | said |
Token ID | 531 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
ulia | +0.553 |
cott | +0.546 |
icas | +0.484 |
tsky | +0.466 |
kamp | +0.454 |
Neg logit contributions | |
augmented | -0.656 |
asses | -0.644 |
offending | -0.636 |
ingle | -0.617 |
routed | -0.614 |
Token | without |
Token ID | 1231 |
Feature activation | -4.81e-01 |
Pos logit contributions | |
ulia | +0.349 |
cott | +0.345 |
icas | +0.313 |
tsky | +0.302 |
doms | +0.296 |
Neg logit contributions | |
augmented | -0.294 |
asses | -0.287 |
offending | -0.285 |
ingle | -0.273 |
routed | -0.271 |
Token | hesitation |
Token ID | 29592 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
ulia | +1.522 |
cott | +1.504 |
icas | +1.373 |
tsky | +1.342 |
kamp | +1.318 |
Neg logit contributions | |
augmented | -0.978 |
asses | -0.957 |
offending | -0.953 |
ingle | -0.902 |
routed | -0.894 |
Token | . |
Token ID | 13 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
ulia | +3.400 |
cott | +3.328 |
icas | +2.995 |
tsky | +2.895 |
kamp | +2.843 |
Neg logit contributions | |
augmented | -3.360 |
asses | -3.323 |
offending | -3.267 |
ingle | -3.202 |
routed | -3.152 |
Token | � |
Token ID | 564 |
Feature activation | +2.27e-02 |
Pos logit contributions | |
ulia | +0.334 |
cott | +0.332 |
icas | +0.298 |
tsky | +0.287 |
doms | +0.280 |
Neg logit contributions | |
augmented | -0.343 |
asses | -0.339 |
offending | -0.333 |
ingle | -0.323 |
routed | -0.318 |
Token | � |
Token ID | 250 |
Feature activation | -9.54e-02 |
Pos logit contributions | |
augmented | +0.045 |
asses | +0.045 |
offending | +0.044 |
ingle | +0.042 |
disse | +0.042 |
Neg logit contributions | |
ulia | -0.072 |
cott | -0.071 |
icas | -0.065 |
tsky | -0.063 |
kamp | -0.062 |
Token | I |
Token ID | 40 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
ulia | +0.246 |
cott | +0.242 |
icas | +0.218 |
tsky | +0.211 |
kamp | +0.205 |
Neg logit contributions | |
augmented | -0.247 |
asses | -0.244 |
offending | -0.240 |
ingle | -0.234 |
routed | -0.231 |
Token | can |
Token ID | 460 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
ulia | +0.483 |
cott | +0.476 |
icas | +0.433 |
tsky | +0.419 |
kamp | +0.411 |
Neg logit contributions | |
augmented | -0.395 |
asses | -0.388 |
offending | -0.383 |
ingle | -0.371 |
routed | -0.367 |
Token | sad |
Token ID | 6507 |
Feature activation | -8.24e-03 |
Pos logit contributions | |
ulia | +0.314 |
cott | +0.310 |
icas | +0.284 |
tsky | +0.276 |
kamp | +0.270 |
Neg logit contributions | |
augmented | -0.218 |
asses | -0.214 |
offending | -0.211 |
ingle | -0.203 |
routed | -0.201 |
Token | book |
Token ID | 1492 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
ulia | +0.023 |
cott | +0.022 |
icas | +0.020 |
tsky | +0.020 |
kamp | +0.019 |
Neg logit contributions | |
augmented | -0.020 |
asses | -0.020 |
offending | -0.019 |
ingle | -0.019 |
routed | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | -2.06e-01 |
Pos logit contributions | |
ulia | +0.475 |
cott | +0.467 |
icas | +0.425 |
tsky | +0.412 |
kamp | +0.402 |
Neg logit contributions | |
augmented | -0.395 |
asses | -0.388 |
offending | -0.383 |
ingle | -0.370 |
routed | -0.367 |
Token | In |
Token ID | 554 |
Feature activation | +7.70e-02 |
Pos logit contributions | |
ulia | +0.485 |
cott | +0.477 |
icas | +0.424 |
tsky | +0.408 |
kamp | +0.397 |
Neg logit contributions | |
augmented | -0.578 |
asses | -0.572 |
offending | -0.563 |
ingle | -0.549 |
routed | -0.543 |
Token | some |
Token ID | 617 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
augmented | +0.184 |
asses | +0.180 |
offending | +0.179 |
ingle | +0.171 |
routed | +0.170 |
Neg logit contributions | |
ulia | -0.215 |
cott | -0.213 |
icas | -0.193 |
tsky | -0.186 |
kamp | -0.183 |
Token | ways |
Token ID | 2842 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
augmented | +0.293 |
asses | +0.287 |
offending | +0.283 |
ingle | +0.272 |
routed | +0.271 |
Neg logit contributions | |
ulia | -0.341 |
cott | -0.336 |
icas | -0.303 |
tsky | -0.294 |
kamp | -0.288 |
Token | , |
Token ID | 11 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
ulia | +3.492 |
cott | +3.433 |
icas | +3.102 |
tsky | +3.012 |
kamp | +2.945 |
Neg logit contributions | |
augmented | -3.243 |
asses | -3.215 |
offending | -3.149 |
ingle | -3.094 |
routed | -3.044 |
Token | it |
Token ID | 340 |
Feature activation | -4.14e-02 |
Pos logit contributions | |
ulia | +0.641 |
cott | +0.633 |
icas | +0.570 |
tsky | +0.550 |
kamp | +0.539 |
Neg logit contributions | |
augmented | -0.599 |
asses | -0.588 |
offending | -0.584 |
ingle | -0.561 |
routed | -0.558 |
Token | � |
Token ID | 447 |
Feature activation | +6.94e-02 |
Pos logit contributions | |
ulia | +0.114 |
cott | +0.113 |
icas | +0.102 |
tsky | +0.098 |
doms | +0.096 |
Neg logit contributions | |
augmented | -0.101 |
asses | -0.099 |
offending | -0.098 |
routed | -0.094 |
ingle | -0.094 |
Token | � |
Token ID | 247 |
Feature activation | +4.47e-02 |
Pos logit contributions | |
augmented | +0.146 |
asses | +0.144 |
offending | +0.142 |
ingle | +0.136 |
disse | +0.135 |
Neg logit contributions | |
ulia | -0.213 |
cott | -0.209 |
icas | -0.192 |
tsky | -0.186 |
kamp | -0.184 |
Token | s |
Token ID | 82 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
augmented | +0.114 |
asses | +0.113 |
offending | +0.110 |
ingle | +0.107 |
routed | +0.106 |
Neg logit contributions | |
ulia | -0.118 |
cott | -0.115 |
icas | -0.104 |
tsky | -0.101 |
kamp | -0.098 |
Token | institutions |
Token ID | 6712 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
ulia | +1.201 |
cott | +1.183 |
icas | +1.080 |
tsky | +1.048 |
kamp | +1.029 |
Neg logit contributions | |
augmented | -0.890 |
asses | -0.875 |
offending | -0.862 |
ingle | -0.832 |
routed | -0.823 |
Token | that |
Token ID | 326 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
ulia | +0.728 |
cott | +0.718 |
icas | +0.657 |
tsky | +0.639 |
kamp | +0.627 |
Neg logit contributions | |
augmented | -0.500 |
asses | -0.492 |
offending | -0.484 |
ingle | -0.467 |
routed | -0.461 |
Token | have |
Token ID | 423 |
Feature activation | +8.58e-02 |
Pos logit contributions | |
ulia | +0.049 |
cott | +0.048 |
icas | +0.044 |
tsky | +0.042 |
kamp | +0.042 |
Neg logit contributions | |
augmented | -0.038 |
asses | -0.037 |
offending | -0.037 |
ingle | -0.035 |
routed | -0.035 |
Token | been |
Token ID | 587 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
augmented | +0.188 |
asses | +0.181 |
offending | +0.180 |
routed | +0.174 |
ingle | +0.171 |
Neg logit contributions | |
ulia | -0.260 |
cott | -0.255 |
icas | -0.234 |
tsky | -0.226 |
kamp | -0.223 |
Token | the |
Token ID | 262 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
augmented | +0.763 |
asses | +0.741 |
offending | +0.735 |
routed | +0.707 |
ingle | +0.689 |
Neg logit contributions | |
ulia | -1.077 |
cott | -1.050 |
icas | -0.965 |
tsky | -0.935 |
kamp | -0.926 |
Token | basis |
Token ID | 4308 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
augmented | +0.435 |
asses | +0.424 |
offending | +0.419 |
ingle | +0.395 |
routed | +0.395 |
Neg logit contributions | |
ulia | -0.807 |
cott | -0.793 |
icas | -0.733 |
tsky | -0.714 |
kamp | -0.706 |
Token | of |
Token ID | 286 |
Feature activation | +2.37e-01 |
Pos logit contributions | |
augmented | +2.014 |
asses | +1.997 |
offending | +1.898 |
routed | +1.830 |
ingle | +1.827 |
Neg logit contributions | |
ulia | -3.445 |
cott | -3.408 |
icas | -3.112 |
tsky | -3.032 |
kamp | -2.973 |
Token | American |
Token ID | 1605 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
augmented | +0.562 |
asses | +0.551 |
offending | +0.545 |
ingle | +0.522 |
routed | +0.521 |
Neg logit contributions | |
ulia | -0.668 |
cott | -0.656 |
icas | -0.597 |
tsky | -0.576 |
kamp | -0.566 |
Token | foreign |
Token ID | 3215 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
augmented | +1.052 |
asses | +1.030 |
offending | +1.017 |
routed | +0.970 |
ingle | +0.967 |
Neg logit contributions | |
ulia | -1.515 |
cott | -1.480 |
icas | -1.356 |
tsky | -1.311 |
kamp | -1.294 |
Token | policy |
Token ID | 2450 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
augmented | +0.364 |
asses | +0.349 |
offending | +0.344 |
routed | +0.311 |
ingle | +0.309 |
Neg logit contributions | |
ulia | -1.280 |
cott | -1.258 |
icas | -1.181 |
tsky | -1.153 |
kamp | -1.139 |
Token | for |
Token ID | 329 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
augmented | +0.331 |
asses | +0.324 |
offending | +0.319 |
ingle | +0.306 |
routed | +0.303 |
Neg logit contributions | |
ulia | -0.539 |
cott | -0.532 |
icas | -0.489 |
tsky | -0.475 |
kamp | -0.467 |
Token | saying |
Token ID | 2282 |
Feature activation | +5.14e-01 |
Pos logit contributions | |
augmented | +1.107 |
asses | +1.089 |
offending | +1.087 |
ingle | +1.043 |
routed | +1.034 |
Neg logit contributions | |
ulia | -1.482 |
cott | -1.453 |
icas | -1.326 |
tsky | -1.295 |
doms | -1.248 |
Token | , |
Token ID | 11 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
augmented | +1.121 |
asses | +1.093 |
offending | +1.092 |
ingle | +1.040 |
routed | +1.037 |
Neg logit contributions | |
ulia | -1.545 |
cott | -1.516 |
icas | -1.388 |
tsky | -1.356 |
kamp | -1.316 |
Token | ' |
Token ID | 705 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
augmented | +0.549 |
asses | +0.537 |
offending | +0.533 |
ingle | +0.513 |
routed | +0.509 |
Neg logit contributions | |
ulia | -0.709 |
cott | -0.700 |
icas | -0.639 |
tsky | -0.621 |
kamp | -0.606 |
Token | Please |
Token ID | 5492 |
Feature activation | +5.20e-01 |
Pos logit contributions | |
augmented | +0.440 |
asses | +0.436 |
offending | +0.428 |
ingle | +0.417 |
routed | +0.411 |
Neg logit contributions | |
ulia | -0.471 |
cott | -0.462 |
icas | -0.419 |
tsky | -0.407 |
kamp | -0.395 |
Token | , |
Token ID | 11 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
augmented | +1.201 |
asses | +1.176 |
offending | +1.163 |
ingle | +1.121 |
routed | +1.113 |
Neg logit contributions | |
ulia | -1.495 |
cott | -1.469 |
icas | -1.340 |
tsky | -1.302 |
kamp | -1.272 |
Token | Hon |
Token ID | 8835 |
Feature activation | +9.17e-01 |
Pos logit contributions | |
augmented | +1.137 |
asses | +1.114 |
offending | +1.106 |
ingle | +1.056 |
routed | +1.051 |
Neg logit contributions | |
ulia | -1.504 |
cott | -1.482 |
icas | -1.355 |
tsky | -1.317 |
kamp | -1.287 |
Token | oured |
Token ID | 8167 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
asses | +2.122 |
augmented | +2.079 |
offending | +2.049 |
ingle | +1.992 |
disse | +1.945 |
Neg logit contributions | |
ulia | -2.585 |
cott | -2.526 |
icas | -2.312 |
tsky | -2.292 |
kamp | -2.182 |
Token | Master |
Token ID | 5599 |
Feature activation | +7.44e-01 |
Pos logit contributions | |
augmented | +0.431 |
asses | +0.425 |
offending | +0.418 |
ingle | +0.404 |
routed | +0.400 |
Neg logit contributions | |
ulia | -0.566 |
cott | -0.558 |
icas | -0.508 |
tsky | -0.494 |
kamp | -0.484 |
Token | , |
Token ID | 11 |
Feature activation | +5.89e-01 |
Pos logit contributions | |
augmented | +1.664 |
asses | +1.648 |
offending | +1.620 |
ingle | +1.570 |
disse | +1.536 |
Neg logit contributions | |
ulia | -2.161 |
cott | -2.125 |
icas | -1.942 |
tsky | -1.884 |
kamp | -1.833 |
Token | accept |
Token ID | 2453 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
augmented | +1.363 |
asses | +1.336 |
offending | +1.325 |
ingle | +1.278 |
routed | +1.264 |
Neg logit contributions | |
ulia | -1.685 |
cott | -1.660 |
icas | -1.512 |
tsky | -1.469 |
kamp | -1.436 |
Token | this |
Token ID | 428 |
Feature activation | +6.08e-01 |
Pos logit contributions | |
augmented | +0.593 |
asses | +0.581 |
offending | +0.578 |
ingle | +0.556 |
routed | +0.550 |
Neg logit contributions | |
ulia | -0.704 |
cott | -0.695 |
icas | -0.632 |
tsky | -0.613 |
kamp | -0.600 |
Token | the |
Token ID | 262 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
ulia | +0.976 |
cott | +0.962 |
icas | +0.868 |
tsky | +0.841 |
kamp | +0.823 |
Neg logit contributions | |
augmented | -0.898 |
asses | -0.885 |
offending | -0.873 |
ingle | -0.848 |
routed | -0.839 |
Token | red |
Token ID | 2266 |
Feature activation | -3.90e-01 |
Pos logit contributions | |
ulia | +0.648 |
cott | +0.640 |
icas | +0.585 |
tsky | +0.570 |
kamp | +0.558 |
Neg logit contributions | |
augmented | -0.434 |
asses | -0.430 |
offending | -0.415 |
ingle | -0.408 |
routed | -0.400 |
Token | lines |
Token ID | 3951 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
ulia | +1.190 |
cott | +1.174 |
icas | +1.074 |
tsky | +1.044 |
kamp | +1.023 |
Neg logit contributions | |
augmented | -0.826 |
asses | -0.811 |
offending | -0.797 |
ingle | -0.771 |
routed | -0.761 |
Token | under |
Token ID | 739 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
ulia | +0.702 |
cott | +0.692 |
icas | +0.628 |
tsky | +0.615 |
kamp | +0.598 |
Neg logit contributions | |
augmented | -0.539 |
asses | -0.536 |
offending | -0.521 |
ingle | -0.506 |
disse | -0.500 |
Token | the |
Token ID | 262 |
Feature activation | -1.16e-03 |
Pos logit contributions | |
ulia | +0.707 |
cott | +0.695 |
icas | +0.626 |
tsky | +0.605 |
kamp | +0.592 |
Neg logit contributions | |
augmented | -0.697 |
asses | -0.686 |
offending | -0.680 |
ingle | -0.658 |
routed | -0.652 |
Token | word |
Token ID | 1573 |
Feature activation | +9.59e-01 |
Pos logit contributions | |
ulia | +0.004 |
cott | +0.003 |
icas | +0.003 |
tsky | +0.003 |
kamp | +0.003 |
Neg logit contributions | |
augmented | -0.002 |
asses | -0.002 |
offending | -0.002 |
ingle | -0.002 |
routed | -0.002 |
Token | " |
Token ID | 366 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
augmented | +2.247 |
offending | +2.197 |
asses | +2.180 |
ingle | +2.081 |
routed | +2.057 |
Neg logit contributions | |
ulia | -2.714 |
cott | -2.657 |
icas | -2.451 |
kamp | -2.332 |
tsky | -2.330 |
Token | custom |
Token ID | 23144 |
Feature activation | +2.17e-01 |
Pos logit contributions | |
augmented | +0.056 |
asses | +0.056 |
offending | +0.055 |
ingle | +0.053 |
routed | +0.052 |
Neg logit contributions | |
ulia | -0.060 |
cott | -0.059 |
icas | -0.054 |
tsky | -0.052 |
kamp | -0.051 |
Token | ize |
Token ID | 1096 |
Feature activation | +3.49e-01 |
Pos logit contributions | |
augmented | +0.455 |
asses | +0.441 |
offending | +0.441 |
ingle | +0.424 |
routed | +0.417 |
Neg logit contributions | |
ulia | -0.667 |
cott | -0.658 |
icas | -0.601 |
tsky | -0.589 |
kamp | -0.581 |
Token | " |
Token ID | 1 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
augmented | +0.712 |
asses | +0.690 |
offending | +0.690 |
ingle | +0.660 |
routed | +0.652 |
Neg logit contributions | |
ulia | -1.094 |
cott | -1.080 |
icas | -0.993 |
tsky | -0.968 |
kamp | -0.954 |
Token | disappear |
Token ID | 10921 |
Feature activation | +5.17e-03 |
Pos logit contributions | |
ulia | +1.207 |
cott | +1.189 |
icas | +1.077 |
tsky | +1.055 |
kamp | +1.026 |
Neg logit contributions | |
augmented | -0.965 |
asses | -0.963 |
offending | -0.939 |
ingle | -0.913 |
disse | -0.901 |
Token | If |
Token ID | 1532 |
Feature activation | +6.53e-02 |
Pos logit contributions | |
augmented | +0.058 |
asses | +0.058 |
offending | +0.056 |
ingle | +0.055 |
routed | +0.054 |
Neg logit contributions | |
ulia | -0.059 |
cott | -0.058 |
icas | -0.052 |
tsky | -0.051 |
kamp | -0.049 |
Token | Matthew |
Token ID | 9308 |
Feature activation | +4.54e-01 |
Pos logit contributions | |
augmented | +0.137 |
asses | +0.134 |
offending | +0.132 |
ingle | +0.127 |
routed | +0.126 |
Neg logit contributions | |
ulia | -0.201 |
cott | -0.199 |
icas | -0.182 |
tsky | -0.177 |
kamp | -0.175 |
Token | directly |
Token ID | 3264 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
augmented | +1.099 |
asses | +1.079 |
offending | +1.067 |
ingle | +1.025 |
routed | +1.022 |
Neg logit contributions | |
ulia | -1.253 |
cott | -1.233 |
icas | -1.119 |
tsky | -1.085 |
kamp | -1.060 |
Token | impacts |
Token ID | 12751 |
Feature activation | +5.44e-03 |
Pos logit contributions | |
augmented | +0.980 |
asses | +0.962 |
offending | +0.949 |
ingle | +0.913 |
routed | +0.907 |
Neg logit contributions | |
ulia | -1.319 |
cott | -1.297 |
icas | -1.186 |
tsky | -1.153 |
kamp | -1.128 |
Token | Florida |
Token ID | 4744 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
augmented | +0.013 |
asses | +0.013 |
offending | +0.013 |
ingle | +0.012 |
routed | +0.012 |
Neg logit contributions | |
ulia | -0.015 |
cott | -0.015 |
icas | -0.013 |
tsky | -0.013 |
kamp | -0.013 |
Token | ," |
Token ID | 553 |
Feature activation | +9.81e-01 |
Pos logit contributions | |
augmented | +0.742 |
asses | +0.726 |
offending | +0.721 |
ingle | +0.693 |
routed | +0.686 |
Neg logit contributions | |
ulia | -0.908 |
cott | -0.905 |
icas | -0.811 |
tsky | -0.795 |
kamp | -0.771 |
Token | he |
Token ID | 339 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
augmented | +2.416 |
offending | +2.337 |
asses | +2.323 |
routed | +2.242 |
ingle | +2.227 |
Neg logit contributions | |
ulia | -2.659 |
cott | -2.600 |
icas | -2.357 |
tsky | -2.289 |
doms | -2.234 |
Token | said |
Token ID | 531 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
ulia | +0.243 |
cott | +0.238 |
icas | +0.210 |
tsky | +0.202 |
kamp | +0.196 |
Neg logit contributions | |
augmented | -0.319 |
asses | -0.314 |
offending | -0.311 |
ingle | -0.303 |
routed | -0.301 |
Token | , |
Token ID | 11 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
ulia | +0.368 |
cott | +0.362 |
icas | +0.330 |
tsky | +0.321 |
kamp | +0.312 |
Neg logit contributions | |
augmented | -0.298 |
asses | -0.292 |
offending | -0.289 |
ingle | -0.278 |
routed | -0.276 |
Token | " |
Token ID | 366 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
augmented | +0.259 |
asses | +0.254 |
offending | +0.253 |
ingle | +0.241 |
routed | +0.240 |
Neg logit contributions | |
ulia | -0.357 |
cott | -0.354 |
icas | -0.322 |
tsky | -0.317 |
kamp | -0.310 |
Token | there |
Token ID | 8117 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
augmented | +0.570 |
asses | +0.568 |
offending | +0.554 |
ingle | +0.542 |
routed | +0.531 |
Neg logit contributions | |
ulia | -0.638 |
cott | -0.627 |
icas | -0.571 |
tsky | -0.561 |
kamp | -0.541 |
Token | � |
Token ID | 447 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
augmented | +1.354 |
asses | +1.332 |
offending | +1.325 |
routed | +1.267 |
disse | +1.265 |
Neg logit contributions | |
ulia | -1.535 |
cott | -1.515 |
icas | -1.370 |
tsky | -1.337 |
kamp | -1.299 |
Token | � |
Token ID | 247 |
Feature activation | +2.73e-01 |
Pos logit contributions | |
augmented | +1.135 |
asses | +1.109 |
offending | +1.083 |
ingle | +1.072 |
routed | +1.052 |
Neg logit contributions | |
ulia | -1.499 |
cott | -1.476 |
icas | -1.340 |
tsky | -1.313 |
doms | -1.294 |
Token | s |
Token ID | 82 |
Feature activation | +3.39e-01 |
Pos logit contributions | |
augmented | +0.618 |
asses | +0.606 |
offending | +0.592 |
ingle | +0.575 |
routed | +0.568 |
Neg logit contributions | |
ulia | -0.789 |
cott | -0.774 |
icas | -0.715 |
tsky | -0.690 |
kamp | -0.677 |
Token | glaciers |
Token ID | 40509 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
augmented | +0.756 |
asses | +0.741 |
offending | +0.731 |
ingle | +0.703 |
routed | +0.693 |
Neg logit contributions | |
ulia | -1.000 |
cott | -0.982 |
icas | -0.905 |
tsky | -0.880 |
kamp | -0.862 |
Token | are |
Token ID | 389 |
Feature activation | +1.86e-01 |
Pos logit contributions | |
augmented | +0.599 |
asses | +0.586 |
offending | +0.577 |
ingle | +0.560 |
routed | +0.557 |
Neg logit contributions | |
ulia | -0.748 |
cott | -0.737 |
icas | -0.673 |
tsky | -0.650 |
kamp | -0.639 |
Token | now |
Token ID | 783 |
Feature activation | +9.39e-01 |
Pos logit contributions | |
augmented | +0.415 |
asses | +0.405 |
offending | +0.402 |
routed | +0.385 |
ingle | +0.382 |
Neg logit contributions | |
ulia | -0.553 |
cott | -0.545 |
icas | -0.499 |
tsky | -0.485 |
kamp | -0.479 |
Token | losing |
Token ID | 6078 |
Feature activation | +3.48e-02 |
Pos logit contributions | |
augmented | +2.076 |
offending | +2.002 |
asses | +1.999 |
routed | +1.909 |
ingle | +1.883 |
Neg logit contributions | |
ulia | -2.808 |
cott | -2.749 |
icas | -2.536 |
tsky | -2.473 |
kamp | -2.452 |
Token | 75 |
Token ID | 5441 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
augmented | +0.080 |
asses | +0.079 |
offending | +0.077 |
ingle | +0.075 |
routed | +0.074 |
Neg logit contributions | |
ulia | -0.100 |
cott | -0.099 |
icas | -0.090 |
tsky | -0.087 |
kamp | -0.086 |
Token | billion |
Token ID | 2997 |
Feature activation | +4.35e-01 |
Pos logit contributions | |
ulia | +0.279 |
cott | +0.273 |
icas | +0.243 |
tsky | +0.237 |
kamp | +0.231 |
Neg logit contributions | |
augmented | -0.318 |
asses | -0.315 |
offending | -0.309 |
ingle | -0.301 |
routed | -0.298 |
Token | tons |
Token ID | 10860 |
Feature activation | +2.42e-01 |
Pos logit contributions | |
augmented | +1.016 |
asses | +1.009 |
offending | +0.981 |
ingle | +0.942 |
routed | +0.936 |
Neg logit contributions | |
ulia | -1.253 |
cott | -1.237 |
icas | -1.113 |
tsky | -1.081 |
kamp | -1.069 |
Token | of |
Token ID | 286 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
augmented | +0.543 |
asses | +0.537 |
offending | +0.522 |
ingle | +0.507 |
routed | +0.501 |
Neg logit contributions | |
ulia | -0.715 |
cott | -0.703 |
icas | -0.640 |
tsky | -0.622 |
kamp | -0.608 |
Token | . |
Token ID | 13 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
ulia | +0.464 |
cott | +0.459 |
icas | +0.414 |
tsky | +0.402 |
kamp | +0.393 |
Neg logit contributions | |
augmented | -0.415 |
asses | -0.407 |
offending | -0.404 |
ingle | -0.390 |
routed | -0.387 |
Token | Instead |
Token ID | 5455 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
augmented | +0.277 |
asses | +0.274 |
offending | +0.269 |
ingle | +0.263 |
routed | +0.260 |
Neg logit contributions | |
ulia | -0.247 |
cott | -0.242 |
icas | -0.217 |
tsky | -0.209 |
kamp | -0.204 |
Token | , |
Token ID | 11 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
augmented | +1.085 |
offending | +1.063 |
asses | +1.063 |
ingle | +1.005 |
routed | +1.001 |
Neg logit contributions | |
ulia | -1.622 |
cott | -1.602 |
icas | -1.459 |
tsky | -1.424 |
kamp | -1.398 |
Token | the |
Token ID | 262 |
Feature activation | +8.07e-02 |
Pos logit contributions | |
augmented | +0.677 |
asses | +0.660 |
offending | +0.659 |
ingle | +0.633 |
routed | +0.629 |
Neg logit contributions | |
ulia | -0.788 |
cott | -0.779 |
icas | -0.705 |
tsky | -0.683 |
kamp | -0.670 |
Token | failures |
Token ID | 15536 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
augmented | +0.174 |
asses | +0.170 |
offending | +0.169 |
ingle | +0.162 |
routed | +0.160 |
Neg logit contributions | |
ulia | -0.244 |
cott | -0.241 |
icas | -0.220 |
tsky | -0.214 |
kamp | -0.210 |
Token | seem |
Token ID | 1283 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
augmented | +0.261 |
asses | +0.255 |
offending | +0.252 |
ingle | +0.243 |
routed | +0.241 |
Neg logit contributions | |
ulia | -0.335 |
cott | -0.331 |
icas | -0.301 |
tsky | -0.292 |
kamp | -0.286 |
Token | to |
Token ID | 284 |
Feature activation | -5.51e-02 |
Pos logit contributions | |
augmented | +0.719 |
offending | +0.684 |
asses | +0.683 |
routed | +0.669 |
ingle | +0.650 |
Neg logit contributions | |
ulia | -0.955 |
cott | -0.935 |
icas | -0.861 |
tsky | -0.838 |
kamp | -0.817 |
Token | be |
Token ID | 307 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
ulia | +0.160 |
cott | +0.158 |
icas | +0.144 |
tsky | +0.139 |
kamp | +0.136 |
Neg logit contributions | |
augmented | -0.126 |
asses | -0.123 |
offending | -0.122 |
ingle | -0.118 |
routed | -0.116 |
Token | much |
Token ID | 881 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
ulia | +1.333 |
cott | +1.317 |
icas | +1.203 |
tsky | +1.169 |
kamp | +1.146 |
Neg logit contributions | |
augmented | -0.939 |
asses | -0.930 |
offending | -0.911 |
ingle | -0.884 |
routed | -0.866 |
Token | more |
Token ID | 517 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
augmented | +0.405 |
asses | +0.391 |
offending | +0.387 |
routed | +0.374 |
ingle | +0.373 |
Neg logit contributions | |
ulia | -0.560 |
cott | -0.549 |
icas | -0.505 |
tsky | -0.490 |
kamp | -0.481 |
Token | and |
Token ID | 290 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
augmented | +0.299 |
asses | +0.288 |
offending | +0.287 |
routed | +0.276 |
ingle | +0.274 |
Neg logit contributions | |
ulia | -0.472 |
cott | -0.462 |
icas | -0.428 |
tsky | -0.415 |
kamp | -0.408 |
Token | er |
Token ID | 263 |
Feature activation | -9.85e-01 |
Pos logit contributions | |
augmented | +0.932 |
asses | +0.932 |
offending | +0.910 |
ingle | +0.886 |
routed | +0.868 |
Neg logit contributions | |
ulia | -1.134 |
cott | -1.104 |
icas | -1.008 |
tsky | -0.986 |
kamp | -0.958 |
Token | Podcast |
Token ID | 16036 |
Feature activation | +9.37e-02 |
Pos logit contributions | |
ulia | +2.639 |
cott | +2.634 |
icas | +2.362 |
tsky | +2.274 |
kamp | +2.236 |
Neg logit contributions | |
augmented | -2.399 |
asses | -2.367 |
offending | -2.334 |
ingle | -2.275 |
routed | -2.236 |
Token | , |
Token ID | 11 |
Feature activation | +2.02e-01 |
Pos logit contributions | |
augmented | +0.217 |
asses | +0.213 |
offending | +0.210 |
ingle | +0.204 |
routed | +0.201 |
Neg logit contributions | |
ulia | -0.268 |
cott | -0.264 |
icas | -0.240 |
tsky | -0.233 |
kamp | -0.228 |
Token | I |
Token ID | 314 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
augmented | +0.475 |
asses | +0.462 |
offending | +0.457 |
ingle | +0.442 |
routed | +0.438 |
Neg logit contributions | |
ulia | -0.575 |
cott | -0.569 |
icas | -0.516 |
tsky | -0.501 |
kamp | -0.492 |
Token | � |
Token ID | 447 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
augmented | +0.489 |
asses | +0.480 |
offending | +0.472 |
ingle | +0.457 |
routed | +0.451 |
Neg logit contributions | |
ulia | -0.690 |
cott | -0.681 |
icas | -0.623 |
tsky | -0.605 |
kamp | -0.594 |
Token | � |
Token ID | 247 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
augmented | +0.253 |
asses | +0.248 |
offending | +0.244 |
ingle | +0.237 |
routed | +0.234 |
Neg logit contributions | |
ulia | -0.370 |
cott | -0.365 |
icas | -0.334 |
tsky | -0.325 |
kamp | -0.318 |
Token | m |
Token ID | 76 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
augmented | +0.573 |
asses | +0.565 |
offending | +0.553 |
ingle | +0.545 |
routed | +0.535 |
Neg logit contributions | |
ulia | -0.584 |
cott | -0.575 |
icas | -0.522 |
tsky | -0.505 |
kamp | -0.489 |
Token | joined |
Token ID | 5399 |
Feature activation | -4.49e-01 |
Pos logit contributions | |
ulia | +0.576 |
cott | +0.568 |
icas | +0.517 |
tsky | +0.503 |
kamp | +0.492 |
Neg logit contributions | |
augmented | -0.436 |
asses | -0.429 |
offending | -0.422 |
ingle | -0.407 |
routed | -0.402 |
Token | by |
Token ID | 416 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
ulia | +1.090 |
cott | +1.079 |
icas | +0.959 |
tsky | +0.927 |
kamp | +0.902 |
Neg logit contributions | |
augmented | -1.237 |
asses | -1.221 |
offending | -1.199 |
ingle | -1.172 |
routed | -1.157 |
Token | Will |
Token ID | 2561 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
augmented | +0.285 |
asses | +0.278 |
offending | +0.275 |
ingle | +0.265 |
routed | +0.262 |
Neg logit contributions | |
ulia | -0.334 |
cott | -0.330 |
icas | -0.299 |
tsky | -0.289 |
kamp | -0.284 |
Token | Lar |
Token ID | 25577 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
ulia | +0.450 |
cott | +0.442 |
icas | +0.400 |
tsky | +0.387 |
kamp | +0.378 |
Neg logit contributions | |
augmented | -0.410 |
asses | -0.406 |
offending | -0.398 |
ingle | -0.389 |
routed | -0.381 |
Token | unfolded |
Token ID | 34660 |
Feature activation | -2.61e-02 |
Pos logit contributions | |
ulia | +0.226 |
cott | +0.223 |
icas | +0.203 |
tsky | +0.197 |
kamp | +0.193 |
Neg logit contributions | |
augmented | -0.181 |
asses | -0.178 |
offending | -0.175 |
ingle | -0.170 |
routed | -0.168 |
Token | the |
Token ID | 262 |
Feature activation | -5.32e-02 |
Pos logit contributions | |
ulia | +0.067 |
cott | +0.066 |
icas | +0.059 |
tsky | +0.057 |
kamp | +0.056 |
Neg logit contributions | |
augmented | -0.069 |
asses | -0.067 |
offending | -0.067 |
ingle | -0.065 |
routed | -0.064 |
Token | wings |
Token ID | 12098 |
Feature activation | -4.39e-03 |
Pos logit contributions | |
ulia | +0.162 |
cott | +0.160 |
icas | +0.146 |
tsky | +0.143 |
kamp | +0.140 |
Neg logit contributions | |
augmented | -0.113 |
asses | -0.111 |
offending | -0.110 |
ingle | -0.105 |
routed | -0.104 |
Token | . |
Token ID | 13 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
ulia | +0.013 |
cott | +0.013 |
icas | +0.012 |
tsky | +0.011 |
kamp | +0.011 |
Neg logit contributions | |
augmented | -0.010 |
asses | -0.010 |
offending | -0.009 |
ingle | -0.009 |
routed | -0.009 |
Token | After |
Token ID | 2293 |
Feature activation | +2.54e-02 |
Pos logit contributions | |
augmented | +0.352 |
asses | +0.348 |
offending | +0.342 |
ingle | +0.334 |
routed | +0.331 |
Neg logit contributions | |
ulia | -0.318 |
cott | -0.314 |
icas | -0.281 |
tsky | -0.270 |
kamp | -0.263 |
Token | all |
Token ID | 477 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
augmented | +0.061 |
asses | +0.060 |
offending | +0.059 |
ingle | +0.057 |
routed | +0.057 |
Neg logit contributions | |
ulia | -0.070 |
cott | -0.069 |
icas | -0.063 |
tsky | -0.061 |
kamp | -0.060 |
Token | , |
Token ID | 11 |
Feature activation | -3.08e-02 |
Pos logit contributions | |
augmented | +0.494 |
asses | +0.483 |
offending | +0.478 |
routed | +0.457 |
ingle | +0.455 |
Neg logit contributions | |
ulia | -0.611 |
cott | -0.605 |
icas | -0.549 |
tsky | -0.531 |
kamp | -0.523 |
Token | I |
Token ID | 314 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
ulia | +0.083 |
cott | +0.082 |
icas | +0.074 |
tsky | +0.071 |
kamp | +0.070 |
Neg logit contributions | |
augmented | -0.076 |
asses | -0.075 |
offending | -0.074 |
ingle | -0.072 |
routed | -0.071 |
Token | always |
Token ID | 1464 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
augmented | +0.380 |
asses | +0.373 |
offending | +0.368 |
ingle | +0.356 |
routed | +0.353 |
Neg logit contributions | |
ulia | -0.459 |
cott | -0.453 |
icas | -0.411 |
tsky | -0.398 |
kamp | -0.390 |
Token | unfold |
Token ID | 16631 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
ulia | +0.350 |
cott | +0.345 |
icas | +0.313 |
tsky | +0.305 |
kamp | +0.298 |
Neg logit contributions | |
augmented | -0.279 |
asses | -0.277 |
offending | -0.272 |
ingle | -0.264 |
routed | -0.259 |
Token | the |
Token ID | 262 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
augmented | +0.333 |
asses | +0.327 |
offending | +0.325 |
routed | +0.311 |
ingle | +0.311 |
Neg logit contributions | |
ulia | -0.346 |
cott | -0.338 |
icas | -0.305 |
tsky | -0.296 |
kamp | -0.288 |
Token | him |
Token ID | 683 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
ulia | +0.201 |
cott | +0.198 |
icas | +0.181 |
tsky | +0.175 |
kamp | +0.171 |
Neg logit contributions | |
augmented | -0.151 |
asses | -0.149 |
offending | -0.146 |
ingle | -0.141 |
routed | -0.140 |
Token | in |
Token ID | 287 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
augmented | +0.349 |
asses | +0.340 |
offending | +0.337 |
ingle | +0.324 |
routed | +0.322 |
Neg logit contributions | |
ulia | -0.434 |
cott | -0.427 |
icas | -0.390 |
tsky | -0.375 |
doms | -0.368 |
Token | the |
Token ID | 262 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
augmented | +0.231 |
asses | +0.225 |
offending | +0.223 |
ingle | +0.215 |
routed | +0.214 |
Neg logit contributions | |
ulia | -0.298 |
cott | -0.294 |
icas | -0.267 |
tsky | -0.259 |
kamp | -0.253 |
Token | past |
Token ID | 1613 |
Feature activation | +2.84e-01 |
Pos logit contributions | |
ulia | +0.053 |
cott | +0.053 |
icas | +0.049 |
tsky | +0.048 |
kamp | +0.047 |
Neg logit contributions | |
augmented | -0.025 |
asses | -0.025 |
offending | -0.024 |
ingle | -0.023 |
routed | -0.023 |
Token | but |
Token ID | 475 |
Feature activation | -1.42e-01 |
Pos logit contributions | |
augmented | +0.688 |
asses | +0.672 |
offending | +0.665 |
ingle | +0.640 |
routed | +0.636 |
Neg logit contributions | |
ulia | -0.788 |
cott | -0.774 |
icas | -0.708 |
tsky | -0.678 |
doms | -0.666 |
Token | he |
Token ID | 339 |
Feature activation | +9.75e-02 |
Pos logit contributions | |
ulia | +0.402 |
cott | +0.396 |
icas | +0.359 |
tsky | +0.349 |
kamp | +0.342 |
Neg logit contributions | |
augmented | -0.332 |
asses | -0.326 |
offending | -0.321 |
ingle | -0.311 |
routed | -0.308 |
Token | said |
Token ID | 531 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
augmented | +0.234 |
asses | +0.229 |
offending | +0.226 |
ingle | +0.219 |
routed | +0.218 |
Neg logit contributions | |
ulia | -0.271 |
cott | -0.267 |
icas | -0.242 |
tsky | -0.234 |
kamp | -0.229 |
Token | he |
Token ID | 339 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
ulia | +0.477 |
cott | +0.468 |
icas | +0.426 |
tsky | +0.413 |
kamp | +0.405 |
Neg logit contributions | |
augmented | -0.384 |
asses | -0.377 |
offending | -0.372 |
ingle | -0.359 |
routed | -0.356 |
Token | was |
Token ID | 373 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
augmented | +0.314 |
asses | +0.308 |
offending | +0.304 |
ingle | +0.293 |
routed | +0.292 |
Neg logit contributions | |
ulia | -0.392 |
cott | -0.386 |
icas | -0.352 |
tsky | -0.340 |
kamp | -0.334 |
Token | too |
Token ID | 1165 |
Feature activation | +8.48e-02 |
Pos logit contributions | |
ulia | +0.572 |
cott | +0.565 |
icas | +0.514 |
tsky | +0.500 |
kamp | +0.490 |
Neg logit contributions | |
augmented | -0.433 |
asses | -0.426 |
offending | -0.419 |
ingle | -0.407 |
routed | -0.401 |
Token | young |
Token ID | 1862 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
augmented | +0.171 |
asses | +0.168 |
offending | +0.165 |
ingle | +0.159 |
routed | +0.158 |
Neg logit contributions | |
ulia | -0.268 |
cott | -0.264 |
icas | -0.243 |
tsky | -0.236 |
kamp | -0.232 |
Token | to |
Token ID | 284 |
Feature activation | +3.88e-02 |
Pos logit contributions | |
augmented | +1.015 |
asses | +0.984 |
offending | +0.978 |
ingle | +0.942 |
routed | +0.929 |
Neg logit contributions | |
ulia | -1.281 |
cott | -1.258 |
icas | -1.145 |
tsky | -1.116 |
kamp | -1.086 |
Token | be |
Token ID | 307 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
augmented | +0.083 |
asses | +0.082 |
offending | +0.081 |
ingle | +0.078 |
routed | +0.078 |
Neg logit contributions | |
ulia | -0.116 |
cott | -0.114 |
icas | -0.105 |
tsky | -0.102 |
kamp | -0.100 |
Token | perceived |
Token ID | 11067 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
ulia | +0.047 |
cott | +0.046 |
icas | +0.043 |
tsky | +0.041 |
kamp | +0.041 |
Neg logit contributions | |
asses | -0.028 |
augmented | -0.028 |
offending | -0.027 |
ingle | -0.026 |
routed | -0.025 |
Token | as |
Token ID | 355 |
Feature activation | -3.50e-02 |
Pos logit contributions | |
ulia | +1.080 |
cott | +1.067 |
icas | +0.977 |
tsky | +0.948 |
kamp | +0.933 |
Neg logit contributions | |
augmented | -0.763 |
asses | -0.754 |
offending | -0.741 |
ingle | -0.720 |
routed | -0.708 |
Token | such |
Token ID | 884 |
Feature activation | +1.37e-02 |
Pos logit contributions | |
ulia | +0.114 |
cott | +0.113 |
icas | +0.104 |
tsky | +0.101 |
kamp | +0.100 |
Neg logit contributions | |
augmented | -0.066 |
asses | -0.065 |
offending | -0.063 |
ingle | -0.061 |
routed | -0.060 |
Token | socially |
Token ID | 18118 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
augmented | +0.034 |
asses | +0.033 |
offending | +0.033 |
ingle | +0.032 |
routed | +0.032 |
Neg logit contributions | |
ulia | -0.037 |
cott | -0.036 |
icas | -0.033 |
tsky | -0.032 |
kamp | -0.031 |
Token | ( |
Token ID | 357 |
Feature activation | -7.09e-02 |
Pos logit contributions | |
augmented | +0.840 |
asses | +0.826 |
offending | +0.816 |
ingle | +0.786 |
routed | +0.776 |
Neg logit contributions | |
ulia | -0.935 |
cott | -0.919 |
icas | -0.834 |
tsky | -0.802 |
doms | -0.785 |
Token | including |
Token ID | 8201 |
Feature activation | +4.17e-02 |
Pos logit contributions | |
ulia | +0.206 |
cott | +0.203 |
icas | +0.185 |
tsky | +0.180 |
kamp | +0.176 |
Neg logit contributions | |
augmented | -0.161 |
asses | -0.159 |
offending | -0.156 |
ingle | -0.151 |
routed | -0.149 |
Token | the |
Token ID | 262 |
Feature activation | -6.47e-02 |
Pos logit contributions | |
augmented | +0.091 |
asses | +0.090 |
offending | +0.088 |
ingle | +0.085 |
routed | +0.084 |
Neg logit contributions | |
ulia | -0.125 |
cott | -0.123 |
icas | -0.112 |
tsky | -0.109 |
kamp | -0.107 |
Token | use |
Token ID | 779 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
ulia | +0.204 |
cott | +0.201 |
icas | +0.185 |
tsky | +0.180 |
kamp | +0.177 |
Neg logit contributions | |
augmented | -0.130 |
asses | -0.128 |
offending | -0.126 |
ingle | -0.121 |
routed | -0.120 |
Token | of |
Token ID | 286 |
Feature activation | -1.58e-02 |
Pos logit contributions | |
augmented | +0.604 |
asses | +0.593 |
offending | +0.583 |
ingle | +0.563 |
routed | +0.555 |
Neg logit contributions | |
ulia | -0.852 |
cott | -0.839 |
icas | -0.764 |
tsky | -0.743 |
kamp | -0.728 |
Token | was |
Token ID | 373 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
ulia | +0.464 |
cott | +0.458 |
icas | +0.415 |
tsky | +0.402 |
kamp | +0.393 |
Neg logit contributions | |
augmented | -0.389 |
asses | -0.382 |
offending | -0.377 |
ingle | -0.364 |
routed | -0.363 |
Token | ok |
Token ID | 12876 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
ulia | +1.344 |
cott | +1.328 |
icas | +1.210 |
tsky | +1.173 |
kamp | +1.150 |
Neg logit contributions | |
augmented | -1.070 |
asses | -1.056 |
offending | -1.037 |
ingle | -1.012 |
disse | -0.990 |
Token | , |
Token ID | 11 |
Feature activation | +3.87e-02 |
Pos logit contributions | |
ulia | +0.394 |
cott | +0.390 |
icas | +0.351 |
tsky | +0.340 |
doms | +0.333 |
Neg logit contributions | |
augmented | -0.355 |
asses | -0.349 |
offending | -0.344 |
ingle | -0.333 |
routed | -0.332 |
Token | a |
Token ID | 257 |
Feature activation | +1.93e-02 |
Pos logit contributions | |
augmented | +0.102 |
asses | +0.100 |
offending | +0.099 |
routed | +0.096 |
ingle | +0.095 |
Neg logit contributions | |
ulia | -0.099 |
cott | -0.098 |
icas | -0.088 |
tsky | -0.085 |
doms | -0.083 |
Token | quick |
Token ID | 2068 |
Feature activation | -9.17e-02 |
Pos logit contributions | |
augmented | +0.038 |
asses | +0.038 |
offending | +0.037 |
ingle | +0.036 |
routed | +0.035 |
Neg logit contributions | |
ulia | -0.061 |
cott | -0.061 |
icas | -0.056 |
tsky | -0.054 |
kamp | -0.053 |
Token | search |
Token ID | 2989 |
Feature activation | +4.92e-03 |
Pos logit contributions | |
ulia | +0.283 |
cott | +0.279 |
icas | +0.255 |
tsky | +0.248 |
kamp | +0.243 |
Neg logit contributions | |
augmented | -0.193 |
asses | -0.189 |
offending | -0.186 |
ingle | -0.179 |
routed | -0.178 |
Token | revealed |
Token ID | 4602 |
Feature activation | -7.82e-02 |
Pos logit contributions | |
augmented | +0.011 |
asses | +0.010 |
offending | +0.010 |
ingle | +0.010 |
routed | +0.010 |
Neg logit contributions | |
ulia | -0.015 |
cott | -0.015 |
icas | -0.013 |
tsky | -0.013 |
kamp | -0.013 |
Token | that |
Token ID | 326 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
ulia | +0.233 |
cott | +0.230 |
icas | +0.209 |
tsky | +0.204 |
kamp | +0.200 |
Neg logit contributions | |
augmented | -0.172 |
asses | -0.169 |
offending | -0.167 |
ingle | -0.161 |
routed | -0.160 |
Token | they |
Token ID | 484 |
Feature activation | +8.95e-03 |
Pos logit contributions | |
ulia | +0.358 |
cott | +0.353 |
icas | +0.320 |
tsky | +0.310 |
kamp | +0.304 |
Neg logit contributions | |
augmented | -0.302 |
asses | -0.297 |
offending | -0.293 |
ingle | -0.283 |
routed | -0.281 |
Token | had |
Token ID | 550 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
augmented | +0.021 |
asses | +0.020 |
offending | +0.020 |
routed | +0.019 |
ingle | +0.019 |
Neg logit contributions | |
ulia | -0.026 |
cott | -0.025 |
icas | -0.023 |
tsky | -0.022 |
doms | -0.022 |
Token | been |
Token ID | 587 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
ulia | +0.423 |
cott | +0.417 |
icas | +0.379 |
tsky | +0.368 |
kamp | +0.361 |
Neg logit contributions | |
augmented | -0.338 |
asses | -0.332 |
offending | -0.328 |
ingle | -0.317 |
routed | -0.315 |
Token | impact |
Token ID | 2928 |
Feature activation | +8.90e-02 |
Pos logit contributions | |
augmented | +0.596 |
asses | +0.583 |
offending | +0.580 |
ingle | +0.556 |
routed | +0.549 |
Neg logit contributions | |
ulia | -0.736 |
cott | -0.723 |
icas | -0.660 |
tsky | -0.638 |
doms | -0.625 |
Token | group |
Token ID | 1448 |
Feature activation | +3.24e-02 |
Pos logit contributions | |
augmented | +0.193 |
asses | +0.189 |
offending | +0.187 |
ingle | +0.179 |
routed | +0.178 |
Neg logit contributions | |
ulia | -0.269 |
cott | -0.265 |
icas | -0.243 |
tsky | -0.236 |
kamp | -0.231 |
Token | . |
Token ID | 13 |
Feature activation | -2.28e-02 |
Pos logit contributions | |
augmented | +0.076 |
asses | +0.074 |
offending | +0.073 |
ingle | +0.071 |
routed | +0.070 |
Neg logit contributions | |
ulia | -0.092 |
cott | -0.091 |
icas | -0.083 |
tsky | -0.080 |
kamp | -0.078 |
Token | � |
Token ID | 447 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
ulia | +0.055 |
cott | +0.054 |
icas | +0.049 |
tsky | +0.047 |
kamp | +0.046 |
Neg logit contributions | |
augmented | -0.063 |
asses | -0.062 |
offending | -0.061 |
ingle | -0.059 |
routed | -0.059 |
Token | � |
Token ID | 247 |
Feature activation | -7.88e-02 |
Pos logit contributions | |
ulia | +0.349 |
cott | +0.346 |
icas | +0.318 |
tsky | +0.309 |
kamp | +0.303 |
Neg logit contributions | |
augmented | -0.210 |
asses | -0.205 |
offending | -0.202 |
ingle | -0.195 |
routed | -0.193 |
Token | � |
Token ID | 447 |
Feature activation | -3.08e-01 |
Pos logit contributions | |
ulia | +0.204 |
cott | +0.201 |
icas | +0.182 |
tsky | +0.174 |
doms | +0.171 |
Neg logit contributions | |
augmented | -0.203 |
asses | -0.200 |
offending | -0.197 |
ingle | -0.191 |
routed | -0.190 |
Token | � |
Token ID | 251 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
ulia | +0.968 |
cott | +0.956 |
icas | +0.877 |
tsky | +0.852 |
kamp | +0.836 |
Neg logit contributions | |
augmented | -0.627 |
asses | -0.616 |
offending | -0.605 |
ingle | -0.585 |
routed | -0.577 |
Token |
|
Token ID | 198 |
Feature activation | +9.64e-03 |
Pos logit contributions | |
ulia | +0.757 |
cott | +0.745 |
icas | +0.672 |
tsky | +0.648 |
kamp | +0.634 |
Neg logit contributions | |
augmented | -0.743 |
asses | -0.732 |
offending | -0.722 |
ingle | -0.702 |
routed | -0.695 |
Token |
|
Token ID | 198 |
Feature activation | -6.98e-03 |
Pos logit contributions | |
augmented | +0.027 |
offending | +0.027 |
asses | +0.027 |
disse | +0.026 |
routed | +0.026 |
Neg logit contributions | |
ulia | -0.023 |
cott | -0.022 |
icas | -0.020 |
tsky | -0.019 |
kamp | -0.019 |
Token | Her |
Token ID | 9360 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
ulia | +0.018 |
cott | +0.018 |
icas | +0.016 |
tsky | +0.016 |
kamp | +0.015 |
Neg logit contributions | |
augmented | -0.018 |
asses | -0.017 |
offending | -0.017 |
ingle | -0.017 |
routed | -0.016 |
Token | itage |
Token ID | 10208 |
Feature activation | +2.69e-01 |
Pos logit contributions | |
ulia | +0.321 |
cott | +0.314 |
icas | +0.284 |
tsky | +0.273 |
kamp | +0.267 |
Neg logit contributions | |
augmented | -0.323 |
asses | -0.318 |
offending | -0.314 |
ingle | -0.305 |
routed | -0.302 |
Token | to |
Token ID | 284 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
augmented | +0.048 |
asses | +0.047 |
offending | +0.047 |
ingle | +0.045 |
routed | +0.044 |
Neg logit contributions | |
ulia | -0.064 |
cott | -0.064 |
icas | -0.058 |
tsky | -0.057 |
doms | -0.055 |
Token | sport |
Token ID | 6332 |
Feature activation | +3.74e-02 |
Pos logit contributions | |
ulia | +0.540 |
cott | +0.533 |
icas | +0.486 |
tsky | +0.472 |
kamp | +0.463 |
Neg logit contributions | |
augmented | -0.400 |
asses | -0.394 |
offending | -0.387 |
ingle | -0.375 |
routed | -0.370 |
Token | a |
Token ID | 257 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
augmented | +0.090 |
asses | +0.088 |
offending | +0.088 |
ingle | +0.084 |
routed | +0.084 |
Neg logit contributions | |
ulia | -0.104 |
cott | -0.102 |
icas | -0.093 |
tsky | -0.090 |
kamp | -0.088 |
Token | rum |
Token ID | 7440 |
Feature activation | +5.95e-02 |
Pos logit contributions | |
ulia | +0.371 |
cott | +0.366 |
icas | +0.335 |
tsky | +0.326 |
kamp | +0.319 |
Neg logit contributions | |
augmented | -0.252 |
asses | -0.245 |
offending | -0.243 |
ingle | -0.233 |
routed | -0.232 |
Token | pled |
Token ID | 10137 |
Feature activation | +1.00e-01 |
Pos logit contributions | |
augmented | +0.166 |
asses | +0.164 |
offending | +0.163 |
ingle | +0.159 |
routed | +0.157 |
Neg logit contributions | |
ulia | -0.143 |
cott | -0.139 |
icas | -0.124 |
tsky | -0.120 |
doms | -0.116 |
Token | suit |
Token ID | 6050 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
augmented | +0.210 |
asses | +0.205 |
offending | +0.204 |
ingle | +0.195 |
routed | +0.192 |
Neg logit contributions | |
ulia | -0.311 |
cott | -0.303 |
icas | -0.279 |
tsky | -0.271 |
kamp | -0.266 |
Token | than |
Token ID | 621 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
ulia | +1.736 |
cott | +1.714 |
icas | +1.559 |
tsky | +1.512 |
kamp | +1.484 |
Neg logit contributions | |
augmented | -1.367 |
asses | -1.348 |
offending | -1.323 |
ingle | -1.284 |
routed | -1.268 |
Token | a |
Token ID | 257 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
augmented | +0.536 |
asses | +0.525 |
offending | +0.522 |
ingle | +0.501 |
routed | +0.499 |
Neg logit contributions | |
ulia | -0.647 |
cott | -0.635 |
icas | -0.579 |
tsky | -0.562 |
kamp | -0.549 |
Token | hood |
Token ID | 14263 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
ulia | +0.483 |
cott | +0.475 |
icas | +0.434 |
tsky | +0.422 |
kamp | +0.414 |
Neg logit contributions | |
augmented | -0.336 |
asses | -0.327 |
offending | -0.326 |
ingle | -0.311 |
routed | -0.310 |
Token | ie |
Token ID | 494 |
Feature activation | -2.29e-01 |
Pos logit contributions | |
ulia | +0.263 |
cott | +0.256 |
icas | +0.227 |
tsky | +0.218 |
kamp | +0.212 |
Neg logit contributions | |
augmented | -0.357 |
asses | -0.352 |
offending | -0.350 |
ingle | -0.340 |
routed | -0.337 |
Token | , |
Token ID | 11 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
ulia | +0.656 |
cott | +0.646 |
icas | +0.589 |
tsky | +0.572 |
kamp | +0.559 |
Neg logit contributions | |
augmented | -0.533 |
asses | -0.520 |
offending | -0.517 |
ingle | -0.499 |
routed | -0.494 |
Token | , |
Token ID | 11 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
ulia | +0.262 |
cott | +0.257 |
icas | +0.234 |
tsky | +0.227 |
kamp | +0.219 |
Neg logit contributions | |
augmented | -0.241 |
asses | -0.235 |
offending | -0.231 |
ingle | -0.224 |
routed | -0.223 |
Token | Allen |
Token ID | 9659 |
Feature activation | -8.85e-02 |
Pos logit contributions | |
ulia | +0.277 |
cott | +0.271 |
icas | +0.247 |
tsky | +0.240 |
kamp | +0.234 |
Neg logit contributions | |
augmented | -0.253 |
asses | -0.247 |
offending | -0.244 |
ingle | -0.236 |
routed | -0.234 |
Token | H |
Token ID | 367 |
Feature activation | -3.64e-02 |
Pos logit contributions | |
ulia | +0.169 |
cott | +0.165 |
icas | +0.149 |
tsky | +0.136 |
kamp | +0.134 |
Neg logit contributions | |
augmented | -0.287 |
asses | -0.283 |
offending | -0.279 |
ingle | -0.274 |
routed | -0.271 |
Token | urn |
Token ID | 700 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
ulia | +0.094 |
cott | +0.093 |
icas | +0.083 |
tsky | +0.081 |
kamp | +0.079 |
Neg logit contributions | |
augmented | -0.094 |
asses | -0.093 |
offending | -0.091 |
ingle | -0.089 |
routed | -0.088 |
Token | s |
Token ID | 82 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
ulia | +0.271 |
cott | +0.265 |
icas | +0.240 |
tsky | +0.231 |
kamp | +0.224 |
Neg logit contributions | |
augmented | -0.271 |
asses | -0.268 |
offending | -0.263 |
ingle | -0.258 |
routed | -0.253 |
Token | and |
Token ID | 290 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
augmented | +0.911 |
asses | +0.898 |
offending | +0.872 |
ingle | +0.858 |
routed | +0.836 |
Neg logit contributions | |
ulia | -1.046 |
cott | -1.011 |
icas | -0.940 |
tsky | -0.908 |
doms | -0.880 |
Token | Julius |
Token ID | 32834 |
Feature activation | +2.64e-02 |
Pos logit contributions | |
ulia | +0.812 |
cott | +0.799 |
icas | +0.723 |
tsky | +0.701 |
kamp | +0.684 |
Neg logit contributions | |
augmented | -0.748 |
asses | -0.736 |
offending | -0.726 |
ingle | -0.703 |
routed | -0.697 |
Token | Thomas |
Token ID | 5658 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
augmented | +0.071 |
asses | +0.070 |
offending | +0.070 |
ingle | +0.068 |
routed | +0.067 |
Neg logit contributions | |
ulia | -0.065 |
cott | -0.064 |
icas | -0.058 |
tsky | -0.056 |
kamp | -0.054 |
Token | , |
Token ID | 11 |
Feature activation | -4.65e-02 |
Pos logit contributions | |
augmented | +0.560 |
asses | +0.543 |
offending | +0.537 |
ingle | +0.519 |
routed | +0.515 |
Neg logit contributions | |
ulia | -0.662 |
cott | -0.648 |
icas | -0.592 |
tsky | -0.574 |
doms | -0.561 |
Token | and |
Token ID | 290 |
Feature activation | -2.89e-01 |
Pos logit contributions | |
ulia | +0.127 |
cott | +0.125 |
icas | +0.114 |
tsky | +0.110 |
kamp | +0.108 |
Neg logit contributions | |
augmented | -0.114 |
asses | -0.112 |
offending | -0.111 |
ingle | -0.107 |
routed | -0.106 |
Token | he |
Token ID | 339 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
ulia | +0.814 |
cott | +0.802 |
icas | +0.728 |
tsky | +0.706 |
kamp | +0.691 |
Neg logit contributions | |
augmented | -0.681 |
asses | -0.670 |
offending | -0.660 |
ingle | -0.641 |
routed | -0.633 |
Token | . |
Token ID | 13 |
Feature activation | +1.65e-01 |
Pos logit contributions | |
ulia | +0.391 |
cott | +0.386 |
icas | +0.349 |
tsky | +0.339 |
kamp | +0.330 |
Neg logit contributions | |
augmented | -0.343 |
asses | -0.338 |
offending | -0.333 |
ingle | -0.323 |
routed | -0.319 |
Token | Our |
Token ID | 3954 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
augmented | +0.435 |
asses | +0.433 |
offending | +0.420 |
ingle | +0.412 |
routed | +0.405 |
Neg logit contributions | |
ulia | -0.413 |
cott | -0.406 |
icas | -0.368 |
tsky | -0.351 |
doms | -0.344 |
Token | goal |
Token ID | 3061 |
Feature activation | +1.86e-01 |
Pos logit contributions | |
ulia | +0.610 |
cott | +0.602 |
icas | +0.552 |
tsky | +0.538 |
kamp | +0.528 |
Neg logit contributions | |
augmented | -0.392 |
asses | -0.385 |
offending | -0.378 |
ingle | -0.365 |
routed | -0.360 |
Token | is |
Token ID | 318 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
augmented | +0.442 |
asses | +0.436 |
offending | +0.428 |
ingle | +0.414 |
routed | +0.410 |
Neg logit contributions | |
ulia | -0.520 |
cott | -0.512 |
icas | -0.464 |
tsky | -0.450 |
doms | -0.438 |
Token | to |
Token ID | 284 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
ulia | +0.354 |
cott | +0.349 |
icas | +0.317 |
tsky | +0.308 |
doms | +0.299 |
Neg logit contributions | |
augmented | -0.289 |
asses | -0.282 |
offending | -0.279 |
ingle | -0.270 |
routed | -0.267 |
Token | make |
Token ID | 787 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
augmented | +0.392 |
asses | +0.384 |
offending | +0.379 |
ingle | +0.367 |
routed | +0.362 |
Neg logit contributions | |
ulia | -0.530 |
cott | -0.523 |
icas | -0.477 |
tsky | -0.463 |
kamp | -0.453 |
Token | it |
Token ID | 340 |
Feature activation | -4.52e-02 |
Pos logit contributions | |
ulia | +0.851 |
cott | +0.838 |
icas | +0.756 |
tsky | +0.732 |
kamp | +0.715 |
Neg logit contributions | |
augmented | -0.799 |
asses | -0.787 |
offending | -0.776 |
ingle | -0.754 |
routed | -0.746 |
Token | to |
Token ID | 284 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
ulia | +0.137 |
cott | +0.135 |
icas | +0.124 |
tsky | +0.120 |
kamp | +0.118 |
Neg logit contributions | |
augmented | -0.097 |
asses | -0.095 |
offending | -0.094 |
ingle | -0.091 |
routed | -0.090 |
Token | Queen |
Token ID | 7542 |
Feature activation | -5.05e-01 |
Pos logit contributions | |
ulia | +0.299 |
cott | +0.294 |
icas | +0.265 |
tsky | +0.256 |
doms | +0.249 |
Neg logit contributions | |
augmented | -0.290 |
asses | -0.283 |
offending | -0.280 |
ingle | -0.272 |
routed | -0.269 |
Token | stage |
Token ID | 3800 |
Feature activation | +8.50e-02 |
Pos logit contributions | |
ulia | +1.292 |
cott | +1.271 |
icas | +1.144 |
tsky | +1.108 |
kamp | +1.079 |
Neg logit contributions | |
augmented | -1.318 |
asses | -1.303 |
offending | -1.284 |
ingle | -1.252 |
routed | -1.236 |
Token | within |
Token ID | 1626 |
Feature activation | -5.05e-01 |
Pos logit contributions | |
augmented | +0.195 |
asses | +0.191 |
offending | +0.189 |
ingle | +0.182 |
routed | +0.181 |
Neg logit contributions | |
ulia | -0.243 |
cott | -0.241 |
icas | -0.220 |
tsky | -0.213 |
doms | -0.208 |
Token | upcoming |
Token ID | 7865 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
ulia | +0.166 |
cott | +0.164 |
icas | +0.150 |
tsky | +0.146 |
kamp | +0.143 |
Neg logit contributions | |
augmented | -0.122 |
asses | -0.120 |
offending | -0.118 |
ingle | -0.114 |
routed | -0.112 |
Token | Rally |
Token ID | 27752 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
augmented | +0.314 |
asses | +0.308 |
offending | +0.304 |
ingle | +0.294 |
routed | +0.290 |
Neg logit contributions | |
ulia | -0.408 |
cott | -0.402 |
icas | -0.366 |
tsky | -0.355 |
kamp | -0.348 |
Token | e |
Token ID | 68 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
ulia | +0.413 |
cott | +0.406 |
icas | +0.367 |
tsky | +0.355 |
kamp | +0.347 |
Neg logit contributions | |
augmented | -0.384 |
asses | -0.378 |
offending | -0.373 |
ingle | -0.363 |
routed | -0.358 |
Token | Monte |
Token ID | 22489 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
ulia | +0.589 |
cott | +0.580 |
icas | +0.523 |
tsky | +0.506 |
kamp | +0.495 |
Neg logit contributions | |
augmented | -0.556 |
asses | -0.549 |
offending | -0.541 |
ingle | -0.524 |
routed | -0.520 |
Token | - |
Token ID | 12 |
Feature activation | -6.75e-01 |
Pos logit contributions | |
augmented | +0.643 |
asses | +0.629 |
offending | +0.622 |
ingle | +0.609 |
routed | +0.601 |
Neg logit contributions | |
ulia | -0.571 |
cott | -0.553 |
icas | -0.496 |
tsky | -0.479 |
doms | -0.474 |
Token | Car |
Token ID | 9914 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
ulia | +1.373 |
cott | +1.338 |
icas | +1.172 |
tsky | +1.126 |
kamp | +1.088 |
Neg logit contributions | |
augmented | -2.122 |
asses | -2.092 |
offending | -2.067 |
ingle | -2.036 |
routed | -2.017 |
Token | lo |
Token ID | 5439 |
Feature activation | +2.43e-02 |
Pos logit contributions | |
ulia | +1.503 |
cott | +1.455 |
icas | +1.196 |
tsky | +1.095 |
kamp | +1.044 |
Neg logit contributions | |
augmented | -4.254 |
asses | -4.196 |
offending | -4.188 |
ingle | -4.083 |
disse | -4.054 |
Token | . |
Token ID | 13 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
augmented | +0.057 |
asses | +0.056 |
offending | +0.056 |
ingle | +0.054 |
routed | +0.053 |
Neg logit contributions | |
ulia | -0.068 |
cott | -0.067 |
icas | -0.061 |
tsky | -0.059 |
kamp | -0.058 |
Token | We |
Token ID | 775 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
augmented | +0.494 |
asses | +0.489 |
offending | +0.478 |
ingle | +0.469 |
routed | +0.460 |
Neg logit contributions | |
ulia | -0.500 |
cott | -0.491 |
icas | -0.445 |
tsky | -0.429 |
doms | -0.417 |
Token | spoke |
Token ID | 5158 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
augmented | +0.307 |
asses | +0.302 |
offending | +0.298 |
ingle | +0.288 |
routed | +0.285 |
Neg logit contributions | |
ulia | -0.388 |
cott | -0.382 |
icas | -0.348 |
tsky | -0.338 |
kamp | -0.331 |
Token | to |
Token ID | 284 |
Feature activation | +2.36e-02 |
Pos logit contributions | |
augmented | +0.319 |
asses | +0.313 |
offending | +0.308 |
ingle | +0.298 |
routed | +0.295 |
Neg logit contributions | |
ulia | -0.422 |
cott | -0.416 |
icas | -0.379 |
tsky | -0.369 |
kamp | -0.360 |
Token | - |
Token ID | 12 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
ulia | +0.187 |
cott | +0.183 |
icas | +0.169 |
tsky | +0.165 |
doms | +0.161 |
Neg logit contributions | |
augmented | -0.138 |
asses | -0.135 |
offending | -0.133 |
ingle | -0.128 |
routed | -0.127 |
Token | day |
Token ID | 820 |
Feature activation | -3.29e-01 |
Pos logit contributions | |
ulia | +0.643 |
cott | +0.632 |
icas | +0.575 |
tsky | +0.557 |
kamp | +0.544 |
Neg logit contributions | |
augmented | -0.572 |
asses | -0.564 |
offending | -0.554 |
ingle | -0.539 |
routed | -0.532 |
Token | V |
Token ID | 569 |
Feature activation | -8.86e-02 |
Pos logit contributions | |
ulia | +1.004 |
cott | +0.994 |
icas | +0.906 |
tsky | +0.880 |
kamp | +0.865 |
Neg logit contributions | |
augmented | -0.691 |
asses | -0.684 |
offending | -0.669 |
ingle | -0.649 |
routed | -0.639 |
Token | iva |
Token ID | 12151 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
ulia | +0.250 |
cott | +0.246 |
icas | +0.223 |
tsky | +0.217 |
kamp | +0.213 |
Neg logit contributions | |
augmented | -0.208 |
asses | -0.205 |
offending | -0.202 |
ingle | -0.196 |
routed | -0.193 |
Token | Cuba |
Token ID | 14159 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
augmented | +0.439 |
asses | +0.431 |
offending | +0.426 |
ingle | +0.414 |
routed | +0.411 |
Neg logit contributions | |
ulia | -0.437 |
cott | -0.430 |
icas | -0.387 |
tsky | -0.377 |
kamp | -0.367 |
Token | family |
Token ID | 1641 |
Feature activation | -9.98e-01 |
Pos logit contributions | |
ulia | +1.317 |
cott | +1.301 |
icas | +1.187 |
tsky | +1.148 |
kamp | +1.127 |
Neg logit contributions | |
augmented | -0.956 |
asses | -0.948 |
offending | -0.929 |
ingle | -0.899 |
routed | -0.884 |
Token | holiday |
Token ID | 9912 |
Feature activation | +4.42e-01 |
Pos logit contributions | |
ulia | +2.962 |
cott | +2.959 |
icas | +2.678 |
tsky | +2.581 |
kamp | +2.543 |
Neg logit contributions | |
asses | -2.120 |
augmented | -2.111 |
offending | -2.041 |
ingle | -1.993 |
disse | -1.964 |
Token | that |
Token ID | 326 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
augmented | +0.954 |
asses | +0.928 |
offending | +0.919 |
ingle | +0.890 |
routed | +0.882 |
Neg logit contributions | |
ulia | -1.337 |
cott | -1.316 |
icas | -1.207 |
tsky | -1.177 |
kamp | -1.149 |
Token | includes |
Token ID | 3407 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
augmented | +0.538 |
asses | +0.528 |
offending | +0.522 |
ingle | +0.505 |
routed | +0.501 |
Neg logit contributions | |
ulia | -0.611 |
cott | -0.602 |
icas | -0.545 |
tsky | -0.529 |
kamp | -0.517 |
Token | visits |
Token ID | 11864 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
augmented | +0.415 |
asses | +0.401 |
offending | +0.399 |
ingle | +0.383 |
routed | +0.381 |
Neg logit contributions | |
ulia | -0.535 |
cott | -0.525 |
icas | -0.479 |
tsky | -0.469 |
kamp | -0.459 |
Token | to |
Token ID | 284 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
ulia | +0.695 |
cott | +0.689 |
icas | +0.624 |
tsky | +0.609 |
kamp | +0.595 |
Neg logit contributions | |
augmented | -0.556 |
asses | -0.542 |
offending | -0.535 |
ingle | -0.520 |
routed | -0.516 |
Token | emergency |
Token ID | 6334 |
Feature activation | +1.28e-01 |
Pos logit contributions | |
augmented | +0.354 |
asses | +0.348 |
offending | +0.343 |
ingle | +0.331 |
routed | +0.328 |
Neg logit contributions | |
ulia | -0.445 |
cott | -0.438 |
icas | -0.399 |
tsky | -0.387 |
kamp | -0.380 |
Token | evacuation |
Token ID | 24663 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
augmented | +0.267 |
asses | +0.260 |
offending | +0.258 |
ingle | +0.246 |
routed | +0.246 |
Neg logit contributions | |
ulia | -0.397 |
cott | -0.391 |
icas | -0.360 |
tsky | -0.351 |
kamp | -0.343 |
Token | ! |
Token ID | 0 |
Feature activation | +4.39e-01 |
Pos logit contributions | |
augmented | +0.450 |
asses | +0.441 |
offending | +0.435 |
routed | +0.420 |
ingle | +0.419 |
Neg logit contributions | |
ulia | -0.555 |
cott | -0.547 |
icas | -0.499 |
tsky | -0.485 |
kamp | -0.474 |
Token |
|
Token ID | 198 |
Feature activation | -6.48e-02 |
Pos logit contributions | |
augmented | +1.158 |
asses | +1.145 |
offending | +1.123 |
ingle | +1.098 |
routed | +1.086 |
Neg logit contributions | |
ulia | -1.106 |
cott | -1.089 |
icas | -0.979 |
tsky | -0.945 |
kamp | -0.922 |
Token |
|
Token ID | 198 |
Feature activation | -6.82e-02 |
Pos logit contributions | |
ulia | +0.152 |
cott | +0.150 |
icas | +0.132 |
tsky | +0.127 |
kamp | +0.125 |
Neg logit contributions | |
augmented | -0.182 |
offending | -0.181 |
asses | -0.180 |
disse | -0.175 |
routed | -0.174 |
Token | Rec |
Token ID | 6690 |
Feature activation | -8.69e-01 |
Pos logit contributions | |
ulia | +0.189 |
cott | +0.186 |
icas | +0.169 |
tsky | +0.164 |
kamp | +0.160 |
Neg logit contributions | |
augmented | -0.163 |
asses | -0.161 |
offending | -0.159 |
ingle | -0.154 |
routed | -0.152 |
Token | alling |
Token ID | 9221 |
Feature activation | -5.87e-01 |
Pos logit contributions | |
ulia | +2.389 |
cott | +2.356 |
icas | +2.135 |
tsky | +2.071 |
kamp | +2.029 |
Neg logit contributions | |
augmented | -2.099 |
asses | -2.073 |
offending | -2.040 |
ingle | -1.984 |
routed | -1.956 |
Token | that |
Token ID | 326 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
ulia | +1.638 |
cott | +1.611 |
icas | +1.463 |
tsky | +1.414 |
kamp | +1.379 |
Neg logit contributions | |
augmented | -1.373 |
asses | -1.367 |
offending | -1.332 |
ingle | -1.303 |
routed | -1.281 |
Token | , |
Token ID | 11 |
Feature activation | -7.07e-02 |
Pos logit contributions | |
augmented | +0.589 |
asses | +0.578 |
offending | +0.571 |
ingle | +0.551 |
routed | +0.545 |
Neg logit contributions | |
ulia | -0.791 |
cott | -0.781 |
icas | -0.712 |
tsky | -0.692 |
kamp | -0.679 |
Token | Ik |
Token ID | 32840 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
ulia | +0.191 |
cott | +0.189 |
icas | +0.170 |
tsky | +0.165 |
kamp | +0.162 |
Neg logit contributions | |
augmented | -0.175 |
asses | -0.171 |
offending | -0.169 |
ingle | -0.164 |
routed | -0.163 |
Token | ki |
Token ID | 4106 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
ulia | +0.495 |
cott | +0.489 |
icas | +0.431 |
tsky | +0.417 |
kamp | +0.401 |
Neg logit contributions | |
augmented | -0.689 |
asses | -0.683 |
offending | -0.671 |
ingle | -0.660 |
routed | -0.651 |
Token | study |
Token ID | 2050 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
augmented | +0.154 |
asses | +0.151 |
offending | +0.149 |
ingle | +0.144 |
routed | +0.142 |
Neg logit contributions | |
ulia | -0.216 |
cott | -0.212 |
icas | -0.195 |
tsky | -0.189 |
kamp | -0.185 |
Token | both |
Token ID | 1111 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
augmented | +0.394 |
asses | +0.384 |
offending | +0.380 |
ingle | +0.366 |
routed | +0.362 |
Neg logit contributions | |
ulia | -0.526 |
cott | -0.520 |
icas | -0.473 |
tsky | -0.460 |
kamp | -0.450 |
Token | the |
Token ID | 262 |
Feature activation | +8.38e-02 |
Pos logit contributions | |
augmented | +0.029 |
asses | +0.028 |
offending | +0.028 |
ingle | +0.027 |
routed | +0.027 |
Neg logit contributions | |
ulia | -0.036 |
cott | -0.036 |
icas | -0.033 |
tsky | -0.032 |
kamp | -0.031 |
Token | nature |
Token ID | 3450 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
augmented | +0.172 |
asses | +0.168 |
offending | +0.166 |
ingle | +0.159 |
routed | +0.158 |
Neg logit contributions | |
ulia | -0.263 |
cott | -0.260 |
icas | -0.238 |
tsky | -0.232 |
kamp | -0.227 |
Token | of |
Token ID | 286 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
augmented | +0.528 |
asses | +0.518 |
offending | +0.504 |
ingle | +0.486 |
routed | +0.484 |
Neg logit contributions | |
ulia | -0.705 |
cott | -0.699 |
icas | -0.628 |
tsky | -0.615 |
kamp | -0.598 |
Token | seizures |
Token ID | 24715 |
Feature activation | -8.55e-01 |
Pos logit contributions | |
augmented | +0.026 |
asses | +0.025 |
offending | +0.025 |
ingle | +0.024 |
routed | +0.024 |
Neg logit contributions | |
ulia | -0.032 |
cott | -0.032 |
icas | -0.029 |
tsky | -0.028 |
kamp | -0.027 |
Token | and |
Token ID | 290 |
Feature activation | -8.20e-02 |
Pos logit contributions | |
ulia | +2.209 |
cott | +2.172 |
icas | +1.955 |
tsky | +1.894 |
kamp | +1.854 |
Neg logit contributions | |
augmented | -2.190 |
asses | -2.168 |
offending | -2.135 |
ingle | -2.077 |
routed | -2.050 |
Token | the |
Token ID | 262 |
Feature activation | +6.88e-02 |
Pos logit contributions | |
ulia | +0.244 |
cott | +0.241 |
icas | +0.220 |
tsky | +0.214 |
kamp | +0.209 |
Neg logit contributions | |
augmented | -0.180 |
asses | -0.177 |
offending | -0.175 |
ingle | -0.168 |
routed | -0.167 |
Token | best |
Token ID | 1266 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
augmented | +0.137 |
asses | +0.134 |
offending | +0.132 |
ingle | +0.127 |
routed | +0.126 |
Neg logit contributions | |
ulia | -0.220 |
cott | -0.217 |
icas | -0.199 |
tsky | -0.194 |
kamp | -0.190 |
Token | surgical |
Token ID | 21998 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
augmented | +0.294 |
asses | +0.289 |
offending | +0.283 |
routed | +0.270 |
ingle | +0.270 |
Neg logit contributions | |
ulia | -0.444 |
cott | -0.438 |
icas | -0.399 |
tsky | -0.391 |
kamp | -0.384 |
Token | path |
Token ID | 3108 |
Feature activation | +4.65e-01 |
Pos logit contributions | |
augmented | +0.239 |
asses | +0.233 |
offending | +0.231 |
disse | +0.219 |
routed | +0.219 |
Neg logit contributions | |
ulia | -0.378 |
cott | -0.371 |
icas | -0.339 |
tsky | -0.332 |
kamp | -0.324 |
Token | The |
Token ID | 464 |
Feature activation | -2.38e-02 |
Pos logit contributions | |
augmented | +0.403 |
asses | +0.398 |
offending | +0.388 |
ingle | +0.381 |
routed | +0.374 |
Neg logit contributions | |
ulia | -0.446 |
cott | -0.438 |
icas | -0.398 |
tsky | -0.388 |
kamp | -0.377 |
Token | program |
Token ID | 1430 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
ulia | +0.074 |
cott | +0.073 |
icas | +0.067 |
tsky | +0.065 |
kamp | +0.064 |
Neg logit contributions | |
augmented | -0.050 |
asses | -0.049 |
offending | -0.048 |
ingle | -0.046 |
routed | -0.046 |
Token | is |
Token ID | 318 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
ulia | +0.676 |
cott | +0.666 |
icas | +0.604 |
tsky | +0.586 |
kamp | +0.575 |
Neg logit contributions | |
augmented | -0.557 |
asses | -0.549 |
offending | -0.541 |
ingle | -0.525 |
routed | -0.519 |
Token | operated |
Token ID | 12228 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
ulia | +0.598 |
cott | +0.592 |
icas | +0.541 |
tsky | +0.525 |
kamp | +0.516 |
Neg logit contributions | |
augmented | -0.404 |
asses | -0.403 |
offending | -0.394 |
ingle | -0.383 |
routed | -0.374 |
Token | by |
Token ID | 416 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
ulia | +0.609 |
cott | +0.601 |
icas | +0.544 |
tsky | +0.527 |
kamp | +0.515 |
Neg logit contributions | |
augmented | -0.540 |
asses | -0.531 |
offending | -0.524 |
ingle | -0.508 |
routed | -0.503 |
Token | selecting |
Token ID | 17246 |
Feature activation | -8.48e-01 |
Pos logit contributions | |
ulia | +0.652 |
cott | +0.643 |
icas | +0.582 |
tsky | +0.564 |
kamp | +0.552 |
Neg logit contributions | |
augmented | -0.584 |
asses | -0.572 |
offending | -0.565 |
ingle | -0.547 |
routed | -0.543 |
Token | the |
Token ID | 262 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
ulia | +2.336 |
cott | +2.292 |
icas | +2.083 |
tsky | +1.990 |
kamp | +1.962 |
Neg logit contributions | |
augmented | -2.023 |
asses | -2.014 |
offending | -1.966 |
ingle | -1.919 |
disse | -1.894 |
Token | series |
Token ID | 2168 |
Feature activation | -6.82e-02 |
Pos logit contributions | |
ulia | +0.454 |
cott | +0.447 |
icas | +0.410 |
tsky | +0.398 |
kamp | +0.391 |
Neg logit contributions | |
augmented | -0.303 |
asses | -0.299 |
offending | -0.292 |
ingle | -0.284 |
routed | -0.279 |
Token | version |
Token ID | 2196 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
ulia | +0.205 |
cott | +0.202 |
icas | +0.184 |
tsky | +0.180 |
kamp | +0.176 |
Neg logit contributions | |
augmented | -0.148 |
asses | -0.146 |
offending | -0.144 |
ingle | -0.138 |
routed | -0.137 |
Token | using |
Token ID | 1262 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
ulia | +0.409 |
cott | +0.404 |
icas | +0.368 |
tsky | +0.357 |
kamp | +0.350 |
Neg logit contributions | |
augmented | -0.318 |
asses | -0.313 |
offending | -0.309 |
ingle | -0.299 |
routed | -0.295 |
Token | the |
Token ID | 262 |
Feature activation | -6.76e-02 |
Pos logit contributions | |
ulia | +0.715 |
cott | +0.706 |
icas | +0.634 |
tsky | +0.616 |
kamp | +0.601 |
Neg logit contributions | |
augmented | -0.689 |
asses | -0.676 |
offending | -0.668 |
ingle | -0.649 |
routed | -0.643 |