Token | a |
Token ID | 257 |
Feature activation | +3.00e+01 |
Pos logit contributions | |
unity | +34.867 |
prayers | +31.970 |
doors | +31.742 |
assemblies | +31.282 |
isans | +31.002 |
Neg logit contributions | |
paed | -16.700 |
HSBC | -14.293 |
ITV | -13.831 |
neurot | -13.481 |
ageing | -12.934 |
Token | lot |
Token ID | 1256 |
Feature activation | +2.95e+01 |
Pos logit contributions | |
unity | +28.380 |
prayers | +24.853 |
doors | +24.624 |
isans | +24.485 |
assemblies | +23.999 |
Neg logit contributions | |
paed | -18.310 |
HSBC | -16.246 |
unethical | -15.927 |
ITV | -15.791 |
ageing | -15.242 |
Token | of |
Token ID | 286 |
Feature activation | +3.36e+01 |
Pos logit contributions | |
unity | +26.459 |
isans | +25.205 |
doors | +24.304 |
prayers | +23.777 |
Commands | +23.653 |
Neg logit contributions | |
paed | -19.274 |
HSBC | -16.851 |
neurot | -16.524 |
ITV | -16.326 |
unethical | -16.155 |
Token | shared |
Token ID | 4888 |
Feature activation | +3.11e+01 |
Pos logit contributions | |
unity | +34.133 |
doors | +31.113 |
prayers | +31.069 |
assemblies | +30.171 |
isans | +29.726 |
Neg logit contributions | |
paed | -16.749 |
ITV | -13.518 |
HSBC | -13.516 |
neurot | -13.161 |
ageing | -12.268 |
Token | goals |
Token ID | 4661 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
unity | +29.793 |
prayers | +27.999 |
doors | +27.834 |
assemblies | +26.873 |
directives | +26.476 |
Neg logit contributions | |
paed | -18.266 |
HSBC | -15.941 |
ITV | -15.195 |
ageing | -14.768 |
neurot | -14.667 |
Token | and |
Token ID | 290 |
Feature activation | +4.79e+01 |
Pos logit contributions | |
unity | +20.324 |
isans | +19.156 |
assemblies | +18.870 |
Commands | +18.778 |
doors | +18.414 |
Neg logit contributions | |
paed | -17.356 |
neurot | -15.072 |
unethical | -14.707 |
HSBC | -14.688 |
piracy | -14.399 |
Token | that |
Token ID | 326 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
unity | +38.090 |
prayers | +36.022 |
doors | +34.888 |
assemblies | +34.653 |
isans | +34.464 |
Neg logit contributions | |
paed | -19.379 |
HSBC | -16.809 |
ITV | -15.597 |
ageing | -14.991 |
unethical | -14.848 |
Token | � |
Token ID | 447 |
Feature activation | -7.81e-01 |
Pos logit contributions | |
unity | +13.724 |
Commands | +12.328 |
isans | +12.153 |
assemblies | +12.132 |
prayers | +12.107 |
Neg logit contributions | |
paed | -12.278 |
neurot | -10.866 |
unethical | -10.717 |
HSBC | -10.553 |
Australian | -10.418 |
Token | � |
Token ID | 247 |
Feature activation | +4.65e+00 |
Pos logit contributions | |
paed | +0.599 |
neurot | +0.508 |
Australian | +0.505 |
HSBC | +0.494 |
unethical | +0.492 |
Neg logit contributions | |
unity | -1.039 |
Commands | -1.015 |
aturdays | -1.003 |
enaries | -0.998 |
assemblies | -0.985 |
Token | s |
Token ID | 82 |
Feature activation | +1.88e+01 |
Pos logit contributions | |
unity | +4.701 |
Commands | +4.470 |
enaries | +4.355 |
aturdays | +4.353 |
isans | +4.327 |
Neg logit contributions | |
paed | -5.067 |
neurot | -4.512 |
Australian | -4.453 |
unethical | -4.426 |
HSBC | -4.413 |
Token | what |
Token ID | 644 |
Feature activation | +2.26e+01 |
Pos logit contributions | |
unity | +20.455 |
isans | +18.267 |
prayers | +18.200 |
doors | +18.181 |
Commands | +18.166 |
Neg logit contributions | |
paed | -14.412 |
neurot | -12.367 |
HSBC | -12.306 |
Australian | -11.605 |
ITV | -11.602 |
Token | In |
Token ID | 818 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
Rules | +23.308 |
Commands | +21.660 |
unity | +21.597 |
Dialogue | +21.101 |
isans | +20.730 |
Neg logit contributions | |
paed | -21.130 |
unethical | -18.375 |
neurot | -18.319 |
piracy | -17.791 |
dermat | -17.598 |
Token | this |
Token ID | 428 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
unity | +18.439 |
Commands | +17.263 |
assemblies | +17.190 |
doors | +17.005 |
aturdays | +16.985 |
Neg logit contributions | |
paed | -11.684 |
neurot | -9.898 |
unethical | -9.628 |
ITV | -9.625 |
HSBC | -9.554 |
Token | country |
Token ID | 1499 |
Feature activation | +3.49e+01 |
Pos logit contributions | |
unity | +23.356 |
assemblies | +21.226 |
doors | +20.973 |
Commands | +20.787 |
prayers | +20.514 |
Neg logit contributions | |
paed | -15.104 |
neurot | -12.757 |
HSBC | -12.394 |
NZ | -12.239 |
ITV | -12.227 |
Token | , |
Token ID | 11 |
Feature activation | +3.77e+01 |
Pos logit contributions | |
unity | +31.409 |
prayers | +29.332 |
assemblies | +29.130 |
isans | +29.096 |
doors | +28.905 |
Neg logit contributions | |
paed | -18.700 |
ITV | -16.271 |
neurot | -16.268 |
HSBC | -16.254 |
NZ | -15.738 |
Token | we |
Token ID | 356 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
unity | +34.934 |
doors | +32.764 |
assemblies | +32.649 |
prayers | +32.484 |
isans | +30.912 |
Neg logit contributions | |
paed | -16.318 |
ITV | -13.775 |
neurot | -13.680 |
HSBC | -13.545 |
ASIC | -12.709 |
Token | have |
Token ID | 423 |
Feature activation | +4.66e+01 |
Pos logit contributions | |
unity | +21.441 |
assemblies | +19.936 |
doors | +19.848 |
Commands | +19.820 |
prayers | +19.404 |
Neg logit contributions | |
paed | -17.550 |
neurot | -14.972 |
unethical | -14.823 |
ITV | -14.650 |
HSBC | -14.548 |
Token | a |
Token ID | 257 |
Feature activation | +3.31e+01 |
Pos logit contributions | |
unity | +37.561 |
assemblies | +35.023 |
doors | +34.800 |
prayers | +34.380 |
isans | +33.282 |
Neg logit contributions | |
paed | -18.277 |
ITV | -15.508 |
HSBC | -15.090 |
neurot | -14.979 |
NZ | -14.751 |
Token | strong |
Token ID | 1913 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
unity | +31.995 |
doors | +28.078 |
assemblies | +27.710 |
prayers | +27.504 |
isans | +27.263 |
Neg logit contributions | |
paed | -16.853 |
ITV | -15.264 |
HSBC | -14.657 |
NZ | -13.858 |
unethical | -13.803 |
Token | tradition |
Token ID | 6761 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
unity | +20.190 |
assemblies | +17.985 |
doors | +17.967 |
isans | +17.589 |
Commands | +17.407 |
Neg logit contributions | |
paed | -14.529 |
ITV | -12.764 |
HSBC | -12.671 |
neurot | -12.509 |
unethical | -12.366 |
Token | of |
Token ID | 286 |
Feature activation | +2.52e+01 |
Pos logit contributions | |
unity | +17.142 |
isans | +15.884 |
assemblies | +15.464 |
doors | +15.411 |
prayers | +15.374 |
Neg logit contributions | |
paed | -16.473 |
neurot | -14.708 |
HSBC | -14.701 |
ITV | -14.630 |
NZ | -14.401 |
Token | gun |
Token ID | 2485 |
Feature activation | +2.29e+01 |
Pos logit contributions | |
unity | +26.669 |
doors | +24.284 |
prayers | +24.080 |
assemblies | +24.058 |
isans | +23.068 |
Neg logit contributions | |
paed | -15.780 |
HSBC | -13.916 |
ITV | -13.853 |
neurot | -13.546 |
NZ | -13.087 |
Token | the |
Token ID | 262 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
unity | +11.083 |
Commands | +10.641 |
assemblies | +10.377 |
Rules | +10.266 |
endas | +10.153 |
Neg logit contributions | |
paed | -10.652 |
neurot | -9.487 |
unethical | -9.109 |
piracy | -9.052 |
ITV | -9.009 |
Token | Constitution |
Token ID | 7965 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
unity | +18.418 |
Commands | +17.817 |
assemblies | +17.391 |
Rules | +17.310 |
prayers | +17.158 |
Neg logit contributions | |
paed | -12.297 |
neurot | -10.397 |
unethical | -10.095 |
piracy | -10.065 |
commercially | -9.877 |
Token | , |
Token ID | 11 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
unity | +11.038 |
Commands | +10.682 |
Rules | +10.319 |
enaries | +10.312 |
prayers | +10.297 |
Neg logit contributions | |
paed | -11.746 |
unethical | -10.404 |
neurot | -10.344 |
HSBC | -10.203 |
piracy | -10.069 |
Token | which |
Token ID | 543 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
unity | +13.374 |
Commands | +12.855 |
Rules | +12.540 |
assemblies | +12.534 |
prayers | +12.479 |
Neg logit contributions | |
paed | -10.636 |
neurot | -9.175 |
unethical | -8.937 |
HSBC | -8.824 |
ITV | -8.810 |
Token | says |
Token ID | 1139 |
Feature activation | +4.13e+01 |
Pos logit contributions | |
unity | +13.777 |
Commands | +13.410 |
assemblies | +12.866 |
prayers | +12.700 |
Rules | +12.617 |
Neg logit contributions | |
paed | -12.067 |
neurot | -10.663 |
unethical | -10.354 |
HSBC | -10.228 |
ITV | -10.219 |
Token | that |
Token ID | 326 |
Feature activation | +4.54e+01 |
Pos logit contributions | |
unity | +36.894 |
prayers | +34.865 |
assemblies | +34.153 |
Commands | +33.949 |
doors | +33.632 |
Neg logit contributions | |
paed | -16.824 |
ITV | -14.942 |
neurot | -14.432 |
HSBC | -14.329 |
NZ | -13.486 |
Token | the |
Token ID | 262 |
Feature activation | +3.45e+01 |
Pos logit contributions | |
unity | +38.844 |
prayers | +36.592 |
assemblies | +36.406 |
Commands | +35.542 |
doors | +35.258 |
Neg logit contributions | |
paed | -17.273 |
ITV | -15.212 |
HSBC | -15.113 |
neurot | -14.454 |
NZ | -13.885 |
Token | president |
Token ID | 1893 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
unity | +34.204 |
assemblies | +32.204 |
Commands | +32.045 |
doors | +31.826 |
prayers | +31.553 |
Neg logit contributions | |
paed | -16.443 |
HSBC | -13.931 |
ITV | -13.800 |
piracy | -13.454 |
neurot | -13.169 |
Token | � |
Token ID | 564 |
Feature activation | -7.35e+00 |
Pos logit contributions | |
unity | +14.868 |
Commands | +14.385 |
assemblies | +13.972 |
prayers | +13.893 |
doors | +13.637 |
Neg logit contributions | |
paed | -12.766 |
HSBC | -11.210 |
neurot | -11.132 |
piracy | -11.006 |
unethical | -10.979 |
Token | � |
Token ID | 250 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
paed | +6.399 |
Australian | +5.657 |
neurot | +5.565 |
HSBC | +5.488 |
unethical | +5.440 |
Neg logit contributions | |
unity | -8.561 |
aturdays | -8.468 |
Commands | -8.223 |
enaries | -8.204 |
assemblies | -8.069 |
Token | must |
Token ID | 27238 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
unity | +0.123 |
Commands | +0.118 |
aturdays | +0.115 |
enaries | +0.114 |
Rules | +0.112 |
Neg logit contributions | |
paed | -0.194 |
neurot | -0.177 |
Australian | -0.176 |
HSBC | -0.174 |
unethical | -0.174 |
Token | policy |
Token ID | 2450 |
Feature activation | +2.79e+01 |
Pos logit contributions | |
unity | +31.828 |
prayers | +29.642 |
doors | +29.362 |
assemblies | +29.016 |
isans | +28.659 |
Neg logit contributions | |
paed | -15.874 |
HSBC | -13.307 |
neurot | -13.151 |
ITV | -12.885 |
ageing | -11.768 |
Token | differences |
Token ID | 5400 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
unity | +27.121 |
assemblies | +24.963 |
prayers | +24.951 |
isans | +24.902 |
doors | +24.869 |
Neg logit contributions | |
paed | -18.463 |
HSBC | -16.072 |
neurot | -15.574 |
ITV | -15.516 |
unethical | -15.086 |
Token | , |
Token ID | 11 |
Feature activation | +2.22e+01 |
Pos logit contributions | |
unity | +17.417 |
isans | +16.681 |
Commands | +16.163 |
assemblies | +16.000 |
doors | +15.979 |
Neg logit contributions | |
paed | -16.092 |
neurot | -14.188 |
HSBC | -13.624 |
unethical | -13.579 |
Australian | -13.280 |
Token | but |
Token ID | 475 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
unity | +23.001 |
isans | +21.506 |
Commands | +21.213 |
prayers | +21.047 |
doors | +20.959 |
Neg logit contributions | |
paed | -15.692 |
neurot | -13.322 |
HSBC | -13.166 |
ITV | -12.833 |
Australian | -12.789 |
Token | there |
Token ID | 612 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
unity | +31.884 |
prayers | +28.302 |
doors | +28.230 |
isans | +28.094 |
assemblies | +27.822 |
Neg logit contributions | |
paed | -17.415 |
neurot | -14.570 |
unethical | -13.912 |
HSBC | -13.768 |
ITV | -13.678 |
Token | are |
Token ID | 389 |
Feature activation | +4.47e+01 |
Pos logit contributions | |
unity | +10.541 |
Commands | +9.880 |
isans | +9.674 |
prayers | +9.649 |
enaries | +9.646 |
Neg logit contributions | |
paed | -10.911 |
neurot | -9.779 |
HSBC | -9.604 |
unethical | -9.600 |
Australian | -9.553 |
Token | also |
Token ID | 635 |
Feature activation | +3.66e+01 |
Pos logit contributions | |
unity | +38.319 |
doors | +34.949 |
prayers | +34.356 |
assemblies | +33.840 |
isans | +33.296 |
Neg logit contributions | |
paed | -17.667 |
HSBC | -15.175 |
ITV | -14.230 |
neurot | -14.165 |
piracy | -13.520 |
Token | a |
Token ID | 257 |
Feature activation | +3.00e+01 |
Pos logit contributions | |
unity | +34.867 |
prayers | +31.970 |
doors | +31.742 |
assemblies | +31.282 |
isans | +31.002 |
Neg logit contributions | |
paed | -16.700 |
HSBC | -14.293 |
ITV | -13.831 |
neurot | -13.481 |
ageing | -12.934 |
Token | lot |
Token ID | 1256 |
Feature activation | +2.95e+01 |
Pos logit contributions | |
unity | +28.380 |
prayers | +24.853 |
doors | +24.624 |
isans | +24.485 |
assemblies | +23.999 |
Neg logit contributions | |
paed | -18.310 |
HSBC | -16.246 |
unethical | -15.927 |
ITV | -15.791 |
ageing | -15.242 |
Token | of |
Token ID | 286 |
Feature activation | +3.36e+01 |
Pos logit contributions | |
unity | +26.459 |
isans | +25.205 |
doors | +24.304 |
prayers | +23.777 |
Commands | +23.653 |
Neg logit contributions | |
paed | -19.274 |
HSBC | -16.851 |
neurot | -16.524 |
ITV | -16.326 |
unethical | -16.155 |
Token | shared |
Token ID | 4888 |
Feature activation | +3.11e+01 |
Pos logit contributions | |
unity | +34.133 |
doors | +31.113 |
prayers | +31.069 |
assemblies | +30.171 |
isans | +29.726 |
Neg logit contributions | |
paed | -16.749 |
ITV | -13.518 |
HSBC | -13.516 |
neurot | -13.161 |
ageing | -12.268 |
Token | that |
Token ID | 326 |
Feature activation | +3.24e+01 |
Pos logit contributions | |
unity | +20.922 |
assemblies | +19.599 |
Commands | +19.122 |
prayers | +19.068 |
Rules | +18.940 |
Neg logit contributions | |
paed | -17.039 |
HSBC | -15.047 |
unethical | -14.734 |
ITV | -14.730 |
neurot | -14.712 |
Token | denied |
Token ID | 6699 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
unity | +29.630 |
assemblies | +27.451 |
prayers | +26.870 |
Commands | +26.383 |
doors | +26.013 |
Neg logit contributions | |
paed | -18.202 |
ITV | -15.238 |
neurot | -15.092 |
HSBC | -15.075 |
unethical | -14.762 |
Token | rail |
Token ID | 6787 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
unity | +18.899 |
assemblies | +17.743 |
prayers | +17.336 |
Commands | +17.332 |
doors | +17.283 |
Neg logit contributions | |
paed | -12.622 |
neurot | -10.812 |
ITV | -10.738 |
HSBC | -10.628 |
ageing | -10.260 |
Token | roads |
Token ID | 21372 |
Feature activation | +2.78e+01 |
Pos logit contributions | |
unity | +15.513 |
Commands | +14.543 |
assemblies | +14.441 |
doors | +14.090 |
enaries | +13.997 |
Neg logit contributions | |
paed | -16.823 |
neurot | -15.001 |
HSBC | -14.982 |
ITV | -14.563 |
unethical | -14.389 |
Token | " |
Token ID | 366 |
Feature activation | +2.54e+01 |
Pos logit contributions | |
unity | +28.130 |
assemblies | +26.678 |
prayers | +26.146 |
doors | +25.942 |
Commands | +25.642 |
Neg logit contributions | |
paed | -15.972 |
neurot | -13.361 |
ageing | -13.088 |
ITV | -13.084 |
dermat | -13.076 |
Token | the |
Token ID | 1169 |
Feature activation | +4.33e+01 |
Pos logit contributions | |
unity | +23.742 |
Rules | +23.324 |
enaries | +22.911 |
Commands | +22.705 |
assemblies | +22.543 |
Neg logit contributions | |
paed | -17.580 |
neurot | -15.188 |
ageing | -15.119 |
HSBC | -15.097 |
ITV | -14.798 |
Token | right |
Token ID | 826 |
Feature activation | +2.92e+01 |
Pos logit contributions | |
unity | +37.671 |
doors | +34.266 |
prayers | +34.146 |
assemblies | +33.813 |
Commands | +33.195 |
Neg logit contributions | |
paed | -16.822 |
ITV | -15.176 |
HSBC | -14.907 |
neurot | -14.180 |
ageing | -13.996 |
Token | to |
Token ID | 284 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
unity | +25.943 |
assemblies | +23.892 |
enaries | +23.704 |
doors | +23.560 |
prayers | +23.417 |
Neg logit contributions | |
paed | -19.775 |
HSBC | -18.116 |
ITV | -17.243 |
neurot | -17.013 |
NZ | -16.819 |
Token | deduct |
Token ID | 18777 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
unity | +28.075 |
assemblies | +26.888 |
Commands | +26.116 |
doors | +25.788 |
prayers | +25.552 |
Neg logit contributions | |
paed | -15.452 |
HSBC | -13.009 |
ITV | -12.559 |
dermat | -12.468 |
neurot | -12.437 |
Token | the |
Token ID | 262 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
unity | +23.846 |
enaries | +23.146 |
assemblies | +22.802 |
isans | +22.567 |
prayers | +22.542 |
Neg logit contributions | |
paed | -14.523 |
HSBC | -12.512 |
ITV | -12.156 |
neurot | -12.112 |
unethical | -11.698 |
Token | amount |
Token ID | 2033 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
unity | +24.545 |
assemblies | +23.252 |
prayers | +22.992 |
doors | +22.648 |
Commands | +22.629 |
Neg logit contributions | |
paed | -13.486 |
HSBC | -11.297 |
neurot | -11.078 |
ITV | -11.052 |
unethical | -10.710 |
Token |
|
Token ID | 198 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
unity | +0.156 |
Commands | +0.151 |
aturdays | +0.149 |
enaries | +0.148 |
Rules | +0.146 |
Neg logit contributions | |
paed | -0.128 |
neurot | -0.113 |
Australian | -0.112 |
HSBC | -0.110 |
unethical | -0.110 |
Token | At |
Token ID | 2953 |
Feature activation | +9.43e+00 |
Pos logit contributions | |
Rules | +13.972 |
unity | +13.370 |
Commands | +13.019 |
aturdays | +12.872 |
enaries | +12.758 |
Neg logit contributions | |
paed | -13.959 |
neurot | -12.367 |
ageing | -11.962 |
unethical | -11.948 |
piracy | -11.891 |
Token | the |
Token ID | 262 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
unity | +9.787 |
Commands | +9.371 |
assemblies | +9.068 |
doors | +9.014 |
Rules | +8.969 |
Neg logit contributions | |
paed | -9.286 |
neurot | -8.277 |
unethical | -8.035 |
Australian | -7.982 |
piracy | -7.949 |
Token | California |
Token ID | 3442 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
unity | +19.456 |
doors | +18.463 |
Commands | +18.454 |
assemblies | +17.937 |
prayers | +17.678 |
Neg logit contributions | |
paed | -13.420 |
neurot | -11.690 |
piracy | -11.227 |
unethical | -11.196 |
ITV | -10.912 |
Token | Constitutional |
Token ID | 26740 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
unity | +13.081 |
Commands | +12.415 |
doors | +12.151 |
assemblies | +12.101 |
Rules | +11.986 |
Neg logit contributions | |
paed | -10.970 |
neurot | -9.636 |
unethical | -9.435 |
HSBC | -9.285 |
Australian | -9.226 |
Token | Convention |
Token ID | 11680 |
Feature activation | +4.21e+01 |
Pos logit contributions | |
unity | +17.493 |
Commands | +16.909 |
assemblies | +16.576 |
Rules | +15.817 |
doors | +15.814 |
Neg logit contributions | |
paed | -19.952 |
neurot | -17.476 |
HSBC | -17.178 |
commercially | -17.078 |
unethical | -17.041 |
Token | of |
Token ID | 286 |
Feature activation | +2.70e+01 |
Pos logit contributions | |
unity | +32.990 |
assemblies | +32.536 |
prayers | +32.468 |
Commands | +32.385 |
doors | +31.460 |
Neg logit contributions | |
paed | -19.097 |
neurot | -17.373 |
ageing | -16.278 |
ITV | -16.064 |
unethical | -15.725 |
Token | 18 |
Token ID | 1248 |
Feature activation | +9.33e+00 |
Pos logit contributions | |
unity | +25.101 |
Commands | +24.083 |
assemblies | +23.723 |
prayers | +23.302 |
doors | +23.154 |
Neg logit contributions | |
paed | -18.280 |
neurot | -15.893 |
unethical | -15.558 |
doping | -15.340 |
ageing | -15.310 |
Token | 78 |
Token ID | 3695 |
Feature activation | +3.35e+01 |
Pos logit contributions | |
unity | +7.928 |
Commands | +7.816 |
Rules | +7.580 |
doors | +7.305 |
assemblies | +7.267 |
Neg logit contributions | |
paed | -10.979 |
neurot | -9.948 |
unethical | -9.873 |
piracy | -9.756 |
ageing | -9.598 |
Token | – |
Token ID | 1906 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
unity | +29.983 |
assemblies | +29.053 |
prayers | +28.973 |
Commands | +28.480 |
Rules | +28.123 |
Neg logit contributions | |
paed | -18.192 |
neurot | -15.348 |
ageing | -15.117 |
ITV | -14.518 |
unethical | -14.376 |
Token | 79 |
Token ID | 3720 |
Feature activation | +3.74e+01 |
Pos logit contributions | |
unity | +10.494 |
Rules | +10.107 |
Commands | +10.095 |
aturdays | +9.981 |
enaries | +9.860 |
Neg logit contributions | |
paed | -14.411 |
neurot | -13.097 |
piracy | -12.630 |
HSBC | -12.526 |
unethical | -12.477 |
Token | � |
Token ID | 250 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
unity | +3.095 |
Commands | +3.019 |
aturdays | +2.964 |
enaries | +2.960 |
Rules | +2.936 |
Neg logit contributions | |
paed | -1.739 |
neurot | -1.471 |
Australian | -1.447 |
unethical | -1.421 |
HSBC | -1.419 |
Token | I |
Token ID | 40 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
unity | +20.009 |
Rules | +19.882 |
Commands | +18.563 |
isans | +18.450 |
aturdays | +18.285 |
Neg logit contributions | |
paed | -18.367 |
neurot | -16.073 |
unethical | -15.787 |
dermat | -15.741 |
NZ | -15.464 |
Token | have |
Token ID | 423 |
Feature activation | +4.18e+01 |
Pos logit contributions | |
unity | +14.328 |
Commands | +13.634 |
assemblies | +13.228 |
doors | +13.086 |
enaries | +13.017 |
Neg logit contributions | |
paed | -12.865 |
neurot | -11.200 |
piracy | -11.195 |
unethical | -11.176 |
Australian | -11.087 |
Token | said |
Token ID | 531 |
Feature activation | +2.73e+01 |
Pos logit contributions | |
unity | +36.841 |
prayers | +34.410 |
assemblies | +34.331 |
doors | +33.137 |
Commands | +32.495 |
Neg logit contributions | |
paed | -15.712 |
ITV | -13.146 |
HSBC | -12.908 |
piracy | -12.906 |
neurot | -12.643 |
Token | I |
Token ID | 314 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
unity | +28.113 |
prayers | +26.553 |
assemblies | +25.869 |
doors | +25.519 |
Commands | +25.063 |
Neg logit contributions | |
paed | -15.518 |
neurot | -13.195 |
dermat | -12.778 |
unethical | -12.679 |
HSBC | -12.667 |
Token | have |
Token ID | 423 |
Feature activation | +4.20e+01 |
Pos logit contributions | |
unity | +18.759 |
Commands | +17.671 |
doors | +17.217 |
assemblies | +17.139 |
prayers | +16.950 |
Neg logit contributions | |
paed | -16.355 |
piracy | -14.286 |
unethical | -14.278 |
neurot | -14.100 |
Australian | -13.877 |
Token | always |
Token ID | 1464 |
Feature activation | +3.47e+01 |
Pos logit contributions | |
unity | +38.088 |
prayers | +35.015 |
assemblies | +34.598 |
doors | +34.229 |
Commands | +33.075 |
Neg logit contributions | |
paed | -14.863 |
ITV | -12.688 |
unethical | -12.504 |
HSBC | -12.262 |
piracy | -12.199 |
Token | acted |
Token ID | 13134 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
unity | +32.573 |
doors | +29.783 |
prayers | +29.459 |
assemblies | +29.216 |
prayed | +28.731 |
Neg logit contributions | |
paed | -15.740 |
ITV | -14.544 |
unethical | -14.278 |
piracy | -14.219 |
HSBC | -14.032 |
Token | in |
Token ID | 287 |
Feature activation | +2.40e+01 |
Pos logit contributions | |
unity | +22.339 |
assemblies | +20.807 |
Commands | +20.616 |
prayers | +20.588 |
doors | +20.254 |
Neg logit contributions | |
paed | -14.615 |
ITV | -12.668 |
HSBC | -12.572 |
neurot | -12.355 |
piracy | -12.275 |
Token | accordance |
Token ID | 10213 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
unity | +27.067 |
assemblies | +25.287 |
prayers | +24.607 |
doors | +24.263 |
Commands | +23.705 |
Neg logit contributions | |
paed | -14.121 |
neurot | -12.352 |
ITV | -12.100 |
HSBC | -11.944 |
ageing | -11.920 |
Token | with |
Token ID | 351 |
Feature activation | +2.72e+01 |
Pos logit contributions | |
unity | +11.249 |
Commands | +10.226 |
assemblies | +10.189 |
Rules | +10.065 |
doors | +10.042 |
Neg logit contributions | |
paed | -14.517 |
neurot | -13.163 |
HSBC | -12.978 |
Australian | -12.823 |
unethical | -12.788 |
Token | into |
Token ID | 656 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
unity | +22.476 |
prayers | +22.122 |
doors | +21.250 |
Commands | +21.048 |
assemblies | +21.026 |
Neg logit contributions | |
paed | -16.705 |
neurot | -14.638 |
unethical | -14.404 |
HSBC | -14.023 |
piracy | -13.987 |
Token | the |
Token ID | 262 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
unity | +14.918 |
prayers | +14.059 |
doors | +13.977 |
Commands | +13.832 |
assemblies | +13.813 |
Neg logit contributions | |
paed | -12.195 |
unethical | -10.802 |
neurot | -10.780 |
HSBC | -10.491 |
piracy | -10.444 |
Token | microphone |
Token ID | 21822 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
unity | +20.238 |
prayers | +19.254 |
doors | +19.040 |
assemblies | +18.744 |
Commands | +18.584 |
Neg logit contributions | |
paed | -12.209 |
unethical | -10.590 |
piracy | -10.420 |
HSBC | -10.305 |
neurot | -10.216 |
Token | as |
Token ID | 355 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
unity | +18.358 |
doors | +17.759 |
prayers | +17.507 |
assemblies | +17.310 |
Commands | +17.277 |
Neg logit contributions | |
paed | -17.642 |
unethical | -15.264 |
neurot | -15.123 |
HSBC | -14.942 |
piracy | -14.734 |
Token | the |
Token ID | 262 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
unity | +26.099 |
prayers | +25.392 |
doors | +24.925 |
assemblies | +24.526 |
Commands | +24.204 |
Neg logit contributions | |
paed | -13.801 |
neurot | -12.104 |
unethical | -12.008 |
HSBC | -11.524 |
piracy | -11.258 |
Token | teenagers |
Token ID | 17366 |
Feature activation | +4.18e+01 |
Pos logit contributions | |
unity | +27.141 |
doors | +26.419 |
prayers | +26.245 |
assemblies | +25.832 |
Commands | +24.841 |
Neg logit contributions | |
paed | -12.906 |
unethical | -10.786 |
HSBC | -10.542 |
neurot | -10.525 |
piracy | -10.359 |
Token | dropped |
Token ID | 5710 |
Feature activation | +8.58e+00 |
Pos logit contributions | |
unity | +33.121 |
prayed | +32.078 |
prayers | +31.609 |
assemblies | +30.858 |
doors | +30.783 |
Neg logit contributions | |
paed | -19.375 |
unethical | -16.275 |
piracy | -15.741 |
neurot | -15.248 |
HSBC | -14.896 |
Token | their |
Token ID | 511 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
unity | +9.525 |
Commands | +9.086 |
prayers | +8.941 |
doors | +8.909 |
assemblies | +8.899 |
Neg logit contributions | |
paed | -8.026 |
neurot | -6.908 |
unethical | -6.857 |
Australian | -6.797 |
HSBC | -6.793 |
Token | notes |
Token ID | 4710 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
unity | +20.044 |
prayers | +19.502 |
assemblies | +19.189 |
doors | +19.166 |
Commands | +18.984 |
Neg logit contributions | |
paed | -11.284 |
unethical | -9.152 |
HSBC | -9.121 |
neurot | -9.056 |
piracy | -8.965 |
Token | into |
Token ID | 656 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
unity | +16.124 |
prayers | +15.725 |
Commands | +15.696 |
doors | +15.366 |
assemblies | +15.352 |
Neg logit contributions | |
paed | -16.631 |
neurot | -14.236 |
unethical | -14.128 |
Australian | -13.942 |
HSBC | -13.934 |
Token | the |
Token ID | 262 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
unity | +18.980 |
prayers | +17.996 |
doors | +17.953 |
assemblies | +17.702 |
Commands | +17.639 |
Neg logit contributions | |
paed | -13.262 |
unethical | -11.394 |
neurot | -11.391 |
piracy | -11.140 |
Australian | -11.021 |
Token | Format |
Token ID | 26227 |
Feature activation | +2.13e+01 |
Pos logit contributions | |
Rules | +12.722 |
unity | +11.780 |
Commands | +11.685 |
Dialogue | +10.963 |
Values | +10.919 |
Neg logit contributions | |
paed | -22.264 |
neurot | -20.208 |
unethical | -20.101 |
piracy | -20.052 |
ageing | -19.750 |
Token | . |
Token ID | 13 |
Feature activation | +3.42e+01 |
Pos logit contributions | |
unity | +18.309 |
Rules | +17.741 |
Commands | +17.705 |
assemblies | +16.593 |
doors | +16.556 |
Neg logit contributions | |
paed | -19.468 |
neurot | -17.439 |
unethical | -16.982 |
piracy | -16.980 |
commercially | -16.900 |
Token | Line |
Token ID | 13949 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
Rules | +27.947 |
unity | +26.720 |
Commands | +26.268 |
Values | +25.834 |
Dialogue | +25.063 |
Neg logit contributions | |
paed | -22.379 |
neurot | -20.014 |
unethical | -19.917 |
commercially | -19.806 |
piracy | -19.352 |
Token | Al |
Token ID | 2348 |
Feature activation | +9.99e+00 |
Pos logit contributions | |
unity | +19.985 |
Commands | +19.281 |
Rules | +19.270 |
aturdays | +18.454 |
assemblies | +18.143 |
Neg logit contributions | |
paed | -18.115 |
neurot | -16.241 |
unethical | -15.869 |
piracy | -15.797 |
commercially | -15.569 |
Token | ignment |
Token ID | 16747 |
Feature activation | +2.43e+01 |
Pos logit contributions | |
unity | +6.007 |
Commands | +5.430 |
isans | +5.276 |
Rules | +5.143 |
enaries | +5.137 |
Neg logit contributions | |
paed | -14.547 |
neurot | -13.360 |
unethical | -13.200 |
piracy | -13.101 |
Australian | -13.063 |
Token | = |
Token ID | 796 |
Feature activation | +4.18e+01 |
Pos logit contributions | |
unity | +19.686 |
Rules | +19.196 |
Commands | +18.814 |
endas | +17.689 |
enaries | +17.625 |
Neg logit contributions | |
paed | -21.629 |
neurot | -19.490 |
piracy | -19.353 |
unethical | -19.154 |
commercially | -18.792 |
Token | [ |
Token ID | 685 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
unity | +36.547 |
Commands | +33.281 |
doors | +32.245 |
assemblies | +31.508 |
Rules | +30.808 |
Neg logit contributions | |
paed | -19.461 |
neurot | -16.462 |
piracy | -15.615 |
unethical | -15.446 |
doping | -15.023 |
Token | system |
Token ID | 10057 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
unity | +24.385 |
Rules | +21.799 |
Commands | +21.614 |
aturdays | +21.404 |
assemblies | +21.309 |
Neg logit contributions | |
paed | -21.427 |
neurot | -18.948 |
ITV | -18.678 |
unethical | -18.285 |
HSBC | -17.991 |
Token | . |
Token ID | 13 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
unity | +11.284 |
Rules | +10.986 |
Commands | +10.881 |
isans | +10.652 |
enaries | +10.318 |
Neg logit contributions | |
paed | -16.360 |
unethical | -14.872 |
neurot | -14.727 |
piracy | -14.714 |
ageing | -14.252 |
Token | draw |
Token ID | 19334 |
Feature activation | +5.78e+00 |
Pos logit contributions | |
unity | +17.484 |
isans | +16.256 |
Commands | +16.161 |
enaries | +15.734 |
Rules | +15.727 |
Neg logit contributions | |
paed | -25.647 |
unethical | -22.892 |
ITV | -22.616 |
neurot | -22.483 |
piracy | -22.306 |
Token | ing |
Token ID | 278 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
unity | +5.249 |
Commands | +5.005 |
Rules | +4.916 |
enaries | +4.889 |
isans | +4.889 |
Neg logit contributions | |
paed | -6.749 |
neurot | -6.077 |
unethical | -6.023 |
piracy | -5.980 |
Australian | -5.902 |
Token | judges |
Token ID | 10266 |
Feature activation | +2.30e+01 |
Pos logit contributions | |
unity | +23.171 |
doors | +21.901 |
assemblies | +21.601 |
prayers | +21.054 |
Commands | +21.026 |
Neg logit contributions | |
paed | -12.837 |
neurot | -11.209 |
piracy | -10.671 |
unethical | -10.601 |
dermat | -10.327 |
Token | : |
Token ID | 25 |
Feature activation | +2.28e+01 |
Pos logit contributions | |
unity | +23.515 |
assemblies | +22.188 |
prayers | +21.786 |
doors | +21.778 |
Commands | +21.743 |
Neg logit contributions | |
paed | -15.327 |
neurot | -13.712 |
unethical | -13.137 |
dermat | -13.116 |
piracy | -12.543 |
Token | � |
Token ID | 564 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
unity | +23.375 |
Commands | +21.858 |
assemblies | +21.641 |
doors | +21.624 |
prayers | +21.424 |
Neg logit contributions | |
paed | -15.247 |
neurot | -13.372 |
unethical | -13.342 |
piracy | -12.899 |
HSBC | -12.699 |
Token | � |
Token ID | 250 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
unity | +3.095 |
Commands | +3.019 |
aturdays | +2.964 |
enaries | +2.960 |
Rules | +2.936 |
Neg logit contributions | |
paed | -1.739 |
neurot | -1.471 |
Australian | -1.447 |
unethical | -1.421 |
HSBC | -1.419 |
Token | I |
Token ID | 40 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
unity | +20.009 |
Rules | +19.882 |
Commands | +18.563 |
isans | +18.450 |
aturdays | +18.285 |
Neg logit contributions | |
paed | -18.367 |
neurot | -16.073 |
unethical | -15.787 |
dermat | -15.741 |
NZ | -15.464 |
Token | have |
Token ID | 423 |
Feature activation | +4.18e+01 |
Pos logit contributions | |
unity | +14.328 |
Commands | +13.634 |
assemblies | +13.228 |
doors | +13.086 |
enaries | +13.017 |
Neg logit contributions | |
paed | -12.865 |
neurot | -11.200 |
piracy | -11.195 |
unethical | -11.176 |
Australian | -11.087 |
Token | said |
Token ID | 531 |
Feature activation | +2.73e+01 |
Pos logit contributions | |
unity | +36.841 |
prayers | +34.410 |
assemblies | +34.331 |
doors | +33.137 |
Commands | +32.495 |
Neg logit contributions | |
paed | -15.712 |
ITV | -13.146 |
HSBC | -12.908 |
piracy | -12.906 |
neurot | -12.643 |
Token | I |
Token ID | 314 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
unity | +28.113 |
prayers | +26.553 |
assemblies | +25.869 |
doors | +25.519 |
Commands | +25.063 |
Neg logit contributions | |
paed | -15.518 |
neurot | -13.195 |
dermat | -12.778 |
unethical | -12.679 |
HSBC | -12.667 |
Token | have |
Token ID | 423 |
Feature activation | +4.20e+01 |
Pos logit contributions | |
unity | +18.759 |
Commands | +17.671 |
doors | +17.217 |
assemblies | +17.139 |
prayers | +16.950 |
Neg logit contributions | |
paed | -16.355 |
piracy | -14.286 |
unethical | -14.278 |
neurot | -14.100 |
Australian | -13.877 |
Token | always |
Token ID | 1464 |
Feature activation | +3.47e+01 |
Pos logit contributions | |
unity | +38.088 |
prayers | +35.015 |
assemblies | +34.598 |
doors | +34.229 |
Commands | +33.075 |
Neg logit contributions | |
paed | -14.863 |
ITV | -12.688 |
unethical | -12.504 |
HSBC | -12.262 |
piracy | -12.199 |
Token | acted |
Token ID | 13134 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
unity | +32.573 |
doors | +29.783 |
prayers | +29.459 |
assemblies | +29.216 |
prayed | +28.731 |
Neg logit contributions | |
paed | -15.740 |
ITV | -14.544 |
unethical | -14.278 |
piracy | -14.219 |
HSBC | -14.032 |
Token | begins |
Token ID | 6140 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
unity | +20.465 |
Commands | +20.202 |
prayers | +19.369 |
doors | +19.171 |
Rules | +19.154 |
Neg logit contributions | |
paed | -15.688 |
unethical | -13.459 |
neurot | -13.310 |
piracy | -13.224 |
HSBC | -13.145 |
Token | with |
Token ID | 351 |
Feature activation | +2.89e+01 |
Pos logit contributions | |
unity | +15.783 |
Commands | +15.046 |
prayers | +14.746 |
assemblies | +14.557 |
doors | +14.486 |
Neg logit contributions | |
paed | -16.176 |
neurot | -14.420 |
unethical | -13.904 |
Australian | -13.792 |
ITV | -13.761 |
Token | : |
Token ID | 25 |
Feature activation | +3.10e+01 |
Pos logit contributions | |
unity | +28.220 |
prayers | +26.987 |
Commands | +26.881 |
Rules | +25.729 |
doors | +25.627 |
Neg logit contributions | |
paed | -17.070 |
neurot | -14.411 |
unethical | -13.796 |
ITV | -13.613 |
commercially | -13.466 |
Token |
|
Token ID | 198 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
unity | +27.126 |
Commands | +25.663 |
Rules | +25.578 |
prayers | +24.689 |
endas | +24.565 |
Neg logit contributions | |
paed | -19.950 |
neurot | -17.362 |
unethical | -16.877 |
underestimate | -16.596 |
HSBC | -16.593 |
Token |
|
Token ID | 198 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
unity | +12.501 |
Rules | +12.289 |
Commands | +12.202 |
doors | +11.511 |
isans | +11.255 |
Neg logit contributions | |
paed | -19.921 |
unethical | -18.129 |
senal | -17.884 |
piracy | -17.854 |
neurot | -17.793 |
Token | The |
Token ID | 464 |
Feature activation | +4.17e+01 |
Pos logit contributions | |
Rules | +26.683 |
unity | +23.592 |
Commands | +22.536 |
Dialogue | +22.371 |
enaries | +22.102 |
Neg logit contributions | |
paed | -24.539 |
HSBC | -22.481 |
underestimate | -21.697 |
unethical | -21.659 |
neurot | -21.560 |
Token | Citizens |
Token ID | 18029 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
unity | +37.586 |
Commands | +35.573 |
prayers | +35.084 |
assemblies | +34.975 |
doors | +34.874 |
Neg logit contributions | |
paed | -16.954 |
HSBC | -15.024 |
ITV | -14.372 |
neurot | -14.278 |
unethical | -13.928 |
Token | of |
Token ID | 286 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
unity | +19.471 |
Commands | +18.980 |
assemblies | +18.767 |
prayers | +17.774 |
enaries | +17.705 |
Neg logit contributions | |
paed | -17.825 |
unethical | -15.524 |
neurot | -15.476 |
HSBC | -15.337 |
dermat | -15.285 |
Token | each |
Token ID | 1123 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
unity | +13.053 |
Commands | +12.585 |
assemblies | +12.044 |
enaries | +11.806 |
Rules | +11.797 |
Neg logit contributions | |
paed | -12.022 |
neurot | -10.772 |
unethical | -10.438 |
HSBC | -10.383 |
piracy | -10.335 |
Token | State |
Token ID | 1812 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
unity | +8.539 |
Commands | +7.925 |
Rules | +7.386 |
assemblies | +7.377 |
isans | +7.296 |
Neg logit contributions | |
paed | -14.920 |
neurot | -13.693 |
HSBC | -13.683 |
unethical | -13.551 |
piracy | -13.520 |
Token | shall |
Token ID | 2236 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
unity | +19.328 |
Commands | +18.300 |
assemblies | +18.068 |
prayers | +17.371 |
Rules | +17.334 |
Neg logit contributions | |
paed | -16.492 |
HSBC | -14.563 |
unethical | -14.338 |
neurot | -14.267 |
NZ | -13.856 |
Token | The |
Token ID | 464 |
Feature activation | +2.55e+01 |
Pos logit contributions | |
Rules | +19.330 |
Dialogue | +17.565 |
unity | +17.233 |
Commands | +16.984 |
isans | +16.591 |
Neg logit contributions | |
paed | -19.266 |
piracy | -16.919 |
neurot | -16.875 |
unethical | -16.664 |
dermat | -16.530 |
Token | Los |
Token ID | 5401 |
Feature activation | +4.56e+00 |
Pos logit contributions | |
unity | +27.016 |
doors | +25.867 |
Commands | +25.814 |
assemblies | +25.490 |
prayers | +25.113 |
Neg logit contributions | |
paed | -14.995 |
neurot | -12.261 |
piracy | -12.124 |
ITV | -11.898 |
HSBC | -11.666 |
Token | Angeles |
Token ID | 5652 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
unity | +4.380 |
Commands | +4.270 |
enaries | +4.103 |
Rules | +4.080 |
assemblies | +4.044 |
Neg logit contributions | |
paed | -5.134 |
neurot | -4.610 |
unethical | -4.509 |
piracy | -4.500 |
Australian | -4.456 |
Token | City |
Token ID | 2254 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
unity | +21.912 |
Commands | +21.454 |
assemblies | +20.601 |
Rules | +20.589 |
doors | +20.566 |
Neg logit contributions | |
paed | -16.070 |
neurot | -14.293 |
unethical | -13.730 |
piracy | -13.599 |
HSBC | -13.502 |
Token | Council |
Token ID | 4281 |
Feature activation | +3.19e+01 |
Pos logit contributions | |
unity | +18.383 |
Commands | +18.160 |
Rules | +17.489 |
assemblies | +17.242 |
enaries | +16.971 |
Neg logit contributions | |
paed | -21.485 |
neurot | -19.133 |
piracy | -18.710 |
unethical | -18.397 |
HSBC | -18.231 |
Token | has |
Token ID | 468 |
Feature activation | +4.17e+01 |
Pos logit contributions | |
unity | +27.963 |
Commands | +27.884 |
assemblies | +27.686 |
Rules | +27.271 |
prayers | +27.057 |
Neg logit contributions | |
paed | -18.581 |
piracy | -15.032 |
unethical | -14.818 |
HSBC | -14.773 |
ITV | -14.768 |
Token | been |
Token ID | 587 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
unity | +33.266 |
assemblies | +32.333 |
prayers | +31.748 |
doors | +31.484 |
Commands | +31.115 |
Neg logit contributions | |
paed | -19.138 |
ITV | -15.911 |
piracy | -15.832 |
HSBC | -15.555 |
unethical | -14.872 |
Token | trying |
Token ID | 2111 |
Feature activation | +5.99e+00 |
Pos logit contributions | |
unity | +21.891 |
prayers | +20.788 |
assemblies | +20.743 |
Commands | +20.656 |
isans | +20.565 |
Neg logit contributions | |
paed | -15.833 |
HSBC | -13.248 |
ITV | -13.196 |
neurot | -13.110 |
piracy | -13.109 |
Token | for |
Token ID | 329 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
unity | +6.701 |
Commands | +6.424 |
enaries | +6.335 |
aturdays | +6.287 |
assemblies | +6.270 |
Neg logit contributions | |
paed | -5.731 |
neurot | -5.030 |
HSBC | -4.924 |
Australian | -4.909 |
unethical | -4.873 |
Token | six |
Token ID | 2237 |
Feature activation | +9.48e+00 |
Pos logit contributions | |
unity | +10.564 |
Commands | +9.913 |
doors | +9.673 |
assemblies | +9.618 |
enaries | +9.616 |
Neg logit contributions | |
paed | -11.526 |
neurot | -10.314 |
unethical | -10.073 |
HSBC | -10.072 |
piracy | -10.025 |
Token | years |
Token ID | 812 |
Feature activation | +4.97e-01 |
Pos logit contributions | |
unity | +8.749 |
assemblies | +8.273 |
Commands | +8.269 |
enaries | +8.180 |
doors | +8.134 |
Neg logit contributions | |
paed | -10.401 |
HSBC | -9.255 |
neurot | -9.242 |
Australian | -9.071 |
ITV | -9.070 |
Token | of |
Token ID | 286 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
unity | +13.771 |
Commands | +13.069 |
Rules | +12.756 |
prayers | +12.746 |
assemblies | +12.718 |
Neg logit contributions | |
paed | -12.366 |
neurot | -10.871 |
unethical | -10.787 |
HSBC | -10.601 |
ITV | -10.506 |
Token | the |
Token ID | 262 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
unity | +11.083 |
Commands | +10.641 |
assemblies | +10.377 |
Rules | +10.266 |
endas | +10.153 |
Neg logit contributions | |
paed | -10.652 |
neurot | -9.487 |
unethical | -9.109 |
piracy | -9.052 |
ITV | -9.009 |
Token | Constitution |
Token ID | 7965 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
unity | +18.418 |
Commands | +17.817 |
assemblies | +17.391 |
Rules | +17.310 |
prayers | +17.158 |
Neg logit contributions | |
paed | -12.297 |
neurot | -10.397 |
unethical | -10.095 |
piracy | -10.065 |
commercially | -9.877 |
Token | , |
Token ID | 11 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
unity | +11.038 |
Commands | +10.682 |
Rules | +10.319 |
enaries | +10.312 |
prayers | +10.297 |
Neg logit contributions | |
paed | -11.746 |
unethical | -10.404 |
neurot | -10.344 |
HSBC | -10.203 |
piracy | -10.069 |
Token | which |
Token ID | 543 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
unity | +13.374 |
Commands | +12.855 |
Rules | +12.540 |
assemblies | +12.534 |
prayers | +12.479 |
Neg logit contributions | |
paed | -10.636 |
neurot | -9.175 |
unethical | -8.937 |
HSBC | -8.824 |
ITV | -8.810 |
Token | says |
Token ID | 1139 |
Feature activation | +4.13e+01 |
Pos logit contributions | |
unity | +13.777 |
Commands | +13.410 |
assemblies | +12.866 |
prayers | +12.700 |
Rules | +12.617 |
Neg logit contributions | |
paed | -12.067 |
neurot | -10.663 |
unethical | -10.354 |
HSBC | -10.228 |
ITV | -10.219 |
Token | that |
Token ID | 326 |
Feature activation | +4.54e+01 |
Pos logit contributions | |
unity | +36.894 |
prayers | +34.865 |
assemblies | +34.153 |
Commands | +33.949 |
doors | +33.632 |
Neg logit contributions | |
paed | -16.824 |
ITV | -14.942 |
neurot | -14.432 |
HSBC | -14.329 |
NZ | -13.486 |
Token | the |
Token ID | 262 |
Feature activation | +3.45e+01 |
Pos logit contributions | |
unity | +38.844 |
prayers | +36.592 |
assemblies | +36.406 |
Commands | +35.542 |
doors | +35.258 |
Neg logit contributions | |
paed | -17.273 |
ITV | -15.212 |
HSBC | -15.113 |
neurot | -14.454 |
NZ | -13.885 |
Token | president |
Token ID | 1893 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
unity | +34.204 |
assemblies | +32.204 |
Commands | +32.045 |
doors | +31.826 |
prayers | +31.553 |
Neg logit contributions | |
paed | -16.443 |
HSBC | -13.931 |
ITV | -13.800 |
piracy | -13.454 |
neurot | -13.169 |
Token | � |
Token ID | 564 |
Feature activation | -7.35e+00 |
Pos logit contributions | |
unity | +14.868 |
Commands | +14.385 |
assemblies | +13.972 |
prayers | +13.893 |
doors | +13.637 |
Neg logit contributions | |
paed | -12.766 |
HSBC | -11.210 |
neurot | -11.132 |
piracy | -11.006 |
unethical | -10.979 |
Token | � |
Token ID | 250 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
paed | +6.399 |
Australian | +5.657 |
neurot | +5.565 |
HSBC | +5.488 |
unethical | +5.440 |
Neg logit contributions | |
unity | -8.561 |
aturdays | -8.468 |
Commands | -8.223 |
enaries | -8.204 |
assemblies | -8.069 |
Token | and |
Token ID | 290 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
unity | +14.819 |
doors | +13.780 |
Commands | +13.768 |
prayers | +13.719 |
assemblies | +13.623 |
Neg logit contributions | |
paed | -14.230 |
neurot | -12.561 |
piracy | -12.213 |
unethical | -12.199 |
Australian | -12.154 |
Token | ' |
Token ID | 705 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
unity | +26.258 |
prayers | +24.196 |
doors | +23.961 |
assemblies | +23.707 |
Commands | +23.051 |
Neg logit contributions | |
paed | -15.217 |
piracy | -12.994 |
neurot | -12.978 |
unethical | -12.724 |
HSBC | -12.655 |
Token | stand |
Token ID | 1481 |
Feature activation | +2.57e+01 |
Pos logit contributions | |
unity | +15.339 |
Rules | +14.715 |
enaries | +14.625 |
isans | +14.546 |
Commands | +14.367 |
Neg logit contributions | |
paed | -15.872 |
unethical | -13.971 |
neurot | -13.882 |
piracy | -13.880 |
Australian | -13.603 |
Token | up |
Token ID | 510 |
Feature activation | +1.76e+01 |
Pos logit contributions | |
unity | +24.648 |
doors | +22.788 |
prayers | +22.200 |
assemblies | +21.918 |
Commands | +21.688 |
Neg logit contributions | |
paed | -18.397 |
neurot | -16.152 |
unethical | -15.418 |
ransomware | -15.307 |
HSBC | -15.285 |
Token | for |
Token ID | 329 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
unity | +17.436 |
doors | +15.951 |
Commands | +15.711 |
prayers | +15.618 |
assemblies | +15.581 |
Neg logit contributions | |
paed | -15.461 |
neurot | -13.874 |
HSBC | -13.448 |
piracy | -13.406 |
unethical | -13.111 |
Token | our |
Token ID | 674 |
Feature activation | +4.12e+01 |
Pos logit contributions | |
unity | +29.130 |
doors | +26.708 |
prayers | +25.572 |
assemblies | +25.081 |
Commands | +24.520 |
Neg logit contributions | |
paed | -15.782 |
neurot | -14.364 |
HSBC | -13.690 |
ITV | -13.617 |
piracy | -13.313 |
Token | proud |
Token ID | 6613 |
Feature activation | +2.57e+01 |
Pos logit contributions | |
unity | +37.697 |
doors | +34.691 |
prayers | +34.064 |
assemblies | +32.360 |
Commands | +31.492 |
Neg logit contributions | |
paed | -17.269 |
ITV | -15.273 |
neurot | -15.046 |
piracy | -14.841 |
ASIC | -14.836 |
Token | American |
Token ID | 1605 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
unity | +27.528 |
doors | +25.052 |
prayers | +25.046 |
assemblies | +24.706 |
isans | +24.677 |
Neg logit contributions | |
paed | -15.815 |
neurot | -14.061 |
HSBC | -13.915 |
unethical | -13.868 |
piracy | -13.583 |
Token | values |
Token ID | 3815 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
unity | +30.075 |
doors | +26.913 |
isans | +26.790 |
prayers | +26.788 |
Commands | +26.221 |
Neg logit contributions | |
paed | -17.032 |
neurot | -14.988 |
unethical | -14.784 |
HSBC | -14.601 |
piracy | -14.408 |
Token | .' |
Token ID | 2637 |
Feature activation | +4.40e+00 |
Pos logit contributions | |
unity | +20.753 |
isans | +19.074 |
prayers | +18.923 |
assemblies | +18.815 |
Commands | +18.797 |
Neg logit contributions | |
paed | -18.233 |
unethical | -15.649 |
neurot | -15.517 |
piracy | -15.507 |
HSBC | -15.464 |
Token |
|
Token ID | 198 |
Feature activation | -6.07e+00 |
Pos logit contributions | |
unity | +4.824 |
Commands | +4.667 |
aturdays | +4.557 |
enaries | +4.541 |
Rules | +4.508 |
Neg logit contributions | |
paed | -4.369 |
neurot | -3.869 |
unethical | -3.792 |
Australian | -3.786 |
piracy | -3.777 |
Token | [ |
Token ID | 685 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
unity | +25.550 |
Commands | +25.176 |
Rules | +23.770 |
doors | +23.679 |
assemblies | +23.315 |
Neg logit contributions | |
paed | -16.489 |
neurot | -14.307 |
HSBC | -14.114 |
piracy | -13.499 |
unethical | -13.457 |
Token | text |
Token ID | 5239 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
unity | +16.377 |
Commands | +15.649 |
Rules | +15.183 |
enaries | +14.866 |
aturdays | +14.617 |
Neg logit contributions | |
paed | -17.183 |
HSBC | -15.217 |
neurot | -15.093 |
piracy | -14.971 |
unethical | -14.934 |
Token | ] |
Token ID | 60 |
Feature activation | +2.79e+01 |
Pos logit contributions | |
unity | +17.934 |
Commands | +16.613 |
Rules | +16.030 |
doors | +15.937 |
assemblies | +15.920 |
Neg logit contributions | |
paed | -19.398 |
HSBC | -17.130 |
unethical | -17.128 |
neurot | -17.064 |
piracy | -16.883 |
Token | any |
Token ID | 597 |
Feature activation | +2.63e+01 |
Pos logit contributions | |
unity | +27.063 |
Commands | +26.983 |
doors | +25.132 |
Rules | +25.089 |
assemblies | +24.669 |
Neg logit contributions | |
paed | -17.018 |
neurot | -14.995 |
HSBC | -14.666 |
piracy | -14.006 |
unethical | -13.976 |
Token | text |
Token ID | 2420 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
unity | +25.193 |
Commands | +23.605 |
doors | +22.550 |
prayers | +22.104 |
assemblies | +21.943 |
Neg logit contributions | |
paed | -17.362 |
neurot | -15.658 |
HSBC | -15.656 |
unethical | -15.288 |
ITV | -15.163 |
Token | or |
Token ID | 393 |
Feature activation | +4.11e+01 |
Pos logit contributions | |
unity | +20.147 |
Commands | +19.620 |
doors | +18.568 |
Rules | +18.235 |
assemblies | +18.187 |
Neg logit contributions | |
paed | -16.992 |
neurot | -15.479 |
HSBC | -15.289 |
unethical | -14.720 |
piracy | -14.655 |
Token | empty |
Token ID | 6565 |
Feature activation | +3.52e+01 |
Pos logit contributions | |
unity | +33.823 |
doors | +31.276 |
Commands | +30.754 |
prayers | +29.655 |
assemblies | +29.260 |
Neg logit contributions | |
paed | -19.228 |
HSBC | -16.999 |
neurot | -16.513 |
ITV | -16.289 |
unethical | -16.244 |
Token | { |
Token ID | 1391 |
Feature activation | +2.19e+01 |
Pos logit contributions | |
unity | +30.820 |
Commands | +29.590 |
doors | +28.233 |
prayers | +27.600 |
Rules | +27.249 |
Neg logit contributions | |
paed | -19.734 |
neurot | -17.206 |
piracy | -16.690 |
HSBC | -16.597 |
unethical | -16.435 |
Token | white |
Token ID | 11186 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
unity | +18.041 |
Commands | +16.944 |
Rules | +16.575 |
enaries | +16.379 |
doors | +16.035 |
Neg logit contributions | |
paed | -20.264 |
HSBC | -18.076 |
neurot | -17.934 |
piracy | -17.856 |
unethical | -17.685 |
Token | } |
Token ID | 92 |
Feature activation | +3.70e+01 |
Pos logit contributions | |
unity | +16.385 |
Commands | +15.042 |
Rules | +14.686 |
doors | +14.616 |
enaries | +14.367 |
Neg logit contributions | |
paed | -19.786 |
HSBC | -17.636 |
neurot | -17.636 |
Australian | -17.438 |
unethical | -17.217 |
Token | at |
Token ID | 379 |
Feature activation | -5.18e+00 |
Pos logit contributions | |
unity | +31.957 |
Commands | +31.106 |
doors | +29.465 |
assemblies | +28.612 |
Rules | +28.345 |
Neg logit contributions | |
paed | -18.128 |
neurot | -16.226 |
HSBC | -15.838 |
unethical | -15.432 |
piracy | -15.250 |
Token | said |
Token ID | 531 |
Feature activation | +2.46e+01 |
Pos logit contributions | |
unity | +2.397 |
Commands | +2.304 |
aturdays | +2.262 |
enaries | +2.244 |
Rules | +2.214 |
Neg logit contributions | |
paed | -2.664 |
neurot | -2.382 |
Australian | -2.357 |
unethical | -2.335 |
HSBC | -2.330 |
Token | that |
Token ID | 326 |
Feature activation | +2.06e+01 |
Pos logit contributions | |
unity | +26.378 |
prayers | +24.401 |
doors | +23.993 |
Commands | +23.633 |
assemblies | +23.493 |
Neg logit contributions | |
paed | -14.837 |
neurot | -12.891 |
unethical | -12.428 |
HSBC | -12.008 |
ageing | -11.909 |
Token | � |
Token ID | 564 |
Feature activation | +2.42e+00 |
Pos logit contributions | |
unity | +23.736 |
prayers | +21.576 |
doors | +21.437 |
Commands | +21.200 |
assemblies | +21.103 |
Neg logit contributions | |
paed | -13.396 |
neurot | -11.416 |
HSBC | -10.940 |
unethical | -10.867 |
piracy | -10.780 |
Token | � |
Token ID | 250 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
unity | +3.647 |
Commands | +3.559 |
aturdays | +3.510 |
enaries | +3.503 |
Rules | +3.472 |
Neg logit contributions | |
paed | -1.429 |
neurot | -1.149 |
Australian | -1.126 |
HSBC | -1.097 |
unethical | -1.095 |
Token | Israel |
Token ID | 14040 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
unity | +14.462 |
Rules | +13.747 |
Commands | +13.412 |
aturdays | +13.376 |
isans | +13.289 |
Neg logit contributions | |
paed | -12.238 |
neurot | -10.767 |
HSBC | -10.546 |
unethical | -10.440 |
piracy | -10.334 |
Token | has |
Token ID | 468 |
Feature activation | +4.10e+01 |
Pos logit contributions | |
unity | +17.042 |
Commands | +15.851 |
isans | +15.721 |
enaries | +15.581 |
Rules | +15.519 |
Neg logit contributions | |
paed | -14.546 |
unethical | -12.467 |
neurot | -12.434 |
HSBC | -12.414 |
Australian | -12.388 |
Token | always |
Token ID | 1464 |
Feature activation | +3.35e+01 |
Pos logit contributions | |
unity | +36.075 |
prayers | +32.699 |
doors | +32.167 |
assemblies | +31.619 |
Rules | +31.460 |
Neg logit contributions | |
paed | -17.580 |
ITV | -14.599 |
HSBC | -14.197 |
piracy | -14.135 |
NZ | -14.104 |
Token | stri |
Token ID | 2338 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
unity | +29.767 |
doors | +27.135 |
prayers | +26.614 |
isans | +25.770 |
Commands | +25.646 |
Neg logit contributions | |
paed | -18.865 |
ITV | -16.859 |
HSBC | -16.359 |
piracy | -16.290 |
unethical | -16.162 |
Token | ved |
Token ID | 1079 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
unity | +13.280 |
Commands | +12.635 |
Rules | +12.498 |
enaries | +12.425 |
aturdays | +12.244 |
Neg logit contributions | |
paed | -11.060 |
neurot | -10.001 |
Australian | -9.766 |
HSBC | -9.750 |
unethical | -9.695 |
Token | for |
Token ID | 329 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
unity | +13.435 |
enaries | +12.152 |
Commands | +12.076 |
doors | +12.032 |
Rules | +11.977 |
Neg logit contributions | |
paed | -11.830 |
HSBC | -10.339 |
neurot | -10.310 |
ITV | -10.251 |
Australian | -10.228 |
Token | stable |
Token ID | 8245 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
unity | +21.423 |
doors | +18.706 |
isans | +18.394 |
prayers | +18.360 |
assemblies | +18.234 |
Neg logit contributions | |
paed | -13.425 |
ITV | -11.401 |
neurot | -11.351 |
HSBC | -11.266 |
piracy | -11.205 |
Token | ing |
Token ID | 278 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
unity | +7.847 |
Commands | +7.537 |
Rules | +7.507 |
isans | +7.316 |
enaries | +7.186 |
Neg logit contributions | |
paed | -11.647 |
neurot | -10.527 |
unethical | -10.485 |
piracy | -10.437 |
HSBC | -10.147 |
Token | . |
Token ID | 13 |
Feature activation | +2.69e+01 |
Pos logit contributions | |
Rules | +14.946 |
Commands | +14.333 |
unity | +14.107 |
Dialogue | +13.088 |
doors | +12.883 |
Neg logit contributions | |
paed | -22.307 |
unethical | -20.330 |
piracy | -20.260 |
neurot | -19.931 |
ageing | -19.789 |
Token | Rect |
Token ID | 45474 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
Rules | +22.089 |
unity | +21.290 |
Commands | +20.621 |
Dialogue | +19.906 |
Values | +19.539 |
Neg logit contributions | |
paed | -22.095 |
unethical | -19.575 |
piracy | -19.504 |
neurot | -19.449 |
ageing | -19.301 |
Token | angle |
Token ID | 9248 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
unity | +14.203 |
aturdays | +13.268 |
Commands | +13.176 |
Rules | +13.094 |
assemblies | +12.626 |
Neg logit contributions | |
paed | -17.382 |
unethical | -15.742 |
neurot | -15.694 |
piracy | -15.683 |
HSBC | -15.308 |
Token | F |
Token ID | 37 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
unity | +23.947 |
Rules | +23.161 |
Commands | +22.725 |
aturdays | +22.274 |
assemblies | +21.899 |
Neg logit contributions | |
paed | -16.468 |
neurot | -14.349 |
piracy | -14.115 |
unethical | -13.848 |
HSBC | -13.638 |
Token | ( |
Token ID | 357 |
Feature activation | +4.08e+01 |
Pos logit contributions | |
unity | +16.297 |
aturdays | +15.196 |
Rules | +15.142 |
Commands | +14.940 |
endas | +14.776 |
Neg logit contributions | |
paed | -16.135 |
neurot | -14.594 |
piracy | -14.575 |
unethical | -14.170 |
commercially | -13.892 |
Token | 0 |
Token ID | 15 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
unity | +34.049 |
Commands | +31.715 |
Rules | +31.317 |
doors | +30.649 |
assemblies | +29.817 |
Neg logit contributions | |
paed | -20.232 |
neurot | -17.534 |
piracy | -16.995 |
doping | -16.593 |
unethical | -16.434 |
Token | , |
Token ID | 11 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
unity | +15.257 |
Commands | +14.004 |
enaries | +13.960 |
Rules | +13.956 |
aturdays | +13.684 |
Neg logit contributions | |
paed | -17.544 |
neurot | -15.915 |
unethical | -15.812 |
HSBC | -15.556 |
piracy | -15.287 |
Token | ($ |
Token ID | 16763 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
unity | +27.064 |
Rules | +25.484 |
Commands | +25.113 |
doors | +24.679 |
enaries | +24.214 |
Neg logit contributions | |
paed | -18.947 |
neurot | -16.752 |
piracy | -15.608 |
unethical | -15.569 |
ageing | -15.274 |
Token | s |
Token ID | 82 |
Feature activation | +9.45e+00 |
Pos logit contributions | |
unity | +11.869 |
Rules | +11.375 |
Commands | +11.257 |
enaries | +11.115 |
aturdays | +10.988 |
Neg logit contributions | |
paed | -12.302 |
neurot | -11.186 |
Australian | -10.998 |
HSBC | -10.698 |
unethical | -10.659 |
Token | z |
Token ID | 89 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
unity | +7.524 |
Commands | +7.323 |
Rules | +7.199 |
enaries | +6.987 |
isans | +6.961 |
Neg logit contributions | |
paed | -11.718 |
neurot | -10.494 |
unethical | -10.372 |
piracy | -10.362 |
Australian | -10.320 |
Token |
|
Token ID | 198 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
unity | +25.329 |
Commands | +24.367 |
assemblies | +23.148 |
doors | +23.138 |
endas | +22.538 |
Neg logit contributions | |
paed | -19.882 |
neurot | -17.293 |
unethical | -16.597 |
ITV | -16.449 |
piracy | -16.448 |
Token |
|
Token ID | 198 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
unity | +9.257 |
Commands | +9.025 |
Rules | +8.797 |
doors | +8.547 |
isans | +8.545 |
Neg logit contributions | |
paed | -11.397 |
neurot | -10.207 |
unethical | -10.186 |
piracy | -10.127 |
ageing | -9.909 |
Token | + |
Token ID | 10 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
Rules | +19.768 |
unity | +19.768 |
Commands | +19.276 |
aturdays | +18.698 |
enaries | +18.662 |
Neg logit contributions | |
paed | -19.477 |
HSBC | -17.144 |
Australian | -17.079 |
commercially | -17.030 |
neurot | -16.941 |
Token | -------------------- |
Token ID | 19351 |
Feature activation | -9.50e+00 |
Pos logit contributions | |
unity | +8.709 |
Commands | +8.530 |
enaries | +8.236 |
Rules | +8.219 |
doors | +7.910 |
Neg logit contributions | |
paed | -12.581 |
unethical | -11.151 |
neurot | -11.132 |
piracy | -11.076 |
HSBC | -11.067 |
Token | --+ |
Token ID | 44785 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
paed | +8.222 |
Australian | +7.374 |
neurot | +7.244 |
HSBC | +6.984 |
unethical | +6.857 |
Neg logit contributions | |
unity | -10.794 |
aturdays | -10.716 |
enaries | -10.318 |
Commands | -10.238 |
Rules | -10.100 |
Token | | |
Token ID | 930 |
Feature activation | +4.06e+01 |
Pos logit contributions | |
unity | +17.415 |
Commands | +17.000 |
doors | +16.017 |
enaries | +15.923 |
assemblies | +15.885 |
Neg logit contributions | |
paed | -17.627 |
neurot | -15.648 |
unethical | -15.567 |
HSBC | -15.541 |
piracy | -15.425 |
Token | ... |
Token ID | 2644 |
Feature activation | +1.87e+01 |
Pos logit contributions | |
unity | +34.262 |
Commands | +33.365 |
doors | +32.065 |
assemblies | +31.600 |
Rules | +30.216 |
Neg logit contributions | |
paed | -19.343 |
neurot | -15.191 |
commercially | -15.160 |
unethical | -14.969 |
piracy | -14.913 |
Token | | |
Token ID | 930 |
Feature activation | +3.10e+01 |
Pos logit contributions | |
unity | +13.681 |
Commands | +13.379 |
doors | +12.456 |
assemblies | +12.261 |
enaries | +12.225 |
Neg logit contributions | |
paed | -20.293 |
neurot | -18.530 |
unethical | -18.267 |
piracy | -18.132 |
ITV | -18.101 |
Token | + |
Token ID | 1343 |
Feature activation | +4.03e+00 |
Pos logit contributions | |
unity | +28.276 |
Commands | +27.105 |
doors | +26.634 |
assemblies | +25.849 |
enaries | +25.037 |
Neg logit contributions | |
paed | -18.113 |
neurot | -15.434 |
unethical | -15.119 |
HSBC | -15.062 |
dermat | -15.037 |
Token | -------------------- |
Token ID | 19351 |
Feature activation | -8.48e+00 |
Pos logit contributions | |
unity | +3.823 |
Commands | +3.702 |
enaries | +3.633 |
Rules | +3.597 |
aturdays | +3.532 |
Neg logit contributions | |
paed | -4.614 |
neurot | -4.106 |
Australian | -4.062 |
unethical | -4.049 |
HSBC | -4.044 |
Token | --+ |
Token ID | 44785 |
Feature activation | +2.53e+01 |
Pos logit contributions | |
paed | +7.536 |
Australian | +6.737 |
neurot | +6.584 |
HSBC | +6.465 |
unethical | +6.291 |
Neg logit contributions | |
unity | -9.622 |
aturdays | -9.516 |
Commands | -9.166 |
enaries | -9.140 |
Rules | -8.955 |
Token | imagined |
Token ID | 15758 |
Feature activation | +3.63e+01 |
Pos logit contributions | |
unity | +10.848 |
Commands | +10.223 |
enaries | +10.029 |
doors | +10.021 |
assemblies | +9.925 |
Neg logit contributions | |
paed | -11.406 |
neurot | -9.993 |
unethical | -9.979 |
HSBC | -9.935 |
Australian | -9.829 |
Token | that |
Token ID | 326 |
Feature activation | +3.24e+01 |
Pos logit contributions | |
unity | +33.192 |
doors | +31.936 |
Commands | +31.346 |
assemblies | +30.761 |
motions | +30.229 |
Neg logit contributions | |
paed | -17.398 |
neurot | -14.531 |
HSBC | -14.263 |
ITV | -13.937 |
unethical | -13.887 |
Token | each |
Token ID | 1123 |
Feature activation | +3.22e+01 |
Pos logit contributions | |
unity | +30.864 |
Commands | +29.529 |
doors | +29.244 |
assemblies | +28.315 |
enaries | +28.256 |
Neg logit contributions | |
paed | -17.119 |
neurot | -14.486 |
HSBC | -13.712 |
unethical | -13.662 |
ITV | -13.397 |
Token | battle |
Token ID | 3344 |
Feature activation | +1.89e+01 |
Pos logit contributions | |
unity | +30.765 |
doors | +29.637 |
Commands | +29.092 |
enaries | +27.624 |
assemblies | +27.597 |
Neg logit contributions | |
paed | -16.552 |
neurot | -13.828 |
unethical | -13.779 |
HSBC | -13.718 |
ITV | -13.689 |
Token | should |
Token ID | 815 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
unity | +18.791 |
Commands | +18.108 |
doors | +17.780 |
assemblies | +17.516 |
Rules | +17.361 |
Neg logit contributions | |
paed | -15.398 |
neurot | -13.755 |
unethical | -13.437 |
HSBC | -13.109 |
ITV | -13.034 |
Token | have |
Token ID | 423 |
Feature activation | +4.02e+01 |
Pos logit contributions | |
unity | +15.059 |
Commands | +14.305 |
doors | +14.014 |
assemblies | +13.935 |
enaries | +13.865 |
Neg logit contributions | |
paed | -12.910 |
unethical | -11.583 |
neurot | -11.331 |
piracy | -11.272 |
HSBC | -11.258 |
Token | happened |
Token ID | 3022 |
Feature activation | +2.73e+01 |
Pos logit contributions | |
unity | +34.646 |
doors | +34.026 |
Commands | +32.792 |
assemblies | +32.442 |
prayers | +31.572 |
Neg logit contributions | |
paed | -17.439 |
neurot | -15.038 |
unethical | -14.698 |
HSBC | -14.123 |
piracy | -13.754 |
Token | in |
Token ID | 287 |
Feature activation | +2.51e+01 |
Pos logit contributions | |
unity | +25.630 |
doors | +24.770 |
Commands | +24.752 |
assemblies | +24.349 |
enaries | +24.161 |
Neg logit contributions | |
paed | -17.781 |
neurot | -15.373 |
unethical | -14.991 |
HSBC | -14.550 |
ITV | -14.310 |
Token | a |
Token ID | 257 |
Feature activation | +3.36e+01 |
Pos logit contributions | |
unity | +25.825 |
Commands | +24.208 |
doors | +24.088 |
assemblies | +23.762 |
Rules | +22.942 |
Neg logit contributions | |
paed | -16.350 |
neurot | -14.273 |
unethical | -13.712 |
HSBC | -13.505 |
ITV | -13.170 |
Token | procedural |
Token ID | 27931 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
unity | +32.013 |
Commands | +29.304 |
doors | +28.977 |
assemblies | +28.264 |
prayers | +27.991 |
Neg logit contributions | |
paed | -16.820 |
ITV | -14.448 |
unethical | -14.417 |
HSBC | -14.155 |
neurot | -13.902 |
Token | map |
Token ID | 3975 |
Feature activation | +1.95e+01 |
Pos logit contributions | |
unity | +17.214 |
assemblies | +15.687 |
doors | +15.685 |
Commands | +15.610 |
Rules | +15.358 |
Neg logit contributions | |
paed | -14.203 |
neurot | -12.316 |
unethical | -12.251 |
HSBC | -12.136 |
ITV | -11.898 |
Token | as |
Token ID | 355 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
unity | +6.529 |
Commands | +6.274 |
assemblies | +6.112 |
aturdays | +6.094 |
enaries | +6.087 |
Neg logit contributions | |
paed | -5.880 |
neurot | -5.210 |
Australian | -5.054 |
unethical | -5.021 |
piracy | -5.004 |
Token | community |
Token ID | 2055 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
unity | +18.534 |
assemblies | +17.620 |
Commands | +17.579 |
doors | +17.418 |
prayers | +17.213 |
Neg logit contributions | |
paed | -8.543 |
neurot | -6.921 |
unethical | -6.571 |
Australian | -6.520 |
piracy | -6.450 |
Token | boards |
Token ID | 11490 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
unity | +16.112 |
assemblies | +15.265 |
Commands | +14.683 |
prayers | +14.593 |
doors | +14.518 |
Neg logit contributions | |
paed | -12.019 |
neurot | -10.504 |
unethical | -10.186 |
HSBC | -10.117 |
piracy | -10.105 |
Token | across |
Token ID | 1973 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
unity | +26.095 |
assemblies | +25.063 |
Commands | +24.458 |
doors | +24.014 |
prayers | +23.991 |
Neg logit contributions | |
paed | -17.339 |
neurot | -14.372 |
unethical | -14.012 |
ITV | -13.831 |
piracy | -13.782 |
Token | the |
Token ID | 262 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
unity | +13.153 |
Commands | +12.495 |
doors | +12.219 |
assemblies | +12.219 |
endas | +11.975 |
Neg logit contributions | |
paed | -11.822 |
neurot | -10.449 |
piracy | -10.190 |
unethical | -10.165 |
HSBC | -10.148 |
Token | city |
Token ID | 1748 |
Feature activation | +4.02e+01 |
Pos logit contributions | |
unity | +16.722 |
Commands | +15.869 |
doors | +15.595 |
assemblies | +15.584 |
prayers | +15.104 |
Neg logit contributions | |
paed | -12.142 |
neurot | -10.496 |
HSBC | -10.317 |
unethical | -10.273 |
piracy | -10.253 |
Token | weigh |
Token ID | 10164 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
unity | +33.076 |
assemblies | +32.301 |
doors | +30.915 |
Commands | +30.791 |
prayers | +30.724 |
Neg logit contributions | |
paed | -19.494 |
unethical | -15.539 |
neurot | -15.398 |
ITV | -15.373 |
ageing | -15.077 |
Token | in |
Token ID | 287 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
unity | +13.651 |
assemblies | +12.827 |
Commands | +12.814 |
prayers | +12.721 |
doors | +12.688 |
Neg logit contributions | |
paed | -11.614 |
neurot | -10.090 |
HSBC | -9.963 |
Australian | -9.816 |
ITV | -9.800 |
Token | on |
Token ID | 319 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
unity | +10.891 |
Commands | +10.285 |
assemblies | +10.183 |
doors | +10.034 |
enaries | +10.033 |
Neg logit contributions | |
paed | -11.406 |
neurot | -10.048 |
unethical | -9.768 |
piracy | -9.706 |
Australian | -9.699 |
Token | proposed |
Token ID | 5150 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
unity | +12.794 |
Commands | +12.078 |
assemblies | +11.999 |
doors | +11.936 |
Rules | +11.803 |
Neg logit contributions | |
paed | -9.801 |
neurot | -8.448 |
Australian | -8.262 |
HSBC | -8.157 |
unethical | -8.109 |
Token | housing |
Token ID | 5627 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
unity | +15.995 |
Commands | +14.999 |
assemblies | +14.991 |
doors | +14.778 |
prayers | +14.709 |
Neg logit contributions | |
paed | -10.924 |
neurot | -9.249 |
HSBC | -9.102 |
unethical | -9.025 |
ITV | -8.991 |
Token | FDA |
Token ID | 14672 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
paed | +26.108 |
Australian | +25.333 |
HSBC | +24.817 |
NZ | +24.167 |
Malaysian | +24.154 |
Neg logit contributions | |
aturdays | -13.423 |
enaries | -12.970 |
endas | -12.780 |
Commands | -12.546 |
isans | -12.242 |
Token | announces |
Token ID | 26459 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
paed | +16.390 |
neurot | +15.251 |
Australian | +15.164 |
unethical | +14.921 |
piracy | +14.739 |
Neg logit contributions | |
aturdays | -10.019 |
enaries | -9.799 |
unity | -9.428 |
Commands | -9.416 |
isans | -9.341 |
Token | new |
Token ID | 649 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
paed | +21.190 |
Australian | +19.832 |
neurot | +19.425 |
unethical | +19.329 |
piracy | +19.166 |
Neg logit contributions | |
aturdays | -12.339 |
enaries | -12.306 |
Commands | -11.838 |
endas | -11.532 |
isans | -11.375 |
Token | plan |
Token ID | 1410 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
paed | +23.336 |
Australian | +21.845 |
neurot | +21.820 |
piracy | +21.176 |
unethical | +21.144 |
Neg logit contributions | |
enaries | -12.324 |
aturdays | -12.316 |
endas | -11.509 |
isans | -11.301 |
Commands | -11.064 |
Token | to |
Token ID | 284 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
paed | +24.265 |
Australian | +22.671 |
piracy | +22.325 |
unethical | +22.051 |
HSBC | +21.897 |
Neg logit contributions | |
aturdays | -17.050 |
unity | -15.931 |
enaries | -15.889 |
Commands | -15.720 |
assemblies | -15.574 |
Token | curb |
Token ID | 20799 |
Feature activation | -4.73e+01 |
Pos logit contributions | |
paed | +17.606 |
Australian | +16.228 |
commercially | +16.143 |
neurot | +15.957 |
piracy | +15.802 |
Neg logit contributions | |
aturdays | -16.692 |
enaries | -15.596 |
isans | -15.389 |
endas | -15.364 |
Commands | -15.177 |
Token | tobacco |
Token ID | 11219 |
Feature activation | -2.92e+01 |
Pos logit contributions | |
paed | +39.685 |
Australian | +37.009 |
neurot | +36.843 |
piracy | +36.748 |
pharmaceutical | +36.541 |
Neg logit contributions | |
aturdays | -19.770 |
enaries | -17.888 |
Dialogue | -17.534 |
Commands | -17.409 |
endas | -16.998 |
Token | 11 |
Token ID | 1367 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
paed | +29.267 |
piracy | +27.623 |
neurot | +27.575 |
Australian | +27.524 |
NZ | +27.004 |
Neg logit contributions | |
aturdays | -18.044 |
Rules | -15.817 |
endas | -15.731 |
endars | -15.701 |
enaries | -15.659 |
Token | : |
Token ID | 25 |
Feature activation | +5.84e+00 |
Pos logit contributions | |
paed | +14.014 |
Australian | +12.887 |
neurot | +12.567 |
NZ | +12.409 |
HSBC | +12.391 |
Neg logit contributions | |
unity | -11.751 |
enaries | -11.692 |
aturdays | -11.541 |
Commands | -11.477 |
endas | -11.018 |
Token | 50 |
Token ID | 1120 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
unity | +5.143 |
Commands | +5.028 |
Rules | +4.879 |
enaries | +4.771 |
isans | +4.727 |
Neg logit contributions | |
paed | -6.960 |
neurot | -6.241 |
unethical | -6.212 |
piracy | -6.163 |
Australian | -6.029 |
Token | AM |
Token ID | 3001 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
paed | +9.096 |
Australian | +8.219 |
neurot | +7.906 |
NZ | +7.852 |
ITV | +7.835 |
Neg logit contributions | |
unity | -15.463 |
enaries | -15.461 |
aturdays | -15.269 |
Commands | -15.170 |
endars | -14.965 |
Token | by |
Token ID | 416 |
Feature activation | -1.52e+01 |
Pos logit contributions | |
paed | +16.226 |
Australian | +14.762 |
HSBC | +14.592 |
neurot | +14.565 |
commercially | +14.306 |
Neg logit contributions | |
aturdays | -13.443 |
Commands | -13.354 |
enaries | -12.780 |
endars | -12.760 |
endas | -12.756 |
Token | going |
Token ID | 1016 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
paed | +15.788 |
Australian | +14.609 |
HSBC | +14.267 |
piracy | +14.199 |
unethical | +14.123 |
Neg logit contributions | |
aturdays | -13.322 |
Commands | -12.956 |
enaries | -12.711 |
endas | -12.652 |
isans | -12.503 |
Token | after |
Token ID | 706 |
Feature activation | -2.62e+01 |
Pos logit contributions | |
paed | +17.784 |
Australian | +16.803 |
viral | +16.314 |
HSBC | +16.252 |
commercially | +16.252 |
Neg logit contributions | |
Commands | -14.313 |
unity | -13.799 |
endars | -13.599 |
aturdays | -13.567 |
Rules | -13.431 |
Token | anyone |
Token ID | 2687 |
Feature activation | -2.86e+01 |
Pos logit contributions | |
paed | +28.481 |
Australian | +27.353 |
HSBC | +26.595 |
unethical | +26.535 |
piracy | +26.333 |
Neg logit contributions | |
aturdays | -14.582 |
enaries | -13.493 |
isans | -13.239 |
Commands | -13.132 |
Rules | -13.118 |
Token | they |
Token ID | 484 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
paed | +25.359 |
Australian | +23.954 |
unethical | +23.765 |
commercially | +23.447 |
HSBC | +23.172 |
Neg logit contributions | |
aturdays | -21.063 |
Commands | -19.311 |
endas | -19.158 |
Rules | -18.846 |
enaries | -18.746 |
Token | perceive |
Token ID | 19973 |
Feature activation | -4.47e+01 |
Pos logit contributions | |
paed | +12.008 |
commercially | +10.951 |
Australian | +10.878 |
neurot | +10.682 |
HSBC | +10.519 |
Neg logit contributions | |
aturdays | -15.995 |
unity | -15.383 |
enaries | -15.149 |
Commands | -15.074 |
Rules | -14.872 |
Token | to |
Token ID | 284 |
Feature activation | -3.87e+01 |
Pos logit contributions | |
paed | +34.931 |
unethical | +33.894 |
Australian | +32.321 |
piracy | +32.201 |
commercially | +31.929 |
Neg logit contributions | |
aturdays | -23.005 |
Commands | -20.868 |
Rules | -19.978 |
endas | -19.483 |
enaries | -19.414 |
Token | be |
Token ID | 307 |
Feature activation | -3.54e+01 |
Pos logit contributions | |
paed | +31.273 |
leak | +29.471 |
unethical | +29.005 |
commercially | +28.784 |
Australian | +28.484 |
Neg logit contributions | |
aturdays | -22.800 |
Commands | -20.096 |
Rules | -19.844 |
endars | -19.069 |
isans | -19.057 |
Token | using |
Token ID | 1262 |
Feature activation | -2.76e+01 |
Pos logit contributions | |
paed | +33.061 |
unethical | +31.784 |
Australian | +30.681 |
commercially | +30.229 |
piracy | +29.976 |
Neg logit contributions | |
aturdays | -20.482 |
Commands | -18.271 |
enaries | -18.059 |
endars | -17.601 |
Rules | -17.520 |
Token | their |
Token ID | 511 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
paed | +28.626 |
Australian | +27.662 |
unethical | +27.585 |
commercially | +26.901 |
piracy | +26.864 |
Neg logit contributions | |
aturdays | -16.245 |
enaries | -15.080 |
isans | -14.638 |
endas | -14.334 |
Commands | -14.260 |
Token | trademarks |
Token ID | 27346 |
Feature activation | -3.08e+01 |
Pos logit contributions | |
paed | +15.234 |
Australian | +14.365 |
unethical | +13.804 |
HSBC | +13.747 |
commercially | +13.709 |
Neg logit contributions | |
aturdays | -11.604 |
enaries | -11.037 |
Commands | -10.942 |
unity | -10.859 |
isans | -10.762 |
Token | gene |
Token ID | 9779 |
Feature activation | -6.36e+00 |
Pos logit contributions | |
paed | +31.099 |
neurot | +28.937 |
Australian | +28.921 |
commercially | +28.906 |
genetically | +28.679 |
Neg logit contributions | |
aturdays | -15.987 |
enaries | -15.009 |
isans | -14.742 |
endas | -14.376 |
Commands | -14.025 |
Token | fragments |
Token ID | 21441 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
paed | +6.764 |
neurot | +6.123 |
piracy | +5.944 |
Australian | +5.943 |
unethical | +5.900 |
Neg logit contributions | |
unity | -6.319 |
Commands | -6.207 |
aturdays | -6.162 |
enaries | -6.123 |
endas | -6.040 |
Token | in |
Token ID | 287 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
paed | +24.492 |
neurot | +22.682 |
commercially | +22.484 |
Australian | +22.332 |
genetically | +22.134 |
Neg logit contributions | |
aturdays | -17.507 |
Commands | -16.763 |
enaries | -16.329 |
endas | -16.233 |
Rules | -16.013 |
Token | order |
Token ID | 1502 |
Feature activation | -1.82e+01 |
Pos logit contributions | |
paed | +26.678 |
Australian | +24.299 |
neurot | +23.921 |
unethical | +23.889 |
commercially | +23.705 |
Neg logit contributions | |
aturdays | -16.180 |
enaries | -14.833 |
endas | -14.724 |
isans | -14.696 |
Rules | -14.261 |
Token | to |
Token ID | 284 |
Feature activation | -2.50e+01 |
Pos logit contributions | |
paed | +13.020 |
Australian | +11.431 |
neurot | +11.263 |
unethical | +11.043 |
commercially | +11.025 |
Neg logit contributions | |
aturdays | -21.262 |
Commands | -19.825 |
endars | -19.458 |
endas | -19.401 |
unity | -19.344 |
Token | undercut |
Token ID | 43726 |
Feature activation | -4.42e+01 |
Pos logit contributions | |
paed | +23.796 |
genetically | +22.506 |
commercially | +22.418 |
neurot | +21.622 |
unethical | +21.517 |
Neg logit contributions | |
aturdays | -19.580 |
Commands | -17.218 |
isans | -17.211 |
Rules | -17.155 |
enaries | -16.929 |
Token | private |
Token ID | 2839 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
paed | +39.283 |
unethical | +36.636 |
Australian | +36.501 |
pharmaceutical | +36.302 |
commercially | +36.227 |
Neg logit contributions | |
aturdays | -18.914 |
enaries | -17.185 |
endars | -16.879 |
Commands | -16.119 |
endas | -16.114 |
Token | efforts |
Token ID | 4040 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
paed | +19.278 |
Australian | +17.598 |
pharmaceutical | +17.467 |
unethical | +17.389 |
neurot | +17.272 |
Neg logit contributions | |
aturdays | -14.140 |
endas | -13.385 |
enaries | -13.338 |
Commands | -13.129 |
endars | -12.876 |
Token | to |
Token ID | 284 |
Feature activation | -2.56e+01 |
Pos logit contributions | |
paed | +17.201 |
unethical | +15.827 |
commercially | +15.484 |
Australian | +15.340 |
piracy | +15.148 |
Neg logit contributions | |
aturdays | -19.681 |
Commands | -18.715 |
unity | -18.567 |
endas | -18.465 |
enaries | -18.131 |
Token | patent |
Token ID | 12701 |
Feature activation | -3.04e+01 |
Pos logit contributions | |
paed | +24.681 |
genetically | +23.405 |
commercially | +23.375 |
neurot | +22.577 |
Australian | +22.525 |
Neg logit contributions | |
aturdays | -19.616 |
Rules | -17.186 |
Commands | -17.164 |
endas | -17.007 |
enaries | -16.983 |
Token | gene |
Token ID | 9779 |
Feature activation | -5.29e+00 |
Pos logit contributions | |
paed | +31.949 |
unethical | +29.674 |
neurot | +29.452 |
genetically | +29.194 |
pharmaceutical | +29.086 |
Neg logit contributions | |
aturdays | -17.108 |
endas | -14.766 |
Commands | -14.546 |
enaries | -14.502 |
isans | -14.330 |
Token | of |
Token ID | 286 |
Feature activation | -2.97e+01 |
Pos logit contributions | |
paed | +25.629 |
Australian | +22.844 |
ITV | +22.255 |
HSBC | +22.049 |
NZ | +21.797 |
Neg logit contributions | |
aturdays | -18.316 |
enaries | -17.919 |
unity | -17.696 |
endars | -17.407 |
endas | -17.249 |
Token | 13 |
Token ID | 1511 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
paed | +30.506 |
Australian | +28.153 |
ITV | +26.675 |
HSBC | +26.407 |
Malaysian | +26.216 |
Neg logit contributions | |
aturdays | -16.833 |
enaries | -16.381 |
endars | -16.265 |
endas | -15.986 |
isans | -15.935 |
Token | - |
Token ID | 12 |
Feature activation | -8.11e+00 |
Pos logit contributions | |
paed | +19.516 |
Australian | +17.771 |
HSBC | +17.088 |
piracy | +16.774 |
NZ | +16.641 |
Neg logit contributions | |
Commands | -18.119 |
unity | -17.922 |
enaries | -17.014 |
aturdays | -16.758 |
endas | -16.705 |
Token | year |
Token ID | 1941 |
Feature activation | -2.63e+01 |
Pos logit contributions | |
paed | +6.902 |
Australian | +6.054 |
neurot | +5.805 |
HSBC | +5.782 |
piracy | +5.704 |
Neg logit contributions | |
unity | -9.630 |
Commands | -9.427 |
enaries | -9.115 |
aturdays | -9.051 |
endas | -9.042 |
Token | - |
Token ID | 12 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
paed | +23.776 |
Australian | +21.563 |
ageing | +20.646 |
piracy | +20.618 |
HSBC | +20.316 |
Neg logit contributions | |
Commands | -19.823 |
enaries | -19.395 |
aturdays | -18.734 |
endas | -18.582 |
isans | -18.529 |
Token | old |
Token ID | 727 |
Feature activation | -4.28e+01 |
Pos logit contributions | |
paed | +11.642 |
Australian | +10.840 |
HSBC | +9.964 |
NZ | +9.636 |
ITV | +9.502 |
Neg logit contributions | |
aturdays | -19.088 |
unity | -18.610 |
Commands | -18.229 |
assemblies | -17.854 |
endas | -17.699 |
Token | Drew |
Token ID | 18624 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
paed | +37.473 |
Australian | +35.612 |
HSBC | +33.413 |
Malaysian | +33.263 |
ITV | +33.074 |
Neg logit contributions | |
aturdays | -17.516 |
endas | -17.325 |
enaries | -17.261 |
Commands | -16.928 |
endars | -16.736 |
Token | and |
Token ID | 290 |
Feature activation | -1.70e+01 |
Pos logit contributions | |
paed | +12.844 |
Australian | +11.735 |
HSBC | +11.310 |
neurot | +11.051 |
ITV | +10.942 |
Neg logit contributions | |
unity | -12.360 |
aturdays | -12.296 |
Commands | -12.014 |
Rules | -11.806 |
enaries | -11.800 |
Token | convinced |
Token ID | 9431 |
Feature activation | -2.56e+01 |
Pos logit contributions | |
paed | +18.893 |
Australian | +17.088 |
HSBC | +16.290 |
neurot | +16.278 |
ITV | +16.232 |
Neg logit contributions | |
aturdays | -13.250 |
unity | -13.005 |
endas | -12.883 |
isans | -12.685 |
enaries | -12.644 |
Token | the |
Token ID | 262 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
paed | +26.915 |
Australian | +24.348 |
ITV | +23.598 |
HSBC | +23.178 |
Malaysian | +22.758 |
Neg logit contributions | |
aturdays | -16.857 |
endas | -16.536 |
endars | -16.317 |
enaries | -16.279 |
Commands | -16.195 |
Token | youngsters |
Token ID | 33167 |
Feature activation | -9.62e+00 |
Pos logit contributions | |
paed | +21.326 |
Australian | +19.453 |
ITV | +18.559 |
neurot | +18.388 |
HSBC | +18.323 |
Neg logit contributions | |
aturdays | -13.357 |
Commands | -13.294 |
endas | -13.186 |
enaries | -13.122 |
unity | -12.733 |
Token | scrapped |
Token ID | 35034 |
Feature activation | -1.82e+01 |
Pos logit contributions | |
paed | +14.436 |
HSBC | +13.231 |
Australian | +13.025 |
NZ | +12.667 |
neurot | +12.665 |
Neg logit contributions | |
aturdays | -13.243 |
Commands | -12.865 |
unity | -12.699 |
enaries | -12.509 |
endas | -12.493 |
Token | because |
Token ID | 780 |
Feature activation | -3.06e+00 |
Pos logit contributions | |
paed | +16.261 |
Australian | +14.819 |
HSBC | +14.732 |
commercially | +14.666 |
unethical | +14.297 |
Neg logit contributions | |
aturdays | -16.690 |
unity | -16.447 |
Commands | -16.426 |
endas | -15.933 |
isans | -15.665 |
Token | it |
Token ID | 340 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
paed | +3.332 |
Australian | +2.967 |
neurot | +2.963 |
HSBC | +2.931 |
unethical | +2.914 |
Neg logit contributions | |
unity | -3.078 |
Commands | -3.012 |
aturdays | -2.992 |
enaries | -2.938 |
endas | -2.887 |
Token | was |
Token ID | 373 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
paed | +18.472 |
Australian | +16.832 |
commercially | +16.746 |
HSBC | +16.650 |
neurot | +16.576 |
Neg logit contributions | |
aturdays | -16.676 |
Commands | -15.540 |
unity | -15.179 |
Rules | -14.980 |
endas | -14.856 |
Token | the |
Token ID | 262 |
Feature activation | -2.60e+01 |
Pos logit contributions | |
paed | +18.040 |
unethical | +16.504 |
Australian | +16.479 |
HSBC | +16.242 |
neurot | +15.858 |
Neg logit contributions | |
aturdays | -16.749 |
Commands | -15.862 |
enaries | -15.758 |
unity | -15.482 |
endars | -15.234 |
Token | first |
Token ID | 717 |
Feature activation | -4.27e+01 |
Pos logit contributions | |
paed | +25.955 |
Australian | +24.071 |
unethical | +23.328 |
HSBC | +23.152 |
piracy | +23.148 |
Neg logit contributions | |
aturdays | -18.025 |
Commands | -17.309 |
enaries | -16.808 |
endas | -16.712 |
Rules | -16.342 |
Token | of |
Token ID | 286 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
paed | +36.236 |
Australian | +34.336 |
UK | +33.303 |
pharmaceutical | +33.202 |
commercially | +32.959 |
Neg logit contributions | |
aturdays | -21.479 |
enaries | -19.905 |
endas | -19.853 |
Commands | -19.838 |
endars | -19.089 |
Token | the |
Token ID | 262 |
Feature activation | -1.70e+01 |
Pos logit contributions | |
paed | +21.263 |
HSBC | +19.692 |
Australian | +19.491 |
ITV | +19.068 |
commercially | +18.989 |
Neg logit contributions | |
aturdays | -16.481 |
endas | -15.482 |
enaries | -15.464 |
Commands | -15.375 |
unity | -14.991 |
Token | six |
Token ID | 2237 |
Feature activation | -3.04e+01 |
Pos logit contributions | |
paed | +18.944 |
Australian | +17.295 |
HSBC | +17.230 |
neurot | +16.811 |
unethical | +16.715 |
Neg logit contributions | |
aturdays | -13.395 |
enaries | -12.622 |
endas | -12.498 |
Commands | -12.487 |
unity | -12.449 |
Token | to |
Token ID | 284 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
paed | +29.921 |
Australian | +28.040 |
HSBC | +26.995 |
UK | +26.702 |
pharmaceutical | +26.624 |
Neg logit contributions | |
aturdays | -17.913 |
endas | -16.548 |
enaries | -15.981 |
endars | -15.919 |
Commands | -15.872 |
Token | own |
Token ID | 898 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
paed | +21.366 |
leak | +20.447 |
commercially | +19.845 |
HSBC | +19.783 |
Australian | +19.323 |
Neg logit contributions | |
aturdays | -18.703 |
Commands | -17.201 |
endars | -16.735 |
unity | -16.722 |
isans | -16.621 |
Token | athy |
Token ID | 10036 |
Feature activation | -2.51e+01 |
Pos logit contributions | |
unity | +3.021 |
Commands | +2.927 |
enaries | +2.874 |
aturdays | +2.872 |
endas | +2.837 |
Neg logit contributions | |
paed | -3.001 |
neurot | -2.683 |
Australian | -2.637 |
unethical | -2.627 |
piracy | -2.608 |
Token | this |
Token ID | 428 |
Feature activation | -1.77e+01 |
Pos logit contributions | |
paed | +24.947 |
Australian | +23.236 |
HSBC | +22.918 |
NZ | +22.045 |
unethical | +21.561 |
Neg logit contributions | |
aturdays | -17.206 |
unity | -16.318 |
assemblies | -15.252 |
enaries | -15.123 |
Rules | -15.013 |
Token | morning |
Token ID | 3329 |
Feature activation | -7.93e+00 |
Pos logit contributions | |
paed | +15.324 |
Australian | +14.165 |
NZ | +13.456 |
HSBC | +13.406 |
neurot | +13.175 |
Neg logit contributions | |
Commands | -16.886 |
endas | -16.860 |
aturdays | -16.754 |
Rules | -16.674 |
enaries | -16.655 |
Token | became |
Token ID | 2627 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
paed | +8.475 |
Australian | +7.732 |
neurot | +7.490 |
HSBC | +7.442 |
NZ | +7.343 |
Neg logit contributions | |
unity | -7.713 |
aturdays | -7.639 |
Commands | -7.408 |
endas | -7.327 |
enaries | -7.327 |
Token | the |
Token ID | 262 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
paed | +12.803 |
Australian | +12.276 |
HSBC | +11.534 |
NZ | +11.523 |
neurot | +11.133 |
Neg logit contributions | |
aturdays | -14.543 |
unity | -14.146 |
Commands | -14.135 |
enaries | -14.125 |
Rules | -13.939 |
Token | eighth |
Token ID | 16974 |
Feature activation | -4.21e+01 |
Pos logit contributions | |
paed | +12.285 |
Australian | +11.481 |
HSBC | +11.003 |
NZ | +10.814 |
neurot | +10.684 |
Neg logit contributions | |
aturdays | -10.922 |
unity | -10.679 |
Commands | -10.638 |
enaries | -10.593 |
endas | -10.505 |
Token | former |
Token ID | 1966 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
Australian | +37.537 |
paed | +37.515 |
HSBC | +34.648 |
NZ | +34.203 |
Malaysian | +33.540 |
Neg logit contributions | |
aturdays | -19.929 |
endas | -18.580 |
Rules | -18.061 |
endars | -17.785 |
enaries | -17.734 |
Token | executive |
Token ID | 4640 |
Feature activation | -2.51e+01 |
Pos logit contributions | |
paed | +22.283 |
Australian | +21.886 |
HSBC | +20.939 |
NZ | +20.625 |
Malaysian | +19.941 |
Neg logit contributions | |
aturdays | -14.788 |
endas | -13.513 |
enaries | -13.150 |
endars | -13.058 |
Rules | -12.977 |
Token | from |
Token ID | 422 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
paed | +25.217 |
Australian | +23.440 |
HSBC | +22.883 |
NZ | +21.895 |
unethical | +21.744 |
Neg logit contributions | |
aturdays | -18.359 |
Rules | -16.926 |
Commands | -16.616 |
endas | -16.500 |
endars | -16.360 |
Token | Sec |
Token ID | 1882 |
Feature activation | +8.52e+00 |
Pos logit contributions | |
paed | +19.990 |
Australian | +19.498 |
HSBC | +19.085 |
NZ | +18.308 |
Malaysian | +17.940 |
Neg logit contributions | |
aturdays | -14.889 |
enaries | -13.880 |
unity | -13.708 |
endars | -13.667 |
endas | -13.639 |
Token | uren |
Token ID | 23532 |
Feature activation | +5.19e+00 |
Pos logit contributions | |
unity | +8.172 |
enaries | +7.867 |
Commands | +7.856 |
endas | +7.610 |
Rules | +7.562 |
Neg logit contributions | |
paed | -9.399 |
neurot | -8.386 |
piracy | -8.135 |
unethical | -8.113 |
HSBC | -7.962 |
Token | vital |
Token ID | 9204 |
Feature activation | -7.05e-01 |
Pos logit contributions | |
unity | +4.012 |
Commands | +3.755 |
enaries | +3.659 |
aturdays | +3.652 |
assemblies | +3.619 |
Neg logit contributions | |
paed | -4.157 |
neurot | -3.697 |
Australian | -3.665 |
unethical | -3.643 |
HSBC | -3.625 |
Token | strategic |
Token ID | 10039 |
Feature activation | -5.14e-02 |
Pos logit contributions | |
paed | +0.707 |
neurot | +0.626 |
Australian | +0.625 |
HSBC | +0.612 |
unethical | +0.611 |
Neg logit contributions | |
unity | -0.769 |
Commands | -0.752 |
aturdays | -0.741 |
enaries | -0.737 |
Rules | -0.726 |
Token | position |
Token ID | 2292 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
paed | +0.047 |
neurot | +0.041 |
Australian | +0.040 |
HSBC | +0.040 |
unethical | +0.040 |
Neg logit contributions | |
unity | -0.061 |
Commands | -0.060 |
aturdays | -0.059 |
enaries | -0.059 |
Rules | -0.058 |
Token | that |
Token ID | 326 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
paed | +14.751 |
Australian | +14.036 |
HSBC | +13.524 |
commercially | +13.345 |
piracy | +13.295 |
Neg logit contributions | |
aturdays | -14.462 |
Commands | -14.138 |
endas | -13.916 |
endars | -13.843 |
enaries | -13.834 |
Token | some |
Token ID | 617 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
paed | +12.386 |
Australian | +11.508 |
HSBC | +11.204 |
neurot | +11.100 |
ITV | +10.949 |
Neg logit contributions | |
aturdays | -10.012 |
Commands | -9.796 |
enaries | -9.720 |
endas | -9.607 |
endars | -9.547 |
Token | fear |
Token ID | 3252 |
Feature activation | -4.20e+01 |
Pos logit contributions | |
unity | +2.483 |
Commands | +2.403 |
aturdays | +2.355 |
enaries | +2.353 |
assemblies | +2.331 |
Neg logit contributions | |
paed | -1.662 |
neurot | -1.437 |
Australian | -1.410 |
unethical | -1.398 |
HSBC | -1.392 |
Token | is |
Token ID | 318 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
paed | +34.144 |
Australian | +33.870 |
HSBC | +32.523 |
UK | +32.498 |
piracy | +32.309 |
Neg logit contributions | |
aturdays | -19.798 |
endars | -18.502 |
endas | -18.357 |
enaries | -18.296 |
Commands | -17.678 |
Token | threatened |
Token ID | 8556 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
paed | +10.168 |
Australian | +9.252 |
neurot | +9.121 |
ageing | +8.997 |
unethical | +8.953 |
Neg logit contributions | |
aturdays | -10.887 |
Commands | -10.585 |
enaries | -10.547 |
endars | -10.301 |
unity | -10.283 |
Token | by |
Token ID | 416 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
paed | +16.492 |
Australian | +15.635 |
commercially | +15.346 |
neurot | +15.059 |
piracy | +15.030 |
Neg logit contributions | |
Commands | -17.740 |
aturdays | -17.727 |
endars | -17.298 |
Rules | -17.019 |
endas | -17.014 |
Token | Brexit |
Token ID | 11435 |
Feature activation | -4.58e+00 |
Pos logit contributions | |
paed | +16.113 |
Australian | +14.941 |
piracy | +14.719 |
neurot | +14.599 |
HSBC | +14.538 |
Neg logit contributions | |
aturdays | -11.802 |
Commands | -11.763 |
enaries | -11.363 |
endars | -11.305 |
endas | -11.161 |
Token | . |
Token ID | 13 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
paed | +4.261 |
neurot | +3.764 |
Australian | +3.753 |
piracy | +3.644 |
HSBC | +3.641 |
Neg logit contributions | |
unity | -5.162 |
Commands | -5.132 |
aturdays | -5.083 |
enaries | -5.030 |
endas | -4.963 |
Token | - |
Token ID | 532 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
paed | +26.399 |
piracy | +25.050 |
Australian | +24.656 |
ITV | +24.079 |
HSBC | +23.457 |
Neg logit contributions | |
aturdays | -17.883 |
Commands | -16.499 |
endas | -16.243 |
enaries | -16.218 |
unity | -16.021 |
Token | deals |
Token ID | 7529 |
Feature activation | -3.28e+01 |
Pos logit contributions | |
paed | +16.376 |
Australian | +15.341 |
HSBC | +15.031 |
piracy | +14.905 |
ITV | +14.851 |
Neg logit contributions | |
unity | -12.457 |
aturdays | -12.433 |
enaries | -12.326 |
Commands | -12.268 |
endas | -12.054 |
Token | which |
Token ID | 543 |
Feature activation | -2.89e+01 |
Pos logit contributions | |
paed | +29.353 |
Australian | +28.166 |
HSBC | +27.695 |
ITV | +27.202 |
NZ | +27.189 |
Neg logit contributions | |
aturdays | -19.849 |
enaries | -18.344 |
Commands | -18.062 |
unity | -17.818 |
endas | -17.697 |
Token | pun |
Token ID | 4000 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
paed | +28.322 |
Australian | +27.458 |
HSBC | +26.972 |
NZ | +26.165 |
ITV | +26.011 |
Neg logit contributions | |
aturdays | -17.350 |
enaries | -16.212 |
endas | -15.671 |
unity | -15.552 |
isans | -15.510 |
Token | ters |
Token ID | 1010 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
paed | +11.187 |
Australian | +10.276 |
neurot | +10.113 |
HSBC | +10.005 |
NZ | +9.869 |
Neg logit contributions | |
unity | -10.498 |
Commands | -10.360 |
aturdays | -10.192 |
assemblies | -10.033 |
endas | -9.938 |
Token | complain |
Token ID | 13121 |
Feature activation | -4.15e+01 |
Pos logit contributions | |
paed | +25.338 |
Australian | +23.475 |
HSBC | +23.038 |
commercially | +22.873 |
NZ | +22.537 |
Neg logit contributions | |
aturdays | -18.202 |
enaries | -16.576 |
endas | -16.408 |
isans | -16.342 |
Rules | -16.331 |
Token | are |
Token ID | 389 |
Feature activation | -1.88e+01 |
Pos logit contributions | |
paed | +34.941 |
Australian | +33.772 |
HSBC | +33.113 |
unethical | +32.588 |
piracy | +32.426 |
Neg logit contributions | |
aturdays | -19.303 |
enaries | -17.756 |
endars | -17.536 |
Commands | -17.309 |
endas | -16.982 |
Token | also |
Token ID | 635 |
Feature activation | -2.09e+01 |
Pos logit contributions | |
paed | +18.621 |
unethical | +17.620 |
Australian | +17.216 |
piracy | +17.077 |
neurot | +16.782 |
Neg logit contributions | |
aturdays | -16.022 |
enaries | -15.617 |
Commands | -15.532 |
unity | -15.220 |
endars | -14.692 |
Token | preventing |
Token ID | 12174 |
Feature activation | -2.70e+01 |
Pos logit contributions | |
paed | +21.047 |
unethical | +19.845 |
Australian | +19.670 |
piracy | +19.485 |
commercially | +19.098 |
Neg logit contributions | |
aturdays | -16.453 |
enaries | -15.911 |
Commands | -15.805 |
unity | -15.332 |
endars | -15.004 |
Token | them |
Token ID | 606 |
Feature activation | -1.47e+01 |
Pos logit contributions | |
paed | +29.204 |
Australian | +28.565 |
piracy | +27.809 |
HSBC | +27.271 |
ITV | +26.738 |
Neg logit contributions | |
aturdays | -14.626 |
Commands | -14.180 |
enaries | -13.775 |
Rules | -13.282 |
endas | -13.227 |
Token | from |
Token ID | 422 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
paed | +13.829 |
Australian | +12.588 |
HSBC | +12.274 |
neurot | +12.244 |
piracy | +12.185 |
Neg logit contributions | |
Commands | -14.348 |
aturdays | -14.009 |
Rules | -13.823 |
unity | -13.738 |
enaries | -13.653 |
Token | filtering |
Token ID | 25431 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
paed | +2.545 |
Australian | +2.261 |
neurot | +2.229 |
piracy | +2.197 |
HSBC | +2.194 |
Neg logit contributions | |
unity | -2.781 |
Commands | -2.711 |
aturdays | -2.689 |
enaries | -2.667 |
endas | -2.624 |
Token | systems |
Token ID | 3341 |
Feature activation | -1.71e+01 |
Pos logit contributions | |
paed | +13.564 |
Australian | +12.480 |
piracy | +12.097 |
unethical | +11.908 |
neurot | +11.851 |
Neg logit contributions | |
aturdays | -9.397 |
unity | -9.259 |
Commands | -9.126 |
enaries | -9.105 |
endas | -8.989 |
Token | did |
Token ID | 750 |
Feature activation | -3.12e+00 |
Pos logit contributions | |
paed | +15.812 |
Australian | +14.752 |
piracy | +14.082 |
unethical | +14.045 |
HSBC | +14.023 |
Neg logit contributions | |
aturdays | -15.968 |
Commands | -15.336 |
unity | -15.208 |
endars | -14.900 |
enaries | -14.884 |
Token | little |
Token ID | 1310 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
paed | +3.303 |
Australian | +2.954 |
neurot | +2.936 |
unethical | +2.888 |
HSBC | +2.878 |
Neg logit contributions | |
unity | -3.221 |
Commands | -3.164 |
aturdays | -3.122 |
enaries | -3.061 |
Rules | -3.021 |
Token | to |
Token ID | 284 |
Feature activation | -8.66e+00 |
Pos logit contributions | |
paed | +19.096 |
Australian | +17.771 |
unethical | +17.014 |
piracy | +16.968 |
commercially | +16.885 |
Neg logit contributions | |
aturdays | -17.892 |
Commands | -17.736 |
endars | -17.311 |
endas | -17.024 |
enaries | -16.863 |
Token | curb |
Token ID | 20799 |
Feature activation | -4.13e+01 |
Pos logit contributions | |
paed | +8.291 |
Australian | +7.469 |
neurot | +7.268 |
piracy | +7.162 |
HSBC | +7.162 |
Neg logit contributions | |
aturdays | -9.345 |
Commands | -9.152 |
unity | -9.046 |
enaries | -9.022 |
endars | -8.908 |
Token | the |
Token ID | 262 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
paed | +38.012 |
piracy | +34.664 |
Australian | +34.093 |
unethical | +32.319 |
endemic | +31.749 |
Neg logit contributions | |
aturdays | -20.654 |
Commands | -20.507 |
enaries | -19.697 |
endars | -19.380 |
endas | -19.099 |
Token | trade |
Token ID | 3292 |
Feature activation | -5.95e+00 |
Pos logit contributions | |
paed | +22.234 |
piracy | +20.114 |
Australian | +20.046 |
unethical | +19.435 |
neurot | +19.117 |
Neg logit contributions | |
aturdays | -15.040 |
Commands | -14.251 |
endars | -13.946 |
enaries | -13.854 |
Rules | -13.759 |
Token | of |
Token ID | 286 |
Feature activation | -2.87e+01 |
Pos logit contributions | |
paed | +6.381 |
Australian | +5.654 |
piracy | +5.653 |
neurot | +5.604 |
unethical | +5.542 |
Neg logit contributions | |
unity | -5.970 |
Commands | -5.945 |
aturdays | -5.888 |
enaries | -5.776 |
endas | -5.635 |
Token | child |
Token ID | 1200 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
paed | +30.717 |
Australian | +27.440 |
piracy | +27.092 |
unethical | +26.104 |
commercially | +25.649 |
Neg logit contributions | |
aturdays | -19.468 |
endas | -17.934 |
Commands | -17.787 |
enaries | -17.748 |
Rules | -17.625 |
Token | pornography |
Token ID | 18384 |
Feature activation | -2.74e+01 |
Pos logit contributions | |
paed | +21.002 |
piracy | +18.149 |
Australian | +17.947 |
neurot | +17.344 |
NZ | +16.947 |
Neg logit contributions | |
aturdays | -18.567 |
Commands | -17.997 |
unity | -17.241 |
endas | -17.195 |
Rules | -17.076 |
Token | protect |
Token ID | 1805 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
paed | +20.214 |
neurot | +19.453 |
leak | +19.088 |
commercially | +18.895 |
underestimate | +18.706 |
Neg logit contributions | |
aturdays | -23.082 |
Rules | -21.807 |
endars | -21.714 |
Commands | -21.179 |
enaries | -20.914 |
Token | heterosexual |
Token ID | 24026 |
Feature activation | -7.59e+00 |
Pos logit contributions | |
paed | +20.695 |
Australian | +18.419 |
neurot | +18.158 |
unethical | +17.894 |
commercially | +17.437 |
Neg logit contributions | |
aturdays | -16.364 |
Commands | -15.772 |
Rules | -15.338 |
enaries | -15.066 |
endas | -15.045 |
Token | men |
Token ID | 1450 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
paed | +8.362 |
Australian | +7.297 |
neurot | +7.182 |
unethical | +7.049 |
piracy | +7.024 |
Neg logit contributions | |
Commands | -7.338 |
unity | -7.242 |
aturdays | -7.177 |
Rules | -7.116 |
endas | -7.098 |
Token | against |
Token ID | 1028 |
Feature activation | -3.91e+01 |
Pos logit contributions | |
paed | +11.370 |
neurot | +9.826 |
Australian | +9.799 |
unethical | +9.694 |
commercially | +9.509 |
Neg logit contributions | |
Commands | -13.790 |
unity | -13.739 |
aturdays | -13.347 |
Rules | -13.309 |
endas | -13.025 |
Token | HIV |
Token ID | 10498 |
Feature activation | -1.80e+01 |
Pos logit contributions | |
paed | +36.239 |
viral | +32.204 |
neurot | +31.557 |
unethical | +31.133 |
Australian | +31.052 |
Neg logit contributions | |
aturdays | -21.205 |
enaries | -20.464 |
endars | -20.089 |
Rules | -19.818 |
endas | -19.668 |
Token | and |
Token ID | 290 |
Feature activation | -4.13e+01 |
Pos logit contributions | |
paed | +16.786 |
neurot | +15.266 |
piracy | +14.782 |
viral | +14.761 |
Australian | +14.464 |
Neg logit contributions | |
aturdays | -16.862 |
Commands | -16.400 |
Rules | -16.356 |
endars | -16.122 |
unity | -16.016 |
Token | that |
Token ID | 326 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
paed | +36.825 |
viral | +32.595 |
neurot | +32.384 |
malaria | +31.815 |
Australian | +31.688 |
Neg logit contributions | |
aturdays | -22.811 |
enaries | -20.229 |
isans | -19.884 |
endars | -19.446 |
Rules | -19.358 |
Token | the |
Token ID | 262 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
paed | +21.480 |
Australian | +19.324 |
unethical | +18.946 |
neurot | +18.778 |
piracy | +18.424 |
Neg logit contributions | |
aturdays | -13.255 |
Commands | -13.070 |
enaries | -13.026 |
endas | -12.614 |
endars | -12.603 |
Token | health |
Token ID | 1535 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
paed | +20.202 |
Australian | +18.623 |
neurot | +18.197 |
unethical | +18.181 |
dermat | +17.560 |
Neg logit contributions | |
enaries | -13.017 |
aturdays | -12.987 |
Commands | -12.893 |
endars | -12.539 |
endas | -12.526 |
Token | benefits |
Token ID | 4034 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
paed | +1.969 |
neurot | +1.738 |
Australian | +1.731 |
unethical | +1.700 |
HSBC | +1.686 |
Neg logit contributions | |
unity | -2.190 |
Commands | -2.144 |
aturdays | -2.112 |
enaries | -2.092 |
Rules | -2.063 |
Token | outwe |
Token ID | 26644 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
paed | +22.066 |
neurot | +19.889 |
Australian | +19.760 |
unethical | +19.431 |
HSBC | +19.199 |
Neg logit contributions | |
aturdays | -18.296 |
Commands | -18.293 |
Rules | -17.658 |
endas | -17.177 |
unity | -17.031 |
Token | have |
Token ID | 423 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
unity | +8.376 |
Commands | +8.012 |
enaries | +7.808 |
assemblies | +7.802 |
doors | +7.771 |
Neg logit contributions | |
paed | -6.683 |
neurot | -5.784 |
Australian | -5.716 |
HSBC | -5.684 |
ITV | -5.670 |
Token | taken |
Token ID | 2077 |
Feature activation | -4.58e+00 |
Pos logit contributions | |
unity | +13.747 |
doors | +12.834 |
Commands | +12.766 |
assemblies | +12.685 |
Rules | +12.663 |
Neg logit contributions | |
paed | -11.148 |
neurot | -9.751 |
ITV | -9.633 |
Australian | -9.617 |
HSBC | -9.586 |
Token | additional |
Token ID | 3224 |
Feature activation | -3.57e+00 |
Pos logit contributions | |
paed | +6.043 |
Australian | +5.554 |
neurot | +5.524 |
unethical | +5.503 |
HSBC | +5.466 |
Neg logit contributions | |
unity | -3.450 |
aturdays | -3.401 |
Commands | -3.367 |
enaries | -3.292 |
endas | -3.211 |
Token | steps |
Token ID | 4831 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
paed | +5.704 |
Australian | +5.314 |
neurot | +5.310 |
unethical | +5.268 |
HSBC | +5.241 |
Neg logit contributions | |
unity | -1.728 |
aturdays | -1.667 |
Commands | -1.643 |
enaries | -1.587 |
endas | -1.549 |
Token | to |
Token ID | 284 |
Feature activation | -1.87e+01 |
Pos logit contributions | |
paed | +11.523 |
unethical | +10.213 |
Australian | +10.136 |
commercially | +10.049 |
neurot | +10.011 |
Neg logit contributions | |
aturdays | -15.925 |
unity | -15.374 |
Commands | -15.225 |
endas | -15.200 |
enaries | -14.927 |
Token | regulate |
Token ID | 16697 |
Feature activation | -4.09e+01 |
Pos logit contributions | |
paed | +17.047 |
commercially | +15.789 |
Australian | +15.686 |
neurot | +15.595 |
leak | +15.417 |
Neg logit contributions | |
aturdays | -17.767 |
enaries | -16.197 |
endars | -16.183 |
Commands | -16.149 |
endas | -15.851 |
Token | tobacco |
Token ID | 11219 |
Feature activation | -2.45e+01 |
Pos logit contributions | |
paed | +33.919 |
unethical | +33.300 |
pharmaceutical | +32.958 |
neurot | +32.910 |
commercially | +32.697 |
Neg logit contributions | |
aturdays | -22.312 |
Commands | -19.114 |
enaries | -18.723 |
endas | -18.596 |
endars | -18.279 |
Token | as |
Token ID | 355 |
Feature activation | -9.85e+00 |
Pos logit contributions | |
paed | +22.960 |
neurot | +22.069 |
commercially | +21.768 |
piracy | +21.405 |
Australian | +21.203 |
Neg logit contributions | |
aturdays | -19.069 |
Commands | -17.223 |
endars | -16.999 |
Rules | -16.786 |
unity | -16.696 |
Token | a |
Token ID | 257 |
Feature activation | -1.89e+01 |
Pos logit contributions | |
paed | +9.473 |
neurot | +8.697 |
Australian | +8.533 |
unethical | +8.519 |
commercially | +8.333 |
Neg logit contributions | |
aturdays | -10.389 |
unity | -10.243 |
enaries | -10.141 |
Commands | -10.137 |
endas | -9.999 |
Token | drug |
Token ID | 2563 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
paed | +18.215 |
neurot | +17.597 |
pharmaceutical | +16.421 |
unethical | +16.294 |
commercially | +16.287 |
Neg logit contributions | |
aturdays | -17.572 |
enaries | -16.831 |
endas | -16.626 |
Commands | -16.354 |
endars | -16.256 |
Token | . |
Token ID | 13 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
paed | +19.328 |
neurot | +18.481 |
unethical | +17.373 |
commercially | +17.310 |
Australian | +17.117 |
Neg logit contributions | |
aturdays | -20.543 |
enaries | -19.808 |
Commands | -19.370 |
endas | -19.280 |
endars | -19.029 |
Token | For |
Token ID | 1114 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
paed | +12.357 |
Australian | +11.859 |
HSBC | +11.606 |
NZ | +11.178 |
neurot | +11.038 |
Neg logit contributions | |
unity | -12.166 |
aturdays | -11.802 |
enaries | -11.449 |
assemblies | -11.380 |
endas | -11.351 |
Token | tips |
Token ID | 9040 |
Feature activation | -6.91e+00 |
Pos logit contributions | |
paed | +16.205 |
Australian | +15.043 |
HSBC | +14.636 |
piracy | +14.528 |
unethical | +14.489 |
Neg logit contributions | |
unity | -11.667 |
aturdays | -11.646 |
Commands | -11.457 |
enaries | -11.315 |
endas | -11.153 |
Token | on |
Token ID | 319 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
paed | +6.980 |
Australian | +6.304 |
neurot | +6.192 |
HSBC | +6.096 |
piracy | +6.072 |
Neg logit contributions | |
unity | -7.096 |
Commands | -6.944 |
aturdays | -6.847 |
enaries | -6.708 |
endas | -6.692 |
Token | protecting |
Token ID | 10192 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
paed | +17.022 |
Australian | +15.803 |
piracy | +15.428 |
unethical | +15.345 |
neurot | +15.337 |
Neg logit contributions | |
aturdays | -13.889 |
Commands | -13.321 |
endas | -13.289 |
unity | -13.227 |
enaries | -13.201 |
Token | yourself |
Token ID | 3511 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
paed | +15.207 |
Australian | +14.007 |
HSBC | +13.641 |
neurot | +13.405 |
unethical | +13.364 |
Neg logit contributions | |
Commands | -15.653 |
aturdays | -15.583 |
unity | -15.338 |
endas | -15.195 |
Rules | -14.853 |
Token | from |
Token ID | 422 |
Feature activation | -4.08e+01 |
Pos logit contributions | |
paed | +9.458 |
Australian | +8.425 |
neurot | +8.317 |
commercially | +8.200 |
HSBC | +8.160 |
Neg logit contributions | |
unity | -12.120 |
Commands | -12.056 |
aturdays | -11.769 |
Rules | -11.577 |
endas | -11.497 |
Token | identity |
Token ID | 5369 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
paed | +34.743 |
unethical | +33.223 |
Australian | +32.881 |
malware | +32.681 |
ransomware | +32.622 |
Neg logit contributions | |
aturdays | -19.681 |
enaries | -18.895 |
Commands | -18.708 |
unity | -18.413 |
Rules | -18.032 |
Token | theft |
Token ID | 12402 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
paed | +17.850 |
piracy | +16.690 |
Australian | +16.226 |
neurot | +16.030 |
leak | +16.027 |
Neg logit contributions | |
Commands | -19.350 |
aturdays | -19.142 |
endas | -19.030 |
unity | -19.009 |
Rules | -18.467 |
Token | related |
Token ID | 3519 |
Feature activation | -3.39e+01 |
Pos logit contributions | |
paed | +15.768 |
Australian | +14.482 |
piracy | +14.252 |
neurot | +14.016 |
unethical | +13.905 |
Neg logit contributions | |
unity | -15.088 |
Commands | -14.926 |
aturdays | -14.576 |
endas | -14.370 |
Rules | -14.160 |
Token | tax |
Token ID | 1687 |
Feature activation | -8.96e+00 |
Pos logit contributions | |
paed | +29.921 |
unethical | +28.520 |
Australian | +28.476 |
malware | +28.267 |
ransomware | +28.131 |
Neg logit contributions | |
endas | -18.880 |
aturdays | -18.712 |
unity | -18.329 |
Commands | -18.264 |
isans | -18.192 |
Token | fraud |
Token ID | 7394 |
Feature activation | -8.99e+00 |
Pos logit contributions | |
paed | +8.348 |
Australian | +7.439 |
piracy | +7.329 |
neurot | +7.327 |
unethical | +7.305 |
Neg logit contributions | |
unity | -9.687 |
Commands | -9.510 |
aturdays | -9.400 |
enaries | -9.211 |
Rules | -9.182 |
Token | levied |
Token ID | 43383 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
paed | +17.667 |
HSBC | +16.073 |
Australian | +15.686 |
NZ | +15.317 |
commercially | +15.188 |
Neg logit contributions | |
aturdays | -17.593 |
Commands | -16.819 |
unity | -16.768 |
endas | -16.713 |
enaries | -16.306 |
Token | because |
Token ID | 780 |
Feature activation | -3.03e+00 |
Pos logit contributions | |
paed | +12.614 |
Australian | +11.167 |
HSBC | +11.127 |
commercially | +10.874 |
piracy | +10.867 |
Neg logit contributions | |
Commands | -12.769 |
unity | -12.736 |
aturdays | -12.704 |
endas | -12.465 |
enaries | -12.299 |
Token | it |
Token ID | 340 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
paed | +3.274 |
Australian | +2.911 |
neurot | +2.903 |
HSBC | +2.870 |
unethical | +2.856 |
Neg logit contributions | |
unity | -3.067 |
Commands | -3.001 |
aturdays | -2.980 |
enaries | -2.927 |
Rules | -2.874 |
Token | was |
Token ID | 373 |
Feature activation | -1.88e+01 |
Pos logit contributions | |
paed | +16.704 |
Australian | +15.139 |
neurot | +15.111 |
commercially | +15.099 |
HSBC | +14.896 |
Neg logit contributions | |
aturdays | -15.162 |
Commands | -14.299 |
unity | -14.114 |
Rules | -13.931 |
endas | -13.728 |
Token | the |
Token ID | 262 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
paed | +18.671 |
unethical | +17.283 |
Australian | +16.933 |
commercially | +16.933 |
neurot | +16.881 |
Neg logit contributions | |
aturdays | -16.405 |
Commands | -15.866 |
enaries | -15.721 |
unity | -15.201 |
isans | -15.092 |
Token | third |
Token ID | 2368 |
Feature activation | -4.08e+01 |
Pos logit contributions | |
paed | +20.007 |
Australian | +18.246 |
unethical | +17.886 |
piracy | +17.658 |
neurot | +17.644 |
Neg logit contributions | |
aturdays | -15.484 |
Commands | -14.920 |
enaries | -14.657 |
endas | -14.459 |
Rules | -14.296 |
Token | time |
Token ID | 640 |
Feature activation | -1.97e+01 |
Pos logit contributions | |
paed | +35.774 |
Australian | +32.954 |
piracy | +32.158 |
HSBC | +31.969 |
commercially | +31.688 |
Neg logit contributions | |
endas | -19.924 |
aturdays | -19.414 |
Commands | -19.198 |
enaries | -18.956 |
Rules | -18.612 |
Token | En |
Token ID | 2039 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
paed | +20.564 |
HSBC | +18.605 |
Australian | +18.565 |
unethical | +18.106 |
piracy | +18.027 |
Neg logit contributions | |
aturdays | -16.024 |
endas | -14.718 |
Commands | -14.652 |
unity | -14.611 |
enaries | -14.341 |
Token | i |
Token ID | 72 |
Feature activation | -2.62e+01 |
Pos logit contributions | |
unity | +3.254 |
Commands | +3.142 |
enaries | +3.092 |
isans | +3.059 |
aturdays | +3.053 |
Neg logit contributions | |
paed | -2.970 |
neurot | -2.624 |
Australian | -2.584 |
unethical | -2.564 |
HSBC | -2.540 |
Token | had |
Token ID | 550 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
paed | +25.174 |
Australian | +23.025 |
neurot | +22.671 |
commercially | +22.652 |
HSBC | +22.548 |
Neg logit contributions | |
aturdays | -18.745 |
Commands | -16.535 |
unity | -16.439 |
endas | -16.285 |
enaries | -16.106 |
Token | been |
Token ID | 587 |
Feature activation | -2.65e+01 |
Pos logit contributions | |
paed | +21.277 |
commercially | +19.267 |
neurot | +19.244 |
Australian | +19.187 |
HSBC | +19.170 |
Neg logit contributions | |
aturdays | -17.791 |
Commands | -16.373 |
unity | -15.912 |
endas | -15.843 |
endars | -15.650 |
Token | Commission |
Token ID | 4513 |
Feature activation | -7.58e-01 |
Pos logit contributions | |
paed | +15.923 |
Australian | +14.760 |
HSBC | +14.619 |
unethical | +14.308 |
neurot | +14.258 |
Neg logit contributions | |
aturdays | -10.464 |
enaries | -10.089 |
unity | -9.985 |
Commands | -9.941 |
endas | -9.708 |
Token | said |
Token ID | 531 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
paed | +0.785 |
neurot | +0.697 |
Australian | +0.693 |
HSBC | +0.682 |
unethical | +0.681 |
Neg logit contributions | |
unity | -0.808 |
Commands | -0.782 |
aturdays | -0.774 |
enaries | -0.767 |
Rules | -0.753 |
Token | this |
Token ID | 428 |
Feature activation | -1.62e+01 |
Pos logit contributions | |
paed | +14.116 |
Australian | +12.811 |
HSBC | +12.760 |
unethical | +12.542 |
piracy | +12.518 |
Neg logit contributions | |
aturdays | -11.932 |
Commands | -11.558 |
unity | -11.449 |
enaries | -11.366 |
endars | -11.252 |
Token | was |
Token ID | 373 |
Feature activation | -9.15e+00 |
Pos logit contributions | |
paed | +17.129 |
Australian | +15.581 |
unethical | +15.504 |
HSBC | +15.390 |
piracy | +15.338 |
Neg logit contributions | |
aturdays | -13.627 |
Commands | -13.526 |
enaries | -13.381 |
endas | -13.295 |
endars | -12.945 |
Token | the |
Token ID | 262 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
paed | +9.027 |
unethical | +8.165 |
Australian | +8.090 |
neurot | +7.904 |
piracy | +7.889 |
Neg logit contributions | |
aturdays | -9.557 |
enaries | -9.443 |
Commands | -9.431 |
unity | -9.348 |
endas | -9.105 |
Token | third |
Token ID | 2368 |
Feature activation | -4.06e+01 |
Pos logit contributions | |
paed | +17.812 |
Australian | +16.343 |
unethical | +15.933 |
piracy | +15.877 |
HSBC | +15.709 |
Neg logit contributions | |
aturdays | -15.562 |
enaries | -14.894 |
Commands | -14.786 |
endas | -14.548 |
isans | -14.246 |
Token | time |
Token ID | 640 |
Feature activation | -2.38e+01 |
Pos logit contributions | |
paed | +34.426 |
Australian | +32.092 |
piracy | +31.794 |
HSBC | +31.521 |
unethical | +31.348 |
Neg logit contributions | |
endas | -20.683 |
enaries | -20.429 |
aturdays | -20.322 |
Commands | -20.039 |
isans | -19.232 |
Token | that |
Token ID | 326 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
paed | +24.366 |
Australian | +22.624 |
HSBC | +22.427 |
unethical | +22.151 |
piracy | +21.932 |
Neg logit contributions | |
aturdays | -17.434 |
enaries | -15.461 |
Commands | -15.417 |
unity | -15.380 |
endas | -15.342 |
Token | the |
Token ID | 262 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
paed | +22.310 |
Australian | +20.607 |
unethical | +20.452 |
HSBC | +20.408 |
piracy | +19.973 |
Neg logit contributions | |
aturdays | -14.826 |
enaries | -13.436 |
Commands | -13.339 |
endas | -13.251 |
unity | -13.073 |
Token | rubber |
Token ID | 14239 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
paed | +17.618 |
Australian | +16.247 |
HSBC | +16.020 |
unethical | +15.840 |
neurot | +15.724 |
Neg logit contributions | |
aturdays | -12.163 |
enaries | -11.461 |
unity | -11.289 |
Commands | -11.274 |
endas | -11.183 |
Token | industry |
Token ID | 2831 |
Feature activation | -2.55e+01 |
Pos logit contributions | |
paed | +26.673 |
Australian | +24.417 |
piracy | +24.069 |
neurot | +23.932 |
HSBC | +23.728 |
Neg logit contributions | |
aturdays | -15.702 |
Commands | -14.648 |
endas | -14.155 |
enaries | -14.136 |
unity | -14.054 |
Token | of |
Token ID | 286 |
Feature activation | -2.03e+01 |
Pos logit contributions | |
paed | +22.165 |
Australian | +20.343 |
HSBC | +19.751 |
commercially | +19.442 |
NZ | +19.377 |
Neg logit contributions | |
aturdays | -19.296 |
Commands | -18.430 |
unity | -18.396 |
enaries | -18.120 |
endas | -17.909 |
Token | $ |
Token ID | 720 |
Feature activation | +2.94e-01 |
Pos logit contributions | |
paed | +20.151 |
Australian | +19.638 |
NZ | +18.713 |
HSBC | +18.412 |
neurot | +17.975 |
Neg logit contributions | |
aturdays | -16.377 |
Commands | -15.398 |
unity | -15.292 |
isans | -15.070 |
Rules | -14.915 |
Token | 17 |
Token ID | 1558 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
unity | +0.269 |
Commands | +0.260 |
aturdays | +0.254 |
enaries | +0.253 |
Rules | +0.248 |
Neg logit contributions | |
paed | -0.348 |
neurot | -0.314 |
Australian | -0.312 |
HSBC | -0.308 |
unethical | -0.308 |
Token | . |
Token ID | 13 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
paed | +18.258 |
Australian | +17.227 |
NZ | +16.269 |
HSBC | +15.948 |
neurot | +15.822 |
Neg logit contributions | |
Commands | -17.263 |
unity | -16.834 |
aturdays | -16.804 |
endas | -16.563 |
enaries | -16.500 |
Token | 2 |
Token ID | 17 |
Feature activation | -2.45e+01 |
Pos logit contributions | |
paed | +1.578 |
Australian | +1.429 |
neurot | +1.424 |
HSBC | +1.407 |
unethical | +1.391 |
Neg logit contributions | |
unity | -1.169 |
Commands | -1.121 |
aturdays | -1.106 |
enaries | -1.095 |
assemblies | -1.075 |
Token | million |
Token ID | 1510 |
Feature activation | -4.00e+01 |
Pos logit contributions | |
paed | +20.652 |
Australian | +19.742 |
NZ | +18.584 |
HSBC | +18.080 |
commercially | +17.865 |
Neg logit contributions | |
Commands | -19.782 |
aturdays | -19.553 |
enaries | -19.308 |
unity | -19.265 |
endas | -19.009 |
Token | in |
Token ID | 287 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
paed | +32.381 |
Australian | +32.046 |
NZ | +30.394 |
HSBC | +30.071 |
Malaysian | +29.177 |
Neg logit contributions | |
aturdays | -20.745 |
Commands | -19.946 |
unity | -19.350 |
Rules | -18.631 |
endas | -18.599 |
Token | commissions |
Token ID | 30421 |
Feature activation | -2.58e+01 |
Pos logit contributions | |
Australian | +27.278 |
paed | +27.003 |
HSBC | +25.531 |
Malaysian | +25.439 |
NZ | +25.437 |
Neg logit contributions | |
aturdays | -16.194 |
isans | -14.677 |
endas | -14.558 |
Commands | -14.540 |
Rules | -14.517 |
Token | to |
Token ID | 284 |
Feature activation | -2.62e+01 |
Pos logit contributions | |
paed | +23.037 |
Australian | +21.857 |
NZ | +21.004 |
HSBC | +20.874 |
commercially | +20.397 |
Neg logit contributions | |
aturdays | -19.520 |
unity | -18.793 |
Commands | -18.545 |
endas | -18.376 |
Rules | -17.815 |
Token | an |
Token ID | 281 |
Feature activation | -3.73e+01 |
Pos logit contributions | |
paed | +27.645 |
Australian | +27.228 |
HSBC | +26.319 |
Malaysian | +25.509 |
NZ | +25.335 |
Neg logit contributions | |
aturdays | -15.970 |
unity | -14.180 |
Commands | -13.672 |
Rules | -13.651 |
isans | -13.577 |
Token | agent |
Token ID | 5797 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
Australian | +34.181 |
HSBC | +31.735 |
paed | +31.576 |
unethical | +30.107 |
Malaysian | +29.971 |
Neg logit contributions | |
aturdays | -20.098 |
enaries | -19.202 |
Commands | -18.450 |
unity | -18.347 |
Dialogue | -17.529 |
Token | � |
Token ID | 251 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
paed | +5.556 |
Australian | +4.858 |
neurot | +4.850 |
HSBC | +4.791 |
unethical | +4.748 |
Neg logit contributions | |
unity | -6.845 |
Commands | -6.697 |
aturdays | -6.627 |
enaries | -6.530 |
endas | -6.460 |
Token | said |
Token ID | 531 |
Feature activation | -2.95e+01 |
Pos logit contributions | |
paed | +25.303 |
Australian | +23.256 |
neurot | +23.017 |
HSBC | +22.699 |
unethical | +22.480 |
Neg logit contributions | |
Commands | -16.368 |
aturdays | -15.902 |
unity | -15.815 |
enaries | -15.572 |
endas | -15.555 |
Token | Edward |
Token ID | 10443 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
paed | +29.661 |
Australian | +27.747 |
HSBC | +26.945 |
neurot | +26.748 |
dermat | +26.457 |
Neg logit contributions | |
aturdays | -16.761 |
Commands | -16.007 |
endars | -15.988 |
enaries | -15.979 |
endas | -15.791 |
Token | Chan |
Token ID | 18704 |
Feature activation | -6.42e+00 |
Pos logit contributions | |
paed | +12.829 |
Australian | +12.161 |
HSBC | +11.857 |
Malaysian | +11.238 |
NZ | +11.238 |
Neg logit contributions | |
aturdays | -14.922 |
unity | -14.829 |
assemblies | -14.168 |
enaries | -14.063 |
Rules | -14.008 |
Token | , |
Token ID | 11 |
Feature activation | -1.59e+01 |
Pos logit contributions | |
paed | +6.094 |
Australian | +5.385 |
neurot | +5.350 |
HSBC | +5.317 |
piracy | +5.192 |
Neg logit contributions | |
unity | -7.133 |
Commands | -6.960 |
aturdays | -6.877 |
enaries | -6.777 |
assemblies | -6.733 |
Token | an |
Token ID | 281 |
Feature activation | -3.98e+01 |
Pos logit contributions | |
paed | +15.180 |
Australian | +13.697 |
neurot | +13.480 |
HSBC | +13.185 |
dermat | +12.856 |
Neg logit contributions | |
aturdays | -15.292 |
Commands | -14.818 |
unity | -14.804 |
enaries | -14.800 |
endas | -14.562 |
Token | official |
Token ID | 1743 |
Feature activation | -9.25e+00 |
Pos logit contributions | |
Australian | +32.880 |
paed | +32.765 |
HSBC | +30.194 |
dermat | +30.069 |
neurot | +29.844 |
Neg logit contributions | |
enaries | -22.607 |
aturdays | -22.052 |
endars | -21.489 |
Commands | -20.615 |
unity | -20.126 |
Token | with |
Token ID | 351 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
paed | +9.264 |
Australian | +8.278 |
neurot | +8.170 |
HSBC | +7.992 |
unethical | +7.930 |
Neg logit contributions | |
unity | -9.426 |
aturdays | -9.391 |
Commands | -9.390 |
enaries | -9.272 |
endas | -9.199 |
Token | Greenpeace |
Token ID | 42793 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
paed | +21.458 |
Australian | +20.237 |
HSBC | +19.705 |
neurot | +19.558 |
Malaysian | +18.869 |
Neg logit contributions | |
aturdays | -16.855 |
enaries | -15.405 |
unity | -15.326 |
endars | -15.283 |
isans | -15.233 |
Token | in |
Token ID | 287 |
Feature activation | -1.71e+01 |
Pos logit contributions | |
paed | +10.197 |
Australian | +9.329 |
HSBC | +8.935 |
neurot | +8.831 |
NZ | +8.644 |
Neg logit contributions | |
unity | -12.490 |
aturdays | -12.446 |
Commands | -12.228 |
enaries | -11.930 |
endars | -11.904 |
Token | southern |
Token ID | 8372 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
paed | +15.163 |
Australian | +14.259 |
HSBC | +13.642 |
neurot | +13.331 |
Malaysian | +13.314 |
Neg logit contributions | |
aturdays | -16.530 |
enaries | -16.144 |
endas | -16.031 |
Commands | -15.927 |
Rules | -15.833 |
Token | food |
Token ID | 2057 |
Feature activation | -6.92e+00 |
Pos logit contributions | |
paed | +2.586 |
neurot | +2.344 |
Australian | +2.325 |
unethical | +2.281 |
HSBC | +2.281 |
Neg logit contributions | |
unity | -1.995 |
Commands | -1.938 |
aturdays | -1.897 |
enaries | -1.885 |
endas | -1.852 |
Token | from |
Token ID | 422 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
paed | +8.056 |
neurot | +7.382 |
Australian | +7.290 |
piracy | +7.241 |
unethical | +7.153 |
Neg logit contributions | |
unity | -6.030 |
Commands | -5.953 |
aturdays | -5.889 |
enaries | -5.746 |
endas | -5.669 |
Token | each |
Token ID | 1123 |
Feature activation | -5.01e+00 |
Pos logit contributions | |
paed | +14.818 |
Australian | +13.614 |
neurot | +13.588 |
unethical | +13.213 |
piracy | +13.187 |
Neg logit contributions | |
aturdays | -10.838 |
Commands | -10.817 |
unity | -10.804 |
enaries | -10.720 |
endas | -10.394 |
Token | state |
Token ID | 1181 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
paed | +5.606 |
neurot | +5.080 |
Australian | +5.075 |
unethical | +4.937 |
piracy | +4.914 |
Neg logit contributions | |
unity | -4.766 |
Commands | -4.705 |
aturdays | -4.653 |
enaries | -4.606 |
Rules | -4.521 |
Token | � |
Token ID | 447 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
paed | +19.949 |
Australian | +18.636 |
neurot | +18.389 |
HSBC | +18.116 |
piracy | +17.976 |
Neg logit contributions | |
aturdays | -14.855 |
enaries | -14.565 |
Commands | -14.413 |
unity | -14.353 |
endas | -14.332 |
Token | � |
Token ID | 251 |
Feature activation | -3.97e+01 |
Pos logit contributions | |
paed | +8.946 |
Australian | +7.845 |
neurot | +7.785 |
HSBC | +7.728 |
unethical | +7.579 |
Neg logit contributions | |
unity | -11.560 |
aturdays | -11.393 |
Commands | -11.391 |
enaries | -11.234 |
endas | -11.082 |
Token | and |
Token ID | 290 |
Feature activation | -8.55e+00 |
Pos logit contributions | |
paed | +31.792 |
Australian | +30.767 |
leak | +30.515 |
viral | +29.941 |
neurot | +29.894 |
Neg logit contributions | |
aturdays | -18.127 |
Commands | -17.127 |
unity | -16.792 |
endas | -16.557 |
enaries | -16.512 |
Token | � |
Token ID | 564 |
Feature activation | -5.29e+00 |
Pos logit contributions | |
paed | +9.312 |
neurot | +8.541 |
Australian | +8.491 |
unethical | +8.206 |
piracy | +8.202 |
Neg logit contributions | |
unity | -7.886 |
Commands | -7.750 |
aturdays | -7.716 |
enaries | -7.653 |
endas | -7.496 |
Token | � |
Token ID | 250 |
Feature activation | -2.73e+01 |
Pos logit contributions | |
paed | +3.185 |
neurot | +2.613 |
Australian | +2.596 |
unethical | +2.487 |
HSBC | +2.485 |
Neg logit contributions | |
unity | -7.734 |
Commands | -7.570 |
aturdays | -7.500 |
enaries | -7.451 |
assemblies | -7.390 |
Token | most |
Token ID | 1712 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
paed | +27.455 |
neurot | +25.644 |
Australian | +25.617 |
piracy | +24.878 |
viral | +24.697 |
Neg logit contributions | |
unity | -14.563 |
Commands | -14.466 |
assemblies | -13.407 |
aturdays | -13.407 |
enaries | -13.228 |
Token | popular |
Token ID | 2968 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
paed | +13.019 |
Australian | +11.818 |
neurot | +11.803 |
unethical | +11.549 |
viral | +11.373 |
Neg logit contributions | |
unity | -10.860 |
Commands | -10.630 |
enaries | -10.626 |
endas | -10.395 |
aturdays | -10.358 |
Token | allies |
Token ID | 7681 |
Feature activation | -2.70e+01 |
Pos logit contributions | |
paed | +29.895 |
Australian | +29.106 |
HSBC | +27.964 |
UK | +27.165 |
NZ | +26.799 |
Neg logit contributions | |
aturdays | -16.983 |
endars | -15.763 |
Commands | -15.675 |
isans | -15.577 |
Rules | -15.422 |
Token | to |
Token ID | 284 |
Feature activation | -8.27e+00 |
Pos logit contributions | |
paed | +24.210 |
Australian | +23.161 |
HSBC | +22.723 |
NZ | +21.648 |
UK | +21.636 |
Neg logit contributions | |
aturdays | -20.397 |
isans | -18.661 |
endars | -18.604 |
endas | -18.563 |
Commands | -18.444 |
Token | open |
Token ID | 1280 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
paed | +8.539 |
Australian | +7.717 |
neurot | +7.601 |
HSBC | +7.569 |
unethical | +7.461 |
Neg logit contributions | |
aturdays | -8.324 |
Commands | -8.126 |
unity | -8.043 |
Rules | -7.895 |
isans | -7.891 |
Token | criminal |
Token ID | 4301 |
Feature activation | -6.89e+00 |
Pos logit contributions | |
paed | +15.091 |
Australian | +14.095 |
HSBC | +13.797 |
unethical | +13.621 |
piracy | +13.595 |
Neg logit contributions | |
aturdays | -6.738 |
Commands | -6.697 |
unity | -6.486 |
isans | -6.398 |
endas | -6.396 |
Token | investigations |
Token ID | 10986 |
Feature activation | -8.52e+00 |
Pos logit contributions | |
paed | +8.054 |
Australian | +7.206 |
HSBC | +7.167 |
piracy | +7.070 |
unethical | +7.049 |
Neg logit contributions | |
unity | -6.079 |
Commands | -6.019 |
aturdays | -5.999 |
endas | -5.877 |
enaries | -5.868 |
Token | into |
Token ID | 656 |
Feature activation | -3.97e+01 |
Pos logit contributions | |
paed | +8.245 |
Australian | +7.316 |
unethical | +7.192 |
HSBC | +7.187 |
neurot | +7.117 |
Neg logit contributions | |
unity | -9.041 |
aturdays | -9.037 |
Commands | -8.898 |
enaries | -8.659 |
Rules | -8.586 |
Token | Assange |
Token ID | 21882 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
paed | +36.668 |
Australian | +34.400 |
HSBC | +33.156 |
unethical | +32.901 |
piracy | +32.379 |
Neg logit contributions | |
aturdays | -19.537 |
endars | -18.251 |
Commands | -18.013 |
enaries | -17.830 |
isans | -17.820 |
Token | , |
Token ID | 11 |
Feature activation | -2.37e+01 |
Pos logit contributions | |
paed | +16.963 |
Australian | +15.053 |
neurot | +14.844 |
HSBC | +14.802 |
unethical | +14.686 |
Neg logit contributions | |
aturdays | -16.912 |
unity | -16.495 |
Commands | -16.220 |
endas | -15.722 |
enaries | -15.709 |
Token | while |
Token ID | 981 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
paed | +23.670 |
Australian | +22.035 |
unethical | +21.351 |
HSBC | +21.344 |
piracy | +20.824 |
Neg logit contributions | |
aturdays | -16.906 |
enaries | -16.406 |
Commands | -16.224 |
endas | -16.088 |
endars | -15.804 |
Token | the |
Token ID | 262 |
Feature activation | -9.89e+00 |
Pos logit contributions | |
paed | +14.884 |
Australian | +13.793 |
HSBC | +13.318 |
unethical | +13.078 |
neurot | +12.912 |
Neg logit contributions | |
aturdays | -12.567 |
Commands | -12.231 |
unity | -12.098 |
endars | -12.090 |
enaries | -12.029 |
Token | US |
Token ID | 1294 |
Feature activation | -6.06e+00 |
Pos logit contributions | |
paed | +10.755 |
Australian | +9.935 |
HSBC | +9.487 |
neurot | +9.391 |
unethical | +9.362 |
Neg logit contributions | |
aturdays | -9.212 |
Commands | -9.059 |
unity | -9.048 |
enaries | -8.996 |
Rules | -8.811 |
Token | - |
Token ID | 532 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
paed | +13.084 |
Australian | +11.853 |
HSBC | +11.273 |
neurot | +11.068 |
unethical | +11.053 |
Neg logit contributions | |
aturdays | -15.380 |
unity | -15.066 |
Commands | -14.695 |
endas | -14.434 |
enaries | -14.382 |
Token | up |
Token ID | 510 |
Feature activation | -1.60e+01 |
Pos logit contributions | |
paed | +21.502 |
Australian | +19.986 |
HSBC | +19.793 |
unethical | +19.252 |
NZ | +18.894 |
Neg logit contributions | |
aturdays | -14.282 |
Commands | -14.105 |
unity | -14.104 |
enaries | -13.691 |
endas | -13.582 |
Token | to |
Token ID | 284 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
paed | +16.215 |
Australian | +14.799 |
NZ | +14.389 |
HSBC | +14.352 |
piracy | +14.304 |
Neg logit contributions | |
unity | -13.733 |
Commands | -13.598 |
assemblies | -13.035 |
endas | -12.986 |
aturdays | -12.888 |
Token | $ |
Token ID | 720 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
paed | +17.338 |
Australian | +16.116 |
HSBC | +15.818 |
NZ | +15.548 |
unethical | +15.186 |
Neg logit contributions | |
aturdays | -13.566 |
endas | -13.416 |
Commands | -13.248 |
unity | -13.048 |
enaries | -12.963 |
Token | 17 |
Token ID | 1558 |
Feature activation | -2.45e+01 |
Pos logit contributions | |
unity | +1.526 |
Commands | +1.472 |
enaries | +1.427 |
aturdays | +1.426 |
Rules | +1.415 |
Neg logit contributions | |
paed | -2.159 |
neurot | -1.958 |
Australian | -1.933 |
unethical | -1.924 |
piracy | -1.913 |
Token | million |
Token ID | 1510 |
Feature activation | -3.96e+01 |
Pos logit contributions | |
paed | +21.650 |
Australian | +20.614 |
NZ | +19.491 |
HSBC | +19.462 |
neurot | +19.079 |
Neg logit contributions | |
endas | -18.405 |
Commands | -18.291 |
aturdays | -18.236 |
unity | -18.119 |
enaries | -17.882 |
Token | . |
Token ID | 13 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
paed | +32.773 |
Australian | +32.112 |
HSBC | +30.845 |
NZ | +30.319 |
(£ | +29.638 |
Neg logit contributions | |
aturdays | -20.710 |
unity | -19.607 |
endas | -19.286 |
Commands | -19.124 |
enaries | -18.526 |
Token |
|
Token ID | 198 |
Feature activation | -9.17e+00 |
Pos logit contributions | |
Australian | +16.944 |
paed | +16.913 |
HSBC | +16.299 |
NZ | +15.610 |
ITV | +15.299 |
Neg logit contributions | |
unity | -17.054 |
aturdays | -16.898 |
enaries | -16.474 |
assemblies | -16.278 |
endas | -16.024 |
Token |
|
Token ID | 198 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
paed | +6.699 |
Australian | +6.280 |
HSBC | +5.879 |
NZ | +5.730 |
neurot | +5.670 |
Neg logit contributions | |
aturdays | -11.995 |
unity | -11.539 |
enaries | -11.277 |
endars | -11.243 |
endas | -11.159 |
Token | Former |
Token ID | 14282 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
paed | +15.785 |
Australian | +14.926 |
HSBC | +14.474 |
NZ | +13.890 |
Australian | +13.789 |
Neg logit contributions | |
unity | -13.114 |
aturdays | -12.816 |
Commands | -12.300 |
assemblies | -12.181 |
enaries | -12.125 |
Token | Sec |
Token ID | 1882 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
paed | +26.444 |
Australian | +26.373 |
HSBC | +25.512 |
NZ | +24.725 |
Malaysian | +24.307 |
Neg logit contributions | |
aturdays | -14.460 |
endas | -13.271 |
enaries | -13.117 |
endars | -12.927 |
isans | -12.891 |
Token | executives |
Token ID | 12353 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
paed | +5.471 |
Australian | +4.956 |
neurot | +4.873 |
HSBC | +4.811 |
piracy | +4.777 |
Neg logit contributions | |
unity | -4.541 |
aturdays | -4.476 |
Commands | -4.454 |
endas | -4.356 |
enaries | -4.349 |
Token | that |
Token ID | 326 |
Feature activation | -2.30e+01 |
Pos logit contributions | |
paed | +15.205 |
Australian | +13.868 |
HSBC | +13.592 |
commercially | +13.342 |
neurot | +13.229 |
Neg logit contributions | |
aturdays | -16.163 |
unity | -16.009 |
Commands | -15.559 |
Rules | -15.360 |
endas | -15.322 |
Token | the |
Token ID | 262 |
Feature activation | -6.65e+00 |
Pos logit contributions | |
paed | +22.811 |
Australian | +21.459 |
HSBC | +21.264 |
Malaysian | +20.217 |
neurot | +20.216 |
Neg logit contributions | |
aturdays | -17.289 |
unity | -15.821 |
endas | -15.702 |
enaries | -15.495 |
endars | -15.485 |
Token | NDP |
Token ID | 20392 |
Feature activation | -6.69e+00 |
Pos logit contributions | |
paed | +6.719 |
Australian | +6.091 |
neurot | +5.964 |
HSBC | +5.963 |
unethical | +5.857 |
Neg logit contributions | |
aturdays | -6.882 |
unity | -6.848 |
Commands | -6.808 |
enaries | -6.676 |
endas | -6.593 |
Token | critic |
Token ID | 4014 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
paed | +7.209 |
neurot | +6.521 |
Australian | +6.488 |
unethical | +6.341 |
HSBC | +6.308 |
Neg logit contributions | |
unity | -6.411 |
aturdays | -6.368 |
Commands | -6.317 |
enaries | -6.301 |
endas | -6.154 |
Token | estimates |
Token ID | 7746 |
Feature activation | -3.94e+01 |
Pos logit contributions | |
paed | +17.840 |
Australian | +16.221 |
neurot | +16.004 |
HSBC | +15.925 |
unethical | +15.895 |
Neg logit contributions | |
aturdays | -12.972 |
unity | -12.898 |
Commands | -12.884 |
endas | -12.858 |
enaries | -12.792 |
Token | cost |
Token ID | 1575 |
Feature activation | -2.09e+01 |
Pos logit contributions | |
paed | +32.677 |
Australian | +31.225 |
HSBC | +30.829 |
leak | +29.983 |
unethical | +29.966 |
Neg logit contributions | |
aturdays | -21.076 |
endars | -18.631 |
endas | -18.472 |
Dialogue | -18.117 |
unity | -18.053 |
Token | the |
Token ID | 262 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
paed | +20.575 |
Australian | +19.669 |
HSBC | +19.087 |
unethical | +18.552 |
NZ | +18.487 |
Neg logit contributions | |
aturdays | -16.202 |
Commands | -15.684 |
isans | -14.991 |
endas | -14.982 |
Rules | -14.893 |
Token | federal |
Token ID | 2717 |
Feature activation | -7.33e+00 |
Pos logit contributions | |
paed | +10.978 |
Australian | +10.117 |
neurot | +9.677 |
HSBC | +9.622 |
unethical | +9.490 |
Neg logit contributions | |
aturdays | -12.020 |
Commands | -11.842 |
enaries | -11.579 |
unity | -11.566 |
endas | -11.449 |
Token | treasury |
Token ID | 38115 |
Feature activation | -2.04e+01 |
Pos logit contributions | |
paed | +6.199 |
Australian | +5.493 |
neurot | +5.429 |
HSBC | +5.278 |
unethical | +5.222 |
Neg logit contributions | |
Commands | -8.607 |
aturdays | -8.596 |
unity | -8.560 |
endas | -8.410 |
enaries | -8.354 |
Token | $ |
Token ID | 720 |
Feature activation | +6.79e+00 |
Pos logit contributions | |
paed | +19.157 |
Australian | +17.927 |
HSBC | +17.387 |
neurot | +17.259 |
NZ | +17.200 |
Neg logit contributions | |
aturdays | -17.162 |
endas | -16.353 |
Commands | -16.277 |
endars | -15.992 |
unity | -15.975 |
Token | the |
Token ID | 262 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
unity | +16.523 |
prayers | +15.261 |
Commands | +15.179 |
assemblies | +15.145 |
doors | +15.124 |
Neg logit contributions | |
paed | -11.000 |
neurot | -9.408 |
piracy | -9.374 |
HSBC | -9.327 |
Australian | -9.124 |
Token | government |
Token ID | 1230 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
unity | +18.862 |
doors | +17.510 |
prayers | +17.485 |
Commands | +17.375 |
assemblies | +17.197 |
Neg logit contributions | |
paed | -11.429 |
neurot | -9.633 |
HSBC | -9.583 |
piracy | -9.572 |
NZ | -9.168 |
Token | and |
Token ID | 290 |
Feature activation | +8.65e+00 |
Pos logit contributions | |
unity | +13.889 |
Commands | +12.853 |
assemblies | +12.812 |
isans | +12.760 |
prayers | +12.738 |
Neg logit contributions | |
paed | -13.255 |
Australian | -11.561 |
piracy | -11.550 |
neurot | -11.511 |
NZ | -11.479 |
Token | the |
Token ID | 262 |
Feature activation | +1.57e+01 |
Pos logit contributions | |
unity | +9.791 |
Commands | +9.144 |
prayers | +8.978 |
assemblies | +8.966 |
isans | +8.943 |
Neg logit contributions | |
paed | -8.027 |
neurot | -7.027 |
HSBC | -6.852 |
piracy | -6.834 |
Australian | -6.797 |
Token | public |
Token ID | 1171 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
unity | +18.250 |
prayers | +16.957 |
doors | +16.898 |
Commands | +16.867 |
assemblies | +16.744 |
Neg logit contributions | |
paed | -11.943 |
neurot | -10.101 |
HSBC | -10.040 |
piracy | -9.928 |
NZ | -9.656 |
Token | require |
Token ID | 2421 |
Feature activation | +2.77e+01 |
Pos logit contributions | |
unity | +18.977 |
assemblies | +17.651 |
prayers | +17.421 |
Commands | +17.308 |
isans | +17.279 |
Neg logit contributions | |
paed | -13.314 |
piracy | -11.357 |
neurot | -11.246 |
NZ | -11.234 |
unethical | -11.223 |
Token | more |
Token ID | 517 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
unity | +29.955 |
prayers | +26.719 |
doors | +26.706 |
assemblies | +26.131 |
isans | +25.955 |
Neg logit contributions | |
paed | -15.812 |
HSBC | -13.262 |
piracy | -13.010 |
ITV | -12.698 |
NZ | -12.624 |
Token | order |
Token ID | 1502 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
unity | +24.552 |
doors | +21.945 |
prayers | +21.848 |
isans | +21.777 |
Commands | +21.679 |
Neg logit contributions | |
paed | -15.166 |
HSBC | -12.830 |
piracy | -12.574 |
ITV | -12.512 |
NZ | -12.408 |
Token | and |
Token ID | 290 |
Feature activation | +3.24e+01 |
Pos logit contributions | |
unity | +15.888 |
isans | +14.777 |
Commands | +14.644 |
assemblies | +14.446 |
enaries | +14.438 |
Neg logit contributions | |
paed | -15.505 |
HSBC | -13.501 |
piracy | -13.431 |
unethical | -13.239 |
neurot | -13.223 |
Token | certainty |
Token ID | 18979 |
Feature activation | +8.61e+00 |
Pos logit contributions | |
unity | +33.531 |
doors | +29.265 |
prayers | +29.151 |
assemblies | +28.906 |
Commands | +28.570 |
Neg logit contributions | |
paed | -16.352 |
HSBC | -13.916 |
ITV | -13.742 |
piracy | -13.547 |
NZ | -13.125 |
Token | . |
Token ID | 13 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
unity | +8.891 |
Commands | +8.451 |
enaries | +8.293 |
assemblies | +8.241 |
isans | +8.235 |
Neg logit contributions | |
paed | -8.738 |
neurot | -7.597 |
HSBC | -7.579 |
piracy | -7.552 |
Australian | -7.522 |
Token | " |
Token ID | 366 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
unity | +26.942 |
Commands | +25.150 |
doors | +23.840 |
assemblies | +23.692 |
prayers | +23.145 |
Neg logit contributions | |
paed | -15.908 |
neurot | -14.059 |
HSBC | -13.651 |
unethical | -13.243 |
Malaysian | -13.085 |
Token | c |
Token ID | 66 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
unity | +16.570 |
Commands | +15.913 |
enaries | +15.541 |
Rules | +15.382 |
aturdays | +15.096 |
Neg logit contributions | |
paed | -15.512 |
neurot | -13.980 |
HSBC | -13.585 |
unethical | -13.579 |
Australian | -13.494 |
Token | :\ |
Token ID | 7479 |
Feature activation | +5.91e+00 |
Pos logit contributions | |
unity | +13.165 |
Commands | +12.536 |
enaries | +12.243 |
endas | +11.975 |
Rules | +11.960 |
Neg logit contributions | |
paed | -14.609 |
neurot | -13.157 |
HSBC | -12.986 |
Australian | -12.976 |
unethical | -12.952 |
Token | tmp |
Token ID | 22065 |
Feature activation | +1.59e+01 |
Pos logit contributions | |
unity | +5.995 |
Commands | +5.765 |
enaries | +5.641 |
aturdays | +5.611 |
Rules | +5.573 |
Neg logit contributions | |
paed | -6.192 |
neurot | -5.586 |
Australian | -5.516 |
HSBC | -5.468 |
unethical | -5.459 |
Token | ". |
Token ID | 1911 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
unity | +13.656 |
Commands | +13.170 |
enaries | +12.741 |
Rules | +12.477 |
doors | +12.397 |
Neg logit contributions | |
paed | -16.058 |
neurot | -14.734 |
unethical | -14.362 |
Australian | -14.186 |
HSBC | -14.164 |
Token | Only |
Token ID | 5514 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
Commands | +21.556 |
unity | +20.601 |
Rules | +19.187 |
doors | +19.167 |
assemblies | +18.585 |
Neg logit contributions | |
paed | -16.105 |
neurot | -14.384 |
unethical | -13.847 |
HSBC | -13.548 |
piracy | -13.294 |
Token | a |
Token ID | 257 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
unity | +26.846 |
Commands | +26.276 |
doors | +25.011 |
assemblies | +24.378 |
directives | +24.281 |
Neg logit contributions | |
paed | -15.761 |
neurot | -14.855 |
HSBC | -13.694 |
unethical | -13.570 |
ITV | -13.259 |
Token | single |
Token ID | 2060 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
unity | +23.381 |
Commands | +21.985 |
doors | +20.666 |
prayers | +20.280 |
Rules | +20.224 |
Neg logit contributions | |
paed | -14.797 |
neurot | -13.611 |
unethical | -13.224 |
HSBC | -13.220 |
ITV | -12.951 |
Token | back |
Token ID | 736 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
unity | +15.100 |
Commands | +14.380 |
doors | +13.677 |
assemblies | +13.305 |
prayers | +13.195 |
Neg logit contributions | |
paed | -13.650 |
neurot | -12.501 |
HSBC | -12.070 |
unethical | -12.034 |
ITV | -11.771 |
Token | sl |
Token ID | 6649 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
unity | +10.426 |
Commands | +10.073 |
doors | +9.639 |
enaries | +9.318 |
endas | +9.308 |
Neg logit contributions | |
paed | -14.023 |
neurot | -12.912 |
unethical | -12.558 |
HSBC | -12.511 |
ITV | -12.400 |
Token | ash |
Token ID | 1077 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
unity | +9.383 |
Commands | +8.926 |
enaries | +8.844 |
isans | +8.597 |
endas | +8.567 |
Neg logit contributions | |
paed | -13.587 |
neurot | -12.528 |
piracy | -12.123 |
unethical | -12.107 |
Australian | -11.901 |
Token | . |
Token ID | 13 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
unity | +12.691 |
Commands | +11.768 |
enaries | +11.683 |
isans | +11.563 |
aturdays | +11.527 |
Neg logit contributions | |
paed | -14.184 |
neurot | -12.767 |
HSBC | -12.498 |
Australian | -12.323 |
unethical | -12.285 |
Token | From |
Token ID | 3574 |
Feature activation | +9.09e+00 |
Pos logit contributions | |
unity | +14.807 |
Commands | +14.794 |
Rules | +14.113 |
isans | +13.568 |
doors | +13.535 |
Neg logit contributions | |
paed | -13.925 |
neurot | -12.694 |
unethical | -12.413 |
piracy | -12.216 |
commercially | -11.929 |
Token | now |
Token ID | 783 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
unity | +10.114 |
Commands | +9.461 |
assemblies | +9.309 |
doors | +9.274 |
aturdays | +9.260 |
Neg logit contributions | |
paed | -8.269 |
neurot | -7.309 |
unethical | -7.144 |
HSBC | -7.098 |
Australian | -7.061 |
Token | on |
Token ID | 319 |
Feature activation | +2.72e+01 |
Pos logit contributions | |
unity | +12.826 |
Commands | +11.850 |
prayers | +11.825 |
aturdays | +11.804 |
doors | +11.659 |
Neg logit contributions | |
paed | -17.516 |
neurot | -15.826 |
HSBC | -15.397 |
ITV | -15.263 |
unethical | -15.163 |
Token | , |
Token ID | 11 |
Feature activation | +2.69e+01 |
Pos logit contributions | |
unity | +26.951 |
prayers | +25.166 |
doors | +25.024 |
assemblies | +24.930 |
isans | +24.246 |
Neg logit contributions | |
paed | -15.901 |
neurot | -14.421 |
HSBC | -13.858 |
ITV | -13.444 |
piracy | -13.396 |
Token | the |
Token ID | 262 |
Feature activation | +2.68e+01 |
Pos logit contributions | |
unity | +28.785 |
prayers | +26.960 |
doors | +26.902 |
assemblies | +26.467 |
Commands | +25.920 |
Neg logit contributions | |
paed | -13.690 |
neurot | -12.475 |
HSBC | -11.687 |
ITV | -11.460 |
piracy | -11.311 |
Token | phrase |
Token ID | 9546 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
unity | +30.033 |
doors | +28.760 |
prayers | +28.075 |
assemblies | +27.587 |
Commands | +27.484 |
Neg logit contributions | |
paed | -13.168 |
neurot | -11.339 |
ITV | -10.977 |
HSBC | -10.749 |
piracy | -10.570 |
Token | I |
Token ID | 314 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
unity | +11.146 |
Commands | +10.384 |
doors | +10.149 |
assemblies | +10.111 |
prayers | +10.061 |
Neg logit contributions | |
paed | -11.100 |
neurot | -9.978 |
HSBC | -9.830 |
unethical | -9.769 |
ITV | -9.719 |
Token | 'll |
Token ID | 1183 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
paed | +2.445 |
neurot | +2.175 |
Australian | +2.150 |
HSBC | +2.114 |
unethical | +2.104 |
Neg logit contributions | |
unity | -2.790 |
aturdays | -2.710 |
Commands | -2.702 |
enaries | -2.659 |
Rules | -2.628 |
Token | be |
Token ID | 307 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
paed | +2.601 |
neurot | +2.290 |
Australian | +2.270 |
HSBC | +2.215 |
unethical | +2.205 |
Neg logit contributions | |
unity | -3.433 |
aturdays | -3.359 |
Commands | -3.351 |
enaries | -3.288 |
Rules | -3.262 |
Token | using |
Token ID | 1262 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
paed | +1.911 |
neurot | +1.670 |
Australian | +1.665 |
unethical | +1.627 |
HSBC | +1.619 |
Neg logit contributions | |
unity | -2.530 |
Commands | -2.471 |
aturdays | -2.457 |
enaries | -2.432 |
Rules | -2.392 |
Token | In |
Token ID | 554 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
Commands | +11.044 |
unity | +10.984 |
Rules | +10.346 |
isans | +10.215 |
doors | +10.134 |
Neg logit contributions | |
paed | -11.319 |
neurot | -10.079 |
unethical | -9.965 |
piracy | -9.900 |
commercially | -9.659 |
Token | doing |
Token ID | 1804 |
Feature activation | +7.77e+00 |
Pos logit contributions | |
unity | +1.330 |
Commands | +1.284 |
aturdays | +1.261 |
enaries | +1.254 |
assemblies | +1.238 |
Neg logit contributions | |
paed | -1.232 |
neurot | -1.091 |
Australian | -1.080 |
HSBC | -1.067 |
unethical | -1.064 |
Token | so |
Token ID | 523 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
unity | +7.494 |
Commands | +6.931 |
assemblies | +6.868 |
enaries | +6.834 |
doors | +6.770 |
Neg logit contributions | |
paed | -8.522 |
neurot | -7.578 |
Australian | -7.507 |
HSBC | -7.447 |
unethical | -7.432 |
Token | , |
Token ID | 11 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
unity | +12.076 |
assemblies | +11.082 |
enaries | +11.068 |
Commands | +11.033 |
isans | +10.999 |
Neg logit contributions | |
paed | -14.044 |
neurot | -12.419 |
HSBC | -12.361 |
Australian | -12.278 |
unethical | -12.181 |
Token | I |
Token ID | 314 |
Feature activation | +6.54e+00 |
Pos logit contributions | |
unity | +11.934 |
assemblies | +10.966 |
Commands | +10.939 |
prayers | +10.866 |
doors | +10.729 |
Neg logit contributions | |
paed | -13.110 |
neurot | -11.788 |
HSBC | -11.707 |
piracy | -11.440 |
unethical | -11.369 |
Token | have |
Token ID | 423 |
Feature activation | +2.94e+01 |
Pos logit contributions | |
unity | +7.187 |
Commands | +6.853 |
enaries | +6.701 |
assemblies | +6.669 |
doors | +6.606 |
Neg logit contributions | |
paed | -6.416 |
neurot | -5.623 |
Australian | -5.522 |
piracy | -5.507 |
unethical | -5.475 |
Token | also |
Token ID | 635 |
Feature activation | +2.13e+01 |
Pos logit contributions | |
unity | +27.374 |
doors | +25.538 |
assemblies | +25.090 |
prayers | +24.837 |
isans | +24.006 |
Neg logit contributions | |
paed | -18.008 |
piracy | -15.597 |
HSBC | -15.294 |
ITV | -15.112 |
neurot | -14.815 |
Token | become |
Token ID | 1716 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
unity | +20.057 |
doors | +18.802 |
assemblies | +18.474 |
prayers | +18.172 |
Commands | +17.988 |
Neg logit contributions | |
paed | -17.053 |
piracy | -15.052 |
HSBC | -14.645 |
ITV | -14.642 |
neurot | -14.466 |
Token | aware |
Token ID | 3910 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
unity | +12.562 |
doors | +11.754 |
Commands | +11.719 |
assemblies | +11.714 |
isans | +11.548 |
Neg logit contributions | |
paed | -10.879 |
neurot | -9.460 |
piracy | -9.448 |
HSBC | -9.445 |
ITV | -9.263 |
Token | of |
Token ID | 286 |
Feature activation | +9.04e+00 |
Pos logit contributions | |
unity | +10.665 |
isans | +9.751 |
Commands | +9.730 |
doors | +9.697 |
assemblies | +9.672 |
Neg logit contributions | |
paed | -13.089 |
neurot | -11.840 |
HSBC | -11.740 |
Australian | -11.593 |
unethical | -11.529 |
Token | who |
Token ID | 508 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
unity | +9.657 |
Commands | +9.027 |
assemblies | +8.957 |
doors | +8.956 |
prayers | +8.819 |
Neg logit contributions | |
paed | -8.633 |
neurot | -7.706 |
HSBC | -7.650 |
Australian | -7.454 |
piracy | -7.443 |
Token | different |
Token ID | 1180 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
unity | +10.540 |
Commands | +10.290 |
assemblies | +10.011 |
enaries | +9.853 |
Rules | +9.792 |
Neg logit contributions | |
paed | -7.441 |
neurot | -6.454 |
unethical | -6.348 |
piracy | -6.317 |
Australian | -6.211 |
Token | political |
Token ID | 1964 |
Feature activation | +8.58e+00 |
Pos logit contributions | |
Commands | +11.690 |
unity | +11.627 |
assemblies | +11.279 |
doors | +10.780 |
enaries | +10.675 |
Neg logit contributions | |
paed | -11.147 |
neurot | -9.999 |
unethical | -9.900 |
piracy | -9.841 |
HSBC | -9.700 |
Token | parties |
Token ID | 4671 |
Feature activation | +9.35e+00 |
Pos logit contributions | |
unity | +6.983 |
Commands | +6.767 |
assemblies | +6.504 |
doors | +6.173 |
prayers | +6.165 |
Neg logit contributions | |
paed | -10.489 |
neurot | -9.678 |
Australian | -9.504 |
unethical | -9.480 |
HSBC | -9.458 |
Token | participated |
Token ID | 14888 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
unity | +9.134 |
Commands | +8.635 |
assemblies | +8.545 |
enaries | +8.378 |
prayers | +8.260 |
Neg logit contributions | |
paed | -9.684 |
neurot | -8.738 |
piracy | -8.642 |
unethical | -8.597 |
Australian | -8.575 |
Token | in |
Token ID | 287 |
Feature activation | +8.79e+00 |
Pos logit contributions | |
unity | +10.560 |
Commands | +10.133 |
enaries | +9.989 |
assemblies | +9.920 |
prayers | +9.775 |
Neg logit contributions | |
paed | -12.601 |
neurot | -11.425 |
piracy | -11.256 |
HSBC | -11.197 |
Australian | -11.146 |
Token | these |
Token ID | 777 |
Feature activation | +3.03e+01 |
Pos logit contributions | |
unity | +9.337 |
Commands | +8.857 |
assemblies | +8.755 |
enaries | +8.706 |
doors | +8.550 |
Neg logit contributions | |
paed | -8.575 |
neurot | -7.641 |
Australian | -7.480 |
piracy | -7.476 |
unethical | -7.428 |
Token | meetings |
Token ID | 8292 |
Feature activation | +6.58e+00 |
Pos logit contributions | |
assemblies | +28.424 |
unity | +27.781 |
Commands | +27.109 |
doors | +26.536 |
prayers | +26.421 |
Neg logit contributions | |
paed | -18.009 |
piracy | -16.228 |
HSBC | -15.583 |
neurot | -15.508 |
ITV | -15.043 |
Token | and |
Token ID | 290 |
Feature activation | +3.01e+01 |
Pos logit contributions | |
unity | +6.825 |
Commands | +6.597 |
enaries | +6.426 |
assemblies | +6.413 |
Rules | +6.314 |
Neg logit contributions | |
paed | -6.732 |
neurot | -6.014 |
Australian | -5.884 |
piracy | -5.876 |
HSBC | -5.837 |
Token | they |
Token ID | 484 |
Feature activation | +2.57e+01 |
Pos logit contributions | |
unity | +30.230 |
assemblies | +29.056 |
Commands | +28.675 |
prayers | +28.303 |
doors | +27.780 |
Neg logit contributions | |
paed | -15.367 |
piracy | -13.451 |
unethical | -12.696 |
neurot | -12.671 |
HSBC | -12.439 |
Token | have |
Token ID | 423 |
Feature activation | +2.80e+01 |
Pos logit contributions | |
unity | +23.485 |
Commands | +22.181 |
assemblies | +21.833 |
prayers | +21.353 |
doors | +21.342 |
Neg logit contributions | |
paed | -18.421 |
piracy | -16.901 |
unethical | -15.940 |
ITV | -15.877 |
HSBC | -15.787 |
Token | submitted |
Token ID | 8948 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
unity | +26.288 |
assemblies | +24.438 |
prayers | +24.064 |
Commands | +24.025 |
doors | +23.514 |
Neg logit contributions | |
paed | -17.667 |
piracy | -16.309 |
ITV | -15.503 |
unethical | -15.058 |
HSBC | -14.994 |
Token | Under |
Token ID | 4698 |
Feature activation | -3.96e+00 |
Pos logit contributions | |
paed | +2.777 |
Australian | +2.455 |
neurot | +2.443 |
HSBC | +2.396 |
piracy | +2.382 |
Neg logit contributions | |
unity | -3.242 |
Commands | -3.148 |
aturdays | -3.104 |
enaries | -3.083 |
assemblies | -3.046 |
Token | : |
Token ID | 25 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
paed | +3.916 |
Australian | +3.516 |
neurot | +3.482 |
HSBC | +3.428 |
unethical | +3.384 |
Neg logit contributions | |
unity | -4.378 |
aturdays | -4.259 |
Commands | -4.164 |
enaries | -4.113 |
endas | -4.059 |
Token | c |
Token ID | 269 |
Feature activation | +9.78e+00 |
Pos logit contributions | |
paed | +2.658 |
Australian | +2.362 |
neurot | +2.350 |
HSBC | +2.308 |
piracy | +2.297 |
Neg logit contributions | |
unity | -3.074 |
Commands | -2.972 |
aturdays | -2.954 |
enaries | -2.930 |
endas | -2.886 |
Token | bp |
Token ID | 46583 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
unity | +9.956 |
Commands | +9.589 |
enaries | +9.485 |
aturdays | +9.455 |
Rules | +9.396 |
Neg logit contributions | |
paed | -9.799 |
neurot | -8.744 |
Australian | -8.600 |
unethical | -8.537 |
HSBC | -8.433 |
Token | , |
Token ID | 11 |
Feature activation | -2.93e+00 |
Pos logit contributions | |
unity | +1.274 |
Commands | +1.234 |
aturdays | +1.210 |
enaries | +1.205 |
Rules | +1.190 |
Neg logit contributions | |
paed | -1.202 |
neurot | -1.064 |
Australian | -1.057 |
HSBC | -1.041 |
unethical | -1.040 |
Token | d |
Token ID | 288 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
paed | +2.879 |
Australian | +2.538 |
neurot | +2.538 |
HSBC | +2.495 |
piracy | +2.487 |
Neg logit contributions | |
unity | -3.246 |
Commands | -3.161 |
aturdays | -3.141 |
enaries | -3.113 |
Rules | -3.066 |
Token | hs |
Token ID | 11994 |
Feature activation | +3.17e+00 |
Pos logit contributions | |
unity | +1.695 |
Commands | +1.643 |
aturdays | +1.609 |
enaries | +1.604 |
Rules | +1.579 |
Neg logit contributions | |
paed | -1.794 |
neurot | -1.601 |
Australian | -1.591 |
unethical | -1.567 |
HSBC | -1.566 |
Token | , |
Token ID | 11 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
unity | +3.389 |
Commands | +3.285 |
enaries | +3.202 |
aturdays | +3.199 |
Rules | +3.174 |
Neg logit contributions | |
paed | -3.261 |
neurot | -2.891 |
Australian | -2.861 |
unethical | -2.829 |
HSBC | -2.819 |
Token | do |
Token ID | 466 |
Feature activation | +9.83e+00 |
Pos logit contributions | |
unity | +3.094 |
Commands | +2.980 |
enaries | +2.908 |
aturdays | +2.907 |
assemblies | +2.877 |
Neg logit contributions | |
paed | -2.543 |
neurot | -2.232 |
Australian | -2.208 |
unethical | -2.180 |
HSBC | -2.167 |
Token | j |
Token ID | 73 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
unity | +10.408 |
Commands | +9.933 |
aturdays | +9.790 |
enaries | +9.709 |
Rules | +9.694 |
Neg logit contributions | |
paed | -9.566 |
neurot | -8.388 |
Australian | -8.326 |
unethical | -8.211 |
ITV | -8.118 |
Token | , |
Token ID | 11 |
Feature activation | -5.52e-01 |
Pos logit contributions | |
unity | +1.349 |
Commands | +1.306 |
aturdays | +1.280 |
enaries | +1.276 |
Rules | +1.259 |
Neg logit contributions | |
paed | -1.282 |
neurot | -1.136 |
Australian | -1.128 |
unethical | -1.111 |
HSBC | -1.110 |
Token | said |
Token ID | 531 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
unity | +5.961 |
Commands | +5.724 |
enaries | +5.548 |
doors | +5.447 |
assemblies | +5.441 |
Neg logit contributions | |
paed | -6.822 |
neurot | -6.053 |
Australian | -6.011 |
piracy | -5.991 |
unethical | -5.967 |
Token | � |
Token ID | 564 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
unity | +22.662 |
prayers | +21.379 |
Commands | +20.878 |
doors | +20.689 |
assemblies | +20.270 |
Neg logit contributions | |
paed | -17.368 |
neurot | -15.178 |
HSBC | -14.918 |
unethical | -14.621 |
ITV | -14.515 |
Token | � |
Token ID | 250 |
Feature activation | -7.74e-01 |
Pos logit contributions | |
paed | +1.400 |
neurot | +1.225 |
Australian | +1.220 |
HSBC | +1.197 |
unethical | +1.192 |
Neg logit contributions | |
unity | -1.831 |
Commands | -1.775 |
aturdays | -1.766 |
enaries | -1.745 |
assemblies | -1.722 |
Token | Of |
Token ID | 5189 |
Feature activation | +9.29e+00 |
Pos logit contributions | |
paed | +0.894 |
neurot | +0.807 |
Australian | +0.803 |
HSBC | +0.791 |
unethical | +0.791 |
Neg logit contributions | |
unity | -0.730 |
Commands | -0.705 |
aturdays | -0.689 |
enaries | -0.687 |
assemblies | -0.675 |
Token | course |
Token ID | 1781 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
unity | +7.283 |
Commands | +6.802 |
enaries | +6.556 |
doors | +6.477 |
prayers | +6.471 |
Neg logit contributions | |
paed | -11.537 |
neurot | -10.601 |
HSBC | -10.457 |
Australian | -10.371 |
unethical | -10.350 |
Token | not |
Token ID | 407 |
Feature activation | +5.22e+00 |
Pos logit contributions | |
unity | +17.765 |
Commands | +16.733 |
doors | +16.582 |
prayers | +16.411 |
enaries | +16.265 |
Neg logit contributions | |
paed | -16.369 |
neurot | -14.721 |
HSBC | -14.185 |
unethical | -14.121 |
Australian | -14.120 |
Token | ! |
Token ID | 0 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
unity | +5.342 |
Commands | +5.116 |
enaries | +5.025 |
aturdays | +4.997 |
Rules | +4.920 |
Neg logit contributions | |
paed | -5.498 |
neurot | -4.894 |
Australian | -4.827 |
HSBC | -4.811 |
unethical | -4.773 |
Token | That |
Token ID | 1320 |
Feature activation | +6.48e+00 |
Pos logit contributions | |
Commands | +11.883 |
unity | +11.857 |
Rules | +11.060 |
doors | +11.007 |
prayers | +10.957 |
Neg logit contributions | |
paed | -12.109 |
neurot | -10.896 |
unethical | -10.664 |
piracy | -10.442 |
commercially | -10.286 |
Token | is |
Token ID | 318 |
Feature activation | -3.73e+00 |
Pos logit contributions | |
unity | +6.767 |
Commands | +6.466 |
enaries | +6.305 |
aturdays | +6.290 |
prayers | +6.215 |
Neg logit contributions | |
paed | -6.639 |
neurot | -5.972 |
Australian | -5.805 |
HSBC | -5.766 |
unethical | -5.727 |
Token | way |
Token ID | 835 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
paed | +3.846 |
Australian | +3.420 |
neurot | +3.410 |
unethical | +3.404 |
piracy | +3.359 |
Neg logit contributions | |
unity | -3.902 |
Commands | -3.830 |
aturdays | -3.793 |
enaries | -3.757 |
endas | -3.680 |
Token | too |
Token ID | 1165 |
Feature activation | -3.97e+00 |
Pos logit contributions | |
paed | +10.746 |
unethical | +9.904 |
Australian | +9.606 |
neurot | +9.534 |
piracy | +9.446 |
Neg logit contributions | |
unity | -12.955 |
Commands | -12.944 |
aturdays | -12.889 |
enaries | -12.763 |
assemblies | -12.453 |
Token | mother |
Token ID | 2802 |
Feature activation | +8.80e+00 |
Pos logit contributions | |
unity | +14.936 |
prayers | +14.000 |
doors | +13.933 |
assemblies | +13.809 |
Commands | +13.803 |
Neg logit contributions | |
paed | -10.360 |
neurot | -9.259 |
unethical | -9.216 |
HSBC | -9.200 |
piracy | -9.147 |
Token | die |
Token ID | 4656 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
unity | +9.808 |
Commands | +9.193 |
enaries | +9.126 |
prayers | +8.987 |
aturdays | +8.976 |
Neg logit contributions | |
paed | -8.093 |
neurot | -7.152 |
HSBC | -7.097 |
unethical | -7.092 |
Australian | -7.008 |
Token | . |
Token ID | 13 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
unity | +12.106 |
Commands | +11.394 |
prayers | +11.342 |
doors | +11.305 |
enaries | +11.281 |
Neg logit contributions | |
paed | -11.844 |
neurot | -10.702 |
unethical | -10.473 |
HSBC | -10.422 |
piracy | -10.373 |
Token | He |
Token ID | 679 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
unity | +4.477 |
Commands | +4.348 |
enaries | +4.225 |
aturdays | +4.211 |
Rules | +4.171 |
Neg logit contributions | |
paed | -3.990 |
neurot | -3.545 |
unethical | -3.480 |
piracy | -3.433 |
Australian | -3.427 |
Token | saw |
Token ID | 2497 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
unity | +12.591 |
Commands | +11.968 |
prayers | +11.800 |
enaries | +11.724 |
doors | +11.702 |
Neg logit contributions | |
paed | -12.882 |
unethical | -11.574 |
neurot | -11.485 |
piracy | -11.430 |
HSBC | -11.280 |
Token | everybody |
Token ID | 7288 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
unity | +18.792 |
prayers | +17.629 |
doors | +17.475 |
enaries | +17.108 |
Commands | +17.058 |
Neg logit contributions | |
paed | -12.008 |
neurot | -10.919 |
unethical | -10.598 |
HSBC | -10.251 |
piracy | -10.241 |
Token | getting |
Token ID | 1972 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
unity | +19.244 |
doors | +17.931 |
prayers | +17.853 |
enaries | +17.716 |
assemblies | +17.472 |
Neg logit contributions | |
paed | -13.979 |
neurot | -12.472 |
HSBC | -12.467 |
unethical | -12.250 |
piracy | -12.210 |
Token | killed |
Token ID | 2923 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
unity | +12.260 |
prayers | +11.442 |
doors | +11.411 |
Commands | +11.383 |
assemblies | +11.306 |
Neg logit contributions | |
paed | -9.578 |
neurot | -8.494 |
HSBC | -8.471 |
unethical | -8.470 |
piracy | -8.323 |
Token | . |
Token ID | 13 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
unity | +14.552 |
doors | +13.726 |
prayers | +13.687 |
enaries | +13.682 |
Commands | +13.412 |
Neg logit contributions | |
paed | -13.381 |
neurot | -11.905 |
HSBC | -11.870 |
unethical | -11.790 |
piracy | -11.655 |
Token | � |
Token ID | 447 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
unity | +11.956 |
Commands | +11.571 |
enaries | +11.120 |
doors | +11.102 |
prayers | +11.039 |
Neg logit contributions | |
paed | -11.090 |
neurot | -10.081 |
unethical | -9.987 |
piracy | -9.701 |
ageing | -9.515 |
Token | � |
Token ID | 251 |
Feature activation | -2.66e+00 |
Pos logit contributions | |
unity | +2.288 |
Commands | +2.218 |
aturdays | +2.177 |
enaries | +2.166 |
Rules | +2.141 |
Neg logit contributions | |
paed | -1.953 |
neurot | -1.721 |
Australian | -1.706 |
HSBC | -1.675 |
unethical | -1.675 |
Token | + |
Token ID | 10 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
unity | +10.078 |
Commands | +9.647 |
enaries | +9.578 |
assemblies | +9.328 |
Rules | +9.325 |
Neg logit contributions | |
paed | -9.010 |
neurot | -8.055 |
unethical | -7.753 |
Australian | -7.725 |
HSBC | -7.641 |
Token | 30 |
Token ID | 1270 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
unity | +10.714 |
Commands | +10.231 |
enaries | +10.088 |
Rules | +10.044 |
aturdays | +9.940 |
Neg logit contributions | |
paed | -12.271 |
neurot | -11.031 |
unethical | -10.754 |
Australian | -10.733 |
piracy | -10.613 |
Token | : |
Token ID | 25 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
unity | +10.260 |
Commands | +9.932 |
enaries | +9.831 |
Rules | +9.603 |
assemblies | +9.596 |
Neg logit contributions | |
paed | -9.889 |
neurot | -8.830 |
unethical | -8.624 |
Australian | -8.540 |
HSBC | -8.450 |
Token | 20 |
Token ID | 1238 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
unity | +13.396 |
Commands | +13.081 |
Rules | +12.782 |
enaries | +12.371 |
doors | +12.291 |
Neg logit contributions | |
paed | -18.502 |
neurot | -16.439 |
unethical | -16.303 |
piracy | -16.087 |
ageing | -15.763 |
Token | / |
Token ID | 14 |
Feature activation | +4.21e+00 |
Pos logit contributions | |
unity | +10.464 |
Commands | +9.970 |
enaries | +9.915 |
Rules | +9.577 |
assemblies | +9.560 |
Neg logit contributions | |
paed | -11.729 |
neurot | -10.565 |
unethical | -10.221 |
Australian | -10.160 |
piracy | -10.099 |
Token | 3000 |
Token ID | 23924 |
Feature activation | +8.12e+00 |
Pos logit contributions | |
unity | +3.956 |
Commands | +3.813 |
aturdays | +3.739 |
enaries | +3.735 |
Rules | +3.686 |
Neg logit contributions | |
paed | -4.865 |
neurot | -4.360 |
Australian | -4.315 |
unethical | -4.283 |
HSBC | -4.255 |
Token | + |
Token ID | 10 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
unity | +8.741 |
Commands | +8.372 |
enaries | +8.314 |
assemblies | +8.130 |
Rules | +8.114 |
Neg logit contributions | |
paed | -7.988 |
neurot | -7.050 |
unethical | -6.872 |
Australian | -6.834 |
piracy | -6.743 |
Token | 30 |
Token ID | 1270 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
Rules | +10.548 |
unity | +10.462 |
Commands | +10.212 |
enaries | +9.947 |
isans | +9.797 |
Neg logit contributions | |
paed | -17.503 |
unethical | -15.909 |
neurot | -15.894 |
piracy | -15.658 |
ageing | -15.437 |
Token | : |
Token ID | 25 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
unity | +13.104 |
Commands | +12.595 |
enaries | +12.576 |
Rules | +12.243 |
assemblies | +12.110 |
Neg logit contributions | |
paed | -15.117 |
neurot | -13.632 |
unethical | -13.359 |
Australian | -13.240 |
HSBC | -13.028 |
Token | 900 |
Token ID | 12865 |
Feature activation | +7.27e+00 |
Pos logit contributions | |
Rules | +11.040 |
unity | +10.992 |
Commands | +10.831 |
enaries | +10.292 |
isans | +10.238 |
Neg logit contributions | |
paed | -18.178 |
neurot | -16.414 |
unethical | -16.394 |
piracy | -16.186 |
commercially | -15.915 |
Token | + |
Token ID | 10 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
unity | +7.709 |
Commands | +7.419 |
enaries | +7.299 |
aturdays | +7.212 |
Rules | +7.182 |
Neg logit contributions | |
paed | -7.283 |
neurot | -6.532 |
unethical | -6.330 |
Australian | -6.298 |
HSBC | -6.229 |
Token | bike |
Token ID | 7161 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
unity | +6.149 |
Commands | +5.880 |
doors | +5.785 |
assemblies | +5.774 |
aturdays | +5.694 |
Neg logit contributions | |
paed | -5.590 |
neurot | -4.966 |
Australian | -4.872 |
HSBC | -4.849 |
unethical | -4.839 |
Token | cannot |
Token ID | 2314 |
Feature activation | -4.32e+00 |
Pos logit contributions | |
paed | +1.464 |
neurot | +1.295 |
Australian | +1.290 |
unethical | +1.266 |
HSBC | +1.265 |
Neg logit contributions | |
unity | -1.614 |
Commands | -1.568 |
aturdays | -1.552 |
enaries | -1.537 |
Rules | -1.517 |
Token | ," |
Token ID | 553 |
Feature activation | +6.13e+00 |
Pos logit contributions | |
paed | +3.615 |
Australian | +3.128 |
neurot | +3.106 |
piracy | +3.032 |
HSBC | +3.022 |
Neg logit contributions | |
unity | -5.346 |
Commands | -5.242 |
aturdays | -5.219 |
Rules | -5.127 |
enaries | -5.106 |
Token | he |
Token ID | 339 |
Feature activation | +4.25e+00 |
Pos logit contributions | |
unity | +7.920 |
Commands | +7.621 |
enaries | +7.496 |
aturdays | +7.467 |
doors | +7.438 |
Neg logit contributions | |
paed | -4.716 |
neurot | -4.068 |
unethical | -3.933 |
Australian | -3.907 |
piracy | -3.890 |
Token | said |
Token ID | 531 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
unity | +4.023 |
Commands | +3.858 |
enaries | +3.752 |
aturdays | +3.719 |
assemblies | +3.685 |
Neg logit contributions | |
paed | -4.847 |
neurot | -4.347 |
Australian | -4.298 |
unethical | -4.289 |
HSBC | -4.267 |
Token | . |
Token ID | 13 |
Feature activation | +5.25e+00 |
Pos logit contributions | |
unity | +9.732 |
Commands | +9.229 |
enaries | +9.104 |
doors | +9.041 |
assemblies | +9.020 |
Neg logit contributions | |
paed | -10.484 |
neurot | -9.374 |
Australian | -9.127 |
unethical | -9.118 |
HSBC | -9.079 |
Token |
|
Token ID | 198 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
unity | +5.420 |
Commands | +5.265 |
enaries | +5.132 |
aturdays | +5.107 |
endas | +5.048 |
Neg logit contributions | |
paed | -5.487 |
neurot | -4.900 |
unethical | -4.785 |
Australian | -4.775 |
piracy | -4.737 |
Token |
|
Token ID | 198 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
unity | +1.684 |
Commands | +1.635 |
enaries | +1.594 |
Rules | +1.582 |
aturdays | +1.580 |
Neg logit contributions | |
paed | -1.471 |
neurot | -1.296 |
Australian | -1.274 |
unethical | -1.269 |
piracy | -1.261 |
Token | But |
Token ID | 1537 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
unity | +3.897 |
Commands | +3.778 |
Rules | +3.757 |
enaries | +3.718 |
aturdays | +3.715 |
Neg logit contributions | |
paed | -3.960 |
neurot | -3.529 |
Australian | -3.479 |
unethical | -3.455 |
piracy | -3.430 |
Token | the |
Token ID | 262 |
Feature activation | -6.87e+00 |
Pos logit contributions | |
unity | +2.039 |
Commands | +1.974 |
aturdays | +1.944 |
enaries | +1.937 |
assemblies | +1.913 |
Neg logit contributions | |
paed | -1.486 |
neurot | -1.295 |
Australian | -1.277 |
unethical | -1.256 |
HSBC | -1.254 |
Token | bike |
Token ID | 7161 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
paed | +7.007 |
Australian | +6.248 |
neurot | +6.138 |
HSBC | +6.049 |
unethical | +6.038 |
Neg logit contributions | |
unity | -7.115 |
Commands | -7.043 |
aturdays | -6.982 |
enaries | -6.950 |
endas | -6.890 |
Token | or |
Token ID | 393 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
paed | +4.188 |
Australian | +3.675 |
neurot | +3.663 |
piracy | +3.567 |
HSBC | +3.565 |
Neg logit contributions | |
unity | -5.066 |
Commands | -4.977 |
aturdays | -4.931 |
enaries | -4.872 |
endas | -4.825 |
Token | human |
Token ID | 1692 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
paed | +14.994 |
Australian | +13.692 |
neurot | +13.447 |
piracy | +13.363 |
commercially | +13.097 |
Neg logit contributions | |
aturdays | -11.063 |
enaries | -10.993 |
Commands | -10.946 |
Rules | -10.932 |
endas | -10.931 |
Token | intelligence |
Token ID | 4430 |
Feature activation | -6.72e+00 |
Pos logit contributions | |
paed | +11.614 |
neurot | +10.399 |
Australian | +10.366 |
piracy | +10.215 |
unethical | +10.173 |
Neg logit contributions | |
Commands | -9.455 |
aturdays | -9.450 |
unity | -9.399 |
endas | -9.345 |
enaries | -9.330 |
Token | , |
Token ID | 11 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
paed | +6.308 |
Australian | +5.569 |
neurot | +5.531 |
piracy | +5.406 |
HSBC | +5.377 |
Neg logit contributions | |
unity | -7.427 |
aturdays | -7.277 |
Commands | -7.261 |
enaries | -7.105 |
endas | -7.103 |
Token | incl |
Token ID | 13358 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
paed | +3.029 |
Australian | +2.679 |
neurot | +2.676 |
unethical | +2.614 |
HSBC | +2.613 |
Neg logit contributions | |
unity | -3.197 |
Commands | -3.109 |
aturdays | -3.082 |
enaries | -3.059 |
endas | -3.016 |
Token | ining |
Token ID | 3191 |
Feature activation | -6.52e+00 |
Pos logit contributions | |
paed | +0.227 |
neurot | +0.204 |
Australian | +0.202 |
HSBC | +0.199 |
unethical | +0.199 |
Neg logit contributions | |
unity | -0.198 |
Commands | -0.192 |
aturdays | -0.188 |
enaries | -0.187 |
Rules | -0.184 |
Token | them |
Token ID | 606 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
paed | +6.327 |
Australian | +5.642 |
neurot | +5.595 |
unethical | +5.465 |
HSBC | +5.440 |
Neg logit contributions | |
unity | -6.973 |
Commands | -6.923 |
aturdays | -6.884 |
enaries | -6.798 |
endas | -6.743 |
Token | in |
Token ID | 287 |
Feature activation | -6.62e+00 |
Pos logit contributions | |
unity | +1.867 |
Commands | +1.811 |
aturdays | +1.778 |
enaries | +1.775 |
Rules | +1.749 |
Neg logit contributions | |
paed | -1.555 |
neurot | -1.363 |
Australian | -1.352 |
HSBC | -1.333 |
unethical | -1.330 |
Token | the |
Token ID | 262 |
Feature activation | -4.24e+00 |
Pos logit contributions | |
paed | +6.733 |
Australian | +5.996 |
neurot | +5.967 |
unethical | +5.894 |
HSBC | +5.823 |
Neg logit contributions | |
unity | -6.786 |
Commands | -6.740 |
aturdays | -6.725 |
enaries | -6.677 |
endas | -6.541 |
Token | same |
Token ID | 976 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
paed | +5.706 |
neurot | +5.241 |
Australian | +5.237 |
unethical | +5.163 |
HSBC | +5.128 |
Neg logit contributions | |
unity | -3.081 |
Commands | -3.013 |
aturdays | -3.000 |
enaries | -2.960 |
endas | -2.881 |
Token | direction |
Token ID | 4571 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
unity | +1.569 |
Commands | +1.492 |
aturdays | +1.445 |
enaries | +1.440 |
assemblies | +1.417 |
Neg logit contributions | |
paed | -2.546 |
neurot | -2.318 |
Australian | -2.305 |
HSBC | -2.283 |
unethical | -2.272 |
Token | of |
Token ID | 286 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
unity | +11.298 |
Commands | +10.738 |
assemblies | +10.730 |
Rules | +10.469 |
enaries | +10.461 |
Neg logit contributions | |
paed | -10.914 |
unethical | -9.696 |
neurot | -9.687 |
Australian | -9.511 |
HSBC | -9.495 |
Token | the |
Token ID | 262 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
unity | +19.932 |
assemblies | +19.261 |
Commands | +19.258 |
doors | +18.491 |
prayers | +18.016 |
Neg logit contributions | |
paed | -13.822 |
neurot | -11.923 |
HSBC | -11.766 |
unethical | -11.744 |
piracy | -11.665 |
Token | GitHub |
Token ID | 21722 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
unity | +12.198 |
Commands | +11.751 |
assemblies | +11.587 |
enaries | +11.288 |
doors | +11.267 |
Neg logit contributions | |
paed | -8.798 |
neurot | -7.644 |
unethical | -7.475 |
piracy | -7.398 |
HSBC | -7.389 |
Token | dataset |
Token ID | 27039 |
Feature activation | +6.85e+00 |
Pos logit contributions | |
paed | +0.126 |
neurot | +0.109 |
Australian | +0.108 |
HSBC | +0.106 |
unethical | +0.105 |
Neg logit contributions | |
unity | -0.192 |
Commands | -0.187 |
aturdays | -0.184 |
enaries | -0.183 |
Rules | -0.181 |
Token | . |
Token ID | 13 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
unity | +7.146 |
Commands | +6.859 |
assemblies | +6.710 |
enaries | +6.689 |
Rules | +6.631 |
Neg logit contributions | |
paed | -6.963 |
neurot | -6.153 |
unethical | -6.103 |
Australian | -6.072 |
HSBC | -6.011 |
Token | I |
Token ID | 314 |
Feature activation | -4.60e+00 |
Pos logit contributions | |
Commands | +13.270 |
unity | +13.140 |
assemblies | +12.199 |
Rules | +12.152 |
aturdays | +12.023 |
Neg logit contributions | |
paed | -12.799 |
unethical | -11.151 |
neurot | -11.112 |
piracy | -11.014 |
Australian | -10.742 |
Token | did |
Token ID | 750 |
Feature activation | +7.83e+00 |
Pos logit contributions | |
paed | +4.827 |
neurot | +4.335 |
Australian | +4.291 |
HSBC | +4.240 |
unethical | +4.221 |
Neg logit contributions | |
unity | -4.659 |
aturdays | -4.521 |
Commands | -4.507 |
enaries | -4.481 |
endas | -4.356 |
Token | this |
Token ID | 428 |
Feature activation | +6.22e+00 |
Pos logit contributions | |
unity | +8.187 |
Commands | +7.812 |
assemblies | +7.554 |
enaries | +7.530 |
Rules | +7.493 |
Neg logit contributions | |
paed | -7.926 |
neurot | -7.004 |
Australian | -6.897 |
unethical | -6.870 |
HSBC | -6.836 |
Token | by |
Token ID | 416 |
Feature activation | +5.94e+00 |
Pos logit contributions | |
unity | +6.627 |
Commands | +6.372 |
enaries | +6.191 |
assemblies | +6.141 |
aturdays | +6.133 |
Neg logit contributions | |
paed | -6.272 |
neurot | -5.507 |
Australian | -5.447 |
HSBC | -5.424 |
unethical | -5.386 |
Token | executing |
Token ID | 23710 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
unity | +6.770 |
Commands | +6.536 |
assemblies | +6.296 |
aturdays | +6.286 |
enaries | +6.265 |
Neg logit contributions | |
paed | -5.544 |
neurot | -4.833 |
Australian | -4.783 |
unethical | -4.766 |
HSBC | -4.746 |
Token | the |
Token ID | 262 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
unity | +15.590 |
Commands | +15.385 |
assemblies | +14.492 |
Rules | +14.193 |
doors | +14.149 |
Neg logit contributions | |
paed | -12.937 |
neurot | -11.147 |
unethical | -11.012 |
Australian | -10.963 |
HSBC | -10.954 |
Token | as |
Token ID | 355 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
paed | +3.986 |
Australian | +3.577 |
neurot | +3.524 |
HSBC | +3.448 |
piracy | +3.405 |
Neg logit contributions | |
unity | -4.902 |
aturdays | -4.886 |
Commands | -4.802 |
enaries | -4.713 |
endas | -4.698 |
Token | updates |
Token ID | 5992 |
Feature activation | -8.94e-01 |
Pos logit contributions | |
unity | +7.407 |
Commands | +6.960 |
assemblies | +6.662 |
doors | +6.642 |
prayers | +6.487 |
Neg logit contributions | |
paed | -15.404 |
neurot | -14.138 |
unethical | -14.108 |
HSBC | -13.873 |
piracy | -13.815 |
Token | regarding |
Token ID | 5115 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
paed | +0.836 |
neurot | +0.734 |
Australian | +0.732 |
HSBC | +0.715 |
unethical | +0.714 |
Neg logit contributions | |
unity | -1.039 |
Commands | -1.010 |
aturdays | -1.004 |
enaries | -0.991 |
Rules | -0.977 |
Token | the |
Token ID | 262 |
Feature activation | +9.01e-01 |
Pos logit contributions | |
paed | +7.844 |
Australian | +7.239 |
neurot | +6.786 |
HSBC | +6.712 |
NZ | +6.563 |
Neg logit contributions | |
aturdays | -14.518 |
enaries | -13.392 |
endars | -13.359 |
unity | -13.357 |
Commands | -13.293 |
Token | future |
Token ID | 2003 |
Feature activation | +9.39e+00 |
Pos logit contributions | |
unity | +0.961 |
Commands | +0.927 |
aturdays | +0.907 |
enaries | +0.906 |
Rules | +0.893 |
Neg logit contributions | |
paed | -0.934 |
neurot | -0.829 |
Australian | -0.823 |
HSBC | -0.813 |
unethical | -0.810 |
Token | of |
Token ID | 286 |
Feature activation | -7.62e+00 |
Pos logit contributions | |
unity | +7.195 |
Commands | +6.740 |
Rules | +6.411 |
doors | +6.351 |
isans | +6.341 |
Neg logit contributions | |
paed | -11.806 |
neurot | -10.791 |
unethical | -10.706 |
piracy | -10.582 |
HSBC | -10.385 |
Token | Cl |
Token ID | 1012 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
paed | +7.399 |
Australian | +6.757 |
neurot | +6.614 |
unethical | +6.482 |
HSBC | +6.468 |
Neg logit contributions | |
unity | -7.880 |
aturdays | -7.801 |
enaries | -7.739 |
Commands | -7.732 |
endas | -7.643 |
Token | arity |
Token ID | 6806 |
Feature activation | -1.93e+00 |
Pos logit contributions | |
unity | +5.728 |
isans | +4.831 |
enaries | +4.815 |
endas | +4.501 |
Commands | +4.499 |
Neg logit contributions | |
paed | -21.069 |
neurot | -19.511 |
unethical | -19.217 |
Australian | -19.195 |
piracy | -19.154 |
Token | Gaming |
Token ID | 14426 |
Feature activation | -5.15e+00 |
Pos logit contributions | |
paed | +1.626 |
Australian | +1.418 |
neurot | +1.410 |
HSBC | +1.383 |
unethical | +1.367 |
Neg logit contributions | |
unity | -2.403 |
aturdays | -2.336 |
Commands | -2.326 |
enaries | -2.299 |
assemblies | -2.272 |
Token |
|
Token ID | 198 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
paed | +5.106 |
Australian | +4.592 |
neurot | +4.556 |
unethical | +4.442 |
piracy | +4.425 |
Neg logit contributions | |
unity | -5.468 |
aturdays | -5.346 |
enaries | -5.336 |
Commands | -5.314 |
isans | -5.230 |
Token |
|
Token ID | 198 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
paed | +8.744 |
Australian | +8.512 |
HSBC | +7.744 |
NZ | +7.694 |
neurot | +7.395 |
Neg logit contributions | |
aturdays | -21.549 |
endars | -20.011 |
unity | -19.707 |
enaries | -19.622 |
endas | -19.470 |
Token | en |
Token ID | 268 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
paed | +2.368 |
Australian | +2.115 |
neurot | +2.094 |
unethical | +2.053 |
HSBC | +2.051 |
Neg logit contributions | |
unity | -2.409 |
Commands | -2.339 |
aturdays | -2.312 |
enaries | -2.276 |
assemblies | -2.246 |
Token | comp |
Token ID | 5589 |
Feature activation | +4.09e+00 |
Pos logit contributions | |
paed | +1.544 |
neurot | +1.369 |
Australian | +1.367 |
HSBC | +1.340 |
piracy | +1.333 |
Neg logit contributions | |
unity | -1.676 |
Commands | -1.626 |
aturdays | -1.616 |
enaries | -1.586 |
Rules | -1.574 |
Token | assing |
Token ID | 19696 |
Feature activation | +4.45e+00 |
Pos logit contributions | |
unity | +3.157 |
Commands | +2.984 |
enaries | +2.955 |
aturdays | +2.883 |
endas | +2.868 |
Neg logit contributions | |
paed | -5.390 |
neurot | -4.939 |
unethical | -4.859 |
Australian | -4.852 |
piracy | -4.835 |
Token | stereotype |
Token ID | 31240 |
Feature activation | +9.78e-01 |
Pos logit contributions | |
unity | +5.133 |
Commands | +4.880 |
enaries | +4.737 |
assemblies | +4.721 |
aturdays | +4.681 |
Neg logit contributions | |
paed | -4.195 |
neurot | -3.709 |
unethical | -3.623 |
HSBC | -3.615 |
Australian | -3.592 |
Token | of |
Token ID | 286 |
Feature activation | -8.27e+00 |
Pos logit contributions | |
unity | +0.971 |
Commands | +0.936 |
aturdays | +0.916 |
enaries | +0.913 |
Rules | +0.899 |
Neg logit contributions | |
paed | -1.085 |
neurot | -0.973 |
Australian | -0.965 |
HSBC | -0.953 |
unethical | -0.952 |
Token | trou |
Token ID | 4057 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
paed | +8.485 |
Australian | +7.768 |
neurot | +7.458 |
piracy | +7.433 |
unethical | +7.327 |
Neg logit contributions | |
aturdays | -8.394 |
Commands | -8.229 |
unity | -8.185 |
enaries | -8.108 |
Rules | -8.052 |
Token | ser |
Token ID | 2655 |
Feature activation | +4.26e+00 |
Pos logit contributions | |
paed | +0.329 |
neurot | +0.286 |
Australian | +0.284 |
unethical | +0.278 |
HSBC | +0.278 |
Neg logit contributions | |
unity | -0.435 |
Commands | -0.423 |
aturdays | -0.417 |
enaries | -0.414 |
Rules | -0.410 |
Token | - |
Token ID | 12 |
Feature activation | -9.76e-01 |
Pos logit contributions | |
unity | +4.669 |
Commands | +4.483 |
enaries | +4.390 |
aturdays | +4.333 |
assemblies | +4.318 |
Neg logit contributions | |
paed | -4.233 |
neurot | -3.798 |
HSBC | -3.712 |
Australian | -3.692 |
unethical | -3.688 |
Token | w |
Token ID | 86 |
Feature activation | +6.79e+00 |
Pos logit contributions | |
paed | +1.095 |
neurot | +0.980 |
Australian | +0.977 |
unethical | +0.960 |
HSBC | +0.959 |
Neg logit contributions | |
unity | -0.954 |
Commands | -0.921 |
aturdays | -0.909 |
enaries | -0.896 |
Rules | -0.884 |
Token | earing |
Token ID | 6648 |
Feature activation | -9.05e+00 |
Pos logit contributions | |
unity | +5.823 |
Commands | +5.673 |
enaries | +5.671 |
aturdays | +5.554 |
endas | +5.501 |
Neg logit contributions | |
paed | -8.131 |
neurot | -7.449 |
unethical | -7.257 |
Australian | -7.209 |
piracy | -7.169 |
Token | , |
Token ID | 11 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
paed | +10.955 |
Australian | +10.130 |
neurot | +9.777 |
piracy | +9.748 |
unethical | +9.589 |
Neg logit contributions | |
aturdays | -7.447 |
unity | -7.263 |
Commands | -7.224 |
enaries | -7.109 |
Rules | -7.098 |
Token |
|
Token ID | 198 |
Feature activation | -5.97e+00 |
Pos logit contributions | |
paed | +5.773 |
Australian | +5.359 |
HSBC | +5.173 |
neurot | +5.094 |
NZ | +5.031 |
Neg logit contributions | |
unity | -6.702 |
aturdays | -6.637 |
enaries | -6.478 |
Commands | -6.341 |
endas | -6.332 |
Token |
|
Token ID | 198 |
Feature activation | -9.10e+00 |
Pos logit contributions | |
paed | +4.844 |
Australian | +4.383 |
HSBC | +4.221 |
neurot | +4.195 |
NZ | +4.094 |
Neg logit contributions | |
aturdays | -7.405 |
unity | -7.376 |
enaries | -7.133 |
Commands | -7.104 |
endas | -7.055 |
Token | That |
Token ID | 2504 |
Feature activation | -7.91e+00 |
Pos logit contributions | |
paed | +9.767 |
Australian | +8.927 |
neurot | +8.786 |
HSBC | +8.619 |
unethical | +8.546 |
Neg logit contributions | |
unity | -8.524 |
aturdays | -8.260 |
Commands | -8.195 |
enaries | -8.043 |
endas | -7.949 |
Token | seems |
Token ID | 2331 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
paed | +7.898 |
Australian | +7.047 |
neurot | +7.022 |
unethical | +6.893 |
HSBC | +6.773 |
Neg logit contributions | |
aturdays | -8.178 |
Commands | -8.124 |
unity | -8.039 |
enaries | -8.017 |
endas | -7.910 |
Token | to |
Token ID | 284 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
paed | +10.508 |
unethical | +9.547 |
neurot | +9.480 |
Australian | +9.463 |
piracy | +9.144 |
Neg logit contributions | |
aturdays | -12.893 |
Commands | -12.812 |
enaries | -12.631 |
unity | -12.617 |
endars | -12.336 |
Token | be |
Token ID | 307 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
paed | +14.325 |
Australian | +13.014 |
neurot | +12.723 |
HSBC | +12.389 |
leak | +12.210 |
Neg logit contributions | |
aturdays | -15.996 |
Commands | -15.986 |
enaries | -15.722 |
unity | -15.573 |
isans | -15.527 |
Token | the |
Token ID | 262 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
paed | +12.649 |
Australian | +11.709 |
piracy | +11.190 |
unethical | +11.186 |
HSBC | +11.145 |
Neg logit contributions | |
enaries | -13.552 |
aturdays | -13.412 |
Commands | -13.365 |
unity | -13.034 |
endars | -12.962 |
Token | case |
Token ID | 1339 |
Feature activation | -6.34e+00 |
Pos logit contributions | |
paed | +13.194 |
Australian | +12.280 |
neurot | +11.868 |
unethical | +11.682 |
HSBC | +11.594 |
Neg logit contributions | |
aturdays | -11.478 |
Commands | -11.353 |
enaries | -11.281 |
endas | -11.113 |
unity | -10.921 |
Token | with |
Token ID | 351 |
Feature activation | -1.73e+01 |
Pos logit contributions | |
paed | +6.416 |
Australian | +5.801 |
neurot | +5.694 |
HSBC | +5.653 |
unethical | +5.621 |
Neg logit contributions | |
unity | -6.568 |
Commands | -6.502 |
aturdays | -6.423 |
enaries | -6.314 |
endas | -6.310 |
Token | University |
Token ID | 2059 |
Feature activation | +3.90e+00 |
Pos logit contributions | |
paed | +19.662 |
Australian | +18.413 |
neurot | +17.611 |
HSBC | +17.475 |
unethical | +17.435 |
Neg logit contributions | |
aturdays | -12.979 |
enaries | -12.501 |
Commands | -12.317 |
endas | -12.212 |
endars | -12.083 |
Token | of |
Token ID | 286 |
Feature activation | -8.60e+00 |
Pos logit contributions | |
unity | +3.672 |
Commands | +3.520 |
enaries | +3.432 |
aturdays | +3.425 |
assemblies | +3.376 |
Neg logit contributions | |
paed | -4.454 |
neurot | -4.034 |
unethical | -3.958 |
Australian | -3.956 |
HSBC | -3.945 |
Token | systems |
Token ID | 3341 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
paed | +7.051 |
neurot | +6.415 |
Australian | +6.343 |
piracy | +6.194 |
unethical | +6.151 |
Neg logit contributions | |
unity | -7.319 |
aturdays | -7.247 |
Commands | -7.200 |
enaries | -7.030 |
endars | -7.015 |
Token | have |
Token ID | 423 |
Feature activation | +2.34e+00 |
Pos logit contributions | |
paed | +11.306 |
Australian | +10.391 |
neurot | +10.333 |
commercially | +10.233 |
HSBC | +9.997 |
Neg logit contributions | |
aturdays | -12.473 |
unity | -12.306 |
Commands | -12.093 |
Rules | -11.877 |
enaries | -11.843 |
Token | been |
Token ID | 587 |
Feature activation | +8.05e+00 |
Pos logit contributions | |
unity | +2.542 |
Commands | +2.451 |
enaries | +2.391 |
aturdays | +2.391 |
assemblies | +2.373 |
Neg logit contributions | |
paed | -2.365 |
neurot | -2.084 |
Australian | -2.068 |
HSBC | -2.045 |
unethical | -2.044 |
Token | installed |
Token ID | 6589 |
Feature activation | -7.63e+00 |
Pos logit contributions | |
unity | +7.855 |
Commands | +7.541 |
assemblies | +7.383 |
doors | +7.269 |
enaries | +7.206 |
Neg logit contributions | |
paed | -8.535 |
piracy | -7.492 |
neurot | -7.473 |
HSBC | -7.442 |
unethical | -7.418 |
Token | to |
Token ID | 284 |
Feature activation | -6.75e+00 |
Pos logit contributions | |
paed | +6.691 |
Australian | +5.987 |
neurot | +5.966 |
commercially | +5.937 |
HSBC | +5.744 |
Neg logit contributions | |
unity | -8.737 |
aturdays | -8.576 |
Commands | -8.532 |
enaries | -8.292 |
endas | -8.292 |
Token | reduce |
Token ID | 4646 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
paed | +6.028 |
neurot | +5.402 |
Australian | +5.379 |
commercially | +5.280 |
HSBC | +5.204 |
Neg logit contributions | |
aturdays | -7.706 |
unity | -7.622 |
Commands | -7.545 |
enaries | -7.431 |
Rules | -7.398 |
Token | sulfur |
Token ID | 37402 |
Feature activation | -6.60e+00 |
Pos logit contributions | |
paed | +24.937 |
neurot | +24.129 |
Australian | +23.768 |
leak | +23.376 |
commercially | +23.001 |
Neg logit contributions | |
aturdays | -16.128 |
endars | -15.525 |
Commands | -15.109 |
Rules | -15.056 |
endas | -14.924 |
Token | dioxide |
Token ID | 17556 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
paed | +6.311 |
neurot | +5.706 |
Australian | +5.626 |
piracy | +5.461 |
HSBC | +5.447 |
Neg logit contributions | |
unity | -7.078 |
Commands | -7.049 |
aturdays | -6.948 |
enaries | -6.851 |
Rules | -6.826 |
Token | emissions |
Token ID | 8971 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
paed | +13.158 |
neurot | +12.306 |
Australian | +11.935 |
piracy | +11.582 |
leak | +11.491 |
Neg logit contributions | |
aturdays | -13.668 |
Commands | -13.426 |
unity | -13.202 |
endas | -13.161 |
endars | -13.161 |
Token | . |
Token ID | 13 |
Feature activation | +3.78e+00 |
Pos logit contributions | |
paed | +12.009 |
neurot | +11.293 |
Australian | +11.104 |
commercially | +11.022 |
HSBC | +10.557 |
Neg logit contributions | |
unity | -15.669 |
aturdays | -15.395 |
Commands | -15.309 |
endars | -15.185 |
endas | -15.074 |
Token | The |
Token ID | 383 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
unity | +4.399 |
Commands | +4.327 |
enaries | +4.171 |
Rules | +4.137 |
aturdays | +4.134 |
Neg logit contributions | |
paed | -3.537 |
neurot | -3.056 |
unethical | -3.012 |
piracy | -2.992 |
Australian | -2.968 |
Token | t |
Token ID | 83 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
paed | +10.011 |
Australian | +9.073 |
neurot | +9.027 |
HSBC | +8.803 |
piracy | +8.701 |
Neg logit contributions | |
unity | -8.086 |
Commands | -7.911 |
aturdays | -7.721 |
enaries | -7.616 |
assemblies | -7.594 |
Token | rend |
Token ID | 10920 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
unity | +1.763 |
Commands | +1.691 |
aturdays | +1.663 |
enaries | +1.654 |
Rules | +1.622 |
Neg logit contributions | |
paed | -2.460 |
neurot | -2.230 |
Australian | -2.220 |
unethical | -2.193 |
HSBC | -2.188 |
Token | s |
Token ID | 82 |
Feature activation | -2.66e+00 |
Pos logit contributions | |
unity | +2.200 |
Commands | +2.127 |
aturdays | +2.090 |
enaries | +2.086 |
Rules | +2.055 |
Neg logit contributions | |
paed | -2.136 |
neurot | -1.896 |
Australian | -1.880 |
unethical | -1.856 |
HSBC | -1.854 |
Token | 01 |
Token ID | 486 |
Feature activation | -9.73e+00 |
Pos logit contributions | |
paed | +2.550 |
neurot | +2.253 |
Australian | +2.243 |
HSBC | +2.191 |
unethical | +2.183 |
Neg logit contributions | |
unity | -3.012 |
Commands | -2.926 |
aturdays | -2.872 |
enaries | -2.864 |
assemblies | -2.815 |
Token | . |
Token ID | 13 |
Feature activation | -9.07e+00 |
Pos logit contributions | |
paed | +8.962 |
Australian | +7.995 |
neurot | +7.956 |
HSBC | +7.762 |
piracy | +7.666 |
Neg logit contributions | |
unity | -10.402 |
Commands | -10.105 |
aturdays | -9.978 |
enaries | -9.835 |
assemblies | -9.682 |
Token | html |
Token ID | 6494 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
paed | +8.165 |
Australian | +7.403 |
HSBC | +7.321 |
neurot | +7.300 |
piracy | +6.981 |
Neg logit contributions | |
unity | -9.932 |
aturdays | -9.765 |
Commands | -9.626 |
enaries | -9.538 |
assemblies | -9.474 |
Token | . |
Token ID | 13 |
Feature activation | -1.82e+01 |
Pos logit contributions | |
paed | +20.727 |
Australian | +19.972 |
neurot | +19.297 |
HSBC | +19.065 |
UK | +18.685 |
Neg logit contributions | |
aturdays | -19.256 |
unity | -18.660 |
enaries | -18.194 |
Commands | -18.063 |
Rules | -17.919 |
Token | Jo |
Token ID | 5302 |
Feature activation | -4.99e+00 |
Pos logit contributions | |
paed | +17.687 |
Australian | +16.981 |
HSBC | +16.184 |
neurot | +16.162 |
NZ | +15.735 |
Neg logit contributions | |
aturdays | -15.639 |
unity | -15.060 |
enaries | -14.942 |
Rules | -14.370 |
assemblies | -14.362 |
Token | iner |
Token ID | 7274 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
paed | +4.671 |
Australian | +4.140 |
neurot | +4.058 |
HSBC | +4.038 |
unethical | +3.979 |
Neg logit contributions | |
unity | -5.670 |
Commands | -5.489 |
aturdays | -5.479 |
enaries | -5.422 |
assemblies | -5.348 |
Token | T |
Token ID | 309 |
Feature activation | -9.30e+00 |
Pos logit contributions | |
paed | +13.899 |
Australian | +12.626 |
HSBC | +12.408 |
neurot | +12.388 |
NZ | +12.163 |
Neg logit contributions | |
unity | -13.424 |
aturdays | -13.290 |
Commands | -12.860 |
enaries | -12.846 |
endas | -12.702 |
Token | . |
Token ID | 13 |
Feature activation | -1.68e+01 |
Pos logit contributions | |
paed | +8.828 |
neurot | +7.899 |
Australian | +7.848 |
HSBC | +7.671 |
unethical | +7.542 |
Neg logit contributions | |
unity | -9.919 |
Commands | -9.597 |
aturdays | -9.434 |
enaries | -9.321 |
Rules | -9.231 |
Token | to |
Token ID | 284 |
Feature activation | -1.78e+01 |
Pos logit contributions | |
paed | +16.120 |
commercially | +15.014 |
Australian | +15.002 |
neurot | +14.890 |
HSBC | +14.112 |
Neg logit contributions | |
aturdays | -21.312 |
endars | -20.709 |
endas | -20.444 |
Commands | -20.010 |
Rules | -19.973 |
Token | boast |
Token ID | 28020 |
Feature activation | -9.37e+00 |
Pos logit contributions | |
paed | +16.574 |
neurot | +15.915 |
commercially | +15.809 |
Australian | +15.318 |
dermat | +14.803 |
Neg logit contributions | |
aturdays | -15.231 |
endars | -15.220 |
Commands | -15.113 |
enaries | -15.112 |
Rules | -15.107 |
Token | ; |
Token ID | 26 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
paed | +8.937 |
Australian | +8.057 |
neurot | +8.046 |
commercially | +7.886 |
unethical | +7.733 |
Neg logit contributions | |
unity | -9.667 |
Commands | -9.581 |
aturdays | -9.472 |
enaries | -9.392 |
Rules | -9.362 |
Token | another |
Token ID | 1194 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
paed | +16.240 |
neurot | +15.401 |
Australian | +15.243 |
commercially | +14.789 |
unethical | +14.731 |
Neg logit contributions | |
enaries | -11.816 |
aturdays | -11.665 |
unity | -11.545 |
endas | -11.529 |
Commands | -11.511 |
Token | popular |
Token ID | 2968 |
Feature activation | -2.95e+01 |
Pos logit contributions | |
paed | +21.516 |
neurot | +20.612 |
Australian | +20.352 |
commercially | +19.853 |
unethical | +19.527 |
Neg logit contributions | |
endas | -14.212 |
enaries | -14.148 |
Commands | -13.850 |
aturdays | -13.824 |
endars | -13.778 |
Token | and |
Token ID | 290 |
Feature activation | -2.74e+01 |
Pos logit contributions | |
paed | +29.583 |
Australian | +28.821 |
neurot | +28.512 |
commercially | +28.081 |
NZ | +27.414 |
Neg logit contributions | |
enaries | -16.259 |
endas | -15.814 |
endars | -15.469 |
Commands | -15.398 |
aturdays | -15.103 |
Token | professionally |
Token ID | 28049 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
paed | +26.906 |
neurot | +26.055 |
commercially | +26.030 |
Australian | +25.787 |
unethical | +25.287 |
Neg logit contributions | |
enaries | -16.734 |
aturdays | -16.482 |
endas | -16.311 |
Commands | -16.206 |
endars | -15.929 |
Token | used |
Token ID | 973 |
Feature activation | -3.05e+01 |
Pos logit contributions | |
paed | +15.468 |
neurot | +14.377 |
Australian | +14.287 |
commercially | +14.080 |
unethical | +14.061 |
Neg logit contributions | |
aturdays | -13.357 |
Commands | -13.352 |
unity | -13.183 |
enaries | -13.046 |
endas | -13.042 |
Token | medical |
Token ID | 3315 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
paed | +29.542 |
Australian | +28.942 |
neurot | +28.744 |
commercially | +28.425 |
pharmaceutical | +27.923 |
Neg logit contributions | |
enaries | -17.033 |
endas | -16.732 |
aturdays | -16.300 |
endars | -16.231 |
Commands | -16.052 |
Token | alk |
Token ID | 32915 |
Feature activation | -3.17e+00 |
Pos logit contributions | |
paed | +23.006 |
neurot | +22.094 |
Australian | +21.607 |
pharmaceutical | +21.266 |
unethical | +21.029 |
Neg logit contributions | |
enaries | -16.522 |
aturdays | -15.733 |
Commands | -15.724 |
endas | -15.373 |
Rules | -15.118 |
Token | al |
Token ID | 282 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
paed | +3.020 |
neurot | +2.688 |
Australian | +2.677 |
HSBC | +2.598 |
piracy | +2.585 |
Neg logit contributions | |
unity | -3.591 |
Commands | -3.490 |
aturdays | -3.433 |
enaries | -3.411 |
Rules | -3.369 |
Token | really |
Token ID | 1107 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
paed | +23.417 |
piracy | +22.517 |
unethical | +22.473 |
commercially | +21.766 |
Australian | +21.628 |
Neg logit contributions | |
enaries | -16.521 |
aturdays | -16.493 |
endas | -15.959 |
unity | -15.659 |
endars | -15.512 |
Token | likely |
Token ID | 1884 |
Feature activation | -2.44e+01 |
Pos logit contributions | |
paed | +19.474 |
piracy | +18.614 |
unethical | +18.453 |
Australian | +17.858 |
commercially | +17.745 |
Neg logit contributions | |
aturdays | -16.024 |
enaries | -15.952 |
endas | -15.269 |
unity | -15.240 |
isans | -15.207 |
Token | that |
Token ID | 326 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
paed | +22.827 |
piracy | +21.382 |
Australian | +21.185 |
unethical | +20.639 |
commercially | +20.405 |
Neg logit contributions | |
aturdays | -17.793 |
enaries | -17.705 |
Commands | -17.074 |
endas | -16.977 |
unity | -16.966 |
Token | Amazon |
Token ID | 6186 |
Feature activation | -1.62e+01 |
Pos logit contributions | |
paed | +10.337 |
Australian | +9.345 |
piracy | +9.274 |
unethical | +9.136 |
neurot | +9.061 |
Neg logit contributions | |
unity | -10.101 |
aturdays | -10.093 |
enaries | -10.073 |
Commands | -9.747 |
endas | -9.747 |
Token | is |
Token ID | 318 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
paed | +16.755 |
piracy | +15.383 |
Australian | +15.282 |
neurot | +15.142 |
unethical | +14.937 |
Neg logit contributions | |
unity | -13.165 |
aturdays | -13.092 |
enaries | -12.638 |
endas | -12.301 |
Commands | -12.245 |
Token | going |
Token ID | 1016 |
Feature activation | -2.42e+01 |
Pos logit contributions | |
paed | +18.503 |
piracy | +16.935 |
Australian | +16.733 |
neurot | +16.680 |
unethical | +16.637 |
Neg logit contributions | |
aturdays | -16.659 |
enaries | -15.903 |
unity | -15.812 |
Commands | -15.197 |
isans | -15.156 |
Token | to |
Token ID | 284 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
paed | +22.687 |
piracy | +20.714 |
viral | +20.646 |
Australian | +20.604 |
unethical | +20.456 |
Neg logit contributions | |
aturdays | -17.439 |
Commands | -17.183 |
unity | -16.772 |
isans | -16.633 |
endars | -16.464 |
Token | go |
Token ID | 467 |
Feature activation | -2.45e+01 |
Pos logit contributions | |
paed | +19.276 |
commercially | +17.938 |
piracy | +17.929 |
Australian | +17.747 |
leak | +17.631 |
Neg logit contributions | |
aturdays | -17.773 |
enaries | -16.878 |
isans | -16.834 |
endas | -16.608 |
endars | -16.480 |
Token | all |
Token ID | 477 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
paed | +24.382 |
piracy | +23.019 |
Australian | +22.819 |
viral | +22.413 |
unethical | +22.330 |
Neg logit contributions | |
aturdays | -15.970 |
endars | -15.749 |
Commands | -15.659 |
endas | -15.537 |
unity | -15.466 |
Token | 1984 |
Token ID | 12844 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
paed | +23.787 |
piracy | +22.836 |
Australian | +22.628 |
unethical | +22.037 |
commercially | +21.709 |
Neg logit contributions | |
aturdays | -15.780 |
enaries | -14.660 |
Commands | -14.538 |
unity | -14.518 |
isans | -14.322 |
Token | on |
Token ID | 319 |
Feature activation | -1.62e+01 |
Pos logit contributions | |
paed | +14.290 |
piracy | +13.065 |
Australian | +13.045 |
neurot | +12.833 |
unethical | +12.686 |
Neg logit contributions | |
unity | -11.569 |
aturdays | -11.384 |
Commands | -11.209 |
endas | -11.189 |
enaries | -11.179 |
Token | of |
Token ID | 286 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
paed | +28.490 |
Australian | +27.838 |
HSBC | +26.240 |
Malaysian | +26.010 |
UK | +25.880 |
Neg logit contributions | |
aturdays | -16.783 |
endars | -16.751 |
enaries | -16.470 |
endas | -16.361 |
Commands | -15.851 |
Token | Yahoo |
Token ID | 16551 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
paed | +19.307 |
Australian | +17.982 |
HSBC | +17.395 |
ITV | +17.024 |
NZ | +16.999 |
Neg logit contributions | |
aturdays | -15.023 |
enaries | -14.487 |
isans | -14.269 |
endars | -14.222 |
Commands | -14.184 |
Token | 's |
Token ID | 338 |
Feature activation | -8.10e+00 |
Pos logit contributions | |
paed | +11.263 |
Australian | +9.967 |
neurot | +9.771 |
HSBC | +9.586 |
piracy | +9.582 |
Neg logit contributions | |
aturdays | -12.884 |
unity | -12.689 |
Commands | -12.594 |
enaries | -12.566 |
endas | -12.265 |
Token | biggest |
Token ID | 4094 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
paed | +9.193 |
Australian | +8.370 |
neurot | +8.170 |
HSBC | +8.130 |
unethical | +8.115 |
Neg logit contributions | |
unity | -7.279 |
aturdays | -7.267 |
Commands | -7.165 |
enaries | -7.081 |
endas | -7.031 |
Token | shareholders |
Token ID | 19195 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
paed | +21.199 |
Australian | +19.795 |
piracy | +19.062 |
unethical | +18.935 |
commercially | +18.847 |
Neg logit contributions | |
aturdays | -11.825 |
enaries | -11.535 |
endars | -11.480 |
endas | -11.470 |
unity | -11.312 |
Token | , |
Token ID | 11 |
Feature activation | -2.62e+01 |
Pos logit contributions | |
paed | +20.905 |
Australian | +19.336 |
HSBC | +19.199 |
NZ | +18.427 |
ITV | +18.419 |
Neg logit contributions | |
aturdays | -15.953 |
unity | -15.455 |
enaries | -15.281 |
endas | -15.240 |
Commands | -15.065 |
Token | Bill |
Token ID | 3941 |
Feature activation | -5.33e+00 |
Pos logit contributions | |
paed | +26.892 |
Australian | +25.619 |
HSBC | +24.764 |
NZ | +24.166 |
ITV | +24.084 |
Neg logit contributions | |
aturdays | -15.806 |
enaries | -15.538 |
endas | -15.338 |
endars | -15.175 |
isans | -14.794 |
Token | Miller |
Token ID | 7920 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
paed | +4.382 |
Australian | +3.868 |
neurot | +3.728 |
HSBC | +3.694 |
NZ | +3.615 |
Neg logit contributions | |
unity | -6.672 |
aturdays | -6.554 |
Commands | -6.414 |
enaries | -6.362 |
Rules | -6.322 |
Token | , |
Token ID | 11 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
paed | +12.699 |
Australian | +11.370 |
HSBC | +11.183 |
neurot | +10.921 |
NZ | +10.820 |
Neg logit contributions | |
unity | -14.031 |
aturdays | -13.814 |
enaries | -13.658 |
Commands | -13.538 |
isans | -13.320 |
Token | an |
Token ID | 281 |
Feature activation | -3.58e+01 |
Pos logit contributions | |
paed | +11.183 |
Australian | +10.113 |
HSBC | +9.943 |
neurot | +9.889 |
NZ | +9.670 |
Neg logit contributions | |
aturdays | -9.823 |
unity | -9.791 |
enaries | -9.686 |
Commands | -9.605 |
endas | -9.471 |
Token | asset |
Token ID | 11171 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
Australian | +32.752 |
paed | +31.607 |
HSBC | +30.452 |
ageing | +29.649 |
NZ | +29.633 |
Neg logit contributions | |
enaries | -20.170 |
endars | -19.373 |
aturdays | -18.914 |
Commands | -18.139 |
unity | -18.075 |