Token | , |
Token ID | 11 |
Feature activation | +5.50e+00 |
Pos logit contributions | |
Co | +18.283 |
B | +17.147 |
ian | +17.131 |
L | +17.040 |
P | +16.966 |
Neg logit contributions | |
tremend | -16.737 |
deaf | -13.952 |
meaningful | -13.200 |
proactive | -12.098 |
vested | -12.074 |
Token | T |
Token ID | 309 |
Feature activation | +8.71e+00 |
Pos logit contributions | |
Co | +6.564 |
ian | +6.050 |
L | +5.944 |
B | +5.916 |
she | +5.912 |
Neg logit contributions | |
tremend | -9.240 |
deaf | -7.884 |
meaningful | -7.613 |
vested | -7.082 |
proactive | -7.073 |
Token | . |
Token ID | 13 |
Feature activation | +8.03e+00 |
Pos logit contributions | |
Co | +7.284 |
ian | +6.510 |
j | +6.417 |
J | +6.394 |
L | +6.253 |
Neg logit contributions | |
tremend | -17.703 |
deaf | -15.486 |
meaningful | -15.075 |
vested | -14.332 |
proactive | -14.207 |
Token | J |
Token ID | 41 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
Co | +2.609 |
J | +2.140 |
L | +1.864 |
B | +1.808 |
P | +1.652 |
Neg logit contributions | |
tremend | -21.747 |
deaf | -18.816 |
meaningful | -18.387 |
vested | -18.007 |
proactive | -17.664 |
Token | . |
Token ID | 13 |
Feature activation | +9.65e+00 |
Pos logit contributions | |
Co | +14.370 |
L | +13.391 |
ian | +13.135 |
she | +13.026 |
Smith | +12.993 |
Neg logit contributions | |
tremend | -26.192 |
misunder | -18.841 |
deaf | -18.711 |
exha | -18.598 |
behavi | -18.521 |
Token | Osh |
Token ID | 46614 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
Co | +9.716 |
L | +8.967 |
P | +8.950 |
B | +8.788 |
Smith | +8.687 |
Neg logit contributions | |
tremend | -18.809 |
deaf | -14.367 |
behavi | -13.994 |
meaningful | -13.900 |
undermin | -13.860 |
Token | ie |
Token ID | 494 |
Feature activation | +7.35e+00 |
Pos logit contributions | |
i | +20.175 |
ian | +19.674 |
ie | +19.034 |
she | +18.483 |
oy | +18.375 |
Neg logit contributions | |
tremend | -39.155 |
exha | -30.691 |
behavi | -30.648 |
misunder | -29.160 |
eleph | -28.327 |
Token | and |
Token ID | 290 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
Co | +8.340 |
ian | +7.535 |
B | +7.521 |
L | +7.515 |
she | +7.461 |
Neg logit contributions | |
tremend | -12.191 |
deaf | -10.681 |
meaningful | -10.393 |
vested | -9.647 |
proactive | -9.645 |
Token | Nick |
Token ID | 8047 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
Co | +3.133 |
ian | +2.890 |
she | +2.826 |
L | +2.824 |
B | +2.820 |
Neg logit contributions | |
tremend | -4.152 |
deaf | -3.587 |
meaningful | -3.449 |
vested | -3.206 |
proactive | -3.189 |
Token | las |
Token ID | 21921 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
Co | +12.219 |
L | +11.776 |
ian | +11.456 |
i | +11.387 |
she | +11.372 |
Neg logit contributions | |
tremend | -21.823 |
deaf | -17.306 |
meaningful | -16.486 |
behavi | -16.478 |
misunder | -16.383 |
Token | Back |
Token ID | 5157 |
Feature activation | +9.83e+00 |
Pos logit contributions | |
Co | +10.803 |
ian | +10.263 |
B | +10.088 |
L | +9.993 |
j | +9.769 |
Neg logit contributions | |
tremend | -18.032 |
deaf | -13.846 |
meaningful | -13.077 |
behavi | -13.038 |
awaru | -12.668 |
Token |
|
Token ID | 198 |
Feature activation | +4.52e+00 |
Pos logit contributions | |
Co | +3.000 |
ian | +2.540 |
L | +2.530 |
B | +2.515 |
she | +2.508 |
Neg logit contributions | |
tremend | -10.911 |
deaf | -8.655 |
meaningful | -8.515 |
behavi | -8.455 |
exha | -8.331 |
Token | T |
Token ID | 51 |
Feature activation | +6.76e+00 |
Pos logit contributions | |
Co | +3.061 |
Star | +2.514 |
ian | +2.513 |
she | +2.503 |
L | +2.476 |
Neg logit contributions | |
tremend | -10.242 |
deaf | -9.193 |
meaningful | -9.047 |
vested | -8.542 |
visually | -8.536 |
Token | . |
Token ID | 13 |
Feature activation | +8.90e+00 |
Pos logit contributions | |
Co | +6.673 |
ian | +6.029 |
she | +5.876 |
Star | +5.823 |
L | +5.814 |
Neg logit contributions | |
tremend | -12.939 |
deaf | -11.383 |
meaningful | -11.184 |
vested | -10.470 |
proactive | -10.393 |
Token | J |
Token ID | 41 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
Co | +8.043 |
L | +7.168 |
B | +7.141 |
J | +7.046 |
P | +6.949 |
Neg logit contributions | |
tremend | -17.826 |
deaf | -15.382 |
meaningful | -15.234 |
vested | -14.605 |
personalized | -14.253 |
Token | . |
Token ID | 13 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
Co | +13.366 |
ian | +12.627 |
L | +12.593 |
B | +12.233 |
she | +12.071 |
Neg logit contributions | |
tremend | -22.912 |
deaf | -18.833 |
meaningful | -18.318 |
vested | -17.604 |
personalized | -17.521 |
Token | Osh |
Token ID | 46614 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
Co | +11.409 |
ian | +10.564 |
P | +10.439 |
B | +10.322 |
L | +10.306 |
Neg logit contributions | |
tremend | -18.661 |
deaf | -14.265 |
meaningful | -14.040 |
behavi | -13.763 |
vested | -13.422 |
Token | ie |
Token ID | 494 |
Feature activation | +5.93e+00 |
Pos logit contributions | |
ian | +17.269 |
i | +16.718 |
is | +16.236 |
she | +16.153 |
ie | +15.801 |
Neg logit contributions | |
tremend | -34.809 |
behavi | -27.655 |
deaf | -26.520 |
undermin | -26.160 |
meaningful | -26.130 |
Token |
|
Token ID | 198 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
Co | +6.590 |
ian | +5.935 |
L | +5.901 |
Star | +5.884 |
B | +5.875 |
Neg logit contributions | |
tremend | -10.531 |
deaf | -9.145 |
meaningful | -8.892 |
proactive | -8.243 |
vested | -8.229 |
Token |
|
Token ID | 198 |
Feature activation | +4.20e+00 |
Pos logit contributions | |
Co | +2.606 |
ian | +2.214 |
L | +2.201 |
B | +2.191 |
she | +2.182 |
Neg logit contributions | |
tremend | -8.844 |
deaf | -7.148 |
meaningful | -7.026 |
behavi | -6.834 |
proactive | -6.735 |
Token | Nick |
Token ID | 23609 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
Co | +2.787 |
ian | +2.287 |
Star | +2.281 |
she | +2.278 |
L | +2.237 |
Neg logit contributions | |
tremend | -9.550 |
deaf | -8.598 |
meaningful | -8.459 |
vested | -7.987 |
visually | -7.983 |
Token | las |
Token ID | 21921 |
Feature activation | +8.59e+00 |
Pos logit contributions | |
Co | +12.622 |
L | +11.948 |
ian | +11.816 |
she | +11.729 |
B | +11.631 |
Neg logit contributions | |
tremend | -15.728 |
deaf | -12.862 |
meaningful | -12.452 |
vested | -11.905 |
proactive | -11.720 |
Token | to |
Token ID | 284 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
Co | +4.790 |
ian | +4.464 |
B | +4.448 |
L | +4.446 |
she | +4.429 |
Neg logit contributions | |
tremend | -4.930 |
deaf | -3.570 |
meaningful | -3.479 |
vested | -3.241 |
behavi | -3.205 |
Token | Reuters |
Token ID | 8428 |
Feature activation | +7.90e+00 |
Pos logit contributions | |
tremend | +1.925 |
deaf | +1.642 |
meaningful | +1.594 |
visually | +1.434 |
vested | +1.431 |
Neg logit contributions | |
Co | -2.118 |
ian | -1.959 |
she | -1.958 |
Star | -1.948 |
uh | -1.930 |
Token | . |
Token ID | 13 |
Feature activation | +3.92e+00 |
Pos logit contributions | |
Co | +9.455 |
ian | +8.768 |
L | +8.642 |
Star | +8.623 |
B | +8.604 |
Neg logit contributions | |
tremend | -12.622 |
deaf | -10.964 |
meaningful | -10.746 |
vested | -9.942 |
proactive | -9.747 |
Token |
|
Token ID | 198 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
Co | +3.641 |
ian | +3.190 |
Star | +3.173 |
she | +3.166 |
L | +3.147 |
Neg logit contributions | |
tremend | -7.960 |
deaf | -6.944 |
meaningful | -6.827 |
vested | -6.413 |
proactive | -6.366 |
Token |
|
Token ID | 198 |
Feature activation | +9.64e+00 |
Pos logit contributions | |
Co | +6.679 |
B | +5.972 |
L | +5.933 |
P | +5.728 |
ian | +5.540 |
Neg logit contributions | |
tremend | -27.152 |
exha | -21.318 |
undermin | -20.960 |
behavi | -20.777 |
misunder | -20.658 |
Token | ADVERTISEMENT |
Token ID | 19053 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
Co | +8.014 |
L | +7.017 |
Star | +6.999 |
B | +6.987 |
P | +6.831 |
Neg logit contributions | |
tremend | -20.653 |
deaf | -17.451 |
meaningful | -17.287 |
vested | -16.446 |
proactive | -16.351 |
Token |
|
Token ID | 198 |
Feature activation | +7.63e+00 |
Pos logit contributions | |
Co | +20.251 |
P | +19.409 |
B | +19.335 |
L | +19.318 |
S | +19.082 |
Neg logit contributions | |
tremend | -29.426 |
vested | -22.031 |
meaningful | -21.805 |
deaf | -21.514 |
proactive | -21.380 |
Token |
|
Token ID | 198 |
Feature activation | +7.32e+00 |
Pos logit contributions | |
Co | +4.449 |
B | +3.802 |
L | +3.793 |
ian | +3.684 |
P | +3.635 |
Neg logit contributions | |
tremend | -20.468 |
exha | -16.025 |
behavi | -15.892 |
undermin | -15.811 |
misunder | -15.656 |
Token | Twenty |
Token ID | 34096 |
Feature activation | +4.62e+00 |
Pos logit contributions | |
Co | +4.788 |
Star | +3.952 |
L | +3.926 |
B | +3.907 |
P | +3.793 |
Neg logit contributions | |
tremend | -17.084 |
deaf | -14.916 |
meaningful | -14.749 |
vested | -14.031 |
proactive | -13.969 |
Token | - |
Token ID | 12 |
Feature activation | +3.72e+00 |
Pos logit contributions | |
Co | +6.387 |
ian | +5.969 |
she | +5.929 |
uh | +5.867 |
Star | +5.867 |
Neg logit contributions | |
tremend | -7.011 |
deaf | -5.806 |
meaningful | -5.701 |
vested | -5.252 |
visually | -5.189 |
Token | three |
Token ID | 15542 |
Feature activation | +3.63e+00 |
Pos logit contributions | |
Co | +2.835 |
she | +2.463 |
ian | +2.420 |
Star | +2.407 |
B | +2.359 |
Neg logit contributions | |
tremend | -8.046 |
deaf | -7.167 |
meaningful | -7.064 |
vested | -6.650 |
visually | -6.636 |
Token | ross |
Token ID | 1214 |
Feature activation | +8.08e+00 |
Pos logit contributions | |
Co | +16.364 |
uh | +15.974 |
ian | +15.918 |
oy | +15.547 |
j | +15.057 |
Neg logit contributions | |
tremend | -19.726 |
deaf | -16.802 |
meaningful | -16.165 |
proactive | -15.174 |
visually | -15.031 |
Token | . |
Token ID | 13 |
Feature activation | +3.97e+00 |
Pos logit contributions | |
Co | +10.254 |
ian | +9.727 |
she | +9.361 |
L | +9.257 |
Star | +9.213 |
Neg logit contributions | |
tremend | -12.680 |
deaf | -10.977 |
meaningful | -10.538 |
proactive | -9.696 |
visually | -9.651 |
Token | Carlton |
Token ID | 44348 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
Co | +5.132 |
ian | +4.693 |
L | +4.654 |
Star | +4.640 |
B | +4.634 |
Neg logit contributions | |
tremend | -6.587 |
deaf | -5.531 |
meaningful | -5.419 |
proactive | -4.973 |
vested | -4.965 |
Token | L |
Token ID | 406 |
Feature activation | +8.80e+00 |
Pos logit contributions | |
Co | +15.333 |
ian | +14.572 |
L | +14.388 |
B | +14.338 |
P | +14.134 |
Neg logit contributions | |
tremend | -17.936 |
deaf | -13.973 |
meaningful | -13.693 |
proactive | -12.702 |
behavi | -12.693 |
Token | . |
Token ID | 13 |
Feature activation | +7.97e+00 |
Pos logit contributions | |
Co | +7.841 |
ian | +7.208 |
uh | +6.952 |
oy | +6.826 |
she | +6.803 |
Neg logit contributions | |
tremend | -16.891 |
deaf | -14.949 |
meaningful | -14.662 |
proactive | -13.862 |
vested | -13.814 |
Token | Guth |
Token ID | 44003 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
Co | +10.234 |
L | +9.311 |
B | +9.275 |
ian | +9.270 |
Star | +9.102 |
Neg logit contributions | |
tremend | -12.996 |
deaf | -10.522 |
meaningful | -10.346 |
proactive | -9.640 |
vested | -9.591 |
Token | rie |
Token ID | 5034 |
Feature activation | +5.28e+00 |
Pos logit contributions | |
ian | +23.936 |
Co | +23.716 |
rick | +22.796 |
i | +22.678 |
ix | +22.565 |
Neg logit contributions | |
tremend | -21.495 |
deaf | -17.230 |
meaningful | -16.278 |
proactive | -15.213 |
vested | -15.014 |
Token | . |
Token ID | 13 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
Co | +5.494 |
ian | +4.893 |
she | +4.827 |
Star | +4.811 |
L | +4.788 |
Neg logit contributions | |
tremend | -9.838 |
deaf | -8.632 |
meaningful | -8.492 |
proactive | -7.890 |
visually | -7.889 |
Token | Marion |
Token ID | 32473 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
Co | +4.040 |
ian | +3.693 |
she | +3.659 |
Star | +3.656 |
L | +3.649 |
Neg logit contributions | |
tremend | -5.168 |
deaf | -4.380 |
meaningful | -4.288 |
vested | -3.935 |
proactive | -3.929 |
Token | T |
Token ID | 309 |
Feature activation | +7.49e+00 |
Pos logit contributions | |
Co | +16.634 |
ian | +15.874 |
L | +15.659 |
B | +15.526 |
she | +15.322 |
Neg logit contributions | |
tremend | -18.278 |
deaf | -14.160 |
meaningful | -13.871 |
behavi | -12.916 |
proactive | -12.847 |
Token | . |
Token ID | 13 |
Feature activation | +8.86e+00 |
Pos logit contributions | |
Co | +5.991 |
ian | +5.398 |
uh | +5.272 |
she | +5.237 |
L | +5.073 |
Neg logit contributions | |
tremend | -15.179 |
deaf | -13.551 |
meaningful | -13.346 |
vested | -12.693 |
proactive | -12.614 |
Token | 8 |
Token ID | 807 |
Feature activation | +4.20e+00 |
Pos logit contributions | |
Co | +6.697 |
ian | +6.065 |
L | +6.039 |
B | +6.007 |
S | +5.887 |
Neg logit contributions | |
tremend | -11.949 |
deaf | -9.597 |
meaningful | -9.033 |
behavi | -8.914 |
vested | -8.789 |
Token | election |
Token ID | 3071 |
Feature activation | +3.79e+00 |
Pos logit contributions | |
Co | +7.011 |
ian | +6.621 |
Star | +6.555 |
she | +6.534 |
B | +6.519 |
Neg logit contributions | |
tremend | -5.140 |
deaf | -4.107 |
meaningful | -3.896 |
vested | -3.537 |
visually | -3.450 |
Token | . |
Token ID | 13 |
Feature activation | +3.72e+00 |
Pos logit contributions | |
Co | +4.484 |
ian | +4.126 |
she | +4.084 |
Star | +4.040 |
L | +4.037 |
Neg logit contributions | |
tremend | -6.528 |
deaf | -5.615 |
meaningful | -5.443 |
vested | -5.059 |
proactive | -5.055 |
Token |
|
Token ID | 198 |
Feature activation | +9.37e+00 |
Pos logit contributions | |
Co | +3.542 |
she | +3.132 |
ian | +3.099 |
Star | +3.066 |
L | +3.054 |
Neg logit contributions | |
tremend | -7.451 |
deaf | -6.494 |
meaningful | -6.390 |
vested | -5.987 |
proactive | -5.955 |
Token |
|
Token ID | 198 |
Feature activation | +8.40e+00 |
Pos logit contributions | |
Co | +5.799 |
L | +5.131 |
B | +5.112 |
P | +4.931 |
ian | +4.864 |
Neg logit contributions | |
tremend | -24.665 |
exha | -19.289 |
undermin | -19.039 |
behavi | -18.922 |
misunder | -18.734 |
Token | ADVERTISEMENT |
Token ID | 19053 |
Feature activation | +1.98e+01 |
Pos logit contributions | |
Co | +8.201 |
L | +7.211 |
B | +7.177 |
she | +7.158 |
P | +7.096 |
Neg logit contributions | |
tremend | -16.922 |
deaf | -14.240 |
meaningful | -14.085 |
vested | -13.321 |
artificially | -13.279 |
Token |
|
Token ID | 198 |
Feature activation | +7.85e+00 |
Pos logit contributions | |
Co | +17.672 |
P | +17.379 |
B | +17.339 |
S | +17.266 |
L | +17.220 |
Neg logit contributions | |
tremend | -36.198 |
exha | -26.862 |
carbohyd | -25.993 |
undermin | -25.865 |
eleph | -25.811 |
Token |
|
Token ID | 198 |
Feature activation | +7.49e+00 |
Pos logit contributions | |
Co | +4.514 |
L | +3.884 |
B | +3.856 |
P | +3.695 |
she | +3.690 |
Neg logit contributions | |
tremend | -21.247 |
exha | -16.647 |
behavi | -16.520 |
undermin | -16.468 |
misunder | -16.273 |
Token | Clinton |
Token ID | 16549 |
Feature activation | +5.46e+00 |
Pos logit contributions | |
Co | +5.003 |
she | +4.065 |
L | +4.063 |
B | +4.041 |
Star | +3.986 |
Neg logit contributions | |
tremend | -17.454 |
deaf | -15.174 |
meaningful | -15.024 |
vested | -14.307 |
proactive | -14.250 |
Token | mentioned |
Token ID | 4750 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
Co | +8.236 |
ian | +7.781 |
she | +7.666 |
L | +7.598 |
Star | +7.582 |
Neg logit contributions | |
tremend | -7.463 |
deaf | -6.026 |
meaningful | -5.895 |
proactive | -5.263 |
vested | -5.257 |
Token | the |
Token ID | 262 |
Feature activation | -4.59e+00 |
Pos logit contributions | |
tremend | +5.619 |
deaf | +4.878 |
meaningful | +4.722 |
vested | +4.157 |
proactive | +4.152 |
Neg logit contributions | |
Co | -7.808 |
ian | -7.254 |
Star | -7.251 |
she | -7.232 |
uh | -7.229 |
Token | Jeff |
Token ID | 19139 |
Feature activation | +7.56e+00 |
Pos logit contributions | |
Co | +4.797 |
ian | +4.433 |
B | +4.365 |
Star | +4.358 |
L | +4.344 |
Neg logit contributions | |
tremend | -6.438 |
deaf | -5.410 |
meaningful | -5.280 |
vested | -4.875 |
visually | -4.855 |
Token | Flake |
Token ID | 39727 |
Feature activation | +7.24e+00 |
Pos logit contributions | |
Co | +9.322 |
B | +8.440 |
she | +8.436 |
ian | +8.312 |
Star | +8.214 |
Neg logit contributions | |
tremend | -12.616 |
deaf | -10.677 |
meaningful | -10.301 |
vested | -9.734 |
proactive | -9.626 |
Token | ( |
Token ID | 7 |
Feature activation | +7.02e+00 |
Pos logit contributions | |
Co | +10.578 |
ian | +9.884 |
L | +9.814 |
B | +9.797 |
Star | +9.748 |
Neg logit contributions | |
tremend | -10.025 |
deaf | -8.115 |
meaningful | -7.871 |
vested | -7.273 |
proactive | -7.238 |
Token | R |
Token ID | 49 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
Co | +1.922 |
L | +1.214 |
B | +1.143 |
P | +1.047 |
Star | +1.004 |
Neg logit contributions | |
tremend | -18.854 |
deaf | -16.771 |
meaningful | -16.635 |
proactive | -15.905 |
vested | -15.859 |
Token | - |
Token ID | 12 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
Co | +14.280 |
ian | +12.711 |
PA | +12.543 |
L | +12.504 |
P | +12.456 |
Neg logit contributions | |
tremend | -18.786 |
deaf | -16.285 |
meaningful | -15.437 |
proactive | -14.943 |
vested | -14.941 |
Token | Ari |
Token ID | 26529 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
Co | +9.004 |
PA | +7.652 |
L | +7.539 |
B | +7.486 |
P | +7.310 |
Neg logit contributions | |
tremend | -27.230 |
deaf | -22.825 |
meaningful | -22.157 |
proactive | -21.754 |
behavi | -21.646 |
Token | z |
Token ID | 89 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
Co | +13.441 |
Z | +12.936 |
L | +12.388 |
j | +12.161 |
z | +12.100 |
Neg logit contributions | |
tremend | -35.783 |
behavi | -29.409 |
deaf | -28.191 |
proactive | -28.105 |
misunder | -27.965 |
Token | .) |
Token ID | 2014 |
Feature activation | +6.43e+00 |
Pos logit contributions | |
Co | +11.113 |
ian | +9.926 |
L | +9.694 |
Star | +9.390 |
B | +9.290 |
Neg logit contributions | |
tremend | -25.620 |
deaf | -22.709 |
meaningful | -21.946 |
proactive | -21.012 |
visually | -20.849 |
Token | after |
Token ID | 706 |
Feature activation | -4.06e+00 |
Pos logit contributions | |
Co | +10.070 |
ian | +9.563 |
L | +9.434 |
Star | +9.416 |
she | +9.383 |
Neg logit contributions | |
tremend | -8.179 |
deaf | -6.396 |
meaningful | -6.195 |
proactive | -5.633 |
vested | -5.612 |
Token | he |
Token ID | 339 |
Feature activation | -3.88e+00 |
Pos logit contributions | |
tremend | +4.992 |
deaf | +4.351 |
meaningful | +4.192 |
visually | +3.737 |
proactive | +3.654 |
Neg logit contributions | |
Co | -6.491 |
Star | -6.046 |
uh | -6.015 |
she | -6.012 |
ian | -6.004 |
Token | was |
Token ID | 373 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
tremend | +5.362 |
deaf | +4.848 |
meaningful | +4.651 |
visually | +4.311 |
vested | +4.252 |
Neg logit contributions | |
Co | -5.558 |
Star | -5.106 |
she | -5.091 |
uh | -5.041 |
Smith | -5.031 |
Token | . |
Token ID | 13 |
Feature activation | +9.91e-02 |
Pos logit contributions | |
tremend | +3.305 |
deaf | +2.931 |
meaningful | +2.860 |
visually | +2.642 |
vested | +2.639 |
Neg logit contributions | |
Co | -2.463 |
Star | -2.231 |
she | -2.226 |
ian | -2.219 |
Smith | -2.185 |
Token | � |
Token ID | 447 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
Co | +0.101 |
she | +0.090 |
ian | +0.090 |
Star | +0.089 |
uh | +0.087 |
Neg logit contributions | |
tremend | -0.185 |
deaf | -0.166 |
meaningful | -0.163 |
visually | -0.151 |
vested | -0.151 |
Token | � |
Token ID | 251 |
Feature activation | +8.07e+00 |
Pos logit contributions | |
Co | +9.654 |
B | +9.126 |
Star | +8.810 |
L | +8.786 |
uh | +8.761 |
Neg logit contributions | |
tremend | -21.092 |
deaf | -18.329 |
meaningful | -17.723 |
visually | -16.897 |
vested | -16.866 |
Token |
|
Token ID | 198 |
Feature activation | +6.10e+00 |
Pos logit contributions | |
Co | +10.638 |
she | +9.805 |
ian | +9.794 |
B | +9.773 |
L | +9.771 |
Neg logit contributions | |
tremend | -12.382 |
deaf | -10.338 |
meaningful | -10.087 |
visually | -9.249 |
vested | -9.239 |
Token |
|
Token ID | 198 |
Feature activation | +6.25e+00 |
Pos logit contributions | |
Co | +3.864 |
L | +3.289 |
B | +3.264 |
ian | +3.252 |
she | +3.191 |
Neg logit contributions | |
tremend | -15.856 |
exha | -12.273 |
behavi | -12.268 |
deaf | -12.238 |
undermin | -12.169 |
Token | ADVERTISEMENT |
Token ID | 19053 |
Feature activation | +1.95e+01 |
Pos logit contributions | |
Co | +4.763 |
B | +3.976 |
L | +3.973 |
she | +3.966 |
Star | +3.966 |
Neg logit contributions | |
tremend | -13.778 |
deaf | -12.094 |
meaningful | -11.917 |
vested | -11.283 |
visually | -11.255 |
Token |
|
Token ID | 198 |
Feature activation | +7.31e+00 |
Pos logit contributions | |
Co | +19.708 |
B | +18.970 |
P | +18.837 |
S | +18.679 |
L | +18.562 |
Neg logit contributions | |
tremend | -27.795 |
deaf | -20.669 |
vested | -20.618 |
meaningful | -20.523 |
predetermined | -20.271 |
Token |
|
Token ID | 198 |
Feature activation | +7.06e+00 |
Pos logit contributions | |
Co | +4.282 |
L | +3.658 |
B | +3.640 |
ian | +3.555 |
P | +3.501 |
Neg logit contributions | |
tremend | -19.516 |
exha | -15.253 |
behavi | -15.135 |
undermin | -15.072 |
misunder | -14.953 |
Token | How |
Token ID | 2437 |
Feature activation | +3.78e+00 |
Pos logit contributions | |
Co | +4.931 |
B | +4.076 |
L | +4.071 |
Star | +4.018 |
she | +3.987 |
Neg logit contributions | |
tremend | -16.171 |
deaf | -14.090 |
meaningful | -13.902 |
vested | -13.196 |
proactive | -13.178 |
Token | a |
Token ID | 257 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
Co | +6.821 |
ian | +6.437 |
she | +6.390 |
L | +6.372 |
B | +6.366 |
Neg logit contributions | |
tremend | -4.074 |
deaf | -3.095 |
meaningful | -2.945 |
vested | -2.630 |
visually | -2.579 |
Token | pro |
Token ID | 1676 |
Feature activation | +5.48e+00 |
Pos logit contributions | |
tremend | +0.130 |
deaf | +0.106 |
meaningful | +0.102 |
vested | +0.090 |
visually | +0.090 |
Neg logit contributions | |
Co | -0.186 |
ian | -0.174 |
she | -0.174 |
Star | -0.173 |
L | -0.172 |
Token | . |
Token ID | 13 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
tremend | +3.917 |
deaf | +3.529 |
meaningful | +3.466 |
visually | +3.249 |
vested | +3.235 |
Neg logit contributions | |
Co | -1.849 |
Star | -1.618 |
she | -1.613 |
ian | -1.611 |
Smith | -1.578 |
Token | � |
Token ID | 447 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
tremend | +0.310 |
deaf | +0.281 |
meaningful | +0.276 |
visually | +0.259 |
vested | +0.258 |
Neg logit contributions | |
Co | -0.130 |
ian | -0.114 |
she | -0.113 |
Star | -0.112 |
uh | -0.110 |
Token | � |
Token ID | 251 |
Feature activation | +9.02e+00 |
Pos logit contributions | |
Co | +6.506 |
B | +6.032 |
uh | +5.860 |
L | +5.830 |
Star | +5.708 |
Neg logit contributions | |
tremend | -26.542 |
deaf | -22.223 |
meaningful | -21.482 |
behavi | -20.937 |
misunder | -20.841 |
Token |
|
Token ID | 198 |
Feature activation | +7.56e+00 |
Pos logit contributions | |
Co | +11.206 |
L | +10.316 |
she | +10.304 |
Star | +10.182 |
B | +10.165 |
Neg logit contributions | |
tremend | -14.345 |
deaf | -11.894 |
meaningful | -11.655 |
vested | -10.737 |
proactive | -10.716 |
Token |
|
Token ID | 198 |
Feature activation | +7.34e+00 |
Pos logit contributions | |
Co | +4.579 |
L | +3.940 |
B | +3.926 |
ian | +3.823 |
P | +3.743 |
Neg logit contributions | |
tremend | -19.931 |
exha | -15.528 |
behavi | -15.408 |
undermin | -15.397 |
misunder | -15.224 |
Token | ADVERTISEMENT |
Token ID | 19053 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
Co | +6.516 |
L | +5.694 |
Star | +5.619 |
B | +5.595 |
she | +5.515 |
Neg logit contributions | |
tremend | -15.226 |
deaf | -13.097 |
meaningful | -12.927 |
vested | -12.240 |
proactive | -12.207 |
Token |
|
Token ID | 198 |
Feature activation | +7.24e+00 |
Pos logit contributions | |
Co | +17.880 |
S | +17.550 |
L | +17.486 |
B | +17.457 |
P | +17.443 |
Neg logit contributions | |
tremend | -33.384 |
exha | -24.677 |
misunder | -23.761 |
undermin | -23.739 |
carbohyd | -23.673 |
Token |
|
Token ID | 198 |
Feature activation | +7.12e+00 |
Pos logit contributions | |
Co | +4.305 |
L | +3.698 |
B | +3.675 |
ian | +3.552 |
she | +3.534 |
Neg logit contributions | |
tremend | -19.221 |
exha | -14.986 |
behavi | -14.907 |
undermin | -14.857 |
misunder | -14.703 |
Token | Ign |
Token ID | 32916 |
Feature activation | +9.27e+00 |
Pos logit contributions | |
Co | +4.884 |
L | +4.087 |
Star | +4.008 |
B | +3.980 |
she | +3.907 |
Neg logit contributions | |
tremend | -16.299 |
deaf | -14.195 |
meaningful | -14.041 |
vested | -13.353 |
proactive | -13.331 |
Token | at |
Token ID | 265 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
Co | +4.162 |
ian | +4.119 |
she | +3.896 |
uh | +3.781 |
i | +3.532 |
Neg logit contributions | |
tremend | -23.444 |
behavi | -19.642 |
deaf | -19.358 |
meaningful | -18.946 |
exha | -18.826 |
Token | ius |
Token ID | 3754 |
Feature activation | -2.81e-02 |
Pos logit contributions | |
Co | +1.246 |
ian | +1.059 |
she | +0.907 |
uh | +0.892 |
Star | +0.858 |
Neg logit contributions | |
tremend | -8.825 |
deaf | -7.832 |
meaningful | -7.691 |
vested | -7.389 |
proactive | -7.327 |
Token | ko |
Token ID | 7204 |
Feature activation | +8.27e+00 |
Pos logit contributions | |
Co | +11.981 |
ian | +11.745 |
she | +11.446 |
oy | +11.229 |
uh | +11.149 |
Neg logit contributions | |
tremend | -14.207 |
deaf | -11.858 |
meaningful | -11.531 |
proactive | -10.648 |
vested | -10.493 |
Token | , |
Token ID | 11 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
Co | +11.207 |
ian | +10.681 |
j | +10.413 |
she | +10.399 |
i | +10.339 |
Neg logit contributions | |
tremend | -12.202 |
deaf | -10.146 |
meaningful | -9.852 |
proactive | -9.030 |
visually | -8.913 |
Token | Ser |
Token ID | 2930 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
Co | +4.044 |
ian | +3.741 |
she | +3.711 |
L | +3.679 |
Star | +3.678 |
Neg logit contributions | |
tremend | -4.581 |
deaf | -3.875 |
meaningful | -3.787 |
visually | -3.446 |
vested | -3.435 |
Token | hi |
Token ID | 5303 |
Feature activation | +6.14e+00 |
Pos logit contributions | |
Co | +14.623 |
ian | +14.542 |
she | +14.414 |
i | +14.293 |
uh | +14.250 |
Neg logit contributions | |
tremend | -23.607 |
deaf | -19.925 |
meaningful | -19.477 |
proactive | -18.477 |
personalized | -18.134 |
Token | y |
Token ID | 88 |
Feature activation | +8.94e+00 |
Pos logit contributions | |
Co | +2.505 |
ian | +2.087 |
uh | +1.909 |
she | +1.905 |
B | +1.826 |
Neg logit contributions | |
tremend | -15.102 |
deaf | -13.766 |
meaningful | -13.524 |
vested | -12.887 |
proactive | -12.865 |
Token | Kaz |
Token ID | 16385 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
Co | +11.332 |
ian | +10.529 |
B | +10.443 |
L | +10.415 |
she | +10.385 |
Neg logit contributions | |
tremend | -13.353 |
deaf | -11.344 |
meaningful | -11.078 |
proactive | -10.194 |
vested | -10.083 |
Token | arov |
Token ID | 42737 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
uh | +18.893 |
ian | +18.836 |
Co | +18.308 |
she | +18.082 |
oy | +18.030 |
Neg logit contributions | |
tremend | -25.801 |
deaf | -21.347 |
meaningful | -21.094 |
behavi | -20.403 |
proactive | -19.884 |
Token | , |
Token ID | 11 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
Co | +15.521 |
ian | +14.644 |
B | +14.337 |
she | +14.290 |
L | +14.254 |
Neg logit contributions | |
tremend | -14.342 |
deaf | -11.792 |
meaningful | -11.659 |
proactive | -10.508 |
visually | -10.406 |
Token | Vital |
Token ID | 28476 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
Co | +4.845 |
ian | +4.506 |
she | +4.468 |
L | +4.435 |
B | +4.425 |
Neg logit contributions | |
tremend | -4.973 |
deaf | -4.149 |
meaningful | -4.057 |
visually | -3.663 |
vested | -3.652 |
Token | y |
Token ID | 88 |
Feature activation | +7.19e+00 |
Pos logit contributions | |
Co | +17.430 |
ian | +17.326 |
i | +17.115 |
j | +16.391 |
she | +16.337 |
Neg logit contributions | |
tremend | -18.763 |
deaf | -15.669 |
meaningful | -15.644 |
vested | -14.170 |
proactive | -14.130 |
Token | Nem |
Token ID | 22547 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
Co | +9.231 |
ian | +8.617 |
she | +8.548 |
L | +8.480 |
B | +8.450 |
Neg logit contributions | |
tremend | -11.171 |
deaf | -9.533 |
meaningful | -9.254 |
proactive | -8.487 |
vested | -8.475 |
Token | White |
Token ID | 2635 |
Feature activation | +9.50e+00 |
Pos logit contributions | |
Co | +10.359 |
ian | +9.938 |
B | +9.389 |
PA | +9.114 |
Smith | +8.977 |
Neg logit contributions | |
tremend | -22.248 |
awaru | -18.277 |
deaf | -18.089 |
meaningful | -17.341 |
behavi | -17.119 |
Token | house |
Token ID | 4803 |
Feature activation | +6.56e+00 |
Pos logit contributions | |
Co | +8.185 |
she | +7.362 |
B | +7.100 |
Star | +7.066 |
Smith | +7.007 |
Neg logit contributions | |
tremend | -18.842 |
deaf | -16.167 |
meaningful | -15.933 |
proactive | -14.882 |
visually | -14.784 |
Token | , |
Token ID | 11 |
Feature activation | +2.90e+00 |
Pos logit contributions | |
Co | +9.457 |
ian | +8.794 |
L | +8.690 |
she | +8.683 |
B | +8.682 |
Neg logit contributions | |
tremend | -9.240 |
deaf | -7.631 |
meaningful | -7.502 |
proactive | -6.788 |
vested | -6.786 |
Token | Democrat |
Token ID | 9755 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
Co | +5.461 |
ian | +5.140 |
she | +5.109 |
B | +5.099 |
L | +5.086 |
Neg logit contributions | |
tremend | -3.023 |
deaf | -2.280 |
meaningful | -2.197 |
vested | -1.872 |
visually | -1.847 |
Token | of |
Token ID | 286 |
Feature activation | +3.84e+00 |
Pos logit contributions | |
Co | +13.328 |
ian | +12.169 |
B | +12.143 |
L | +12.087 |
P | +12.044 |
Neg logit contributions | |
tremend | -14.815 |
deaf | -12.362 |
meaningful | -12.020 |
personalized | -11.214 |
visually | -11.037 |
Token | Rhode |
Token ID | 24545 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
Co | +5.374 |
ian | +4.993 |
she | +4.990 |
Star | +4.893 |
L | +4.893 |
Neg logit contributions | |
tremend | -5.924 |
deaf | -4.884 |
meaningful | -4.704 |
visually | -4.285 |
vested | -4.269 |
Token | Island |
Token ID | 5451 |
Feature activation | +9.62e+00 |
Pos logit contributions | |
Co | +16.774 |
ian | +16.750 |
uh | +14.918 |
S | +14.770 |
PA | +14.690 |
Neg logit contributions | |
tremend | -31.033 |
deaf | -24.631 |
misunder | -23.593 |
behavi | -23.243 |
meaningful | -22.355 |
Token | and |
Token ID | 290 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
Co | +12.472 |
ian | +11.425 |
L | +11.245 |
B | +11.227 |
P | +11.198 |
Neg logit contributions | |
tremend | -13.926 |
deaf | -11.787 |
meaningful | -11.476 |
proactive | -10.522 |
visually | -10.374 |
Token | member |
Token ID | 2888 |
Feature activation | +5.08e+00 |
Pos logit contributions | |
Co | +6.355 |
ian | +5.921 |
B | +5.893 |
P | +5.892 |
L | +5.883 |
Neg logit contributions | |
tremend | -2.961 |
deaf | -2.130 |
meaningful | -2.048 |
vested | -1.712 |
visually | -1.676 |
Token | of |
Token ID | 286 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
Co | +5.525 |
ian | +5.080 |
she | +5.001 |
L | +4.952 |
B | +4.930 |
Neg logit contributions | |
tremend | -9.962 |
deaf | -7.565 |
misunder | -7.367 |
meaningful | -7.362 |
behavi | -7.324 |
Token | the |
Token ID | 262 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
Co | +3.247 |
ian | +3.056 |
she | +3.053 |
B | +3.043 |
Star | +3.042 |
Neg logit contributions | |
tremend | -1.032 |
deaf | -0.693 |
meaningful | -0.635 |
visually | -0.488 |
vested | -0.470 |
Token | Writing |
Token ID | 22183 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
Co | +8.891 |
ian | +8.109 |
L | +8.072 |
B | +8.030 |
Star | +8.029 |
Neg logit contributions | |
tremend | -10.690 |
deaf | -8.748 |
meaningful | -8.628 |
vested | -8.066 |
proactive | -7.887 |
Token | by |
Token ID | 416 |
Feature activation | +4.27e+00 |
Pos logit contributions | |
Co | +12.765 |
ian | +11.787 |
L | +11.673 |
Star | +11.650 |
B | +11.576 |
Neg logit contributions | |
tremend | -16.668 |
deaf | -12.353 |
meaningful | -12.275 |
misunder | -11.536 |
awaru | -11.494 |
Token | Z |
Token ID | 1168 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
Co | +5.282 |
ian | +4.872 |
she | +4.804 |
L | +4.771 |
B | +4.756 |
Neg logit contributions | |
tremend | -7.282 |
deaf | -6.082 |
meaningful | -5.992 |
vested | -5.513 |
visually | -5.504 |
Token | eb |
Token ID | 1765 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
Co | +13.249 |
ian | +13.076 |
uh | +12.676 |
she | +12.654 |
B | +12.555 |
Neg logit contributions | |
tremend | -17.318 |
deaf | -14.597 |
meaningful | -14.428 |
proactive | -13.341 |
vested | -13.214 |
Token | a |
Token ID | 64 |
Feature activation | +8.78e+00 |
Pos logit contributions | |
Co | +17.729 |
she | +17.349 |
ian | +17.016 |
uh | +16.934 |
i | +16.759 |
Neg logit contributions | |
tremend | -18.332 |
meaningful | -15.004 |
deaf | -14.757 |
personalized | -13.700 |
proactive | -13.694 |
Token | Sidd |
Token ID | 44487 |
Feature activation | +1.87e+01 |
Pos logit contributions | |
Co | +10.619 |
ian | +10.118 |
she | +9.840 |
uh | +9.671 |
L | +9.642 |
Neg logit contributions | |
tremend | -14.418 |
deaf | -12.110 |
meaningful | -11.868 |
visually | -10.873 |
proactive | -10.867 |
Token | iqu |
Token ID | 1557 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
i | +17.565 |
Co | +17.400 |
she | +17.000 |
ian | +16.915 |
j | +16.773 |
Neg logit contributions | |
tremend | -28.183 |
deaf | -23.720 |
meaningful | -22.536 |
vested | -21.049 |
proactive | -20.953 |
Token | i |
Token ID | 72 |
Feature activation | +8.44e+00 |
Pos logit contributions | |
i | +7.345 |
ian | +6.933 |
Co | +6.718 |
she | +6.257 |
j | +6.110 |
Neg logit contributions | |
tremend | -24.020 |
meaningful | -21.127 |
deaf | -20.921 |
behavi | -19.558 |
proactive | -19.446 |
Token | ; |
Token ID | 26 |
Feature activation | +6.83e+00 |
Pos logit contributions | |
Co | +10.028 |
ian | +9.582 |
she | +9.264 |
uh | +9.169 |
Star | +9.115 |
Neg logit contributions | |
tremend | -14.169 |
deaf | -11.764 |
meaningful | -11.646 |
vested | -10.702 |
proactive | -10.651 |
Token | Editing |
Token ID | 39883 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
Co | +7.570 |
L | +6.756 |
ian | +6.721 |
B | +6.682 |
P | +6.658 |
Neg logit contributions | |
tremend | -12.189 |
deaf | -10.147 |
meaningful | -10.009 |
vested | -9.435 |
proactive | -9.261 |
Token | by |
Token ID | 416 |
Feature activation | +4.58e+00 |
Pos logit contributions | |
Co | +14.607 |
B | +13.479 |
L | +13.390 |
P | +13.248 |
ian | +13.191 |
Neg logit contributions | |
tremend | -24.146 |
behavi | -17.158 |
misunder | -17.018 |
exha | -16.558 |
undermin | -16.463 |
Token | nut |
Token ID | 14930 |
Feature activation | +7.28e+00 |
Pos logit contributions | |
Co | +7.677 |
ian | +6.766 |
Star | +6.703 |
she | +6.659 |
L | +6.586 |
Neg logit contributions | |
tremend | -16.222 |
deaf | -14.228 |
meaningful | -13.991 |
vested | -13.121 |
proactive | -13.028 |
Token | Brewery |
Token ID | 31003 |
Feature activation | +3.87e+00 |
Pos logit contributions | |
Co | +9.962 |
B | +9.073 |
L | +9.023 |
ian | +8.990 |
Star | +8.942 |
Neg logit contributions | |
tremend | -10.885 |
deaf | -9.205 |
meaningful | -8.947 |
vested | -8.261 |
proactive | -8.158 |
Token | in |
Token ID | 287 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
Co | +6.080 |
she | +5.608 |
ian | +5.607 |
Star | +5.594 |
L | +5.555 |
Neg logit contributions | |
tremend | -5.206 |
deaf | -4.362 |
meaningful | -4.210 |
vested | -3.785 |
visually | -3.763 |
Token | Boulder |
Token ID | 27437 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
tremend | +3.228 |
deaf | +2.831 |
meaningful | +2.773 |
visually | +2.534 |
vested | +2.525 |
Neg logit contributions | |
Co | -2.814 |
she | -2.576 |
ian | -2.574 |
Star | -2.564 |
uh | -2.537 |
Token | , |
Token ID | 11 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
Co | +14.946 |
ian | +13.892 |
L | +13.668 |
B | +13.664 |
uh | +13.530 |
Neg logit contributions | |
tremend | -14.205 |
deaf | -11.583 |
meaningful | -11.089 |
proactive | -10.197 |
vested | -10.054 |
Token | Colo |
Token ID | 41943 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
Co | +2.167 |
ian | +1.956 |
she | +1.941 |
Star | +1.924 |
B | +1.915 |
Neg logit contributions | |
tremend | -3.257 |
deaf | -2.843 |
meaningful | -2.778 |
visually | -2.566 |
vested | -2.564 |
Token | ., |
Token ID | 1539 |
Feature activation | +3.19e+00 |
Pos logit contributions | |
Co | +20.882 |
L | +19.348 |
uh | +19.208 |
B | +19.171 |
ian | +19.150 |
Neg logit contributions | |
tremend | -22.027 |
deaf | -18.051 |
meaningful | -17.714 |
vested | -16.514 |
proactive | -16.451 |
Token | on |
Token ID | 319 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
Co | +5.095 |
ian | +4.759 |
she | +4.736 |
Star | +4.706 |
L | +4.698 |
Neg logit contributions | |
tremend | -4.235 |
deaf | -3.412 |
meaningful | -3.307 |
vested | -2.976 |
proactive | -2.953 |
Token | Tuesday |
Token ID | 3431 |
Feature activation | +5.20e+00 |
Pos logit contributions | |
tremend | +1.923 |
deaf | +1.664 |
meaningful | +1.623 |
visually | +1.480 |
vested | +1.479 |
Neg logit contributions | |
Co | -1.710 |
ian | -1.569 |
she | -1.568 |
Star | -1.560 |
L | -1.541 |
Token | . |
Token ID | 13 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
Co | +5.624 |
ian | +5.085 |
she | +5.038 |
Star | +5.003 |
L | +5.002 |
Neg logit contributions | |
tremend | -9.476 |
deaf | -8.178 |
meaningful | -7.999 |
vested | -7.441 |
proactive | -7.424 |
Token | ( |
Token ID | 357 |
Feature activation | +8.85e+00 |
Pos logit contributions | |
Co | +1.214 |
ian | +1.086 |
she | +1.082 |
Star | +1.076 |
uh | +1.057 |
Neg logit contributions | |
tremend | -2.183 |
deaf | -1.950 |
meaningful | -1.909 |
visually | -1.777 |
vested | -1.773 |
Token | David |
Token ID | 3271 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
Co | +4.002 |
ian | +3.677 |
she | +3.670 |
Star | +3.637 |
L | +3.620 |
Neg logit contributions | |
tremend | -4.894 |
deaf | -4.205 |
meaningful | -4.069 |
visually | -3.737 |
vested | -3.731 |
Token | Duke |
Token ID | 11083 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
Co | +10.052 |
ian | +9.107 |
L | +8.947 |
Star | +8.818 |
she | +8.681 |
Neg logit contributions | |
tremend | -19.890 |
deaf | -16.354 |
meaningful | -15.650 |
behavi | -15.311 |
misunder | -15.009 |
Token | . |
Token ID | 13 |
Feature activation | +5.22e+00 |
Pos logit contributions | |
Co | +15.877 |
ian | +15.071 |
L | +14.903 |
B | +14.819 |
Star | +14.785 |
Neg logit contributions | |
tremend | -13.395 |
deaf | -10.641 |
meaningful | -10.305 |
proactive | -9.401 |
visually | -9.216 |
Token | ( |
Token ID | 357 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
Co | +7.003 |
L | +6.388 |
ian | +6.386 |
B | +6.376 |
Star | +6.374 |
Neg logit contributions | |
tremend | -8.356 |
deaf | -6.926 |
meaningful | -6.797 |
vested | -6.249 |
visually | -6.210 |
Token | Joe |
Token ID | 19585 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
Co | +14.706 |
L | +14.036 |
B | +13.929 |
P | +13.603 |
Star | +13.470 |
Neg logit contributions | |
tremend | -16.413 |
meaningful | -13.757 |
deaf | -13.586 |
proactive | -12.636 |
vested | -12.628 |
Token | Bur |
Token ID | 5481 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
Co | +15.240 |
B | +14.526 |
uh | +14.188 |
P | +14.165 |
j | +14.136 |
Neg logit contributions | |
tremend | -18.979 |
meaningful | -15.588 |
deaf | -15.584 |
vested | -14.847 |
proactive | -14.335 |
Token | bank |
Token ID | 17796 |
Feature activation | +6.70e+00 |
Pos logit contributions | |
Co | +10.209 |
j | +9.911 |
she | +9.796 |
uh | +9.647 |
i | +9.392 |
Neg logit contributions | |
tremend | -37.771 |
meaningful | -30.522 |
proactive | -29.989 |
deaf | -29.631 |
behavi | -29.569 |
Token | / |
Token ID | 14 |
Feature activation | +9.96e+00 |
Pos logit contributions | |
Co | +6.283 |
ian | +5.611 |
Star | +5.457 |
she | +5.444 |
L | +5.432 |
Neg logit contributions | |
tremend | -13.165 |
deaf | -11.479 |
meaningful | -11.374 |
vested | -10.624 |
proactive | -10.584 |
Token | Or |
Token ID | 5574 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
Co | +11.767 |
B | +10.786 |
L | +10.737 |
Star | +10.648 |
P | +10.577 |
Neg logit contributions | |
tremend | -16.512 |
deaf | -13.854 |
meaningful | -13.699 |
artificially | -12.789 |
vested | -12.704 |
Token | lando |
Token ID | 11993 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
Co | +11.233 |
she | +10.464 |
B | +10.157 |
Star | +10.086 |
ian | +10.069 |
Neg logit contributions | |
tremend | -19.153 |
deaf | -15.940 |
meaningful | -15.823 |
visually | -15.107 |
vested | -14.778 |
Token | Sentinel |
Token ID | 26716 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
Co | +13.154 |
Star | +12.504 |
B | +11.833 |
L | +11.733 |
ian | +11.619 |
Neg logit contributions | |
tremend | -21.749 |
deaf | -18.134 |
meaningful | -17.907 |
artificially | -16.742 |
proactive | -16.648 |
Token | ff |
Token ID | 487 |
Feature activation | +8.25e+00 |
Pos logit contributions | |
uh | +5.999 |
j | +5.685 |
Co | +5.564 |
ian | +5.447 |
she | +5.290 |
Neg logit contributions | |
tremend | -32.930 |
meaningful | -27.669 |
behavi | -27.382 |
deaf | -27.116 |
proactive | -26.627 |
Token |
|
Token ID | 198 |
Feature activation | +4.59e+00 |
Pos logit contributions | |
Co | +9.991 |
ian | +9.578 |
B | +9.085 |
Star | +9.071 |
L | +9.071 |
Neg logit contributions | |
tremend | -13.379 |
deaf | -11.118 |
meaningful | -10.983 |
vested | -10.138 |
proactive | -10.124 |
Token |
|
Token ID | 198 |
Feature activation | +5.43e+00 |
Pos logit contributions | |
Co | +3.129 |
ian | +2.647 |
L | +2.646 |
B | +2.625 |
she | +2.612 |
Neg logit contributions | |
tremend | -11.665 |
deaf | -9.184 |
meaningful | -9.054 |
behavi | -9.036 |
exha | -8.943 |
Token | 2005 |
Token ID | 14315 |
Feature activation | +8.77e+00 |
Pos logit contributions | |
Co | +3.290 |
Star | +2.695 |
B | +2.676 |
L | +2.650 |
she | +2.616 |
Neg logit contributions | |
tremend | -12.970 |
deaf | -11.337 |
meaningful | -11.241 |
proactive | -10.638 |
visually | -10.571 |
Token | Eric |
Token ID | 7651 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
Co | +10.856 |
ian | +10.327 |
B | +10.232 |
L | +10.131 |
Star | +10.058 |
Neg logit contributions | |
tremend | -14.119 |
deaf | -11.162 |
meaningful | -10.996 |
proactive | -10.256 |
vested | -10.175 |
Token | McCorm |
Token ID | 42037 |
Feature activation | +1.84e+01 |
Pos logit contributions | |
Co | +15.997 |
ian | +15.153 |
L | +14.958 |
B | +14.891 |
Star | +14.841 |
Neg logit contributions | |
tremend | -16.620 |
deaf | -13.446 |
meaningful | -13.292 |
proactive | -12.590 |
vested | -12.394 |
Token | ack |
Token ID | 441 |
Feature activation | +4.50e+00 |
Pos logit contributions | |
ian | +13.402 |
rick | +13.297 |
Co | +13.279 |
i | +13.244 |
ak | +12.857 |
Neg logit contributions | |
tremend | -35.159 |
exha | -26.836 |
misunder | -26.548 |
eleph | -26.512 |
unnecess | -26.420 |
Token |
|
Token ID | 198 |
Feature activation | +5.86e+00 |
Pos logit contributions | |
Co | +3.671 |
ian | +3.191 |
she | +3.133 |
Star | +3.130 |
B | +3.115 |
Neg logit contributions | |
tremend | -9.372 |
deaf | -8.319 |
meaningful | -8.214 |
proactive | -7.683 |
vested | -7.655 |
Token |
|
Token ID | 198 |
Feature activation | +6.67e+00 |
Pos logit contributions | |
Co | +3.658 |
L | +3.101 |
ian | +3.082 |
B | +3.072 |
she | +3.008 |
Neg logit contributions | |
tremend | -15.471 |
exha | -12.006 |
behavi | -12.001 |
undermin | -11.890 |
deaf | -11.826 |
Token | 2005 |
Token ID | 14315 |
Feature activation | +9.85e+00 |
Pos logit contributions | |
Co | +3.869 |
Star | +3.153 |
B | +3.151 |
L | +3.117 |
P | +3.076 |
Neg logit contributions | |
tremend | -15.839 |
deaf | -13.898 |
meaningful | -13.816 |
proactive | -13.079 |
visually | -12.992 |
Token | Ray |
Token ID | 7760 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
Co | +12.259 |
ian | +11.755 |
B | +11.639 |
L | +11.503 |
Star | +11.445 |
Neg logit contributions | |
tremend | -15.427 |
deaf | -11.965 |
meaningful | -11.745 |
proactive | -11.048 |
vested | -10.921 |
Token | Mac |
Token ID | 4100 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
Co | +11.282 |
ian | +10.498 |
L | +10.376 |
M | +10.311 |
P | +10.310 |
Neg logit contributions | |
tremend | -21.722 |
deaf | -15.805 |
exha | -15.796 |
behavi | -15.791 |
misunder | -15.744 |
Token |
|
Token ID | 198 |
Feature activation | +6.73e+00 |
Pos logit contributions | |
Co | +18.221 |
L | +16.979 |
B | +16.914 |
ian | +16.820 |
P | +16.745 |
Neg logit contributions | |
tremend | -17.516 |
deaf | -14.270 |
meaningful | -14.257 |
proactive | -13.364 |
personalized | -12.830 |
Token |
|
Token ID | 198 |
Feature activation | +7.55e+00 |
Pos logit contributions | |
Co | +4.036 |
L | +3.423 |
B | +3.397 |
ian | +3.393 |
she | +3.322 |
Neg logit contributions | |
tremend | -17.953 |
exha | -13.996 |
behavi | -13.951 |
undermin | -13.838 |
misunder | -13.754 |
Token | 2003 |
Token ID | 16088 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
Co | +3.561 |
Star | +2.685 |
L | +2.673 |
B | +2.548 |
P | +2.497 |
Neg logit contributions | |
tremend | -19.664 |
deaf | -16.719 |
meaningful | -16.626 |
proactive | -16.041 |
behavi | -15.844 |
Token | Eric |
Token ID | 7651 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
Co | +12.472 |
ian | +11.891 |
L | +11.692 |
B | +11.682 |
Star | +11.558 |
Neg logit contributions | |
tremend | -15.731 |
deaf | -12.156 |
meaningful | -11.928 |
proactive | -11.266 |
vested | -11.074 |
Token | McCorm |
Token ID | 42037 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
Co | +17.096 |
ian | +16.150 |
L | +16.014 |
B | +15.931 |
Star | +15.900 |
Neg logit contributions | |
tremend | -16.041 |
deaf | -12.664 |
meaningful | -12.419 |
proactive | -11.887 |
vested | -11.651 |
Token | ack |
Token ID | 441 |
Feature activation | +4.97e+00 |
Pos logit contributions | |
ian | +11.245 |
Co | +11.048 |
i | +10.948 |
rick | +10.776 |
ak | +10.750 |
Neg logit contributions | |
tremend | -36.742 |
exha | -28.783 |
eleph | -28.378 |
behavi | -28.371 |
misunder | -28.358 |
Token |
|
Token ID | 198 |
Feature activation | +5.99e+00 |
Pos logit contributions | |
Co | +5.144 |
ian | +4.604 |
Star | +4.520 |
L | +4.477 |
B | +4.471 |
Neg logit contributions | |
tremend | -9.223 |
deaf | -8.019 |
meaningful | -7.938 |
proactive | -7.432 |
vested | -7.345 |
Token |
|
Token ID | 198 |
Feature activation | +6.76e+00 |
Pos logit contributions | |
Co | +3.727 |
L | +3.152 |
B | +3.136 |
ian | +3.131 |
she | +3.064 |
Neg logit contributions | |
tremend | -15.787 |
behavi | -12.246 |
exha | -12.238 |
undermin | -12.119 |
deaf | -12.058 |
Token | 2003 |
Token ID | 16088 |
Feature activation | +9.66e+00 |
Pos logit contributions | |
Co | +3.396 |
Star | +2.610 |
L | +2.566 |
B | +2.476 |
P | +2.439 |
Neg logit contributions | |
tremend | -16.856 |
deaf | -14.783 |
meaningful | -14.689 |
proactive | -14.064 |
vested | -13.872 |
Token | Ray |
Token ID | 7760 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
Co | +12.240 |
ian | +11.634 |
B | +11.494 |
L | +11.445 |
Star | +11.326 |
Neg logit contributions | |
tremend | -14.968 |
deaf | -11.627 |
meaningful | -11.439 |
proactive | -10.786 |
vested | -10.624 |
Token | , |
Token ID | 11 |
Feature activation | +5.28e+00 |
Pos logit contributions | |
Co | +12.506 |
ian | +12.003 |
B | +11.685 |
L | +11.660 |
P | +11.528 |
Neg logit contributions | |
tremend | -27.581 |
misunder | -20.178 |
exha | -20.014 |
behavi | -19.811 |
undermin | -19.557 |
Token | Oliver |
Token ID | 15416 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
Co | +5.470 |
L | +4.941 |
ian | +4.931 |
B | +4.908 |
P | +4.831 |
Neg logit contributions | |
tremend | -10.278 |
deaf | -8.545 |
meaningful | -8.231 |
mutually | -7.645 |
proactive | -7.636 |
Token | , |
Token ID | 11 |
Feature activation | +7.97e+00 |
Pos logit contributions | |
Co | +15.227 |
ian | +14.960 |
i | +14.391 |
B | +14.142 |
- | +13.993 |
Neg logit contributions | |
tremend | -33.279 |
misunder | -24.408 |
exha | -24.364 |
undermin | -23.898 |
eleph | -23.765 |
Token | Federal |
Token ID | 5618 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
Co | +8.930 |
ian | +8.207 |
F | +7.741 |
P | +7.709 |
B | +7.703 |
Neg logit contributions | |
tremend | -15.191 |
deaf | -11.549 |
meaningful | -11.092 |
behavi | -10.743 |
unnecess | -10.707 |
Token | and |
Token ID | 290 |
Feature activation | +6.30e+00 |
Pos logit contributions | |
Co | +13.477 |
she | +12.892 |
L | +12.728 |
ian | +12.684 |
B | +12.628 |
Neg logit contributions | |
tremend | -28.007 |
misunder | -21.056 |
exha | -20.398 |
behavi | -19.997 |
undermin | -19.749 |
Token | Franklin |
Token ID | 14021 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
Co | +7.747 |
B | +6.943 |
L | +6.922 |
P | +6.915 |
Star | +6.879 |
Neg logit contributions | |
tremend | -11.307 |
deaf | -8.968 |
meaningful | -8.462 |
visually | -8.048 |
misunder | -8.041 |
Token | Streets |
Token ID | 27262 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
Co | +14.420 |
S | +13.831 |
ian | +13.689 |
Star | +13.653 |
W | +13.471 |
Neg logit contributions | |
tremend | -32.725 |
exha | -24.308 |
misunder | -23.930 |
deaf | -23.055 |
eleph | -22.875 |
Token | ), |
Token ID | 828 |
Feature activation | +6.45e+00 |
Pos logit contributions | |
Co | +3.627 |
B | +2.964 |
L | +2.845 |
uh | +2.732 |
she | +2.639 |
Neg logit contributions | |
tremend | -30.726 |
behavi | -24.828 |
exha | -24.229 |
unnecess | -24.115 |
undermin | -24.087 |
Token | the |
Token ID | 262 |
Feature activation | +6.02e+00 |
Pos logit contributions | |
Co | +12.220 |
ian | +11.740 |
L | +11.712 |
she | +11.708 |
B | +11.638 |
Neg logit contributions | |
tremend | -8.013 |
misunder | -4.346 |
exha | -4.205 |
deaf | -4.204 |
behavi | -4.126 |
Token | Stone |
Token ID | 8026 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
Co | +6.320 |
ian | +5.710 |
B | +5.686 |
she | +5.671 |
L | +5.666 |
Neg logit contributions | |
tremend | -11.773 |
deaf | -9.458 |
meaningful | -9.106 |
proactive | -8.603 |
vested | -8.567 |
Token | hurst |
Token ID | 33500 |
Feature activation | +7.94e+00 |
Pos logit contributions | |
Co | +5.815 |
she | +5.717 |
uh | +5.393 |
j | +5.377 |
L | +5.282 |
Neg logit contributions | |
tremend | -23.394 |
behavi | -18.816 |
meaningful | -18.425 |
deaf | -18.372 |
proactive | -18.277 |
Token |
|
Token ID | 198 |
Feature activation | +5.51e+00 |
Pos logit contributions | |
Co | +3.187 |
ian | +2.741 |
L | +2.692 |
she | +2.685 |
Star | +2.684 |
Neg logit contributions | |
tremend | -8.202 |
deaf | -7.284 |
meaningful | -7.170 |
visually | -6.739 |
proactive | -6.728 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
Co | +3.603 |
L | +3.049 |
ian | +3.043 |
B | +3.024 |
she | +2.976 |
Neg logit contributions | |
tremend | -14.187 |
deaf | -11.046 |
behavi | -10.990 |
exha | -10.961 |
undermin | -10.915 |
Token | 12 |
Token ID | 1065 |
Feature activation | +6.52e+00 |
Pos logit contributions | |
Co | +2.842 |
L | +2.181 |
Star | +2.120 |
ian | +2.103 |
she | +2.087 |
Neg logit contributions | |
tremend | -13.180 |
deaf | -11.940 |
meaningful | -11.732 |
vested | -11.177 |
visually | -11.136 |
Token | . |
Token ID | 13 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
Co | +4.266 |
B | +3.646 |
L | +3.628 |
ian | +3.513 |
P | +3.476 |
Neg logit contributions | |
tremend | -16.481 |
deaf | -12.969 |
meaningful | -12.783 |
behavi | -12.643 |
exha | -12.561 |
Token | Alex |
Token ID | 4422 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
Co | +5.015 |
ian | +4.564 |
L | +4.520 |
Star | +4.486 |
B | +4.481 |
Neg logit contributions | |
tremend | -6.968 |
deaf | -5.878 |
meaningful | -5.785 |
proactive | -5.350 |
vested | -5.339 |
Token | Dun |
Token ID | 5648 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
Co | +11.164 |
B | +10.383 |
ian | +10.243 |
W | +10.032 |
L | +10.021 |
Neg logit contributions | |
tremend | -23.571 |
behavi | -17.538 |
misunder | -17.026 |
meaningful | -16.961 |
proactive | -16.936 |
Token | bar |
Token ID | 5657 |
Feature activation | +8.74e+00 |
Pos logit contributions | |
B | +12.978 |
she | +12.423 |
Co | +12.308 |
j | +12.271 |
aro | +12.194 |
Neg logit contributions | |
tremend | -35.978 |
behavi | -28.181 |
exha | -27.661 |
misunder | -27.639 |
undermin | -27.144 |
Token | ( |
Token ID | 357 |
Feature activation | +8.75e+00 |
Pos logit contributions | |
Co | +8.348 |
ian | +7.749 |
B | +7.543 |
L | +7.507 |
she | +7.431 |
Neg logit contributions | |
tremend | -17.622 |
deaf | -13.582 |
meaningful | -13.329 |
behavi | -13.155 |
misunder | -13.006 |
Token | 93 |
Token ID | 6052 |
Feature activation | +8.39e+00 |
Pos logit contributions | |
Co | +5.463 |
L | +4.601 |
B | +4.562 |
she | +4.493 |
P | +4.407 |
Neg logit contributions | |
tremend | -20.961 |
deaf | -17.500 |
meaningful | -17.405 |
proactive | -16.717 |
behavi | -16.680 |
Token | ) |
Token ID | 8 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
Co | +4.736 |
B | +4.029 |
L | +4.011 |
ian | +3.950 |
P | +3.782 |
Neg logit contributions | |
tremend | -21.581 |
deaf | -17.013 |
behavi | -16.979 |
exha | -16.821 |
undermin | -16.816 |
Token | ( |
Token ID | 357 |
Feature activation | +7.70e+00 |
Pos logit contributions | |
Co | +2.932 |
ian | +2.571 |
L | +2.553 |
she | +2.546 |
B | +2.543 |
Neg logit contributions | |
tremend | -7.078 |
deaf | -5.838 |
meaningful | -5.740 |
vested | -5.420 |
proactive | -5.403 |
Token | , |
Token ID | 837 |
Feature activation | +6.33e+00 |
Pos logit contributions | |
Co | +8.317 |
B | +7.672 |
L | +7.591 |
P | +7.550 |
S | +7.184 |
Neg logit contributions | |
tremend | -24.727 |
misunder | -18.481 |
exha | -18.435 |
undermin | -18.284 |
behavi | -18.261 |
Token | c |
Token ID | 269 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
Co | +7.220 |
ian | +6.510 |
L | +6.439 |
B | +6.425 |
C | +6.391 |
Neg logit contributions | |
tremend | -11.436 |
deaf | -8.672 |
meaningful | -8.237 |
behavi | -8.216 |
misunder | -8.117 |
Token | v |
Token ID | 85 |
Feature activation | +9.97e+00 |
Pos logit contributions | |
Co | +7.205 |
j | +7.146 |
she | +6.980 |
i | +6.641 |
L | +6.495 |
Neg logit contributions | |
tremend | -28.767 |
exha | -23.421 |
behavi | -22.981 |
misunder | -22.573 |
deaf | -22.319 |
Token | 2 |
Token ID | 17 |
Feature activation | +6.99e+00 |
Pos logit contributions | |
Co | +5.417 |
L | +4.781 |
B | +4.709 |
P | +4.375 |
ian | +4.177 |
Neg logit contributions | |
tremend | -26.538 |
exha | -21.297 |
behavi | -21.143 |
undermin | -20.789 |
misunder | -20.671 |
Token | . |
Token ID | 764 |
Feature activation | +8.52e+00 |
Pos logit contributions | |
Co | +7.087 |
L | +6.477 |
B | +6.444 |
ian | +6.324 |
P | +6.311 |
Neg logit contributions | |
tremend | -15.302 |
behavi | -11.198 |
exha | -11.194 |
deaf | -11.180 |
misunder | -11.043 |
Token | COL |
Token ID | 20444 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
Co | +12.219 |
B | +11.738 |
L | +11.613 |
M | +11.365 |
P | +11.319 |
Neg logit contributions | |
tremend | -11.184 |
deaf | -9.138 |
meaningful | -8.659 |
proactive | -8.172 |
vested | -8.027 |
Token | OR |
Token ID | 1581 |
Feature activation | +8.30e+00 |
Pos logit contributions | |
B | +16.310 |
Co | +16.109 |
L | +15.727 |
U | +15.594 |
P | +15.579 |
Neg logit contributions | |
tremend | -33.961 |
behavi | -25.497 |
exha | -25.199 |
undermin | -24.475 |
deaf | -24.176 |
Token | _ |
Token ID | 62 |
Feature activation | +6.49e+00 |
Pos logit contributions | |
Co | +3.913 |
B | +3.611 |
L | +3.409 |
P | +3.263 |
J | +2.913 |
Neg logit contributions | |
tremend | -22.170 |
deaf | -17.653 |
behavi | -17.463 |
exha | -17.445 |
undermin | -17.278 |
Token | B |
Token ID | 33 |
Feature activation | +7.94e+00 |
Pos logit contributions | |
Co | +3.302 |
B | +3.054 |
L | +2.815 |
P | +2.666 |
Star | +2.515 |
Neg logit contributions | |
tremend | -16.231 |
deaf | -13.992 |
meaningful | -13.776 |
proactive | -13.255 |
vested | -13.238 |
Token | GR |
Token ID | 10761 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
Co | +3.702 |
L | +3.340 |
B | +3.136 |
P | +2.985 |
W | +2.925 |
Neg logit contributions | |
tremend | -20.546 |
deaf | -17.026 |
meaningful | -16.567 |
behavi | -16.447 |
proactive | -16.309 |
Token | 2 |
Token ID | 17 |
Feature activation | +5.41e+00 |
Pos logit contributions | |
Co | +7.520 |
B | +6.989 |
L | +6.946 |
P | +6.689 |
W | +6.496 |
Neg logit contributions | |
tremend | -25.560 |
behavi | -19.808 |
exha | -19.727 |
deaf | -19.604 |
undermin | -19.482 |
Token | � |
Token ID | 251 |
Feature activation | +8.93e+00 |
Pos logit contributions | |
B | +10.698 |
Co | +10.696 |
uh | +10.192 |
Star | +10.089 |
she | +9.992 |
Neg logit contributions | |
tremend | -23.591 |
deaf | -18.312 |
behavi | -17.638 |
meaningful | -17.512 |
misunder | -17.325 |
Token | said |
Token ID | 531 |
Feature activation | +8.30e-01 |
Pos logit contributions | |
Co | +14.221 |
she | +13.677 |
L | +13.463 |
B | +13.411 |
Star | +13.389 |
Neg logit contributions | |
tremend | -10.724 |
deaf | -8.298 |
meaningful | -8.260 |
proactive | -7.328 |
vested | -7.303 |
Token | the |
Token ID | 262 |
Feature activation | -8.66e-01 |
Pos logit contributions | |
Co | +1.830 |
ian | +1.740 |
she | +1.740 |
Star | +1.733 |
L | +1.727 |
Neg logit contributions | |
tremend | -0.593 |
deaf | -0.401 |
meaningful | -0.380 |
vested | -0.285 |
visually | -0.281 |
Token | king |
Token ID | 5822 |
Feature activation | +2.46e+00 |
Pos logit contributions | |
tremend | +1.087 |
deaf | +0.908 |
meaningful | +0.878 |
visually | +0.780 |
vested | +0.779 |
Neg logit contributions | |
Co | -1.435 |
ian | -1.335 |
she | -1.335 |
Star | -1.330 |
L | -1.316 |
Token | . |
Token ID | 13 |
Feature activation | +3.46e+00 |
Pos logit contributions | |
Co | +3.220 |
ian | +2.978 |
she | +2.960 |
Star | +2.937 |
L | +2.911 |
Neg logit contributions | |
tremend | -3.921 |
deaf | -3.366 |
meaningful | -3.298 |
vested | -3.023 |
proactive | -3.008 |
Token | � |
Token ID | 564 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
Co | +3.656 |
she | +3.272 |
ian | +3.261 |
Star | +3.249 |
L | +3.220 |
Neg logit contributions | |
tremend | -6.546 |
deaf | -5.658 |
meaningful | -5.565 |
vested | -5.188 |
proactive | -5.169 |
Token | � |
Token ID | 250 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
Co | +16.741 |
B | +15.788 |
Star | +15.624 |
P | +15.369 |
L | +15.368 |
Neg logit contributions | |
tremend | -26.091 |
deaf | -21.373 |
meaningful | -20.774 |
vested | -19.710 |
mutually | -19.442 |
Token | What |
Token ID | 2061 |
Feature activation | +5.87e+00 |
Pos logit contributions | |
Co | +9.541 |
B | +8.506 |
L | +8.503 |
Star | +8.469 |
P | +8.336 |
Neg logit contributions | |
tremend | -20.403 |
deaf | -17.001 |
meaningful | -16.932 |
vested | -15.932 |
proactive | -15.906 |
Token | does |
Token ID | 857 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
Co | +9.232 |
ian | +8.786 |
B | +8.661 |
Star | +8.659 |
L | +8.647 |
Neg logit contributions | |
tremend | -7.349 |
deaf | -5.654 |
meaningful | -5.538 |
visually | -4.918 |
vested | -4.891 |
Token | he |
Token ID | 339 |
Feature activation | -8.71e-01 |
Pos logit contributions | |
Co | +2.240 |
she | +2.085 |
ian | +2.082 |
Star | +2.073 |
L | +2.059 |
Neg logit contributions | |
tremend | -1.963 |
deaf | -1.627 |
meaningful | -1.582 |
visually | -1.426 |
vested | -1.418 |
Token | want |
Token ID | 765 |
Feature activation | -2.14e+00 |
Pos logit contributions | |
tremend | +0.946 |
deaf | +0.759 |
meaningful | +0.730 |
vested | +0.631 |
visually | +0.630 |
Neg logit contributions | |
Co | -1.596 |
ian | -1.499 |
she | -1.497 |
Star | -1.492 |
L | -1.479 |
Token | ( |
Token ID | 357 |
Feature activation | +6.31e+00 |
Pos logit contributions | |
Co | +6.091 |
ian | +5.562 |
L | +5.400 |
she | +5.394 |
B | +5.386 |
Neg logit contributions | |
tremend | -11.185 |
deaf | -9.760 |
meaningful | -9.614 |
proactive | -8.969 |
vested | -8.948 |
Token | Equ |
Token ID | 23588 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
Co | +4.082 |
L | +3.411 |
B | +3.373 |
Star | +3.369 |
P | +3.229 |
Neg logit contributions | |
tremend | -14.669 |
deaf | -13.003 |
meaningful | -12.781 |
vested | -12.107 |
proactive | -12.105 |
Token | ipe |
Token ID | 3757 |
Feature activation | +7.59e+00 |
Pos logit contributions | |
ian | +10.285 |
Co | +10.121 |
i | +9.632 |
L | +9.458 |
ix | +9.316 |
Neg logit contributions | |
tremend | -22.258 |
deaf | -19.388 |
meaningful | -18.621 |
behavi | -17.814 |
proactive | -17.250 |
Token | Cycl |
Token ID | 28007 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
Co | +9.590 |
ian | +8.721 |
L | +8.708 |
B | +8.662 |
Star | +8.649 |
Neg logit contributions | |
tremend | -11.920 |
deaf | -10.362 |
meaningful | -10.107 |
vested | -9.288 |
artificially | -9.177 |
Token | iste |
Token ID | 40833 |
Feature activation | +7.13e+00 |
Pos logit contributions | |
Co | +14.424 |
uh | +13.289 |
ian | +13.001 |
i | +12.844 |
oh | +12.699 |
Neg logit contributions | |
tremend | -26.372 |
deaf | -22.250 |
meaningful | -21.634 |
behavi | -20.703 |
proactive | -20.120 |
Token | FD |
Token ID | 30002 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
Co | +9.600 |
L | +8.775 |
Star | +8.629 |
B | +8.608 |
Smith | +8.527 |
Neg logit contributions | |
tremend | -11.066 |
deaf | -9.230 |
meaningful | -8.992 |
vested | -8.349 |
proactive | -8.240 |
Token | J |
Token ID | 41 |
Feature activation | +7.49e+00 |
Pos logit contributions | |
J | +18.405 |
Co | +17.751 |
L | +16.752 |
W | +16.533 |
j | +16.395 |
Neg logit contributions | |
tremend | -28.893 |
deaf | -24.319 |
meaningful | -22.343 |
awaru | -22.100 |
behavi | -21.619 |
Token | - |
Token ID | 532 |
Feature activation | +5.79e+00 |
Pos logit contributions | |
Co | +6.918 |
L | +6.166 |
B | +6.044 |
ian | +5.978 |
Star | +5.895 |
Neg logit contributions | |
tremend | -14.409 |
deaf | -12.773 |
meaningful | -12.416 |
vested | -11.667 |
proactive | -11.599 |
Token | Big |
Token ID | 4403 |
Feature activation | +8.72e+00 |
Pos logit contributions | |
Co | +7.717 |
L | +7.130 |
B | +7.085 |
ian | +7.079 |
Star | +7.054 |
Neg logit contributions | |
tremend | -9.110 |
deaf | -7.622 |
meaningful | -7.447 |
vested | -6.852 |
artificially | -6.801 |
Token | Mat |
Token ID | 19044 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
Co | +11.132 |
L | +10.256 |
B | +10.125 |
Star | +10.119 |
P | +10.054 |
Neg logit contributions | |
tremend | -13.757 |
deaf | -11.778 |
meaningful | -11.415 |
vested | -10.671 |
proactive | -10.667 |
Token | ) |
Token ID | 8 |
Feature activation | +3.44e+00 |
Pos logit contributions | |
Co | +15.946 |
ian | +14.900 |
L | +14.805 |
B | +14.754 |
P | +14.503 |
Neg logit contributions | |
tremend | -15.651 |
deaf | -13.084 |
meaningful | -12.416 |
vested | -11.451 |
artificially | -11.222 |
Token | 's |
Token ID | 338 |
Feature activation | -6.28e+00 |
Pos logit contributions | |
tremend | +3.494 |
deaf | +3.103 |
meaningful | +3.017 |
visually | +2.797 |
vested | +2.775 |
Neg logit contributions | |
Co | -2.837 |
she | -2.600 |
Star | -2.576 |
uh | -2.548 |
ian | -2.537 |
Token | mix |
Token ID | 5022 |
Feature activation | -7.01e+00 |
Pos logit contributions | |
tremend | +7.993 |
deaf | +6.990 |
meaningful | +6.780 |
visually | +6.118 |
proactive | +6.058 |
Neg logit contributions | |
Co | -9.626 |
she | -8.914 |
Star | -8.862 |
Smith | -8.861 |
ian | -8.859 |
Token | - |
Token ID | 12 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
tremend | +13.658 |
deaf | +12.803 |
meaningful | +12.430 |
visually | +11.892 |
artificially | +11.710 |
Neg logit contributions | |
Co | -5.234 |
she | -4.317 |
Star | -4.302 |
Smith | -4.289 |
ian | -4.180 |
Token | ups |
Token ID | 4739 |
Feature activation | -7.01e+00 |
Pos logit contributions | |
tremend | +2.998 |
deaf | +2.759 |
meaningful | +2.703 |
visually | +2.558 |
vested | +2.552 |
Neg logit contributions | |
Co | -0.823 |
ian | -0.677 |
Star | -0.674 |
she | -0.652 |
Smith | -0.644 |
Token | closely |
Token ID | 7173 |
Feature activation | -7.54e+00 |
Pos logit contributions | |
tremend | +10.403 |
deaf | +9.507 |
meaningful | +9.234 |
visually | +8.754 |
artificially | +8.557 |
Neg logit contributions | |
Co | -8.820 |
Star | -8.031 |
she | -7.926 |
Smith | -7.920 |
uh | -7.801 |
Token | resemble |
Token ID | 22464 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
tremend | +8.398 |
deaf | +7.421 |
meaningful | +7.167 |
visually | +6.611 |
vested | +6.453 |
Neg logit contributions | |
Co | -12.126 |
Star | -11.325 |
she | -11.309 |
Smith | -11.251 |
uh | -11.158 |
Token | symptoms |
Token ID | 7460 |
Feature activation | -9.01e+00 |
Pos logit contributions | |
tremend | +21.014 |
deaf | +20.646 |
meaningful | +20.093 |
those | +19.016 |
visually | +18.816 |
Neg logit contributions | |
Co | -15.057 |
she | -13.910 |
Age | -13.371 |
Smith | -13.370 |
uh | -13.346 |
Token | of |
Token ID | 286 |
Feature activation | -9.07e+00 |
Pos logit contributions | |
tremend | +12.677 |
deaf | +11.940 |
meaningful | +11.439 |
visually | +10.760 |
artificially | +10.542 |
Neg logit contributions | |
Co | -11.110 |
Star | -10.067 |
she | -10.005 |
ian | -9.882 |
Smith | -9.881 |
Token | schizophrenia |
Token ID | 22794 |
Feature activation | -2.69e+00 |
Pos logit contributions | |
tremend | +12.023 |
deaf | +11.146 |
meaningful | +10.619 |
visually | +9.822 |
artificially | +9.648 |
Neg logit contributions | |
Co | -12.216 |
she | -11.467 |
ian | -11.259 |
Star | -11.225 |
uh | -11.205 |
Token | called |
Token ID | 1444 |
Feature activation | -5.21e+00 |
Pos logit contributions | |
tremend | +4.751 |
deaf | +4.291 |
meaningful | +4.207 |
visually | +3.936 |
vested | +3.897 |
Neg logit contributions | |
Co | -2.890 |
Star | -2.603 |
she | -2.581 |
ian | -2.540 |
Smith | -2.532 |
Token | derail |
Token ID | 33749 |
Feature activation | -2.72e+00 |
Pos logit contributions | |
tremend | +7.537 |
deaf | +6.627 |
meaningful | +6.390 |
visually | +5.862 |
proactive | +5.812 |
Neg logit contributions | |
Co | -7.210 |
she | -6.698 |
Star | -6.670 |
ian | -6.660 |
uh | -6.594 |
Token | bitcoins |
Token ID | 22690 |
Feature activation | -8.11e-01 |
Pos logit contributions | |
tremend | +3.433 |
deaf | +2.945 |
meaningful | +2.878 |
vested | +2.607 |
visually | +2.591 |
Neg logit contributions | |
Co | -3.502 |
she | -3.262 |
ian | -3.239 |
Star | -3.233 |
uh | -3.208 |
Token | . |
Token ID | 13 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
tremend | +1.538 |
deaf | +1.377 |
meaningful | +1.354 |
vested | +1.270 |
visually | +1.261 |
Neg logit contributions | |
Co | -0.806 |
she | -0.722 |
Star | -0.714 |
ian | -0.713 |
uh | -0.699 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +3.27e+00 |
Pos logit contributions | |
tremend | +2.367 |
deaf | +2.114 |
meaningful | +2.077 |
vested | +1.939 |
visually | +1.930 |
Neg logit contributions | |
Co | -1.316 |
she | -1.186 |
ian | -1.180 |
Star | -1.169 |
uh | -1.153 |
Token | Their |
Token ID | 14574 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
Co | +2.366 |
ian | +1.988 |
she | +1.985 |
Star | +1.976 |
L | +1.931 |
Neg logit contributions | |
tremend | -7.196 |
deaf | -6.481 |
meaningful | -6.376 |
vested | -6.008 |
visually | -6.005 |
Token | solution |
Token ID | 4610 |
Feature activation | -6.62e+00 |
Pos logit contributions | |
tremend | +2.483 |
deaf | +2.098 |
meaningful | +2.037 |
visually | +1.827 |
vested | +1.827 |
Neg logit contributions | |
Co | -2.886 |
ian | -2.676 |
she | -2.676 |
Star | -2.665 |
uh | -2.634 |
Token | involves |
Token ID | 9018 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
tremend | +10.602 |
deaf | +9.720 |
meaningful | +9.342 |
visually | +8.880 |
vested | +8.792 |
Neg logit contributions | |
Co | -7.470 |
she | -6.763 |
Star | -6.761 |
uh | -6.703 |
Smith | -6.693 |
Token | encaps |
Token ID | 32652 |
Feature activation | -6.67e+00 |
Pos logit contributions | |
tremend | +20.948 |
deaf | +19.560 |
meaningful | +19.156 |
artificially | +18.034 |
visually | +17.964 |
Neg logit contributions | |
Co | -13.782 |
she | -12.622 |
Star | -12.461 |
uh | -12.395 |
Smith | -12.305 |
Token | ulating |
Token ID | 8306 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
tremend | +7.943 |
deaf | +6.812 |
meaningful | +6.586 |
artificially | +5.983 |
visually | +5.923 |
Neg logit contributions | |
Co | -9.929 |
Star | -9.334 |
Smith | -9.179 |
she | -9.021 |
ian | -8.994 |
Token | per |
Token ID | 583 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
tremend | +19.346 |
deaf | +18.215 |
meaningful | +18.022 |
visually | +16.598 |
purely | +16.471 |
Neg logit contributions | |
Co | -12.714 |
she | -11.856 |
uh | -11.774 |
Smith | -11.686 |
Star | -11.630 |
Token | ov |
Token ID | 709 |
Feature activation | +4.51e+00 |
Pos logit contributions | |
tremend | +4.379 |
deaf | +4.013 |
meaningful | +3.942 |
visually | +3.721 |
proactive | +3.690 |
Neg logit contributions | |
Co | -1.364 |
Star | -1.133 |
she | -1.130 |
ian | -1.102 |
Smith | -1.102 |
Token | sk |
Token ID | 8135 |
Feature activation | +4.83e+00 |
Pos logit contributions | |
Co | +2.478 |
ian | +2.057 |
she | +1.990 |
Star | +1.905 |
L | +1.904 |
Neg logit contributions | |
tremend | -10.644 |
deaf | -9.621 |
meaningful | -9.507 |
vested | -8.950 |
visually | -8.943 |
Token | choices |
Token ID | 7747 |
Feature activation | -4.11e+00 |
Pos logit contributions | |
Co | +0.463 |
ian | +0.426 |
she | +0.426 |
Star | +0.425 |
uh | +0.419 |
Neg logit contributions | |
tremend | -0.463 |
deaf | -0.397 |
meaningful | -0.387 |
visually | -0.351 |
vested | -0.350 |
Token | , |
Token ID | 11 |
Feature activation | -5.91e+00 |
Pos logit contributions | |
tremend | +6.138 |
deaf | +5.389 |
meaningful | +5.286 |
visually | +4.824 |
vested | +4.810 |
Neg logit contributions | |
Co | -5.614 |
Star | -5.133 |
she | -5.132 |
ian | -5.099 |
Smith | -5.074 |
Token | but |
Token ID | 475 |
Feature activation | -5.01e-01 |
Pos logit contributions | |
tremend | +7.298 |
deaf | +6.287 |
meaningful | +6.223 |
visually | +5.516 |
reasonable | +5.493 |
Neg logit contributions | |
Co | -9.140 |
Star | -8.544 |
ian | -8.537 |
she | -8.483 |
uh | -8.388 |
Token | also |
Token ID | 635 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
tremend | +0.628 |
deaf | +0.514 |
meaningful | +0.493 |
vested | +0.439 |
visually | +0.438 |
Neg logit contributions | |
Co | -0.839 |
ian | -0.784 |
she | -0.781 |
Star | -0.777 |
L | -0.774 |
Token | obsc |
Token ID | 10666 |
Feature activation | -4.28e+00 |
Pos logit contributions | |
tremend | +6.734 |
deaf | +5.832 |
meaningful | +5.740 |
visually | +5.175 |
vested | +5.157 |
Neg logit contributions | |
Co | -6.892 |
she | -6.378 |
Star | -6.353 |
ian | -6.334 |
uh | -6.273 |
Token | ures |
Token ID | 942 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
tremend | +5.704 |
deaf | +4.957 |
meaningful | +4.860 |
visually | +4.486 |
artificially | +4.390 |
Neg logit contributions | |
Co | -6.030 |
Star | -5.670 |
Smith | -5.598 |
she | -5.588 |
B | -5.455 |
Token | significant |
Token ID | 2383 |
Feature activation | -8.93e+00 |
Pos logit contributions | |
tremend | +19.443 |
meaningful | +19.422 |
deaf | +18.481 |
vested | +17.471 |
reasonable | +17.415 |
Neg logit contributions | |
Co | -14.435 |
Star | -13.281 |
she | -13.121 |
uh | -12.986 |
Smith | -12.624 |
Token | conflicts |
Token ID | 12333 |
Feature activation | -7.36e+00 |
Pos logit contributions | |
tremend | +12.388 |
meaningful | +11.911 |
deaf | +11.607 |
vested | +10.843 |
proactive | +10.653 |
Neg logit contributions | |
Co | -10.885 |
Star | -10.173 |
she | -9.911 |
uh | -9.818 |
Smith | -9.795 |
Token | of |
Token ID | 286 |
Feature activation | -6.03e+00 |
Pos logit contributions | |
tremend | +11.657 |
deaf | +10.548 |
meaningful | +10.544 |
visually | +9.785 |
vested | +9.752 |
Neg logit contributions | |
Co | -8.117 |
Star | -7.432 |
Smith | -7.310 |
she | -7.297 |
uh | -7.195 |
Token | interest |
Token ID | 1393 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
tremend | +4.706 |
deaf | +3.746 |
meaningful | +3.711 |
vested | +2.994 |
visually | +2.977 |
Neg logit contributions | |
Co | -12.267 |
she | -11.637 |
Star | -11.623 |
uh | -11.527 |
ian | -11.499 |
Token | in |
Token ID | 287 |
Feature activation | -6.26e+00 |
Pos logit contributions | |
tremend | +1.374 |
deaf | +1.206 |
meaningful | +1.182 |
vested | +1.091 |
visually | +1.090 |
Neg logit contributions | |
Co | -0.967 |
ian | -0.876 |
she | -0.876 |
Star | -0.873 |
uh | -0.859 |
Token |
|
Token ID | 198 |
Feature activation | +5.43e+00 |
Pos logit contributions | |
Co | +3.765 |
L | +3.210 |
B | +3.196 |
ian | +3.103 |
P | +3.103 |
Neg logit contributions | |
tremend | -14.497 |
deaf | -11.345 |
behavi | -11.272 |
exha | -11.196 |
meaningful | -11.129 |
Token | The |
Token ID | 464 |
Feature activation | -3.26e-02 |
Pos logit contributions | |
Co | +3.647 |
Star | +2.986 |
L | +2.953 |
she | +2.951 |
B | +2.938 |
Neg logit contributions | |
tremend | -12.401 |
deaf | -11.055 |
meaningful | -10.892 |
visually | -10.311 |
vested | -10.300 |
Token | trade |
Token ID | 3292 |
Feature activation | -8.68e-01 |
Pos logit contributions | |
tremend | +0.050 |
deaf | +0.042 |
meaningful | +0.041 |
visually | +0.038 |
vested | +0.038 |
Neg logit contributions | |
Co | -0.046 |
ian | -0.042 |
she | -0.042 |
Star | -0.042 |
L | -0.041 |
Token | also |
Token ID | 635 |
Feature activation | -8.23e+00 |
Pos logit contributions | |
tremend | +1.284 |
deaf | +1.109 |
meaningful | +1.081 |
visually | +0.983 |
vested | +0.982 |
Neg logit contributions | |
Co | -1.239 |
she | -1.139 |
ian | -1.139 |
Star | -1.132 |
uh | -1.120 |
Token | reun |
Token ID | 15398 |
Feature activation | -7.19e+00 |
Pos logit contributions | |
tremend | +11.127 |
deaf | +10.261 |
meaningful | +9.925 |
vested | +9.477 |
visually | +9.212 |
Neg logit contributions | |
Co | -11.075 |
Star | -10.206 |
she | -10.048 |
uh | -9.987 |
ian | -9.913 |
Token | ites |
Token ID | 2737 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
tremend | +12.677 |
meaningful | +11.408 |
deaf | +11.250 |
vested | +11.064 |
relatively | +10.676 |
Neg logit contributions | |
Co | -5.963 |
Smith | -5.260 |
Star | -5.259 |
uh | -5.178 |
Age | -5.038 |
Token | Fel |
Token ID | 13937 |
Feature activation | +3.30e+00 |
Pos logit contributions | |
tremend | +20.384 |
deaf | +19.111 |
meaningful | +18.927 |
relatively | +17.672 |
either | +17.561 |
Neg logit contributions | |
Co | -12.595 |
she | -11.677 |
uh | -11.495 |
Star | -10.982 |
ian | -10.941 |
Token | ton |
Token ID | 1122 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
Co | +2.111 |
ian | +1.741 |
she | +1.735 |
Star | +1.716 |
L | +1.666 |
Neg logit contributions | |
tremend | -7.505 |
deaf | -6.805 |
meaningful | -6.696 |
visually | -6.320 |
vested | -6.319 |
Token | and |
Token ID | 290 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
Co | +0.497 |
she | +0.457 |
ian | +0.455 |
Star | +0.453 |
uh | +0.449 |
Neg logit contributions | |
tremend | -0.559 |
deaf | -0.484 |
meaningful | -0.471 |
visually | -0.431 |
vested | -0.430 |
Token | Thomas |
Token ID | 5658 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
tremend | +6.926 |
deaf | +6.170 |
meaningful | +6.055 |
visually | +5.532 |
vested | +5.528 |
Neg logit contributions | |
Co | -5.338 |
she | -4.928 |
ian | -4.851 |
uh | -4.844 |
Star | -4.838 |
Token | with |
Token ID | 351 |
Feature activation | -6.78e+00 |
Pos logit contributions | |
Co | +4.675 |
ian | +4.322 |
she | +4.266 |
Star | +4.256 |
L | +4.237 |
Neg logit contributions | |
tremend | -5.148 |
deaf | -4.387 |
meaningful | -4.259 |
vested | -3.900 |
proactive | -3.898 |
Token | Space |
Token ID | 4687 |
Feature activation | +8.94e+00 |
Pos logit contributions | |
Co | +1.619 |
ian | +1.474 |
she | +1.470 |
Star | +1.462 |
L | +1.442 |
Neg logit contributions | |
tremend | -2.162 |
deaf | -1.879 |
meaningful | -1.828 |
visually | -1.681 |
vested | -1.680 |
Token | Sciences |
Token ID | 13473 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
Co | +10.236 |
ian | +9.447 |
B | +9.301 |
she | +9.244 |
L | +9.058 |
Neg logit contributions | |
tremend | -15.165 |
deaf | -13.034 |
meaningful | -12.200 |
visually | -11.553 |
vested | -11.427 |
Token | . |
Token ID | 13 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
Co | +5.629 |
ian | +5.183 |
she | +5.133 |
Star | +5.113 |
L | +5.103 |
Neg logit contributions | |
tremend | -6.164 |
deaf | -5.287 |
meaningful | -5.116 |
visually | -4.659 |
proactive | -4.636 |
Token | The |
Token ID | 383 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
Co | +1.814 |
ian | +1.646 |
she | +1.644 |
Star | +1.635 |
L | +1.613 |
Neg logit contributions | |
tremend | -2.534 |
deaf | -2.219 |
meaningful | -2.170 |
visually | -2.000 |
vested | -1.999 |
Token | students |
Token ID | 2444 |
Feature activation | -5.39e+00 |
Pos logit contributions | |
tremend | +0.270 |
deaf | +0.218 |
meaningful | +0.209 |
visually | +0.184 |
vested | +0.183 |
Neg logit contributions | |
Co | -0.403 |
ian | -0.377 |
she | -0.376 |
Star | -0.375 |
L | -0.373 |
Token | undertook |
Token ID | 45730 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
tremend | +9.934 |
deaf | +9.138 |
meaningful | +8.976 |
visually | +8.481 |
vested | +8.464 |
Neg logit contributions | |
Co | -5.084 |
Star | -4.518 |
she | -4.420 |
ian | -4.369 |
Smith | -4.356 |
Token | this |
Token ID | 428 |
Feature activation | -7.28e+00 |
Pos logit contributions | |
tremend | +20.789 |
meaningful | +19.231 |
deaf | +18.550 |
proactive | +17.652 |
relatively | +17.634 |
Neg logit contributions | |
Co | -12.957 |
she | -12.392 |
Star | -11.852 |
uh | -11.812 |
ian | -11.777 |
Token | project |
Token ID | 1628 |
Feature activation | -9.76e+00 |
Pos logit contributions | |
tremend | +9.872 |
deaf | +8.648 |
meaningful | +8.607 |
visually | +7.766 |
proactive | +7.765 |
Neg logit contributions | |
Co | -10.306 |
Star | -9.652 |
she | -9.627 |
ian | -9.463 |
uh | -9.453 |
Token | in |
Token ID | 287 |
Feature activation | -7.40e+00 |
Pos logit contributions | |
tremend | +13.041 |
meaningful | +12.110 |
deaf | +12.017 |
purely | +11.449 |
visually | +11.321 |
Neg logit contributions | |
Co | -12.196 |
Star | -11.344 |
she | -10.975 |
Smith | -10.958 |
uh | -10.885 |
Token | R |
Token ID | 371 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
tremend | +10.416 |
meaningful | +9.384 |
deaf | +9.379 |
proactive | +8.492 |
visually | +8.452 |
Neg logit contributions | |
Co | -9.793 |
Star | -8.983 |
she | -8.982 |
ian | -8.910 |
uh | -8.885 |
Token | enn |
Token ID | 1697 |
Feature activation | +6.09e+00 |
Pos logit contributions | |
Co | +1.474 |
ian | +1.194 |
she | +1.192 |
Star | +1.179 |
L | +1.140 |
Neg logit contributions | |
tremend | -5.739 |
deaf | -5.216 |
meaningful | -5.135 |
visually | -4.853 |
vested | -4.850 |
Token | , |
Token ID | 11 |
Feature activation | +4.77e-01 |
Pos logit contributions | |
Co | +5.305 |
she | +4.820 |
ian | +4.818 |
L | +4.760 |
B | +4.751 |
Neg logit contributions | |
tremend | -7.251 |
deaf | -6.296 |
meaningful | -6.101 |
proactive | -5.624 |
vested | -5.589 |
Token | South |
Token ID | 2520 |
Feature activation | +8.27e+00 |
Pos logit contributions | |
Co | +0.697 |
ian | +0.644 |
she | +0.643 |
Star | +0.638 |
L | +0.634 |
Neg logit contributions | |
tremend | -0.699 |
deaf | -0.593 |
meaningful | -0.576 |
vested | -0.521 |
visually | -0.520 |
Token | Carolina |
Token ID | 5913 |
Feature activation | +6.63e+00 |
Pos logit contributions | |
Co | +9.284 |
ian | +8.406 |
L | +8.372 |
Star | +8.322 |
she | +8.299 |
Neg logit contributions | |
tremend | -14.243 |
deaf | -12.176 |
meaningful | -11.720 |
visually | -10.950 |
vested | -10.916 |
Token | , |
Token ID | 11 |
Feature activation | -5.35e-01 |
Pos logit contributions | |
Co | +9.216 |
ian | +8.649 |
she | +8.527 |
L | +8.481 |
B | +8.469 |
Neg logit contributions | |
tremend | -9.672 |
deaf | -8.040 |
meaningful | -7.712 |
proactive | -7.010 |
vested | -6.929 |
Token | commemor |
Token ID | 28723 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
tremend | +0.814 |
deaf | +0.699 |
meaningful | +0.681 |
vested | +0.619 |
visually | +0.619 |
Neg logit contributions | |
Co | -0.747 |
ian | -0.687 |
she | -0.686 |
Star | -0.682 |
L | -0.675 |
Token | ates |
Token ID | 689 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
tremend | +7.765 |
deaf | +7.328 |
meaningful | +7.264 |
vested | +6.873 |
visually | +6.816 |
Neg logit contributions | |
Co | -3.290 |
Star | -2.927 |
Smith | -2.856 |
she | -2.822 |
uh | -2.709 |
Token | her |
Token ID | 607 |
Feature activation | -6.69e+00 |
Pos logit contributions | |
tremend | +18.802 |
deaf | +18.406 |
meaningful | +17.742 |
living | +16.269 |
visually | +16.188 |
Neg logit contributions | |
Co | -14.181 |
Star | -12.799 |
uh | -12.710 |
aro | -12.387 |
ian | -12.272 |
Token | birthplace |
Token ID | 48145 |
Feature activation | -3.10e+00 |
Pos logit contributions | |
tremend | +9.785 |
deaf | +8.847 |
meaningful | +8.714 |
visually | +7.908 |
vested | +7.886 |
Neg logit contributions | |
Co | -8.647 |
uh | -7.857 |
Star | -7.856 |
she | -7.847 |
Smith | -7.805 |
Token | .[ |
Token ID | 3693 |
Feature activation | +5.43e+00 |
Pos logit contributions | |
tremend | +5.205 |
deaf | +4.665 |
meaningful | +4.586 |
visually | +4.241 |
vested | +4.224 |
Neg logit contributions | |
Co | -3.642 |
Star | -3.258 |
uh | -3.230 |
ian | -3.209 |
she | -3.205 |
Token | 61 |
Token ID | 5333 |
Feature activation | +7.99e+00 |
Pos logit contributions | |
Co | +2.873 |
she | +2.247 |
Star | +2.241 |
L | +2.238 |
B | +2.233 |
Neg logit contributions | |
tremend | -12.892 |
deaf | -11.719 |
meaningful | -11.468 |
vested | -10.888 |
visually | -10.862 |
Token | ] |
Token ID | 60 |
Feature activation | +2.63e+00 |
Pos logit contributions | |
Co | +6.019 |
ian | +5.247 |
she | +5.189 |
B | +5.173 |
L | +5.114 |
Neg logit contributions | |
tremend | -16.309 |
deaf | -14.599 |
meaningful | -14.332 |
vested | -13.537 |
proactive | -13.528 |
Token | all |
Token ID | 477 |
Feature activation | -7.26e+00 |
Pos logit contributions | |
tremend | +12.028 |
deaf | +10.929 |
meaningful | +10.730 |
vested | +9.933 |
visually | +9.918 |
Neg logit contributions | |
Co | -7.998 |
Star | -7.271 |
she | -7.153 |
ian | -7.149 |
uh | -7.108 |
Token | along |
Token ID | 1863 |
Feature activation | -2.85e+00 |
Pos logit contributions | |
tremend | +9.604 |
deaf | +8.410 |
meaningful | +8.371 |
reasonable | +7.642 |
vested | +7.534 |
Neg logit contributions | |
Co | -10.325 |
Star | -9.564 |
she | -9.540 |
ian | -9.521 |
Smith | -9.484 |
Token | " |
Token ID | 1 |
Feature activation | -8.65e+00 |
Pos logit contributions | |
tremend | +4.780 |
deaf | +4.211 |
meaningful | +4.126 |
visually | +3.803 |
vested | +3.795 |
Neg logit contributions | |
Co | -3.452 |
ian | -3.123 |
Star | -3.120 |
she | -3.107 |
Smith | -3.067 |
Token | that |
Token ID | 326 |
Feature activation | -9.30e+00 |
Pos logit contributions | |
tremend | +11.741 |
deaf | +10.740 |
meaningful | +10.478 |
visually | +9.472 |
vested | +9.472 |
Neg logit contributions | |
Co | -11.198 |
Star | -10.306 |
ian | -10.250 |
uh | -10.214 |
Smith | -10.157 |
Token | WikiLeaks |
Token ID | 19766 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
tremend | +13.989 |
deaf | +12.959 |
meaningful | +12.672 |
vested | +11.571 |
reasonable | +11.551 |
Neg logit contributions | |
Co | -10.616 |
uh | -9.720 |
Star | -9.666 |
ian | -9.606 |
she | -9.503 |
Token | possesses |
Token ID | 22194 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
tremend | +2.135 |
deaf | +1.892 |
meaningful | +1.862 |
vested | +1.725 |
visually | +1.719 |
Neg logit contributions | |
Co | -1.471 |
she | -1.335 |
Star | -1.330 |
ian | -1.325 |
uh | -1.319 |
Token | classified |
Token ID | 10090 |
Feature activation | -3.19e+00 |
Pos logit contributions | |
tremend | +19.706 |
meaningful | +18.879 |
deaf | +18.298 |
reasonable | +17.360 |
vested | +17.316 |
Neg logit contributions | |
Co | -13.488 |
she | -12.531 |
Star | -12.370 |
Smith | -12.342 |
uh | -12.309 |
Token | US |
Token ID | 1294 |
Feature activation | -4.36e-01 |
Pos logit contributions | |
tremend | +3.449 |
deaf | +2.933 |
meaningful | +2.868 |
visually | +2.505 |
vested | +2.490 |
Neg logit contributions | |
Co | -5.561 |
she | -5.222 |
Star | -5.217 |
uh | -5.190 |
Smith | -5.154 |
Token | state |
Token ID | 1181 |
Feature activation | -4.15e-01 |
Pos logit contributions | |
tremend | +0.487 |
deaf | +0.405 |
meaningful | +0.396 |
visually | +0.345 |
vested | +0.344 |
Neg logit contributions | |
Co | -0.763 |
she | -0.718 |
Star | -0.713 |
ian | -0.710 |
uh | -0.709 |
Token | department |
Token ID | 5011 |
Feature activation | -2.54e-01 |
Pos logit contributions | |
tremend | +0.485 |
deaf | +0.406 |
meaningful | +0.397 |
vested | +0.348 |
visually | +0.348 |
Neg logit contributions | |
Co | -0.710 |
she | -0.666 |
Star | -0.662 |
ian | -0.661 |
uh | -0.660 |
Token | documents |
Token ID | 4963 |
Feature activation | -6.16e+00 |
Pos logit contributions | |
tremend | +0.320 |
deaf | +0.271 |
meaningful | +0.264 |
vested | +0.235 |
visually | +0.235 |
Neg logit contributions | |
Co | -0.414 |
she | -0.385 |
Star | -0.384 |
ian | -0.383 |
uh | -0.380 |
Token | the |
Token ID | 262 |
Feature activation | -4.40e+00 |
Pos logit contributions | |
tremend | +6.933 |
deaf | +6.051 |
meaningful | +5.881 |
vested | +5.313 |
visually | +5.296 |
Neg logit contributions | |
Co | -7.116 |
Star | -6.536 |
she | -6.526 |
ian | -6.525 |
uh | -6.503 |
Token | Trump |
Token ID | 1301 |
Feature activation | -2.39e+00 |
Pos logit contributions | |
tremend | +6.211 |
deaf | +5.408 |
meaningful | +5.222 |
vested | +4.743 |
visually | +4.740 |
Neg logit contributions | |
Co | -6.427 |
she | -5.912 |
ian | -5.908 |
Star | -5.884 |
uh | -5.843 |
Token | administration |
Token ID | 3662 |
Feature activation | -4.21e+00 |
Pos logit contributions | |
tremend | +3.516 |
deaf | +3.095 |
meaningful | +2.992 |
visually | +2.733 |
vested | +2.718 |
Neg logit contributions | |
Co | -3.254 |
she | -2.984 |
Star | -2.973 |
Smith | -2.968 |
uh | -2.957 |
Token | focused |
Token ID | 5670 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
tremend | +5.179 |
deaf | +4.545 |
meaningful | +4.398 |
vested | +3.972 |
visually | +3.932 |
Neg logit contributions | |
Co | -6.740 |
Star | -6.295 |
she | -6.261 |
Smith | -6.219 |
uh | -6.194 |
Token | heavily |
Token ID | 7272 |
Feature activation | -9.70e+00 |
Pos logit contributions | |
tremend | +14.336 |
deaf | +13.109 |
meaningful | +12.755 |
purely | +11.975 |
relatively | +11.829 |
Neg logit contributions | |
Co | -13.392 |
Star | -12.523 |
she | -12.438 |
ian | -12.129 |
uh | -12.121 |
Token | on |
Token ID | 319 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
tremend | +11.179 |
deaf | +10.297 |
meaningful | +9.844 |
purely | +9.068 |
visually | +8.805 |
Neg logit contributions | |
Co | -13.899 |
she | -12.944 |
Star | -12.875 |
uh | -12.688 |
Smith | -12.687 |
Token | burden |
Token ID | 10538 |
Feature activation | -7.45e+00 |
Pos logit contributions | |
tremend | +18.867 |
deaf | +18.286 |
meaningful | +17.872 |
artificially | +16.534 |
vested | +16.502 |
Neg logit contributions | |
Co | -13.855 |
she | -12.935 |
uh | -12.621 |
Star | -12.502 |
aro | -12.335 |
Token | sharing |
Token ID | 7373 |
Feature activation | -7.28e+00 |
Pos logit contributions | |
tremend | +15.863 |
deaf | +15.019 |
meaningful | +14.736 |
vested | +13.950 |
relatively | +13.890 |
Neg logit contributions | |
Co | -3.901 |
Star | -3.121 |
she | -3.106 |
uh | -3.070 |
ian | -3.062 |
Token | so |
Token ID | 523 |
Feature activation | -5.66e+00 |
Pos logit contributions | |
tremend | +10.765 |
deaf | +9.980 |
meaningful | +9.904 |
vested | +9.047 |
purely | +9.017 |
Neg logit contributions | |
Co | -8.558 |
Star | -7.913 |
she | -7.886 |
uh | -7.845 |
Smith | -7.772 |
Token | far |
Token ID | 1290 |
Feature activation | -4.94e+00 |
Pos logit contributions | |
tremend | +6.593 |
deaf | +5.582 |
meaningful | +5.423 |
visually | +4.787 |
artificially | +4.772 |
Neg logit contributions | |
Co | -9.410 |
Star | -8.864 |
she | -8.797 |
ian | -8.717 |
Smith | -8.695 |
Token | in |
Token ID | 287 |
Feature activation | -5.43e+00 |
Pos logit contributions | |
tremend | +8.217 |
deaf | +7.477 |
meaningful | +7.305 |
visually | +6.760 |
purely | +6.708 |
Neg logit contributions | |
Co | -5.698 |
she | -5.118 |
Star | -5.086 |
Smith | -5.027 |
ian | -4.993 |
Token | is |
Token ID | 318 |
Feature activation | -9.42e+00 |
Pos logit contributions | |
tremend | +8.514 |
deaf | +7.656 |
meaningful | +7.489 |
visually | +6.990 |
vested | +6.939 |
Neg logit contributions | |
Co | -5.647 |
Star | -5.074 |
she | -5.035 |
ian | -4.988 |
Smith | -4.975 |
Token | that |
Token ID | 326 |
Feature activation | -8.36e+00 |
Pos logit contributions | |
tremend | +13.705 |
deaf | +12.227 |
meaningful | +12.059 |
visually | +11.082 |
reasonable | +11.027 |
Neg logit contributions | |
Co | -11.514 |
Star | -10.636 |
she | -10.478 |
ian | -10.471 |
uh | -10.365 |
Token | the |
Token ID | 262 |
Feature activation | -7.05e+00 |
Pos logit contributions | |
tremend | +13.057 |
deaf | +11.807 |
meaningful | +11.602 |
visually | +10.701 |
vested | +10.638 |
Neg logit contributions | |
Co | -9.584 |
Star | -8.673 |
ian | -8.660 |
uh | -8.654 |
she | -8.622 |
Token | startup |
Token ID | 13693 |
Feature activation | -8.11e+00 |
Pos logit contributions | |
tremend | +10.453 |
deaf | +9.247 |
meaningful | +9.016 |
visually | +8.238 |
vested | +8.225 |
Neg logit contributions | |
Co | -9.270 |
she | -8.497 |
ian | -8.455 |
Star | -8.451 |
uh | -8.394 |
Token | momentum |
Token ID | 12858 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
tremend | +14.297 |
deaf | +12.940 |
meaningful | +12.810 |
vested | +11.976 |
relatively | +11.916 |
Neg logit contributions | |
Co | -7.455 |
uh | -6.632 |
she | -6.580 |
Star | -6.508 |
Smith | -6.478 |
Token | is |
Token ID | 318 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
tremend | +15.519 |
deaf | +14.226 |
meaningful | +14.038 |
vested | +13.141 |
relatively | +13.010 |
Neg logit contributions | |
Co | -11.135 |
uh | -10.070 |
Star | -10.038 |
she | -10.012 |
Smith | -9.918 |
Token | moving |
Token ID | 3867 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
tremend | +19.173 |
deaf | +18.013 |
meaningful | +17.741 |
relatively | +16.676 |
reasonable | +16.339 |
Neg logit contributions | |
Co | -14.696 |
Star | -13.661 |
she | -13.564 |
uh | -13.386 |
Smith | -13.315 |
Token | upwards |
Token ID | 21032 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
tremend | +15.805 |
deaf | +14.421 |
meaningful | +14.055 |
relatively | +13.343 |
visually | +13.014 |
Neg logit contributions | |
Co | -12.817 |
she | -11.962 |
Star | -11.639 |
uh | -11.609 |
ian | -11.482 |
Token | at |
Token ID | 379 |
Feature activation | -9.61e+00 |
Pos logit contributions | |
tremend | +16.139 |
deaf | +14.526 |
meaningful | +14.517 |
relatively | +13.794 |
visually | +13.721 |
Neg logit contributions | |
Co | -10.359 |
Star | -9.226 |
she | -9.183 |
Smith | -9.150 |
uh | -9.148 |
Token | an |
Token ID | 281 |
Feature activation | -6.16e+00 |
Pos logit contributions | |
tremend | +13.533 |
deaf | +12.007 |
meaningful | +11.748 |
reasonable | +10.969 |
relatively | +10.799 |
Neg logit contributions | |
Co | -12.466 |
she | -11.612 |
Star | -11.363 |
Smith | -11.340 |
uh | -11.262 |
Token | aggressive |
Token ID | 8361 |
Feature activation | -8.33e+00 |
Pos logit contributions | |
tremend | +5.750 |
deaf | +4.679 |
meaningful | +4.463 |
artificially | +3.975 |
reasonable | +3.794 |
Neg logit contributions | |
Co | -11.522 |
Star | -10.992 |
she | -10.846 |
Smith | -10.799 |
ian | -10.700 |
Token | plant |
Token ID | 4618 |
Feature activation | -7.18e+00 |
Pos logit contributions | |
Co | +17.858 |
ian | +16.938 |
she | +16.865 |
Star | +16.823 |
L | +16.749 |
Neg logit contributions | |
tremend | -7.727 |
deaf | -5.756 |
meaningful | -5.447 |
vested | -4.491 |
visually | -4.465 |
Token | � |
Token ID | 447 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
tremend | +13.403 |
deaf | +12.136 |
meaningful | +11.989 |
visually | +11.297 |
artificially | +11.186 |
Neg logit contributions | |
Co | -6.240 |
Star | -5.518 |
she | -5.431 |
uh | -5.356 |
ian | -5.320 |
Token | � |
Token ID | 247 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
Co | +1.485 |
ian | +1.287 |
she | +1.284 |
Star | +1.274 |
L | +1.248 |
Neg logit contributions | |
tremend | -3.654 |
deaf | -3.279 |
meaningful | -3.220 |
visually | -3.019 |
vested | -3.019 |
Token | s |
Token ID | 82 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
Co | +0.142 |
ian | +0.128 |
she | +0.127 |
Star | +0.127 |
uh | +0.125 |
Neg logit contributions | |
tremend | -0.215 |
deaf | -0.189 |
meaningful | -0.186 |
visually | -0.172 |
vested | -0.171 |
Token | production |
Token ID | 3227 |
Feature activation | -6.61e+00 |
Pos logit contributions | |
tremend | +7.343 |
deaf | +6.431 |
meaningful | +6.315 |
vested | +5.815 |
visually | +5.805 |
Neg logit contributions | |
Co | -5.599 |
she | -5.102 |
Star | -5.089 |
ian | -5.048 |
Smith | -5.020 |
Token | contributes |
Token ID | 22625 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
tremend | +11.183 |
deaf | +10.009 |
meaningful | +9.917 |
artificially | +9.248 |
visually | +9.175 |
Neg logit contributions | |
Co | -7.003 |
ian | -6.321 |
she | -6.311 |
Star | -6.266 |
uh | -6.214 |
Token | to |
Token ID | 284 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
tremend | +21.614 |
meaningful | +19.591 |
deaf | +19.006 |
relatively | +18.332 |
reasonable | +18.067 |
Neg logit contributions | |
Co | -11.506 |
she | -11.129 |
ian | -10.740 |
Star | -10.680 |
Smith | -10.500 |
Token | 21 |
Token ID | 2310 |
Feature activation | -5.51e+00 |
Pos logit contributions | |
tremend | +17.431 |
meaningful | +15.835 |
deaf | +15.727 |
reasonable | +14.469 |
artificially | +14.418 |
Neg logit contributions | |
Co | -11.767 |
she | -10.912 |
Star | -10.638 |
uh | -10.630 |
ian | -10.500 |
Token | % |
Token ID | 4 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
tremend | +10.572 |
deaf | +9.587 |
meaningful | +9.480 |
visually | +8.801 |
proactive | +8.798 |
Neg logit contributions | |
Co | -4.559 |
she | -4.118 |
ian | -4.112 |
Smith | -4.036 |
Star | -3.995 |
Token | of |
Token ID | 286 |
Feature activation | -5.99e+00 |
Pos logit contributions | |
tremend | +8.118 |
deaf | +7.185 |
meaningful | +7.097 |
vested | +6.528 |
visually | +6.515 |
Neg logit contributions | |
Co | -5.761 |
she | -5.283 |
Star | -5.265 |
ian | -5.258 |
uh | -5.186 |
Token | the |
Token ID | 262 |
Feature activation | -4.21e+00 |
Pos logit contributions | |
tremend | +7.618 |
deaf | +6.545 |
meaningful | +6.384 |
visually | +5.714 |
vested | +5.687 |
Neg logit contributions | |
Co | -9.299 |
she | -8.679 |
Star | -8.630 |
ian | -8.587 |
uh | -8.561 |
Token | said |
Token ID | 531 |
Feature activation | -4.24e+00 |
Pos logit contributions | |
tremend | +4.729 |
deaf | +4.129 |
meaningful | +3.990 |
vested | +3.669 |
visually | +3.659 |
Neg logit contributions | |
Co | -5.062 |
Star | -4.705 |
she | -4.682 |
ian | -4.598 |
uh | -4.595 |
Token | , |
Token ID | 11 |
Feature activation | -2.87e+00 |
Pos logit contributions | |
tremend | +7.318 |
deaf | +6.486 |
meaningful | +6.345 |
visually | +5.863 |
vested | +5.846 |
Neg logit contributions | |
Co | -4.776 |
she | -4.289 |
Star | -4.286 |
ian | -4.265 |
Smith | -4.202 |
Token | the |
Token ID | 262 |
Feature activation | -3.07e+00 |
Pos logit contributions | |
tremend | +3.092 |
deaf | +2.527 |
meaningful | +2.450 |
vested | +2.109 |
visually | +2.101 |
Neg logit contributions | |
Co | -5.189 |
she | -4.864 |
Star | -4.854 |
ian | -4.853 |
uh | -4.808 |
Token | culture |
Token ID | 3968 |
Feature activation | -4.33e+00 |
Pos logit contributions | |
tremend | +3.697 |
deaf | +3.104 |
meaningful | +3.016 |
vested | +2.663 |
visually | +2.646 |
Neg logit contributions | |
Co | -5.133 |
she | -4.793 |
ian | -4.787 |
Star | -4.775 |
uh | -4.729 |
Token | trivial |
Token ID | 20861 |
Feature activation | -7.23e+00 |
Pos logit contributions | |
tremend | +7.151 |
deaf | +6.374 |
meaningful | +6.212 |
vested | +5.721 |
visually | +5.663 |
Neg logit contributions | |
Co | -5.106 |
she | -4.662 |
Star | -4.602 |
ian | -4.577 |
uh | -4.531 |
Token | izes |
Token ID | 4340 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
tremend | +12.278 |
deaf | +10.930 |
meaningful | +10.767 |
vested | +10.072 |
visually | +10.007 |
Neg logit contributions | |
Co | -7.172 |
she | -6.481 |
Star | -6.477 |
Smith | -6.310 |
uh | -6.227 |
Token | religion |
Token ID | 5737 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
tremend | +19.000 |
meaningful | +18.294 |
deaf | +17.909 |
living | +16.683 |
everyday | +16.599 |
Neg logit contributions | |
Co | -13.150 |
she | -12.413 |
Star | -11.975 |
uh | -11.900 |
Smith | -11.708 |
Token | and |
Token ID | 290 |
Feature activation | -6.71e+00 |
Pos logit contributions | |
tremend | +6.093 |
deaf | +5.369 |
meaningful | +5.340 |
visually | +4.951 |
vested | +4.902 |
Neg logit contributions | |
Co | -3.799 |
Star | -3.401 |
she | -3.368 |
ian | -3.344 |
uh | -3.336 |
Token | normal |
Token ID | 3487 |
Feature activation | -5.83e-01 |
Pos logit contributions | |
tremend | +9.735 |
deaf | +8.696 |
meaningful | +8.513 |
vested | +7.732 |
visually | +7.710 |
Neg logit contributions | |
Co | -8.916 |
she | -8.337 |
Star | -8.137 |
uh | -8.036 |
ian | -8.027 |
Token | izes |
Token ID | 4340 |
Feature activation | -7.73e+00 |
Pos logit contributions | |
tremend | +1.166 |
deaf | +1.048 |
meaningful | +1.030 |
visually | +0.961 |
vested | +0.960 |
Neg logit contributions | |
Co | -0.526 |
she | -0.461 |
Star | -0.457 |
ian | -0.455 |
uh | -0.447 |
Token | secular |
Token ID | 14589 |
Feature activation | +7.50e-01 |
Pos logit contributions | |
tremend | +10.021 |
deaf | +8.978 |
meaningful | +8.914 |
vested | +7.904 |
reasonable | +7.902 |
Neg logit contributions | |
Co | -11.049 |
she | -10.319 |
Star | -10.205 |
Smith | -9.986 |
ian | -9.971 |
Token | results |
Token ID | 2482 |
Feature activation | -9.16e+00 |
Pos logit contributions | |
tremend | +14.415 |
meaningful | +13.130 |
deaf | +13.080 |
visually | +11.896 |
reasonable | +11.892 |
Neg logit contributions | |
Co | -10.393 |
she | -9.664 |
Star | -9.359 |
ian | -9.335 |
Smith | -9.310 |
Token | . |
Token ID | 13 |
Feature activation | -3.98e+00 |
Pos logit contributions | |
tremend | +15.568 |
meaningful | +14.581 |
deaf | +14.388 |
visually | +13.500 |
artificially | +13.418 |
Neg logit contributions | |
Co | -8.565 |
Star | -7.606 |
she | -7.474 |
Smith | -7.394 |
ian | -7.368 |
Token | Eight |
Token ID | 18087 |
Feature activation | -3.23e-01 |
Pos logit contributions | |
tremend | +7.393 |
deaf | +6.840 |
meaningful | +6.739 |
visually | +6.308 |
vested | +6.249 |
Neg logit contributions | |
Co | -3.454 |
ian | -3.098 |
she | -3.085 |
Star | -3.040 |
uh | -3.019 |
Token | city |
Token ID | 1748 |
Feature activation | -4.91e+00 |
Pos logit contributions | |
tremend | +0.552 |
deaf | +0.485 |
meaningful | +0.475 |
visually | +0.438 |
vested | +0.437 |
Neg logit contributions | |
Co | -0.388 |
ian | -0.352 |
she | -0.351 |
Star | -0.349 |
L | -0.344 |
Token | departments |
Token ID | 13346 |
Feature activation | -6.28e+00 |
Pos logit contributions | |
tremend | +9.451 |
deaf | +8.688 |
meaningful | +8.501 |
vested | +8.004 |
visually | +7.950 |
Neg logit contributions | |
Co | -4.163 |
ian | -3.642 |
she | -3.578 |
Smith | -3.567 |
uh | -3.561 |
Token | oversee |
Token ID | 19158 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
tremend | +9.584 |
deaf | +8.681 |
meaningful | +8.511 |
visually | +7.979 |
vested | +7.936 |
Neg logit contributions | |
Co | -7.530 |
Star | -6.962 |
she | -6.892 |
ian | -6.859 |
Smith | -6.815 |
Token | at |
Token ID | 379 |
Feature activation | -7.09e+00 |
Pos logit contributions | |
tremend | +20.245 |
meaningful | +19.032 |
deaf | +19.013 |
proactive | +17.602 |
relatively | +17.412 |
Neg logit contributions | |
Co | -12.446 |
she | -11.482 |
uh | -11.345 |
Smith | -10.966 |
Star | -10.962 |
Token | least |
Token ID | 1551 |
Feature activation | -3.84e+00 |
Pos logit contributions | |
tremend | +12.457 |
deaf | +11.219 |
meaningful | +11.156 |
reasonable | +10.467 |
visually | +10.353 |
Neg logit contributions | |
Co | -6.830 |
she | -6.265 |
uh | -6.017 |
Smith | -5.998 |
Star | -5.997 |
Token | 400 |
Token ID | 7337 |
Feature activation | -4.63e+00 |
Pos logit contributions | |
tremend | +4.593 |
deaf | +3.875 |
meaningful | +3.781 |
visually | +3.335 |
vested | +3.308 |
Neg logit contributions | |
Co | -6.427 |
she | -6.021 |
ian | -5.988 |
Star | -5.981 |
uh | -5.933 |
Token | contracts |
Token ID | 8592 |
Feature activation | -7.36e+00 |
Pos logit contributions | |
tremend | +7.519 |
deaf | +6.742 |
meaningful | +6.602 |
visually | +6.066 |
proactive | +6.057 |
Neg logit contributions | |
Co | -5.557 |
she | -5.073 |
Star | -5.031 |
ian | -5.023 |
uh | -4.955 |
Token | to |
Token ID | 284 |
Feature activation | -7.79e+00 |
Pos logit contributions | |
tremend | +11.725 |
deaf | +10.711 |
meaningful | +10.681 |
visually | +9.851 |
vested | +9.766 |
Neg logit contributions | |
Co | -8.064 |
she | -7.346 |
Star | -7.289 |
uh | -7.250 |
ian | -7.206 |
Token | ), |
Token ID | 828 |
Feature activation | -5.94e+00 |
Pos logit contributions | |
tremend | +5.907 |
deaf | +5.360 |
meaningful | +5.271 |
visually | +4.963 |
vested | +4.905 |
Neg logit contributions | |
Co | -2.644 |
Star | -2.330 |
she | -2.321 |
ian | -2.301 |
Smith | -2.254 |
Token | then |
Token ID | 788 |
Feature activation | -3.63e+00 |
Pos logit contributions | |
tremend | +8.604 |
deaf | +7.675 |
meaningful | +7.519 |
visually | +6.817 |
vested | +6.786 |
Neg logit contributions | |
Co | -7.924 |
Star | -7.346 |
she | -7.308 |
ian | -7.284 |
uh | -7.174 |
Token | the |
Token ID | 262 |
Feature activation | -5.41e+00 |
Pos logit contributions | |
tremend | +5.044 |
deaf | +4.358 |
meaningful | +4.243 |
visually | +3.828 |
vested | +3.813 |
Neg logit contributions | |
Co | -5.384 |
she | -4.992 |
Star | -4.990 |
ian | -4.990 |
uh | -4.907 |
Token | following |
Token ID | 1708 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
tremend | +7.973 |
deaf | +7.074 |
meaningful | +6.926 |
vested | +6.304 |
proactive | +6.276 |
Neg logit contributions | |
Co | -7.353 |
she | -6.792 |
Star | -6.742 |
ian | -6.722 |
uh | -6.655 |
Token | alignment |
Token ID | 19114 |
Feature activation | -6.55e+00 |
Pos logit contributions | |
tremend | +6.037 |
deaf | +5.289 |
meaningful | +5.208 |
proactive | +4.706 |
visually | +4.683 |
Neg logit contributions | |
Co | -6.274 |
she | -5.894 |
Star | -5.818 |
ian | -5.789 |
uh | -5.741 |
Token | becomes |
Token ID | 4329 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
tremend | +10.320 |
deaf | +9.458 |
meaningful | +9.327 |
visually | +8.736 |
vested | +8.578 |
Neg logit contributions | |
Co | -7.300 |
Star | -6.741 |
she | -6.740 |
uh | -6.566 |
Smith | -6.508 |
Token | possible |
Token ID | 1744 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
tremend | +19.273 |
meaningful | +18.675 |
deaf | +18.276 |
reasonable | +17.208 |
relatively | +16.867 |
Neg logit contributions | |
Co | -13.286 |
she | -12.756 |
Star | -12.363 |
Net | -12.044 |
ian | -11.985 |
Token | : |
Token ID | 25 |
Feature activation | -7.01e+00 |
Pos logit contributions | |
tremend | +15.363 |
deaf | +14.184 |
meaningful | +14.133 |
visually | +13.392 |
either | +13.122 |
Neg logit contributions | |
Co | -10.246 |
Star | -9.534 |
she | -9.534 |
Smith | -9.174 |
uh | -9.172 |
Token |
|
Token ID | 198 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
tremend | +12.253 |
deaf | +11.212 |
meaningful | +10.996 |
visually | +10.260 |
either | +10.232 |
Neg logit contributions | |
Co | -6.509 |
she | -6.004 |
Star | -5.909 |
ian | -5.840 |
uh | -5.776 |
Token |
|
Token ID | 198 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
Co | +1.424 |
ian | +1.216 |
she | +1.210 |
Star | +1.206 |
L | +1.200 |
Neg logit contributions | |
tremend | -3.761 |
deaf | -3.268 |
meaningful | -3.210 |
vested | -3.030 |
proactive | -3.018 |
Token | St |
Token ID | 1273 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
Co | +1.195 |
ian | +1.000 |
she | +0.998 |
Star | +0.980 |
uh | +0.953 |
Neg logit contributions | |
tremend | -4.204 |
deaf | -3.830 |
meaningful | -3.765 |
visually | -3.552 |
vested | -3.548 |
Token | Campbell |
Token ID | 14327 |
Feature activation | +2.21e+00 |
Pos logit contributions | |
tremend | +8.984 |
deaf | +8.096 |
meaningful | +7.868 |
vested | +7.194 |
visually | +7.184 |
Neg logit contributions | |
Co | -7.847 |
she | -7.206 |
ian | -7.189 |
Star | -7.151 |
uh | -7.113 |
Token | residents |
Token ID | 5085 |
Feature activation | -5.64e+00 |
Pos logit contributions | |
Co | +2.445 |
ian | +2.196 |
she | +2.193 |
Star | +2.180 |
L | +2.148 |
Neg logit contributions | |
tremend | -3.998 |
deaf | -3.527 |
meaningful | -3.454 |
visually | -3.203 |
vested | -3.202 |
Token | could |
Token ID | 714 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
tremend | +8.249 |
deaf | +7.596 |
meaningful | +7.315 |
vested | +6.768 |
visually | +6.756 |
Neg logit contributions | |
Co | -7.256 |
Star | -6.673 |
she | -6.607 |
ian | -6.551 |
Smith | -6.532 |
Token | soon |
Token ID | 2582 |
Feature activation | -6.32e+00 |
Pos logit contributions | |
tremend | +12.510 |
deaf | +11.664 |
meaningful | +10.797 |
potentially | +10.388 |
visually | +10.327 |
Neg logit contributions | |
Co | -14.880 |
Star | -14.074 |
she | -13.828 |
Smith | -13.726 |
Link | -13.453 |
Token | see |
Token ID | 766 |
Feature activation | -8.41e+00 |
Pos logit contributions | |
tremend | +6.032 |
deaf | +5.201 |
meaningful | +4.844 |
visually | +4.305 |
vested | +4.163 |
Neg logit contributions | |
Co | -11.556 |
she | -10.904 |
Star | -10.875 |
Smith | -10.748 |
ian | -10.736 |
Token | upgrades |
Token ID | 16608 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
tremend | +10.657 |
meaningful | +9.553 |
deaf | +9.529 |
vested | +8.439 |
proactive | +8.413 |
Neg logit contributions | |
Co | -12.189 |
she | -11.451 |
Star | -11.237 |
uh | -11.198 |
Smith | -11.167 |
Token | to |
Token ID | 284 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
tremend | +17.861 |
deaf | +17.137 |
meaningful | +16.943 |
either | +15.787 |
visually | +15.754 |
Neg logit contributions | |
Co | -14.223 |
Star | -12.749 |
Smith | -12.686 |
Net | -12.386 |
she | -12.340 |
Token | some |
Token ID | 617 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
tremend | +16.664 |
deaf | +15.085 |
meaningful | +14.859 |
living | +13.597 |
either | +13.559 |
Neg logit contributions | |
Co | -12.808 |
she | -12.075 |
Star | -11.630 |
uh | -11.551 |
Smith | -11.459 |
Token | city |
Token ID | 1748 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
tremend | +6.169 |
deaf | +5.455 |
meaningful | +5.315 |
vested | +4.833 |
visually | +4.811 |
Neg logit contributions | |
Co | -6.219 |
she | -5.761 |
Star | -5.720 |
ian | -5.675 |
uh | -5.640 |
Token | parks |
Token ID | 14860 |
Feature activation | -4.03e+00 |
Pos logit contributions | |
tremend | +2.627 |
deaf | +2.338 |
meaningful | +2.281 |
vested | +2.103 |
visually | +2.091 |
Neg logit contributions | |
Co | -2.091 |
she | -1.904 |
ian | -1.886 |
Star | -1.882 |
uh | -1.869 |
Token | , |
Token ID | 11 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
tremend | +6.918 |
deaf | +6.247 |
meaningful | +6.183 |
visually | +5.758 |
vested | +5.741 |
Neg logit contributions | |
Co | -4.423 |
Star | -3.973 |
she | -3.921 |
Smith | -3.915 |
ian | -3.911 |
Token | nation |
Token ID | 3277 |
Feature activation | -8.15e+00 |
Pos logit contributions | |
Co | +8.467 |
she | +7.964 |
Star | +7.936 |
ian | +7.921 |
uh | +7.877 |
Neg logit contributions | |
tremend | -4.195 |
deaf | -3.352 |
meaningful | -3.216 |
visually | -2.711 |
vested | -2.694 |
Token | , |
Token ID | 11 |
Feature activation | -8.73e+00 |
Pos logit contributions | |
tremend | +14.803 |
deaf | +13.554 |
meaningful | +13.351 |
visually | +12.557 |
vested | +12.535 |
Neg logit contributions | |
Co | -6.992 |
Smith | -6.091 |
Star | -6.022 |
uh | -5.975 |
ian | -5.900 |
Token | the |
Token ID | 262 |
Feature activation | -4.86e+00 |
Pos logit contributions | |
tremend | +13.003 |
deaf | +11.802 |
meaningful | +11.520 |
vested | +10.585 |
visually | +10.559 |
Neg logit contributions | |
Co | -10.587 |
Star | -9.661 |
ian | -9.583 |
uh | -9.564 |
she | -9.548 |
Token | new |
Token ID | 649 |
Feature activation | -4.79e+00 |
Pos logit contributions | |
tremend | +6.777 |
deaf | +5.880 |
meaningful | +5.699 |
vested | +5.154 |
visually | +5.149 |
Neg logit contributions | |
Co | -7.180 |
she | -6.626 |
ian | -6.614 |
Star | -6.596 |
uh | -6.539 |
Token | information |
Token ID | 1321 |
Feature activation | -6.46e+00 |
Pos logit contributions | |
tremend | +7.006 |
deaf | +6.181 |
meaningful | +6.004 |
vested | +5.487 |
visually | +5.478 |
Neg logit contributions | |
Co | -6.567 |
she | -6.029 |
ian | -5.996 |
Star | -5.983 |
uh | -5.969 |
Token | revealed |
Token ID | 4602 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
tremend | +10.517 |
deaf | +9.661 |
meaningful | +9.394 |
visually | +8.786 |
vested | +8.725 |
Neg logit contributions | |
Co | -7.333 |
she | -6.557 |
uh | -6.547 |
Star | -6.544 |
Smith | -6.501 |
Token | by |
Token ID | 416 |
Feature activation | -7.45e+00 |
Pos logit contributions | |
tremend | +19.809 |
deaf | +18.713 |
meaningful | +18.583 |
widespread | +17.222 |
relatively | +17.158 |
Neg logit contributions | |
Co | -12.353 |
Star | -11.114 |
Smith | -11.030 |
uh | -10.987 |
Age | -10.834 |
Token | WikiLeaks |
Token ID | 19766 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
tremend | +10.806 |
deaf | +9.722 |
meaningful | +9.388 |
vested | +8.563 |
visually | +8.534 |
Neg logit contributions | |
Co | -9.772 |
she | -9.000 |
uh | -8.944 |
ian | -8.902 |
Star | -8.880 |
Token | concerning |
Token ID | 9305 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
Co | +1.740 |
ian | +1.608 |
she | +1.596 |
Star | +1.589 |
L | +1.574 |
Neg logit contributions | |
tremend | -1.941 |
deaf | -1.662 |
meaningful | -1.614 |
vested | -1.471 |
visually | -1.469 |
Token | U |
Token ID | 471 |
Feature activation | -3.16e-01 |
Pos logit contributions | |
tremend | +15.803 |
deaf | +14.908 |
meaningful | +14.703 |
widespread | +13.544 |
vested | +13.416 |
Neg logit contributions | |
Co | -13.394 |
she | -12.332 |
uh | -12.270 |
Star | -12.233 |
Smith | -12.092 |
Token | . |
Token ID | 13 |
Feature activation | +8.16e-01 |
Pos logit contributions | |
tremend | +0.630 |
deaf | +0.572 |
meaningful | +0.562 |
visually | +0.527 |
vested | +0.523 |
Neg logit contributions | |
Co | -0.277 |
ian | -0.240 |
she | -0.240 |
Star | -0.239 |
Smith | -0.234 |
Token | icket |
Token ID | 9715 |
Feature activation | +3.81e-01 |
Pos logit contributions | |
Co | +7.703 |
ian | +7.142 |
uh | +6.903 |
she | +6.889 |
B | +6.882 |
Neg logit contributions | |
tremend | -15.403 |
deaf | -13.344 |
meaningful | -12.922 |
proactive | -12.176 |
vested | -12.155 |
Token | . |
Token ID | 13 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
Co | +0.452 |
she | +0.409 |
ian | +0.408 |
Star | +0.407 |
uh | +0.400 |
Neg logit contributions | |
tremend | -0.658 |
deaf | -0.579 |
meaningful | -0.566 |
visually | -0.524 |
vested | -0.522 |
Token | Does |
Token ID | 8314 |
Feature activation | +5.37e-01 |
Pos logit contributions | |
tremend | +3.207 |
deaf | +3.008 |
meaningful | +2.940 |
visually | +2.769 |
vested | +2.715 |
Neg logit contributions | |
Co | -1.720 |
ian | -1.530 |
she | -1.523 |
Star | -1.504 |
uh | -1.495 |
Token | the |
Token ID | 262 |
Feature activation | -3.49e+00 |
Pos logit contributions | |
Co | +0.927 |
ian | +0.868 |
she | +0.867 |
Star | +0.864 |
L | +0.856 |
Neg logit contributions | |
tremend | -0.641 |
deaf | -0.524 |
meaningful | -0.506 |
vested | -0.446 |
visually | -0.445 |
Token | show |
Token ID | 905 |
Feature activation | -2.87e+00 |
Pos logit contributions | |
tremend | +4.278 |
deaf | +3.641 |
meaningful | +3.514 |
visually | +3.133 |
vested | +3.092 |
Neg logit contributions | |
Co | -5.756 |
she | -5.348 |
ian | -5.337 |
Star | -5.319 |
uh | -5.288 |
Token | incorporate |
Token ID | 19330 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
tremend | +3.564 |
deaf | +3.010 |
meaningful | +2.929 |
visually | +2.642 |
vested | +2.580 |
Neg logit contributions | |
Co | -4.690 |
she | -4.356 |
Star | -4.341 |
ian | -4.316 |
uh | -4.290 |
Token | that |
Token ID | 326 |
Feature activation | -6.95e+00 |
Pos logit contributions | |
tremend | +18.385 |
meaningful | +17.870 |
deaf | +17.555 |
visually | +16.184 |
reasonable | +16.031 |
Neg logit contributions | |
Co | -13.492 |
she | -12.304 |
uh | -12.038 |
ian | -11.818 |
Smith | -11.673 |
Token | wild |
Token ID | 4295 |
Feature activation | -2.72e+00 |
Pos logit contributions | |
tremend | +10.427 |
deaf | +9.380 |
meaningful | +9.328 |
visually | +8.584 |
proactive | +8.437 |
Neg logit contributions | |
Co | -8.734 |
she | -8.037 |
Star | -7.974 |
uh | -7.864 |
ian | -7.771 |
Token | , |
Token ID | 11 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
tremend | +4.858 |
deaf | +4.356 |
meaningful | +4.280 |
visually | +3.978 |
proactive | +3.957 |
Neg logit contributions | |
Co | -2.918 |
she | -2.583 |
Star | -2.567 |
ian | -2.563 |
uh | -2.534 |
Token | fun |
Token ID | 1257 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
tremend | +3.197 |
deaf | +2.630 |
meaningful | +2.548 |
visually | +2.219 |
vested | +2.178 |
Neg logit contributions | |
Co | -5.401 |
she | -5.062 |
ian | -5.053 |
Star | -5.038 |
Smith | -4.990 |
Token | language |
Token ID | 3303 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
Co | +0.516 |
she | +0.476 |
ian | +0.476 |
Star | +0.475 |
uh | +0.468 |
Neg logit contributions | |
tremend | -0.487 |
deaf | -0.416 |
meaningful | -0.404 |
visually | -0.365 |
vested | -0.364 |
Token |
|
Token ID | 198 |
Feature activation | +5.74e+00 |
Pos logit contributions | |
Co | +3.755 |
L | +3.202 |
B | +3.182 |
she | +3.120 |
ian | +3.118 |
Neg logit contributions | |
tremend | -14.833 |
deaf | -11.594 |
behavi | -11.506 |
exha | -11.455 |
meaningful | -11.402 |
Token | The |
Token ID | 464 |
Feature activation | -6.05e-01 |
Pos logit contributions | |
Co | +3.776 |
Star | +3.072 |
L | +3.055 |
B | +3.040 |
she | +3.026 |
Neg logit contributions | |
tremend | -13.246 |
deaf | -11.785 |
meaningful | -11.581 |
proactive | -10.967 |
visually | -10.963 |
Token | PDF |
Token ID | 12960 |
Feature activation | -8.88e-01 |
Pos logit contributions | |
tremend | +0.673 |
deaf | +0.546 |
meaningful | +0.527 |
vested | +0.458 |
visually | +0.457 |
Neg logit contributions | |
Co | -1.090 |
ian | -1.021 |
she | -1.021 |
Star | -1.017 |
L | -1.007 |
Token | also |
Token ID | 635 |
Feature activation | -7.47e+00 |
Pos logit contributions | |
tremend | +1.325 |
deaf | +1.145 |
meaningful | +1.123 |
vested | +1.028 |
visually | +1.025 |
Neg logit contributions | |
Co | -1.240 |
she | -1.136 |
Star | -1.134 |
ian | -1.133 |
Smith | -1.121 |
Token | discl |
Token ID | 5862 |
Feature activation | -7.61e+00 |
Pos logit contributions | |
tremend | +10.835 |
deaf | +9.657 |
meaningful | +9.545 |
visually | +9.090 |
vested | +8.913 |
Neg logit contributions | |
Co | -9.391 |
Star | -8.557 |
she | -8.461 |
Smith | -8.414 |
ian | -8.309 |
Token | oses |
Token ID | 4629 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
tremend | +9.843 |
deaf | +9.683 |
meaningful | +9.350 |
visually | +8.851 |
either | +8.554 |
Neg logit contributions | |
Co | -9.277 |
Star | -8.710 |
Smith | -8.440 |
she | -8.105 |
B | -8.095 |
Token | Trump |
Token ID | 1301 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
tremend | +18.861 |
meaningful | +17.694 |
deaf | +16.956 |
vested | +16.456 |
reasonable | +16.437 |
Neg logit contributions | |
Co | -12.911 |
she | -11.976 |
Star | -11.836 |
uh | -11.794 |
Smith | -11.759 |
Token | � |
Token ID | 447 |
Feature activation | +4.32e+00 |
Pos logit contributions | |
tremend | +6.881 |
deaf | +6.228 |
meaningful | +6.149 |
vested | +5.839 |
visually | +5.797 |
Neg logit contributions | |
Co | -2.463 |
she | -2.157 |
Star | -2.151 |
ian | -2.130 |
uh | -2.119 |
Token | � |
Token ID | 247 |
Feature activation | -7.96e-01 |
Pos logit contributions | |
Co | +2.758 |
ian | +2.381 |
L | +2.285 |
she | +2.249 |
B | +2.231 |
Neg logit contributions | |
tremend | -10.121 |
deaf | -8.766 |
meaningful | -8.568 |
vested | -8.121 |
visually | -8.096 |
Token | s |
Token ID | 82 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
tremend | +1.991 |
deaf | +1.852 |
meaningful | +1.830 |
visually | +1.740 |
vested | +1.737 |
Neg logit contributions | |
Co | -0.288 |
Star | -0.196 |
ian | -0.193 |
she | -0.193 |
uh | -0.182 |
Token | investments |
Token ID | 11115 |
Feature activation | -3.85e+00 |
Pos logit contributions | |
tremend | +2.377 |
deaf | +1.966 |
meaningful | +1.913 |
vested | +1.682 |
visually | +1.662 |
Neg logit contributions | |
Co | -3.573 |
she | -3.347 |
ian | -3.342 |
Star | -3.330 |
uh | -3.309 |
Token |
|
Token ID | 198 |
Feature activation | +6.64e+00 |
Pos logit contributions | |
Co | +0.257 |
she | +0.232 |
ian | +0.230 |
Star | +0.227 |
uh | +0.224 |
Neg logit contributions | |
tremend | -0.504 |
deaf | -0.456 |
meaningful | -0.448 |
visually | -0.417 |
vested | -0.417 |
Token |
|
Token ID | 198 |
Feature activation | +6.15e+00 |
Pos logit contributions | |
Co | +4.528 |
L | +3.882 |
B | +3.866 |
P | +3.751 |
Star | +3.680 |
Neg logit contributions | |
tremend | -16.845 |
deaf | -13.175 |
exha | -12.966 |
behavi | -12.963 |
meaningful | -12.899 |
Token | The |
Token ID | 464 |
Feature activation | -6.57e-01 |
Pos logit contributions | |
Co | +4.282 |
Star | +3.496 |
L | +3.472 |
B | +3.447 |
ian | +3.433 |
Neg logit contributions | |
tremend | -14.015 |
deaf | -12.415 |
meaningful | -12.221 |
visually | -11.570 |
vested | -11.555 |
Token | following |
Token ID | 1708 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
tremend | +0.821 |
deaf | +0.681 |
meaningful | +0.659 |
visually | +0.585 |
vested | +0.584 |
Neg logit contributions | |
Co | -1.094 |
ian | -1.020 |
she | -1.019 |
Star | -1.015 |
L | -1.005 |
Token | charts |
Token ID | 15907 |
Feature activation | -5.44e+00 |
Pos logit contributions | |
tremend | +2.499 |
deaf | +2.164 |
meaningful | +2.111 |
visually | +1.917 |
vested | +1.910 |
Neg logit contributions | |
Co | -2.556 |
she | -2.371 |
ian | -2.356 |
Star | -2.350 |
uh | -2.323 |
Token | illustrate |
Token ID | 19418 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
tremend | +7.122 |
deaf | +6.303 |
meaningful | +6.201 |
visually | +5.947 |
vested | +5.707 |
Neg logit contributions | |
Co | -7.889 |
she | -7.320 |
Star | -7.297 |
Smith | -7.218 |
ian | -7.148 |
Token | the |
Token ID | 262 |
Feature activation | -7.63e+00 |
Pos logit contributions | |
tremend | +17.450 |
meaningful | +16.472 |
deaf | +15.674 |
relatively | +15.263 |
reasonable | +15.119 |
Neg logit contributions | |
Co | -13.724 |
she | -13.508 |
Smith | -13.274 |
Star | -12.990 |
She | -12.635 |
Token | H |
Token ID | 367 |
Feature activation | +5.44e-01 |
Pos logit contributions | |
tremend | +9.098 |
meaningful | +7.954 |
deaf | +7.926 |
relatively | +7.163 |
visually | +7.097 |
Neg logit contributions | |
Co | -11.578 |
she | -10.923 |
Smith | -10.889 |
Star | -10.829 |
ian | -10.712 |
Token | EC |
Token ID | 2943 |
Feature activation | +3.17e+00 |
Pos logit contributions | |
Co | +0.358 |
she | +0.303 |
Star | +0.300 |
ian | +0.297 |
Smith | +0.294 |
Neg logit contributions | |
tremend | -1.200 |
deaf | -1.092 |
meaningful | -1.078 |
visually | -1.016 |
vested | -1.007 |
Token | O |
Token ID | 46 |
Feature activation | +6.58e-01 |
Pos logit contributions | |
Co | +3.952 |
ian | +3.589 |
she | +3.570 |
Star | +3.562 |
L | +3.532 |
Neg logit contributions | |
tremend | -5.299 |
deaf | -4.625 |
meaningful | -4.508 |
visually | -4.151 |
vested | -4.150 |
Token | utilities |
Token ID | 20081 |
Feature activation | -2.95e+00 |
Pos logit contributions | |
Co | +0.950 |
she | +0.879 |
Star | +0.875 |
ian | +0.875 |
Smith | +0.865 |
Neg logit contributions | |
tremend | -0.959 |
deaf | -0.823 |
meaningful | -0.805 |
vested | -0.729 |
visually | -0.728 |
Token | is |
Token ID | 318 |
Feature activation | -9.92e+00 |
Pos logit contributions | |
Co | +0.894 |
ian | +0.825 |
she | +0.821 |
Star | +0.819 |
L | +0.809 |
Neg logit contributions | |
tremend | -0.961 |
deaf | -0.824 |
meaningful | -0.803 |
vested | -0.730 |
visually | -0.729 |
Token | a |
Token ID | 257 |
Feature activation | -6.22e+00 |
Pos logit contributions | |
tremend | +12.851 |
deaf | +11.820 |
meaningful | +11.740 |
visually | +10.773 |
relatively | +10.654 |
Neg logit contributions | |
Co | -13.244 |
she | -12.407 |
Star | -12.251 |
Smith | -12.230 |
uh | -12.197 |
Token | great |
Token ID | 1049 |
Feature activation | -2.80e+00 |
Pos logit contributions | |
tremend | +7.253 |
deaf | +6.252 |
meaningful | +6.174 |
visually | +5.476 |
proactive | +5.420 |
Neg logit contributions | |
Co | -10.166 |
she | -9.588 |
ian | -9.414 |
Star | -9.394 |
Smith | -9.367 |
Token | way |
Token ID | 835 |
Feature activation | -4.01e+00 |
Pos logit contributions | |
tremend | +3.091 |
deaf | +2.545 |
meaningful | +2.476 |
visually | +2.161 |
vested | +2.149 |
Neg logit contributions | |
Co | -5.000 |
she | -4.698 |
ian | -4.655 |
Star | -4.655 |
uh | -4.621 |
Token | to |
Token ID | 284 |
Feature activation | -9.23e+00 |
Pos logit contributions | |
tremend | +4.893 |
deaf | +4.107 |
meaningful | +3.989 |
visually | +3.583 |
vested | +3.497 |
Neg logit contributions | |
Co | -6.619 |
she | -6.163 |
ian | -6.155 |
Star | -6.123 |
uh | -6.100 |
Token | utilize |
Token ID | 17624 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
tremend | +10.398 |
deaf | +9.193 |
meaningful | +9.002 |
visually | +8.619 |
artificially | +8.201 |
Neg logit contributions | |
Co | -14.463 |
she | -13.614 |
Star | -13.445 |
uh | -13.377 |
Smith | -13.332 |
Token | a |
Token ID | 257 |
Feature activation | -6.60e+00 |
Pos logit contributions | |
tremend | +17.946 |
meaningful | +17.184 |
deaf | +16.769 |
visually | +16.025 |
proactive | +15.783 |
Neg logit contributions | |
Co | -13.810 |
she | -13.265 |
Smith | -12.502 |
uh | -12.492 |
Star | -12.374 |
Token | very |
Token ID | 845 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
tremend | +7.656 |
deaf | +6.615 |
meaningful | +6.582 |
visually | +5.900 |
proactive | +5.783 |
Neg logit contributions | |
Co | -10.739 |
she | -10.096 |
ian | -9.926 |
Star | -9.916 |
uh | -9.891 |
Token | cool |
Token ID | 3608 |
Feature activation | -3.37e+00 |
Pos logit contributions | |
tremend | +1.640 |
deaf | +1.264 |
meaningful | +1.209 |
visually | +1.000 |
vested | +0.996 |
Neg logit contributions | |
Co | -3.738 |
she | -3.529 |
ian | -3.523 |
Star | -3.515 |
uh | -3.486 |
Token | character |
Token ID | 2095 |
Feature activation | -2.97e+00 |
Pos logit contributions | |
tremend | +4.292 |
deaf | +3.706 |
meaningful | +3.636 |
visually | +3.289 |
proactive | +3.251 |
Neg logit contributions | |
Co | -5.339 |
she | -4.970 |
Star | -4.921 |
uh | -4.888 |
ian | -4.886 |
Token | . |
Token ID | 13 |
Feature activation | -2.96e+00 |
Pos logit contributions | |
tremend | +5.109 |
deaf | +4.545 |
meaningful | +4.475 |
visually | +4.187 |
vested | +4.129 |
Neg logit contributions | |
Co | -3.446 |
she | -3.102 |
Star | -3.081 |
ian | -3.050 |
uh | -3.040 |
Token | The |
Token ID | 464 |
Feature activation | +5.20e-02 |
Pos logit contributions | |
Co | +1.267 |
ian | +1.068 |
she | +1.060 |
Star | +1.033 |
uh | +1.013 |
Neg logit contributions | |
tremend | -4.304 |
deaf | -3.919 |
meaningful | -3.856 |
visually | -3.631 |
vested | -3.622 |
Token | Star |
Token ID | 2907 |
Feature activation | +4.49e+00 |
Pos logit contributions | |
Co | +0.089 |
ian | +0.084 |
she | +0.083 |
Star | +0.083 |
L | +0.083 |
Neg logit contributions | |
tremend | -0.062 |
deaf | -0.051 |
meaningful | -0.049 |
vested | -0.043 |
visually | -0.043 |
Token | Trek |
Token ID | 12338 |
Feature activation | +4.00e+00 |
Pos logit contributions | |
Co | +5.663 |
Star | +5.152 |
ian | +5.124 |
L | +5.086 |
she | +5.083 |
Neg logit contributions | |
tremend | -7.422 |
deaf | -6.451 |
meaningful | -6.286 |
vested | -5.821 |
proactive | -5.764 |
Token | universe |
Token ID | 6881 |
Feature activation | -2.16e+00 |
Pos logit contributions | |
Co | +6.052 |
ian | +5.655 |
Star | +5.642 |
she | +5.566 |
L | +5.539 |
Neg logit contributions | |
tremend | -5.582 |
deaf | -4.660 |
meaningful | -4.532 |
vested | -4.095 |
visually | -4.044 |
Token | neglect |
Token ID | 17985 |
Feature activation | -6.69e+00 |
Pos logit contributions | |
tremend | +3.695 |
deaf | +3.276 |
meaningful | +3.214 |
visually | +3.013 |
vested | +2.972 |
Neg logit contributions | |
Co | -2.499 |
she | -2.263 |
ian | -2.238 |
uh | -2.228 |
Star | -2.225 |
Token | s |
Token ID | 82 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
tremend | +15.196 |
deaf | +14.035 |
meaningful | +13.839 |
visually | +13.085 |
vested | +13.077 |
Neg logit contributions | |
Co | -3.034 |
Smith | -2.412 |
she | -2.316 |
ian | -2.306 |
Star | -2.276 |
Token | relat |
Token ID | 48993 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
tremend | +19.637 |
meaningful | +18.069 |
deaf | +17.781 |
reasonable | +16.766 |
relatively | +16.515 |
Neg logit contributions | |
Co | -12.582 |
she | -11.810 |
uh | -11.504 |
Smith | -11.434 |
ian | -11.083 |
Token | iv |
Token ID | 452 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
Co | +1.875 |
ian | +1.549 |
she | +1.513 |
Star | +1.493 |
L | +1.462 |
Neg logit contributions | |
tremend | -7.812 |
deaf | -7.083 |
meaningful | -6.947 |
vested | -6.605 |
visually | -6.592 |
Token | istic |
Token ID | 2569 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
Co | +2.367 |
ian | +2.124 |
she | +2.116 |
Star | +2.100 |
L | +2.068 |
Neg logit contributions | |
tremend | -4.237 |
deaf | -3.750 |
meaningful | -3.675 |
vested | -3.422 |
visually | -3.418 |
Token | effects |
Token ID | 3048 |
Feature activation | -6.97e+00 |
Pos logit contributions | |
tremend | +5.829 |
deaf | +5.089 |
meaningful | +4.959 |
visually | +4.431 |
reasonable | +4.427 |
Neg logit contributions | |
Co | -6.865 |
she | -6.365 |
Smith | -6.356 |
uh | -6.341 |
Star | -6.249 |
Token | . |
Token ID | 13 |
Feature activation | -3.10e+00 |
Pos logit contributions | |
tremend | +11.378 |
deaf | +10.184 |
meaningful | +10.140 |
visually | +9.407 |
purely | +9.372 |
Neg logit contributions | |
Co | -7.776 |
she | -7.023 |
Smith | -6.999 |
Star | -6.988 |
ian | -6.928 |
Token | Sciences |
Token ID | 13473 |
Feature activation | +3.75e+00 |
Pos logit contributions | |
Co | +6.475 |
ian | +5.998 |
she | +5.895 |
Smith | +5.828 |
L | +5.806 |
Neg logit contributions | |
tremend | -13.764 |
deaf | -11.252 |
meaningful | -10.866 |
proactive | -10.430 |
vested | -10.394 |
Token | in |
Token ID | 287 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
Co | +5.870 |
ian | +5.467 |
she | +5.429 |
L | +5.409 |
B | +5.383 |
Neg logit contributions | |
tremend | -4.993 |
deaf | -4.190 |
meaningful | -4.048 |
proactive | -3.639 |
visually | -3.624 |
Token | Memory |
Token ID | 14059 |
Feature activation | +2.28e+00 |
Pos logit contributions | |
tremend | +0.258 |
deaf | +0.223 |
meaningful | +0.217 |
vested | +0.203 |
proactive | +0.203 |
Neg logit contributions | |
Co | -0.138 |
ian | -0.124 |
she | -0.123 |
Star | -0.123 |
L | -0.122 |
Token | of |
Token ID | 286 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
Co | +2.779 |
ian | +2.558 |
she | +2.528 |
L | +2.524 |
B | +2.511 |
Neg logit contributions | |
tremend | -4.110 |
deaf | -3.351 |
meaningful | -3.255 |
proactive | -3.037 |
vested | -3.034 |
Token | Alfred |
Token ID | 22044 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
tremend | +2.761 |
deaf | +2.395 |
meaningful | +2.333 |
vested | +2.110 |
visually | +2.107 |
Neg logit contributions | |
Co | -2.864 |
Star | -2.642 |
she | -2.635 |
ian | -2.615 |
Smith | -2.598 |
Token | Nobel |
Token ID | 20715 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
Co | +12.311 |
ian | +12.170 |
L | +11.763 |
B | +11.737 |
P | +11.628 |
Neg logit contributions | |
tremend | -19.837 |
deaf | -15.163 |
behavi | -14.837 |
exha | -14.486 |
undermin | -14.430 |
Token |
|
Token ID | 198 |
Feature activation | +4.93e+00 |
Pos logit contributions | |
Co | +19.279 |
ian | +18.450 |
B | +18.152 |
L | +18.137 |
j | +17.918 |
Neg logit contributions | |
tremend | -15.138 |
deaf | -12.333 |
meaningful | -11.591 |
proactive | -10.581 |
reasonable | -10.425 |
Token |
|
Token ID | 198 |
Feature activation | +4.79e+00 |
Pos logit contributions | |
Co | +3.391 |
L | +2.856 |
B | +2.845 |
ian | +2.824 |
she | +2.817 |
Neg logit contributions | |
tremend | -12.318 |
deaf | -9.790 |
meaningful | -9.612 |
behavi | -9.490 |
exha | -9.400 |
Token | A |
Token ID | 32 |
Feature activation | +2.52e+00 |
Pos logit contributions | |
Co | +3.425 |
she | +2.847 |
ian | +2.846 |
Star | +2.831 |
L | +2.815 |
Neg logit contributions | |
tremend | -10.620 |
deaf | -9.512 |
meaningful | -9.353 |
visually | -8.829 |
proactive | -8.820 |
Token | ward |
Token ID | 904 |
Feature activation | +5.97e+00 |
Pos logit contributions | |
Co | +3.849 |
ian | +3.597 |
she | +3.574 |
Star | +3.550 |
L | +3.544 |
Neg logit contributions | |
tremend | -3.451 |
deaf | -2.900 |
meaningful | -2.811 |
vested | -2.535 |
proactive | -2.526 |
Token | ed |
Token ID | 276 |
Feature activation | -7.26e-01 |
Pos logit contributions | |
Co | +8.601 |
ian | +8.019 |
she | +7.912 |
L | +7.906 |
Star | +7.864 |
Neg logit contributions | |
tremend | -8.485 |
deaf | -7.131 |
meaningful | -6.817 |
proactive | -6.255 |
visually | -6.197 |
Token |
|
Token ID | 198 |
Feature activation | +8.37e+00 |
Pos logit contributions | |
Co | +4.546 |
ian | +4.045 |
she | +4.034 |
L | +4.000 |
B | +3.998 |
Neg logit contributions | |
tremend | -8.079 |
deaf | -6.971 |
meaningful | -6.836 |
vested | -6.328 |
proactive | -6.327 |
Token |
|
Token ID | 198 |
Feature activation | +7.78e+00 |
Pos logit contributions | |
Co | +4.866 |
L | +4.169 |
B | +4.145 |
ian | +3.966 |
P | +3.949 |
Neg logit contributions | |
tremend | -22.154 |
exha | -17.416 |
behavi | -17.255 |
undermin | -17.195 |
misunder | -17.004 |
Token | Ser |
Token ID | 7089 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
Co | +5.083 |
B | +4.208 |
L | +4.196 |
Star | +4.097 |
she | +4.029 |
Neg logit contributions | |
tremend | -17.989 |
deaf | -15.748 |
meaningful | -15.588 |
proactive | -14.758 |
vested | -14.695 |
Token | hi |
Token ID | 5303 |
Feature activation | +5.19e+00 |
Pos logit contributions | |
Co | +13.462 |
ian | +13.073 |
uh | +12.710 |
she | +12.618 |
B | +12.568 |
Neg logit contributions | |
tremend | -19.017 |
deaf | -16.053 |
meaningful | -15.714 |
proactive | -14.688 |
vested | -14.527 |
Token | y |
Token ID | 88 |
Feature activation | +7.28e+00 |
Pos logit contributions | |
Co | +5.839 |
ian | +5.376 |
she | +5.289 |
uh | +5.238 |
L | +5.200 |
Neg logit contributions | |
tremend | -9.211 |
deaf | -8.047 |
meaningful | -7.856 |
vested | -7.280 |
proactive | -7.246 |
Token | Kaz |
Token ID | 16385 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
Co | +9.464 |
ian | +8.888 |
she | +8.779 |
uh | +8.687 |
B | +8.684 |
Neg logit contributions | |
tremend | -11.258 |
deaf | -9.571 |
meaningful | -9.326 |
vested | -8.585 |
proactive | -8.556 |
Token | arov |
Token ID | 42737 |
Feature activation | +9.34e+00 |
Pos logit contributions | |
ian | +19.267 |
uh | +18.879 |
Co | +18.851 |
she | +18.497 |
oy | +18.062 |
Neg logit contributions | |
tremend | -20.853 |
deaf | -16.913 |
meaningful | -16.084 |
behavi | -15.864 |
proactive | -15.186 |
Token | , |
Token ID | 11 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
Co | +13.532 |
ian | +12.701 |
she | +12.452 |
B | +12.383 |
L | +12.335 |
Neg logit contributions | |
tremend | -12.704 |
deaf | -10.417 |
meaningful | -10.207 |
proactive | -9.182 |
visually | -9.072 |
Token | former |
Token ID | 1966 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
Co | +2.558 |
ian | +2.396 |
she | +2.384 |
Star | +2.376 |
L | +2.366 |
Neg logit contributions | |
tremend | -1.708 |
deaf | -1.373 |
meaningful | -1.328 |
vested | -1.157 |
visually | -1.153 |
Token | head |
Token ID | 1182 |
Feature activation | +2.31e+00 |
Pos logit contributions | |
Co | +5.740 |
ian | +5.361 |
Star | +5.282 |
she | +5.277 |
L | +5.276 |
Neg logit contributions | |
tremend | -5.034 |
deaf | -4.105 |
meaningful | -3.980 |
vested | -3.554 |
visually | -3.544 |
Token | of |
Token ID | 286 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
Co | +2.951 |
ian | +2.730 |
she | +2.701 |
Star | +2.687 |
L | +2.664 |
Neg logit contributions | |
tremend | -3.780 |
deaf | -3.253 |
meaningful | -3.183 |
vested | -2.918 |
proactive | -2.918 |
Token | familiar |
Token ID | 5385 |
Feature activation | +3.97e+00 |
Pos logit contributions | |
Co | +6.909 |
ian | +6.495 |
she | +6.421 |
Star | +6.407 |
L | +6.404 |
Neg logit contributions | |
tremend | -5.382 |
deaf | -4.382 |
meaningful | -4.238 |
visually | -3.759 |
proactive | -3.758 |
Token | with |
Token ID | 351 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
Co | +5.058 |
ian | +4.856 |
L | +4.721 |
she | +4.649 |
B | +4.647 |
Neg logit contributions | |
tremend | -6.978 |
deaf | -5.354 |
meaningful | -5.174 |
misunder | -4.921 |
behavi | -4.811 |
Token | the |
Token ID | 262 |
Feature activation | -4.19e-01 |
Pos logit contributions | |
tremend | +1.948 |
deaf | +1.456 |
meaningful | +1.385 |
vested | +1.090 |
visually | +1.084 |
Neg logit contributions | |
Co | -5.285 |
she | -5.011 |
ian | -5.001 |
Star | -4.988 |
uh | -4.952 |
Token | negotiations |
Token ID | 9825 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
tremend | +0.481 |
deaf | +0.389 |
meaningful | +0.375 |
visually | +0.328 |
vested | +0.328 |
Neg logit contributions | |
Co | -0.744 |
ian | -0.698 |
she | -0.696 |
Star | -0.694 |
L | -0.688 |
Token | . |
Token ID | 13 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
tremend | +2.874 |
deaf | +2.589 |
meaningful | +2.542 |
visually | +2.378 |
vested | +2.372 |
Neg logit contributions | |
Co | -1.368 |
she | -1.208 |
ian | -1.193 |
Star | -1.191 |
Smith | -1.171 |
Token | � |
Token ID | 564 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
Co | +2.774 |
ian | +2.500 |
she | +2.494 |
Star | +2.482 |
L | +2.455 |
Neg logit contributions | |
tremend | -4.225 |
deaf | -3.680 |
meaningful | -3.599 |
visually | -3.332 |
vested | -3.332 |
Token | � |
Token ID | 250 |
Feature activation | +6.55e+00 |
Pos logit contributions | |
Co | +13.215 |
B | +11.967 |
L | +11.833 |
Star | +11.802 |
ian | +11.688 |
Neg logit contributions | |
tremend | -22.268 |
deaf | -19.397 |
meaningful | -18.882 |
vested | -17.721 |
visually | -17.685 |
Token | Especially |
Token ID | 48464 |
Feature activation | +4.80e+00 |
Pos logit contributions | |
Co | +5.439 |
B | +4.635 |
she | +4.630 |
L | +4.613 |
Star | +4.604 |
Neg logit contributions | |
tremend | -13.888 |
deaf | -12.165 |
meaningful | -11.921 |
visually | -11.260 |
proactive | -11.244 |
Token | in |
Token ID | 287 |
Feature activation | -3.00e+00 |
Pos logit contributions | |
Co | +8.352 |
B | +7.822 |
ian | +7.820 |
L | +7.771 |
Star | +7.718 |
Neg logit contributions | |
tremend | -5.458 |
deaf | -4.122 |
meaningful | -3.820 |
vested | -3.505 |
proactive | -3.418 |
Token | an |
Token ID | 281 |
Feature activation | -7.98e-01 |
Pos logit contributions | |
tremend | +2.912 |
deaf | +2.330 |
meaningful | +2.238 |
visually | +1.901 |
vested | +1.874 |
Neg logit contributions | |
Co | -5.763 |
she | -5.441 |
ian | -5.419 |
Star | -5.410 |
uh | -5.383 |
Token | election |
Token ID | 3071 |
Feature activation | +2.87e+00 |
Pos logit contributions | |
tremend | +0.999 |
deaf | +0.833 |
meaningful | +0.807 |
visually | +0.718 |
vested | +0.715 |
Neg logit contributions | |
Co | -1.323 |
ian | -1.233 |
she | -1.232 |
Star | -1.229 |
L | -1.215 |
Token | esh |
Token ID | 5069 |
Feature activation | +9.11e+00 |
Pos logit contributions | |
Co | +17.877 |
uh | +16.625 |
she | +16.605 |
L | +16.275 |
oy | +16.225 |
Neg logit contributions | |
tremend | -17.624 |
deaf | -14.513 |
meaningful | -13.688 |
vested | -12.943 |
proactive | -12.768 |
Token | ama |
Token ID | 1689 |
Feature activation | +7.58e+00 |
Pos logit contributions | |
Co | +13.757 |
she | +12.920 |
ian | +12.912 |
uh | +12.868 |
L | +12.755 |
Neg logit contributions | |
tremend | -11.503 |
deaf | -9.429 |
meaningful | -9.076 |
vested | -8.137 |
proactive | -8.113 |
Token | and |
Token ID | 290 |
Feature activation | +6.04e-01 |
Pos logit contributions | |
Co | +10.856 |
she | +10.058 |
ian | +10.008 |
B | +9.974 |
L | +9.949 |
Neg logit contributions | |
tremend | -10.612 |
deaf | -8.917 |
meaningful | -8.662 |
vested | -7.866 |
proactive | -7.841 |
Token | Rabbi |
Token ID | 31807 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
Co | +0.933 |
ian | +0.866 |
she | +0.865 |
Star | +0.861 |
L | +0.853 |
Neg logit contributions | |
tremend | -0.828 |
deaf | -0.698 |
meaningful | -0.678 |
vested | -0.609 |
visually | -0.609 |
Token | Leon |
Token ID | 10592 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
Co | +14.878 |
she | +14.010 |
L | +13.944 |
ian | +13.929 |
B | +13.894 |
Neg logit contributions | |
tremend | -16.604 |
deaf | -13.033 |
meaningful | -12.465 |
proactive | -11.554 |
personalized | -11.465 |
Token | Wi |
Token ID | 11759 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
Co | +15.967 |
ian | +15.510 |
i | +15.218 |
she | +14.959 |
B | +14.881 |
Neg logit contributions | |
tremend | -15.979 |
deaf | -13.038 |
meaningful | -12.527 |
vested | -11.711 |
proactive | -11.566 |
Token | ener |
Token ID | 877 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
Co | +17.312 |
L | +16.645 |
uh | +16.504 |
ian | +16.300 |
B | +16.291 |
Neg logit contributions | |
tremend | -18.617 |
deaf | -15.158 |
meaningful | -14.904 |
vested | -13.621 |
proactive | -13.577 |
Token | Dow |
Token ID | 21842 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
Co | +17.113 |
ian | +16.343 |
uh | +16.078 |
B | +16.023 |
she | +15.996 |
Neg logit contributions | |
tremend | -14.492 |
deaf | -12.139 |
meaningful | -11.502 |
vested | -10.460 |
proactive | -10.334 |
Token | of |
Token ID | 286 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
Co | +21.437 |
ian | +20.617 |
she | +20.255 |
uh | +20.203 |
B | +20.175 |
Neg logit contributions | |
tremend | -16.214 |
deaf | -13.271 |
meaningful | -12.711 |
vested | -11.408 |
proactive | -11.376 |
Token | the |
Token ID | 262 |
Feature activation | +2.74e+00 |
Pos logit contributions | |
Co | +2.623 |
she | +2.447 |
ian | +2.444 |
Star | +2.431 |
L | +2.418 |
Neg logit contributions | |
tremend | -1.925 |
deaf | -1.567 |
meaningful | -1.516 |
vested | -1.343 |
visually | -1.339 |
Token | Shal |
Token ID | 47974 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
Co | +3.843 |
she | +3.538 |
ian | +3.518 |
Star | +3.505 |
L | +3.490 |
Neg logit contributions | |
tremend | -4.137 |
deaf | -3.493 |
meaningful | -3.397 |
vested | -3.110 |
visually | -3.087 |
Token | nut |
Token ID | 14930 |
Feature activation | +7.28e+00 |
Pos logit contributions | |
Co | +7.677 |
ian | +6.766 |
Star | +6.703 |
she | +6.659 |
L | +6.586 |
Neg logit contributions | |
tremend | -16.222 |
deaf | -14.228 |
meaningful | -13.991 |
vested | -13.121 |
proactive | -13.028 |
Token | Brewery |
Token ID | 31003 |
Feature activation | +3.87e+00 |
Pos logit contributions | |
Co | +9.962 |
B | +9.073 |
L | +9.023 |
ian | +8.990 |
Star | +8.942 |
Neg logit contributions | |
tremend | -10.885 |
deaf | -9.205 |
meaningful | -8.947 |
vested | -8.261 |
proactive | -8.158 |
Token | in |
Token ID | 287 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
Co | +6.080 |
she | +5.608 |
ian | +5.607 |
Star | +5.594 |
L | +5.555 |
Neg logit contributions | |
tremend | -5.206 |
deaf | -4.362 |
meaningful | -4.210 |
vested | -3.785 |
visually | -3.763 |
Token | Boulder |
Token ID | 27437 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
tremend | +3.228 |
deaf | +2.831 |
meaningful | +2.773 |
visually | +2.534 |
vested | +2.525 |
Neg logit contributions | |
Co | -2.814 |
she | -2.576 |
ian | -2.574 |
Star | -2.564 |
uh | -2.537 |
Token | , |
Token ID | 11 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
Co | +14.946 |
ian | +13.892 |
L | +13.668 |
B | +13.664 |
uh | +13.530 |
Neg logit contributions | |
tremend | -14.205 |
deaf | -11.583 |
meaningful | -11.089 |
proactive | -10.197 |
vested | -10.054 |
Token | Colo |
Token ID | 41943 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
Co | +2.167 |
ian | +1.956 |
she | +1.941 |
Star | +1.924 |
B | +1.915 |
Neg logit contributions | |
tremend | -3.257 |
deaf | -2.843 |
meaningful | -2.778 |
visually | -2.566 |
vested | -2.564 |
Token | ., |
Token ID | 1539 |
Feature activation | +3.19e+00 |
Pos logit contributions | |
Co | +20.882 |
L | +19.348 |
uh | +19.208 |
B | +19.171 |
ian | +19.150 |
Neg logit contributions | |
tremend | -22.027 |
deaf | -18.051 |
meaningful | -17.714 |
vested | -16.514 |
proactive | -16.451 |
Token | on |
Token ID | 319 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
Co | +5.095 |
ian | +4.759 |
she | +4.736 |
Star | +4.706 |
L | +4.698 |
Neg logit contributions | |
tremend | -4.235 |
deaf | -3.412 |
meaningful | -3.307 |
vested | -2.976 |
proactive | -2.953 |
Token | Tuesday |
Token ID | 3431 |
Feature activation | +5.20e+00 |
Pos logit contributions | |
tremend | +1.923 |
deaf | +1.664 |
meaningful | +1.623 |
visually | +1.480 |
vested | +1.479 |
Neg logit contributions | |
Co | -1.710 |
ian | -1.569 |
she | -1.568 |
Star | -1.560 |
L | -1.541 |
Token | . |
Token ID | 13 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
Co | +5.624 |
ian | +5.085 |
she | +5.038 |
Star | +5.003 |
L | +5.002 |
Neg logit contributions | |
tremend | -9.476 |
deaf | -8.178 |
meaningful | -7.999 |
vested | -7.441 |
proactive | -7.424 |
Token | ( |
Token ID | 357 |
Feature activation | +8.85e+00 |
Pos logit contributions | |
Co | +1.214 |
ian | +1.086 |
she | +1.082 |
Star | +1.076 |
uh | +1.057 |
Neg logit contributions | |
tremend | -2.183 |
deaf | -1.950 |
meaningful | -1.909 |
visually | -1.777 |
vested | -1.773 |
Token | the |
Token ID | 262 |
Feature activation | -2.57e+00 |
Pos logit contributions | |
tremend | +8.407 |
deaf | +7.348 |
meaningful | +7.191 |
visually | +6.534 |
proactive | +6.441 |
Neg logit contributions | |
Co | -8.235 |
she | -7.630 |
Smith | -7.600 |
ian | -7.524 |
uh | -7.495 |
Token | game |
Token ID | 983 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
tremend | +3.567 |
deaf | +3.050 |
meaningful | +2.968 |
visually | +2.684 |
vested | +2.658 |
Neg logit contributions | |
Co | -3.886 |
she | -3.599 |
ian | -3.595 |
Star | -3.568 |
Smith | -3.546 |
Token | � |
Token ID | 447 |
Feature activation | +8.34e+00 |
Pos logit contributions | |
Co | +2.163 |
ian | +1.972 |
she | +1.972 |
Star | +1.959 |
L | +1.937 |
Neg logit contributions | |
tremend | -2.812 |
deaf | -2.446 |
meaningful | -2.386 |
vested | -2.196 |
visually | -2.185 |
Token | � |
Token ID | 247 |
Feature activation | +4.32e+00 |
Pos logit contributions | |
Co | +3.983 |
ian | +3.381 |
B | +3.314 |
L | +3.313 |
uh | +3.242 |
Neg logit contributions | |
tremend | -20.114 |
deaf | -17.022 |
meaningful | -16.350 |
behavi | -15.974 |
misunder | -15.877 |
Token | s |
Token ID | 82 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
Co | +4.329 |
she | +3.890 |
ian | +3.853 |
Star | +3.818 |
L | +3.779 |
Neg logit contributions | |
tremend | -8.225 |
deaf | -7.306 |
meaningful | -7.130 |
vested | -6.653 |
visually | -6.627 |
Token | � |
Token ID | 564 |
Feature activation | +9.49e+00 |
Pos logit contributions | |
Co | +2.363 |
ian | +2.211 |
Star | +2.206 |
she | +2.201 |
L | +2.184 |
Neg logit contributions | |
tremend | -1.798 |
deaf | -1.480 |
meaningful | -1.420 |
vested | -1.273 |
visually | -1.253 |
Token | � |
Token ID | 250 |
Feature activation | +4.41e+00 |
Pos logit contributions | |
Co | +6.099 |
B | +5.343 |
L | +5.249 |
Star | +5.229 |
ian | +5.132 |
Neg logit contributions | |
tremend | -20.378 |
deaf | -17.383 |
meaningful | -16.789 |
behavi | -16.175 |
vested | -16.135 |
Token | Live |
Token ID | 18947 |
Feature activation | +4.63e+00 |
Pos logit contributions | |
Co | +4.247 |
Star | +3.750 |
she | +3.749 |
ian | +3.712 |
L | +3.689 |
Neg logit contributions | |
tremend | -8.610 |
deaf | -7.647 |
meaningful | -7.501 |
vested | -7.024 |
visually | -6.994 |
Token | Quest |
Token ID | 6785 |
Feature activation | +3.08e+00 |
Pos logit contributions | |
Co | +5.597 |
Star | +5.159 |
ian | +5.153 |
L | +5.066 |
she | +5.033 |
Neg logit contributions | |
tremend | -7.746 |
deaf | -6.811 |
meaningful | -6.530 |
vested | -6.092 |
visually | -6.027 |
Token | Mode |
Token ID | 10363 |
Feature activation | +2.60e+00 |
Pos logit contributions | |
Co | +3.077 |
ian | +2.729 |
she | +2.721 |
Star | +2.702 |
L | +2.679 |
Neg logit contributions | |
tremend | -5.879 |
deaf | -5.237 |
meaningful | -5.113 |
vested | -4.788 |
visually | -4.754 |
Token | . |
Token ID | 13 |
Feature activation | +7.89e-01 |
Pos logit contributions | |
Co | +3.005 |
ian | +2.711 |
she | +2.710 |
Star | +2.689 |
L | +2.664 |
Neg logit contributions | |
tremend | -4.559 |
deaf | -4.005 |
meaningful | -3.911 |
vested | -3.621 |
visually | -3.611 |
Token | ). |
Token ID | 737 |
Feature activation | +3.50e+00 |
Pos logit contributions | |
Co | +4.670 |
ian | +4.174 |
Star | +4.114 |
she | +4.096 |
L | +4.088 |
Neg logit contributions | |
tremend | -8.258 |
deaf | -7.281 |
meaningful | -7.068 |
vested | -6.642 |
visually | -6.601 |
Token | Wall |
Token ID | 22401 |
Feature activation | +9.77e+00 |
Pos logit contributions | |
Co | +3.360 |
ian | +2.955 |
she | +2.946 |
Star | +2.932 |
L | +2.895 |
Neg logit contributions | |
tremend | -6.866 |
deaf | -6.111 |
meaningful | -5.989 |
vested | -5.603 |
visually | -5.589 |
Token | Paper |
Token ID | 42950 |
Feature activation | +5.64e+00 |
Pos logit contributions | |
Co | +10.420 |
P | +9.266 |
B | +9.185 |
L | +9.149 |
Star | +9.098 |
Neg logit contributions | |
tremend | -17.030 |
deaf | -15.077 |
meaningful | -14.390 |
vested | -13.725 |
proactive | -13.430 |
Token | if |
Token ID | 611 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
Co | +7.485 |
L | +6.792 |
B | +6.765 |
P | +6.698 |
ian | +6.692 |
Neg logit contributions | |
tremend | -9.020 |
deaf | -7.734 |
meaningful | -7.410 |
vested | -6.904 |
proactive | -6.815 |
Token | ( |
Token ID | 357 |
Feature activation | +5.23e+00 |
Pos logit contributions | |
Co | +1.134 |
ian | +1.014 |
she | +1.012 |
Star | +1.006 |
L | +0.992 |
Neg logit contributions | |
tremend | -1.995 |
deaf | -1.765 |
meaningful | -1.728 |
vested | -1.607 |
visually | -1.606 |
Token | Test |
Token ID | 14402 |
Feature activation | +7.07e+00 |
Pos logit contributions | |
Co | +6.326 |
L | +5.690 |
she | +5.685 |
ian | +5.679 |
Star | +5.657 |
Neg logit contributions | |
tremend | -8.897 |
deaf | -7.692 |
meaningful | -7.503 |
vested | -6.980 |
proactive | -6.955 |
Token | - |
Token ID | 12 |
Feature activation | +5.45e+00 |
Pos logit contributions | |
Co | +8.372 |
L | +7.501 |
B | +7.469 |
ian | +7.467 |
Star | +7.441 |
Neg logit contributions | |
tremend | -12.116 |
deaf | -10.466 |
meaningful | -10.070 |
vested | -9.468 |
proactive | -9.432 |
Token | Path |
Token ID | 15235 |
Feature activation | +7.54e+00 |
Pos logit contributions | |
Co | +3.004 |
Star | +2.300 |
B | +2.269 |
L | +2.269 |
she | +2.235 |
Neg logit contributions | |
tremend | -12.894 |
deaf | -11.781 |
meaningful | -11.529 |
visually | -10.993 |
vested | -10.967 |
Token | - |
Token ID | 532 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
Co | +11.663 |
L | +10.768 |
Star | +10.708 |
she | +10.701 |
B | +10.671 |
Neg logit contributions | |
tremend | -9.902 |
deaf | -8.193 |
meaningful | -7.665 |
proactive | -7.075 |
vested | -7.043 |
Token | Path |
Token ID | 15235 |
Feature activation | +9.20e+00 |
Pos logit contributions | |
Co | +2.805 |
ian | +2.373 |
she | +2.373 |
Star | +2.367 |
L | +2.330 |
Neg logit contributions | |
tremend | -7.727 |
deaf | -6.947 |
meaningful | -6.812 |
vested | -6.424 |
visually | -6.419 |
Token | $ |
Token ID | 720 |
Feature activation | +7.50e+00 |
Pos logit contributions | |
Co | +13.917 |
L | +12.940 |
P | +12.798 |
B | +12.764 |
she | +12.742 |
Neg logit contributions | |
tremend | -11.854 |
deaf | -9.832 |
meaningful | -9.022 |
proactive | -8.433 |
vested | -8.385 |
Token | in |
Token ID | 287 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
Co | +1.714 |
ian | +1.591 |
she | +1.589 |
Star | +1.582 |
L | +1.566 |
Neg logit contributions | |
tremend | -1.504 |
deaf | -1.269 |
meaningful | -1.232 |
vested | -1.106 |
visually | -1.106 |
Token | a |
Token ID | 257 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
tremend | +2.325 |
deaf | +1.818 |
meaningful | +1.756 |
visually | +1.443 |
vested | +1.432 |
Neg logit contributions | |
Co | -5.039 |
she | -4.785 |
ian | -4.764 |
Star | -4.746 |
uh | -4.706 |
Token | furious |
Token ID | 21799 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
tremend | +1.696 |
deaf | +1.420 |
meaningful | +1.379 |
visually | +1.224 |
vested | +1.220 |
Neg logit contributions | |
Co | -2.207 |
she | -2.058 |
ian | -2.056 |
Star | -2.047 |
uh | -2.025 |
Token | fourth |
Token ID | 5544 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
tremend | +2.767 |
deaf | +2.402 |
meaningful | +2.347 |
visually | +2.091 |
vested | +2.074 |
Neg logit contributions | |
Co | -3.302 |
she | -3.087 |
Star | -3.053 |
ian | -3.041 |
uh | -3.022 |
Token | - |
Token ID | 12 |
Feature activation | +5.38e+00 |
Pos logit contributions | |
Co | +5.129 |
ian | +4.745 |
Star | +4.697 |
B | +4.681 |
L | +4.674 |
Neg logit contributions | |
tremend | -5.124 |
deaf | -4.283 |
meaningful | -4.111 |
vested | -3.795 |
visually | -3.771 |
Token | quarter |
Token ID | 24385 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
Co | +5.254 |
she | +4.645 |
ian | +4.623 |
B | +4.614 |
Star | +4.603 |
Neg logit contributions | |
tremend | -10.460 |
deaf | -9.171 |
meaningful | -8.901 |
vested | -8.441 |
proactive | -8.406 |
Token | comeback |
Token ID | 21933 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
Co | +7.016 |
ian | +6.637 |
Star | +6.543 |
L | +6.543 |
B | +6.540 |
Neg logit contributions | |
tremend | -4.733 |
deaf | -3.734 |
meaningful | -3.564 |
vested | -3.182 |
visually | -3.162 |
Token | . |
Token ID | 13 |
Feature activation | -1.99e-01 |
Pos logit contributions | |
tremend | +3.259 |
deaf | +2.880 |
meaningful | +2.838 |
visually | +2.573 |
vested | +2.569 |
Neg logit contributions | |
Co | -2.770 |
she | -2.540 |
Star | -2.501 |
ian | -2.499 |
uh | -2.466 |
Token | But |
Token ID | 887 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
tremend | +0.362 |
deaf | +0.327 |
meaningful | +0.319 |
visually | +0.297 |
vested | +0.295 |
Neg logit contributions | |
Co | -0.207 |
she | -0.187 |
ian | -0.186 |
Star | -0.185 |
uh | -0.182 |
Token | New |
Token ID | 968 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
Co | +2.459 |
ian | +2.300 |
she | +2.286 |
Smith | +2.276 |
Star | +2.275 |
Neg logit contributions | |
tremend | -1.678 |
deaf | -1.341 |
meaningful | -1.297 |
vested | -1.151 |
visually | -1.143 |
Token | Mexico |
Token ID | 5828 |
Feature activation | +6.99e+00 |
Pos logit contributions | |
Co | +5.683 |
ian | +5.251 |
she | +5.248 |
Star | +5.195 |
L | +5.146 |
Neg logit contributions | |
tremend | -6.387 |
deaf | -5.247 |
meaningful | -5.113 |
vested | -4.684 |
visually | -4.646 |
Token | : |
Token ID | 25 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
tremend | +2.413 |
deaf | +2.134 |
meaningful | +2.087 |
visually | +1.926 |
vested | +1.916 |
Neg logit contributions | |
Co | -1.736 |
ian | -1.566 |
she | -1.564 |
Star | -1.564 |
uh | -1.538 |
Token | step |
Token ID | 2239 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
tremend | +5.636 |
deaf | +4.999 |
meaningful | +4.905 |
visually | +4.454 |
proactive | +4.433 |
Neg logit contributions | |
Co | -4.696 |
Star | -4.295 |
ian | -4.294 |
she | -4.292 |
Smith | -4.215 |
Token | it |
Token ID | 340 |
Feature activation | -4.19e+00 |
Pos logit contributions | |
Co | +2.439 |
ian | +2.299 |
she | +2.286 |
Star | +2.285 |
B | +2.271 |
Neg logit contributions | |
tremend | -1.367 |
deaf | -1.074 |
meaningful | -1.031 |
vested | -0.889 |
visually | -0.888 |
Token | up |
Token ID | 510 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
tremend | +4.050 |
deaf | +3.454 |
meaningful | +3.300 |
vested | +2.796 |
visually | +2.794 |
Neg logit contributions | |
Co | -7.721 |
she | -7.259 |
Star | -7.251 |
ian | -7.170 |
Smith | -7.151 |
Token | . |
Token ID | 13 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
tremend | +2.796 |
deaf | +2.498 |
meaningful | +2.453 |
visually | +2.287 |
vested | +2.274 |
Neg logit contributions | |
Co | -1.456 |
she | -1.298 |
ian | -1.295 |
Star | -1.287 |
uh | -1.260 |
Token |
|
Token ID | 198 |
Feature activation | +8.63e+00 |
Pos logit contributions | |
tremend | +0.243 |
deaf | +0.220 |
meaningful | +0.216 |
visually | +0.202 |
vested | +0.201 |
Neg logit contributions | |
Co | -0.117 |
she | -0.104 |
ian | -0.104 |
Star | -0.103 |
uh | -0.101 |
Token |
|
Token ID | 198 |
Feature activation | +8.26e+00 |
Pos logit contributions | |
Co | +5.483 |
L | +4.784 |
B | +4.773 |
P | +4.589 |
ian | +4.552 |
Neg logit contributions | |
tremend | -22.354 |
exha | -17.400 |
behavi | -17.253 |
undermin | -17.215 |
misunder | -17.016 |
Token | And |
Token ID | 1870 |
Feature activation | +3.31e+00 |
Pos logit contributions | |
Co | +6.607 |
B | +5.574 |
Star | +5.562 |
L | +5.549 |
Smith | +5.436 |
Neg logit contributions | |
tremend | -17.938 |
deaf | -15.497 |
meaningful | -15.244 |
proactive | -14.436 |
vested | -14.432 |
Token | so |
Token ID | 523 |
Feature activation | +6.34e+00 |
Pos logit contributions | |
Co | +6.158 |
ian | +5.816 |
she | +5.778 |
Star | +5.749 |
B | +5.730 |
Neg logit contributions | |
tremend | -3.506 |
deaf | -2.637 |
meaningful | -2.554 |
vested | -2.195 |
proactive | -2.164 |
Token | it |
Token ID | 340 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
Co | +11.501 |
ian | +10.792 |
B | +10.779 |
Star | +10.744 |
L | +10.723 |
Neg logit contributions | |
tremend | -6.521 |
deaf | -4.761 |
meaningful | -4.512 |
artificially | -3.885 |
visually | -3.858 |
Token | went |
Token ID | 1816 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
tremend | +2.432 |
deaf | +2.144 |
meaningful | +2.095 |
visually | +1.937 |
vested | +1.937 |
Neg logit contributions | |
Co | -1.750 |
she | -1.586 |
Star | -1.583 |
ian | -1.583 |
L | -1.553 |
Token | der |
Token ID | 4587 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
tremend | +1.893 |
deaf | +1.512 |
meaningful | +1.452 |
visually | +1.244 |
vested | +1.239 |
Neg logit contributions | |
Co | -3.471 |
she | -3.262 |
ian | -3.260 |
Star | -3.252 |
L | -3.222 |
Token | anged |
Token ID | 5102 |
Feature activation | -7.98e+00 |
Pos logit contributions | |
Co | +1.008 |
ian | +0.896 |
she | +0.892 |
Star | +0.884 |
L | +0.873 |
Neg logit contributions | |
tremend | -1.942 |
deaf | -1.724 |
meaningful | -1.690 |
vested | -1.576 |
visually | -1.575 |
Token | . |
Token ID | 13 |
Feature activation | +7.56e-01 |
Pos logit contributions | |
tremend | +13.220 |
deaf | +12.357 |
meaningful | +12.033 |
visually | +11.568 |
purely | +11.228 |
Neg logit contributions | |
Co | -7.998 |
Star | -7.099 |
she | -7.095 |
Smith | -6.987 |
uh | -6.972 |
Token | There |
Token ID | 1318 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
Co | +0.741 |
ian | +0.657 |
she | +0.655 |
Star | +0.651 |
uh | +0.642 |
Neg logit contributions | |
tremend | -1.446 |
deaf | -1.298 |
meaningful | -1.273 |
visually | -1.189 |
vested | -1.185 |
Token | � |
Token ID | 447 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
Co | +3.093 |
she | +2.822 |
ian | +2.805 |
Star | +2.749 |
L | +2.744 |
Neg logit contributions | |
tremend | -4.991 |
deaf | -4.360 |
meaningful | -4.285 |
vested | -3.969 |
proactive | -3.944 |
Token | � |
Token ID | 247 |
Feature activation | +5.11e+00 |
Pos logit contributions | |
Co | +6.878 |
B | +5.971 |
uh | +5.879 |
L | +5.858 |
she | +5.850 |
Neg logit contributions | |
tremend | -21.142 |
deaf | -18.542 |
meaningful | -18.208 |
vested | -17.422 |
proactive | -17.187 |
Token | s |
Token ID | 82 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
Co | +8.278 |
she | +7.790 |
ian | +7.750 |
Star | +7.661 |
L | +7.647 |
Neg logit contributions | |
tremend | -6.506 |
deaf | -5.391 |
meaningful | -5.227 |
vested | -4.688 |
proactive | -4.630 |
Token | a |
Token ID | 257 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
Co | +2.201 |
ian | +2.090 |
she | +2.084 |
Star | +2.073 |
L | +2.064 |
Neg logit contributions | |
tremend | -0.897 |
deaf | -0.659 |
meaningful | -0.622 |
vested | -0.508 |
visually | -0.504 |
Token | side |
Token ID | 1735 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
tremend | +1.568 |
deaf | +1.264 |
meaningful | +1.216 |
visually | +1.053 |
vested | +1.052 |
Neg logit contributions | |
Co | -2.619 |
ian | -2.457 |
she | -2.455 |
Star | -2.446 |
L | -2.425 |
Token | table |
Token ID | 3084 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
Co | +3.122 |
she | +2.926 |
ian | +2.907 |
Star | +2.885 |
B | +2.879 |
Neg logit contributions | |
tremend | -2.538 |
deaf | -2.106 |
meaningful | -2.048 |
visually | -1.824 |
vested | -1.821 |
Token | shaped |
Token ID | 14292 |
Feature activation | -5.08e+00 |
Pos logit contributions | |
Co | +0.924 |
ian | +0.860 |
she | +0.859 |
Star | +0.854 |
L | +0.847 |
Neg logit contributions | |
tremend | -0.764 |
deaf | -0.639 |
meaningful | -0.620 |
vested | -0.554 |
visually | -0.554 |
Token | box |
Token ID | 3524 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
tremend | +3.744 |
deaf | +3.379 |
meaningful | +3.368 |
visually | +3.123 |
proactive | +3.123 |
Neg logit contributions | |
Co | -1.726 |
she | -1.508 |
ian | -1.504 |
Smith | -1.498 |
Star | -1.496 |
Token | to |
Token ID | 284 |
Feature activation | -5.39e+00 |
Pos logit contributions | |
tremend | +2.749 |
deaf | +2.369 |
meaningful | +2.339 |
visually | +2.143 |
proactive | +2.111 |
Neg logit contributions | |
Co | -2.650 |
she | -2.440 |
Star | -2.439 |
ian | -2.428 |
Smith | -2.419 |
Token | accomplish |
Token ID | 9989 |
Feature activation | -7.05e+00 |
Pos logit contributions | |
tremend | +5.999 |
deaf | +5.047 |
meaningful | +4.917 |
visually | +4.432 |
artificially | +4.291 |
Neg logit contributions | |
Co | -9.250 |
she | -8.692 |
ian | -8.667 |
Star | -8.638 |
Smith | -8.579 |
Token | the |
Token ID | 262 |
Feature activation | -5.43e+00 |
Pos logit contributions | |
tremend | +8.170 |
meaningful | +6.987 |
deaf | +6.917 |
visually | +6.139 |
proactive | +6.126 |
Neg logit contributions | |
Co | -11.328 |
she | -10.680 |
Star | -10.582 |
Smith | -10.558 |
ian | -10.530 |
Token | same |
Token ID | 976 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
tremend | +4.408 |
deaf | +3.414 |
meaningful | +3.303 |
visually | +2.711 |
proactive | +2.648 |
Neg logit contributions | |
Co | -11.061 |
Star | -10.439 |
she | -10.434 |
ian | -10.397 |
Smith | -10.348 |
Token | thing |
Token ID | 1517 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
tremend | +0.598 |
deaf | +0.496 |
meaningful | +0.477 |
vested | +0.425 |
visually | +0.424 |
Neg logit contributions | |
Co | -0.769 |
ian | -0.719 |
she | -0.716 |
Star | -0.711 |
L | -0.708 |
Token | . |
Token ID | 13 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
tremend | +8.134 |
deaf | +7.253 |
meaningful | +7.214 |
visually | +6.820 |
artificially | +6.687 |
Neg logit contributions | |
Co | -4.381 |
Star | -3.927 |
she | -3.880 |
ian | -3.825 |
uh | -3.809 |
Token | The |
Token ID | 383 |
Feature activation | -1.97e-01 |
Pos logit contributions | |
tremend | +3.503 |
deaf | +3.231 |
meaningful | +3.175 |
visually | +2.969 |
vested | +2.952 |
Neg logit contributions | |
Co | -1.819 |
she | -1.639 |
ian | -1.622 |
Star | -1.604 |
uh | -1.603 |
Token | news |
Token ID | 1705 |
Feature activation | +6.66e-01 |
Pos logit contributions | |
tremend | +0.229 |
deaf | +0.186 |
meaningful | +0.179 |
vested | +0.157 |
visually | +0.157 |
Neg logit contributions | |
Co | -0.345 |
ian | -0.323 |
she | -0.323 |
Star | -0.321 |
L | -0.319 |
Token | feed |
Token ID | 12363 |
Feature activation | +3.36e+00 |
Pos logit contributions | |
Co | +1.099 |
ian | +1.024 |
she | +1.023 |
Star | +1.019 |
L | +1.009 |
Neg logit contributions | |
tremend | -0.841 |
deaf | -0.700 |
meaningful | -0.678 |
visually | -0.603 |
vested | -0.602 |
Token | , |
Token ID | 11 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
Co | +5.382 |
ian | +5.001 |
she | +4.998 |
Star | +4.971 |
L | +4.944 |
Neg logit contributions | |
tremend | -4.347 |
deaf | -3.624 |
meaningful | -3.495 |
vested | -3.102 |
visually | -3.089 |
Token | . |
Token ID | 13 |
Feature activation | -5.40e-01 |
Pos logit contributions | |
tremend | +8.135 |
deaf | +7.338 |
meaningful | +7.210 |
visually | +6.766 |
vested | +6.637 |
Neg logit contributions | |
Co | -5.916 |
she | -5.270 |
Star | -5.252 |
ian | -5.235 |
Smith | -5.222 |
Token | Not |
Token ID | 1892 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
tremend | +1.021 |
deaf | +0.922 |
meaningful | +0.905 |
visually | +0.846 |
vested | +0.842 |
Neg logit contributions | |
Co | -0.526 |
ian | -0.468 |
she | -0.468 |
Star | -0.463 |
uh | -0.455 |
Token | confirmed |
Token ID | 4999 |
Feature activation | +9.28e-02 |
Pos logit contributions | |
Co | +3.783 |
ian | +3.564 |
Star | +3.547 |
she | +3.544 |
L | +3.523 |
Neg logit contributions | |
tremend | -1.913 |
deaf | -1.481 |
meaningful | -1.398 |
vested | -1.197 |
visually | -1.186 |
Token | but |
Token ID | 475 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
Co | +0.132 |
ian | +0.122 |
she | +0.122 |
Star | +0.121 |
uh | +0.120 |
Neg logit contributions | |
tremend | -0.138 |
deaf | -0.118 |
meaningful | -0.115 |
visually | -0.105 |
vested | -0.105 |
Token | that |
Token ID | 326 |
Feature activation | +6.97e-01 |
Pos logit contributions | |
Co | +0.588 |
she | +0.551 |
ian | +0.551 |
Star | +0.548 |
L | +0.545 |
Neg logit contributions | |
tremend | -0.393 |
deaf | -0.317 |
meaningful | -0.304 |
vested | -0.267 |
visually | -0.266 |
Token | may |
Token ID | 743 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
Co | +0.898 |
ian | +0.820 |
she | +0.818 |
Star | +0.814 |
L | +0.806 |
Neg logit contributions | |
tremend | -1.135 |
deaf | -0.984 |
meaningful | -0.960 |
vested | -0.881 |
visually | -0.879 |
Token | mean |
Token ID | 1612 |
Feature activation | -8.02e-01 |
Pos logit contributions | |
tremend | +0.236 |
deaf | +0.182 |
meaningful | +0.175 |
vested | +0.150 |
proactive | +0.149 |
Neg logit contributions | |
Co | -0.438 |
ian | -0.413 |
she | -0.411 |
Star | -0.410 |
uh | -0.409 |
Token | they |
Token ID | 484 |
Feature activation | -4.27e+00 |
Pos logit contributions | |
tremend | +0.780 |
deaf | +0.606 |
meaningful | +0.578 |
vested | +0.488 |
visually | +0.487 |
Neg logit contributions | |
Co | -1.562 |
she | -1.471 |
ian | -1.471 |
Star | -1.466 |
L | -1.455 |
Token | will |
Token ID | 481 |
Feature activation | -5.68e+00 |
Pos logit contributions | |
tremend | +5.921 |
deaf | +5.203 |
meaningful | +5.030 |
visually | +4.638 |
vested | +4.628 |
Neg logit contributions | |
Co | -6.203 |
Star | -5.705 |
ian | -5.699 |
she | -5.685 |
Smith | -5.664 |
Token | only |
Token ID | 691 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
tremend | +5.805 |
deaf | +4.914 |
meaningful | +4.688 |
visually | +4.224 |
artificially | +4.072 |
Neg logit contributions | |
Co | -10.064 |
she | -9.443 |
Star | -9.432 |
Smith | -9.376 |
ian | -9.355 |
Token | carry |
Token ID | 3283 |
Feature activation | -2.71e+00 |
Pos logit contributions | |
tremend | +2.275 |
deaf | +1.824 |
meaningful | +1.752 |
visually | +1.509 |
vested | +1.503 |
Neg logit contributions | |
Co | -4.064 |
ian | -3.816 |
she | -3.815 |
Star | -3.803 |
uh | -3.766 |
Token | ters |
Token ID | 1010 |
Feature activation | -3.84e-01 |
Pos logit contributions | |
Co | +7.999 |
she | +7.780 |
ian | +7.403 |
L | +7.386 |
Smith | +7.232 |
Neg logit contributions | |
tremend | -15.949 |
deaf | -12.882 |
meaningful | -12.371 |
behavi | -12.176 |
vested | -11.978 |
Token | laughed |
Token ID | 13818 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
tremend | +0.588 |
deaf | +0.510 |
meaningful | +0.497 |
visually | +0.455 |
vested | +0.453 |
Neg logit contributions | |
Co | -0.529 |
she | -0.485 |
ian | -0.484 |
Star | -0.483 |
L | -0.476 |
Token | : |
Token ID | 25 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
tremend | +4.773 |
deaf | +4.281 |
meaningful | +4.175 |
visually | +3.864 |
reasonable | +3.820 |
Neg logit contributions | |
Co | -3.192 |
she | -2.899 |
Star | -2.874 |
ian | -2.861 |
uh | -2.829 |
Token | � |
Token ID | 564 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
tremend | +2.495 |
deaf | +2.201 |
meaningful | +2.150 |
visually | +1.981 |
vested | +1.967 |
Neg logit contributions | |
Co | -1.830 |
ian | -1.663 |
she | -1.657 |
Star | -1.656 |
Smith | -1.627 |
Token | � |
Token ID | 250 |
Feature activation | +4.76e+00 |
Pos logit contributions | |
Co | +10.591 |
Star | +9.454 |
she | +9.439 |
B | +9.427 |
ian | +9.426 |
Neg logit contributions | |
tremend | -21.332 |
deaf | -18.327 |
meaningful | -18.016 |
vested | -17.259 |
artificially | -16.897 |
Token | You |
Token ID | 1639 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
Co | +3.805 |
she | +3.281 |
ian | +3.247 |
Star | +3.239 |
L | +3.190 |
Neg logit contributions | |
tremend | -10.111 |
deaf | -9.030 |
meaningful | -8.886 |
vested | -8.365 |
visually | -8.348 |
Token | thought |
Token ID | 1807 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
Co | +1.650 |
ian | +1.543 |
she | +1.540 |
Star | +1.534 |
L | +1.531 |
Neg logit contributions | |
tremend | -1.275 |
deaf | -1.036 |
meaningful | -1.013 |
vested | -0.902 |
proactive | -0.893 |
Token | people |
Token ID | 661 |
Feature activation | -4.29e+00 |
Pos logit contributions | |
Co | +0.411 |
ian | +0.387 |
she | +0.386 |
Star | +0.384 |
L | +0.382 |
Neg logit contributions | |
tremend | -0.254 |
deaf | -0.200 |
meaningful | -0.193 |
vested | -0.168 |
visually | -0.167 |
Token | knew |
Token ID | 2993 |
Feature activation | -4.92e+00 |
Pos logit contributions | |
tremend | +6.055 |
deaf | +5.426 |
meaningful | +5.240 |
visually | +4.779 |
vested | +4.742 |
Neg logit contributions | |
Co | -6.144 |
Star | -5.625 |
she | -5.610 |
ian | -5.588 |
Smith | -5.547 |
Token | what |
Token ID | 644 |
Feature activation | -3.13e+00 |
Pos logit contributions | |
tremend | +6.799 |
deaf | +6.021 |
meaningful | +5.858 |
visually | +5.335 |
vested | +5.274 |
Neg logit contributions | |
Co | -7.096 |
she | -6.560 |
Star | -6.551 |
ian | -6.540 |
Smith | -6.491 |
Token | was |
Token ID | 373 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
tremend | +5.034 |
deaf | +4.457 |
meaningful | +4.358 |
vested | +3.993 |
visually | +3.988 |
Neg logit contributions | |
Co | -3.968 |
she | -3.609 |
ian | -3.607 |
Star | -3.601 |
Smith | -3.561 |
Token | EW |
Token ID | 6217 |
Feature activation | +4.83e+00 |
Pos logit contributions | |
Co | +0.210 |
she | +0.180 |
Star | +0.179 |
ian | +0.179 |
Smith | +0.174 |
Neg logit contributions | |
tremend | -0.563 |
deaf | -0.508 |
meaningful | -0.500 |
visually | -0.470 |
vested | -0.467 |
Token | ILL |
Token ID | 8267 |
Feature activation | +3.62e+00 |
Pos logit contributions | |
Co | +6.551 |
L | +6.036 |
B | +5.973 |
she | +5.970 |
ian | +5.970 |
Neg logit contributions | |
tremend | -7.416 |
deaf | -6.393 |
meaningful | -6.238 |
proactive | -5.658 |
vested | -5.655 |
Token | NOT |
Token ID | 11929 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
Co | +5.551 |
she | +5.167 |
ian | +5.150 |
Star | +5.123 |
L | +5.119 |
Neg logit contributions | |
tremend | -4.972 |
deaf | -4.183 |
meaningful | -4.055 |
vested | -3.633 |
proactive | -3.628 |
Token | DIV |
Token ID | 33569 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
tremend | +3.165 |
deaf | +2.860 |
meaningful | +2.802 |
visually | +2.628 |
vested | +2.608 |
Neg logit contributions | |
Co | -1.454 |
ian | -1.289 |
Star | -1.282 |
she | -1.268 |
Smith | -1.251 |
Token | IDE |
Token ID | 14114 |
Feature activation | -2.54e+00 |
Pos logit contributions | |
Co | +2.901 |
ian | +2.555 |
she | +2.533 |
Star | +2.516 |
L | +2.499 |
Neg logit contributions | |
tremend | -6.314 |
deaf | -5.603 |
meaningful | -5.508 |
visually | -5.149 |
vested | -5.146 |
Token | . |
Token ID | 13 |
Feature activation | -7.07e-01 |
Pos logit contributions | |
tremend | +4.886 |
deaf | +4.417 |
meaningful | +4.338 |
visually | +4.078 |
vested | +4.052 |
Neg logit contributions | |
Co | -2.318 |
ian | -2.084 |
she | -2.066 |
Star | -2.049 |
Smith | -2.000 |
Token | US |
Token ID | 2937 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
tremend | +1.533 |
deaf | +1.398 |
meaningful | +1.375 |
visually | +1.300 |
vested | +1.292 |
Neg logit contributions | |
Co | -0.492 |
she | -0.418 |
ian | -0.417 |
Star | -0.412 |
Smith | -0.398 |
Token | due |
Token ID | 2233 |
Feature activation | -2.32e+00 |
Pos logit contributions | |
Co | +5.439 |
ian | +5.013 |
she | +5.009 |
L | +4.988 |
Star | +4.974 |
Neg logit contributions | |
tremend | -5.528 |
deaf | -4.700 |
meaningful | -4.564 |
vested | -4.135 |
visually | -4.113 |
Token | to |
Token ID | 284 |
Feature activation | -6.76e+00 |
Pos logit contributions | |
tremend | +2.806 |
deaf | +2.319 |
meaningful | +2.241 |
visually | +1.978 |
vested | +1.975 |
Neg logit contributions | |
Co | -3.961 |
she | -3.697 |
ian | -3.695 |
Star | -3.685 |
uh | -3.642 |
Token | dangerous |
Token ID | 4923 |
Feature activation | -5.07e+00 |
Pos logit contributions | |
tremend | +8.689 |
deaf | +7.639 |
meaningful | +7.421 |
visually | +6.730 |
vested | +6.727 |
Neg logit contributions | |
Co | -10.088 |
she | -9.403 |
Star | -9.369 |
ian | -9.252 |
uh | -9.193 |
Token | , |
Token ID | 11 |
Feature activation | -3.13e+00 |
Pos logit contributions | |
tremend | +6.948 |
deaf | +6.154 |
meaningful | +5.961 |
vested | +5.591 |
visually | +5.580 |
Neg logit contributions | |
Co | -7.169 |
Star | -6.644 |
she | -6.617 |
Smith | -6.561 |
uh | -6.533 |
Token | with |
Token ID | 351 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
tremend | +5.199 |
deaf | +4.386 |
meaningful | +4.298 |
vested | +3.779 |
visually | +3.768 |
Neg logit contributions | |
Co | -6.978 |
Star | -6.487 |
ian | -6.440 |
she | -6.439 |
Smith | -6.430 |
Token | justice |
Token ID | 5316 |
Feature activation | +3.13e+00 |
Pos logit contributions | |
tremend | +1.515 |
deaf | +1.157 |
meaningful | +1.102 |
vested | +0.908 |
visually | +0.907 |
Neg logit contributions | |
Co | -3.423 |
ian | -3.231 |
she | -3.229 |
Star | -3.220 |
L | -3.194 |
Token | that |
Token ID | 326 |
Feature activation | -5.30e+00 |
Pos logit contributions | |
Co | +5.560 |
ian | +5.255 |
she | +5.235 |
L | +5.187 |
Star | +5.178 |
Neg logit contributions | |
tremend | -3.456 |
deaf | -2.772 |
meaningful | -2.656 |
visually | -2.338 |
proactive | -2.321 |
Token | history |
Token ID | 2106 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
tremend | +7.180 |
deaf | +6.363 |
meaningful | +6.302 |
vested | +5.638 |
reasonable | +5.625 |
Neg logit contributions | |
Co | -7.644 |
Star | -7.059 |
ian | -6.974 |
Smith | -6.964 |
uh | -6.959 |
Token | has |
Token ID | 468 |
Feature activation | -5.49e+00 |
Pos logit contributions | |
Co | +1.888 |
ian | +1.734 |
she | +1.731 |
Star | +1.705 |
L | +1.702 |
Neg logit contributions | |
tremend | -2.441 |
deaf | -2.089 |
meaningful | -2.049 |
vested | -1.881 |
visually | -1.880 |
Token | vind |
Token ID | 29178 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
tremend | +6.119 |
deaf | +5.261 |
meaningful | +5.062 |
vested | +4.416 |
visually | +4.413 |
Neg logit contributions | |
Co | -9.527 |
Star | -8.925 |
ian | -8.883 |
she | -8.860 |
uh | -8.823 |
Token | icated |
Token ID | 3474 |
Feature activation | -7.63e+00 |
Pos logit contributions | |
Co | +1.955 |
ian | +1.768 |
she | +1.745 |
Star | +1.721 |
L | +1.707 |
Neg logit contributions | |
tremend | -3.500 |
deaf | -3.088 |
meaningful | -3.026 |
visually | -2.805 |
vested | -2.802 |
Token | her |
Token ID | 607 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
tremend | +8.692 |
meaningful | +7.656 |
deaf | +7.645 |
reasonable | +6.750 |
vested | +6.671 |
Neg logit contributions | |
Co | -11.961 |
Star | -11.162 |
uh | -11.050 |
Smith | -11.016 |
ian | -10.999 |
Token | . |
Token ID | 13 |
Feature activation | +6.11e-01 |
Pos logit contributions | |
tremend | +4.056 |
deaf | +3.549 |
meaningful | +3.478 |
vested | +3.180 |
proactive | +3.161 |
Neg logit contributions | |
Co | -3.475 |
she | -3.165 |
Star | -3.163 |
ian | -3.146 |
Smith | -3.121 |
Token |
|
Token ID | 198 |
Feature activation | +7.10e+00 |
Pos logit contributions | |
Co | +0.565 |
ian | +0.496 |
she | +0.493 |
Star | +0.492 |
uh | +0.484 |
Neg logit contributions | |
tremend | -1.196 |
deaf | -1.081 |
meaningful | -1.061 |
visually | -0.991 |
vested | -0.990 |
Token |
|
Token ID | 198 |
Feature activation | +6.50e+00 |
Pos logit contributions | |
Co | +4.370 |
L | +3.736 |
B | +3.694 |
ian | +3.674 |
she | +3.665 |
Neg logit contributions | |
tremend | -18.551 |
exha | -14.452 |
behavi | -14.384 |
undermin | -14.292 |
misunder | -14.215 |
Token | - |
Token ID | 12 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
tremend | +1.776 |
deaf | +1.592 |
meaningful | +1.562 |
vested | +1.462 |
visually | +1.461 |
Neg logit contributions | |
Co | -0.795 |
ian | -0.695 |
she | -0.693 |
Star | -0.690 |
uh | -0.674 |
Token | the |
Token ID | 1169 |
Feature activation | -9.11e-01 |
Pos logit contributions | |
tremend | +3.505 |
deaf | +3.164 |
meaningful | +3.085 |
vested | +2.917 |
visually | +2.907 |
Neg logit contributions | |
Co | -1.603 |
ian | -1.406 |
Star | -1.398 |
Smith | -1.368 |
she | -1.361 |
Token | - |
Token ID | 12 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
tremend | +2.278 |
deaf | +2.119 |
meaningful | +2.078 |
vested | +1.980 |
visually | +1.980 |
Neg logit contributions | |
Co | -0.334 |
Star | -0.231 |
she | -0.231 |
ian | -0.231 |
Smith | -0.215 |
Token | counter |
Token ID | 24588 |
Feature activation | -5.39e-01 |
Pos logit contributions | |
Co | +0.145 |
ian | +0.128 |
Star | +0.127 |
Smith | +0.125 |
she | +0.125 |
Neg logit contributions | |
tremend | -0.315 |
deaf | -0.285 |
meaningful | -0.275 |
vested | -0.261 |
visually | -0.260 |
Token | supplement |
Token ID | 10327 |
Feature activation | -7.78e+00 |
Pos logit contributions | |
tremend | +0.599 |
deaf | +0.485 |
meaningful | +0.467 |
visually | +0.405 |
vested | +0.405 |
Neg logit contributions | |
Co | -0.971 |
ian | -0.911 |
she | -0.910 |
Star | -0.907 |
L | -0.899 |
Token | called |
Token ID | 1444 |
Feature activation | -7.96e+00 |
Pos logit contributions | |
tremend | +12.470 |
deaf | +11.352 |
meaningful | +11.310 |
artificially | +10.476 |
visually | +10.450 |
Neg logit contributions | |
Co | -8.433 |
Star | -7.533 |
she | -7.465 |
Smith | -7.449 |
ian | -7.366 |
Token | gal |
Token ID | 9426 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
tremend | +12.468 |
deaf | +11.075 |
meaningful | +10.925 |
proactive | +10.224 |
vested | +10.110 |
Neg logit contributions | |
Co | -8.725 |
uh | -8.021 |
she | -8.001 |
ian | -7.871 |
Star | -7.867 |
Token | ant |
Token ID | 415 |
Feature activation | +5.56e-01 |
Pos logit contributions | |
Co | +1.072 |
she | +0.873 |
ian | +0.870 |
Star | +0.858 |
uh | +0.830 |
Neg logit contributions | |
tremend | -4.027 |
deaf | -3.664 |
meaningful | -3.602 |
vested | -3.408 |
visually | -3.408 |
Token | amine |
Token ID | 9862 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
Co | +0.485 |
Star | +0.419 |
she | +0.414 |
ian | +0.410 |
Smith | +0.407 |
Neg logit contributions | |
tremend | -1.118 |
deaf | -1.014 |
meaningful | -0.994 |
visually | -0.936 |
vested | -0.930 |
Token | , |
Token ID | 11 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
tremend | +4.967 |
deaf | +4.440 |
meaningful | +4.360 |
visually | +4.049 |
vested | +4.038 |
Neg logit contributions | |
Co | -3.212 |
she | -2.889 |
Star | -2.884 |
ian | -2.868 |
uh | -2.831 |
Token | which |
Token ID | 543 |
Feature activation | -2.61e+00 |
Pos logit contributions | |
tremend | +4.591 |
deaf | +3.951 |
meaningful | +3.843 |
visually | +3.466 |
vested | +3.457 |
Neg logit contributions | |
Co | -4.973 |
ian | -4.600 |
Star | -4.582 |
she | -4.580 |
uh | -4.530 |
Token | product |
Token ID | 1720 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
tremend | +3.381 |
deaf | +2.798 |
meaningful | +2.727 |
vested | +2.394 |
visually | +2.392 |
Neg logit contributions | |
Co | -5.009 |
ian | -4.684 |
she | -4.682 |
Star | -4.648 |
uh | -4.616 |
Token | . |
Token ID | 13 |
Feature activation | +4.11e-01 |
Pos logit contributions | |
tremend | +3.060 |
deaf | +2.722 |
meaningful | +2.679 |
visually | +2.504 |
vested | +2.479 |
Neg logit contributions | |
Co | -1.855 |
Star | -1.647 |
ian | -1.646 |
she | -1.637 |
uh | -1.609 |
Token | The |
Token ID | 383 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
Co | +0.403 |
ian | +0.359 |
she | +0.358 |
Star | +0.354 |
uh | +0.349 |
Neg logit contributions | |
tremend | -0.777 |
deaf | -0.702 |
meaningful | -0.688 |
visually | -0.644 |
vested | -0.640 |
Token | officers |
Token ID | 3790 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
Co | +1.900 |
ian | +1.781 |
she | +1.775 |
Star | +1.775 |
L | +1.760 |
Neg logit contributions | |
tremend | -1.355 |
deaf | -1.096 |
meaningful | -1.064 |
vested | -0.937 |
visually | -0.937 |
Token | also |
Token ID | 635 |
Feature activation | -6.22e+00 |
Pos logit contributions | |
tremend | +1.369 |
deaf | +1.156 |
meaningful | +1.119 |
visually | +1.004 |
vested | +1.000 |
Neg logit contributions | |
Co | -1.698 |
she | -1.575 |
ian | -1.574 |
Star | -1.571 |
L | -1.552 |
Token | make |
Token ID | 787 |
Feature activation | -6.61e+00 |
Pos logit contributions | |
tremend | +7.606 |
deaf | +6.743 |
meaningful | +6.412 |
visually | +6.000 |
vested | +5.772 |
Neg logit contributions | |
Co | -9.742 |
Star | -9.020 |
she | -8.942 |
ian | -8.909 |
Smith | -8.875 |
Token | a |
Token ID | 257 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
tremend | +8.057 |
deaf | +7.122 |
meaningful | +6.918 |
visually | +6.194 |
reasonable | +6.182 |
Neg logit contributions | |
Co | -10.322 |
she | -9.672 |
ian | -9.501 |
Star | -9.498 |
uh | -9.430 |
Token | point |
Token ID | 966 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
tremend | +3.662 |
deaf | +2.997 |
meaningful | +2.883 |
visually | +2.504 |
vested | +2.497 |
Neg logit contributions | |
Co | -5.982 |
she | -5.599 |
ian | -5.596 |
Star | -5.580 |
L | -5.523 |
Token | of |
Token ID | 286 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
tremend | +1.674 |
deaf | +1.443 |
meaningful | +1.406 |
visually | +1.283 |
vested | +1.276 |
Neg logit contributions | |
Co | -1.546 |
ian | -1.419 |
she | -1.418 |
Star | -1.414 |
L | -1.395 |
Token | trying |
Token ID | 2111 |
Feature activation | -7.10e+00 |
Pos logit contributions | |
tremend | +3.140 |
deaf | +2.581 |
meaningful | +2.469 |
visually | +2.165 |
vested | +2.115 |
Neg logit contributions | |
Co | -5.469 |
she | -5.120 |
Star | -5.113 |
ian | -5.108 |
L | -5.048 |
Token | to |
Token ID | 284 |
Feature activation | -7.08e+00 |
Pos logit contributions | |
tremend | +9.299 |
deaf | +7.832 |
meaningful | +7.637 |
visually | +6.935 |
reasonable | +6.852 |
Neg logit contributions | |
Co | -10.536 |
she | -9.808 |
ian | -9.783 |
uh | -9.725 |
Star | -9.714 |
Token | view |
Token ID | 1570 |
Feature activation | -3.96e+00 |
Pos logit contributions | |
Co | +2.056 |
ian | +1.924 |
she | +1.917 |
Star | +1.913 |
L | +1.901 |
Neg logit contributions | |
tremend | -1.475 |
deaf | -1.202 |
meaningful | -1.152 |
vested | -1.023 |
visually | -1.019 |
Token | : |
Token ID | 25 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
tremend | +6.542 |
deaf | +5.854 |
meaningful | +5.775 |
visually | +5.399 |
vested | +5.364 |
Neg logit contributions | |
Co | -4.613 |
ian | -4.143 |
Star | -4.128 |
she | -4.115 |
Smith | -4.087 |
Token | The |
Token ID | 383 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
tremend | +5.446 |
deaf | +4.866 |
meaningful | +4.790 |
visually | +4.432 |
proactive | +4.411 |
Neg logit contributions | |
Co | -3.268 |
ian | -2.931 |
she | -2.926 |
Star | -2.913 |
Smith | -2.859 |
Token | offensive |
Token ID | 5859 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
tremend | +2.865 |
deaf | +2.439 |
meaningful | +2.378 |
vested | +2.129 |
visually | +2.129 |
Neg logit contributions | |
Co | -3.264 |
she | -3.025 |
ian | -3.024 |
Star | -3.007 |
uh | -2.976 |
Token | line |
Token ID | 1627 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
Co | +2.030 |
ian | +1.897 |
she | +1.890 |
Star | +1.882 |
L | +1.868 |
Neg logit contributions | |
tremend | -1.535 |
deaf | -1.269 |
meaningful | -1.227 |
vested | -1.089 |
visually | -1.089 |
Token | came |
Token ID | 1625 |
Feature activation | -8.53e+00 |
Pos logit contributions | |
Co | +0.325 |
she | +0.295 |
ian | +0.294 |
Star | +0.293 |
uh | +0.288 |
Neg logit contributions | |
tremend | -0.464 |
deaf | -0.408 |
meaningful | -0.400 |
vested | -0.369 |
visually | -0.369 |
Token | together |
Token ID | 1978 |
Feature activation | -9.20e+00 |
Pos logit contributions | |
tremend | +11.144 |
deaf | +9.938 |
meaningful | +9.849 |
relatively | +8.989 |
proactive | +8.859 |
Neg logit contributions | |
Co | -11.768 |
she | -11.054 |
Star | -10.928 |
ian | -10.749 |
Smith | -10.739 |
Token | , |
Token ID | 11 |
Feature activation | -6.66e+00 |
Pos logit contributions | |
tremend | +14.199 |
deaf | +12.740 |
meaningful | +12.617 |
relatively | +11.879 |
visually | +11.838 |
Neg logit contributions | |
Co | -10.495 |
Star | -9.520 |
she | -9.452 |
ian | -9.341 |
Smith | -9.241 |
Token | Tony |
Token ID | 8832 |
Feature activation | +6.61e+00 |
Pos logit contributions | |
tremend | +9.581 |
deaf | +8.454 |
meaningful | +8.365 |
vested | +7.607 |
proactive | +7.586 |
Neg logit contributions | |
Co | -8.661 |
she | -8.102 |
Star | -8.074 |
ian | -7.981 |
uh | -7.913 |
Token | Romo |
Token ID | 42395 |
Feature activation | +6.50e+00 |
Pos logit contributions | |
Co | +9.878 |
B | +9.079 |
ian | +9.052 |
Star | +9.038 |
L | +8.997 |
Neg logit contributions | |
tremend | -9.010 |
deaf | -7.647 |
meaningful | -7.345 |
visually | -6.706 |
personalized | -6.663 |
Token | had |
Token ID | 550 |
Feature activation | -6.22e+00 |
Pos logit contributions | |
Co | +10.489 |
ian | +9.907 |
B | +9.752 |
she | +9.743 |
L | +9.735 |
Neg logit contributions | |
tremend | -7.901 |
deaf | -6.395 |
meaningful | -6.104 |
visually | -5.374 |
vested | -5.331 |
Token | o |
Token ID | 78 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
Co | +3.968 |
ian | +3.265 |
she | +3.147 |
uh | +3.046 |
Star | +3.002 |
Neg logit contributions | |
tremend | -17.561 |
deaf | -15.873 |
meaningful | -15.557 |
vested | -14.795 |
proactive | -14.755 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +3.27e+00 |
Pos logit contributions | |
Co | +2.584 |
ian | +2.229 |
Star | +2.197 |
she | +2.181 |
L | +2.169 |
Neg logit contributions | |
tremend | -7.183 |
deaf | -6.406 |
meaningful | -6.303 |
vested | -5.934 |
visually | -5.910 |
Token | An |
Token ID | 2025 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
Co | +2.366 |
ian | +1.979 |
Star | +1.978 |
she | +1.977 |
L | +1.937 |
Neg logit contributions | |
tremend | -7.215 |
deaf | -6.479 |
meaningful | -6.377 |
vested | -6.015 |
visually | -6.007 |
Token | Open |
Token ID | 4946 |
Feature activation | +3.11e+00 |
Pos logit contributions | |
Co | +3.721 |
she | +3.494 |
ian | +3.487 |
L | +3.447 |
Star | +3.446 |
Neg logit contributions | |
tremend | -2.578 |
deaf | -2.100 |
meaningful | -2.042 |
vested | -1.793 |
visually | -1.782 |
Token | Letter |
Token ID | 18121 |
Feature activation | -9.17e-01 |
Pos logit contributions | |
Co | +3.423 |
ian | +3.066 |
Star | +3.054 |
she | +3.046 |
B | +3.023 |
Neg logit contributions | |
tremend | -5.711 |
deaf | -4.963 |
meaningful | -4.883 |
visually | -4.530 |
proactive | -4.524 |
Token | to |
Token ID | 284 |
Feature activation | -8.39e+00 |
Pos logit contributions | |
tremend | +1.390 |
deaf | +1.218 |
meaningful | +1.187 |
visually | +1.086 |
vested | +1.081 |
Neg logit contributions | |
Co | -1.251 |
she | -1.151 |
ian | -1.148 |
Star | -1.142 |
uh | -1.133 |
Token | Senator |
Token ID | 8962 |
Feature activation | +6.87e-02 |
Pos logit contributions | |
tremend | +12.830 |
deaf | +11.802 |
meaningful | +11.448 |
visually | +10.605 |
vested | +10.562 |
Neg logit contributions | |
Co | -9.516 |
she | -8.738 |
ian | -8.607 |
uh | -8.603 |
Star | -8.577 |
Token | Bernie |
Token ID | 10477 |
Feature activation | +5.98e+00 |
Pos logit contributions | |
Co | +0.092 |
she | +0.084 |
ian | +0.084 |
Star | +0.084 |
uh | +0.083 |
Neg logit contributions | |
tremend | -0.107 |
deaf | -0.093 |
meaningful | -0.091 |
visually | -0.083 |
vested | -0.083 |
Token | Sanders |
Token ID | 5831 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
Co | +7.157 |
B | +6.562 |
ian | +6.560 |
she | +6.496 |
P | +6.396 |
Neg logit contributions | |
tremend | -10.040 |
deaf | -8.570 |
meaningful | -8.277 |
vested | -7.818 |
proactive | -7.733 |
Token |
|
Token ID | 198 |
Feature activation | +6.17e-01 |
Pos logit contributions | |
Co | +2.669 |
ian | +2.416 |
she | +2.408 |
Star | +2.396 |
L | +2.366 |
Neg logit contributions | |
tremend | -3.945 |
deaf | -3.459 |
meaningful | -3.380 |
vested | -3.124 |
visually | -3.124 |
Token |
|
Token ID | 198 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
Co | +0.542 |
ian | +0.480 |
she | +0.479 |
Star | +0.470 |
uh | +0.467 |
Neg logit contributions | |
tremend | -1.212 |
deaf | -1.113 |
meaningful | -1.094 |
visually | -1.021 |
vested | -1.020 |
Token | former |
Token ID | 1966 |
Feature activation | +4.42e+00 |
Pos logit contributions | |
Co | +2.601 |
ian | +2.422 |
she | +2.396 |
Star | +2.394 |
L | +2.386 |
Neg logit contributions | |
tremend | -2.092 |
deaf | -1.719 |
meaningful | -1.660 |
vested | -1.481 |
visually | -1.480 |
Token | CEO |
Token ID | 6123 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
Co | +6.817 |
ian | +6.328 |
L | +6.252 |
B | +6.240 |
Star | +6.232 |
Neg logit contributions | |
tremend | -5.943 |
deaf | -4.852 |
meaningful | -4.682 |
visually | -4.215 |
vested | -4.180 |
Token | ) |
Token ID | 8 |
Feature activation | +6.72e-02 |
Pos logit contributions | |
Co | +3.361 |
ian | +2.997 |
she | +2.961 |
L | +2.940 |
B | +2.940 |
Neg logit contributions | |
tremend | -6.109 |
deaf | -5.374 |
meaningful | -5.259 |
proactive | -4.907 |
visually | -4.897 |
Token | would |
Token ID | 561 |
Feature activation | -4.17e+00 |
Pos logit contributions | |
Co | +0.085 |
she | +0.078 |
ian | +0.078 |
Star | +0.077 |
L | +0.076 |
Neg logit contributions | |
tremend | -0.110 |
deaf | -0.096 |
meaningful | -0.094 |
vested | -0.087 |
visually | -0.086 |
Token | later |
Token ID | 1568 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
tremend | +4.284 |
deaf | +3.474 |
meaningful | +3.319 |
visually | +2.919 |
vested | +2.890 |
Neg logit contributions | |
Co | -7.630 |
she | -7.225 |
Star | -7.186 |
ian | -7.148 |
Smith | -7.099 |
Token | attain |
Token ID | 18188 |
Feature activation | -7.76e+00 |
Pos logit contributions | |
tremend | +1.106 |
deaf | +0.889 |
meaningful | +0.856 |
vested | +0.740 |
visually | +0.739 |
Neg logit contributions | |
Co | -1.843 |
ian | -1.731 |
she | -1.727 |
Star | -1.721 |
L | -1.707 |
Token | inf |
Token ID | 1167 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
tremend | +11.196 |
meaningful | +9.758 |
deaf | +9.690 |
vested | +8.908 |
relatively | +8.760 |
Neg logit contributions | |
Co | -9.930 |
she | -9.415 |
ian | -9.320 |
Smith | -9.269 |
Star | -9.242 |
Token | amy |
Token ID | 14814 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
tremend | +2.691 |
deaf | +2.412 |
meaningful | +2.403 |
vested | +2.237 |
visually | +2.215 |
Neg logit contributions | |
Co | -1.432 |
she | -1.270 |
Star | -1.270 |
ian | -1.251 |
Smith | -1.231 |
Token | when |
Token ID | 618 |
Feature activation | -5.64e+00 |
Pos logit contributions | |
tremend | +6.934 |
deaf | +6.072 |
meaningful | +5.894 |
visually | +5.446 |
vested | +5.367 |
Neg logit contributions | |
Co | -7.080 |
Star | -6.508 |
she | -6.436 |
ian | -6.406 |
Smith | -6.402 |
Token | it |
Token ID | 340 |
Feature activation | -2.04e+00 |
Pos logit contributions | |
tremend | +7.859 |
deaf | +7.008 |
meaningful | +6.774 |
vested | +6.222 |
visually | +6.194 |
Neg logit contributions | |
Co | -7.686 |
she | -7.114 |
ian | -7.065 |
Star | -7.032 |
uh | -7.021 |
Token | was |
Token ID | 373 |
Feature activation | -3.94e+00 |
Pos logit contributions | |
tremend | +3.264 |
deaf | +2.886 |
meaningful | +2.797 |
vested | +2.601 |
visually | +2.598 |
Neg logit contributions | |
Co | -2.627 |
she | -2.391 |
ian | -2.380 |
Star | -2.378 |
Smith | -2.351 |