Token | Some |
Token ID | 4366 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
llor | +0.696 |
zag | +0.669 |
cling | +0.662 |
-$ | +0.659 |
rients | +0.658 |
Neg logit contributions | |
assian | -0.864 |
hower | -0.847 |
orah | -0.823 |
hari | -0.816 |
oops | -0.813 |
Token | small |
Token ID | 1402 |
Feature activation | -9.43e-01 |
Pos logit contributions | |
assian | +0.493 |
hower | +0.478 |
orah | +0.467 |
oops | +0.464 |
hari | +0.462 |
Neg logit contributions | |
llor | -0.490 |
zag | -0.473 |
cling | -0.466 |
rients | -0.466 |
-$ | -0.462 |
Token | quick |
Token ID | 2068 |
Feature activation | -9.67e-01 |
Pos logit contributions | |
assian | +3.510 |
hower | +3.399 |
orah | +3.315 |
oops | +3.314 |
hari | +3.286 |
Neg logit contributions | |
llor | -3.659 |
zag | -3.510 |
cling | -3.462 |
rients | -3.448 |
-$ | -3.372 |
Token | tips |
Token ID | 9040 |
Feature activation | +9.47e-01 |
Pos logit contributions | |
assian | +3.974 |
hower | +3.847 |
oops | +3.799 |
orah | +3.776 |
hari | +3.739 |
Neg logit contributions | |
llor | -3.351 |
zag | -3.205 |
cling | -3.134 |
rients | -3.127 |
-$ | -3.036 |
Token | ? |
Token ID | 30 |
Feature activation | +8.98e-01 |
Pos logit contributions | |
llor | +2.946 |
-$ | +2.874 |
zag | +2.809 |
rients | +2.769 |
cling | +2.768 |
Neg logit contributions | |
assian | -4.197 |
hower | -4.103 |
orah | -3.972 |
oops | -3.954 |
hari | -3.936 |
Token | Wear |
Token ID | 27539 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
llor | +3.053 |
-$ | +2.953 |
zag | +2.934 |
cling | +2.924 |
rients | +2.910 |
Neg logit contributions | |
assian | -3.730 |
hower | -3.643 |
orah | -3.501 |
hari | -3.491 |
oops | -3.477 |
Token | comfortable |
Token ID | 6792 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
cling | +6.172 |
zag | +6.110 |
-$ | +6.084 |
distingu | +6.032 |
llor | +6.028 |
Neg logit contributions | |
assian | -8.692 |
hower | -8.460 |
orah | -8.292 |
oops | -8.130 |
oran | -8.071 |
Token | shoes |
Token ID | 10012 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
llor | +3.758 |
cling | +3.751 |
-$ | +3.731 |
zag | +3.718 |
rients | +3.590 |
Neg logit contributions | |
assian | -5.651 |
hower | -5.605 |
orah | -5.512 |
oops | -5.356 |
hari | -5.295 |
Token | and |
Token ID | 290 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
llor | +4.646 |
-$ | +4.596 |
zag | +4.554 |
cling | +4.549 |
rients | +4.318 |
Neg logit contributions | |
assian | -7.045 |
hower | -6.844 |
orah | -6.719 |
oops | -6.669 |
hari | -6.656 |
Token | clothes |
Token ID | 8242 |
Feature activation | +9.25e-01 |
Pos logit contributions | |
llor | +3.557 |
zag | +3.478 |
-$ | +3.463 |
cling | +3.449 |
rients | +3.390 |
Neg logit contributions | |
assian | -4.738 |
hower | -4.629 |
orah | -4.445 |
oops | -4.440 |
hari | -4.415 |
Token | . |
Token ID | 13 |
Feature activation | +4.35e-01 |
Pos logit contributions | |
llor | +3.107 |
cling | +3.048 |
zag | +3.024 |
-$ | +3.012 |
rients | +2.921 |
Neg logit contributions | |
assian | -3.835 |
hower | -3.735 |
oops | -3.632 |
orah | -3.627 |
hari | -3.597 |
Token | us |
Token ID | 385 |
Feature activation | +2.42e-02 |
Pos logit contributions | |
llor | +0.228 |
zag | +0.221 |
cling | +0.218 |
rients | +0.216 |
-$ | +0.215 |
Neg logit contributions | |
assian | -0.217 |
hower | -0.211 |
orah | -0.203 |
oops | -0.202 |
hari | -0.202 |
Token | monkeys |
Token ID | 26697 |
Feature activation | +7.35e-01 |
Pos logit contributions | |
llor | +0.077 |
zag | +0.074 |
rients | +0.073 |
cling | +0.073 |
-$ | +0.072 |
Neg logit contributions | |
assian | -0.107 |
hower | -0.104 |
orah | -0.103 |
oops | -0.102 |
hari | -0.102 |
Token | ( |
Token ID | 357 |
Feature activation | +9.11e-01 |
Pos logit contributions | |
llor | +2.394 |
cling | +2.282 |
zag | +2.281 |
-$ | +2.258 |
rients | +2.238 |
Neg logit contributions | |
assian | -3.200 |
hower | -3.121 |
orah | -3.051 |
oops | -3.051 |
hari | -3.008 |
Token | Mac |
Token ID | 14155 |
Feature activation | +5.11e-01 |
Pos logit contributions | |
llor | +2.844 |
zag | +2.761 |
cling | +2.748 |
-$ | +2.713 |
rients | +2.686 |
Neg logit contributions | |
assian | -4.017 |
hower | -3.976 |
orah | -3.852 |
oops | -3.746 |
hari | -3.744 |
Token | aca |
Token ID | 22260 |
Feature activation | +8.38e-01 |
Pos logit contributions | |
llor | +1.838 |
zag | +1.752 |
cling | +1.726 |
rients | +1.723 |
-$ | +1.716 |
Neg logit contributions | |
assian | -2.055 |
hower | -2.025 |
hari | -1.935 |
oops | -1.928 |
orah | -1.914 |
Token | mul |
Token ID | 35971 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
llor | +2.327 |
-$ | +2.126 |
cling | +2.109 |
zag | +2.056 |
nc | +2.022 |
Neg logit contributions | |
assian | -4.063 |
hower | -4.056 |
oops | -3.919 |
orah | -3.899 |
hari | -3.870 |
Token | atta |
Token ID | 25014 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
llor | +3.774 |
cig | +3.535 |
cert | +3.389 |
zag | +3.285 |
nc | +3.272 |
Neg logit contributions | |
hower | -11.089 |
orah | -10.350 |
oops | -10.271 |
Commands | -10.030 |
anooga | -9.957 |
Token | ) |
Token ID | 8 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
llor | +1.136 |
zag | +1.087 |
cling | +1.072 |
rients | +1.072 |
-$ | +1.065 |
Neg logit contributions | |
assian | -1.380 |
hower | -1.346 |
orah | -1.316 |
oops | -1.307 |
hari | -1.299 |
Token | were |
Token ID | 547 |
Feature activation | +5.85e-01 |
Pos logit contributions | |
llor | +1.289 |
zag | +1.234 |
cling | +1.225 |
rients | +1.217 |
-$ | +1.212 |
Neg logit contributions | |
assian | -1.576 |
hower | -1.534 |
orah | -1.501 |
oops | -1.495 |
hari | -1.482 |
Token | housed |
Token ID | 23707 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
llor | +2.530 |
cling | +2.448 |
zag | +2.434 |
-$ | +2.429 |
rients | +2.411 |
Neg logit contributions | |
assian | -1.936 |
hower | -1.882 |
oops | -1.814 |
orah | -1.807 |
hari | -1.774 |
Token | under |
Token ID | 739 |
Feature activation | +9.55e-01 |
Pos logit contributions | |
llor | +3.823 |
-$ | +3.733 |
cling | +3.717 |
zag | +3.548 |
rients | +3.534 |
Neg logit contributions | |
assian | -5.972 |
hower | -5.808 |
oops | -5.660 |
orah | -5.598 |
hari | -5.508 |
Token | students |
Token ID | 2444 |
Feature activation | +7.04e-01 |
Pos logit contributions | |
assian | +0.722 |
hower | +0.701 |
orah | +0.686 |
oops | +0.681 |
hari | +0.678 |
Neg logit contributions | |
llor | -0.667 |
zag | -0.642 |
cling | -0.633 |
rients | -0.633 |
-$ | -0.627 |
Token | to |
Token ID | 284 |
Feature activation | +7.42e-01 |
Pos logit contributions | |
llor | +2.169 |
zag | +2.063 |
rients | +2.025 |
-$ | +2.022 |
cling | +2.020 |
Neg logit contributions | |
assian | -3.203 |
hower | -3.136 |
orah | -3.076 |
oops | -3.063 |
hari | -3.042 |
Token | access |
Token ID | 1895 |
Feature activation | +4.07e-01 |
Pos logit contributions | |
llor | +2.361 |
zag | +2.247 |
cling | +2.220 |
-$ | +2.211 |
rients | +2.189 |
Neg logit contributions | |
assian | -3.298 |
hower | -3.222 |
oops | -3.160 |
orah | -3.144 |
hari | -3.142 |
Token | co |
Token ID | 763 |
Feature activation | +1.28e-01 |
Pos logit contributions | |
llor | +1.412 |
zag | +1.355 |
rients | +1.334 |
cling | +1.330 |
-$ | +1.330 |
Neg logit contributions | |
assian | -1.685 |
hower | -1.647 |
orah | -1.620 |
oops | -1.610 |
hari | -1.604 |
Token | - |
Token ID | 12 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
llor | +0.400 |
zag | +0.384 |
-$ | +0.377 |
cling | +0.377 |
rients | +0.376 |
Neg logit contributions | |
assian | -0.575 |
hower | -0.566 |
orah | -0.552 |
oops | -0.548 |
hari | -0.547 |
Token | cur |
Token ID | 22019 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
llor | +4.283 |
zag | +4.061 |
cling | +4.050 |
-$ | +4.005 |
rients | +3.924 |
Neg logit contributions | |
assian | -4.932 |
hower | -4.891 |
orah | -4.728 |
hari | -4.709 |
oops | -4.667 |
Token | ricular |
Token ID | 41001 |
Feature activation | +5.43e-02 |
Pos logit contributions | |
llor | +2.539 |
cling | +2.301 |
rients | +2.153 |
zag | +2.105 |
riers | +1.953 |
Neg logit contributions | |
hower | -12.269 |
assian | -12.247 |
oops | -12.014 |
orah | -11.822 |
hari | -11.817 |
Token | activities |
Token ID | 4568 |
Feature activation | +9.31e-02 |
Pos logit contributions | |
llor | +0.191 |
zag | +0.183 |
rients | +0.181 |
cling | +0.180 |
-$ | +0.180 |
Neg logit contributions | |
assian | -0.224 |
hower | -0.218 |
orah | -0.214 |
oops | -0.212 |
hari | -0.211 |
Token | to |
Token ID | 284 |
Feature activation | -4.81e-02 |
Pos logit contributions | |
llor | +0.329 |
zag | +0.317 |
rients | +0.311 |
cling | +0.311 |
-$ | +0.310 |
Neg logit contributions | |
assian | -0.381 |
hower | -0.371 |
orah | -0.365 |
oops | -0.362 |
hari | -0.361 |
Token | supplement |
Token ID | 10327 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
assian | +0.196 |
hower | +0.190 |
orah | +0.186 |
oops | +0.185 |
hari | +0.184 |
Neg logit contributions | |
llor | -0.171 |
zag | -0.165 |
rients | -0.162 |
cling | -0.162 |
-$ | -0.160 |
Token | their |
Token ID | 511 |
Feature activation | -4.18e-01 |
Pos logit contributions | |
llor | +0.065 |
zag | +0.062 |
cling | +0.062 |
rients | +0.062 |
-$ | +0.061 |
Neg logit contributions | |
assian | -0.069 |
hower | -0.067 |
orah | -0.066 |
oops | -0.065 |
hari | -0.065 |
Token | . |
Token ID | 13 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
assian | +2.297 |
hower | +2.219 |
orah | +2.213 |
oops | +2.196 |
hari | +2.164 |
Neg logit contributions | |
llor | -1.619 |
distingu | -1.578 |
zag | -1.548 |
rients | -1.531 |
cling | -1.518 |
Token | The |
Token ID | 383 |
Feature activation | +7.22e-01 |
Pos logit contributions | |
llor | +0.989 |
zag | +0.957 |
cling | +0.941 |
rients | +0.940 |
-$ | +0.935 |
Neg logit contributions | |
assian | -1.270 |
hower | -1.236 |
orah | -1.210 |
hari | -1.203 |
oops | -1.201 |
Token | Legend |
Token ID | 9883 |
Feature activation | +5.06e-01 |
Pos logit contributions | |
llor | +2.286 |
zag | +2.211 |
cling | +2.170 |
rients | +2.147 |
-$ | +2.144 |
Neg logit contributions | |
assian | -3.180 |
hower | -3.110 |
hari | -3.030 |
oops | -3.030 |
orah | -3.028 |
Token | of |
Token ID | 286 |
Feature activation | -4.84e-01 |
Pos logit contributions | |
llor | +1.774 |
zag | +1.689 |
-$ | +1.667 |
cling | +1.664 |
rients | +1.661 |
Neg logit contributions | |
assian | -2.090 |
hower | -2.052 |
oops | -2.006 |
orah | -1.964 |
hari | -1.959 |
Token | Zelda |
Token ID | 22166 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
assian | +2.030 |
hower | +1.984 |
orah | +1.950 |
oops | +1.934 |
hari | +1.923 |
Neg logit contributions | |
llor | -1.650 |
zag | -1.579 |
cling | -1.557 |
rients | -1.555 |
-$ | -1.543 |
Token | : |
Token ID | 25 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
llor | +0.604 |
zag | +0.579 |
rients | +0.570 |
cling | +0.570 |
-$ | +0.566 |
Neg logit contributions | |
assian | -0.749 |
hower | -0.728 |
orah | -0.713 |
oops | -0.708 |
hari | -0.706 |
Token | O |
Token ID | 440 |
Feature activation | +3.06e-01 |
Pos logit contributions | |
llor | +5.692 |
rients | +5.490 |
zag | +5.439 |
-$ | +5.333 |
cling | +5.239 |
Neg logit contributions | |
assian | -9.001 |
hower | -8.914 |
oops | -8.303 |
hari | -8.285 |
orah | -8.276 |
Token | car |
Token ID | 7718 |
Feature activation | +7.32e-01 |
Pos logit contributions | |
llor | +0.916 |
zag | +0.895 |
rients | +0.874 |
cling | +0.868 |
-$ | +0.839 |
Neg logit contributions | |
hower | -1.441 |
assian | -1.438 |
hari | -1.358 |
orah | -1.326 |
oops | -1.301 |
Token | ina |
Token ID | 1437 |
Feature activation | +7.81e-01 |
Pos logit contributions | |
llor | +3.448 |
zag | +3.357 |
cling | +3.310 |
-$ | +3.268 |
nc | +3.251 |
Neg logit contributions | |
assian | -2.116 |
hower | -2.085 |
hari | -1.960 |
oops | -1.925 |
orah | -1.911 |
Token | of |
Token ID | 286 |
Feature activation | +4.95e-01 |
Pos logit contributions | |
llor | +2.689 |
-$ | +2.522 |
cling | +2.491 |
zag | +2.486 |
rients | +2.465 |
Neg logit contributions | |
assian | -3.307 |
hower | -3.237 |
orah | -3.098 |
oops | -3.082 |
hari | -3.074 |
Token | Time |
Token ID | 3862 |
Feature activation | +9.00e-01 |
Pos logit contributions | |
llor | +1.297 |
zag | +1.228 |
cling | +1.215 |
rients | +1.214 |
-$ | +1.194 |
Neg logit contributions | |
assian | -2.492 |
hower | -2.431 |
orah | -2.391 |
hari | -2.369 |
oops | -2.366 |
Token | ary |
Token ID | 560 |
Feature activation | -4.05e-01 |
Pos logit contributions | |
assian | +0.992 |
hower | +0.962 |
orah | +0.942 |
oops | +0.930 |
hari | +0.930 |
Neg logit contributions | |
llor | -1.031 |
zag | -0.996 |
cling | -0.982 |
rients | -0.981 |
-$ | -0.972 |
Token | awkward |
Token ID | 13006 |
Feature activation | -5.48e-01 |
Pos logit contributions | |
assian | +1.590 |
hower | +1.542 |
orah | +1.509 |
oops | +1.497 |
hari | +1.491 |
Neg logit contributions | |
llor | -1.502 |
zag | -1.446 |
rients | -1.426 |
cling | -1.420 |
-$ | -1.402 |
Token | ness |
Token ID | 1108 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
assian | +1.879 |
hower | +1.808 |
orah | +1.754 |
oops | +1.750 |
hari | +1.737 |
Neg logit contributions | |
llor | -2.300 |
zag | -2.218 |
rients | -2.195 |
cling | -2.183 |
-$ | -2.168 |
Token | in |
Token ID | 287 |
Feature activation | -3.41e-01 |
Pos logit contributions | |
llor | +0.708 |
zag | +0.681 |
cling | +0.673 |
rients | +0.671 |
-$ | +0.668 |
Neg logit contributions | |
assian | -0.739 |
hower | -0.719 |
orah | -0.703 |
oops | -0.699 |
hari | -0.696 |
Token | red |
Token ID | 2266 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
assian | +1.314 |
hower | +1.269 |
orah | +1.248 |
oops | +1.234 |
hari | +1.230 |
Neg logit contributions | |
llor | -1.293 |
zag | -1.235 |
rients | -1.219 |
cling | -1.212 |
-$ | -1.200 |
Token | iscover |
Token ID | 29392 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
llor | +0.390 |
zag | +0.376 |
cling | +0.372 |
rients | +0.370 |
-$ | +0.368 |
Neg logit contributions | |
assian | -0.429 |
hower | -0.418 |
orah | -0.406 |
oops | -0.403 |
hari | -0.403 |
Token | ing |
Token ID | 278 |
Feature activation | +8.85e-01 |
Pos logit contributions | |
cling | +3.402 |
llor | +3.354 |
rients | +3.017 |
-$ | +3.011 |
zag | +2.928 |
Neg logit contributions | |
assian | -10.870 |
hower | -10.784 |
orah | -10.714 |
oops | -10.598 |
hari | -10.466 |
Token | the |
Token ID | 262 |
Feature activation | -6.51e-02 |
Pos logit contributions | |
llor | +3.009 |
cling | +2.890 |
zag | +2.888 |
-$ | +2.865 |
rients | +2.852 |
Neg logit contributions | |
assian | -3.694 |
hower | -3.639 |
orah | -3.528 |
oops | -3.494 |
hari | -3.466 |
Token | physical |
Token ID | 3518 |
Feature activation | -3.42e-02 |
Pos logit contributions | |
assian | +0.255 |
hower | +0.248 |
orah | +0.243 |
oops | +0.241 |
hari | +0.240 |
Neg logit contributions | |
llor | -0.242 |
zag | -0.233 |
cling | -0.230 |
rients | -0.230 |
-$ | -0.228 |
Token | self |
Token ID | 2116 |
Feature activation | -4.38e-02 |
Pos logit contributions | |
assian | +0.131 |
hower | +0.127 |
orah | +0.124 |
oops | +0.123 |
hari | +0.123 |
Neg logit contributions | |
llor | -0.130 |
zag | -0.125 |
cling | -0.124 |
rients | -0.124 |
-$ | -0.123 |
Token | and |
Token ID | 290 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
assian | +0.180 |
hower | +0.175 |
orah | +0.171 |
oops | +0.170 |
hari | +0.169 |
Neg logit contributions | |
llor | -0.155 |
zag | -0.149 |
cling | -0.147 |
rients | -0.147 |
-$ | -0.146 |
Token | with |
Token ID | 351 |
Feature activation | -4.45e-02 |
Pos logit contributions | |
assian | +0.772 |
hower | +0.753 |
orah | +0.738 |
oops | +0.731 |
hari | +0.729 |
Neg logit contributions | |
llor | -0.564 |
zag | -0.539 |
rients | -0.533 |
cling | -0.532 |
-$ | -0.521 |
Token | , |
Token ID | 11 |
Feature activation | +1.80e-02 |
Pos logit contributions | |
assian | +0.188 |
hower | +0.184 |
orah | +0.180 |
oops | +0.178 |
hari | +0.178 |
Neg logit contributions | |
llor | -0.152 |
zag | -0.145 |
cling | -0.143 |
rients | -0.143 |
-$ | -0.142 |
Token | � |
Token ID | 447 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
llor | +0.065 |
zag | +0.063 |
cling | +0.062 |
rients | +0.062 |
-$ | +0.061 |
Neg logit contributions | |
assian | -0.072 |
hower | -0.070 |
orah | -0.069 |
oops | -0.068 |
hari | -0.068 |
Token | � |
Token ID | 251 |
Feature activation | +4.36e-01 |
Pos logit contributions | |
llor | +1.110 |
zag | +1.069 |
-$ | +1.061 |
cling | +1.058 |
rients | +1.053 |
Neg logit contributions | |
assian | -0.868 |
hower | -0.839 |
orah | -0.795 |
oops | -0.793 |
hari | -0.788 |
Token | said |
Token ID | 531 |
Feature activation | -2.20e-01 |
Pos logit contributions | |
llor | +1.713 |
zag | +1.637 |
cling | +1.618 |
-$ | +1.609 |
rients | +1.609 |
Neg logit contributions | |
assian | -1.618 |
hower | -1.574 |
orah | -1.527 |
oops | -1.512 |
hari | -1.502 |
Token | Lady |
Token ID | 11182 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
assian | +0.888 |
hower | +0.865 |
orah | +0.846 |
hari | +0.837 |
oops | +0.837 |
Neg logit contributions | |
llor | -0.784 |
zag | -0.761 |
rients | -0.749 |
cling | -0.748 |
-$ | -0.743 |
Token | Kennedy |
Token ID | 10401 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
llor | +5.466 |
cling | +4.932 |
rients | +4.760 |
zag | +4.752 |
-$ | +4.741 |
Neg logit contributions | |
assian | -8.638 |
oops | -8.396 |
hower | -8.367 |
orah | -8.252 |
hari | -8.214 |
Token | in |
Token ID | 287 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
llor | +1.160 |
zag | +1.104 |
cling | +1.088 |
rients | +1.087 |
-$ | +1.078 |
Neg logit contributions | |
assian | -1.495 |
hower | -1.454 |
orah | -1.424 |
oops | -1.417 |
hari | -1.408 |
Token | an |
Token ID | 281 |
Feature activation | +3.37e-01 |
Pos logit contributions | |
llor | +1.019 |
zag | +0.978 |
cling | +0.963 |
rients | +0.960 |
-$ | +0.951 |
Neg logit contributions | |
assian | -1.249 |
hower | -1.220 |
orah | -1.192 |
oops | -1.182 |
hari | -1.177 |
Token | interview |
Token ID | 2720 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
llor | +1.228 |
zag | +1.184 |
rients | +1.166 |
cling | +1.165 |
-$ | +1.161 |
Neg logit contributions | |
assian | -1.344 |
hower | -1.318 |
orah | -1.275 |
hari | -1.264 |
oops | -1.263 |
Token | with |
Token ID | 351 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
llor | +0.576 |
zag | +0.543 |
cling | +0.534 |
rients | +0.532 |
-$ | +0.531 |
Neg logit contributions | |
assian | -0.867 |
hower | -0.846 |
orah | -0.828 |
oops | -0.826 |
hari | -0.823 |
Token | despite |
Token ID | 3805 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
assian | +0.296 |
hower | +0.287 |
orah | +0.282 |
hari | +0.278 |
oops | +0.278 |
Neg logit contributions | |
llor | -0.274 |
zag | -0.264 |
rients | -0.261 |
cling | -0.260 |
-$ | -0.257 |
Token | the |
Token ID | 262 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
llor | +0.531 |
zag | +0.511 |
cling | +0.504 |
rients | +0.503 |
-$ | +0.500 |
Neg logit contributions | |
assian | -0.565 |
hower | -0.549 |
orah | -0.537 |
oops | -0.534 |
hari | -0.531 |
Token | consequences |
Token ID | 6948 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
assian | +0.813 |
hower | +0.791 |
orah | +0.774 |
oops | +0.766 |
hari | +0.764 |
Neg logit contributions | |
llor | -0.747 |
zag | -0.719 |
rients | -0.709 |
cling | -0.708 |
-$ | -0.701 |
Token | of |
Token ID | 286 |
Feature activation | -2.55e-01 |
Pos logit contributions | |
assian | +0.780 |
hower | +0.758 |
orah | +0.743 |
oops | +0.735 |
hari | +0.734 |
Neg logit contributions | |
llor | -0.664 |
zag | -0.638 |
rients | -0.629 |
cling | -0.628 |
-$ | -0.621 |
Token | running |
Token ID | 2491 |
Feature activation | +5.08e-03 |
Pos logit contributions | |
assian | +0.963 |
hower | +0.934 |
orah | +0.915 |
oops | +0.905 |
hari | +0.903 |
Neg logit contributions | |
llor | -0.980 |
zag | -0.941 |
rients | -0.931 |
cling | -0.925 |
-$ | -0.917 |
Token | counter |
Token ID | 3753 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
llor | +0.019 |
zag | +0.018 |
rients | +0.018 |
cling | +0.018 |
-$ | +0.018 |
Neg logit contributions | |
assian | -0.020 |
hower | -0.019 |
orah | -0.019 |
oops | -0.019 |
hari | -0.018 |
Token | to |
Token ID | 284 |
Feature activation | +4.21e-01 |
Pos logit contributions | |
llor | +5.182 |
zag | +5.028 |
rients | +4.895 |
-$ | +4.863 |
cling | +4.807 |
Neg logit contributions | |
assian | -8.607 |
hower | -8.528 |
orah | -8.389 |
oops | -8.340 |
hari | -8.148 |
Token | what |
Token ID | 644 |
Feature activation | -8.03e-01 |
Pos logit contributions | |
llor | +1.392 |
zag | +1.351 |
cling | +1.334 |
-$ | +1.329 |
rients | +1.325 |
Neg logit contributions | |
assian | -1.797 |
hower | -1.763 |
orah | -1.726 |
oops | -1.724 |
hari | -1.694 |
Token | is |
Token ID | 318 |
Feature activation | -3.74e-01 |
Pos logit contributions | |
assian | +3.106 |
hower | +2.992 |
orah | +2.929 |
hari | +2.894 |
oops | +2.875 |
Neg logit contributions | |
llor | -2.982 |
zag | -2.848 |
rients | -2.783 |
cling | -2.756 |
-$ | -2.714 |
Token | expected |
Token ID | 2938 |
Feature activation | +1.59e-02 |
Pos logit contributions | |
assian | +1.409 |
hower | +1.362 |
orah | +1.333 |
hari | +1.320 |
oops | +1.314 |
Neg logit contributions | |
llor | -1.456 |
zag | -1.403 |
rients | -1.382 |
cling | -1.380 |
-$ | -1.363 |
Token | of |
Token ID | 286 |
Feature activation | +4.94e-01 |
Pos logit contributions | |
llor | +0.058 |
zag | +0.056 |
cling | +0.055 |
rients | +0.055 |
-$ | +0.054 |
Neg logit contributions | |
assian | -0.064 |
hower | -0.062 |
orah | -0.061 |
oops | -0.060 |
hari | -0.060 |
Token | that |
Token ID | 326 |
Feature activation | +4.31e-01 |
Pos logit contributions | |
assian | +1.188 |
hower | +1.152 |
orah | +1.130 |
oops | +1.117 |
hari | +1.114 |
Neg logit contributions | |
llor | -1.349 |
zag | -1.310 |
rients | -1.294 |
cling | -1.292 |
-$ | -1.268 |
Token | today |
Token ID | 1909 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
llor | +1.529 |
zag | +1.464 |
-$ | +1.457 |
cling | +1.446 |
rients | +1.440 |
Neg logit contributions | |
assian | -1.777 |
hower | -1.729 |
orah | -1.676 |
oops | -1.668 |
hari | -1.658 |
Token | 's |
Token ID | 338 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
llor | +1.443 |
zag | +1.370 |
-$ | +1.353 |
cling | +1.349 |
rients | +1.341 |
Neg logit contributions | |
assian | -2.328 |
hower | -2.274 |
orah | -2.216 |
oops | -2.213 |
hari | -2.196 |
Token | crash |
Token ID | 7014 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
llor | +0.712 |
zag | +0.685 |
cling | +0.675 |
rients | +0.674 |
-$ | +0.672 |
Neg logit contributions | |
assian | -0.782 |
hower | -0.761 |
orah | -0.742 |
oops | -0.736 |
hari | -0.734 |
Token | will |
Token ID | 481 |
Feature activation | +7.09e-01 |
Pos logit contributions | |
llor | +0.526 |
zag | +0.503 |
cling | +0.498 |
-$ | +0.498 |
rients | +0.497 |
Neg logit contributions | |
assian | -0.626 |
hower | -0.607 |
orah | -0.593 |
oops | -0.590 |
hari | -0.587 |
Token | inaug |
Token ID | 14243 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
llor | +2.372 |
zag | +2.264 |
cling | +2.251 |
-$ | +2.242 |
rients | +2.199 |
Neg logit contributions | |
assian | -3.070 |
hower | -2.957 |
oops | -2.891 |
hari | -2.887 |
orah | -2.862 |
Token | urate |
Token ID | 15537 |
Feature activation | +2.74e-01 |
Pos logit contributions | |
llor | +4.108 |
zag | +4.073 |
cling | +3.853 |
rients | +3.784 |
-$ | +3.715 |
Neg logit contributions | |
assian | -9.306 |
hower | -9.247 |
hari | -9.069 |
oops | -9.029 |
anooga | -8.850 |
Token | a |
Token ID | 257 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
llor | +0.889 |
zag | +0.851 |
cling | +0.837 |
rients | +0.836 |
-$ | +0.830 |
Neg logit contributions | |
assian | -1.205 |
hower | -1.175 |
orah | -1.151 |
oops | -1.142 |
hari | -1.138 |
Token | bear |
Token ID | 6842 |
Feature activation | -7.70e-03 |
Pos logit contributions | |
assian | +0.736 |
hower | +0.717 |
orah | +0.703 |
oops | +0.698 |
hari | +0.695 |
Neg logit contributions | |
llor | -0.624 |
zag | -0.600 |
rients | -0.594 |
cling | -0.590 |
-$ | -0.581 |
Token | market |
Token ID | 1910 |
Feature activation | +8.65e-02 |
Pos logit contributions | |
assian | +0.032 |
hower | +0.031 |
orah | +0.030 |
oops | +0.030 |
hari | +0.030 |
Neg logit contributions | |
llor | -0.027 |
zag | -0.026 |
-$ | -0.025 |
cling | -0.025 |
rients | -0.025 |
Token | like |
Token ID | 588 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
llor | +0.300 |
zag | +0.288 |
cling | +0.284 |
rients | +0.283 |
-$ | +0.283 |
Neg logit contributions | |
assian | -0.362 |
hower | -0.352 |
orah | -0.344 |
oops | -0.342 |
hari | -0.340 |
Token | that |
Token ID | 326 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
llor | +0.922 |
zag | +0.890 |
cling | +0.877 |
rients | +0.877 |
-$ | +0.869 |
Neg logit contributions | |
assian | -0.933 |
hower | -0.907 |
orah | -0.885 |
oops | -0.878 |
hari | -0.875 |
Token | small |
Token ID | 1402 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
llor | +1.351 |
zag | +1.303 |
cling | +1.286 |
rients | +1.283 |
-$ | +1.272 |
Neg logit contributions | |
assian | -1.495 |
hower | -1.457 |
orah | -1.423 |
hari | -1.406 |
oops | -1.406 |
Token | pieces |
Token ID | 5207 |
Feature activation | +6.04e-01 |
Pos logit contributions | |
assian | +1.213 |
hower | +1.175 |
oops | +1.156 |
orah | +1.155 |
hari | +1.145 |
Neg logit contributions | |
llor | -0.950 |
zag | -0.905 |
rients | -0.892 |
cling | -0.891 |
-$ | -0.880 |
Token | of |
Token ID | 286 |
Feature activation | +3.09e-01 |
Pos logit contributions | |
llor | +2.178 |
zag | +2.116 |
cling | +2.096 |
rients | +2.072 |
-$ | +2.064 |
Neg logit contributions | |
assian | -2.405 |
hower | -2.346 |
orah | -2.291 |
oops | -2.279 |
hari | -2.265 |
Token | rubber |
Token ID | 14239 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
llor | +1.044 |
zag | +1.001 |
cling | +0.985 |
rients | +0.985 |
-$ | +0.975 |
Neg logit contributions | |
assian | -1.315 |
hower | -1.281 |
orah | -1.255 |
oops | -1.246 |
hari | -1.241 |
Token | wrapped |
Token ID | 12908 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
cling | +4.383 |
llor | +4.381 |
zag | +4.369 |
-$ | +4.278 |
rients | +4.215 |
Neg logit contributions | |
assian | -5.864 |
hower | -5.826 |
orah | -5.663 |
hari | -5.513 |
oops | -5.505 |
Token | around |
Token ID | 1088 |
Feature activation | +6.35e-01 |
Pos logit contributions | |
cling | +4.153 |
zag | +4.140 |
llor | +4.101 |
-$ | +3.972 |
rients | +3.904 |
Neg logit contributions | |
assian | -9.413 |
hower | -9.339 |
orah | -8.964 |
hari | -8.905 |
oops | -8.795 |
Token | a |
Token ID | 257 |
Feature activation | -5.94e-02 |
Pos logit contributions | |
llor | +2.199 |
zag | +2.134 |
cling | +2.108 |
rients | +2.099 |
-$ | +2.082 |
Neg logit contributions | |
assian | -2.632 |
hower | -2.582 |
orah | -2.518 |
oops | -2.476 |
hari | -2.476 |
Token | car |
Token ID | 1097 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
assian | +0.232 |
hower | +0.225 |
orah | +0.221 |
oops | +0.219 |
hari | +0.218 |
Neg logit contributions | |
llor | -0.222 |
zag | -0.213 |
rients | -0.210 |
cling | -0.210 |
-$ | -0.208 |
Token | antenna |
Token ID | 20509 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
llor | +1.053 |
zag | +1.016 |
cling | +1.005 |
rients | +0.992 |
-$ | +0.986 |
Neg logit contributions | |
assian | -1.450 |
hower | -1.421 |
orah | -1.382 |
hari | -1.374 |
oops | -1.373 |
Token | can |
Token ID | 460 |
Feature activation | -3.23e-02 |
Pos logit contributions | |
llor | +1.898 |
zag | +1.842 |
cling | +1.832 |
rients | +1.802 |
-$ | +1.800 |
Neg logit contributions | |
assian | -2.467 |
hower | -2.408 |
orah | -2.356 |
oops | -2.342 |
hari | -2.330 |
Token | the |
Token ID | 262 |
Feature activation | +6.61e-02 |
Pos logit contributions | |
llor | +1.226 |
zag | +1.176 |
cling | +1.161 |
rients | +1.159 |
-$ | +1.154 |
Neg logit contributions | |
assian | -1.477 |
hower | -1.440 |
orah | -1.404 |
oops | -1.395 |
hari | -1.393 |
Token | flagship |
Token ID | 21336 |
Feature activation | +4.78e-01 |
Pos logit contributions | |
llor | +0.216 |
zag | +0.207 |
cling | +0.204 |
rients | +0.204 |
-$ | +0.202 |
Neg logit contributions | |
assian | -0.288 |
hower | -0.281 |
orah | -0.276 |
oops | -0.274 |
hari | -0.273 |
Token | design |
Token ID | 1486 |
Feature activation | +8.05e-01 |
Pos logit contributions | |
llor | +1.533 |
zag | +1.470 |
-$ | +1.451 |
rients | +1.439 |
cling | +1.439 |
Neg logit contributions | |
assian | -2.108 |
hower | -2.058 |
orah | -2.002 |
hari | -1.993 |
oops | -1.992 |
Token | concept |
Token ID | 3721 |
Feature activation | +2.42e-01 |
Pos logit contributions | |
llor | +2.651 |
zag | +2.575 |
-$ | +2.551 |
rients | +2.530 |
cling | +2.528 |
Neg logit contributions | |
assian | -3.395 |
hower | -3.330 |
orah | -3.219 |
hari | -3.212 |
oops | -3.200 |
Token | of |
Token ID | 286 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
llor | +0.862 |
zag | +0.829 |
cling | +0.816 |
rients | +0.816 |
-$ | +0.813 |
Neg logit contributions | |
assian | -0.984 |
hower | -0.958 |
orah | -0.935 |
oops | -0.930 |
hari | -0.929 |
Token | Lightning |
Token ID | 12469 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
llor | +0.715 |
zag | +0.688 |
rients | +0.678 |
cling | +0.678 |
-$ | +0.674 |
Neg logit contributions | |
assian | -0.820 |
hower | -0.798 |
orah | -0.779 |
oops | -0.774 |
hari | -0.772 |
Token | series |
Token ID | 2168 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
llor | +5.629 |
-$ | +5.552 |
zag | +5.377 |
cling | +5.275 |
rients | +5.255 |
Neg logit contributions | |
assian | -7.627 |
hower | -7.526 |
oops | -7.320 |
hari | -7.305 |
orah | -7.238 |
Token | into |
Token ID | 656 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
llor | +3.589 |
-$ | +3.488 |
zag | +3.422 |
rients | +3.380 |
distingu | +3.366 |
Neg logit contributions | |
assian | -4.747 |
hower | -4.673 |
hari | -4.536 |
oops | -4.458 |
orah | -4.440 |
Token | R |
Token ID | 371 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
llor | +0.575 |
zag | +0.554 |
cling | +0.546 |
rients | +0.545 |
-$ | +0.541 |
Neg logit contributions | |
assian | -0.666 |
hower | -0.648 |
orah | -0.633 |
oops | -0.630 |
hari | -0.628 |
Token | 78 |
Token ID | 3695 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
assian | +1.016 |
hower | +0.984 |
orah | +0.969 |
oops | +0.962 |
hari | +0.958 |
Neg logit contributions | |
llor | -0.830 |
zag | -0.797 |
cling | -0.788 |
rients | -0.787 |
-$ | -0.772 |
Token | 70 |
Token ID | 2154 |
Feature activation | +4.61e-01 |
Pos logit contributions | |
llor | +0.845 |
zag | +0.799 |
cling | +0.782 |
rients | +0.782 |
-$ | +0.768 |
Neg logit contributions | |
assian | -1.713 |
hower | -1.675 |
orah | -1.648 |
oops | -1.638 |
hari | -1.633 |
Token | but |
Token ID | 475 |
Feature activation | +8.16e-01 |
Pos logit contributions | |
llor | +0.445 |
zag | +0.432 |
rients | +0.422 |
cling | +0.422 |
-$ | +0.422 |
Neg logit contributions | |
assian | -0.518 |
hower | -0.508 |
orah | -0.495 |
oops | -0.490 |
hari | -0.489 |
Token | that |
Token ID | 326 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
llor | +2.798 |
zag | +2.672 |
-$ | +2.652 |
rients | +2.644 |
cling | +2.616 |
Neg logit contributions | |
assian | -3.386 |
hower | -3.344 |
hari | -3.226 |
oops | -3.216 |
orah | -3.206 |
Token | the |
Token ID | 262 |
Feature activation | +3.37e-01 |
Pos logit contributions | |
llor | +1.831 |
zag | +1.762 |
-$ | +1.739 |
rients | +1.735 |
cling | +1.730 |
Neg logit contributions | |
assian | -2.233 |
hower | -2.205 |
orah | -2.131 |
hari | -2.126 |
oops | -2.119 |
Token | studio |
Token ID | 8034 |
Feature activation | +3.17e-01 |
Pos logit contributions | |
llor | +1.183 |
zag | +1.148 |
rients | +1.123 |
cling | +1.122 |
-$ | +1.121 |
Neg logit contributions | |
assian | -1.377 |
hower | -1.356 |
orah | -1.315 |
hari | -1.309 |
oops | -1.308 |
Token | cannot |
Token ID | 2314 |
Feature activation | +2.94e-01 |
Pos logit contributions | |
llor | +1.057 |
zag | +1.012 |
cling | +0.998 |
rients | +0.995 |
-$ | +0.992 |
Neg logit contributions | |
assian | -1.366 |
hower | -1.338 |
orah | -1.300 |
oops | -1.297 |
hari | -1.292 |
Token | dedicate |
Token ID | 39383 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
llor | +1.011 |
zag | +0.970 |
cling | +0.956 |
rients | +0.954 |
-$ | +0.950 |
Neg logit contributions | |
assian | -1.235 |
hower | -1.204 |
orah | -1.174 |
oops | -1.169 |
hari | -1.166 |
Token | more |
Token ID | 517 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
-$ | +5.505 |
llor | +5.464 |
zag | +5.367 |
rients | +5.192 |
cling | +5.099 |
Neg logit contributions | |
hower | -7.817 |
assian | -7.693 |
hari | -7.439 |
orah | -7.432 |
oops | -7.295 |
Token | than |
Token ID | 621 |
Feature activation | +6.49e-01 |
Pos logit contributions | |
llor | +1.926 |
-$ | +1.861 |
zag | +1.856 |
cling | +1.829 |
rients | +1.820 |
Neg logit contributions | |
assian | -2.425 |
hower | -2.419 |
hari | -2.328 |
oops | -2.325 |
orah | -2.323 |
Token | 5 |
Token ID | 642 |
Feature activation | +4.08e-01 |
Pos logit contributions | |
llor | +2.073 |
zag | +2.013 |
-$ | +2.011 |
cling | +1.968 |
rients | +1.955 |
Neg logit contributions | |
assian | -2.825 |
hower | -2.803 |
orah | -2.717 |
oops | -2.701 |
hari | -2.701 |
Token | % |
Token ID | 4 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
llor | +1.503 |
-$ | +1.467 |
zag | +1.449 |
cling | +1.438 |
rients | +1.435 |
Neg logit contributions | |
hower | -1.576 |
assian | -1.575 |
orah | -1.512 |
oops | -1.497 |
hari | -1.494 |
Token | of |
Token ID | 286 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
llor | +1.801 |
zag | +1.732 |
cling | +1.708 |
rients | +1.708 |
-$ | +1.700 |
Neg logit contributions | |
assian | -1.822 |
hower | -1.776 |
orah | -1.732 |
oops | -1.718 |
hari | -1.711 |
Token | for |
Token ID | 329 |
Feature activation | +6.72e-01 |
Pos logit contributions | |
llor | +1.681 |
zag | +1.610 |
-$ | +1.594 |
rients | +1.586 |
cling | +1.585 |
Neg logit contributions | |
assian | -1.871 |
hower | -1.836 |
oops | -1.785 |
orah | -1.767 |
hari | -1.756 |
Token | international |
Token ID | 3230 |
Feature activation | +6.50e-01 |
Pos logit contributions | |
llor | +2.129 |
zag | +2.055 |
rients | +2.035 |
cling | +2.018 |
-$ | +2.010 |
Neg logit contributions | |
assian | -2.977 |
hower | -2.927 |
hari | -2.833 |
orah | -2.824 |
oops | -2.813 |
Token | freedom |
Token ID | 4925 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
llor | +2.303 |
zag | +2.243 |
rients | +2.218 |
cling | +2.210 |
-$ | +2.204 |
Neg logit contributions | |
assian | -2.616 |
hower | -2.577 |
hari | -2.470 |
oops | -2.463 |
orah | -2.463 |
Token | of |
Token ID | 286 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
llor | +1.379 |
zag | +1.325 |
cling | +1.309 |
rients | +1.304 |
-$ | +1.297 |
Neg logit contributions | |
assian | -1.525 |
hower | -1.482 |
orah | -1.442 |
oops | -1.442 |
hari | -1.427 |
Token | expression |
Token ID | 5408 |
Feature activation | +9.55e-02 |
Pos logit contributions | |
llor | +0.371 |
zag | +0.357 |
cling | +0.351 |
rients | +0.351 |
-$ | +0.347 |
Neg logit contributions | |
assian | -0.424 |
hower | -0.413 |
orah | -0.403 |
oops | -0.400 |
hari | -0.399 |
Token | Jill |
Token ID | 22772 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
llor | +0.371 |
zag | +0.357 |
rients | +0.352 |
cling | +0.352 |
-$ | +0.350 |
Neg logit contributions | |
assian | -0.359 |
hower | -0.349 |
orah | -0.340 |
oops | -0.338 |
hari | -0.336 |
Token | ian |
Token ID | 666 |
Feature activation | +5.75e-01 |
Pos logit contributions | |
llor | +6.403 |
zag | +6.040 |
cling | +5.997 |
rients | +5.874 |
nc | +5.851 |
Neg logit contributions | |
assian | -6.794 |
hower | -6.557 |
oops | -6.492 |
hari | -6.285 |
orah | -6.281 |
Token | C |
Token ID | 327 |
Feature activation | +6.54e-01 |
Pos logit contributions | |
llor | +2.064 |
zag | +1.980 |
cling | +1.959 |
rients | +1.951 |
-$ | +1.929 |
Neg logit contributions | |
assian | -2.304 |
hower | -2.236 |
orah | -2.179 |
oops | -2.177 |
hari | -2.165 |
Token | . |
Token ID | 13 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
llor | +2.613 |
zag | +2.509 |
cling | +2.480 |
rients | +2.465 |
-$ | +2.430 |
Neg logit contributions | |
assian | -2.336 |
hower | -2.306 |
orah | -2.241 |
oops | -2.218 |
hari | -2.185 |
Token | York |
Token ID | 1971 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
llor | +1.208 |
zag | +1.162 |
cling | +1.153 |
rients | +1.144 |
-$ | +1.130 |
Neg logit contributions | |
assian | -1.339 |
hower | -1.300 |
orah | -1.275 |
oops | -1.271 |
hari | -1.259 |
Token | added |
Token ID | 2087 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
assian | +0.942 |
hower | +0.917 |
orah | +0.897 |
oops | +0.888 |
hari | +0.886 |
Neg logit contributions | |
llor | -0.845 |
zag | -0.814 |
cling | -0.801 |
rients | -0.801 |
-$ | -0.793 |
Token | the |
Token ID | 262 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
llor | +0.325 |
zag | +0.310 |
rients | +0.306 |
cling | +0.306 |
-$ | +0.302 |
Neg logit contributions | |
assian | -0.376 |
hower | -0.366 |
orah | -0.359 |
oops | -0.356 |
hari | -0.355 |
Token | game |
Token ID | 983 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
llor | +0.488 |
zag | +0.468 |
cling | +0.462 |
rients | +0.460 |
-$ | +0.456 |
Neg logit contributions | |
assian | -0.568 |
hower | -0.553 |
orah | -0.542 |
oops | -0.538 |
hari | -0.535 |
Token | for |
Token ID | 329 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
assian | +1.040 |
hower | +1.011 |
orah | +0.990 |
oops | +0.982 |
hari | +0.979 |
Neg logit contributions | |
llor | -0.922 |
zag | -0.885 |
cling | -0.874 |
rients | -0.873 |
-$ | -0.860 |
Token | the |
Token ID | 262 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
llor | +0.841 |
zag | +0.811 |
cling | +0.799 |
rients | +0.799 |
-$ | +0.794 |
Neg logit contributions | |
assian | -0.959 |
hower | -0.933 |
orah | -0.913 |
oops | -0.904 |
hari | -0.903 |
Token | first |
Token ID | 717 |
Feature activation | +7.28e-01 |
Pos logit contributions | |
llor | +0.408 |
zag | +0.392 |
cling | +0.387 |
rients | +0.387 |
-$ | +0.383 |
Neg logit contributions | |
assian | -0.436 |
hower | -0.424 |
orah | -0.415 |
oops | -0.411 |
hari | -0.410 |
Token | time |
Token ID | 640 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
llor | +2.036 |
-$ | +1.975 |
zag | +1.964 |
cling | +1.951 |
rients | +1.914 |
Neg logit contributions | |
assian | -3.445 |
hower | -3.364 |
orah | -3.313 |
oops | -3.298 |
hari | -3.266 |
Token | . |
Token ID | 13 |
Feature activation | +2.02e-01 |
Pos logit contributions | |
llor | +4.832 |
-$ | +4.726 |
zag | +4.558 |
cling | +4.509 |
� | +4.502 |
Neg logit contributions | |
assian | -8.339 |
orah | -8.046 |
hower | -7.970 |
oops | -7.960 |
hari | -7.841 |
Token | The |
Token ID | 383 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
llor | +0.714 |
zag | +0.686 |
rients | +0.679 |
cling | +0.678 |
-$ | +0.678 |
Neg logit contributions | |
assian | -0.826 |
hower | -0.805 |
orah | -0.784 |
oops | -0.781 |
hari | -0.779 |
Token | added |
Token ID | 2087 |
Feature activation | -8.00e-01 |
Pos logit contributions | |
llor | +0.421 |
zag | +0.404 |
cling | +0.398 |
rients | +0.398 |
-$ | +0.395 |
Neg logit contributions | |
assian | -0.519 |
hower | -0.505 |
orah | -0.494 |
oops | -0.492 |
hari | -0.490 |
Token | Game |
Token ID | 3776 |
Feature activation | -7.40e-01 |
Pos logit contributions | |
assian | +3.085 |
hower | +3.009 |
orah | +2.925 |
oops | +2.885 |
hari | +2.877 |
Neg logit contributions | |
llor | -2.998 |
zag | -2.876 |
cling | -2.810 |
rients | -2.788 |
-$ | -2.733 |
Token | Pad |
Token ID | 26114 |
Feature activation | +6.74e-01 |
Pos logit contributions | |
assian | +4.121 |
hower | +4.032 |
oops | +3.955 |
orah | +3.948 |
hari | +3.937 |
Neg logit contributions | |
llor | -1.487 |
zag | -1.416 |
cling | -1.358 |
rients | -1.356 |
-$ | -1.304 |
Token | Fil |
Token ID | 11928 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
llor | +0.775 |
zag | +0.748 |
cling | +0.739 |
rients | +0.734 |
-$ | +0.728 |
Neg logit contributions | |
assian | -0.961 |
hower | -0.935 |
orah | -0.913 |
hari | -0.900 |
oops | -0.898 |
Token | ber |
Token ID | 527 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
llor | +1.312 |
zag | +1.271 |
cling | +1.263 |
rients | +1.256 |
-$ | +1.252 |
Neg logit contributions | |
assian | -2.070 |
hower | -2.040 |
orah | -1.963 |
oops | -1.949 |
hari | -1.932 |
Token | ts |
Token ID | 912 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
assian | +1.039 |
hower | +1.013 |
orah | +0.995 |
oops | +0.991 |
hari | +0.985 |
Neg logit contributions | |
llor | -0.750 |
zag | -0.715 |
cling | -0.704 |
rients | -0.698 |
-$ | -0.696 |
Token | ) |
Token ID | 8 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
assian | +0.699 |
hower | +0.681 |
orah | +0.666 |
oops | +0.662 |
hari | +0.659 |
Neg logit contributions | |
llor | -0.587 |
zag | -0.564 |
cling | -0.555 |
rients | -0.554 |
-$ | -0.548 |
Token | , |
Token ID | 837 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
llor | +1.231 |
zag | +1.180 |
rients | +1.174 |
cling | +1.166 |
-$ | +1.155 |
Neg logit contributions | |
assian | -1.593 |
hower | -1.551 |
orah | -1.518 |
oops | -1.499 |
hari | -1.491 |
Token | Pist |
Token ID | 18667 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
llor | +0.349 |
zag | +0.335 |
cling | +0.330 |
rients | +0.329 |
-$ | +0.327 |
Neg logit contributions | |
assian | -0.437 |
hower | -0.426 |
orah | -0.417 |
oops | -0.413 |
hari | -0.411 |
Token | ach |
Token ID | 620 |
Feature activation | +4.94e-01 |
Pos logit contributions | |
llor | +4.215 |
nc | +4.014 |
zag | +4.008 |
rients | +3.819 |
cling | +3.783 |
Neg logit contributions | |
hower | -9.030 |
assian | -8.690 |
orah | -8.420 |
Commands | -8.217 |
hari | -8.215 |
Token | ios |
Token ID | 4267 |
Feature activation | -2.75e-01 |
Pos logit contributions | |
llor | +2.043 |
zag | +1.980 |
rients | +1.964 |
cling | +1.936 |
-$ | +1.924 |
Neg logit contributions | |
hower | -1.712 |
assian | -1.711 |
orah | -1.615 |
hari | -1.611 |
oops | -1.597 |
Token | , |
Token ID | 837 |
Feature activation | +4.25e-01 |
Pos logit contributions | |
assian | +1.179 |
hower | +1.147 |
orah | +1.126 |
oops | +1.122 |
hari | +1.117 |
Neg logit contributions | |
llor | -0.921 |
zag | -0.884 |
cling | -0.868 |
rients | -0.864 |
-$ | -0.857 |
Token | Cas |
Token ID | 11294 |
Feature activation | +7.76e-01 |
Pos logit contributions | |
llor | +1.421 |
zag | +1.367 |
cling | +1.345 |
rients | +1.342 |
-$ | +1.337 |
Neg logit contributions | |
assian | -1.820 |
hower | -1.775 |
orah | -1.743 |
oops | -1.719 |
hari | -1.701 |
Token | hews |
Token ID | 40645 |
Feature activation | +6.35e-01 |
Pos logit contributions | |
llor | +2.677 |
zag | +2.670 |
cling | +2.589 |
rients | +2.551 |
nc | +2.531 |
Neg logit contributions | |
hower | -3.188 |
assian | -3.070 |
orah | -2.928 |
hari | -2.923 |
oops | -2.915 |
Token | found |
Token ID | 1043 |
Feature activation | +7.46e-01 |
Pos logit contributions | |
llor | +0.471 |
zag | +0.451 |
cling | +0.448 |
rients | +0.442 |
-$ | +0.441 |
Neg logit contributions | |
assian | -0.612 |
hower | -0.597 |
orah | -0.583 |
oops | -0.578 |
hari | -0.578 |
Token | like |
Token ID | 588 |
Feature activation | +5.86e-01 |
Pos logit contributions | |
llor | +2.484 |
zag | +2.405 |
-$ | +2.361 |
cling | +2.360 |
rients | +2.348 |
Neg logit contributions | |
assian | -3.167 |
hower | -3.105 |
orah | -3.045 |
oops | -2.995 |
hari | -2.974 |
Token | a |
Token ID | 257 |
Feature activation | +6.87e-01 |
Pos logit contributions | |
llor | +1.959 |
zag | +1.890 |
cling | +1.864 |
-$ | +1.859 |
rients | +1.849 |
Neg logit contributions | |
assian | -2.503 |
hower | -2.443 |
orah | -2.390 |
oops | -2.366 |
hari | -2.357 |
Token | piece |
Token ID | 3704 |
Feature activation | +4.69e-01 |
Pos logit contributions | |
llor | +2.350 |
zag | +2.259 |
cling | +2.243 |
-$ | +2.238 |
rients | +2.200 |
Neg logit contributions | |
assian | -2.869 |
hower | -2.798 |
orah | -2.729 |
oops | -2.718 |
hari | -2.679 |
Token | of |
Token ID | 286 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
llor | +1.716 |
zag | +1.663 |
cling | +1.635 |
-$ | +1.633 |
rients | +1.615 |
Neg logit contributions | |
assian | -1.848 |
hower | -1.794 |
orah | -1.759 |
oops | -1.743 |
hari | -1.743 |
Token | ply |
Token ID | 35960 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
llor | +0.341 |
zag | +0.322 |
rients | +0.318 |
cling | +0.316 |
-$ | +0.311 |
Neg logit contributions | |
assian | -0.621 |
hower | -0.606 |
orah | -0.595 |
oops | -0.593 |
hari | -0.591 |
Token | wood |
Token ID | 3822 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
llor | +5.410 |
cling | +5.265 |
zag | +5.246 |
-$ | +5.142 |
nc | +5.015 |
Neg logit contributions | |
hower | -7.507 |
orah | -7.444 |
assian | -7.382 |
hari | -7.195 |
oops | -7.164 |
Token | . |
Token ID | 13 |
Feature activation | +4.04e-01 |
Pos logit contributions | |
llor | +3.979 |
-$ | +3.869 |
zag | +3.864 |
cling | +3.842 |
rients | +3.729 |
Neg logit contributions | |
assian | -4.838 |
hower | -4.764 |
orah | -4.681 |
hari | -4.611 |
oops | -4.562 |
Token | So |
Token ID | 1406 |
Feature activation | -4.90e-01 |
Pos logit contributions | |
llor | +1.480 |
zag | +1.423 |
-$ | +1.414 |
cling | +1.414 |
rients | +1.401 |
Neg logit contributions | |
assian | -1.595 |
hower | -1.555 |
orah | -1.514 |
hari | -1.506 |
oops | -1.486 |
Token | okay |
Token ID | 8788 |
Feature activation | -4.20e-01 |
Pos logit contributions | |
assian | +1.887 |
hower | +1.830 |
orah | +1.797 |
oops | +1.792 |
hari | +1.774 |
Neg logit contributions | |
llor | -1.842 |
zag | -1.785 |
rients | -1.763 |
cling | -1.749 |
-$ | -1.729 |
Token | , |
Token ID | 11 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
assian | +1.696 |
hower | +1.644 |
orah | +1.611 |
oops | +1.609 |
hari | +1.593 |
Neg logit contributions | |
llor | -1.509 |
zag | -1.460 |
rients | -1.438 |
cling | -1.434 |
-$ | -1.419 |
Token | be |
Token ID | 307 |
Feature activation | +1.67e-02 |
Pos logit contributions | |
llor | +0.158 |
zag | +0.152 |
cling | +0.150 |
rients | +0.150 |
-$ | +0.149 |
Neg logit contributions | |
assian | -0.184 |
hower | -0.179 |
orah | -0.176 |
oops | -0.174 |
hari | -0.174 |
Token | covered |
Token ID | 5017 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
llor | +0.063 |
zag | +0.061 |
cling | +0.061 |
rients | +0.060 |
-$ | +0.060 |
Neg logit contributions | |
assian | -0.064 |
hower | -0.062 |
orah | -0.061 |
oops | -0.060 |
hari | -0.060 |
Token | up |
Token ID | 510 |
Feature activation | +5.89e-01 |
Pos logit contributions | |
llor | +3.116 |
zag | +3.027 |
cling | +2.992 |
-$ | +2.992 |
rients | +2.940 |
Neg logit contributions | |
assian | -4.465 |
hower | -4.345 |
orah | -4.213 |
oops | -4.207 |
hari | -4.189 |
Token | by |
Token ID | 416 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
llor | +1.958 |
zag | +1.873 |
cling | +1.866 |
-$ | +1.857 |
rients | +1.843 |
Neg logit contributions | |
assian | -2.539 |
hower | -2.474 |
orah | -2.417 |
oops | -2.403 |
hari | -2.395 |
Token | plastic |
Token ID | 7309 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
llor | +0.987 |
zag | +0.950 |
cling | +0.943 |
rients | +0.934 |
-$ | +0.930 |
Neg logit contributions | |
assian | -1.201 |
hower | -1.170 |
orah | -1.145 |
oops | -1.135 |
hari | -1.132 |
Token | circles |
Token ID | 13332 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
llor | +4.501 |
cling | +4.414 |
-$ | +4.383 |
zag | +4.378 |
rients | +4.280 |
Neg logit contributions | |
assian | -5.949 |
hower | -5.847 |
orah | -5.678 |
hari | -5.569 |
oops | -5.541 |
Token | which |
Token ID | 543 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
llor | +5.078 |
-$ | +5.017 |
zag | +5.012 |
cling | +4.944 |
nc | +4.698 |
Neg logit contributions | |
assian | -7.635 |
hower | -7.516 |
hari | -7.421 |
orah | -7.420 |
oops | -7.311 |
Token | can |
Token ID | 460 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
llor | +1.515 |
zag | +1.465 |
cling | +1.447 |
rients | +1.438 |
-$ | +1.432 |
Neg logit contributions | |
assian | -1.793 |
hower | -1.737 |
orah | -1.702 |
hari | -1.692 |
oops | -1.686 |
Token | easily |
Token ID | 3538 |
Feature activation | -2.75e-01 |
Pos logit contributions | |
assian | +0.681 |
hower | +0.665 |
orah | +0.652 |
oops | +0.647 |
hari | +0.644 |
Neg logit contributions | |
llor | -0.534 |
zag | -0.511 |
rients | -0.504 |
cling | -0.500 |
-$ | -0.497 |
Token | be |
Token ID | 307 |
Feature activation | -9.44e-02 |
Pos logit contributions | |
assian | +1.178 |
hower | +1.150 |
orah | +1.130 |
oops | +1.122 |
hari | +1.114 |
Neg logit contributions | |
llor | -0.922 |
zag | -0.873 |
rients | -0.867 |
cling | -0.856 |
-$ | -0.851 |
Token | pulled |
Token ID | 5954 |
Feature activation | -4.06e-01 |
Pos logit contributions | |
assian | +0.371 |
hower | +0.361 |
orah | +0.353 |
oops | +0.350 |
hari | +0.349 |
Neg logit contributions | |
llor | -0.350 |
zag | -0.338 |
cling | -0.333 |
rients | -0.333 |
-$ | -0.330 |
Token | Christmas |
Token ID | 6786 |
Feature activation | +6.68e-01 |
Pos logit contributions | |
llor | +1.986 |
zag | +1.906 |
cling | +1.874 |
rients | +1.859 |
-$ | +1.858 |
Neg logit contributions | |
assian | -2.567 |
hower | -2.501 |
orah | -2.440 |
oops | -2.427 |
hari | -2.423 |
Token | Story |
Token ID | 8362 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
llor | +2.043 |
zag | +1.954 |
-$ | +1.930 |
cling | +1.924 |
rients | +1.887 |
Neg logit contributions | |
assian | -3.033 |
hower | -2.948 |
oops | -2.882 |
hari | -2.877 |
orah | -2.854 |
Token | " |
Token ID | 1 |
Feature activation | -3.27e-01 |
Pos logit contributions | |
llor | +1.651 |
zag | +1.570 |
-$ | +1.537 |
rients | +1.537 |
cling | +1.536 |
Neg logit contributions | |
assian | -2.709 |
hower | -2.642 |
oops | -2.577 |
orah | -2.576 |
hari | -2.571 |
Token | and |
Token ID | 290 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
assian | +1.325 |
hower | +1.290 |
orah | +1.268 |
oops | +1.256 |
hari | +1.251 |
Neg logit contributions | |
llor | -1.165 |
zag | -1.119 |
cling | -1.105 |
rients | -1.105 |
-$ | -1.085 |
Token | " |
Token ID | 366 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
llor | +0.796 |
zag | +0.768 |
cling | +0.759 |
rients | +0.759 |
-$ | +0.752 |
Neg logit contributions | |
assian | -0.689 |
hower | -0.667 |
orah | -0.651 |
oops | -0.646 |
hari | -0.642 |
Token | Mir |
Token ID | 27453 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
assian | +0.544 |
hower | +0.531 |
orah | +0.519 |
hari | +0.514 |
oops | +0.513 |
Neg logit contributions | |
llor | -0.440 |
zag | -0.423 |
cling | -0.417 |
rients | -0.415 |
-$ | -0.414 |
Token | acle |
Token ID | 6008 |
Feature activation | +5.44e-01 |
Pos logit contributions | |
llor | +5.435 |
zag | +5.432 |
cling | +5.395 |
rients | +5.297 |
-$ | +5.176 |
Neg logit contributions | |
assian | -7.134 |
hower | -7.023 |
oops | -6.918 |
hari | -6.765 |
oleon | -6.506 |
Token | on |
Token ID | 319 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
llor | +1.746 |
rients | +1.634 |
zag | +1.633 |
-$ | +1.632 |
cling | +1.600 |
Neg logit contributions | |
assian | -2.426 |
hower | -2.338 |
hari | -2.297 |
orah | -2.292 |
oops | -2.281 |
Token | 34 |
Token ID | 4974 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
assian | +0.743 |
hower | +0.727 |
orah | +0.711 |
oops | +0.706 |
hari | +0.704 |
Neg logit contributions | |
llor | -0.434 |
zag | -0.412 |
cling | -0.406 |
rients | -0.405 |
-$ | -0.403 |
Token | th |
Token ID | 400 |
Feature activation | -8.65e-02 |
Pos logit contributions | |
assian | +0.540 |
hower | +0.533 |
hari | +0.516 |
orah | +0.512 |
oops | +0.510 |
Neg logit contributions | |
llor | -0.306 |
zag | -0.293 |
rients | -0.290 |
-$ | -0.290 |
cling | -0.285 |
Token | Street |
Token ID | 3530 |
Feature activation | +2.02e-01 |
Pos logit contributions | |
assian | +0.370 |
hower | +0.360 |
orah | +0.353 |
oops | +0.351 |
hari | +0.350 |
Neg logit contributions | |
llor | -0.292 |
zag | -0.279 |
cling | -0.275 |
rients | -0.275 |
-$ | -0.274 |
Token | - |
Token ID | 12 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
llor | +4.443 |
zag | +4.220 |
-$ | +4.210 |
cling | +4.184 |
rients | +4.174 |
Neg logit contributions | |
assian | -6.285 |
hower | -6.183 |
hari | -5.914 |
orah | -5.897 |
oops | -5.878 |
Token | cyclop |
Token ID | 22873 |
Feature activation | +7.15e-01 |
Pos logit contributions | |
llor | +1.507 |
zag | +1.439 |
cling | +1.421 |
rients | +1.409 |
-$ | +1.395 |
Neg logit contributions | |
assian | -2.263 |
hower | -2.203 |
orah | -2.163 |
hari | -2.140 |
oops | -2.123 |
Token | rop |
Token ID | 1773 |
Feature activation | +9.18e-01 |
Pos logit contributions | |
llor | +2.311 |
rients | +2.177 |
zag | +2.139 |
cling | +2.110 |
-$ | +2.098 |
Neg logit contributions | |
assian | -3.167 |
hower | -3.141 |
hari | -3.039 |
oops | -2.994 |
orah | -2.963 |
Token | yl |
Token ID | 2645 |
Feature activation | +5.74e-01 |
Pos logit contributions | |
llor | +3.605 |
rients | +3.444 |
zag | +3.338 |
-$ | +3.328 |
cling | +3.325 |
Neg logit contributions | |
hower | -3.387 |
assian | -3.377 |
hari | -3.230 |
oops | -3.164 |
orah | -3.141 |
Token | methyl |
Token ID | 43654 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
llor | +1.990 |
zag | +1.904 |
rients | +1.885 |
cling | +1.881 |
-$ | +1.865 |
Neg logit contributions | |
assian | -2.396 |
hower | -2.341 |
orah | -2.289 |
oops | -2.264 |
hari | -2.261 |
Token | - |
Token ID | 12 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
llor | +3.833 |
zag | +3.646 |
rients | +3.638 |
-$ | +3.631 |
cling | +3.629 |
Neg logit contributions | |
assian | -4.441 |
hower | -4.349 |
orah | -4.260 |
hari | -4.195 |
oops | -4.159 |
Token | 7 |
Token ID | 22 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
llor | +4.718 |
-$ | +4.540 |
nc | +4.532 |
zag | +4.519 |
cling | +4.462 |
Neg logit contributions | |
assian | -8.168 |
hower | -7.879 |
orah | -7.803 |
hari | -7.536 |
oops | -7.469 |
Token | -( |
Token ID | 30420 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
llor | +4.038 |
-$ | +3.871 |
zag | +3.786 |
rients | +3.702 |
nc | +3.674 |
Neg logit contributions | |
assian | -7.223 |
hower | -7.078 |
orah | -6.934 |
hari | -6.876 |
oops | -6.864 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
llor | +3.465 |
-$ | +3.267 |
zag | +3.259 |
nc | +3.180 |
cling | +3.095 |
Neg logit contributions | |
assian | -7.663 |
hower | -7.472 |
orah | -7.260 |
hari | -7.245 |
oops | -7.048 |
Token | , |
Token ID | 11 |
Feature activation | +8.23e-01 |
Pos logit contributions | |
llor | +3.479 |
-$ | +3.345 |
zag | +3.281 |
rients | +3.244 |
nc | +3.242 |
Neg logit contributions | |
assian | -5.383 |
hower | -5.325 |
orah | -5.196 |
oops | -5.118 |
hari | -5.077 |
Token | 6 |
Token ID | 21 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
llor | +1.970 |
zag | +1.874 |
-$ | +1.863 |
cling | +1.833 |
rients | +1.825 |
Neg logit contributions | |
assian | -4.303 |
hower | -4.223 |
orah | -4.108 |
hari | -4.074 |
oops | -4.058 |
Token | pr |
Token ID | 778 |
Feature activation | +8.77e-01 |
Pos logit contributions | |
llor | +1.095 |
zag | +1.051 |
cling | +1.036 |
rients | +1.035 |
-$ | +1.025 |
Neg logit contributions | |
assian | -1.327 |
hower | -1.292 |
orah | -1.265 |
oops | -1.255 |
hari | -1.251 |
Token | imate |
Token ID | 1920 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
llor | +1.538 |
zag | +1.442 |
rients | +1.388 |
cling | +1.371 |
-$ | +1.321 |
Neg logit contributions | |
assian | -5.124 |
hower | -5.093 |
orah | -4.968 |
hari | -4.931 |
oops | -4.896 |
Token | c |
Token ID | 66 |
Feature activation | +5.84e-01 |
Pos logit contributions | |
llor | +1.298 |
zag | +1.250 |
cling | +1.233 |
rients | +1.232 |
-$ | +1.225 |
Neg logit contributions | |
assian | -1.516 |
hower | -1.476 |
orah | -1.441 |
oops | -1.431 |
hari | -1.423 |
Token | FP |
Token ID | 31459 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
llor | +2.272 |
cling | +2.196 |
zag | +2.161 |
rients | +2.153 |
nc | +2.127 |
Neg logit contributions | |
hower | -2.166 |
assian | -2.145 |
orah | -2.068 |
hari | -2.046 |
oops | -2.021 |
Token | 3 |
Token ID | 18 |
Feature activation | +5.68e-01 |
Pos logit contributions | |
assian | +0.135 |
hower | +0.132 |
orah | +0.129 |
oops | +0.128 |
hari | +0.128 |
Neg logit contributions | |
llor | -0.103 |
zag | -0.098 |
cling | -0.097 |
rients | -0.097 |
-$ | -0.096 |
Token | cand |
Token ID | 2658 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
llor | +1.877 |
zag | +1.799 |
cling | +1.776 |
rients | +1.773 |
-$ | +1.760 |
Neg logit contributions | |
assian | -2.467 |
hower | -2.405 |
orah | -2.352 |
oops | -2.331 |
hari | -2.326 |
Token | ies |
Token ID | 444 |
Feature activation | +5.41e-01 |
Pos logit contributions | |
llor | +6.489 |
rients | +6.362 |
cling | +6.300 |
zag | +6.293 |
nc | +6.075 |
Neg logit contributions | |
assian | -6.417 |
hower | -6.397 |
hari | -5.853 |
orah | -5.788 |
Commands | -5.704 |
Token | ( |
Token ID | 357 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
llor | +1.675 |
zag | +1.604 |
cling | +1.579 |
rients | +1.577 |
-$ | +1.570 |
Neg logit contributions | |
assian | -2.450 |
hower | -2.389 |
orah | -2.343 |
oops | -2.328 |
hari | -2.319 |
Token | S |
Token ID | 50 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
llor | +3.228 |
zag | +3.161 |
cling | +3.155 |
rients | +3.103 |
-$ | +3.076 |
Neg logit contributions | |
assian | -4.634 |
hower | -4.550 |
orah | -4.435 |
hari | -4.333 |
oops | -4.294 |
Token | DS |
Token ID | 5258 |
Feature activation | +2.64e-02 |
Pos logit contributions | |
llor | +3.909 |
zag | +3.866 |
cling | +3.828 |
rients | +3.766 |
-$ | +3.754 |
Neg logit contributions | |
assian | -3.837 |
hower | -3.798 |
hari | -3.619 |
orah | -3.616 |
oops | -3.607 |
Token | Diet |
Token ID | 16292 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
llor | +0.087 |
zag | +0.084 |
cling | +0.083 |
rients | +0.083 |
-$ | +0.083 |
Neg logit contributions | |
assian | -0.114 |
hower | -0.111 |
orah | -0.109 |
oops | -0.107 |
hari | -0.107 |
Token | in |
Token ID | 287 |
Feature activation | +3.67e-01 |
Pos logit contributions | |
llor | +1.238 |
zag | +1.197 |
cling | +1.177 |
rients | +1.176 |
-$ | +1.169 |
Neg logit contributions | |
assian | -1.411 |
hower | -1.369 |
oops | -1.333 |
orah | -1.321 |
hari | -1.318 |
Token | his |
Token ID | 465 |
Feature activation | +6.28e-01 |
Pos logit contributions | |
llor | +1.343 |
zag | +1.305 |
cling | +1.285 |
rients | +1.281 |
-$ | +1.274 |
Neg logit contributions | |
assian | -1.446 |
hower | -1.408 |
oops | -1.368 |
orah | -1.363 |
hari | -1.353 |
Token | book |
Token ID | 1492 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
llor | +2.078 |
zag | +2.011 |
cling | +1.963 |
rients | +1.958 |
-$ | +1.957 |
Neg logit contributions | |
assian | -2.689 |
hower | -2.619 |
oops | -2.549 |
hari | -2.537 |
orah | -2.520 |
Token | � |
Token ID | 564 |
Feature activation | +9.76e-01 |
Pos logit contributions | |
assian | +0.693 |
hower | +0.674 |
orah | +0.660 |
oops | +0.654 |
hari | +0.652 |
Neg logit contributions | |
llor | -0.614 |
zag | -0.590 |
cling | -0.581 |
rients | -0.581 |
-$ | -0.576 |
Token | � |
Token ID | 250 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
llor | +3.680 |
cling | +3.520 |
rients | +3.512 |
zag | +3.502 |
-$ | +3.486 |
Neg logit contributions | |
assian | -3.681 |
hower | -3.597 |
oops | -3.475 |
hari | -3.402 |
orah | -3.389 |
Token | Mu |
Token ID | 33239 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
llor | +0.520 |
zag | +0.499 |
cling | +0.492 |
rients | +0.492 |
-$ | +0.488 |
Neg logit contributions | |
assian | -0.613 |
hower | -0.597 |
orah | -0.581 |
oops | -0.578 |
hari | -0.575 |
Token | hammad |
Token ID | 14875 |
Feature activation | +6.18e-01 |
Pos logit contributions | |
llor | +5.454 |
zag | +5.262 |
cling | +5.039 |
-$ | +4.957 |
rients | +4.871 |
Neg logit contributions | |
assian | -7.352 |
hower | -7.317 |
oops | -7.265 |
orah | -6.838 |
hari | -6.684 |
Token | , |
Token ID | 11 |
Feature activation | +5.89e-01 |
Pos logit contributions | |
llor | +1.942 |
zag | +1.847 |
cling | +1.826 |
rients | +1.817 |
-$ | +1.817 |
Neg logit contributions | |
assian | -2.740 |
hower | -2.671 |
oops | -2.634 |
orah | -2.584 |
hari | -2.544 |
Token | Prophet |
Token ID | 13583 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
llor | +2.043 |
zag | +1.970 |
rients | +1.946 |
cling | +1.943 |
-$ | +1.918 |
Neg logit contributions | |
assian | -2.433 |
hower | -2.359 |
oops | -2.289 |
orah | -2.261 |
hari | -2.249 |
Token | of |
Token ID | 286 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
llor | +1.041 |
zag | +0.998 |
rients | +0.982 |
cling | +0.981 |
-$ | +0.978 |
Neg logit contributions | |
assian | -1.166 |
hower | -1.132 |
oops | -1.101 |
orah | -1.101 |
hari | -1.091 |
Token | God |
Token ID | 1793 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
llor | +0.483 |
zag | +0.467 |
rients | +0.461 |
cling | +0.460 |
-$ | +0.457 |
Neg logit contributions | |
assian | -0.456 |
hower | -0.442 |
orah | -0.429 |
oops | -0.427 |
hari | -0.425 |
Token | am |
Token ID | 321 |
Feature activation | +6.75e-01 |
Pos logit contributions | |
assian | +2.952 |
orah | +2.840 |
oops | +2.756 |
hower | +2.741 |
hari | +2.706 |
Neg logit contributions | |
llor | -4.132 |
cling | -4.010 |
distingu | -4.001 |
zag | -3.976 |
-$ | -3.938 |
Token | , |
Token ID | 11 |
Feature activation | +5.79e-02 |
Pos logit contributions | |
llor | +2.200 |
zag | +2.081 |
cling | +2.078 |
-$ | +2.076 |
rients | +2.062 |
Neg logit contributions | |
assian | -2.959 |
hower | -2.872 |
orah | -2.802 |
hari | -2.797 |
oops | -2.784 |
Token | a |
Token ID | 257 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
llor | +0.189 |
zag | +0.181 |
rients | +0.178 |
cling | +0.178 |
-$ | +0.176 |
Neg logit contributions | |
assian | -0.253 |
hower | -0.246 |
orah | -0.241 |
oops | -0.240 |
hari | -0.239 |
Token | benz |
Token ID | 39601 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
llor | +0.553 |
zag | +0.530 |
rients | +0.521 |
cling | +0.521 |
-$ | +0.515 |
Neg logit contributions | |
assian | -0.733 |
hower | -0.714 |
orah | -0.700 |
oops | -0.695 |
hari | -0.693 |
Token | od |
Token ID | 375 |
Feature activation | -9.18e-01 |
Pos logit contributions | |
assian | +0.894 |
hower | +0.856 |
orah | +0.843 |
oops | +0.834 |
hari | +0.829 |
Neg logit contributions | |
llor | -1.090 |
zag | -1.050 |
rients | -1.042 |
cling | -1.041 |
-$ | -1.031 |
Token | iazep |
Token ID | 48826 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
assian | +2.434 |
hower | +2.298 |
orah | +2.293 |
oops | +2.260 |
hari | +2.211 |
Neg logit contributions | |
llor | -4.529 |
zag | -4.361 |
cling | -4.358 |
rients | -4.316 |
-$ | -4.297 |
Token | ine |
Token ID | 500 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
assian | +5.726 |
orah | +5.032 |
oran | +5.031 |
hari | +4.926 |
oops | +4.817 |
Neg logit contributions | |
cling | -12.252 |
rients | -12.237 |
zag | -12.180 |
llor | -12.141 |
� | -11.990 |
Token | anx |
Token ID | 7296 |
Feature activation | +4.54e-01 |
Pos logit contributions | |
assian | +0.945 |
hower | +0.913 |
orah | +0.899 |
oops | +0.889 |
hari | +0.881 |
Neg logit contributions | |
llor | -0.871 |
zag | -0.844 |
rients | -0.832 |
cling | -0.828 |
-$ | -0.808 |
Token | io |
Token ID | 952 |
Feature activation | -7.09e-01 |
Pos logit contributions | |
llor | +1.598 |
zag | +1.536 |
cling | +1.518 |
rients | +1.516 |
-$ | +1.505 |
Neg logit contributions | |
assian | -1.864 |
hower | -1.837 |
hari | -1.756 |
orah | -1.754 |
oops | -1.744 |
Token | ly |
Token ID | 306 |
Feature activation | +5.56e-01 |
Pos logit contributions | |
assian | +2.411 |
hower | +2.310 |
hari | +2.279 |
oops | +2.255 |
orah | +2.246 |
Neg logit contributions | |
llor | -2.957 |
zag | -2.882 |
rients | -2.834 |
distingu | -2.817 |
cling | -2.801 |
Token | tic |
Token ID | 13370 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
llor | +2.057 |
zag | +1.980 |
cling | +1.952 |
rients | +1.951 |
-$ | +1.934 |
Neg logit contributions | |
assian | -2.195 |
hower | -2.133 |
orah | -2.086 |
oops | -2.070 |
hari | -2.062 |
Token | crumbling |
Token ID | 37550 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
assian | +0.770 |
hower | +0.749 |
orah | +0.735 |
oops | +0.729 |
hari | +0.724 |
Neg logit contributions | |
llor | -0.637 |
zag | -0.610 |
rients | -0.603 |
cling | -0.601 |
-$ | -0.593 |
Token | sidewalks |
Token ID | 38282 |
Feature activation | +7.86e-02 |
Pos logit contributions | |
assian | +0.679 |
hower | +0.662 |
orah | +0.648 |
oops | +0.643 |
hari | +0.638 |
Neg logit contributions | |
llor | -0.586 |
zag | -0.562 |
rients | -0.556 |
cling | -0.553 |
-$ | -0.544 |
Token | to |
Token ID | 284 |
Feature activation | -3.56e-01 |
Pos logit contributions | |
llor | +0.237 |
zag | +0.227 |
cling | +0.223 |
rients | +0.222 |
-$ | +0.222 |
Neg logit contributions | |
assian | -0.364 |
hower | -0.355 |
orah | -0.349 |
hari | -0.345 |
oops | -0.345 |
Token | the |
Token ID | 262 |
Feature activation | -7.89e-01 |
Pos logit contributions | |
assian | +1.363 |
hower | +1.323 |
orah | +1.300 |
oops | +1.284 |
hari | +1.275 |
Neg logit contributions | |
llor | -1.352 |
zag | -1.294 |
rients | -1.283 |
cling | -1.279 |
-$ | -1.258 |
Token | hom |
Token ID | 3488 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
assian | +2.987 |
hower | +2.899 |
orah | +2.858 |
oops | +2.823 |
hari | +2.778 |
Neg logit contributions | |
llor | -2.975 |
zag | -2.871 |
rients | -2.837 |
cling | -2.825 |
-$ | -2.764 |
Token | ew |
Token ID | 413 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
assian | +3.594 |
oops | +3.337 |
orah | +3.323 |
hower | +3.312 |
oran | +3.294 |
Neg logit contributions | |
llor | -6.611 |
zag | -6.366 |
rients | -6.348 |
distingu | -6.339 |
cling | -6.337 |
Token | on |
Token ID | 261 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
orah | +7.093 |
oops | +7.011 |
assian | +6.959 |
hower | +6.928 |
hari | +6.889 |
Neg logit contributions | |
distingu | -9.501 |
llor | -9.432 |
-$ | -9.248 |
rients | -9.191 |
zag | -9.149 |
Token | ers |
Token ID | 364 |
Feature activation | -5.82e-01 |
Pos logit contributions | |
llor | +0.534 |
zag | +0.510 |
cling | +0.506 |
-$ | +0.498 |
rients | +0.498 |
Neg logit contributions | |
assian | -0.675 |
hower | -0.658 |
orah | -0.645 |
oops | -0.642 |
hari | -0.636 |
Token | owning |
Token ID | 23107 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
assian | +2.412 |
hower | +2.347 |
orah | +2.301 |
oops | +2.283 |
hari | +2.269 |
Neg logit contributions | |
llor | -2.028 |
zag | -1.949 |
rients | -1.924 |
cling | -1.917 |
-$ | -1.891 |
Token | the |
Token ID | 262 |
Feature activation | -4.79e-01 |
Pos logit contributions | |
assian | +0.892 |
hower | +0.860 |
orah | +0.851 |
oops | +0.847 |
hari | +0.836 |
Neg logit contributions | |
llor | -0.757 |
zag | -0.719 |
rients | -0.713 |
cling | -0.710 |
-$ | -0.697 |
Token | houses |
Token ID | 7777 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
assian | +1.857 |
hower | +1.795 |
orah | +1.769 |
oops | +1.756 |
hari | +1.729 |
Neg logit contributions | |
llor | -1.784 |
zag | -1.712 |
rients | -1.686 |
cling | -1.685 |
-$ | -1.657 |
Token | August |
Token ID | 2932 |
Feature activation | -9.03e-01 |
Pos logit contributions | |
assian | +4.408 |
orah | +4.082 |
hower | +4.047 |
hari | +4.044 |
oops | +4.043 |
Neg logit contributions | |
llor | -5.743 |
zag | -5.618 |
distingu | -5.607 |
cling | -5.485 |
rients | -5.450 |
Token | 2012 |
Token ID | 2321 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
assian | +4.200 |
hower | +4.032 |
orah | +4.012 |
oops | +3.961 |
hari | +3.921 |
Neg logit contributions | |
llor | -2.643 |
zag | -2.515 |
distingu | -2.499 |
cling | -2.496 |
rients | -2.463 |
Token | United |
Token ID | 1578 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
assian | +5.142 |
hower | +4.949 |
orah | +4.894 |
oops | +4.849 |
hari | +4.788 |
Neg logit contributions | |
llor | -2.972 |
zag | -2.804 |
distingu | -2.793 |
cling | -2.786 |
rients | -2.768 |
Token | States |
Token ID | 1829 |
Feature activation | -7.95e-01 |
Pos logit contributions | |
assian | +3.625 |
hower | +3.527 |
orah | +3.392 |
hari | +3.337 |
oops | +3.322 |
Neg logit contributions | |
llor | -5.969 |
zag | -5.782 |
cling | -5.698 |
rients | -5.683 |
-$ | -5.674 |
Token | 3 |
Token ID | 513 |
Feature activation | -6.33e-01 |
Pos logit contributions | |
assian | +3.444 |
hower | +3.330 |
orah | +3.272 |
oops | +3.236 |
hari | +3.217 |
Neg logit contributions | |
llor | -2.606 |
zag | -2.477 |
cling | -2.457 |
rients | -2.451 |
distingu | -2.444 |
Token | 240 |
Token ID | 16102 |
Feature activation | -2.21e+00 |
Pos logit contributions | |
assian | +2.193 |
hower | +2.119 |
orah | +2.069 |
oops | +2.048 |
hari | +2.035 |
Neg logit contributions | |
llor | -2.643 |
zag | -2.553 |
cling | -2.526 |
rients | -2.523 |
-$ | -2.499 |
Token | Posts |
Token ID | 12043 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
assian | +3.980 |
orah | +3.603 |
oops | +3.450 |
oran | +3.315 |
hower | +3.222 |
Neg logit contributions | |
llor | -12.250 |
distingu | -12.118 |
zag | -11.996 |
cling | -11.907 |
rients | -11.671 |
Token | # |
Token ID | 1303 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
assian | +4.821 |
hower | +4.561 |
orah | +4.548 |
oops | +4.521 |
hari | +4.425 |
Neg logit contributions | |
llor | -6.031 |
zag | -5.953 |
rients | -5.849 |
cling | -5.737 |
-$ | -5.736 |
Token | 10 |
Token ID | 940 |
Feature activation | -5.71e-01 |
Pos logit contributions | |
assian | +1.805 |
hower | +1.762 |
orah | +1.731 |
oops | +1.720 |
hari | +1.713 |
Neg logit contributions | |
llor | -1.147 |
zag | -1.092 |
cling | -1.073 |
rients | -1.073 |
-$ | -1.058 |
Token | Happy |
Token ID | 14628 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
assian | +2.280 |
hower | +2.212 |
orah | +2.176 |
oops | +2.168 |
hari | +2.144 |
Neg logit contributions | |
llor | -2.069 |
zag | -1.995 |
rients | -1.966 |
cling | -1.963 |
-$ | -1.936 |
Token | it |
Token ID | 340 |
Feature activation | -8.11e-01 |
Pos logit contributions | |
assian | +0.784 |
hower | +0.761 |
oops | +0.745 |
orah | +0.745 |
hari | +0.739 |
Neg logit contributions | |
llor | -0.653 |
zag | -0.627 |
rients | -0.623 |
cling | -0.621 |
-$ | -0.614 |
Token | at |
Token ID | 379 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
assian | +3.620 |
hower | +3.480 |
orah | +3.469 |
oops | +3.451 |
hari | +3.449 |
Neg logit contributions | |
llor | -3.935 |
distingu | -3.854 |
zag | -3.824 |
rients | -3.805 |
cling | -3.757 |
Token | 9 |
Token ID | 860 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
assian | +4.355 |
hower | +4.205 |
orah | +4.204 |
oops | +4.201 |
hari | +4.128 |
Neg logit contributions | |
llor | -3.609 |
distingu | -3.501 |
rients | -3.414 |
zag | -3.409 |
cling | -3.397 |
Token | : |
Token ID | 25 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
assian | +4.614 |
orah | +4.427 |
oops | +4.404 |
hari | +4.325 |
hower | +4.310 |
Neg logit contributions | |
distingu | -5.168 |
llor | -5.038 |
zag | -4.861 |
rients | -4.814 |
cling | -4.738 |
Token | 28 |
Token ID | 2078 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
assian | +2.600 |
orah | +2.501 |
oops | +2.498 |
hower | +2.492 |
hari | +2.459 |
Neg logit contributions | |
llor | -1.973 |
distingu | -1.887 |
zag | -1.872 |
rients | -1.854 |
cling | -1.840 |
Token | am |
Token ID | 321 |
Feature activation | -9.11e-01 |
Pos logit contributions | |
assian | +4.620 |
hower | +4.430 |
orah | +4.394 |
oops | +4.391 |
hari | +4.331 |
Neg logit contributions | |
llor | -5.203 |
zag | -5.023 |
distingu | -5.023 |
rients | -4.975 |
cling | -4.933 |
Token | PST |
Token ID | 28220 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
assian | +3.836 |
hower | +3.703 |
oops | +3.623 |
orah | +3.616 |
hari | +3.591 |
Neg logit contributions | |
llor | -3.101 |
zag | -3.014 |
cling | -2.953 |
rients | -2.927 |
distingu | -2.916 |
Token |
|
Token ID | 198 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
hower | +6.918 |
assian | +6.819 |
oops | +6.489 |
orah | +6.449 |
oran | +6.408 |
Neg logit contributions | |
llor | -8.471 |
zag | -8.450 |
rients | -8.203 |
cling | -8.071 |
distingu | -8.060 |
Token |
|
Token ID | 198 |
Feature activation | -2.40e-01 |
Pos logit contributions | |
assian | +3.696 |
orah | +3.531 |
oops | +3.529 |
hower | +3.468 |
hari | +3.466 |
Neg logit contributions | |
distingu | -4.752 |
llor | -4.601 |
zag | -4.457 |
rients | -4.433 |
cling | -4.377 |
Token | Do |
Token ID | 5211 |
Feature activation | +2.44e-02 |
Pos logit contributions | |
assian | +0.985 |
hower | +0.958 |
orah | +0.939 |
oops | +0.932 |
hari | +0.928 |
Neg logit contributions | |
llor | -0.851 |
zag | -0.817 |
rients | -0.805 |
cling | -0.805 |
-$ | -0.796 |
Token | use |
Token ID | 779 |
Feature activation | +9.54e-02 |
Pos logit contributions | |
llor | +0.085 |
zag | +0.082 |
rients | +0.081 |
cling | +0.080 |
-$ | +0.079 |
Neg logit contributions | |
assian | -0.100 |
hower | -0.098 |
orah | -0.097 |
oops | -0.096 |
hari | -0.095 |
Token | social |
Token ID | 1919 |
Feature activation | -7.13e-01 |
Pos logit contributions | |
llor | +0.356 |
zag | +0.342 |
rients | +0.337 |
cling | +0.337 |
-$ | +0.334 |
Neg logit contributions | |
assian | -0.374 |
hower | -0.363 |
orah | -0.355 |
oops | -0.352 |
hari | -0.351 |
Token | by |
Token ID | 416 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
llor | +1.904 |
zag | +1.832 |
-$ | +1.824 |
cling | +1.801 |
rients | +1.775 |
Neg logit contributions | |
assian | -2.539 |
hower | -2.461 |
hari | -2.400 |
orah | -2.399 |
oops | -2.394 |
Token | Brazilian |
Token ID | 17036 |
Feature activation | +4.31e-01 |
Pos logit contributions | |
assian | +0.647 |
hower | +0.630 |
orah | +0.617 |
oops | +0.614 |
hari | +0.610 |
Neg logit contributions | |
llor | -0.477 |
zag | -0.456 |
cling | -0.450 |
rients | -0.450 |
-$ | -0.443 |
Token | construction |
Token ID | 5103 |
Feature activation | +5.12e-01 |
Pos logit contributions | |
llor | +1.582 |
zag | +1.520 |
-$ | +1.508 |
rients | +1.488 |
cling | +1.488 |
Neg logit contributions | |
assian | -1.702 |
hower | -1.668 |
orah | -1.621 |
hari | -1.620 |
oops | -1.608 |
Token | company |
Token ID | 1664 |
Feature activation | +7.83e-01 |
Pos logit contributions | |
llor | +2.009 |
zag | +1.927 |
-$ | +1.914 |
cling | +1.905 |
rients | +1.899 |
Neg logit contributions | |
assian | -1.899 |
hower | -1.831 |
orah | -1.803 |
hari | -1.793 |
oops | -1.784 |
Token | Od |
Token ID | 10529 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
llor | +2.465 |
zag | +2.347 |
-$ | +2.317 |
rients | +2.311 |
cling | +2.287 |
Neg logit contributions | |
assian | -3.488 |
hower | -3.413 |
orah | -3.340 |
hari | -3.335 |
oops | -3.297 |
Token | eb |
Token ID | 1765 |
Feature activation | -2.13e+00 |
Pos logit contributions | |
assian | +0.548 |
hower | +0.533 |
orah | +0.525 |
oops | +0.522 |
hari | +0.519 |
Neg logit contributions | |
llor | -0.403 |
zag | -0.386 |
cling | -0.379 |
rients | -0.379 |
-$ | -0.376 |
Token | re |
Token ID | 260 |
Feature activation | -7.09e-01 |
Pos logit contributions | |
assian | +9.657 |
oops | +9.578 |
orah | +9.335 |
oran | +8.922 |
hari | +8.888 |
Neg logit contributions | |
distingu | -5.803 |
llor | -5.787 |
-$ | -5.459 |
zag | -5.445 |
cling | -5.355 |
Token | cht |
Token ID | 21474 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
assian | +2.543 |
hower | +2.475 |
orah | +2.426 |
oops | +2.397 |
hari | +2.366 |
Neg logit contributions | |
llor | -2.840 |
zag | -2.725 |
cling | -2.710 |
rients | -2.703 |
distingu | -2.655 |
Token | . |
Token ID | 13 |
Feature activation | -9.15e-02 |
Pos logit contributions | |
assian | +0.534 |
hower | +0.521 |
orah | +0.510 |
oops | +0.507 |
hari | +0.505 |
Neg logit contributions | |
llor | -0.365 |
zag | -0.349 |
cling | -0.343 |
rients | -0.343 |
-$ | -0.338 |
Token |
|
Token ID | 198 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
assian | +0.363 |
hower | +0.352 |
orah | +0.344 |
oops | +0.342 |
hari | +0.340 |
Neg logit contributions | |
llor | -0.336 |
zag | -0.324 |
cling | -0.320 |
rients | -0.319 |
-$ | -0.316 |
Token |
|
Token ID | 198 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
llor | +0.463 |
zag | +0.444 |
-$ | +0.443 |
cling | +0.440 |
rients | +0.437 |
Neg logit contributions | |
assian | -0.542 |
hower | -0.535 |
orah | -0.515 |
oops | -0.510 |
hari | -0.509 |
Token | ce |
Token ID | 344 |
Feature activation | -2.44e-01 |
Pos logit contributions | |
assian | +2.920 |
hower | +2.857 |
orah | +2.811 |
oops | +2.795 |
hari | +2.783 |
Neg logit contributions | |
llor | -1.377 |
zag | -1.296 |
rients | -1.270 |
cling | -1.268 |
-$ | -1.251 |
Token | / |
Token ID | 14 |
Feature activation | -7.17e-01 |
Pos logit contributions | |
assian | +1.192 |
hower | +1.162 |
orah | +1.143 |
oops | +1.137 |
hari | +1.131 |
Neg logit contributions | |
llor | -0.675 |
zag | -0.638 |
rients | -0.630 |
cling | -0.624 |
-$ | -0.615 |
Token | edd |
Token ID | 6048 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
assian | +3.303 |
hower | +3.214 |
orah | +3.174 |
oops | +3.170 |
hari | +3.150 |
Neg logit contributions | |
llor | -2.146 |
zag | -2.030 |
rients | -2.020 |
distingu | -1.994 |
cling | -1.991 |
Token | 75 |
Token ID | 2425 |
Feature activation | -9.24e-01 |
Pos logit contributions | |
assian | +4.958 |
hower | +4.837 |
orah | +4.827 |
oops | +4.749 |
hari | +4.740 |
Neg logit contributions | |
llor | -3.136 |
zag | -2.961 |
rients | -2.959 |
distingu | -2.957 |
cling | -2.909 |
Token | / |
Token ID | 14 |
Feature activation | -7.16e-01 |
Pos logit contributions | |
assian | +4.361 |
hower | +4.212 |
orah | +4.206 |
hari | +4.168 |
oops | +4.166 |
Neg logit contributions | |
llor | -2.650 |
zag | -2.525 |
distingu | -2.519 |
rients | -2.510 |
cling | -2.468 |
Token | AUT |
Token ID | 39371 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
assian | +3.012 |
hower | +2.909 |
oops | +2.877 |
orah | +2.872 |
hari | +2.834 |
Neg logit contributions | |
llor | -2.472 |
zag | -2.370 |
rients | -2.324 |
cling | -2.309 |
distingu | -2.292 |
Token | OC |
Token ID | 4503 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
assian | +5.576 |
orah | +5.541 |
oops | +5.493 |
oran | +5.479 |
hower | +5.432 |
Neg logit contributions | |
zag | -9.683 |
llor | -9.647 |
distingu | -9.629 |
rients | -9.226 |
cling | -9.093 |
Token | R |
Token ID | 49 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
assian | +6.104 |
orah | +5.828 |
oops | +5.763 |
hari | +5.623 |
oran | +5.576 |
Neg logit contributions | |
llor | -4.929 |
distingu | -4.815 |
zag | -4.757 |
rients | -4.670 |
cling | -4.587 |
Token | OP |
Token ID | 3185 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
assian | +0.589 |
hower | +0.584 |
hari | +0.547 |
orah | +0.545 |
oops | +0.535 |
Neg logit contributions | |
llor | -0.684 |
cling | -0.667 |
-$ | -0.667 |
zag | -0.665 |
rients | -0.661 |
Token | / |
Token ID | 14 |
Feature activation | -7.95e-01 |
Pos logit contributions | |
assian | +4.534 |
hower | +4.434 |
hari | +4.362 |
oops | +4.330 |
orah | +4.315 |
Neg logit contributions | |
llor | -3.055 |
distingu | -2.975 |
zag | -2.910 |
cling | -2.865 |
rients | -2.855 |
Token | h |
Token ID | 71 |
Feature activation | -5.24e-01 |
Pos logit contributions | |
assian | +2.668 |
hower | +2.583 |
orah | +2.524 |
oops | +2.521 |
hari | +2.504 |
Neg logit contributions | |
llor | -3.396 |
zag | -3.270 |
rients | -3.218 |
cling | -3.209 |
distingu | -3.202 |
Token | at |
Token ID | 379 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
assian | +3.072 |
orah | +2.969 |
hari | +2.940 |
hower | +2.937 |
oops | +2.937 |
Neg logit contributions | |
distingu | -3.402 |
llor | -3.398 |
zag | -3.294 |
rients | -3.274 |
cling | -3.225 |
Token | 2 |
Token ID | 362 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
assian | +4.318 |
orah | +4.198 |
oops | +4.187 |
hower | +4.180 |
hari | +4.101 |
Neg logit contributions | |
llor | -3.666 |
distingu | -3.565 |
rients | -3.468 |
zag | -3.461 |
cling | -3.423 |
Token | : |
Token ID | 25 |
Feature activation | -6.62e-01 |
Pos logit contributions | |
assian | +4.936 |
orah | +4.755 |
oops | +4.726 |
hari | +4.647 |
hower | +4.546 |
Neg logit contributions | |
distingu | -6.175 |
llor | -5.792 |
zag | -5.575 |
rients | -5.557 |
� | -5.431 |
Token | 29 |
Token ID | 1959 |
Feature activation | -9.83e-01 |
Pos logit contributions | |
assian | +2.840 |
orah | +2.733 |
oops | +2.729 |
hower | +2.716 |
hari | +2.683 |
Neg logit contributions | |
llor | -2.195 |
distingu | -2.106 |
zag | -2.082 |
rients | -2.063 |
cling | -2.046 |
Token | am |
Token ID | 321 |
Feature activation | -6.85e-01 |
Pos logit contributions | |
assian | +3.993 |
hower | +3.865 |
orah | +3.833 |
oops | +3.804 |
hari | +3.777 |
Neg logit contributions | |
llor | -3.423 |
distingu | -3.310 |
zag | -3.294 |
rients | -3.269 |
cling | -3.215 |
Token | PST |
Token ID | 28220 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
assian | +2.850 |
hower | +2.764 |
orah | +2.713 |
oops | +2.705 |
hari | +2.686 |
Neg logit contributions | |
llor | -2.365 |
zag | -2.280 |
cling | -2.242 |
rients | -2.230 |
distingu | -2.225 |
Token |
|
Token ID | 198 |
Feature activation | -9.66e-01 |
Pos logit contributions | |
hower | +6.126 |
assian | +6.080 |
oops | +5.811 |
orah | +5.767 |
hari | +5.660 |
Neg logit contributions | |
llor | -8.331 |
zag | -8.170 |
rients | -8.038 |
cling | -7.968 |
distingu | -7.902 |
Token |
|
Token ID | 198 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
assian | +3.313 |
orah | +3.167 |
oops | +3.148 |
hower | +3.127 |
hari | +3.110 |
Neg logit contributions | |
distingu | -4.039 |
llor | -3.968 |
zag | -3.828 |
rients | -3.814 |
cling | -3.763 |
Token | Do |
Token ID | 5211 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
assian | +1.141 |
hower | +1.109 |
orah | +1.089 |
oops | +1.083 |
hari | +1.076 |
Neg logit contributions | |
llor | -1.006 |
zag | -0.963 |
rients | -0.952 |
cling | -0.950 |
-$ | -0.938 |
Token | not |
Token ID | 407 |
Feature activation | +3.64e-01 |
Pos logit contributions | |
assian | +0.894 |
hower | +0.880 |
orah | +0.869 |
hari | +0.855 |
oops | +0.854 |
Neg logit contributions | |
llor | -0.822 |
rients | -0.794 |
zag | -0.789 |
cling | -0.781 |
-$ | -0.774 |
Token | use |
Token ID | 779 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
llor | +1.317 |
zag | +1.268 |
cling | +1.251 |
rients | +1.247 |
-$ | +1.240 |
Neg logit contributions | |
assian | -1.463 |
hower | -1.421 |
orah | -1.384 |
oops | -1.378 |
hari | -1.373 |
Token | removed |
Token ID | 4615 |
Feature activation | -5.28e-01 |
Pos logit contributions | |
assian | +1.811 |
hower | +1.734 |
orah | +1.698 |
hari | +1.683 |
oops | +1.670 |
Neg logit contributions | |
llor | -1.719 |
zag | -1.683 |
rients | -1.655 |
cling | -1.654 |
-$ | -1.620 |
Token | from |
Token ID | 422 |
Feature activation | -6.90e-01 |
Pos logit contributions | |
assian | +2.278 |
hower | +2.220 |
orah | +2.178 |
oops | +2.156 |
hari | +2.154 |
Neg logit contributions | |
llor | -1.712 |
zag | -1.676 |
cling | -1.644 |
rients | -1.643 |
-$ | -1.609 |
Token | office |
Token ID | 2607 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
assian | +2.425 |
hower | +2.355 |
orah | +2.284 |
oops | +2.261 |
hari | +2.253 |
Neg logit contributions | |
llor | -2.800 |
zag | -2.722 |
rients | -2.706 |
cling | -2.666 |
-$ | -2.656 |
Token | , |
Token ID | 11 |
Feature activation | -4.51e-01 |
Pos logit contributions | |
assian | +4.050 |
hower | +3.929 |
orah | +3.856 |
oops | +3.816 |
hari | +3.801 |
Neg logit contributions | |
llor | -3.637 |
zag | -3.606 |
cling | -3.553 |
rients | -3.539 |
distingu | -3.477 |
Token | effective |
Token ID | 4050 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
assian | +1.772 |
hower | +1.721 |
orah | +1.686 |
oops | +1.675 |
hari | +1.668 |
Neg logit contributions | |
llor | -1.659 |
zag | -1.604 |
rients | -1.583 |
cling | -1.583 |
-$ | -1.566 |
Token | immediately |
Token ID | 3393 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
assian | +4.491 |
hower | +4.351 |
oops | +4.335 |
orah | +4.269 |
hari | +4.263 |
Neg logit contributions | |
llor | -4.715 |
zag | -4.661 |
rients | -4.589 |
cling | -4.545 |
distingu | -4.473 |
Token | . |
Token ID | 13 |
Feature activation | -1.10e-01 |
Pos logit contributions | |
assian | +7.233 |
hower | +6.965 |
oops | +6.894 |
orah | +6.821 |
oran | +6.809 |
Neg logit contributions | |
zag | -7.148 |
llor | -7.122 |
cling | -7.009 |
rients | -6.943 |
distingu | -6.896 |
Token | � |
Token ID | 447 |
Feature activation | -8.96e-02 |
Pos logit contributions | |
assian | +0.445 |
hower | +0.433 |
orah | +0.423 |
oops | +0.420 |
hari | +0.419 |
Neg logit contributions | |
llor | -0.395 |
zag | -0.380 |
cling | -0.374 |
rients | -0.374 |
-$ | -0.371 |
Token | � |
Token ID | 251 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
assian | +0.299 |
hower | +0.290 |
orah | +0.284 |
oops | +0.281 |
hari | +0.280 |
Neg logit contributions | |
llor | -0.384 |
zag | -0.372 |
rients | -0.367 |
cling | -0.367 |
-$ | -0.362 |
Token |
|
Token ID | 198 |
Feature activation | -3.93e-01 |
Pos logit contributions | |
assian | +0.089 |
hower | +0.086 |
orah | +0.084 |
oops | +0.084 |
hari | +0.083 |
Neg logit contributions | |
llor | -0.085 |
zag | -0.081 |
cling | -0.080 |
rients | -0.080 |
-$ | -0.080 |
Token |
|
Token ID | 198 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
assian | +1.504 |
hower | +1.455 |
orah | +1.429 |
oops | +1.419 |
hari | +1.412 |
Neg logit contributions | |
llor | -1.497 |
zag | -1.442 |
rients | -1.423 |
cling | -1.421 |
distingu | -1.408 |
Token | � |
Token ID | 251 |
Feature activation | +4.08e-01 |
Pos logit contributions | |
llor | +1.171 |
zag | +1.129 |
-$ | +1.119 |
cling | +1.118 |
rients | +1.109 |
Neg logit contributions | |
assian | -0.985 |
hower | -0.952 |
orah | -0.918 |
oops | -0.911 |
hari | -0.904 |
Token | which |
Token ID | 543 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
llor | +1.513 |
zag | +1.441 |
cling | +1.433 |
-$ | +1.428 |
rients | +1.408 |
Neg logit contributions | |
assian | -1.614 |
hower | -1.573 |
orah | -1.518 |
oops | -1.491 |
hari | -1.490 |
Token | he |
Token ID | 339 |
Feature activation | -3.08e-01 |
Pos logit contributions | |
assian | +4.602 |
hower | +4.456 |
orah | +4.427 |
oops | +4.389 |
hari | +4.360 |
Neg logit contributions | |
llor | -4.206 |
zag | -4.151 |
cling | -4.059 |
rients | -4.054 |
-$ | -3.952 |
Token | takes |
Token ID | 2753 |
Feature activation | -7.06e-01 |
Pos logit contributions | |
assian | +1.240 |
hower | +1.205 |
orah | +1.180 |
oops | +1.171 |
hari | +1.167 |
Neg logit contributions | |
llor | -1.116 |
zag | -1.074 |
cling | -1.058 |
rients | -1.058 |
-$ | -1.048 |
Token | to |
Token ID | 284 |
Feature activation | -7.61e-02 |
Pos logit contributions | |
assian | +2.885 |
hower | +2.788 |
orah | +2.744 |
oops | +2.728 |
hari | +2.720 |
Neg logit contributions | |
llor | -2.480 |
zag | -2.410 |
rients | -2.364 |
cling | -2.359 |
-$ | -2.318 |
Token | mean |
Token ID | 1612 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
assian | +0.278 |
hower | +0.270 |
orah | +0.263 |
oops | +0.261 |
hari | +0.260 |
Neg logit contributions | |
llor | -0.304 |
zag | -0.293 |
cling | -0.289 |
rients | -0.289 |
-$ | -0.287 |
Token | the |
Token ID | 262 |
Feature activation | -3.54e-01 |
Pos logit contributions | |
assian | +6.845 |
oops | +6.756 |
orah | +6.685 |
hower | +6.624 |
hari | +6.558 |
Neg logit contributions | |
llor | -7.341 |
zag | -7.257 |
rients | -7.191 |
cling | -7.073 |
-$ | -6.995 |
Token | newspaper |
Token ID | 7533 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
assian | +1.436 |
hower | +1.394 |
orah | +1.368 |
oops | +1.358 |
hari | +1.350 |
Neg logit contributions | |
llor | -1.266 |
zag | -1.221 |
rients | -1.203 |
cling | -1.201 |
-$ | -1.191 |
Token | he |
Token ID | 339 |
Feature activation | -6.98e-01 |
Pos logit contributions | |
llor | +0.457 |
zag | +0.439 |
cling | +0.433 |
-$ | +0.431 |
rients | +0.430 |
Neg logit contributions | |
assian | -0.467 |
hower | -0.455 |
orah | -0.445 |
hari | -0.439 |
oops | -0.439 |
Token | used |
Token ID | 973 |
Feature activation | -2.24e-01 |
Pos logit contributions | |
assian | +2.657 |
hower | +2.570 |
orah | +2.540 |
oops | +2.528 |
hari | +2.507 |
Neg logit contributions | |
llor | -2.631 |
zag | -2.556 |
rients | -2.501 |
cling | -2.501 |
-$ | -2.483 |
Token | to |
Token ID | 284 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
assian | +0.992 |
hower | +0.967 |
orah | +0.947 |
oops | +0.941 |
hari | +0.938 |
Neg logit contributions | |
llor | -0.723 |
zag | -0.691 |
cling | -0.680 |
rients | -0.679 |
-$ | -0.673 |
Token | at |
Token ID | 379 |
Feature activation | -9.44e-01 |
Pos logit contributions | |
assian | +4.504 |
hower | +4.331 |
oops | +4.290 |
hari | +4.284 |
orah | +4.251 |
Neg logit contributions | |
llor | -4.977 |
zag | -4.901 |
distingu | -4.882 |
rients | -4.857 |
cling | -4.782 |
Token | 10 |
Token ID | 838 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
assian | +3.922 |
hower | +3.792 |
oops | +3.777 |
orah | +3.764 |
hari | +3.709 |
Neg logit contributions | |
llor | -3.186 |
distingu | -3.061 |
zag | -3.024 |
rients | -3.014 |
cling | -3.006 |
Token | : |
Token ID | 25 |
Feature activation | -5.47e-01 |
Pos logit contributions | |
assian | +4.724 |
orah | +4.517 |
oops | +4.497 |
hower | +4.468 |
hari | +4.440 |
Neg logit contributions | |
llor | -4.887 |
distingu | -4.827 |
zag | -4.683 |
rients | -4.633 |
cling | -4.580 |
Token | 02 |
Token ID | 2999 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
assian | +2.389 |
hower | +2.296 |
orah | +2.294 |
oops | +2.292 |
hari | +2.260 |
Neg logit contributions | |
llor | -1.779 |
zag | -1.691 |
distingu | -1.689 |
rients | -1.671 |
cling | -1.662 |
Token | am |
Token ID | 321 |
Feature activation | -8.49e-01 |
Pos logit contributions | |
assian | +4.802 |
hower | +4.654 |
orah | +4.584 |
hari | +4.547 |
oops | +4.524 |
Neg logit contributions | |
llor | -4.962 |
zag | -4.816 |
rients | -4.729 |
distingu | -4.713 |
cling | -4.701 |
Token | PST |
Token ID | 28220 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
assian | +3.555 |
hower | +3.441 |
orah | +3.381 |
oops | +3.354 |
hari | +3.323 |
Neg logit contributions | |
llor | -2.869 |
zag | -2.817 |
cling | -2.755 |
rients | -2.733 |
distingu | -2.728 |
Token |
|
Token ID | 198 |
Feature activation | -9.27e-01 |
Pos logit contributions | |
assian | +6.481 |
hower | +6.480 |
orah | +6.217 |
oran | +6.196 |
oops | +6.081 |
Neg logit contributions | |
llor | -7.785 |
zag | -7.724 |
distingu | -7.515 |
cling | -7.446 |
rients | -7.391 |
Token |
|
Token ID | 198 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
assian | +3.182 |
orah | +3.035 |
oops | +3.026 |
hower | +2.997 |
hari | +2.986 |
Neg logit contributions | |
distingu | -3.874 |
llor | -3.804 |
zag | -3.680 |
rients | -3.650 |
cling | -3.607 |
Token | Do |
Token ID | 5211 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
assian | +0.055 |
hower | +0.054 |
orah | +0.053 |
oops | +0.052 |
hari | +0.052 |
Neg logit contributions | |
llor | -0.045 |
zag | -0.044 |
cling | -0.043 |
rients | -0.043 |
-$ | -0.043 |
Token | not |
Token ID | 407 |
Feature activation | +9.73e-01 |
Pos logit contributions | |
llor | +0.561 |
zag | +0.539 |
cling | +0.531 |
rients | +0.530 |
-$ | +0.526 |
Neg logit contributions | |
assian | -0.655 |
hower | -0.637 |
orah | -0.623 |
oops | -0.619 |
hari | -0.617 |
Token | use |
Token ID | 779 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
llor | +3.289 |
zag | +3.171 |
-$ | +3.149 |
cling | +3.142 |
rients | +3.094 |
Neg logit contributions | |
assian | -4.084 |
hower | -3.979 |
oops | -3.832 |
hari | -3.817 |
orah | -3.798 |
Token | right |
Token ID | 826 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
assian | +2.598 |
hower | +2.447 |
oops | +2.412 |
orah | +2.404 |
hari | +2.361 |
Neg logit contributions | |
llor | -4.262 |
zag | -4.140 |
rients | -4.134 |
cling | -4.100 |
-$ | -4.071 |
Token | and |
Token ID | 290 |
Feature activation | -4.91e-01 |
Pos logit contributions | |
assian | +1.008 |
hower | +0.977 |
orah | +0.956 |
oops | +0.949 |
hari | +0.946 |
Neg logit contributions | |
llor | -0.971 |
zag | -0.936 |
rients | -0.923 |
cling | -0.923 |
-$ | -0.914 |
Token | coll |
Token ID | 2927 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
assian | +1.839 |
hower | +1.777 |
oops | +1.749 |
orah | +1.749 |
hari | +1.725 |
Neg logit contributions | |
llor | -1.887 |
zag | -1.826 |
cling | -1.806 |
rients | -1.790 |
-$ | -1.778 |
Token | ides |
Token ID | 1460 |
Feature activation | +6.37e-02 |
Pos logit contributions | |
llor | +0.753 |
rients | +0.729 |
zag | +0.726 |
cling | +0.713 |
-$ | +0.705 |
Neg logit contributions | |
assian | -1.226 |
hower | -1.224 |
orah | -1.168 |
hari | -1.165 |
oops | -1.139 |
Token | with |
Token ID | 351 |
Feature activation | -8.56e-04 |
Pos logit contributions | |
llor | +0.197 |
zag | +0.188 |
cling | +0.185 |
rients | +0.184 |
-$ | +0.183 |
Neg logit contributions | |
assian | -0.291 |
hower | -0.284 |
orah | -0.278 |
oops | -0.277 |
hari | -0.276 |
Token | Bo |
Token ID | 3248 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
assian | +0.004 |
hower | +0.003 |
orah | +0.003 |
oops | +0.003 |
hari | +0.003 |
Neg logit contributions | |
llor | -0.003 |
zag | -0.003 |
cling | -0.003 |
rients | -0.003 |
-$ | -0.003 |
Token | z |
Token ID | 89 |
Feature activation | -2.95e-01 |
Pos logit contributions | |
assian | +8.501 |
hari | +8.291 |
orah | +8.245 |
oops | +8.186 |
hower | +8.140 |
Neg logit contributions | |
distingu | -6.107 |
llor | -5.861 |
rients | -5.575 |
� | -5.544 |
cling | -5.538 |
Token | eman |
Token ID | 8463 |
Feature activation | -8.86e-01 |
Pos logit contributions | |
assian | +0.651 |
hower | +0.622 |
orah | +0.586 |
oops | +0.585 |
hari | +0.577 |
Neg logit contributions | |
llor | -1.608 |
zag | -1.565 |
cling | -1.545 |
rients | -1.543 |
-$ | -1.539 |
Token | . |
Token ID | 13 |
Feature activation | -7.31e-01 |
Pos logit contributions | |
assian | +3.697 |
hower | +3.597 |
orah | +3.558 |
hari | +3.510 |
oops | +3.501 |
Neg logit contributions | |
llor | -2.949 |
zag | -2.859 |
rients | -2.843 |
cling | -2.820 |
distingu | -2.771 |
Token | B |
Token ID | 347 |
Feature activation | -9.22e-01 |
Pos logit contributions | |
assian | +2.836 |
hower | +2.749 |
orah | +2.701 |
oops | +2.691 |
hari | +2.652 |
Neg logit contributions | |
llor | -2.722 |
zag | -2.630 |
cling | -2.590 |
rients | -2.583 |
distingu | -2.553 |
Token | ugg |
Token ID | 6837 |
Feature activation | +6.16e-02 |
Pos logit contributions | |
assian | +2.114 |
hower | +1.989 |
oops | +1.982 |
orah | +1.975 |
hari | +1.955 |
Neg logit contributions | |
llor | -4.844 |
distingu | -4.748 |
zag | -4.694 |
rients | -4.677 |
cling | -4.665 |
Token | press |
Token ID | 1803 |
Feature activation | +2.29e-01 |
Pos logit contributions | |
llor | +0.395 |
zag | +0.380 |
cling | +0.374 |
-$ | +0.373 |
rients | +0.372 |
Neg logit contributions | |
assian | -0.461 |
hower | -0.450 |
orah | -0.438 |
oops | -0.435 |
hari | -0.433 |
Token | conference |
Token ID | 4495 |
Feature activation | -8.92e-02 |
Pos logit contributions | |
llor | +0.872 |
zag | +0.837 |
cling | +0.836 |
-$ | +0.827 |
rients | +0.825 |
Neg logit contributions | |
assian | -0.876 |
hower | -0.847 |
orah | -0.835 |
oops | -0.822 |
hari | -0.814 |
Token | . |
Token ID | 13 |
Feature activation | -4.86e-01 |
Pos logit contributions | |
assian | +0.408 |
hower | +0.397 |
orah | +0.390 |
oops | +0.388 |
hari | +0.385 |
Neg logit contributions | |
llor | -0.277 |
zag | -0.263 |
cling | -0.258 |
-$ | -0.258 |
rients | -0.256 |
Token |
|
Token ID | 198 |
Feature activation | -5.71e-01 |
Pos logit contributions | |
assian | +1.839 |
hower | +1.781 |
orah | +1.743 |
oops | +1.729 |
hari | +1.723 |
Neg logit contributions | |
llor | -1.872 |
zag | -1.808 |
cling | -1.784 |
rients | -1.783 |
-$ | -1.757 |
Token |
|
Token ID | 198 |
Feature activation | -3.12e-01 |
Pos logit contributions | |
assian | +2.078 |
hower | +1.987 |
orah | +1.976 |
oops | +1.964 |
hari | +1.950 |
Neg logit contributions | |
llor | -2.263 |
distingu | -2.220 |
zag | -2.185 |
rients | -2.162 |
cling | -2.148 |
Token | " |
Token ID | 1 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
assian | +1.533 |
hower | +1.493 |
orah | +1.472 |
oops | +1.466 |
hari | +1.459 |
Neg logit contributions | |
llor | -0.852 |
zag | -0.808 |
rients | -0.793 |
cling | -0.792 |
-$ | -0.778 |
Token | She |
Token ID | 3347 |
Feature activation | +4.40e-01 |
Pos logit contributions | |
assian | +6.373 |
oops | +6.270 |
orah | +5.970 |
hari | +5.938 |
hower | +5.856 |
Neg logit contributions | |
distingu | -7.862 |
llor | -7.824 |
rients | -7.615 |
zag | -7.584 |
cling | -7.357 |
Token | 's |
Token ID | 338 |
Feature activation | +4.28e-02 |
Pos logit contributions | |
llor | +1.425 |
cling | +1.357 |
zag | +1.349 |
-$ | +1.328 |
rients | +1.324 |
Neg logit contributions | |
assian | -1.943 |
hower | -1.899 |
orah | -1.840 |
oops | -1.836 |
hari | -1.817 |
Token | handcuffed |
Token ID | 41529 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
llor | +0.151 |
zag | +0.146 |
cling | +0.144 |
rients | +0.143 |
-$ | +0.143 |
Neg logit contributions | |
assian | -0.175 |
hower | -0.171 |
orah | -0.167 |
oops | -0.166 |
hari | -0.165 |
Token | , |
Token ID | 11 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
assian | +5.079 |
orah | +4.965 |
hower | +4.879 |
hari | +4.865 |
oops | +4.827 |
Neg logit contributions | |
llor | -5.196 |
rients | -5.067 |
zag | -5.047 |
distingu | -4.936 |
cling | -4.850 |
Token | there |
Token ID | 612 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
assian | +1.617 |
hower | +1.562 |
orah | +1.527 |
oops | +1.513 |
hari | +1.506 |
Neg logit contributions | |
llor | -1.969 |
zag | -1.904 |
rients | -1.881 |
cling | -1.877 |
-$ | -1.862 |
Token | Scott |
Token ID | 4746 |
Feature activation | -9.69e-01 |
Pos logit contributions | |
assian | +3.691 |
orah | +3.577 |
hower | +3.509 |
oops | +3.475 |
oran | +3.458 |
Neg logit contributions | |
llor | -5.635 |
rients | -5.540 |
distingu | -5.418 |
-$ | -5.362 |
zag | -5.353 |
Token | declared |
Token ID | 6875 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
assian | +3.631 |
hower | +3.532 |
orah | +3.489 |
hari | +3.416 |
oops | +3.401 |
Neg logit contributions | |
llor | -3.661 |
zag | -3.528 |
rients | -3.527 |
cling | -3.496 |
-$ | -3.432 |
Token | a |
Token ID | 257 |
Feature activation | -4.25e-02 |
Pos logit contributions | |
assian | +4.069 |
hower | +4.026 |
oops | +3.971 |
orah | +3.939 |
hari | +3.876 |
Neg logit contributions | |
llor | -3.844 |
rients | -3.653 |
zag | -3.641 |
cling | -3.626 |
� | -3.475 |
Token | state |
Token ID | 1181 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
assian | +0.148 |
hower | +0.143 |
orah | +0.140 |
oops | +0.139 |
hari | +0.138 |
Neg logit contributions | |
llor | -0.177 |
zag | -0.171 |
cling | -0.169 |
rients | -0.168 |
-$ | -0.167 |
Token | of |
Token ID | 286 |
Feature activation | -2.73e-03 |
Pos logit contributions | |
assian | +1.351 |
hower | +1.312 |
orah | +1.280 |
oops | +1.260 |
hari | +1.243 |
Neg logit contributions | |
llor | -1.592 |
rients | -1.539 |
zag | -1.535 |
cling | -1.507 |
-$ | -1.473 |
Token | emergency |
Token ID | 6334 |
Feature activation | -1.93e+00 |
Pos logit contributions | |
assian | +0.008 |
hower | +0.008 |
orah | +0.008 |
oops | +0.008 |
hari | +0.008 |
Neg logit contributions | |
llor | -0.013 |
zag | -0.012 |
cling | -0.012 |
rients | -0.012 |
-$ | -0.012 |
Token | for |
Token ID | 329 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
assian | +6.632 |
hower | +6.546 |
orah | +6.440 |
oops | +6.310 |
oran | +6.297 |
Neg logit contributions | |
llor | -7.223 |
rients | -7.027 |
zag | -7.005 |
cling | -6.987 |
distingu | -6.887 |
Token | the |
Token ID | 262 |
Feature activation | -3.50e-01 |
Pos logit contributions | |
assian | +4.034 |
hower | +3.914 |
orah | +3.868 |
oops | +3.838 |
hari | +3.763 |
Neg logit contributions | |
llor | -4.047 |
rients | -3.865 |
zag | -3.855 |
cling | -3.804 |
distingu | -3.718 |
Token | entire |
Token ID | 2104 |
Feature activation | +9.01e-02 |
Pos logit contributions | |
assian | +1.272 |
hower | +1.233 |
orah | +1.211 |
oops | +1.200 |
hari | +1.189 |
Neg logit contributions | |
llor | -1.396 |
zag | -1.339 |
cling | -1.325 |
rients | -1.325 |
-$ | -1.299 |
Token | state |
Token ID | 1181 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
llor | +0.363 |
zag | +0.351 |
cling | +0.346 |
rients | +0.346 |
-$ | +0.345 |
Neg logit contributions | |
assian | -0.326 |
hower | -0.316 |
orah | -0.307 |
oops | -0.305 |
hari | -0.304 |
Token | . |
Token ID | 13 |
Feature activation | -3.82e-01 |
Pos logit contributions | |
assian | +1.205 |
hower | +1.174 |
orah | +1.151 |
oops | +1.142 |
hari | +1.138 |
Neg logit contributions | |
llor | -0.933 |
zag | -0.895 |
cling | -0.880 |
rients | -0.880 |
-$ | -0.870 |
Token | coalition |
Token ID | 9906 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
llor | +0.013 |
zag | +0.012 |
cling | +0.012 |
rients | +0.012 |
-$ | +0.012 |
Neg logit contributions | |
assian | -0.016 |
hower | -0.015 |
orah | -0.015 |
oops | -0.015 |
hari | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
assian | +0.981 |
hower | +0.958 |
orah | +0.937 |
oops | +0.930 |
hari | +0.927 |
Neg logit contributions | |
llor | -0.710 |
zag | -0.680 |
rients | -0.671 |
cling | -0.669 |
-$ | -0.660 |
Token | Added |
Token ID | 10687 |
Feature activation | -7.43e-01 |
Pos logit contributions | |
assian | +0.563 |
hower | +0.547 |
orah | +0.533 |
oops | +0.530 |
hari | +0.528 |
Neg logit contributions | |
llor | -0.563 |
zag | -0.542 |
cling | -0.535 |
rients | -0.535 |
-$ | -0.531 |
Token | into |
Token ID | 656 |
Feature activation | -8.99e-01 |
Pos logit contributions | |
assian | +3.091 |
hower | +2.993 |
orah | +2.967 |
oops | +2.927 |
hari | +2.897 |
Neg logit contributions | |
llor | -2.472 |
zag | -2.427 |
cling | -2.386 |
rients | -2.363 |
-$ | -2.336 |
Token | the |
Token ID | 262 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
assian | +3.189 |
hower | +3.081 |
orah | +3.017 |
oops | +2.986 |
hari | +2.963 |
Neg logit contributions | |
llor | -3.579 |
rients | -3.442 |
zag | -3.435 |
cling | -3.404 |
distingu | -3.390 |
Token | mix |
Token ID | 5022 |
Feature activation | -1.93e+00 |
Pos logit contributions | |
assian | +4.188 |
orah | +4.038 |
hower | +4.018 |
oops | +3.925 |
hari | +3.913 |
Neg logit contributions | |
llor | -3.466 |
rients | -3.309 |
zag | -3.303 |
cling | -3.289 |
-$ | -3.256 |
Token | , |
Token ID | 11 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
assian | +6.841 |
hower | +6.668 |
orah | +6.463 |
hari | +6.352 |
oops | +6.302 |
Neg logit contributions | |
llor | -6.974 |
rients | -6.951 |
zag | -6.945 |
distingu | -6.759 |
cling | -6.745 |
Token | the |
Token ID | 262 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
assian | +0.450 |
hower | +0.438 |
orah | +0.428 |
oops | +0.425 |
hari | +0.423 |
Neg logit contributions | |
llor | -0.417 |
zag | -0.401 |
rients | -0.395 |
cling | -0.395 |
-$ | -0.392 |
Token | internal |
Token ID | 5387 |
Feature activation | -2.75e-01 |
Pos logit contributions | |
llor | +0.722 |
zag | +0.693 |
cling | +0.684 |
rients | +0.680 |
-$ | +0.676 |
Neg logit contributions | |
assian | -0.760 |
hower | -0.741 |
hari | -0.720 |
orah | -0.719 |
oops | -0.718 |
Token | debate |
Token ID | 4384 |
Feature activation | +5.81e-02 |
Pos logit contributions | |
assian | +0.915 |
hower | +0.879 |
orah | +0.860 |
oops | +0.850 |
hari | +0.847 |
Neg logit contributions | |
llor | -1.183 |
zag | -1.145 |
rients | -1.133 |
cling | -1.132 |
-$ | -1.124 |
Token | in |
Token ID | 287 |
Feature activation | -5.77e-02 |
Pos logit contributions | |
llor | +0.200 |
zag | +0.192 |
cling | +0.189 |
rients | +0.189 |
-$ | +0.187 |
Neg logit contributions | |
assian | -0.244 |
hower | -0.238 |
orah | -0.233 |
oops | -0.231 |
hari | -0.230 |
Token | . |
Token ID | 13 |
Feature activation | +4.97e-02 |
Pos logit contributions | |
assian | +0.320 |
hower | +0.312 |
orah | +0.306 |
oops | +0.304 |
hari | +0.303 |
Neg logit contributions | |
llor | -0.213 |
zag | -0.203 |
cling | -0.199 |
rients | -0.199 |
-$ | -0.197 |
Token |
|
Token ID | 198 |
Feature activation | +2.77e-02 |
Pos logit contributions | |
llor | +0.183 |
zag | +0.176 |
cling | +0.173 |
rients | +0.173 |
-$ | +0.172 |
Neg logit contributions | |
assian | -0.197 |
hower | -0.192 |
orah | -0.188 |
oops | -0.186 |
hari | -0.185 |
Token |
|
Token ID | 198 |
Feature activation | +7.49e-02 |
Pos logit contributions | |
llor | +0.100 |
zag | +0.096 |
-$ | +0.095 |
cling | +0.095 |
rients | +0.094 |
Neg logit contributions | |
assian | -0.113 |
hower | -0.111 |
orah | -0.107 |
oops | -0.106 |
hari | -0.106 |
Token | This |
Token ID | 1212 |
Feature activation | +4.79e-02 |
Pos logit contributions | |
llor | +0.248 |
zag | +0.238 |
cling | +0.234 |
-$ | +0.234 |
rients | +0.233 |
Neg logit contributions | |
assian | -0.325 |
hower | -0.320 |
orah | -0.310 |
hari | -0.306 |
oops | -0.305 |
Token | article |
Token ID | 2708 |
Feature activation | -3.61e-01 |
Pos logit contributions | |
llor | +0.159 |
zag | +0.152 |
cling | +0.150 |
rients | +0.149 |
-$ | +0.148 |
Neg logit contributions | |
assian | -0.208 |
hower | -0.202 |
orah | -0.199 |
oops | -0.196 |
hari | -0.196 |
Token | originally |
Token ID | 6198 |
Feature activation | -1.93e+00 |
Pos logit contributions | |
assian | +1.465 |
hower | +1.419 |
orah | +1.389 |
oops | +1.384 |
hari | +1.377 |
Neg logit contributions | |
llor | -1.289 |
zag | -1.237 |
cling | -1.229 |
rients | -1.221 |
-$ | -1.208 |
Token | appeared |
Token ID | 4120 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
assian | +5.820 |
hari | +5.543 |
orah | +5.526 |
oops | +5.464 |
hower | +5.432 |
Neg logit contributions | |
llor | -8.180 |
cling | -8.116 |
rients | -8.069 |
zag | -7.985 |
distingu | -7.901 |
Token | on |
Token ID | 319 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
assian | +5.521 |
oops | +5.389 |
hower | +5.373 |
orah | +5.356 |
hari | +5.313 |
Neg logit contributions | |
llor | -5.817 |
zag | -5.655 |
rients | -5.634 |
distingu | -5.623 |
cling | -5.566 |
Token | HuffPost |
Token ID | 35130 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
assian | +4.723 |
oops | +4.607 |
hower | +4.600 |
hari | +4.549 |
orah | +4.528 |
Neg logit contributions | |
llor | -3.621 |
zag | -3.484 |
rients | -3.471 |
distingu | -3.407 |
cling | -3.390 |
Token | . |
Token ID | 13 |
Feature activation | -1.87e-01 |
Pos logit contributions | |
assian | +5.197 |
hower | +5.039 |
orah | +4.942 |
oops | +4.923 |
oran | +4.842 |
Neg logit contributions | |
llor | -3.788 |
zag | -3.607 |
rients | -3.587 |
cling | -3.537 |
distingu | -3.536 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
assian | +0.778 |
hower | +0.757 |
orah | +0.741 |
oops | +0.736 |
hari | +0.733 |
Neg logit contributions | |
llor | -0.649 |
zag | -0.623 |
cling | -0.614 |
rients | -0.614 |
-$ | -0.608 |
Token | was |
Token ID | 373 |
Feature activation | -3.10e-01 |
Pos logit contributions | |
llor | +0.589 |
zag | +0.564 |
cling | +0.559 |
-$ | +0.555 |
rients | +0.552 |
Neg logit contributions | |
assian | -0.731 |
hower | -0.711 |
orah | -0.696 |
hari | -0.689 |
oops | -0.686 |
Token | up |
Token ID | 510 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
assian | +1.140 |
hower | +1.105 |
orah | +1.081 |
oops | +1.072 |
hari | +1.066 |
Neg logit contributions | |
llor | -1.232 |
zag | -1.189 |
rients | -1.174 |
cling | -1.172 |
-$ | -1.162 |
Token | . |
Token ID | 13 |
Feature activation | -6.30e-01 |
Pos logit contributions | |
llor | +0.590 |
zag | +0.566 |
-$ | +0.561 |
cling | +0.559 |
rients | +0.553 |
Neg logit contributions | |
assian | -0.759 |
hower | -0.740 |
orah | -0.721 |
oops | -0.719 |
hari | -0.717 |
Token |
|
Token ID | 198 |
Feature activation | -7.09e-01 |
Pos logit contributions | |
assian | +2.294 |
hower | +2.215 |
orah | +2.171 |
oops | +2.155 |
hari | +2.145 |
Neg logit contributions | |
llor | -2.510 |
zag | -2.423 |
cling | -2.384 |
rients | -2.383 |
distingu | -2.361 |
Token |
|
Token ID | 198 |
Feature activation | -6.80e-01 |
Pos logit contributions | |
assian | +2.535 |
hower | +2.412 |
orah | +2.410 |
oops | +2.395 |
hari | +2.379 |
Neg logit contributions | |
llor | -2.839 |
distingu | -2.811 |
zag | -2.743 |
rients | -2.716 |
cling | -2.691 |
Token | " |
Token ID | 1 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
assian | +3.272 |
hower | +3.151 |
oops | +3.149 |
orah | +3.141 |
hari | +3.127 |
Neg logit contributions | |
llor | -1.902 |
zag | -1.797 |
distingu | -1.773 |
rients | -1.769 |
cling | -1.747 |
Token | I |
Token ID | 40 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
assian | +6.224 |
oops | +6.219 |
orah | +5.872 |
hari | +5.821 |
hower | +5.787 |
Neg logit contributions | |
llor | -7.867 |
distingu | -7.721 |
zag | -7.542 |
rients | -7.533 |
cling | -7.286 |
Token | tried |
Token ID | 3088 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
llor | +0.375 |
zag | +0.360 |
cling | +0.360 |
-$ | +0.355 |
rients | +0.352 |
Neg logit contributions | |
assian | -0.427 |
hower | -0.416 |
orah | -0.402 |
oops | -0.402 |
hari | -0.402 |
Token | to |
Token ID | 284 |
Feature activation | +8.81e-01 |
Pos logit contributions | |
llor | +2.175 |
zag | +2.081 |
-$ | +2.062 |
cling | +2.051 |
rients | +2.016 |
Neg logit contributions | |
assian | -2.838 |
hower | -2.781 |
orah | -2.698 |
oops | -2.694 |
hari | -2.651 |
Token | stall |
Token ID | 22549 |
Feature activation | -7.72e-02 |
Pos logit contributions | |
llor | +3.187 |
-$ | +3.104 |
zag | +3.068 |
cling | +3.055 |
distingu | +3.042 |
Neg logit contributions | |
assian | -3.444 |
hower | -3.337 |
hari | -3.247 |
oops | -3.206 |
orah | -3.173 |
Token | him |
Token ID | 683 |
Feature activation | -8.96e-02 |
Pos logit contributions | |
assian | +0.287 |
hower | +0.279 |
orah | +0.272 |
oops | +0.269 |
hari | +0.268 |
Neg logit contributions | |
llor | -0.303 |
zag | -0.292 |
cling | -0.288 |
rients | -0.288 |
-$ | -0.287 |
Token | home |
Token ID | 1363 |
Feature activation | +4.62e-02 |
Pos logit contributions | |
assian | +2.108 |
hower | +2.037 |
orah | +2.002 |
oops | +1.981 |
hari | +1.974 |
Neg logit contributions | |
llor | -2.016 |
zag | -1.941 |
cling | -1.912 |
rients | -1.911 |
-$ | -1.889 |
Token | supply |
Token ID | 5127 |
Feature activation | -7.05e-01 |
Pos logit contributions | |
llor | +0.167 |
zag | +0.160 |
cling | +0.159 |
rients | +0.158 |
-$ | +0.158 |
Neg logit contributions | |
assian | -0.186 |
hower | -0.181 |
orah | -0.176 |
oops | -0.176 |
hari | -0.175 |
Token | ; |
Token ID | 26 |
Feature activation | -4.15e-01 |
Pos logit contributions | |
assian | +2.824 |
hower | +2.753 |
orah | +2.701 |
oops | +2.668 |
hari | +2.664 |
Neg logit contributions | |
llor | -2.525 |
zag | -2.445 |
rients | -2.396 |
cling | -2.384 |
-$ | -2.341 |
Token | from |
Token ID | 422 |
Feature activation | -4.28e-01 |
Pos logit contributions | |
assian | +1.627 |
hower | +1.580 |
orah | +1.554 |
oops | +1.537 |
hari | +1.532 |
Neg logit contributions | |
llor | -1.533 |
zag | -1.478 |
rients | -1.459 |
cling | -1.450 |
-$ | -1.429 |
Token | the |
Token ID | 262 |
Feature activation | -4.42e-01 |
Pos logit contributions | |
assian | +1.700 |
hower | +1.649 |
orah | +1.626 |
oops | +1.604 |
hari | +1.593 |
Neg logit contributions | |
llor | -1.560 |
zag | -1.490 |
rients | -1.478 |
cling | -1.471 |
-$ | -1.437 |
Token | works |
Token ID | 2499 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
assian | +1.754 |
hower | +1.695 |
orah | +1.671 |
oops | +1.648 |
hari | +1.639 |
Neg logit contributions | |
llor | -1.624 |
zag | -1.559 |
rients | -1.536 |
cling | -1.534 |
-$ | -1.513 |
Token | of |
Token ID | 286 |
Feature activation | -5.20e-01 |
Pos logit contributions | |
assian | +7.055 |
hower | +6.913 |
orah | +6.751 |
hari | +6.544 |
oops | +6.513 |
Neg logit contributions | |
llor | -7.107 |
rients | -6.779 |
zag | -6.779 |
cling | -6.584 |
distingu | -6.552 |
Token | Mr |
Token ID | 1770 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
assian | +2.021 |
hower | +1.964 |
orah | +1.924 |
oops | +1.901 |
hari | +1.895 |
Neg logit contributions | |
llor | -1.937 |
zag | -1.848 |
rients | -1.836 |
cling | -1.836 |
-$ | -1.799 |
Token | . |
Token ID | 13 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
llor | +0.957 |
zag | +0.912 |
cling | +0.896 |
rients | +0.895 |
-$ | +0.884 |
Neg logit contributions | |
assian | -1.498 |
hower | -1.463 |
orah | -1.436 |
oops | -1.426 |
hari | -1.421 |
Token | Wh |
Token ID | 854 |
Feature activation | -5.92e-01 |
Pos logit contributions | |
llor | +1.159 |
zag | +1.111 |
cling | +1.094 |
-$ | +1.092 |
rients | +1.090 |
Neg logit contributions | |
assian | -1.527 |
hower | -1.489 |
oops | -1.455 |
orah | -1.453 |
hari | -1.446 |
Token | arton |
Token ID | 41328 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
assian | +1.748 |
hower | +1.674 |
orah | +1.629 |
oops | +1.615 |
hari | +1.604 |
Neg logit contributions | |
llor | -2.777 |
zag | -2.691 |
cling | -2.663 |
rients | -2.663 |
-$ | -2.643 |
Token | at |
Token ID | 379 |
Feature activation | -9.72e-01 |
Pos logit contributions | |
assian | +4.429 |
orah | +4.296 |
hari | +4.292 |
oops | +4.256 |
hower | +4.163 |
Neg logit contributions | |
distingu | -5.847 |
llor | -5.616 |
rients | -5.514 |
zag | -5.506 |
� | -5.390 |
Token | 9 |
Token ID | 860 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
assian | +4.021 |
orah | +3.888 |
oops | +3.883 |
hower | +3.879 |
hari | +3.811 |
Neg logit contributions | |
llor | -3.279 |
distingu | -3.192 |
rients | -3.109 |
zag | -3.095 |
cling | -3.078 |
Token | : |
Token ID | 25 |
Feature activation | -5.90e-01 |
Pos logit contributions | |
assian | +4.459 |
orah | +4.282 |
oops | +4.256 |
hari | +4.183 |
hower | +4.132 |
Neg logit contributions | |
distingu | -5.304 |
llor | -5.059 |
zag | -4.882 |
rients | -4.851 |
cling | -4.757 |
Token | 01 |
Token ID | 486 |
Feature activation | -9.85e-01 |
Pos logit contributions | |
assian | +2.546 |
orah | +2.450 |
oops | +2.444 |
hower | +2.441 |
hari | +2.408 |
Neg logit contributions | |
llor | -1.938 |
distingu | -1.855 |
zag | -1.842 |
rients | -1.825 |
cling | -1.809 |
Token | am |
Token ID | 321 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
assian | +3.598 |
hower | +3.486 |
orah | +3.438 |
oops | +3.407 |
hari | +3.394 |
Neg logit contributions | |
llor | -3.813 |
zag | -3.702 |
distingu | -3.699 |
rients | -3.679 |
cling | -3.609 |
Token | PDT |
Token ID | 28288 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
assian | +2.941 |
hower | +2.832 |
orah | +2.777 |
oops | +2.773 |
hari | +2.754 |
Neg logit contributions | |
llor | -3.170 |
zag | -3.083 |
distingu | -3.041 |
cling | -3.034 |
rients | -3.018 |
Token |
|
Token ID | 198 |
Feature activation | -9.80e-01 |
Pos logit contributions | |
hower | +5.826 |
assian | +5.800 |
orah | +5.538 |
oops | +5.501 |
oran | +5.435 |
Neg logit contributions | |
llor | -7.734 |
zag | -7.586 |
rients | -7.431 |
cling | -7.401 |
distingu | -7.362 |
Token |
|
Token ID | 198 |
Feature activation | -3.02e-01 |
Pos logit contributions | |
assian | +3.343 |
orah | +3.199 |
oops | +3.185 |
hower | +3.155 |
hari | +3.134 |
Neg logit contributions | |
distingu | -4.112 |
llor | -4.025 |
zag | -3.894 |
rients | -3.876 |
cling | -3.824 |
Token | Do |
Token ID | 5211 |
Feature activation | -9.08e-02 |
Pos logit contributions | |
assian | +1.227 |
hower | +1.192 |
orah | +1.172 |
oops | +1.166 |
hari | +1.158 |
Neg logit contributions | |
llor | -1.076 |
zag | -1.030 |
rients | -1.018 |
cling | -1.016 |
-$ | -1.002 |
Token | use |
Token ID | 779 |
Feature activation | -1.30e-03 |
Pos logit contributions | |
assian | +0.367 |
hower | +0.360 |
orah | +0.355 |
oops | +0.350 |
hari | +0.350 |
Neg logit contributions | |
llor | -0.320 |
rients | -0.309 |
zag | -0.308 |
cling | -0.305 |
-$ | -0.302 |
Token | social |
Token ID | 1919 |
Feature activation | -8.64e-01 |
Pos logit contributions | |
assian | +0.005 |
hower | +0.005 |
orah | +0.005 |
hari | +0.005 |
oops | +0.005 |
Neg logit contributions | |
llor | -0.005 |
zag | -0.005 |
rients | -0.005 |
cling | -0.005 |
-$ | -0.005 |
Token | Hillary |
Token ID | 20397 |
Feature activation | +2.00e-01 |
Pos logit contributions | |
llor | +2.026 |
-$ | +2.007 |
zag | +1.984 |
cling | +1.966 |
nc | +1.945 |
Neg logit contributions | |
assian | -2.677 |
hower | -2.666 |
orah | -2.549 |
hari | -2.486 |
oran | -2.458 |
Token | Clinton |
Token ID | 2605 |
Feature activation | +6.50e-01 |
Pos logit contributions | |
llor | +0.867 |
zag | +0.840 |
rients | +0.829 |
cling | +0.829 |
-$ | +0.822 |
Neg logit contributions | |
assian | -0.660 |
hower | -0.639 |
orah | -0.622 |
oops | -0.616 |
hari | -0.614 |
Token | 's |
Token ID | 338 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
llor | +1.973 |
zag | +1.884 |
cling | +1.848 |
-$ | +1.835 |
rients | +1.833 |
Neg logit contributions | |
assian | -2.986 |
hower | -2.909 |
orah | -2.855 |
oops | -2.837 |
hari | -2.820 |
Token | campaign |
Token ID | 1923 |
Feature activation | +8.83e-04 |
Pos logit contributions | |
llor | +1.326 |
zag | +1.272 |
cling | +1.248 |
rients | +1.236 |
-$ | +1.234 |
Neg logit contributions | |
assian | -2.040 |
hower | -1.986 |
orah | -1.948 |
oops | -1.935 |
hari | -1.934 |
Token | manager |
Token ID | 4706 |
Feature activation | -7.87e-01 |
Pos logit contributions | |
llor | +0.004 |
zag | +0.004 |
rients | +0.004 |
cling | +0.004 |
-$ | +0.004 |
Neg logit contributions | |
assian | -0.003 |
hower | -0.003 |
orah | -0.003 |
hari | -0.003 |
oops | -0.003 |
Token | Rob |
Token ID | 3851 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
assian | +2.457 |
hower | +2.372 |
orah | +2.317 |
hari | +2.291 |
oops | +2.289 |
Neg logit contributions | |
llor | -3.479 |
zag | -3.389 |
cling | -3.363 |
rients | -3.361 |
-$ | -3.293 |
Token | by |
Token ID | 1525 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
assian | +5.393 |
orah | +5.343 |
hari | +5.305 |
oops | +5.249 |
hower | +5.222 |
Neg logit contributions | |
distingu | -8.465 |
llor | -8.340 |
zag | -7.929 |
� | -7.902 |
rients | -7.833 |
Token | M |
Token ID | 337 |
Feature activation | +2.69e-01 |
Pos logit contributions | |
assian | +0.669 |
hower | +0.650 |
orah | +0.634 |
oops | +0.630 |
hari | +0.628 |
Neg logit contributions | |
llor | -0.538 |
zag | -0.518 |
rients | -0.509 |
-$ | -0.508 |
cling | -0.507 |
Token | ook |
Token ID | 566 |
Feature activation | -3.04e-01 |
Pos logit contributions | |
llor | +1.351 |
zag | +1.310 |
cling | +1.305 |
-$ | +1.295 |
rients | +1.289 |
Neg logit contributions | |
assian | -0.720 |
hower | -0.674 |
orah | -0.645 |
hari | -0.636 |
oops | -0.621 |
Token | said |
Token ID | 531 |
Feature activation | -7.43e-01 |
Pos logit contributions | |
assian | +1.129 |
hower | +1.095 |
orah | +1.071 |
oops | +1.059 |
hari | +1.059 |
Neg logit contributions | |
llor | -1.188 |
zag | -1.146 |
cling | -1.132 |
rients | -1.131 |
-$ | -1.122 |
Token | the |
Token ID | 262 |
Feature activation | +8.02e-02 |
Pos logit contributions | |
assian | +2.818 |
hower | +2.745 |
oops | +2.715 |
hari | +2.698 |
orah | +2.697 |
Neg logit contributions | |
llor | -2.771 |
zag | -2.680 |
rients | -2.650 |
cling | -2.637 |
distingu | -2.591 |
Token | noise |
Token ID | 7838 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
assian | +0.350 |
hower | +0.340 |
orah | +0.333 |
oops | +0.331 |
hari | +0.329 |
Neg logit contributions | |
llor | -0.333 |
zag | -0.320 |
rients | -0.316 |
cling | -0.316 |
-$ | -0.313 |
Token | and |
Token ID | 290 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
llor | +1.377 |
zag | +1.331 |
cling | +1.319 |
-$ | +1.316 |
rients | +1.307 |
Neg logit contributions | |
assian | -1.739 |
hower | -1.686 |
orah | -1.654 |
hari | -1.642 |
oops | -1.639 |
Token | trash |
Token ID | 13913 |
Feature activation | +8.69e-01 |
Pos logit contributions | |
llor | +0.449 |
zag | +0.432 |
cling | +0.425 |
rients | +0.425 |
-$ | +0.421 |
Neg logit contributions | |
assian | -0.546 |
hower | -0.531 |
orah | -0.520 |
oops | -0.516 |
hari | -0.515 |
Token | . |
Token ID | 13 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
llor | +2.686 |
cling | +2.629 |
zag | +2.594 |
-$ | +2.582 |
rients | +2.553 |
Neg logit contributions | |
assian | -3.877 |
hower | -3.709 |
orah | -3.683 |
hari | -3.663 |
oops | -3.637 |
Token | Est |
Token ID | 10062 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
llor | +0.516 |
zag | +0.497 |
cling | +0.490 |
-$ | +0.489 |
rients | +0.488 |
Neg logit contributions | |
assian | -0.640 |
hower | -0.629 |
orah | -0.610 |
oops | -0.606 |
hari | -0.603 |
Token | eb |
Token ID | 1765 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
assian | +1.097 |
hower | +1.056 |
orah | +1.044 |
oops | +1.034 |
hari | +1.029 |
Neg logit contributions | |
llor | -1.060 |
zag | -1.018 |
rients | -1.004 |
cling | -1.004 |
-$ | -0.994 |
Token | an |
Token ID | 272 |
Feature activation | -3.72e-01 |
Pos logit contributions | |
assian | +6.641 |
orah | +6.505 |
oops | +6.465 |
hari | +6.259 |
oran | +6.161 |
Neg logit contributions | |
llor | -7.210 |
zag | -7.152 |
distingu | -6.984 |
-$ | -6.949 |
rients | -6.887 |
Token | Par |
Token ID | 2547 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
assian | +1.592 |
hower | +1.551 |
orah | +1.521 |
oops | +1.509 |
hari | +1.503 |
Neg logit contributions | |
llor | -1.250 |
zag | -1.196 |
cling | -1.178 |
rients | -1.177 |
-$ | -1.165 |
Token | ra |
Token ID | 430 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
llor | +0.940 |
zag | +0.915 |
cling | +0.895 |
rients | +0.889 |
-$ | +0.873 |
Neg logit contributions | |
assian | -1.097 |
hower | -1.086 |
orah | -1.049 |
oops | -1.043 |
hari | -1.038 |
Token | and |
Token ID | 290 |
Feature activation | -6.62e-01 |
Pos logit contributions | |
llor | +0.839 |
zag | +0.804 |
-$ | +0.784 |
cling | +0.780 |
rients | +0.779 |
Neg logit contributions | |
assian | -1.277 |
hower | -1.260 |
orah | -1.225 |
oops | -1.220 |
hari | -1.213 |
Token | William |
Token ID | 3977 |
Feature activation | -5.53e-01 |
Pos logit contributions | |
assian | +2.567 |
hower | +2.480 |
orah | +2.440 |
oops | +2.430 |
hari | +2.423 |
Neg logit contributions | |
llor | -2.455 |
zag | -2.374 |
rients | -2.351 |
cling | -2.339 |
-$ | -2.313 |
Token | based |
Token ID | 1912 |
Feature activation | +3.60e-01 |
Pos logit contributions | |
llor | +0.789 |
zag | +0.752 |
cling | +0.742 |
rients | +0.740 |
-$ | +0.736 |
Neg logit contributions | |
assian | -0.998 |
hower | -0.973 |
orah | -0.952 |
oops | -0.947 |
hari | -0.946 |
Token | in |
Token ID | 287 |
Feature activation | +2.61e-01 |
Pos logit contributions | |
llor | +1.185 |
zag | +1.129 |
cling | +1.118 |
rients | +1.110 |
-$ | +1.103 |
Neg logit contributions | |
assian | -1.571 |
hower | -1.528 |
orah | -1.493 |
oops | -1.485 |
hari | -1.482 |
Token | London |
Token ID | 3576 |
Feature activation | +7.54e-01 |
Pos logit contributions | |
llor | +0.823 |
zag | +0.787 |
cling | +0.774 |
rients | +0.771 |
-$ | +0.763 |
Neg logit contributions | |
assian | -1.172 |
hower | -1.143 |
orah | -1.119 |
oops | -1.112 |
hari | -1.111 |
Token | , |
Token ID | 11 |
Feature activation | +6.92e-01 |
Pos logit contributions | |
llor | +2.365 |
zag | +2.225 |
-$ | +2.211 |
cling | +2.207 |
rients | +2.199 |
Neg logit contributions | |
assian | -3.370 |
hower | -3.300 |
hari | -3.213 |
oops | -3.191 |
orah | -3.189 |
Token | wrote |
Token ID | 2630 |
Feature activation | +4.40e-01 |
Pos logit contributions | |
llor | +2.269 |
zag | +2.111 |
rients | +2.102 |
cling | +2.084 |
-$ | +2.062 |
Neg logit contributions | |
assian | -3.043 |
hower | -2.965 |
hari | -2.891 |
orah | -2.874 |
oops | -2.873 |
Token | an |
Token ID | 281 |
Feature activation | +9.82e-01 |
Pos logit contributions | |
llor | +1.454 |
zag | +1.389 |
cling | +1.367 |
rients | +1.363 |
-$ | +1.359 |
Neg logit contributions | |
assian | -1.901 |
hower | -1.857 |
orah | -1.802 |
hari | -1.799 |
oops | -1.792 |
Token | essay |
Token ID | 14268 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
llor | +2.870 |
zag | +2.759 |
-$ | +2.759 |
rients | +2.749 |
distingu | +2.718 |
Neg logit contributions | |
assian | -4.471 |
hower | -4.430 |
hari | -4.271 |
orah | -4.221 |
oops | -4.199 |
Token | , |
Token ID | 11 |
Feature activation | +5.52e-02 |
Pos logit contributions | |
assian | +1.024 |
hower | +0.995 |
orah | +0.975 |
oops | +0.967 |
hari | +0.962 |
Neg logit contributions | |
llor | -0.929 |
zag | -0.894 |
cling | -0.881 |
rients | -0.881 |
-$ | -0.871 |
Token | entitled |
Token ID | 9080 |
Feature activation | +5.55e-01 |
Pos logit contributions | |
llor | +0.204 |
zag | +0.196 |
cling | +0.194 |
rients | +0.193 |
-$ | +0.192 |
Neg logit contributions | |
assian | -0.218 |
hower | -0.212 |
orah | -0.207 |
hari | -0.205 |
oops | -0.205 |
Token | " |
Token ID | 366 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
llor | +2.003 |
zag | +1.917 |
cling | +1.904 |
rients | +1.897 |
-$ | +1.887 |
Neg logit contributions | |
assian | -2.236 |
hower | -2.165 |
hari | -2.119 |
orah | -2.113 |
oops | -2.095 |
Token | The |
Token ID | 464 |
Feature activation | +8.26e-01 |
Pos logit contributions | |
llor | +1.943 |
zag | +1.865 |
cling | +1.857 |
-$ | +1.829 |
rients | +1.821 |
Neg logit contributions | |
assian | -2.482 |
hower | -2.419 |
orah | -2.359 |
hari | -2.351 |
oops | -2.298 |
Token | aked |
Token ID | 4335 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
llor | +0.797 |
zag | +0.765 |
cling | +0.753 |
rients | +0.743 |
-$ | +0.729 |
Neg logit contributions | |
assian | -1.411 |
hower | -1.385 |
hari | -1.337 |
orah | -1.336 |
oops | -1.326 |
Token | past |
Token ID | 1613 |
Feature activation | +2.56e-01 |
Pos logit contributions | |
llor | +4.141 |
zag | +4.034 |
cling | +3.991 |
rients | +3.988 |
-$ | +3.933 |
Neg logit contributions | |
assian | -5.400 |
hower | -5.321 |
orah | -5.116 |
oops | -5.078 |
hari | -5.070 |
Token | eb |
Token ID | 1765 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
llor | +0.967 |
zag | +0.930 |
rients | +0.925 |
cling | +0.921 |
-$ | +0.913 |
Neg logit contributions | |
assian | -0.982 |
hower | -0.962 |
orah | -0.930 |
oops | -0.926 |
hari | -0.924 |
Token | oard |
Token ID | 11953 |
Feature activation | +5.17e-01 |
Pos logit contributions | |
assian | +3.986 |
oops | +3.862 |
hari | +3.690 |
orah | +3.644 |
oran | +3.431 |
Neg logit contributions | |
llor | -8.107 |
distingu | -7.908 |
zag | -7.904 |
cling | -7.777 |
-$ | -7.694 |
Token | or |
Token ID | 393 |
Feature activation | -3.31e-01 |
Pos logit contributions | |
llor | +1.710 |
zag | +1.636 |
cling | +1.617 |
rients | +1.613 |
-$ | +1.600 |
Neg logit contributions | |
assian | -2.241 |
hower | -2.186 |
orah | -2.139 |
oops | -2.118 |
hari | -2.113 |
Token | cloth |
Token ID | 16270 |
Feature activation | +9.37e-01 |
Pos logit contributions | |
assian | +1.408 |
hower | +1.368 |
orah | +1.347 |
hari | +1.341 |
oops | +1.338 |
Neg logit contributions | |
llor | -1.112 |
zag | -1.057 |
rients | -1.050 |
-$ | -1.036 |
cling | -1.034 |
Token | , |
Token ID | 11 |
Feature activation | +4.17e-01 |
Pos logit contributions | |
llor | +3.036 |
cling | +2.933 |
zag | +2.924 |
-$ | +2.904 |
rients | +2.895 |
Neg logit contributions | |
assian | -4.045 |
hower | -4.010 |
orah | -3.837 |
hari | -3.807 |
oops | -3.804 |
Token | and |
Token ID | 290 |
Feature activation | +3.61e-01 |
Pos logit contributions | |
llor | +1.435 |
zag | +1.386 |
cling | +1.372 |
rients | +1.363 |
-$ | +1.352 |
Neg logit contributions | |
assian | -1.750 |
hower | -1.708 |
orah | -1.667 |
oops | -1.650 |
hari | -1.641 |
Token | silver |
Token ID | 8465 |
Feature activation | +4.38e-01 |
Pos logit contributions | |
llor | +1.371 |
zag | +1.324 |
cling | +1.314 |
rients | +1.309 |
-$ | +1.300 |
Neg logit contributions | |
assian | -1.386 |
hower | -1.346 |
orah | -1.315 |
oops | -1.305 |
hari | -1.293 |
Token | . |
Token ID | 13 |
Feature activation | -3.87e-02 |
Pos logit contributions | |
llor | +1.444 |
zag | +1.390 |
cling | +1.376 |
rients | +1.369 |
-$ | +1.366 |
Neg logit contributions | |
assian | -1.898 |
hower | -1.860 |
orah | -1.808 |
oops | -1.799 |
hari | -1.790 |
Token | This |
Token ID | 770 |
Feature activation | +4.51e-02 |
Pos logit contributions | |
assian | +0.150 |
hower | +0.145 |
orah | +0.142 |
oops | +0.141 |
hari | +0.140 |
Neg logit contributions | |
llor | -0.146 |
zag | -0.141 |
cling | -0.139 |
rients | -0.139 |
-$ | -0.138 |
Token |
|
Token ID | 198 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
assian | +0.103 |
hower | +0.101 |
orah | +0.098 |
oops | +0.097 |
hari | +0.097 |
Neg logit contributions | |
llor | -0.093 |
zag | -0.089 |
-$ | -0.088 |
cling | -0.088 |
rients | -0.088 |
Token | It |
Token ID | 1026 |
Feature activation | -2.83e-02 |
Pos logit contributions | |
llor | +0.366 |
zag | +0.354 |
-$ | +0.351 |
cling | +0.349 |
rients | +0.344 |
Neg logit contributions | |
assian | -0.456 |
hower | -0.453 |
orah | -0.433 |
hari | -0.429 |
oops | -0.426 |
Token | 's |
Token ID | 338 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
assian | +0.127 |
hower | +0.124 |
orah | +0.121 |
oops | +0.121 |
hari | +0.120 |
Neg logit contributions | |
llor | -0.089 |
zag | -0.086 |
cling | -0.084 |
rients | -0.084 |
-$ | -0.083 |
Token | been |
Token ID | 587 |
Feature activation | -6.48e-01 |
Pos logit contributions | |
assian | +0.727 |
hower | +0.708 |
orah | +0.693 |
oops | +0.687 |
hari | +0.685 |
Neg logit contributions | |
llor | -0.650 |
zag | -0.624 |
rients | -0.616 |
cling | -0.615 |
-$ | -0.609 |
Token | less |
Token ID | 1342 |
Feature activation | -9.32e-01 |
Pos logit contributions | |
assian | +2.576 |
hower | +2.491 |
orah | +2.470 |
hari | +2.430 |
oops | +2.430 |
Neg logit contributions | |
llor | -2.359 |
zag | -2.237 |
rients | -2.235 |
cling | -2.217 |
-$ | -2.167 |
Token | than |
Token ID | 621 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
assian | +3.180 |
hower | +3.036 |
orah | +2.993 |
hari | +2.943 |
oops | +2.931 |
Neg logit contributions | |
llor | -3.893 |
zag | -3.752 |
rients | -3.749 |
cling | -3.679 |
-$ | -3.603 |
Token | a |
Token ID | 257 |
Feature activation | +6.42e-01 |
Pos logit contributions | |
llor | +3.413 |
-$ | +3.394 |
zag | +3.345 |
cling | +3.290 |
distingu | +3.194 |
Neg logit contributions | |
assian | -5.514 |
hower | -5.437 |
oops | -5.253 |
orah | -5.238 |
hari | -5.217 |
Token | year |
Token ID | 614 |
Feature activation | +6.35e-01 |
Pos logit contributions | |
llor | +1.852 |
zag | +1.779 |
-$ | +1.771 |
cling | +1.771 |
distingu | +1.712 |
Neg logit contributions | |
assian | -3.004 |
hower | -2.916 |
oops | -2.874 |
orah | -2.868 |
hari | -2.842 |
Token | since |
Token ID | 1201 |
Feature activation | +7.24e-01 |
Pos logit contributions | |
llor | +1.896 |
zag | +1.842 |
-$ | +1.814 |
cling | +1.792 |
rients | +1.744 |
Neg logit contributions | |
assian | -2.894 |
hower | -2.843 |
orah | -2.783 |
oops | -2.778 |
hari | -2.767 |
Token | game |
Token ID | 983 |
Feature activation | -3.32e-02 |
Pos logit contributions | |
llor | +2.462 |
zag | +2.353 |
cling | +2.324 |
rients | +2.304 |
-$ | +2.303 |
Neg logit contributions | |
assian | -3.071 |
hower | -2.964 |
orah | -2.901 |
hari | -2.878 |
oops | -2.863 |
Token | developer |
Token ID | 8517 |
Feature activation | +3.45e-01 |
Pos logit contributions | |
assian | +0.131 |
hower | +0.127 |
orah | +0.125 |
oops | +0.124 |
hari | +0.123 |
Neg logit contributions | |
llor | -0.123 |
zag | -0.118 |
cling | -0.116 |
rients | -0.116 |
-$ | -0.115 |
Token |
|
Token ID | 198 |
Feature activation | +4.92e-01 |
Pos logit contributions | |
llor | +1.672 |
-$ | +1.627 |
zag | +1.611 |
cling | +1.594 |
rients | +1.577 |
Neg logit contributions | |
assian | -2.137 |
hower | -2.133 |
orah | -2.029 |
hari | -2.016 |
oops | -2.011 |
Token | The |
Token ID | 464 |
Feature activation | +3.77e-01 |
Pos logit contributions | |
llor | +1.657 |
zag | +1.588 |
-$ | +1.568 |
cling | +1.568 |
rients | +1.556 |
Neg logit contributions | |
assian | -2.102 |
hower | -2.069 |
orah | -1.991 |
hari | -1.980 |
oops | -1.969 |
Token | Russian |
Token ID | 3394 |
Feature activation | +3.03e-01 |
Pos logit contributions | |
llor | +1.187 |
zag | +1.133 |
cling | +1.108 |
rients | +1.108 |
-$ | +1.100 |
Neg logit contributions | |
assian | -1.701 |
hower | -1.655 |
orah | -1.618 |
oops | -1.616 |
hari | -1.612 |
Token | Navy |
Token ID | 8565 |
Feature activation | +3.98e-01 |
Pos logit contributions | |
llor | +0.995 |
zag | +0.953 |
cling | +0.935 |
-$ | +0.934 |
rients | +0.932 |
Neg logit contributions | |
assian | -1.323 |
hower | -1.289 |
orah | -1.258 |
oops | -1.254 |
hari | -1.250 |
Token | logged |
Token ID | 18832 |
Feature activation | +6.48e-01 |
Pos logit contributions | |
llor | +1.336 |
zag | +1.277 |
cling | +1.258 |
rients | +1.258 |
-$ | +1.251 |
Neg logit contributions | |
assian | -1.708 |
hower | -1.664 |
orah | -1.628 |
oops | -1.616 |
hari | -1.610 |
Token | over |
Token ID | 625 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
llor | +2.064 |
zag | +1.985 |
-$ | +1.950 |
rients | +1.931 |
cling | +1.931 |
Neg logit contributions | |
assian | -2.874 |
hower | -2.823 |
orah | -2.744 |
oops | -2.719 |
hari | -2.714 |
Token | 6 |
Token ID | 718 |
Feature activation | +3.46e-01 |
Pos logit contributions | |
llor | +3.096 |
-$ | +2.957 |
zag | +2.956 |
cling | +2.886 |
rients | +2.868 |
Neg logit contributions | |
assian | -5.629 |
hower | -5.466 |
orah | -5.356 |
hari | -5.336 |
oops | -5.325 |
Token | 500 |
Token ID | 4059 |
Feature activation | -4.11e-01 |
Pos logit contributions | |
llor | +1.069 |
zag | +1.033 |
-$ | +1.017 |
rients | +1.013 |
cling | +1.011 |
Neg logit contributions | |
assian | -1.559 |
hower | -1.529 |
orah | -1.494 |
hari | -1.485 |
oops | -1.479 |
Token | n |
Token ID | 299 |
Feature activation | +6.66e-01 |
Pos logit contributions | |
assian | +1.559 |
hower | +1.509 |
orah | +1.481 |
oops | +1.465 |
hari | +1.460 |
Neg logit contributions | |
llor | -1.578 |
zag | -1.522 |
cling | -1.506 |
rients | -1.501 |
-$ | -1.482 |
Token | autical |
Token ID | 37073 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
llor | +1.761 |
zag | +1.667 |
rients | +1.643 |
cling | +1.630 |
-$ | +1.615 |
Neg logit contributions | |
assian | -3.312 |
hower | -3.268 |
orah | -3.174 |
oops | -3.156 |
hari | -3.147 |
Token | reactor |
Token ID | 21905 |
Feature activation | -4.49e-03 |
Pos logit contributions | |
assian | +0.392 |
hower | +0.381 |
orah | +0.372 |
oops | +0.367 |
hari | +0.366 |
Neg logit contributions | |
llor | -0.445 |
zag | -0.429 |
cling | -0.424 |
rients | -0.424 |
-$ | -0.421 |
Token | on |
Token ID | 319 |
Feature activation | +5.98e-02 |
Pos logit contributions | |
assian | +0.395 |
hower | +0.384 |
orah | +0.376 |
oops | +0.373 |
hari | +0.371 |
Neg logit contributions | |
llor | -0.351 |
zag | -0.337 |
cling | -0.333 |
rients | -0.332 |
-$ | -0.331 |
Token | three |
Token ID | 1115 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
llor | +0.205 |
zag | +0.197 |
cling | +0.194 |
rients | +0.194 |
-$ | +0.192 |
Neg logit contributions | |
assian | -0.252 |
hower | -0.245 |
orah | -0.240 |
oops | -0.238 |
hari | -0.238 |
Token | different |
Token ID | 1180 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
llor | +1.369 |
zag | +1.328 |
rients | +1.311 |
-$ | +1.307 |
cling | +1.296 |
Neg logit contributions | |
assian | -1.519 |
hower | -1.494 |
orah | -1.447 |
oops | -1.436 |
hari | -1.430 |
Token | Open |
Token ID | 4946 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
llor | +0.915 |
zag | +0.886 |
rients | +0.875 |
cling | +0.869 |
-$ | +0.868 |
Neg logit contributions | |
assian | -0.900 |
hower | -0.882 |
orah | -0.860 |
oops | -0.852 |
hari | -0.846 |
Token | Systems |
Token ID | 11998 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
assian | +0.640 |
hower | +0.622 |
orah | +0.610 |
oops | +0.607 |
hari | +0.605 |
Neg logit contributions | |
llor | -0.429 |
zag | -0.408 |
cling | -0.401 |
rients | -0.399 |
-$ | -0.395 |
Token | Inter |
Token ID | 4225 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
llor | +1.062 |
zag | +1.017 |
rients | +1.005 |
cling | +1.002 |
-$ | +0.995 |
Neg logit contributions | |
assian | -1.368 |
hower | -1.335 |
orah | -1.309 |
oops | -1.299 |
hari | -1.294 |
Token | connection |
Token ID | 38659 |
Feature activation | +4.88e-01 |
Pos logit contributions | |
zag | +2.979 |
llor | +2.978 |
cling | +2.970 |
rients | +2.912 |
-$ | +2.890 |
Neg logit contributions | |
assian | -4.536 |
hower | -4.458 |
orah | -4.274 |
hari | -4.269 |
oops | -4.238 |
Token | ( |
Token ID | 357 |
Feature activation | +9.05e-01 |
Pos logit contributions | |
llor | +1.640 |
zag | +1.579 |
rients | +1.558 |
cling | +1.551 |
-$ | +1.538 |
Neg logit contributions | |
assian | -2.082 |
hower | -2.033 |
orah | -1.994 |
hari | -1.969 |
oops | -1.968 |
Token | OS |
Token ID | 2640 |
Feature activation | +9.84e-01 |
Pos logit contributions | |
llor | +3.082 |
-$ | +3.013 |
zag | +2.984 |
cling | +2.978 |
rients | +2.968 |
Neg logit contributions | |
hower | -3.629 |
assian | -3.613 |
hari | -3.466 |
orah | -3.437 |
oops | -3.340 |
Token | I |
Token ID | 40 |
Feature activation | +8.06e-01 |
Pos logit contributions | |
llor | +3.084 |
-$ | +3.018 |
rients | +3.015 |
zag | +2.966 |
cling | +2.916 |
Neg logit contributions | |
assian | -4.264 |
hower | -4.186 |
orah | -4.105 |
oops | -4.025 |
hari | -4.010 |
Token | ) |
Token ID | 8 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
llor | +2.808 |
rients | +2.672 |
zag | +2.670 |
cling | +2.661 |
-$ | +2.639 |
Neg logit contributions | |
assian | -3.335 |
hower | -3.244 |
orah | -3.195 |
hari | -3.142 |
oops | -3.140 |
Token | a |
Token ID | 257 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
llor | +1.674 |
zag | +1.591 |
cling | +1.571 |
rients | +1.570 |
-$ | +1.562 |
Neg logit contributions | |
assian | -2.250 |
hower | -2.217 |
orah | -2.157 |
oops | -2.144 |
hari | -2.142 |
Token | fan |
Token ID | 4336 |
Feature activation | +3.26e-01 |
Pos logit contributions | |
llor | +1.304 |
zag | +1.244 |
cling | +1.223 |
-$ | +1.218 |
rients | +1.214 |
Neg logit contributions | |
assian | -1.479 |
hower | -1.439 |
oops | -1.406 |
orah | -1.398 |
hari | -1.397 |
Token | as |
Token ID | 355 |
Feature activation | +3.31e-01 |
Pos logit contributions | |
llor | +1.142 |
zag | +1.097 |
cling | +1.085 |
-$ | +1.078 |
rients | +1.070 |
Neg logit contributions | |
assian | -1.331 |
hower | -1.308 |
orah | -1.276 |
oops | -1.269 |
hari | -1.258 |
Token | well |
Token ID | 880 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
llor | +1.530 |
zag | +1.480 |
cling | +1.467 |
rients | +1.460 |
-$ | +1.459 |
Neg logit contributions | |
assian | -0.999 |
hower | -0.969 |
orah | -0.934 |
oops | -0.929 |
hari | -0.918 |
Token | . |
Token ID | 13 |
Feature activation | +4.56e-01 |
Pos logit contributions | |
assian | +0.931 |
hower | +0.904 |
orah | +0.885 |
oops | +0.877 |
hari | +0.874 |
Neg logit contributions | |
llor | -0.878 |
zag | -0.846 |
cling | -0.834 |
rients | -0.834 |
-$ | -0.825 |
Token |
|
Token ID | 198 |
Feature activation | +5.65e-01 |
Pos logit contributions | |
llor | +1.583 |
-$ | +1.518 |
zag | +1.512 |
cling | +1.496 |
rients | +1.491 |
Neg logit contributions | |
assian | -1.873 |
hower | -1.843 |
orah | -1.780 |
hari | -1.778 |
oops | -1.765 |
Token |
|
Token ID | 198 |
Feature activation | +6.59e-01 |
Pos logit contributions | |
llor | +1.849 |
-$ | +1.808 |
zag | +1.787 |
cling | +1.767 |
rients | +1.735 |
Neg logit contributions | |
hower | -2.437 |
assian | -2.430 |
orah | -2.310 |
hari | -2.291 |
oops | -2.288 |
Token | How |
Token ID | 2437 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
llor | +2.193 |
-$ | +2.160 |
zag | +2.144 |
cling | +2.108 |
nc | +2.060 |
Neg logit contributions | |
hower | -2.828 |
assian | -2.756 |
orah | -2.635 |
hari | -2.613 |
oops | -2.564 |
Token | do |
Token ID | 466 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
llor | +0.688 |
zag | +0.661 |
cling | +0.650 |
rients | +0.649 |
-$ | +0.645 |
Neg logit contributions | |
assian | -0.832 |
hower | -0.813 |
orah | -0.792 |
oops | -0.788 |
hari | -0.787 |
Token | you |
Token ID | 345 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
llor | +1.495 |
zag | +1.440 |
cling | +1.424 |
rients | +1.423 |
-$ | +1.414 |
Neg logit contributions | |
assian | -1.445 |
hower | -1.412 |
orah | -1.367 |
oops | -1.363 |
hari | -1.361 |
Token | maintain |
Token ID | 5529 |
Feature activation | +6.70e-01 |
Pos logit contributions | |
llor | +1.317 |
zag | +1.258 |
cling | +1.252 |
rients | +1.240 |
-$ | +1.240 |
Neg logit contributions | |
assian | -1.656 |
hower | -1.618 |
orah | -1.569 |
oops | -1.566 |
hari | -1.565 |
Token | 138 |
Token ID | 20107 |
Feature activation | -6.83e-01 |
Pos logit contributions | |
llor | +2.921 |
zag | +2.846 |
-$ | +2.830 |
rients | +2.778 |
cling | +2.764 |
Neg logit contributions | |
assian | -4.376 |
hower | -4.279 |
orah | -4.167 |
hari | -4.161 |
oops | -4.125 |
Token | s |
Token ID | 82 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
assian | +2.827 |
oops | +2.698 |
hower | +2.687 |
orah | +2.676 |
hari | +2.648 |
Neg logit contributions | |
llor | -2.389 |
distingu | -2.308 |
zag | -2.275 |
rients | -2.247 |
cling | -2.235 |
Token | )} |
Token ID | 38165 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
llor | +0.975 |
-$ | +0.919 |
zag | +0.919 |
cling | +0.906 |
rients | +0.902 |
Neg logit contributions | |
assian | -1.466 |
hower | -1.450 |
orah | -1.403 |
hari | -1.392 |
oops | -1.376 |
Token | Q |
Token ID | 1195 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
llor | +1.183 |
zag | +1.137 |
cling | +1.116 |
-$ | +1.114 |
rients | +1.110 |
Neg logit contributions | |
assian | -1.731 |
hower | -1.691 |
orah | -1.653 |
oops | -1.640 |
hari | -1.638 |
Token | c |
Token ID | 66 |
Feature activation | +8.61e-02 |
Pos logit contributions | |
assian | +0.960 |
hower | +0.938 |
orah | +0.923 |
oops | +0.918 |
hari | +0.914 |
Neg logit contributions | |
llor | -0.524 |
zag | -0.496 |
rients | -0.488 |
cling | -0.487 |
-$ | -0.480 |
Token | 7 |
Token ID | 22 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
llor | +0.227 |
zag | +0.218 |
-$ | +0.213 |
cling | +0.212 |
rients | +0.209 |
Neg logit contributions | |
assian | -0.431 |
hower | -0.424 |
orah | -0.412 |
hari | -0.412 |
oops | -0.408 |
Token | { |
Token ID | 1391 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
llor | +0.775 |
-$ | +0.741 |
zag | +0.738 |
cling | +0.726 |
rients | +0.718 |
Neg logit contributions | |
assian | -1.397 |
hower | -1.383 |
orah | -1.345 |
hari | -1.339 |
oops | -1.333 |
Token | ( |
Token ID | 7 |
Feature activation | +6.53e-01 |
Pos logit contributions | |
llor | +0.382 |
zag | +0.361 |
-$ | +0.358 |
cling | +0.356 |
rients | +0.351 |
Neg logit contributions | |
assian | -0.752 |
hower | -0.744 |
orah | -0.723 |
hari | -0.718 |
oops | -0.712 |
Token | 33 |
Token ID | 2091 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
llor | +1.928 |
zag | +1.869 |
-$ | +1.846 |
rients | +1.822 |
cling | +1.818 |
Neg logit contributions | |
assian | -3.009 |
hower | -2.941 |
orah | -2.875 |
hari | -2.857 |
oops | -2.841 |
Token | s |
Token ID | 82 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
llor | +0.041 |
zag | +0.039 |
cling | +0.039 |
rients | +0.038 |
distingu | +0.038 |
Neg logit contributions | |
assian | -0.049 |
hower | -0.047 |
oops | -0.047 |
orah | -0.047 |
hari | -0.046 |
Token | )} |
Token ID | 38165 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
llor | +0.450 |
zag | +0.427 |
-$ | +0.423 |
cling | +0.421 |
rients | +0.419 |
Neg logit contributions | |
assian | -0.645 |
hower | -0.635 |
orah | -0.617 |
hari | -0.611 |
oops | -0.607 |
Token | thy |
Token ID | 20057 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
llor | +1.740 |
zag | +1.688 |
cling | +1.667 |
-$ | +1.657 |
rients | +1.646 |
Neg logit contributions | |
assian | -2.075 |
hower | -2.053 |
orah | -1.977 |
hari | -1.945 |
oops | -1.942 |
Token | ph |
Token ID | 872 |
Feature activation | -4.29e-01 |
Pos logit contributions | |
llor | +0.985 |
cling | +0.941 |
zag | +0.940 |
-$ | +0.934 |
rients | +0.932 |
Neg logit contributions | |
assian | -1.023 |
hower | -0.998 |
orah | -0.969 |
hari | -0.969 |
oops | -0.955 |
Token | allic |
Token ID | 18196 |
Feature activation | -5.81e-01 |
Pos logit contributions | |
assian | +1.368 |
hower | +1.328 |
orah | +1.284 |
oops | +1.268 |
hari | +1.267 |
Neg logit contributions | |
llor | -1.913 |
zag | -1.850 |
cling | -1.831 |
rients | -1.830 |
-$ | -1.818 |
Token | idol |
Token ID | 21580 |
Feature activation | -1.87e-01 |
Pos logit contributions | |
assian | +2.159 |
hower | +2.091 |
orah | +2.046 |
oops | +2.029 |
hari | +2.016 |
Neg logit contributions | |
llor | -2.272 |
zag | -2.197 |
cling | -2.163 |
rients | -2.163 |
-$ | -2.142 |
Token | of |
Token ID | 286 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
assian | +0.744 |
hower | +0.727 |
orah | +0.705 |
hari | +0.700 |
oops | +0.697 |
Neg logit contributions | |
llor | -0.684 |
zag | -0.659 |
rients | -0.651 |
cling | -0.651 |
-$ | -0.647 |
Token | sod |
Token ID | 32581 |
Feature activation | +8.53e-02 |
Pos logit contributions | |
assian | +1.068 |
hower | +1.038 |
orah | +1.016 |
oops | +1.011 |
hari | +1.001 |
Neg logit contributions | |
llor | -0.996 |
zag | -0.956 |
rients | -0.943 |
cling | -0.942 |
-$ | -0.934 |
Token | omy |
Token ID | 9145 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
llor | +0.315 |
zag | +0.307 |
cling | +0.304 |
rients | +0.302 |
-$ | +0.297 |
Neg logit contributions | |
assian | -0.334 |
hower | -0.328 |
orah | -0.318 |
hari | -0.316 |
oops | -0.313 |
Token | � |
Token ID | 447 |
Feature activation | +5.83e-02 |
Pos logit contributions | |
assian | +0.929 |
hower | +0.904 |
orah | +0.885 |
oops | +0.878 |
hari | +0.876 |
Neg logit contributions | |
llor | -0.765 |
zag | -0.734 |
cling | -0.724 |
rients | -0.723 |
-$ | -0.717 |
Token | � |
Token ID | 251 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
llor | +0.264 |
zag | +0.255 |
rients | +0.253 |
cling | +0.253 |
-$ | +0.251 |
Neg logit contributions | |
assian | -0.182 |
hower | -0.175 |
orah | -0.170 |
oops | -0.168 |
hari | -0.167 |
Token | and |
Token ID | 290 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
llor | +1.292 |
cling | +1.234 |
zag | +1.232 |
-$ | +1.213 |
rients | +1.212 |
Neg logit contributions | |
assian | -1.605 |
hower | -1.557 |
orah | -1.531 |
hari | -1.493 |
oops | -1.492 |
Token | his |
Token ID | 465 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
assian | +0.460 |
hower | +0.447 |
orah | +0.436 |
oops | +0.432 |
hari | +0.431 |
Neg logit contributions | |
llor | -0.485 |
zag | -0.468 |
cling | -0.462 |
rients | -0.461 |
-$ | -0.457 |
Token | ms |
Token ID | 907 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
assian | +1.258 |
hower | +1.213 |
orah | +1.185 |
oops | +1.175 |
hari | +1.170 |
Neg logit contributions | |
llor | -1.584 |
zag | -1.530 |
cling | -1.513 |
rients | -1.512 |
-$ | -1.500 |
Token | was |
Token ID | 373 |
Feature activation | +5.54e-01 |
Pos logit contributions | |
llor | +1.124 |
zag | +1.074 |
cling | +1.056 |
-$ | +1.050 |
rients | +1.049 |
Neg logit contributions | |
assian | -1.321 |
hower | -1.288 |
orah | -1.254 |
oops | -1.251 |
hari | -1.244 |
Token | still |
Token ID | 991 |
Feature activation | +3.26e-01 |
Pos logit contributions | |
llor | +1.963 |
zag | +1.876 |
cling | +1.848 |
-$ | +1.841 |
rients | +1.839 |
Neg logit contributions | |
assian | -2.273 |
hower | -2.231 |
oops | -2.160 |
orah | -2.147 |
hari | -2.138 |
Token | alive |
Token ID | 6776 |
Feature activation | +6.36e-03 |
Pos logit contributions | |
llor | +1.188 |
zag | +1.142 |
cling | +1.126 |
rients | +1.124 |
-$ | +1.117 |
Neg logit contributions | |
assian | -1.304 |
hower | -1.272 |
orah | -1.237 |
oops | -1.234 |
hari | -1.224 |
Token | - |
Token ID | 532 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
llor | +0.019 |
zag | +0.019 |
rients | +0.018 |
cling | +0.018 |
-$ | +0.018 |
Neg logit contributions | |
assian | -0.029 |
hower | -0.029 |
orah | -0.028 |
hari | -0.028 |
oops | -0.028 |
Token | a |
Token ID | 257 |
Feature activation | +9.52e-02 |
Pos logit contributions | |
assian | +0.471 |
hower | +0.455 |
orah | +0.447 |
oops | +0.443 |
hari | +0.442 |
Neg logit contributions | |
llor | -0.466 |
zag | -0.448 |
cling | -0.444 |
rients | -0.444 |
-$ | -0.438 |
Token | music |
Token ID | 2647 |
Feature activation | +5.91e-02 |
Pos logit contributions | |
llor | +0.353 |
zag | +0.340 |
rients | +0.335 |
cling | +0.335 |
-$ | +0.332 |
Neg logit contributions | |
assian | -0.375 |
hower | -0.364 |
orah | -0.356 |
oops | -0.353 |
hari | -0.352 |
Token | critic |
Token ID | 4014 |
Feature activation | +8.71e-02 |
Pos logit contributions | |
llor | +0.198 |
zag | +0.189 |
cling | +0.186 |
rients | +0.185 |
-$ | +0.185 |
Neg logit contributions | |
assian | -0.253 |
hower | -0.247 |
orah | -0.242 |
oops | -0.241 |
hari | -0.240 |
Token | for |
Token ID | 329 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
llor | +0.335 |
zag | +0.323 |
cling | +0.318 |
rients | +0.317 |
-$ | +0.317 |
Neg logit contributions | |
assian | -0.329 |
hower | -0.322 |
orah | -0.312 |
oops | -0.311 |
hari | -0.309 |
Token | the |
Token ID | 262 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
assian | +0.700 |
hower | +0.680 |
orah | +0.666 |
oops | +0.661 |
hari | +0.659 |
Neg logit contributions | |
llor | -0.606 |
zag | -0.582 |
cling | -0.575 |
rients | -0.574 |
-$ | -0.567 |
Token | New |
Token ID | 968 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
llor | +0.339 |
zag | +0.324 |
cling | +0.319 |
rients | +0.319 |
-$ | +0.316 |
Neg logit contributions | |
assian | -0.447 |
hower | -0.436 |
orah | -0.427 |
oops | -0.424 |
hari | -0.422 |
Token | being |
Token ID | 852 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
llor | +0.811 |
zag | +0.782 |
cling | +0.771 |
rients | +0.768 |
-$ | +0.767 |
Neg logit contributions | |
assian | -0.919 |
hower | -0.895 |
orah | -0.872 |
oops | -0.867 |
hari | -0.865 |
Token | told |
Token ID | 1297 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
assian | +0.847 |
hower | +0.822 |
orah | +0.806 |
oops | +0.798 |
hari | +0.796 |
Neg logit contributions | |
llor | -0.859 |
zag | -0.825 |
rients | -0.816 |
cling | -0.813 |
-$ | -0.802 |
Token | that |
Token ID | 326 |
Feature activation | -8.57e-02 |
Pos logit contributions | |
llor | +0.521 |
zag | +0.502 |
rients | +0.495 |
cling | +0.493 |
-$ | +0.487 |
Neg logit contributions | |
assian | -0.586 |
hower | -0.570 |
orah | -0.560 |
oops | -0.556 |
hari | -0.551 |
Token | they |
Token ID | 484 |
Feature activation | -8.37e-02 |
Pos logit contributions | |
assian | +0.321 |
hower | +0.311 |
orah | +0.306 |
oops | +0.305 |
hari | +0.300 |
Neg logit contributions | |
llor | -0.332 |
zag | -0.320 |
rients | -0.315 |
cling | -0.314 |
-$ | -0.309 |
Token | need |
Token ID | 761 |
Feature activation | +9.85e-03 |
Pos logit contributions | |
assian | +0.365 |
hower | +0.356 |
orah | +0.349 |
oops | +0.347 |
hari | +0.345 |
Neg logit contributions | |
llor | -0.275 |
zag | -0.263 |
rients | -0.259 |
cling | -0.258 |
-$ | -0.255 |
Token | to |
Token ID | 284 |
Feature activation | +8.69e-01 |
Pos logit contributions | |
llor | +0.033 |
zag | +0.031 |
rients | +0.031 |
cling | +0.031 |
-$ | +0.030 |
Neg logit contributions | |
assian | -0.042 |
hower | -0.041 |
orah | -0.040 |
oops | -0.040 |
hari | -0.040 |
Token | stop |
Token ID | 2245 |
Feature activation | +2.57e-02 |
Pos logit contributions | |
llor | +2.973 |
zag | +2.852 |
-$ | +2.843 |
cling | +2.830 |
rients | +2.785 |
Neg logit contributions | |
assian | -3.644 |
hower | -3.552 |
hari | -3.450 |
oops | -3.424 |
orah | -3.390 |
Token | displaying |
Token ID | 19407 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
llor | +0.106 |
zag | +0.102 |
rients | +0.101 |
cling | +0.101 |
-$ | +0.100 |
Neg logit contributions | |
assian | -0.090 |
hower | -0.087 |
orah | -0.085 |
oops | -0.085 |
hari | -0.084 |
Token | the |
Token ID | 262 |
Feature activation | -5.11e-02 |
Pos logit contributions | |
assian | +1.165 |
hower | +1.127 |
orah | +1.119 |
oops | +1.112 |
hari | +1.086 |
Neg logit contributions | |
llor | -1.121 |
zag | -1.073 |
rients | -1.063 |
cling | -1.056 |
-$ | -1.035 |
Token | Olympic |
Token ID | 11514 |
Feature activation | +7.39e-02 |
Pos logit contributions | |
assian | +0.210 |
hower | +0.205 |
orah | +0.201 |
oops | +0.200 |
hari | +0.197 |
Neg logit contributions | |
llor | -0.179 |
zag | -0.172 |
rients | -0.170 |
cling | -0.170 |
-$ | -0.167 |
Token | rings |
Token ID | 13917 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
llor | +0.269 |
zag | +0.259 |
cling | +0.255 |
rients | +0.255 |
-$ | +0.253 |
Neg logit contributions | |
assian | -0.296 |
hower | -0.288 |
orah | -0.281 |
oops | -0.279 |
hari | -0.278 |
Token | . |
Token ID | 13 |
Feature activation | +3.46e-01 |
Pos logit contributions | |
assian | +1.242 |
hower | +1.214 |
orah | +1.189 |
oops | +1.182 |
hari | +1.177 |
Neg logit contributions | |
llor | -0.928 |
zag | -0.889 |
rients | -0.877 |
cling | -0.876 |
-$ | -0.862 |
Token | Lenin |
Token ID | 22899 |
Feature activation | +3.85e-01 |
Pos logit contributions | |
llor | +1.228 |
zag | +1.168 |
cling | +1.159 |
rients | +1.159 |
-$ | +1.157 |
Neg logit contributions | |
assian | -1.416 |
hower | -1.375 |
orah | -1.338 |
hari | -1.336 |
oops | -1.332 |
Token | was |
Token ID | 373 |
Feature activation | +6.96e-01 |
Pos logit contributions | |
llor | +1.303 |
zag | +1.243 |
cling | +1.226 |
rients | +1.226 |
-$ | +1.220 |
Neg logit contributions | |
assian | -1.644 |
hower | -1.593 |
orah | -1.559 |
oops | -1.551 |
hari | -1.545 |
Token | retired |
Token ID | 9880 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
llor | +2.508 |
zag | +2.377 |
cling | +2.364 |
-$ | +2.356 |
rients | +2.350 |
Neg logit contributions | |
assian | -2.836 |
hower | -2.755 |
oops | -2.669 |
orah | -2.663 |
hari | -2.651 |
Token | in |
Token ID | 287 |
Feature activation | +3.66e-01 |
Pos logit contributions | |
llor | +0.738 |
zag | +0.707 |
cling | +0.697 |
rients | +0.696 |
-$ | +0.690 |
Neg logit contributions | |
assian | -0.941 |
hower | -0.916 |
orah | -0.897 |
oops | -0.891 |
hari | -0.888 |
Token | 1989 |
Token ID | 11104 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
llor | +1.021 |
zag | +0.976 |
cling | +0.954 |
rients | +0.951 |
-$ | +0.949 |
Neg logit contributions | |
assian | -1.780 |
hower | -1.738 |
orah | -1.701 |
hari | -1.694 |
oops | -1.692 |
Token | and |
Token ID | 290 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
assian | +1.558 |
hower | +1.519 |
orah | +1.489 |
oops | +1.475 |
hari | +1.469 |
Neg logit contributions | |
llor | -1.258 |
zag | -1.211 |
rients | -1.196 |
cling | -1.192 |
-$ | -1.171 |
Token | is |
Token ID | 318 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
llor | +0.766 |
zag | +0.732 |
rients | +0.723 |
cling | +0.722 |
-$ | +0.717 |
Neg logit contributions | |
assian | -0.907 |
hower | -0.881 |
orah | -0.862 |
oops | -0.857 |
hari | -0.855 |
Token | now |
Token ID | 783 |
Feature activation | -3.35e-01 |
Pos logit contributions | |
llor | +0.620 |
zag | +0.596 |
cling | +0.589 |
rients | +0.588 |
-$ | +0.584 |
Neg logit contributions | |
assian | -0.648 |
hower | -0.630 |
orah | -0.614 |
oops | -0.611 |
hari | -0.608 |
Token | a |
Token ID | 257 |
Feature activation | -2.84e-02 |
Pos logit contributions | |
assian | +1.314 |
hower | +1.282 |
orah | +1.265 |
oops | +1.243 |
hari | +1.240 |
Neg logit contributions | |
llor | -1.230 |
zag | -1.191 |
cling | -1.164 |
rients | -1.164 |
-$ | -1.151 |
Token | museum |
Token ID | 13257 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
assian | +0.116 |
hower | +0.113 |
orah | +0.111 |
oops | +0.110 |
hari | +0.109 |
Neg logit contributions | |
llor | -0.101 |
zag | -0.097 |
rients | -0.095 |
cling | -0.095 |
-$ | -0.094 |
Token | telling |
Token ID | 5149 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
assian | +0.553 |
hower | +0.536 |
orah | +0.521 |
oops | +0.517 |
hari | +0.514 |
Neg logit contributions | |
llor | -0.679 |
zag | -0.657 |
cling | -0.649 |
rients | -0.648 |
-$ | -0.644 |
Token | us |
Token ID | 514 |
Feature activation | -5.70e-01 |
Pos logit contributions | |
llor | +1.252 |
zag | +1.192 |
-$ | +1.167 |
cling | +1.167 |
rients | +1.162 |
Neg logit contributions | |
assian | -1.949 |
hower | -1.908 |
orah | -1.858 |
oops | -1.852 |
hari | -1.841 |
Token | .' |
Token ID | 2637 |
Feature activation | -4.10e-01 |
Pos logit contributions | |
assian | +2.422 |
hower | +2.355 |
orah | +2.313 |
oops | +2.296 |
hari | +2.291 |
Neg logit contributions | |
llor | -1.925 |
zag | -1.853 |
rients | -1.826 |
cling | -1.822 |
-$ | -1.785 |
Token |
|
Token ID | 198 |
Feature activation | +3.96e-01 |
Pos logit contributions | |
assian | +1.516 |
hower | +1.478 |
hari | +1.436 |
orah | +1.436 |
oops | +1.433 |
Neg logit contributions | |
llor | -1.597 |
zag | -1.539 |
rients | -1.524 |
cling | -1.523 |
-$ | -1.502 |
Token |
|
Token ID | 198 |
Feature activation | +3.40e-01 |
Pos logit contributions | |
llor | +1.336 |
-$ | +1.297 |
zag | +1.286 |
cling | +1.277 |
rients | +1.260 |
Neg logit contributions | |
assian | -1.679 |
hower | -1.662 |
orah | -1.584 |
hari | -1.574 |
oops | -1.570 |
Token | Scroll |
Token ID | 29261 |
Feature activation | -5.74e-01 |
Pos logit contributions | |
llor | +1.106 |
zag | +1.076 |
-$ | +1.075 |
cling | +1.062 |
rients | +1.040 |
Neg logit contributions | |
assian | -1.480 |
hower | -1.476 |
orah | -1.412 |
hari | -1.377 |
oops | -1.365 |
Token | down |
Token ID | 866 |
Feature activation | +5.85e-01 |
Pos logit contributions | |
assian | +1.568 |
hower | +1.504 |
orah | +1.469 |
oops | +1.450 |
hari | +1.444 |
Neg logit contributions | |
llor | -2.798 |
zag | -2.723 |
rients | -2.696 |
cling | -2.684 |
-$ | -2.665 |
Token | for |
Token ID | 329 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
llor | +2.016 |
zag | +1.954 |
cling | +1.919 |
-$ | +1.903 |
rients | +1.901 |
Neg logit contributions | |
assian | -2.452 |
hower | -2.379 |
orah | -2.343 |
oops | -2.306 |
hari | -2.298 |
Token | video |
Token ID | 2008 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
assian | +0.760 |
hower | +0.745 |
orah | +0.731 |
oops | +0.729 |
hari | +0.727 |
Neg logit contributions | |
llor | -0.381 |
zag | -0.360 |
rients | -0.352 |
cling | -0.352 |
-$ | -0.348 |
Token |
|
Token ID | 198 |
Feature activation | +4.79e-01 |
Pos logit contributions | |
assian | +0.663 |
hower | +0.646 |
orah | +0.627 |
oops | +0.626 |
hari | +0.623 |
Neg logit contributions | |
llor | -0.697 |
zag | -0.667 |
cling | -0.663 |
rients | -0.663 |
-$ | -0.653 |
Token |
|
Token ID | 198 |
Feature activation | +6.24e-01 |
Pos logit contributions | |
llor | +1.581 |
-$ | +1.542 |
zag | +1.525 |
cling | +1.516 |
rients | +1.493 |
Neg logit contributions | |
assian | -2.048 |
hower | -2.033 |
orah | -1.933 |
hari | -1.926 |
oops | -1.912 |
Token | one |
Token ID | 530 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
llor | +1.526 |
zag | +1.473 |
-$ | +1.455 |
cling | +1.455 |
rients | +1.449 |
Neg logit contributions | |
assian | -1.893 |
hower | -1.848 |
orah | -1.808 |
oops | -1.793 |
hari | -1.792 |
Token | , |
Token ID | 11 |
Feature activation | -2.89e-02 |
Pos logit contributions | |
llor | +0.731 |
zag | +0.700 |
-$ | +0.690 |
cling | +0.689 |
rients | +0.688 |
Neg logit contributions | |
assian | -0.978 |
hower | -0.952 |
orah | -0.935 |
oops | -0.928 |
hari | -0.926 |
Token | then |
Token ID | 788 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
assian | +0.116 |
hower | +0.113 |
orah | +0.110 |
oops | +0.109 |
hari | +0.109 |
Neg logit contributions | |
llor | -0.105 |
zag | -0.101 |
cling | -0.100 |
rients | -0.100 |
-$ | -0.099 |
Token | to |
Token ID | 284 |
Feature activation | +4.94e-01 |
Pos logit contributions | |
llor | +1.282 |
zag | +1.240 |
cling | +1.218 |
-$ | +1.216 |
rients | +1.215 |
Neg logit contributions | |
assian | -1.497 |
hower | -1.462 |
orah | -1.425 |
oops | -1.420 |
hari | -1.414 |
Token | use |
Token ID | 779 |
Feature activation | -2.69e-01 |
Pos logit contributions | |
llor | +1.721 |
zag | +1.671 |
cling | +1.642 |
-$ | +1.641 |
rients | +1.629 |
Neg logit contributions | |
assian | -2.034 |
hower | -1.986 |
orah | -1.932 |
oops | -1.930 |
hari | -1.921 |
Token | it |
Token ID | 340 |
Feature activation | -7.48e-01 |
Pos logit contributions | |
assian | +1.061 |
hower | +1.032 |
orah | +1.011 |
oops | +1.002 |
hari | +0.994 |
Neg logit contributions | |
llor | -0.994 |
zag | -0.951 |
rients | -0.937 |
cling | -0.935 |
-$ | -0.917 |
Token | , |
Token ID | 11 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
assian | +3.059 |
hower | +2.992 |
orah | +2.929 |
hari | +2.880 |
oops | +2.869 |
Neg logit contributions | |
llor | -2.592 |
zag | -2.484 |
rients | -2.464 |
cling | -2.451 |
distingu | -2.395 |
Token | which |
Token ID | 543 |
Feature activation | -4.89e-01 |
Pos logit contributions | |
assian | +0.455 |
hower | +0.443 |
orah | +0.434 |
oops | +0.430 |
hari | +0.429 |
Neg logit contributions | |
llor | -0.421 |
zag | -0.405 |
rients | -0.399 |
cling | -0.399 |
-$ | -0.395 |
Token | often |
Token ID | 1690 |
Feature activation | -9.27e-01 |
Pos logit contributions | |
assian | +1.914 |
hower | +1.872 |
orah | +1.827 |
oops | +1.822 |
hari | +1.800 |
Neg logit contributions | |
llor | -1.785 |
zag | -1.738 |
cling | -1.698 |
rients | -1.691 |
-$ | -1.653 |
Token | requires |
Token ID | 4433 |
Feature activation | -6.89e-01 |
Pos logit contributions | |
assian | +3.298 |
hower | +3.190 |
orah | +3.148 |
oops | +3.111 |
hari | +3.070 |
Neg logit contributions | |
llor | -3.693 |
zag | -3.592 |
cling | -3.498 |
rients | -3.469 |
distingu | -3.391 |
Token | transportation |
Token ID | 9358 |
Feature activation | +5.03e-01 |
Pos logit contributions | |
assian | +2.678 |
hower | +2.588 |
orah | +2.553 |
oops | +2.517 |
hari | +2.508 |
Neg logit contributions | |
llor | -2.560 |
zag | -2.437 |
rients | -2.420 |
cling | -2.399 |
-$ | -2.324 |
Token |
|
Token ID | 198 |
Feature activation | +9.30e-02 |
Pos logit contributions | |
llor | +0.375 |
zag | +0.361 |
-$ | +0.357 |
cling | +0.356 |
rients | +0.354 |
Neg logit contributions | |
assian | -0.426 |
hower | -0.418 |
orah | -0.404 |
oops | -0.400 |
hari | -0.400 |
Token | " |
Token ID | 1 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
llor | +0.248 |
zag | +0.237 |
-$ | +0.233 |
cling | +0.232 |
rients | +0.228 |
Neg logit contributions | |
assian | -0.464 |
hower | -0.456 |
orah | -0.444 |
hari | -0.441 |
oops | -0.436 |
Token | But |
Token ID | 1537 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
assian | +4.503 |
oops | +4.383 |
hower | +4.375 |
orah | +4.311 |
hari | +4.239 |
Neg logit contributions | |
llor | -4.512 |
zag | -4.315 |
distingu | -4.314 |
rients | -4.314 |
cling | -4.262 |
Token | when |
Token ID | 618 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
llor | +0.844 |
zag | +0.810 |
-$ | +0.798 |
cling | +0.798 |
rients | +0.794 |
Neg logit contributions | |
assian | -0.906 |
hower | -0.869 |
orah | -0.853 |
hari | -0.850 |
oops | -0.842 |
Token | they |
Token ID | 484 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
llor | +0.857 |
zag | +0.821 |
cling | +0.814 |
-$ | +0.810 |
rients | +0.809 |
Neg logit contributions | |
assian | -0.883 |
hower | -0.848 |
orah | -0.838 |
hari | -0.829 |
oops | -0.823 |
Token | first |
Token ID | 717 |
Feature activation | -4.82e-01 |
Pos logit contributions | |
assian | +0.656 |
hower | +0.638 |
orah | +0.623 |
oops | +0.618 |
hari | +0.617 |
Neg logit contributions | |
llor | -0.611 |
zag | -0.587 |
cling | -0.580 |
rients | -0.577 |
-$ | -0.575 |
Token | met |
Token ID | 1138 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
assian | +1.779 |
hower | +1.725 |
orah | +1.684 |
oops | +1.670 |
hari | +1.663 |
Neg logit contributions | |
llor | -1.907 |
zag | -1.840 |
rients | -1.817 |
cling | -1.816 |
-$ | -1.799 |
Token | , |
Token ID | 11 |
Feature activation | +6.95e-02 |
Pos logit contributions | |
assian | +0.741 |
hower | +0.719 |
orah | +0.704 |
oops | +0.700 |
hari | +0.698 |
Neg logit contributions | |
llor | -0.637 |
zag | -0.610 |
cling | -0.601 |
rients | -0.599 |
-$ | -0.597 |
Token | and |
Token ID | 290 |
Feature activation | -1.81e-02 |
Pos logit contributions | |
llor | +0.258 |
zag | +0.247 |
cling | +0.243 |
-$ | +0.243 |
rients | +0.242 |
Neg logit contributions | |
assian | -0.276 |
hower | -0.265 |
orah | -0.261 |
hari | -0.259 |
oops | -0.257 |
Token | O |
Token ID | 440 |
Feature activation | -6.60e-01 |
Pos logit contributions | |
assian | +0.071 |
hower | +0.069 |
orah | +0.068 |
hari | +0.067 |
oops | +0.067 |
Neg logit contributions | |
llor | -0.067 |
zag | -0.064 |
cling | -0.063 |
-$ | -0.063 |
rients | -0.063 |
Token | ' |
Token ID | 6 |
Feature activation | -3.06e-01 |
Pos logit contributions | |
assian | +3.459 |
hower | +3.381 |
orah | +3.367 |
oops | +3.353 |
hari | +3.315 |
Neg logit contributions | |
llor | -1.541 |
zag | -1.460 |
distingu | -1.451 |
rients | -1.435 |
cling | -1.426 |
Token | Prim |
Token ID | 23828 |
Feature activation | -5.94e-01 |
Pos logit contributions | |
llor | +0.227 |
zag | +0.219 |
cling | +0.215 |
rients | +0.214 |
-$ | +0.213 |
Neg logit contributions | |
assian | -0.293 |
hower | -0.286 |
orah | -0.279 |
hari | -0.276 |
oops | -0.276 |
Token | al |
Token ID | 282 |
Feature activation | -4.61e-01 |
Pos logit contributions | |
assian | +2.264 |
hower | +2.186 |
orah | +2.155 |
oops | +2.134 |
hari | +2.130 |
Neg logit contributions | |
llor | -2.258 |
zag | -2.175 |
cling | -2.153 |
rients | -2.151 |
-$ | -2.136 |
Token | Druid |
Token ID | 32685 |
Feature activation | -4.61e-01 |
Pos logit contributions | |
assian | +2.070 |
hower | +2.023 |
orah | +1.981 |
oops | +1.964 |
hari | +1.961 |
Neg logit contributions | |
llor | -1.439 |
zag | -1.375 |
cling | -1.353 |
rients | -1.352 |
distingu | -1.336 |
Token | vs |
Token ID | 3691 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
assian | +2.362 |
hower | +2.305 |
orah | +2.271 |
oops | +2.258 |
hari | +2.255 |
Neg logit contributions | |
llor | -1.141 |
zag | -1.083 |
cling | -1.063 |
rients | -1.057 |
-$ | -1.037 |
Token | Er |
Token ID | 5256 |
Feature activation | -4.89e-01 |
Pos logit contributions | |
llor | +1.982 |
zag | +1.907 |
cling | +1.872 |
rients | +1.869 |
-$ | +1.865 |
Neg logit contributions | |
assian | -2.266 |
hower | -2.216 |
orah | -2.156 |
oops | -2.135 |
hari | -2.131 |
Token | t |
Token ID | 83 |
Feature activation | -4.73e-01 |
Pos logit contributions | |
assian | +2.072 |
hower | +2.001 |
orah | +1.972 |
hari | +1.946 |
oops | +1.943 |
Neg logit contributions | |
llor | -1.666 |
zag | -1.579 |
rients | -1.573 |
-$ | -1.569 |
distingu | -1.562 |
Token | ai |
Token ID | 1872 |
Feature activation | -6.77e-01 |
Pos logit contributions | |
assian | +1.773 |
hower | +1.718 |
orah | +1.682 |
oops | +1.661 |
hari | +1.658 |
Neg logit contributions | |
llor | -1.839 |
zag | -1.775 |
cling | -1.754 |
rients | -1.753 |
-$ | -1.743 |
Token | , |
Token ID | 11 |
Feature activation | +2.23e-02 |
Pos logit contributions | |
assian | +2.752 |
hower | +2.670 |
orah | +2.618 |
hari | +2.597 |
oops | +2.586 |
Neg logit contributions | |
llor | -2.394 |
zag | -2.308 |
rients | -2.283 |
cling | -2.278 |
-$ | -2.262 |
Token | Wizard |
Token ID | 16884 |
Feature activation | -3.34e-01 |
Pos logit contributions | |
llor | +0.083 |
zag | +0.079 |
cling | +0.078 |
rients | +0.078 |
-$ | +0.077 |
Neg logit contributions | |
assian | -0.088 |
hower | -0.086 |
orah | -0.084 |
oops | -0.083 |
hari | -0.083 |
Token | Ad |
Token ID | 1215 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
assian | +1.239 |
hower | +1.198 |
orah | +1.171 |
oops | +1.156 |
hari | +1.155 |
Neg logit contributions | |
llor | -1.303 |
zag | -1.262 |
rients | -1.250 |
cling | -1.248 |
-$ | -1.237 |
Token | ept |
Token ID | 19598 |
Feature activation | -5.12e-01 |
Pos logit contributions | |
assian | +0.415 |
hower | +0.403 |
orah | +0.392 |
oops | +0.388 |
hari | +0.386 |
Neg logit contributions | |
llor | -0.484 |
zag | -0.467 |
rients | -0.461 |
cling | -0.461 |
-$ | -0.457 |
Token | Trump |
Token ID | 1301 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
assian | +0.470 |
hower | +0.457 |
orah | +0.446 |
oops | +0.443 |
hari | +0.443 |
Neg logit contributions | |
llor | -0.471 |
zag | -0.454 |
rients | -0.449 |
cling | -0.448 |
-$ | -0.444 |
Token | said |
Token ID | 531 |
Feature activation | -7.37e-02 |
Pos logit contributions | |
llor | +0.933 |
zag | +0.897 |
cling | +0.882 |
-$ | +0.877 |
rients | +0.877 |
Neg logit contributions | |
assian | -1.137 |
hower | -1.109 |
orah | -1.081 |
oops | -1.075 |
hari | -1.064 |
Token | . |
Token ID | 13 |
Feature activation | -2.08e-01 |
Pos logit contributions | |
assian | +0.295 |
hower | +0.287 |
orah | +0.281 |
oops | +0.279 |
hari | +0.278 |
Neg logit contributions | |
llor | -0.268 |
zag | -0.258 |
cling | -0.254 |
rients | -0.254 |
-$ | -0.252 |
Token |
|
Token ID | 198 |
Feature activation | -3.43e-01 |
Pos logit contributions | |
assian | +0.844 |
hower | +0.820 |
orah | +0.800 |
hari | +0.792 |
oops | +0.792 |
Neg logit contributions | |
llor | -0.748 |
zag | -0.721 |
cling | -0.709 |
rients | -0.708 |
-$ | -0.708 |
Token |
|
Token ID | 198 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
assian | +1.314 |
hower | +1.273 |
orah | +1.250 |
oops | +1.240 |
hari | +1.234 |
Neg logit contributions | |
llor | -1.303 |
zag | -1.255 |
rients | -1.238 |
cling | -1.236 |
distingu | -1.222 |
Token | ' |
Token ID | 6 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
assian | +0.520 |
hower | +0.511 |
orah | +0.495 |
hari | +0.489 |
oops | +0.487 |
Neg logit contributions | |
llor | -0.381 |
zag | -0.366 |
-$ | -0.361 |
cling | -0.361 |
rients | -0.358 |
Token | If |
Token ID | 1532 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
assian | +4.977 |
oops | +4.918 |
orah | +4.759 |
hari | +4.733 |
hower | +4.690 |
Neg logit contributions | |
llor | -5.822 |
distingu | -5.625 |
zag | -5.571 |
rients | -5.541 |
cling | -5.438 |
Token | the |
Token ID | 262 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
assian | +1.218 |
hower | +1.182 |
orah | +1.158 |
oops | +1.152 |
hari | +1.146 |
Neg logit contributions | |
llor | -1.212 |
zag | -1.170 |
rients | -1.156 |
cling | -1.153 |
-$ | -1.139 |
Token | reporting |
Token ID | 6447 |
Feature activation | +1.84e-01 |
Pos logit contributions | |
llor | +0.871 |
zag | +0.845 |
cling | +0.830 |
rients | +0.829 |
-$ | +0.824 |
Neg logit contributions | |
assian | -0.892 |
hower | -0.871 |
orah | -0.847 |
oops | -0.837 |
hari | -0.834 |
Token | is |
Token ID | 318 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
llor | +0.592 |
zag | +0.568 |
rients | +0.560 |
-$ | +0.560 |
cling | +0.559 |
Neg logit contributions | |
assian | -0.812 |
hower | -0.794 |
orah | -0.773 |
oops | -0.768 |
hari | -0.762 |
Token | accurate |
Token ID | 7187 |
Feature activation | +4.00e-01 |
Pos logit contributions | |
llor | +0.075 |
zag | +0.073 |
cling | +0.072 |
rients | +0.072 |
-$ | +0.071 |
Neg logit contributions | |
assian | -0.069 |
hower | -0.067 |
orah | -0.066 |
oops | -0.065 |
hari | -0.065 |
Token | it |
Token ID | 270 |
Feature activation | -2.25e-01 |
Pos logit contributions | |
llor | +1.018 |
zag | +0.982 |
cling | +0.968 |
rients | +0.966 |
-$ | +0.958 |
Neg logit contributions | |
assian | -1.128 |
hower | -1.099 |
orah | -1.074 |
oops | -1.061 |
hari | -1.060 |
Token | -> |
Token ID | 3784 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
assian | +1.078 |
hower | +1.055 |
orah | +1.033 |
oops | +1.026 |
hari | +1.024 |
Neg logit contributions | |
llor | -0.641 |
zag | -0.610 |
cling | -0.599 |
rients | -0.598 |
-$ | -0.595 |
Token | i |
Token ID | 72 |
Feature activation | -6.16e-02 |
Pos logit contributions | |
llor | +0.805 |
zag | +0.778 |
cling | +0.763 |
rients | +0.760 |
-$ | +0.754 |
Neg logit contributions | |
assian | -1.107 |
hower | -1.082 |
orah | -1.059 |
oops | -1.043 |
hari | -1.041 |
Token | () |
Token ID | 3419 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
assian | +0.297 |
hower | +0.289 |
orah | +0.284 |
oops | +0.283 |
hari | +0.282 |
Neg logit contributions | |
llor | -0.174 |
zag | -0.165 |
rients | -0.162 |
cling | -0.162 |
-$ | -0.160 |
Token | == |
Token ID | 6624 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
llor | +0.871 |
zag | +0.845 |
cling | +0.835 |
rients | +0.835 |
-$ | +0.829 |
Neg logit contributions | |
assian | -0.565 |
hower | -0.544 |
orah | -0.528 |
oops | -0.523 |
hari | -0.520 |
Token | count |
Token ID | 954 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
assian | +0.625 |
hower | +0.609 |
orah | +0.598 |
oops | +0.595 |
hari | +0.592 |
Neg logit contributions | |
llor | -0.464 |
zag | -0.443 |
cling | -0.436 |
rients | -0.436 |
-$ | -0.430 |
Token | % |
Token ID | 4064 |
Feature activation | +5.17e-02 |
Pos logit contributions | |
assian | +5.340 |
hower | +5.072 |
oops | +5.023 |
orah | +4.970 |
hari | +4.952 |
Neg logit contributions | |
llor | -5.219 |
zag | -5.018 |
rients | -4.987 |
cling | -4.901 |
distingu | -4.899 |
Token | 5 |
Token ID | 642 |
Feature activation | -3.44e-01 |
Pos logit contributions | |
llor | +0.153 |
zag | +0.146 |
cling | +0.143 |
rients | +0.143 |
-$ | +0.141 |
Neg logit contributions | |
assian | -0.242 |
hower | -0.237 |
orah | -0.232 |
oops | -0.231 |
hari | -0.230 |
Token | ); |
Token ID | 1776 |
Feature activation | -3.24e-01 |
Pos logit contributions | |
assian | +1.441 |
hower | +1.402 |
orah | +1.373 |
oops | +1.363 |
hari | +1.358 |
Neg logit contributions | |
llor | -1.188 |
zag | -1.139 |
cling | -1.122 |
rients | -1.122 |
-$ | -1.111 |
Token | ++ |
Token ID | 19969 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
assian | +1.312 |
hower | +1.270 |
orah | +1.243 |
oops | +1.243 |
hari | +1.235 |
Neg logit contributions | |
llor | -1.164 |
zag | -1.115 |
rients | -1.100 |
cling | -1.099 |
-$ | -1.078 |
Token | count |
Token ID | 9127 |
Feature activation | -6.34e-01 |
Pos logit contributions | |
llor | +1.107 |
zag | +1.072 |
cling | +1.062 |
rients | +1.051 |
-$ | +1.047 |
Neg logit contributions | |
assian | -1.111 |
hower | -1.085 |
orah | -1.057 |
hari | -1.040 |
oops | -1.039 |
Token | who |
Token ID | 508 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
llor | +0.645 |
zag | +0.623 |
cling | +0.621 |
-$ | +0.616 |
rients | +0.611 |
Neg logit contributions | |
assian | -0.637 |
hower | -0.626 |
oops | -0.607 |
orah | -0.600 |
hari | -0.598 |
Token | claim |
Token ID | 1624 |
Feature activation | -5.10e-01 |
Pos logit contributions | |
assian | +0.454 |
hower | +0.442 |
orah | +0.431 |
oops | +0.429 |
hari | +0.427 |
Neg logit contributions | |
llor | -0.382 |
zag | -0.367 |
cling | -0.363 |
rients | -0.361 |
-$ | -0.358 |
Token | to |
Token ID | 284 |
Feature activation | -6.11e-01 |
Pos logit contributions | |
assian | +2.083 |
hower | +2.012 |
orah | +2.002 |
oops | +1.981 |
hari | +1.973 |
Neg logit contributions | |
llor | -1.794 |
zag | -1.711 |
rients | -1.690 |
cling | -1.678 |
-$ | -1.658 |
Token | speak |
Token ID | 2740 |
Feature activation | -7.00e-01 |
Pos logit contributions | |
assian | +2.455 |
orah | +2.384 |
hower | +2.378 |
hari | +2.323 |
oops | +2.321 |
Neg logit contributions | |
llor | -2.181 |
zag | -2.097 |
rients | -2.066 |
cling | -2.030 |
-$ | -2.023 |
Token | and |
Token ID | 290 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
assian | +2.687 |
orah | +2.584 |
hower | +2.579 |
hari | +2.528 |
oran | +2.520 |
Neg logit contributions | |
llor | -2.627 |
zag | -2.521 |
rients | -2.506 |
cling | -2.498 |
-$ | -2.448 |
Token | act |
Token ID | 719 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
assian | +0.666 |
hower | +0.647 |
orah | +0.633 |
oops | +0.629 |
hari | +0.626 |
Neg logit contributions | |
llor | -0.606 |
zag | -0.583 |
cling | -0.575 |
rients | -0.575 |
-$ | -0.569 |
Token | for |
Token ID | 329 |
Feature activation | -2.70e-02 |
Pos logit contributions | |
assian | +5.521 |
orah | +5.295 |
hari | +5.216 |
oran | +5.212 |
hower | +5.092 |
Neg logit contributions | |
llor | -6.278 |
rients | -6.006 |
zag | -5.975 |
cling | -5.963 |
-$ | -5.829 |
Token | the |
Token ID | 262 |
Feature activation | -4.06e-01 |
Pos logit contributions | |
assian | +0.107 |
hower | +0.105 |
orah | +0.101 |
oops | +0.101 |
hari | +0.100 |
Neg logit contributions | |
llor | -0.099 |
zag | -0.097 |
cling | -0.095 |
rients | -0.095 |
-$ | -0.094 |
Token | will |
Token ID | 481 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
assian | +1.526 |
hower | +1.480 |
orah | +1.449 |
oops | +1.435 |
hari | +1.430 |
Neg logit contributions | |
llor | -1.573 |
zag | -1.519 |
cling | -1.498 |
rients | -1.496 |
-$ | -1.484 |
Token | of |
Token ID | 286 |
Feature activation | -4.52e-01 |
Pos logit contributions | |
assian | +3.530 |
hower | +3.378 |
orah | +3.378 |
hari | +3.318 |
oops | +3.272 |
Neg logit contributions | |
llor | -4.256 |
zag | -4.137 |
rients | -4.056 |
cling | -4.014 |
distingu | -3.968 |
Token | their |
Token ID | 511 |
Feature activation | -7.04e-01 |
Pos logit contributions | |
assian | +1.481 |
hower | +1.429 |
orah | +1.400 |
oops | +1.379 |
hari | +1.376 |
Neg logit contributions | |
llor | -1.967 |
zag | -1.897 |
rients | -1.878 |
cling | -1.875 |
-$ | -1.861 |
Token | , |
Token ID | 11 |
Feature activation | -5.31e-01 |
Pos logit contributions | |
llor | +1.403 |
zag | +1.367 |
cling | +1.359 |
rients | +1.345 |
-$ | +1.341 |
Neg logit contributions | |
assian | -1.495 |
hower | -1.455 |
orah | -1.425 |
hari | -1.403 |
oops | -1.398 |
Token | and |
Token ID | 290 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
assian | +2.034 |
hower | +1.971 |
orah | +1.932 |
oops | +1.917 |
hari | +1.914 |
Neg logit contributions | |
llor | -2.016 |
zag | -1.936 |
rients | -1.919 |
cling | -1.912 |
-$ | -1.898 |
Token | as |
Token ID | 355 |
Feature activation | -9.74e-02 |
Pos logit contributions | |
assian | +0.637 |
hower | +0.618 |
orah | +0.603 |
oops | +0.599 |
hari | +0.596 |
Neg logit contributions | |
llor | -0.680 |
zag | -0.657 |
cling | -0.647 |
rients | -0.647 |
-$ | -0.642 |
Token | a |
Token ID | 257 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
assian | +0.398 |
hower | +0.388 |
orah | +0.379 |
oops | +0.377 |
hari | +0.375 |
Neg logit contributions | |
llor | -0.347 |
zag | -0.333 |
cling | -0.328 |
rients | -0.328 |
-$ | -0.325 |
Token | reward |
Token ID | 6721 |
Feature activation | -8.66e-01 |
Pos logit contributions | |
llor | +0.069 |
zag | +0.066 |
cling | +0.065 |
rients | +0.065 |
-$ | +0.065 |
Neg logit contributions | |
assian | -0.070 |
hower | -0.069 |
oops | -0.067 |
orah | -0.066 |
hari | -0.066 |
Token | for |
Token ID | 329 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
assian | +3.216 |
hower | +3.122 |
orah | +3.091 |
hari | +3.023 |
oops | +3.011 |
Neg logit contributions | |
llor | -3.311 |
zag | -3.183 |
cling | -3.182 |
rients | -3.178 |
-$ | -3.091 |
Token | his |
Token ID | 465 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
assian | +4.360 |
orah | +4.227 |
hower | +4.147 |
oops | +4.104 |
oran | +4.059 |
Neg logit contributions | |
llor | -6.243 |
rients | -6.034 |
zag | -5.921 |
cling | -5.867 |
-$ | -5.814 |
Token | hard |
Token ID | 1327 |
Feature activation | -7.49e-01 |
Pos logit contributions | |
assian | +4.001 |
hower | +3.848 |
orah | +3.820 |
oops | +3.720 |
oran | +3.643 |
Neg logit contributions | |
llor | -5.579 |
rients | -5.363 |
zag | -5.319 |
cling | -5.266 |
-$ | -5.213 |
Token | work |
Token ID | 670 |
Feature activation | -9.81e-01 |
Pos logit contributions | |
assian | +2.637 |
hower | +2.546 |
orah | +2.488 |
oops | +2.464 |
hari | +2.452 |
Neg logit contributions | |
llor | -3.091 |
zag | -2.970 |
rients | -2.945 |
cling | -2.929 |
-$ | -2.905 |
Token | and |
Token ID | 290 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
assian | +3.651 |
hower | +3.510 |
orah | +3.492 |
hari | +3.425 |
oops | +3.385 |
Neg logit contributions | |
llor | -3.761 |
rients | -3.571 |
zag | -3.557 |
cling | -3.551 |
-$ | -3.479 |
Token | diligence |
Token ID | 34136 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
assian | +0.785 |
hower | +0.761 |
orah | +0.739 |
oops | +0.735 |
hari | +0.733 |
Neg logit contributions | |
llor | -0.913 |
zag | -0.885 |
cling | -0.874 |
rients | -0.871 |
-$ | -0.867 |
Token | private |
Token ID | 2839 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
assian | +0.072 |
hower | +0.070 |
orah | +0.068 |
oops | +0.068 |
hari | +0.068 |
Neg logit contributions | |
llor | -0.072 |
zag | -0.069 |
cling | -0.068 |
rients | -0.068 |
-$ | -0.068 |
Token | company |
Token ID | 1664 |
Feature activation | +5.37e-01 |
Pos logit contributions | |
llor | +0.589 |
zag | +0.572 |
-$ | +0.570 |
cling | +0.562 |
rients | +0.560 |
Neg logit contributions | |
assian | -0.589 |
hower | -0.566 |
oops | -0.556 |
orah | -0.555 |
hari | -0.549 |
Token | . |
Token ID | 13 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
llor | +1.795 |
zag | +1.744 |
-$ | +1.732 |
cling | +1.703 |
rients | +1.666 |
Neg logit contributions | |
assian | -2.275 |
hower | -2.228 |
orah | -2.161 |
hari | -2.156 |
oops | -2.156 |
Token |
|
Token ID | 198 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
assian | +1.559 |
hower | +1.515 |
orah | +1.484 |
oops | +1.476 |
hari | +1.469 |
Neg logit contributions | |
llor | -1.408 |
zag | -1.356 |
cling | -1.337 |
rients | -1.335 |
-$ | -1.318 |
Token |
|
Token ID | 198 |
Feature activation | -2.76e-01 |
Pos logit contributions | |
assian | +1.480 |
hower | +1.431 |
orah | +1.406 |
oops | +1.396 |
hari | +1.390 |
Neg logit contributions | |
llor | -1.488 |
zag | -1.434 |
rients | -1.415 |
cling | -1.413 |
distingu | -1.406 |
Token | " |
Token ID | 1 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
assian | +1.330 |
hower | +1.296 |
orah | +1.276 |
oops | +1.271 |
hari | +1.266 |
Neg logit contributions | |
llor | -0.777 |
zag | -0.740 |
rients | -0.726 |
cling | -0.725 |
-$ | -0.714 |
Token | We |
Token ID | 1135 |
Feature activation | -4.72e-01 |
Pos logit contributions | |
oops | +5.898 |
assian | +5.892 |
orah | +5.654 |
hari | +5.545 |
hower | +5.471 |
Neg logit contributions | |
llor | -6.836 |
distingu | -6.778 |
zag | -6.654 |
rients | -6.641 |
cling | -6.456 |
Token | are |
Token ID | 389 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
assian | +1.980 |
hower | +1.929 |
orah | +1.898 |
oops | +1.885 |
hari | +1.873 |
Neg logit contributions | |
llor | -1.608 |
zag | -1.545 |
rients | -1.530 |
cling | -1.515 |
-$ | -1.501 |
Token | a |
Token ID | 257 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
assian | +1.205 |
hower | +1.173 |
orah | +1.154 |
oops | +1.144 |
hari | +1.138 |
Neg logit contributions | |
llor | -1.055 |
zag | -1.013 |
rients | -1.000 |
cling | -0.998 |
-$ | -0.981 |
Token | community |
Token ID | 2055 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
assian | +0.591 |
hower | +0.575 |
orah | +0.562 |
oops | +0.557 |
hari | +0.555 |
Neg logit contributions | |
llor | -0.554 |
zag | -0.533 |
cling | -0.526 |
rients | -0.526 |
-$ | -0.521 |
Token | - |
Token ID | 12 |
Feature activation | -3.07e-01 |
Pos logit contributions | |
llor | +0.732 |
zag | +0.703 |
-$ | +0.700 |
cling | +0.694 |
rients | +0.691 |
Neg logit contributions | |
assian | -0.806 |
hower | -0.783 |
oops | -0.765 |
orah | -0.764 |
hari | -0.757 |