Token | Come |
Token ID | 7911 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.444 |
the | +5.257 |
, | +5.257 |
. | +5.122 |
a | +5.071 |
Neg logit contributions | |
umm | -3.983 |
lor | -3.917 |
rol | -3.879 |
osity | -3.734 |
bek | -3.675 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.259 |
the | +2.099 |
, | +2.079 |
. | +1.962 |
a | +1.941 |
Neg logit contributions | |
umm | -7.096 |
lor | -7.036 |
rol | -6.996 |
bek | -6.836 |
arians | -6.821 |
Token | see |
Token ID | 766 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.893 |
, | +3.654 |
. | +3.602 |
the | +3.572 |
a | +3.465 |
Neg logit contributions | |
lor | -5.353 |
rol | -5.347 |
umm | -5.334 |
bek | -5.229 |
osity | -5.224 |
Token | !" |
Token ID | 2474 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.033 |
the | +2.805 |
, | +2.768 |
a | +2.730 |
. | +2.596 |
Neg logit contributions | |
lor | -6.081 |
umm | -5.960 |
rol | -5.894 |
arians | -5.863 |
ocol | -5.774 |
Token | She |
Token ID | 1375 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.868 |
, | +2.729 |
the | +2.729 |
a | +2.591 |
. | +2.588 |
Neg logit contributions | |
umm | -6.369 |
lor | -6.307 |
rol | -6.254 |
osity | -6.117 |
arians | -6.062 |
Token | runs |
Token ID | 4539 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.170 |
, | +5.066 |
the | +5.050 |
. | +4.968 |
a | +4.874 |
Neg logit contributions | |
lor | -4.063 |
umm | -4.010 |
rol | -4.004 |
arians | -3.865 |
rob | -3.832 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.826 |
the | +1.665 |
, | +1.657 |
. | +1.527 |
a | +1.507 |
Neg logit contributions | |
umm | -7.543 |
lor | -7.469 |
rol | -7.443 |
bek | -7.273 |
osity | -7.261 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.450 |
, | +2.291 |
. | +2.111 |
the | +2.008 |
a | +1.996 |
Neg logit contributions | |
umm | -6.540 |
lor | -6.534 |
rol | -6.529 |
arians | -6.433 |
ocol | -6.427 |
Token | tree |
Token ID | 5509 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.900 |
, | +3.752 |
the | +3.633 |
. | +3.563 |
a | +3.488 |
Neg logit contributions | |
umm | -5.494 |
lor | -5.383 |
rol | -5.243 |
bek | -5.189 |
arians | -5.187 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +0.491 |
and | +0.454 |
a | +0.364 |
, | +0.359 |
. | +0.209 |
Neg logit contributions | |
umm | -8.540 |
lor | -8.539 |
rol | -8.496 |
bek | -8.312 |
osity | -8.294 |
Token | shows |
Token ID | 2523 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.945 |
, | +4.797 |
. | +4.714 |
the | +4.691 |
a | +4.588 |
Neg logit contributions | |
lor | -4.226 |
rol | -4.209 |
umm | -4.175 |
rob | -4.091 |
osity | -4.063 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.569 |
the | +1.451 |
, | +1.304 |
a | +1.264 |
. | +1.179 |
Neg logit contributions | |
umm | -7.487 |
rol | -7.373 |
lor | -7.357 |
osity | -7.282 |
arians | -7.264 |
Token | Ben |
Token ID | 3932 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.721 |
. | +3.592 |
, | +3.581 |
the | +3.529 |
a | +3.408 |
Neg logit contributions | |
umm | -5.347 |
lor | -5.260 |
osity | -5.179 |
rol | -5.119 |
arians | -5.093 |
Token | ! |
Token ID | 0 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.182 |
the | +1.072 |
a | +0.946 |
, | +0.929 |
. | +0.748 |
Neg logit contributions | |
umm | -8.005 |
lor | -7.977 |
rol | -7.800 |
bek | -7.741 |
arians | -7.735 |
Token | I |
Token ID | 314 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.253 |
, | +5.060 |
the | +5.053 |
. | +4.928 |
a | +4.892 |
Neg logit contributions | |
umm | -4.223 |
lor | -4.144 |
rol | -4.087 |
osity | -3.963 |
bek | -3.904 |
Token | found |
Token ID | 1043 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.550 |
the | +4.482 |
, | +4.391 |
. | +4.263 |
a | +4.251 |
Neg logit contributions | |
rol | -4.704 |
lor | -4.661 |
umm | -4.602 |
bek | -4.506 |
ides | -4.456 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.167 |
, | +2.922 |
the | +2.748 |
. | +2.738 |
a | +2.508 |
Neg logit contributions | |
lor | -6.142 |
rol | -6.133 |
umm | -6.128 |
ocol | -5.937 |
rob | -5.863 |
Token | new |
Token ID | 649 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.716 |
the | +4.575 |
, | +4.450 |
. | +4.427 |
a | +4.318 |
Neg logit contributions | |
lor | -4.613 |
umm | -4.607 |
bek | -4.436 |
rol | -4.401 |
arians | -4.342 |
Token | friend |
Token ID | 1545 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.166 |
the | +4.156 |
, | +3.984 |
a | +3.896 |
. | +3.881 |
Neg logit contributions | |
umm | -4.997 |
lor | -4.994 |
rol | -4.801 |
bek | -4.703 |
rob | -4.699 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.991 |
the | +2.973 |
, | +2.792 |
a | +2.783 |
. | +2.619 |
Neg logit contributions | |
lor | -6.176 |
rol | -6.113 |
umm | -6.077 |
arians | -5.955 |
bek | -5.844 |
Token | Come |
Token ID | 7911 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.444 |
the | +5.257 |
, | +5.257 |
. | +5.122 |
a | +5.071 |
Neg logit contributions | |
umm | -3.983 |
lor | -3.917 |
rol | -3.879 |
osity | -3.734 |
bek | -3.675 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.259 |
the | +2.099 |
, | +2.079 |
. | +1.962 |
a | +1.941 |
Neg logit contributions | |
umm | -7.096 |
lor | -7.036 |
rol | -6.996 |
bek | -6.836 |
arians | -6.821 |
Token | name |
Token ID | 1438 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.862 |
the | +4.768 |
, | +4.718 |
. | +4.513 |
a | +4.474 |
Neg logit contributions | |
umm | -4.376 |
lor | -4.357 |
rol | -4.270 |
arians | -4.193 |
bek | -4.139 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.428 |
the | +3.250 |
, | +3.212 |
. | +3.119 |
a | +3.097 |
Neg logit contributions | |
lor | -5.776 |
umm | -5.703 |
rol | -5.661 |
rob | -5.569 |
arians | -5.501 |
Token | The |
Token ID | 383 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.608 |
, | +2.412 |
the | +2.348 |
a | +2.282 |
. | +2.263 |
Neg logit contributions | |
lor | -6.550 |
umm | -6.537 |
rol | -6.488 |
bek | -6.342 |
arians | -6.317 |
Token | bird |
Token ID | 6512 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.711 |
, | +4.522 |
the | +4.507 |
. | +4.351 |
a | +4.303 |
Neg logit contributions | |
umm | -4.618 |
lor | -4.512 |
rob | -4.397 |
rol | -4.392 |
arians | -4.368 |
Token | whist |
Token ID | 32262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.366 |
the | +4.287 |
, | +4.228 |
a | +4.172 |
. | +4.090 |
Neg logit contributions | |
lor | -4.794 |
rol | -4.760 |
umm | -4.654 |
rob | -4.588 |
arians | -4.513 |
Token | les |
Token ID | 829 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +6.897 |
, | +6.778 |
the | +6.746 |
a | +6.604 |
. | +6.590 |
Neg logit contributions | |
lor | -2.431 |
rol | -2.393 |
umm | -2.371 |
rob | -2.220 |
osity | -2.185 |
Token | again |
Token ID | 757 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.850 |
the | +1.771 |
, | +1.742 |
a | +1.602 |
. | +1.534 |
Neg logit contributions | |
rol | -7.185 |
lor | -7.141 |
umm | -7.060 |
osity | -6.933 |
ides | -6.850 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +0.628 |
and | +0.567 |
a | +0.548 |
, | +0.432 |
. | +0.169 |
Neg logit contributions | |
lor | -8.277 |
umm | -8.225 |
bek | -8.137 |
ides | -8.072 |
arians | -8.036 |
Token | fl |
Token ID | 781 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.204 |
, | +5.040 |
. | +4.902 |
the | +4.897 |
a | +4.818 |
Neg logit contributions | |
lor | -3.975 |
umm | -3.926 |
rol | -3.888 |
rob | -3.849 |
arians | -3.799 |
Token | aps |
Token ID | 1686 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +6.795 |
the | +6.633 |
, | +6.619 |
. | +6.471 |
a | +6.455 |
Neg logit contributions | |
umm | -2.652 |
lor | -2.632 |
rol | -2.619 |
osity | -2.429 |
bek | -2.411 |
Token | its |
Token ID | 663 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.704 |
, | +2.554 |
the | +2.491 |
a | +2.354 |
. | +2.317 |
Neg logit contributions | |
rol | -6.372 |
lor | -6.333 |
umm | -6.215 |
osity | -6.129 |
bek | -6.121 |
Token | Ben |
Token ID | 3932 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.147 |
, | +1.952 |
. | +1.774 |
the | +1.736 |
a | +1.613 |
Neg logit contributions | |
lor | -6.865 |
umm | -6.860 |
rol | -6.778 |
ocol | -6.777 |
osity | -6.736 |
Token | 's |
Token ID | 338 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.155 |
the | +3.098 |
, | +3.021 |
a | +2.938 |
. | +2.865 |
Neg logit contributions | |
lor | -5.973 |
rol | -5.942 |
umm | -5.925 |
osity | -5.802 |
ides | -5.768 |
Token | voice |
Token ID | 3809 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.369 |
the | +4.286 |
, | +4.234 |
a | +4.074 |
. | +4.034 |
Neg logit contributions | |
umm | -4.945 |
lor | -4.847 |
rol | -4.727 |
osity | -4.644 |
arians | -4.635 |
Token | from |
Token ID | 422 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.305 |
the | +1.275 |
, | +1.175 |
a | +1.147 |
. | +0.982 |
Neg logit contributions | |
umm | -7.789 |
lor | -7.724 |
rol | -7.687 |
osity | -7.564 |
arians | -7.550 |
Token | behind |
Token ID | 2157 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.002 |
, | +3.891 |
the | +3.619 |
. | +3.609 |
a | +3.521 |
Neg logit contributions | |
umm | -5.195 |
ocol | -5.084 |
rol | -5.035 |
rob | -4.946 |
arians | -4.937 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.302 |
, | +1.116 |
the | +0.926 |
. | +0.879 |
a | +0.820 |
Neg logit contributions | |
lor | -7.713 |
umm | -7.643 |
rol | -7.586 |
ocol | -7.571 |
rob | -7.350 |
Token | tree |
Token ID | 5509 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.892 |
the | +3.698 |
, | +3.694 |
a | +3.616 |
. | +3.591 |
Neg logit contributions | |
lor | -5.382 |
umm | -5.272 |
rol | -5.183 |
bek | -5.051 |
rob | -5.043 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.186 |
the | +1.157 |
, | +1.072 |
a | +1.068 |
. | +0.807 |
Neg logit contributions | |
lor | -7.901 |
rol | -7.775 |
umm | -7.763 |
bek | -7.601 |
arians | -7.578 |
Token | He |
Token ID | 679 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.580 |
, | +3.426 |
the | +3.387 |
. | +3.276 |
a | +3.247 |
Neg logit contributions | |
umm | -5.748 |
lor | -5.642 |
rol | -5.612 |
osity | -5.556 |
bek | -5.398 |
Token | says |
Token ID | 1139 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.827 |
the | +4.723 |
, | +4.716 |
. | +4.625 |
a | +4.544 |
Neg logit contributions | |
lor | -4.356 |
rol | -4.276 |
umm | -4.274 |
arians | -4.151 |
rob | -4.130 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.271 |
the | +1.068 |
, | +1.031 |
. | +0.956 |
a | +0.920 |
Neg logit contributions | |
umm | -8.068 |
lor | -8.048 |
rol | -7.985 |
osity | -7.843 |
bek | -7.806 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +1.551 |
and | +1.504 |
, | +1.358 |
a | +1.356 |
. | +1.150 |
Neg logit contributions | |
lor | -7.472 |
umm | -7.430 |
rol | -7.394 |
arians | -7.294 |
osity | -7.193 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
, | +2.598 |
and | +2.561 |
the | +2.503 |
. | +2.488 |
a | +2.396 |
Neg logit contributions | |
rol | -6.304 |
umm | -6.289 |
lor | -6.219 |
osity | -6.138 |
arians | -6.130 |
Token | he |
Token ID | 339 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.977 |
, | +2.850 |
. | +2.776 |
the | +2.653 |
a | +2.559 |
Neg logit contributions | |
umm | -6.076 |
rol | -6.074 |
lor | -6.042 |
bek | -6.007 |
osity | -5.954 |
Token | never |
Token ID | 1239 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.841 |
the | +3.749 |
, | +3.743 |
. | +3.617 |
a | +3.591 |
Neg logit contributions | |
lor | -5.354 |
rol | -5.289 |
umm | -5.246 |
arians | -5.156 |
bek | -5.138 |
Token | had |
Token ID | 550 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.263 |
the | +4.057 |
, | +4.030 |
. | +3.899 |
a | +3.898 |
Neg logit contributions | |
umm | -4.964 |
rol | -4.939 |
lor | -4.889 |
beh | -4.866 |
osity | -4.865 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.930 |
, | +2.696 |
the | +2.452 |
. | +2.451 |
a | +2.201 |
Neg logit contributions | |
lor | -6.288 |
rol | -6.268 |
beh | -6.216 |
umm | -6.155 |
osity | -6.050 |
Token | good |
Token ID | 922 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.864 |
the | +5.797 |
. | +5.568 |
, | +5.566 |
a | +5.488 |
Neg logit contributions | |
umm | -3.394 |
lor | -3.378 |
bek | -3.255 |
osity | -3.193 |
rol | -3.139 |
Token | night |
Token ID | 1755 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +4.839 |
and | +4.829 |
, | +4.652 |
. | +4.544 |
a | +4.543 |
Neg logit contributions | |
umm | -4.469 |
lor | -4.311 |
rol | -4.223 |
ides | -4.130 |
osity | -4.126 |
Token | 's |
Token ID | 338 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.227 |
the | +3.163 |
, | +3.049 |
a | +3.016 |
. | +2.812 |
Neg logit contributions | |
umm | -6.094 |
lor | -5.948 |
rol | -5.817 |
vation | -5.699 |
ides | -5.662 |
Token | sleep |
Token ID | 3993 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.483 |
the | +5.407 |
, | +5.313 |
a | +5.142 |
. | +5.069 |
Neg logit contributions | |
umm | -3.785 |
lor | -3.640 |
rol | -3.533 |
osity | -3.507 |
ides | -3.461 |
Token | again |
Token ID | 757 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.502 |
the | +3.423 |
, | +3.330 |
a | +3.246 |
. | +3.056 |
Neg logit contributions | |
lor | -5.812 |
umm | -5.764 |
rol | -5.607 |
arians | -5.500 |
bek | -5.458 |
Token | opened |
Token ID | 4721 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.342 |
the | +3.285 |
, | +3.224 |
. | +3.146 |
a | +3.115 |
Neg logit contributions | |
lor | -5.811 |
rol | -5.714 |
umm | -5.689 |
arians | -5.577 |
bek | -5.571 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.091 |
, | +0.917 |
the | +0.817 |
. | +0.783 |
a | +0.732 |
Neg logit contributions | |
umm | -8.127 |
lor | -8.113 |
rol | -8.076 |
osity | -7.870 |
bek | -7.853 |
Token | closet |
Token ID | 21615 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.838 |
the | +4.688 |
, | +4.668 |
a | +4.513 |
. | +4.497 |
Neg logit contributions | |
umm | -4.517 |
lor | -4.478 |
rol | -4.370 |
bek | -4.257 |
osity | -4.232 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.488 |
the | +2.478 |
, | +2.357 |
a | +2.333 |
. | +2.219 |
Neg logit contributions | |
lor | -6.695 |
umm | -6.677 |
rol | -6.572 |
osity | -6.388 |
bek | -6.377 |
Token | saw |
Token ID | 2497 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.219 |
, | +3.073 |
the | +2.972 |
. | +2.963 |
a | +2.841 |
Neg logit contributions | |
lor | -5.999 |
rol | -5.974 |
umm | -5.937 |
bek | -5.847 |
rob | -5.763 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.330 |
, | +2.102 |
. | +1.908 |
the | +1.839 |
a | +1.652 |
Neg logit contributions | |
umm | -7.027 |
rol | -6.983 |
lor | -6.882 |
rob | -6.774 |
ocol | -6.715 |
Token | big |
Token ID | 1263 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.033 |
the | +3.889 |
, | +3.826 |
. | +3.732 |
a | +3.697 |
Neg logit contributions | |
umm | -5.310 |
lor | -5.223 |
bek | -5.093 |
rol | -5.074 |
osity | -5.000 |
Token | monster |
Token ID | 9234 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.544 |
the | +4.415 |
, | +4.330 |
. | +4.299 |
a | +4.288 |
Neg logit contributions | |
umm | -4.755 |
lor | -4.539 |
rol | -4.480 |
ocol | -4.404 |
bek | -4.399 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.901 |
the | +2.786 |
, | +2.731 |
a | +2.626 |
. | +2.527 |
Neg logit contributions | |
lor | -6.338 |
umm | -6.336 |
rol | -6.288 |
arians | -6.088 |
rob | -6.078 |
Token | The |
Token ID | 383 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.358 |
, | +3.195 |
the | +3.125 |
. | +3.028 |
a | +2.970 |
Neg logit contributions | |
umm | -6.010 |
lor | -5.942 |
rol | -5.860 |
bek | -5.736 |
osity | -5.717 |
Token | monster |
Token ID | 9234 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.269 |
, | +5.074 |
the | +5.053 |
. | +4.917 |
a | +4.844 |
Neg logit contributions | |
umm | -4.198 |
lor | -4.072 |
rol | -3.979 |
rob | -3.853 |
osity | -3.846 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.615 |
the | +0.462 |
, | +0.392 |
a | +0.298 |
. | +0.174 |
Neg logit contributions | |
umm | -8.717 |
lor | -8.629 |
rol | -8.568 |
bek | -8.424 |
osity | -8.409 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.002 |
, | +2.830 |
the | +2.777 |
. | +2.665 |
a | +2.621 |
Neg logit contributions | |
umm | -6.424 |
lor | -6.423 |
rol | -6.315 |
osity | -6.191 |
bek | -6.181 |
Token | A |
Token ID | 32 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.341 |
, | +4.164 |
the | +4.157 |
. | +4.005 |
a | +4.000 |
Neg logit contributions | |
umm | -5.012 |
lor | -4.979 |
rol | -4.916 |
rob | -4.730 |
bek | -4.698 |
Token | woman |
Token ID | 2415 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.084 |
the | +3.916 |
, | +3.890 |
. | +3.766 |
a | +3.758 |
Neg logit contributions | |
umm | -5.345 |
lor | -5.254 |
rol | -5.186 |
bek | -5.070 |
osity | -5.046 |
Token | had |
Token ID | 550 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.130 |
the | +3.101 |
, | +3.025 |
a | +2.988 |
. | +2.938 |
Neg logit contributions | |
lor | -5.911 |
rol | -5.842 |
umm | -5.832 |
rob | -5.698 |
arians | -5.676 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.240 |
, | +3.099 |
the | +3.039 |
. | +2.942 |
a | +2.739 |
Neg logit contributions | |
lor | -6.077 |
rol | -6.057 |
umm | -5.892 |
ocol | -5.724 |
rob | -5.724 |
Token | broken |
Token ID | 5445 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.571 |
the | +4.431 |
, | +4.321 |
. | +4.285 |
a | +4.185 |
Neg logit contributions | |
umm | -4.798 |
lor | -4.610 |
rol | -4.570 |
bek | -4.559 |
osity | -4.437 |
Token | toy |
Token ID | 13373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.234 |
the | +5.160 |
, | +4.990 |
a | +4.955 |
. | +4.932 |
Neg logit contributions | |
umm | -4.003 |
lor | -3.916 |
rol | -3.816 |
bek | -3.704 |
ocol | -3.683 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.370 |
the | +3.318 |
, | +3.187 |
a | +3.125 |
. | +3.006 |
Neg logit contributions | |
umm | -5.839 |
lor | -5.797 |
rol | -5.725 |
arians | -5.633 |
osity | -5.553 |
Token | She |
Token ID | 1375 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.687 |
, | +3.511 |
the | +3.474 |
. | +3.352 |
a | +3.338 |
Neg logit contributions | |
umm | -5.753 |
lor | -5.607 |
rol | -5.603 |
osity | -5.457 |
bek | -5.367 |
Token | liked |
Token ID | 8288 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.048 |
the | +2.971 |
, | +2.965 |
. | +2.777 |
a | +2.761 |
Neg logit contributions | |
lor | -6.082 |
rol | -6.047 |
umm | -6.045 |
bek | -5.923 |
arians | -5.882 |
Token | very |
Token ID | 845 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.469 |
the | +3.396 |
, | +3.303 |
a | +3.226 |
. | +3.147 |
Neg logit contributions | |
umm | -5.695 |
rol | -5.612 |
lor | -5.597 |
arians | -5.512 |
osity | -5.399 |
Token | much |
Token ID | 881 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.338 |
the | +3.170 |
, | +3.143 |
a | +2.984 |
. | +2.983 |
Neg logit contributions | |
umm | -6.044 |
lor | -5.957 |
rol | -5.938 |
bek | -5.756 |
osity | -5.725 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +0.493 |
and | +0.487 |
a | +0.375 |
, | +0.338 |
. | +0.116 |
Neg logit contributions | |
umm | -8.539 |
lor | -8.346 |
rol | -8.302 |
arians | -8.253 |
bek | -8.154 |
Token | It |
Token ID | 632 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.825 |
, | +3.679 |
the | +3.620 |
. | +3.495 |
a | +3.475 |
Neg logit contributions | |
umm | -5.632 |
rol | -5.438 |
lor | -5.425 |
osity | -5.271 |
arians | -5.213 |
Token | was |
Token ID | 373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.382 |
, | +3.244 |
the | +3.204 |
. | +3.064 |
a | +3.043 |
Neg logit contributions | |
rol | -5.847 |
umm | -5.810 |
lor | -5.784 |
bek | -5.631 |
rob | -5.609 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.073 |
, | +2.885 |
. | +2.766 |
the | +2.740 |
a | +2.513 |
Neg logit contributions | |
rol | -6.067 |
umm | -6.001 |
lor | -5.870 |
ocol | -5.860 |
osity | -5.856 |
Token | red |
Token ID | 2266 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.724 |
the | +3.569 |
, | +3.512 |
. | +3.421 |
a | +3.356 |
Neg logit contributions | |
umm | -5.645 |
bek | -5.450 |
lor | -5.437 |
rol | -5.312 |
osity | -5.270 |
Token | car |
Token ID | 1097 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.323 |
the | +4.282 |
, | +4.151 |
a | +4.066 |
. | +4.039 |
Neg logit contributions | |
umm | -4.981 |
lor | -4.819 |
rol | -4.782 |
bek | -4.660 |
osity | -4.631 |
Token | that |
Token ID | 326 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.516 |
the | +1.451 |
, | +1.340 |
a | +1.273 |
. | +1.157 |
Neg logit contributions | |
umm | -7.599 |
lor | -7.558 |
rol | -7.552 |
arians | -7.434 |
osity | -7.368 |
Token | could |
Token ID | 714 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.983 |
, | +3.822 |
. | +3.654 |
the | +3.652 |
a | +3.554 |
Neg logit contributions | |
rol | -5.308 |
umm | -5.290 |
lor | -5.191 |
osity | -5.041 |
bek | -5.018 |
Token | make |
Token ID | 787 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.229 |
, | +4.116 |
the | +3.997 |
. | +3.888 |
a | +3.790 |
Neg logit contributions | |
rol | -4.978 |
lor | -4.874 |
umm | -4.859 |
arians | -4.782 |
osity | -4.716 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +1.272 |
and | +1.265 |
, | +1.136 |
a | +1.119 |
. | +0.982 |
Neg logit contributions | |
umm | -7.797 |
lor | -7.657 |
rol | -7.629 |
arians | -7.591 |
osity | -7.512 |
Token | gave |
Token ID | 2921 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.297 |
, | +4.091 |
. | +3.980 |
the | +3.889 |
a | +3.692 |
Neg logit contributions | |
bek | -4.972 |
beh | -4.883 |
umm | -4.854 |
osity | -4.795 |
lor | -4.792 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.509 |
, | +2.324 |
. | +2.133 |
the | +2.012 |
a | +1.960 |
Neg logit contributions | |
rol | -6.853 |
lor | -6.799 |
umm | -6.774 |
bek | -6.632 |
arians | -6.563 |
Token | mighty |
Token ID | 18680 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.178 |
, | +4.996 |
the | +4.984 |
. | +4.838 |
a | +4.712 |
Neg logit contributions | |
umm | -4.240 |
lor | -4.150 |
arians | -4.061 |
rol | -3.997 |
bek | -3.984 |
Token | lion |
Token ID | 18744 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.100 |
the | +5.009 |
, | +4.877 |
. | +4.783 |
a | +4.782 |
Neg logit contributions | |
umm | -4.281 |
lor | -4.138 |
arians | -4.042 |
rol | -4.014 |
bek | -3.969 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.947 |
, | +2.785 |
the | +2.726 |
. | +2.542 |
a | +2.463 |
Neg logit contributions | |
lor | -6.283 |
rol | -6.166 |
umm | -6.027 |
beh | -6.023 |
bek | -5.994 |
Token | shiny |
Token ID | 22441 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.044 |
the | +4.889 |
, | +4.785 |
. | +4.728 |
a | +4.546 |
Neg logit contributions | |
lor | -4.286 |
umm | -4.242 |
bek | -4.217 |
rol | -4.077 |
osity | -4.027 |
Token | red |
Token ID | 2266 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.233 |
the | +5.187 |
, | +5.000 |
. | +4.947 |
a | +4.919 |
Neg logit contributions | |
umm | -4.077 |
lor | -3.912 |
rol | -3.816 |
ocol | -3.755 |
bek | -3.722 |
Token | apple |
Token ID | 17180 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.984 |
the | +4.970 |
, | +4.768 |
a | +4.688 |
. | +4.662 |
Neg logit contributions | |
umm | -4.346 |
lor | -4.220 |
rol | -4.100 |
bek | -3.975 |
ocol | -3.955 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +2.124 |
and | +2.124 |
, | +1.970 |
a | +1.896 |
. | +1.713 |
Neg logit contributions | |
umm | -7.065 |
lor | -6.969 |
rol | -6.906 |
bek | -6.692 |
arians | -6.676 |
Token | The |
Token ID | 383 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.144 |
, | +4.043 |
the | +3.948 |
. | +3.893 |
a | +3.813 |
Neg logit contributions | |
umm | -5.298 |
lor | -5.187 |
rol | -5.165 |
osity | -5.028 |
arians | -4.987 |
Token | reward |
Token ID | 6721 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.925 |
the | +4.777 |
, | +4.658 |
. | +4.608 |
a | +4.440 |
Neg logit contributions | |
lor | -4.375 |
umm | -4.286 |
bek | -4.274 |
rol | -4.238 |
osity | -4.153 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +2.056 |
and | +2.055 |
a | +1.865 |
, | +1.845 |
. | +1.638 |
Neg logit contributions | |
lor | -7.056 |
rol | -7.024 |
umm | -6.943 |
arians | -6.902 |
ides | -6.777 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.661 |
, | +3.508 |
the | +3.456 |
. | +3.376 |
a | +3.327 |
Neg logit contributions | |
lor | -5.647 |
umm | -5.644 |
rol | -5.607 |
arians | -5.459 |
osity | -5.402 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.777 |
, | +1.629 |
the | +1.608 |
. | +1.469 |
a | +1.449 |
Neg logit contributions | |
lor | -7.590 |
rol | -7.489 |
umm | -7.462 |
bek | -7.316 |
arians | -7.294 |
Token | The |
Token ID | 464 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.954 |
, | +4.824 |
the | +4.771 |
. | +4.679 |
a | +4.598 |
Neg logit contributions | |
lor | -4.479 |
umm | -4.409 |
rol | -4.393 |
bek | -4.308 |
arians | -4.266 |
Token | monkey |
Token ID | 21657 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.111 |
, | +4.927 |
the | +4.866 |
. | +4.787 |
a | +4.666 |
Neg logit contributions | |
umm | -4.370 |
arians | -4.152 |
lor | -4.132 |
rol | -4.052 |
bek | -4.045 |
Token | decided |
Token ID | 3066 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.596 |
the | +3.595 |
, | +3.479 |
. | +3.464 |
a | +3.437 |
Neg logit contributions | |
lor | -5.479 |
rol | -5.367 |
umm | -5.348 |
arians | -5.326 |
bek | -5.308 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.439 |
the | +1.272 |
, | +1.268 |
. | +1.192 |
a | +1.157 |
Neg logit contributions | |
lor | -7.672 |
bek | -7.463 |
osity | -7.462 |
rol | -7.436 |
arians | -7.410 |
Token | be |
Token ID | 307 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.452 |
, | +4.224 |
the | +4.211 |
. | +4.125 |
a | +4.058 |
Neg logit contributions | |
lor | -4.809 |
umm | -4.739 |
arians | -4.685 |
rol | -4.610 |
ides | -4.573 |
Token | brave |
Token ID | 14802 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.966 |
, | +3.709 |
. | +3.531 |
the | +3.524 |
a | +3.239 |
Neg logit contributions | |
beh | -5.264 |
rol | -5.257 |
lor | -5.236 |
bek | -5.192 |
umm | -5.125 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +1.272 |
and | +1.265 |
, | +1.136 |
a | +1.119 |
. | +0.982 |
Neg logit contributions | |
umm | -7.797 |
lor | -7.657 |
rol | -7.629 |
arians | -7.591 |
osity | -7.512 |
Token | They |
Token ID | 1119 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.414 |
, | +3.239 |
the | +3.204 |
. | +3.117 |
a | +3.066 |
Neg logit contributions | |
umm | -5.885 |
lor | -5.856 |
rol | -5.830 |
arians | -5.728 |
osity | -5.638 |
Token | tried |
Token ID | 3088 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.914 |
, | +3.731 |
the | +3.692 |
. | +3.621 |
a | +3.557 |
Neg logit contributions | |
rol | -5.319 |
bek | -5.202 |
umm | -5.165 |
lor | -5.157 |
arians | -5.141 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.648 |
, | +1.511 |
the | +1.504 |
. | +1.490 |
a | +1.366 |
Neg logit contributions | |
lor | -7.181 |
rol | -7.172 |
osity | -7.152 |
bek | -7.106 |
arians | -7.082 |
Token | think |
Token ID | 892 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.538 |
, | +4.429 |
the | +4.290 |
. | +4.259 |
a | +4.126 |
Neg logit contributions | |
arians | -4.606 |
lor | -4.447 |
umm | -4.432 |
bek | -4.390 |
beh | -4.373 |
Token | of |
Token ID | 286 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.750 |
the | +2.641 |
, | +2.587 |
a | +2.535 |
. | +2.497 |
Neg logit contributions | |
lor | -6.190 |
rol | -6.187 |
umm | -6.098 |
ides | -6.010 |
arians | -6.009 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.924 |
, | +2.732 |
. | +2.558 |
the | +2.432 |
a | +2.158 |
Neg logit contributions | |
lor | -6.323 |
arians | -6.214 |
umm | -6.205 |
bek | -6.042 |
rol | -6.004 |
Token | way |
Token ID | 835 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.750 |
the | +4.548 |
, | +4.438 |
. | +4.377 |
a | +4.325 |
Neg logit contributions | |
umm | -4.570 |
bek | -4.537 |
lor | -4.532 |
arians | -4.393 |
rol | -4.346 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.543 |
the | +1.380 |
, | +1.311 |
a | +1.300 |
. | +1.199 |
Neg logit contributions | |
rol | -7.639 |
lor | -7.566 |
umm | -7.529 |
osity | -7.442 |
bek | -7.363 |
Token | give |
Token ID | 1577 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.579 |
, | +4.346 |
. | +4.182 |
the | +4.126 |
a | +4.024 |
Neg logit contributions | |
arians | -4.633 |
lor | -4.583 |
bek | -4.476 |
umm | -4.461 |
rol | -4.444 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.223 |
, | +3.003 |
the | +2.826 |
. | +2.795 |
a | +2.763 |
Neg logit contributions | |
rol | -5.965 |
lor | -5.918 |
umm | -5.916 |
arians | -5.809 |
beh | -5.782 |
Token | lion |
Token ID | 18744 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.228 |
, | +5.032 |
the | +5.027 |
. | +4.876 |
a | +4.790 |
Neg logit contributions | |
umm | -4.261 |
lor | -4.054 |
rol | -4.013 |
arians | -4.005 |
bek | -3.881 |
Token | way |
Token ID | 835 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.750 |
the | +4.548 |
, | +4.438 |
. | +4.377 |
a | +4.325 |
Neg logit contributions | |
umm | -4.570 |
bek | -4.537 |
lor | -4.532 |
arians | -4.393 |
rol | -4.346 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.543 |
the | +1.380 |
, | +1.311 |
a | +1.300 |
. | +1.199 |
Neg logit contributions | |
rol | -7.639 |
lor | -7.566 |
umm | -7.529 |
osity | -7.442 |
bek | -7.363 |
Token | give |
Token ID | 1577 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.579 |
, | +4.346 |
. | +4.182 |
the | +4.126 |
a | +4.024 |
Neg logit contributions | |
arians | -4.633 |
lor | -4.583 |
bek | -4.476 |
umm | -4.461 |
rol | -4.444 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.223 |
, | +3.003 |
the | +2.826 |
. | +2.795 |
a | +2.763 |
Neg logit contributions | |
rol | -5.965 |
lor | -5.918 |
umm | -5.916 |
arians | -5.809 |
beh | -5.782 |
Token | lion |
Token ID | 18744 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.228 |
, | +5.032 |
the | +5.027 |
. | +4.876 |
a | +4.790 |
Neg logit contributions | |
umm | -4.261 |
lor | -4.054 |
rol | -4.013 |
arians | -4.005 |
bek | -3.881 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.785 |
the | +2.594 |
, | +2.561 |
. | +2.421 |
a | +2.353 |
Neg logit contributions | |
lor | -6.314 |
rol | -6.222 |
beh | -6.093 |
umm | -6.090 |
osity | -6.067 |
Token | reward |
Token ID | 6721 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.925 |
the | +4.777 |
, | +4.658 |
. | +4.608 |
a | +4.440 |
Neg logit contributions | |
lor | -4.375 |
umm | -4.286 |
bek | -4.274 |
rol | -4.238 |
osity | -4.153 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +2.056 |
and | +2.055 |
a | +1.865 |
, | +1.845 |
. | +1.638 |
Neg logit contributions | |
lor | -7.056 |
rol | -7.024 |
umm | -6.943 |
arians | -6.902 |
ides | -6.777 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.661 |
, | +3.508 |
the | +3.456 |
. | +3.376 |
a | +3.327 |
Neg logit contributions | |
lor | -5.647 |
umm | -5.644 |
rol | -5.607 |
arians | -5.459 |
osity | -5.402 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.777 |
, | +1.629 |
the | +1.608 |
. | +1.469 |
a | +1.449 |
Neg logit contributions | |
lor | -7.590 |
rol | -7.489 |
umm | -7.462 |
bek | -7.316 |
arians | -7.294 |
Token | The |
Token ID | 464 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.954 |
, | +4.824 |
the | +4.771 |
. | +4.679 |
a | +4.598 |
Neg logit contributions | |
lor | -4.479 |
umm | -4.409 |
rol | -4.393 |
bek | -4.308 |
arians | -4.266 |
Token | very |
Token ID | 845 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.505 |
, | +3.361 |
. | +3.300 |
the | +3.209 |
a | +2.971 |
Neg logit contributions | |
rol | -5.759 |
lor | -5.581 |
umm | -5.415 |
beh | -5.371 |
osity | -5.360 |
Token | happy |
Token ID | 3772 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.093 |
the | +3.849 |
, | +3.838 |
. | +3.789 |
a | +3.693 |
Neg logit contributions | |
umm | -5.144 |
rol | -5.072 |
bek | -5.058 |
osity | -4.982 |
lor | -4.971 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +0.720 |
and | +0.685 |
a | +0.605 |
, | +0.569 |
. | +0.437 |
Neg logit contributions | |
umm | -8.268 |
lor | -8.180 |
rol | -8.075 |
osity | -8.024 |
arians | -7.976 |
Token | thanked |
Token ID | 26280 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.431 |
, | +4.245 |
. | +4.197 |
the | +4.119 |
a | +4.077 |
Neg logit contributions | |
umm | -4.735 |
lor | -4.660 |
bek | -4.647 |
rol | -4.638 |
beh | -4.533 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.157 |
, | +1.984 |
. | +1.798 |
the | +1.737 |
a | +1.733 |
Neg logit contributions | |
umm | -7.075 |
lor | -7.058 |
rol | -6.986 |
arians | -6.925 |
bek | -6.889 |
Token | monkey |
Token ID | 21657 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.936 |
, | +4.769 |
the | +4.695 |
. | +4.575 |
a | +4.476 |
Neg logit contributions | |
umm | -4.532 |
lor | -4.340 |
arians | -4.256 |
rol | -4.252 |
bek | -4.186 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.986 |
the | +1.907 |
, | +1.837 |
a | +1.737 |
. | +1.613 |
Neg logit contributions | |
lor | -7.159 |
rol | -7.084 |
umm | -7.011 |
bek | -6.923 |
arians | -6.908 |
Token | But |
Token ID | 887 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.423 |
, | +4.311 |
the | +4.221 |
. | +4.142 |
a | +4.114 |
Neg logit contributions | |
umm | -4.984 |
lor | -4.903 |
rol | -4.887 |
osity | -4.698 |
arians | -4.687 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.759 |
. | +2.543 |
, | +2.523 |
the | +2.462 |
a | +2.439 |
Neg logit contributions | |
umm | -6.325 |
bek | -6.256 |
lor | -6.250 |
rol | -6.220 |
arians | -6.169 |
Token | rest |
Token ID | 1334 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.087 |
, | +4.927 |
the | +4.870 |
. | +4.792 |
a | +4.622 |
Neg logit contributions | |
umm | -4.333 |
lor | -4.123 |
arians | -4.069 |
bek | -4.025 |
rob | -3.995 |
Token | of |
Token ID | 286 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +6.000 |
the | +5.878 |
, | +5.846 |
a | +5.817 |
. | +5.782 |
Neg logit contributions | |
rol | -3.244 |
umm | -3.153 |
lor | -3.104 |
osity | -3.007 |
bek | -2.966 |
Token | mighty |
Token ID | 18680 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.178 |
, | +4.996 |
the | +4.984 |
. | +4.838 |
a | +4.712 |
Neg logit contributions | |
umm | -4.240 |
lor | -4.150 |
arians | -4.061 |
rol | -3.997 |
bek | -3.984 |
Token | lion |
Token ID | 18744 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.100 |
the | +5.009 |
, | +4.877 |
. | +4.783 |
a | +4.782 |
Neg logit contributions | |
umm | -4.281 |
lor | -4.138 |
arians | -4.042 |
rol | -4.014 |
bek | -3.969 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.947 |
, | +2.785 |
the | +2.726 |
. | +2.542 |
a | +2.463 |
Neg logit contributions | |
lor | -6.283 |
rol | -6.166 |
umm | -6.027 |
beh | -6.023 |
bek | -5.994 |
Token | shiny |
Token ID | 22441 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.044 |
the | +4.889 |
, | +4.785 |
. | +4.728 |
a | +4.546 |
Neg logit contributions | |
lor | -4.286 |
umm | -4.242 |
bek | -4.217 |
rol | -4.077 |
osity | -4.027 |
Token | red |
Token ID | 2266 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.233 |
the | +5.187 |
, | +5.000 |
. | +4.947 |
a | +4.919 |
Neg logit contributions | |
umm | -4.077 |
lor | -3.912 |
rol | -3.816 |
ocol | -3.755 |
bek | -3.722 |
Token | apple |
Token ID | 17180 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.984 |
the | +4.970 |
, | +4.768 |
a | +4.688 |
. | +4.662 |
Neg logit contributions | |
umm | -4.346 |
lor | -4.220 |
rol | -4.100 |
bek | -3.975 |
ocol | -3.955 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +2.124 |
and | +2.124 |
, | +1.970 |
a | +1.896 |
. | +1.713 |
Neg logit contributions | |
umm | -7.065 |
lor | -6.969 |
rol | -6.906 |
bek | -6.692 |
arians | -6.676 |
Token | The |
Token ID | 383 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.144 |
, | +4.043 |
the | +3.948 |
. | +3.893 |
a | +3.813 |
Neg logit contributions | |
umm | -5.298 |
lor | -5.187 |
rol | -5.165 |
osity | -5.028 |
arians | -4.987 |
Token | lion |
Token ID | 18744 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.086 |
, | +4.911 |
the | +4.843 |
. | +4.772 |
a | +4.641 |
Neg logit contributions | |
umm | -4.350 |
lor | -4.140 |
arians | -4.128 |
bek | -4.048 |
rol | -4.040 |
Token | was |
Token ID | 373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.687 |
the | +3.670 |
, | +3.596 |
. | +3.567 |
a | +3.520 |
Neg logit contributions | |
lor | -5.390 |
rol | -5.289 |
umm | -5.279 |
arians | -5.222 |
bek | -5.162 |
Token | very |
Token ID | 845 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.505 |
, | +3.361 |
. | +3.300 |
the | +3.209 |
a | +2.971 |
Neg logit contributions | |
rol | -5.759 |
lor | -5.581 |
umm | -5.415 |
beh | -5.371 |
osity | -5.360 |
Token | He |
Token ID | 679 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.408 |
, | +4.290 |
the | +4.198 |
. | +4.093 |
a | +3.997 |
Neg logit contributions | |
umm | -5.118 |
rol | -4.928 |
lor | -4.913 |
osity | -4.794 |
arians | -4.767 |
Token | yelled |
Token ID | 22760 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.106 |
, | +4.058 |
the | +4.013 |
. | +3.971 |
a | +3.892 |
Neg logit contributions | |
lor | -4.945 |
rol | -4.906 |
arians | -4.885 |
bek | -4.844 |
umm | -4.793 |
Token | that |
Token ID | 326 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.364 |
the | +2.292 |
, | +2.171 |
. | +2.144 |
a | +2.106 |
Neg logit contributions | |
umm | -6.631 |
rol | -6.622 |
lor | -6.563 |
osity | -6.524 |
arians | -6.419 |
Token | he |
Token ID | 339 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.647 |
, | +2.392 |
. | +2.312 |
the | +2.170 |
a | +2.135 |
Neg logit contributions | |
umm | -6.531 |
rol | -6.467 |
lor | -6.442 |
osity | -6.419 |
bek | -6.361 |
Token | wanted |
Token ID | 2227 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +3.931 |
and | +3.922 |
, | +3.844 |
a | +3.681 |
. | +3.655 |
Neg logit contributions | |
lor | -5.237 |
rol | -5.219 |
arians | -5.113 |
umm | -5.063 |
ides | -4.997 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.799 |
, | +1.605 |
. | +1.457 |
the | +1.402 |
a | +1.279 |
Neg logit contributions | |
umm | -7.176 |
lor | -7.173 |
rol | -7.016 |
arians | -6.999 |
osity | -6.957 |
Token | better |
Token ID | 1365 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.931 |
the | +4.751 |
, | +4.660 |
. | +4.606 |
a | +4.503 |
Neg logit contributions | |
umm | -4.434 |
lor | -4.308 |
bek | -4.279 |
rol | -4.148 |
osity | -4.129 |
Token | reward |
Token ID | 6721 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.345 |
the | +4.313 |
, | +4.127 |
. | +4.032 |
a | +4.023 |
Neg logit contributions | |
umm | -4.958 |
lor | -4.785 |
rol | -4.578 |
bek | -4.553 |
ides | -4.523 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.923 |
the | +1.895 |
, | +1.728 |
a | +1.716 |
. | +1.520 |
Neg logit contributions | |
lor | -7.115 |
rol | -7.094 |
umm | -7.031 |
arians | -6.954 |
bek | -6.897 |
Token | All |
Token ID | 1439 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.027 |
, | +3.871 |
the | +3.813 |
. | +3.691 |
a | +3.665 |
Neg logit contributions | |
umm | -5.446 |
lor | -5.322 |
rol | -5.265 |
arians | -5.145 |
osity | -5.112 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.764 |
, | +1.549 |
. | +1.439 |
a | +1.419 |
the | +1.379 |
Neg logit contributions | |
umm | -7.443 |
rol | -7.390 |
osity | -7.232 |
lor | -7.230 |
bek | -7.191 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +0.551 |
and | +0.434 |
a | +0.424 |
, | +0.311 |
. | +0.199 |
Neg logit contributions | |
rol | -8.294 |
lor | -8.239 |
umm | -8.234 |
osity | -8.227 |
arians | -8.070 |
Token | said |
Token ID | 531 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.425 |
, | +4.188 |
. | +4.092 |
the | +3.955 |
a | +3.921 |
Neg logit contributions | |
rol | -4.893 |
bek | -4.832 |
umm | -4.806 |
lor | -4.799 |
beh | -4.699 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.107 |
the | +3.835 |
, | +3.766 |
. | +3.740 |
a | +3.660 |
Neg logit contributions | |
lor | -5.200 |
umm | -5.109 |
rol | -5.076 |
osity | -4.999 |
bek | -4.915 |
Token | " |
Token ID | 366 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.844 |
the | +2.718 |
, | +2.706 |
. | +2.579 |
a | +2.569 |
Neg logit contributions | |
lor | -6.304 |
umm | -6.241 |
rol | -6.184 |
osity | -6.172 |
arians | -6.103 |
Token | Would |
Token ID | 17353 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +6.037 |
, | +5.979 |
the | +5.848 |
. | +5.744 |
a | +5.673 |
Neg logit contributions | |
umm | -3.526 |
lor | -3.522 |
rol | -3.424 |
bek | -3.292 |
arians | -3.223 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.239 |
, | +3.048 |
the | +3.033 |
. | +2.916 |
a | +2.874 |
Neg logit contributions | |
umm | -6.176 |
lor | -6.129 |
rol | -6.064 |
bek | -5.909 |
arians | -5.891 |
Token | hug |
Token ID | 16225 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.167 |
the | +4.986 |
, | +4.925 |
. | +4.815 |
a | +4.725 |
Neg logit contributions | |
umm | -4.331 |
lor | -4.184 |
bek | -4.130 |
rol | -4.056 |
arians | -3.947 |
Token | work |
Token ID | 670 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.086 |
the | +4.017 |
, | +3.889 |
a | +3.842 |
. | +3.819 |
Neg logit contributions | |
lor | -5.123 |
umm | -5.070 |
rol | -5.065 |
osity | -4.853 |
reetings | -4.842 |
Token | instead |
Token ID | 2427 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.557 |
the | +3.442 |
, | +3.323 |
a | +3.318 |
. | +3.269 |
Neg logit contributions | |
umm | -5.618 |
lor | -5.565 |
rol | -5.529 |
osity | -5.369 |
reetings | -5.367 |
Token | of |
Token ID | 286 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.017 |
the | +3.912 |
a | +3.790 |
, | +3.777 |
. | +3.706 |
Neg logit contributions | |
lor | -5.194 |
umm | -5.147 |
rol | -5.119 |
reetings | -4.957 |
osity | -4.873 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.329 |
, | +4.103 |
. | +4.011 |
the | +3.920 |
a | +3.795 |
Neg logit contributions | |
umm | -4.824 |
lor | -4.739 |
ocol | -4.732 |
arians | -4.717 |
rol | -4.566 |
Token | loudly |
Token ID | 23112 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.734 |
the | +3.460 |
, | +3.440 |
. | +3.298 |
a | +3.286 |
Neg logit contributions | |
umm | -5.625 |
lor | -5.574 |
rol | -5.472 |
bek | -5.428 |
osity | -5.394 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.353 |
the | +2.292 |
, | +2.151 |
a | +2.119 |
. | +2.041 |
Neg logit contributions | |
lor | -6.698 |
umm | -6.644 |
rol | -6.619 |
osity | -6.532 |
arians | -6.463 |
Token | " |
Token ID | 366 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.917 |
, | +2.854 |
the | +2.821 |
. | +2.766 |
a | +2.669 |
Neg logit contributions | |
rol | -6.078 |
lor | -6.016 |
umm | -5.965 |
osity | -5.965 |
arians | -5.885 |
Token | I |
Token ID | 40 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.947 |
, | +5.848 |
the | +5.774 |
. | +5.648 |
a | +5.609 |
Neg logit contributions | |
umm | -3.551 |
lor | -3.498 |
rol | -3.467 |
bek | -3.287 |
osity | -3.236 |
Token | want |
Token ID | 765 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.750 |
the | +4.680 |
, | +4.548 |
a | +4.450 |
. | +4.436 |
Neg logit contributions | |
lor | -4.481 |
rol | -4.472 |
umm | -4.367 |
bek | -4.277 |
reetings | -4.238 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.059 |
, | +1.853 |
. | +1.743 |
the | +1.663 |
a | +1.484 |
Neg logit contributions | |
lor | -7.098 |
umm | -7.063 |
rol | -6.947 |
arians | -6.873 |
osity | -6.847 |
Token | reward |
Token ID | 6721 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.153 |
the | +4.986 |
, | +4.904 |
. | +4.834 |
a | +4.705 |
Neg logit contributions | |
umm | -4.196 |
lor | -4.147 |
rol | -4.058 |
bek | -4.020 |
osity | -3.952 |
Token | !" |
Token ID | 2474 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.869 |
the | +2.788 |
, | +2.650 |
a | +2.574 |
. | +2.519 |
Neg logit contributions | |
umm | -6.322 |
lor | -6.307 |
rol | -6.298 |
arians | -6.152 |
bek | -6.031 |
Token | The |
Token ID | 383 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.544 |
, | +3.429 |
the | +3.377 |
. | +3.240 |
a | +3.232 |
Neg logit contributions | |
lor | -5.710 |
umm | -5.624 |
rol | -5.570 |
arians | -5.415 |
bek | -5.402 |
Token | other |
Token ID | 584 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.197 |
, | +5.009 |
the | +4.973 |
. | +4.853 |
a | +4.754 |
Neg logit contributions | |
umm | -4.305 |
lor | -4.062 |
arians | -4.014 |
bek | -3.973 |
rol | -3.967 |
Token | animals |
Token ID | 4695 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.659 |
the | +4.509 |
, | +4.472 |
. | +4.354 |
a | +4.316 |
Neg logit contributions | |
umm | -4.702 |
rol | -4.545 |
lor | -4.512 |
arians | -4.430 |
bek | -4.389 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +0.949 |
and | +0.931 |
, | +0.757 |
a | +0.741 |
. | +0.553 |
Neg logit contributions | |
umm | -8.071 |
lor | -7.899 |
rol | -7.870 |
arians | -7.791 |
osity | -7.768 |
Token | I |
Token ID | 314 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.186 |
, | +5.015 |
the | +4.990 |
. | +4.878 |
a | +4.818 |
Neg logit contributions | |
umm | -4.269 |
lor | -4.171 |
rol | -4.114 |
osity | -4.030 |
arians | -3.966 |
Token | can |
Token ID | 460 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.161 |
the | +4.067 |
, | +4.015 |
a | +3.867 |
. | +3.865 |
Neg logit contributions | |
umm | -5.028 |
rol | -5.026 |
lor | -5.008 |
bek | -4.863 |
osity | -4.855 |
Token | 't |
Token ID | 470 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.404 |
the | +4.241 |
, | +4.226 |
. | +4.080 |
a | +4.071 |
Neg logit contributions | |
umm | -4.870 |
lor | -4.839 |
rol | -4.757 |
arians | -4.689 |
osity | -4.646 |
Token | fix |
Token ID | 4259 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.104 |
the | +3.985 |
, | +3.943 |
a | +3.816 |
. | +3.754 |
Neg logit contributions | |
umm | -5.168 |
lor | -5.075 |
rol | -4.998 |
arians | -4.925 |
ides | -4.918 |
Token | it |
Token ID | 340 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.751 |
, | +1.526 |
. | +1.319 |
the | +1.319 |
a | +1.287 |
Neg logit contributions | |
umm | -7.387 |
lor | -7.386 |
rol | -7.233 |
ocol | -7.224 |
arians | -7.208 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.539 |
the | +2.487 |
, | +2.339 |
a | +2.311 |
. | +2.085 |
Neg logit contributions | |
umm | -6.601 |
rol | -6.519 |
lor | -6.494 |
arians | -6.346 |
ides | -6.335 |
Token | I |
Token ID | 314 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.261 |
, | +5.109 |
the | +5.095 |
. | +4.960 |
a | +4.896 |
Neg logit contributions | |
umm | -4.202 |
lor | -4.076 |
rol | -4.022 |
osity | -3.945 |
arians | -3.909 |
Token | love |
Token ID | 1842 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.112 |
the | +4.025 |
, | +3.965 |
a | +3.826 |
. | +3.812 |
Neg logit contributions | |
rol | -5.077 |
umm | -5.076 |
lor | -5.053 |
bek | -4.910 |
osity | -4.891 |
Token | my |
Token ID | 616 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.176 |
, | +3.025 |
the | +2.831 |
. | +2.829 |
a | +2.785 |
Neg logit contributions | |
umm | -6.083 |
arians | -5.845 |
ocol | -5.845 |
lor | -5.838 |
osity | -5.793 |
Token | toy |
Token ID | 13373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.501 |
the | +3.439 |
, | +3.346 |
a | +3.185 |
. | +3.137 |
Neg logit contributions | |
umm | -5.713 |
arians | -5.493 |
lor | -5.453 |
bek | -5.390 |
osity | -5.364 |
Token | that |
Token ID | 326 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.516 |
the | +1.451 |
, | +1.340 |
a | +1.273 |
. | +1.157 |
Neg logit contributions | |
umm | -7.599 |
lor | -7.558 |
rol | -7.552 |
arians | -7.434 |
osity | -7.368 |
Token | could |
Token ID | 714 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.983 |
, | +3.822 |
. | +3.654 |
the | +3.652 |
a | +3.554 |
Neg logit contributions | |
rol | -5.308 |
umm | -5.290 |
lor | -5.191 |
osity | -5.041 |
bek | -5.018 |
Token | make |
Token ID | 787 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.229 |
, | +4.116 |
the | +3.997 |
. | +3.888 |
a | +3.790 |
Neg logit contributions | |
rol | -4.978 |
lor | -4.874 |
umm | -4.859 |
arians | -4.782 |
osity | -4.716 |
Token | sounds |
Token ID | 5238 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.539 |
, | +3.353 |
the | +3.168 |
. | +3.100 |
a | +2.999 |
Neg logit contributions | |
rol | -5.748 |
umm | -5.662 |
lor | -5.605 |
beh | -5.459 |
ocol | -5.437 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.417 |
the | +1.340 |
, | +1.298 |
a | +1.182 |
. | +1.076 |
Neg logit contributions | |
umm | -7.657 |
rol | -7.601 |
lor | -7.472 |
osity | -7.426 |
arians | -7.398 |
Token | move |
Token ID | 1445 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.838 |
, | +4.688 |
the | +4.511 |
. | +4.474 |
a | +4.364 |
Neg logit contributions | |
umm | -4.312 |
rol | -4.248 |
osity | -4.248 |
arians | -4.141 |
bek | -4.124 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.315 |
, | +2.192 |
the | +2.131 |
a | +2.013 |
. | +1.920 |
Neg logit contributions | |
rol | -6.779 |
umm | -6.686 |
lor | -6.593 |
arians | -6.514 |
osity | -6.501 |
Token | But |
Token ID | 887 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.998 |
, | +3.858 |
the | +3.798 |
. | +3.665 |
a | +3.645 |
Neg logit contributions | |
umm | -5.452 |
rol | -5.298 |
lor | -5.268 |
arians | -5.110 |
osity | -5.105 |
Token | one |
Token ID | 530 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.574 |
. | +2.350 |
, | +2.279 |
the | +2.203 |
a | +2.151 |
Neg logit contributions | |
umm | -6.576 |
rol | -6.426 |
lor | -6.416 |
osity | -6.416 |
bek | -6.385 |
Token | day |
Token ID | 1110 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.241 |
the | +3.085 |
, | +3.075 |
. | +2.952 |
a | +2.920 |
Neg logit contributions | |
umm | -6.105 |
lor | -5.953 |
rol | -5.945 |
bek | -5.873 |
osity | -5.788 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.824 |
the | +0.480 |
. | +0.464 |
, | +0.420 |
a | +0.367 |
Neg logit contributions | |
umm | -8.297 |
lor | -8.292 |
rol | -8.180 |
osity | -8.119 |
bek | -8.099 |
Token | used |
Token ID | 973 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.670 |
, | +3.541 |
the | +3.520 |
. | +3.392 |
a | +3.339 |
Neg logit contributions | |
umm | -5.520 |
rol | -5.486 |
lor | -5.468 |
bek | -5.403 |
arians | -5.327 |
Token | glue |
Token ID | 22749 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.370 |
, | +2.217 |
. | +2.077 |
the | +1.966 |
a | +1.827 |
Neg logit contributions | |
rol | -6.674 |
umm | -6.614 |
ocol | -6.505 |
osity | -6.467 |
lor | -6.461 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.284 |
the | +1.176 |
, | +1.136 |
a | +1.106 |
. | +1.041 |
Neg logit contributions | |
rol | -7.647 |
lor | -7.579 |
umm | -7.571 |
osity | -7.482 |
ides | -7.341 |
Token | tape |
Token ID | 9154 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.794 |
, | +4.657 |
. | +4.580 |
the | +4.526 |
a | +4.319 |
Neg logit contributions | |
umm | -4.228 |
ocol | -4.051 |
bek | -4.036 |
rol | -4.026 |
vals | -4.023 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.374 |
the | +1.239 |
, | +1.191 |
a | +1.136 |
. | +1.045 |
Neg logit contributions | |
rol | -7.668 |
umm | -7.546 |
lor | -7.542 |
osity | -7.451 |
ides | -7.324 |
Token | scissors |
Token ID | 41786 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.799 |
, | +4.677 |
. | +4.586 |
the | +4.538 |
a | +4.348 |
Neg logit contributions | |
umm | -4.185 |
bek | -4.041 |
rol | -4.013 |
plets | -3.977 |
vals | -3.976 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.126 |
the | +2.046 |
, | +1.952 |
a | +1.906 |
. | +1.765 |
Neg logit contributions | |
rol | -6.957 |
lor | -6.839 |
umm | -6.775 |
osity | -6.754 |
ides | -6.685 |
Token | But |
Token ID | 887 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.830 |
, | +3.688 |
the | +3.656 |
. | +3.529 |
a | +3.499 |
Neg logit contributions | |
umm | -5.591 |
rol | -5.365 |
lor | -5.322 |
osity | -5.261 |
arians | -5.228 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.992 |
. | +1.772 |
, | +1.720 |
a | +1.612 |
the | +1.612 |
Neg logit contributions | |
umm | -7.104 |
rol | -6.991 |
osity | -6.927 |
bek | -6.913 |
lor | -6.886 |
Token | toy |
Token ID | 13373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.879 |
, | +3.809 |
the | +3.752 |
. | +3.600 |
a | +3.510 |
Neg logit contributions | |
umm | -5.464 |
lor | -5.237 |
arians | -5.149 |
bek | -5.140 |
rob | -5.087 |
Token | did |
Token ID | 750 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.762 |
the | +3.672 |
, | +3.621 |
. | +3.509 |
a | +3.503 |
Neg logit contributions | |
lor | -5.425 |
umm | -5.418 |
rol | -5.334 |
arians | -5.275 |
bek | -5.214 |
Token | cookies |
Token ID | 14746 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.733 |
the | +4.567 |
, | +4.549 |
. | +4.419 |
a | +4.407 |
Neg logit contributions | |
umm | -4.659 |
lor | -4.522 |
rol | -4.497 |
bek | -4.315 |
arians | -4.311 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.182 |
the | +1.131 |
, | +1.012 |
a | +0.977 |
. | +0.832 |
Neg logit contributions | |
umm | -7.953 |
lor | -7.893 |
rol | -7.862 |
arians | -7.709 |
rob | -7.697 |
Token | but |
Token ID | 475 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.436 |
, | +4.360 |
the | +4.277 |
. | +4.230 |
a | +4.138 |
Neg logit contributions | |
umm | -4.794 |
rol | -4.717 |
lor | -4.638 |
arians | -4.503 |
rob | -4.500 |
Token | her |
Token ID | 607 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.440 |
, | +2.216 |
the | +2.174 |
. | +2.156 |
a | +2.044 |
Neg logit contributions | |
umm | -6.865 |
lor | -6.738 |
rol | -6.717 |
bek | -6.618 |
osity | -6.561 |
Token | mom |
Token ID | 1995 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.225 |
the | +4.052 |
, | +4.050 |
. | +3.927 |
a | +3.843 |
Neg logit contributions | |
umm | -5.223 |
lor | -4.985 |
rol | -4.891 |
arians | -4.874 |
bek | -4.791 |
Token | always |
Token ID | 1464 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.743 |
the | +3.671 |
, | +3.595 |
a | +3.533 |
. | +3.485 |
Neg logit contributions | |
umm | -5.423 |
rol | -5.365 |
lor | -5.364 |
bek | -5.216 |
arians | -5.177 |
Token | told |
Token ID | 1297 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.648 |
the | +3.498 |
, | +3.465 |
a | +3.356 |
. | +3.353 |
Neg logit contributions | |
rol | -5.462 |
umm | -5.452 |
lor | -5.404 |
bek | -5.401 |
osity | -5.292 |
Token | her |
Token ID | 607 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.772 |
, | +1.604 |
the | +1.491 |
. | +1.443 |
a | +1.377 |
Neg logit contributions | |
umm | -7.474 |
rol | -7.349 |
lor | -7.323 |
osity | -7.174 |
ides | -7.164 |
Token | not |
Token ID | 407 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.070 |
the | +1.890 |
, | +1.869 |
. | +1.730 |
a | +1.718 |
Neg logit contributions | |
umm | -7.235 |
lor | -7.230 |
rol | -7.111 |
osity | -7.045 |
bek | -6.998 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.733 |
, | +1.587 |
the | +1.541 |
. | +1.407 |
a | +1.378 |
Neg logit contributions | |
umm | -7.524 |
lor | -7.416 |
rol | -7.409 |
osity | -7.374 |
bek | -7.315 |
Token | eat |
Token ID | 4483 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.946 |
the | +3.797 |
, | +3.725 |
a | +3.665 |
. | +3.566 |
Neg logit contributions | |
umm | -5.408 |
lor | -5.163 |
rol | -5.160 |
bek | -5.060 |
osity | -5.049 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.419 |
the | +2.393 |
a | +2.254 |
, | +2.236 |
. | +1.955 |
Neg logit contributions | |
umm | -6.883 |
rol | -6.826 |
lor | -6.704 |
plets | -6.485 |
rob | -6.475 |
Token | She |
Token ID | 1375 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.266 |
the | +4.124 |
, | +4.105 |
. | +3.955 |
a | +3.944 |
Neg logit contributions | |
umm | -5.182 |
lor | -5.048 |
rol | -4.981 |
osity | -4.925 |
bek | -4.814 |
Token | wished |
Token ID | 16555 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.443 |
, | +4.397 |
the | +4.391 |
. | +4.281 |
a | +4.229 |
Neg logit contributions | |
lor | -4.646 |
rol | -4.566 |
bek | -4.525 |
umm | -4.523 |
arians | -4.423 |
Token | they |
Token ID | 484 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.606 |
, | +2.472 |
the | +2.412 |
. | +2.390 |
a | +2.342 |
Neg logit contributions | |
umm | -6.533 |
lor | -6.437 |
rol | -6.395 |
osity | -6.369 |
arians | -6.223 |
Token | had |
Token ID | 550 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.200 |
, | +3.036 |
the | +3.010 |
. | +2.892 |
a | +2.856 |
Neg logit contributions | |
umm | -6.129 |
lor | -6.113 |
rol | -6.074 |
bek | -5.931 |
osity | -5.900 |
Token | never |
Token ID | 1239 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.552 |
, | +4.419 |
the | +4.200 |
. | +4.189 |
a | +3.981 |
Neg logit contributions | |
lor | -4.722 |
bek | -4.595 |
rol | -4.580 |
umm | -4.548 |
beh | -4.527 |
Token | gone |
Token ID | 3750 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.659 |
, | +4.480 |
the | +4.396 |
. | +4.326 |
a | +4.196 |
Neg logit contributions | |
umm | -4.644 |
rol | -4.580 |
lor | -4.519 |
beh | -4.464 |
osity | -4.429 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.499 |
the | +2.373 |
, | +2.300 |
a | +2.224 |
. | +2.134 |
Neg logit contributions | |
rol | -6.489 |
umm | -6.446 |
lor | -6.433 |
osity | -6.302 |
beh | -6.293 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.801 |
, | +2.525 |
. | +2.302 |
the | +2.188 |
a | +2.185 |
Neg logit contributions | |
umm | -6.324 |
rol | -6.209 |
lor | -6.187 |
ocol | -6.093 |
former | -6.063 |
Token | gloomy |
Token ID | 46400 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.538 |
, | +5.348 |
the | +5.312 |
. | +5.195 |
a | +5.142 |
Neg logit contributions | |
umm | -3.955 |
lor | -3.824 |
rol | -3.735 |
bek | -3.581 |
arians | -3.569 |
Token | restaurant |
Token ID | 7072 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.190 |
the | +5.119 |
, | +5.012 |
a | +4.996 |
. | +4.861 |
Neg logit contributions | |
umm | -4.208 |
lor | -3.942 |
rol | -3.820 |
rob | -3.699 |
arians | -3.682 |
Token | his |
Token ID | 465 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.111 |
, | +2.934 |
. | +2.801 |
the | +2.601 |
a | +2.584 |
Neg logit contributions | |
umm | -6.079 |
bek | -6.057 |
rol | -5.991 |
lor | -5.920 |
osity | -5.900 |
Token | mom |
Token ID | 1995 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.258 |
, | +3.056 |
the | +3.044 |
. | +2.881 |
a | +2.823 |
Neg logit contributions | |
umm | -6.105 |
arians | -5.887 |
lor | -5.845 |
rol | -5.784 |
bek | -5.783 |
Token | went |
Token ID | 1816 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.909 |
the | +3.825 |
, | +3.782 |
a | +3.678 |
. | +3.635 |
Neg logit contributions | |
rol | -5.252 |
umm | -5.240 |
lor | -5.125 |
bek | -5.022 |
arians | -4.977 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.412 |
the | +2.292 |
, | +2.273 |
a | +2.139 |
. | +2.089 |
Neg logit contributions | |
rol | -6.739 |
lor | -6.698 |
umm | -6.608 |
bek | -6.495 |
osity | -6.468 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.116 |
, | +1.964 |
. | +1.754 |
the | +1.499 |
a | +1.470 |
Neg logit contributions | |
ocol | -6.772 |
umm | -6.747 |
bek | -6.744 |
lor | -6.743 |
rol | -6.727 |
Token | living |
Token ID | 2877 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.866 |
, | +4.692 |
the | +4.574 |
. | +4.506 |
a | +4.368 |
Neg logit contributions | |
umm | -4.610 |
lor | -4.565 |
bek | -4.351 |
rol | -4.344 |
arians | -4.302 |
Token | room |
Token ID | 2119 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.632 |
, | +3.519 |
the | +3.379 |
. | +3.328 |
a | +3.304 |
Neg logit contributions | |
umm | -5.683 |
lor | -5.638 |
rol | -5.456 |
bek | -5.428 |
arians | -5.304 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +0.708 |
and | +0.656 |
, | +0.533 |
a | +0.515 |
. | +0.280 |
Neg logit contributions | |
umm | -8.283 |
lor | -8.261 |
rol | -8.238 |
bek | -8.015 |
osity | -8.010 |
Token | They |
Token ID | 1119 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.589 |
, | +3.450 |
the | +3.402 |
. | +3.304 |
a | +3.265 |
Neg logit contributions | |
umm | -5.790 |
rol | -5.636 |
lor | -5.587 |
osity | -5.525 |
bek | -5.476 |
Token | unp |
Token ID | 8593 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.524 |
, | +3.391 |
the | +3.327 |
. | +3.269 |
a | +3.198 |
Neg logit contributions | |
rol | -5.668 |
lor | -5.559 |
umm | -5.553 |
bek | -5.528 |
arians | -5.429 |
Token | acked |
Token ID | 6021 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +7.144 |
, | +6.945 |
the | +6.944 |
. | +6.814 |
a | +6.769 |
Neg logit contributions | |
umm | -2.300 |
lor | -2.205 |
rol | -2.129 |
osity | -2.001 |
bek | -1.995 |
Token | b |
Token ID | 275 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.230 |
the | +4.207 |
a | +4.124 |
, | +4.060 |
. | +3.925 |
Neg logit contributions | |
umm | -5.003 |
lor | -4.942 |
rol | -4.863 |
arians | -4.716 |
osity | -4.623 |
Token | ales |
Token ID | 2040 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +8.624 |
the | +8.574 |
, | +8.474 |
a | +8.417 |
. | +8.285 |
Neg logit contributions | |
umm | -0.965 |
rol | -0.893 |
lor | -0.811 |
unn | -0.684 |
ocol | -0.641 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.165 |
the | +3.065 |
a | +2.997 |
, | +2.985 |
. | +2.824 |
Neg logit contributions | |
rol | -5.925 |
umm | -5.881 |
lor | -5.829 |
osity | -5.741 |
vation | -5.638 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.563 |
, | +3.402 |
the | +3.364 |
. | +3.231 |
a | +3.223 |
Neg logit contributions | |
umm | -5.837 |
rol | -5.816 |
lor | -5.801 |
osity | -5.585 |
bek | -5.553 |
Token | Once |
Token ID | 7454 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.872 |
, | +3.692 |
the | +3.679 |
a | +3.535 |
. | +3.513 |
Neg logit contributions | |
lor | -5.430 |
umm | -5.386 |
rol | -5.348 |
rob | -5.185 |
arians | -5.069 |
Token | upon |
Token ID | 2402 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.364 |
the | +4.172 |
, | +4.158 |
a | +4.043 |
. | +4.039 |
Neg logit contributions | |
umm | -4.953 |
lor | -4.891 |
rol | -4.875 |
osity | -4.707 |
bek | -4.687 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.538 |
, | +0.453 |
the | +0.337 |
. | +0.202 |
a | +0.015 |
Neg logit contributions | |
lor | -8.604 |
rol | -8.536 |
umm | -8.514 |
bek | -8.326 |
rob | -8.326 |
Token | time |
Token ID | 640 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.643 |
the | +2.548 |
, | +2.472 |
. | +2.344 |
a | +2.336 |
Neg logit contributions | |
umm | -6.655 |
lor | -6.585 |
rol | -6.523 |
bek | -6.378 |
ides | -6.325 |
Token | there |
Token ID | 612 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.305 |
the | +0.131 |
, | +0.032 |
. | -0.002 |
a | -0.027 |
Neg logit contributions | |
umm | -8.974 |
lor | -8.937 |
rol | -8.916 |
osity | -8.732 |
bek | -8.702 |
Token | was |
Token ID | 373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.749 |
the | +1.495 |
, | +1.474 |
. | +1.421 |
a | +1.416 |
Neg logit contributions | |
umm | -7.505 |
rol | -7.453 |
lor | -7.453 |
rob | -7.208 |
bek | -7.180 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.546 |
, | +0.400 |
the | +0.343 |
. | +0.248 |
a | +0.088 |
Neg logit contributions | |
umm | -8.756 |
rol | -8.666 |
lor | -8.648 |
rob | -8.453 |
bek | -8.445 |
Token | his |
Token ID | 465 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.780 |
, | +3.556 |
. | +3.362 |
the | +3.297 |
a | +3.206 |
Neg logit contributions | |
umm | -5.357 |
lor | -5.310 |
ocol | -5.266 |
rol | -5.222 |
osity | -5.107 |
Token | room |
Token ID | 2119 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.189 |
the | +5.005 |
, | +4.896 |
a | +4.830 |
. | +4.787 |
Neg logit contributions | |
umm | -4.174 |
lor | -3.974 |
bek | -3.847 |
rol | -3.782 |
arians | -3.774 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +1.551 |
and | +1.504 |
, | +1.358 |
a | +1.356 |
. | +1.150 |
Neg logit contributions | |
lor | -7.472 |
umm | -7.430 |
rol | -7.394 |
arians | -7.294 |
osity | -7.193 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
, | +2.598 |
and | +2.561 |
the | +2.503 |
. | +2.488 |
a | +2.396 |
Neg logit contributions | |
rol | -6.304 |
umm | -6.289 |
lor | -6.219 |
osity | -6.138 |
arians | -6.130 |
Token | he |
Token ID | 339 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.977 |
, | +2.850 |
. | +2.776 |
the | +2.653 |
a | +2.559 |
Neg logit contributions | |
umm | -6.076 |
rol | -6.074 |
lor | -6.042 |
bek | -6.007 |
osity | -5.954 |
Token | never |
Token ID | 1239 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.841 |
the | +3.749 |
, | +3.743 |
. | +3.617 |
a | +3.591 |
Neg logit contributions | |
lor | -5.354 |
rol | -5.289 |
umm | -5.246 |
arians | -5.156 |
bek | -5.138 |
Token | had |
Token ID | 550 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.263 |
the | +4.057 |
, | +4.030 |
. | +3.899 |
a | +3.898 |
Neg logit contributions | |
umm | -4.964 |
rol | -4.939 |
lor | -4.889 |
beh | -4.866 |
osity | -4.865 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.930 |
, | +2.696 |
the | +2.452 |
. | +2.451 |
a | +2.201 |
Neg logit contributions | |
lor | -6.288 |
rol | -6.268 |
beh | -6.216 |
umm | -6.155 |
osity | -6.050 |
Token | good |
Token ID | 922 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.864 |
the | +5.797 |
. | +5.568 |
, | +5.566 |
a | +5.488 |
Neg logit contributions | |
umm | -3.394 |
lor | -3.378 |
bek | -3.255 |
osity | -3.193 |
rol | -3.139 |
Token | night |
Token ID | 1755 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +4.839 |
and | +4.829 |
, | +4.652 |
. | +4.544 |
a | +4.543 |
Neg logit contributions | |
umm | -4.469 |
lor | -4.311 |
rol | -4.223 |
ides | -4.130 |
osity | -4.126 |
Token | 's |
Token ID | 338 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.227 |
the | +3.163 |
, | +3.049 |
a | +3.016 |
. | +2.812 |
Neg logit contributions | |
umm | -6.094 |
lor | -5.948 |
rol | -5.817 |
vation | -5.699 |
ides | -5.662 |
Token | day |
Token ID | 1110 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.033 |
, | +2.868 |
the | +2.847 |
. | +2.712 |
a | +2.683 |
Neg logit contributions | |
umm | -6.497 |
lor | -6.405 |
rol | -6.395 |
arians | -6.210 |
osity | -6.207 |
Token | on |
Token ID | 319 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.129 |
, | +2.009 |
the | +1.953 |
. | +1.830 |
a | +1.781 |
Neg logit contributions | |
umm | -7.368 |
lor | -7.233 |
rol | -7.210 |
osity | -7.051 |
arians | -7.039 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.439 |
the | +0.199 |
a | +0.167 |
. | +0.135 |
, | +0.107 |
Neg logit contributions | |
lor | -8.754 |
umm | -8.749 |
rol | -8.546 |
rob | -8.492 |
arians | -8.483 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.936 |
, | +2.735 |
. | +2.664 |
the | +2.520 |
a | +2.456 |
Neg logit contributions | |
umm | -6.205 |
rol | -6.007 |
arians | -5.948 |
osity | -5.943 |
bek | -5.903 |
Token | was |
Token ID | 373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.230 |
the | +3.155 |
, | +3.104 |
. | +3.030 |
a | +3.017 |
Neg logit contributions | |
lor | -5.923 |
umm | -5.817 |
rol | -5.813 |
arians | -5.689 |
osity | -5.666 |
Token | always |
Token ID | 1464 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.608 |
, | +3.413 |
. | +3.260 |
the | +3.250 |
a | +3.046 |
Neg logit contributions | |
lor | -5.683 |
rol | -5.655 |
umm | -5.531 |
beh | -5.472 |
osity | -5.438 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.067 |
, | +3.865 |
the | +3.736 |
. | +3.730 |
a | +3.512 |
Neg logit contributions | |
rol | -5.039 |
beh | -5.004 |
lor | -4.952 |
bek | -4.933 |
umm | -4.874 |
Token | in |
Token ID | 287 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.812 |
the | +1.728 |
, | +1.673 |
a | +1.628 |
. | +1.524 |
Neg logit contributions | |
umm | -7.284 |
rol | -7.183 |
lor | -7.053 |
osity | -7.009 |
arians | -6.914 |
Token | his |
Token ID | 465 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.780 |
, | +3.556 |
. | +3.362 |
the | +3.297 |
a | +3.206 |
Neg logit contributions | |
umm | -5.357 |
lor | -5.310 |
ocol | -5.266 |
rol | -5.222 |
osity | -5.107 |
Token | room |
Token ID | 2119 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.189 |
the | +5.005 |
, | +4.896 |
a | +4.830 |
. | +4.787 |
Neg logit contributions | |
umm | -4.174 |
lor | -3.974 |
bek | -3.847 |
rol | -3.782 |
arians | -3.774 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +1.551 |
and | +1.504 |
, | +1.358 |
a | +1.356 |
. | +1.150 |
Neg logit contributions | |
lor | -7.472 |
umm | -7.430 |
rol | -7.394 |
arians | -7.294 |
osity | -7.193 |
Token | 're |
Token ID | 821 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.620 |
the | +5.423 |
, | +5.403 |
. | +5.331 |
a | +5.160 |
Neg logit contributions | |
lor | -3.703 |
umm | -3.663 |
rol | -3.655 |
osity | -3.535 |
ides | -3.480 |
Token | welcome |
Token ID | 7062 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.308 |
, | +4.008 |
. | +3.943 |
the | +3.908 |
a | +3.755 |
Neg logit contributions | |
umm | -5.126 |
rol | -5.030 |
lor | -4.982 |
osity | -4.849 |
bek | -4.823 |
Token | ! |
Token ID | 0 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.551 |
the | +3.360 |
, | +3.285 |
a | +3.214 |
. | +3.163 |
Neg logit contributions | |
umm | -5.793 |
lor | -5.768 |
rol | -5.642 |
arians | -5.515 |
bek | -5.492 |
Token | I |
Token ID | 314 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.557 |
, | +5.367 |
the | +5.356 |
. | +5.251 |
a | +5.201 |
Neg logit contributions | |
umm | -3.927 |
lor | -3.846 |
rol | -3.777 |
osity | -3.666 |
bek | -3.630 |
Token | 'm |
Token ID | 1101 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.202 |
the | +5.179 |
, | +5.044 |
a | +4.930 |
. | +4.921 |
Neg logit contributions | |
lor | -4.017 |
rol | -4.006 |
umm | -3.941 |
bek | -3.858 |
reetings | -3.820 |
Token | glad |
Token ID | 9675 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.764 |
, | +4.526 |
. | +4.483 |
the | +4.431 |
a | +4.273 |
Neg logit contributions | |
rol | -4.626 |
umm | -4.517 |
lor | -4.493 |
osity | -4.350 |
bek | -4.298 |
Token | I |
Token ID | 314 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.677 |
, | +3.463 |
the | +3.394 |
. | +3.340 |
a | +3.337 |
Neg logit contributions | |
umm | -5.626 |
lor | -5.583 |
rol | -5.408 |
osity | -5.376 |
arians | -5.342 |
Token | could |
Token ID | 714 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.640 |
the | +4.494 |
, | +4.494 |
a | +4.320 |
. | +4.306 |
Neg logit contributions | |
rol | -4.643 |
lor | -4.636 |
umm | -4.530 |
reetings | -4.461 |
bek | -4.458 |
Token | help |
Token ID | 1037 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.480 |
the | +3.377 |
, | +3.265 |
a | +3.179 |
. | +3.095 |
Neg logit contributions | |
lor | -5.708 |
umm | -5.702 |
rol | -5.547 |
arians | -5.546 |
ides | -5.471 |
Token | ." |
Token ID | 526 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.349 |
, | +3.126 |
the | +3.086 |
a | +3.069 |
. | +2.952 |
Neg logit contributions | |
umm | -5.842 |
lor | -5.800 |
arians | -5.722 |
rol | -5.575 |
osity | -5.518 |
Token | |
Token ID | 220 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.312 |
, | +3.186 |
the | +3.168 |
a | +3.059 |
. | +3.027 |
Neg logit contributions | |
lor | -6.059 |
umm | -6.007 |
rol | -5.882 |
osity | -5.718 |
bek | -5.696 |
Token | The |
Token ID | 464 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +6.139 |
, | +6.001 |
the | +5.955 |
. | +5.859 |
a | +5.789 |
Neg logit contributions | |
lor | -3.300 |
umm | -3.221 |
rol | -3.195 |
bek | -3.027 |
arians | -3.010 |
Token | two |
Token ID | 734 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.092 |
, | +4.935 |
the | +4.896 |
. | +4.788 |
a | +4.666 |
Neg logit contributions | |
umm | -4.386 |
lor | -4.158 |
arians | -4.102 |
bek | -4.078 |
rol | -4.037 |
Token | cr |
Token ID | 1067 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.006 |
the | +3.851 |
, | +3.816 |
. | +3.781 |
a | +3.770 |
Neg logit contributions | |
umm | -5.302 |
rol | -5.212 |
lor | -5.130 |
arians | -5.095 |
unn | -4.986 |
Token | anes |
Token ID | 7305 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +8.036 |
the | +7.958 |
, | +7.890 |
. | +7.778 |
a | +7.754 |
Neg logit contributions | |
umm | -1.529 |
rol | -1.493 |
lor | -1.461 |
osity | -1.286 |
ides | -1.185 |
Token | were |
Token ID | 547 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.414 |
the | +4.296 |
a | +4.240 |
, | +4.237 |
. | +4.179 |
Neg logit contributions | |
rol | -4.778 |
lor | -4.712 |
umm | -4.659 |
osity | -4.584 |
arians | -4.543 |
Token | always |
Token ID | 1464 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.432 |
, | +4.192 |
. | +4.166 |
the | +4.083 |
a | +4.009 |
Neg logit contributions | |
rol | -4.886 |
umm | -4.705 |
lor | -4.651 |
osity | -4.556 |
arians | -4.552 |
Token | loyal |
Token ID | 9112 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.987 |
, | +3.745 |
. | +3.686 |
the | +3.649 |
a | +3.501 |
Neg logit contributions | |
rol | -5.196 |
bek | -5.141 |
umm | -5.137 |
osity | -5.031 |
beh | -5.018 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +2.784 |
and | +2.713 |
a | +2.599 |
, | +2.549 |
. | +2.472 |
Neg logit contributions | |
umm | -6.455 |
rol | -6.235 |
lor | -6.214 |
arians | -6.208 |
osity | -6.192 |
Token | each |
Token ID | 1123 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.673 |
, | +5.445 |
. | +5.290 |
the | +5.254 |
a | +5.184 |
Neg logit contributions | |
arians | -3.696 |
lor | -3.654 |
umm | -3.581 |
rol | -3.505 |
osity | -3.476 |
Token | other |
Token ID | 584 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.640 |
, | +2.505 |
the | +2.424 |
a | +2.319 |
. | +2.300 |
Neg logit contributions | |
umm | -6.541 |
lor | -6.495 |
rol | -6.468 |
bek | -6.420 |
arians | -6.354 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.329 |
the | +2.290 |
a | +2.154 |
, | +2.139 |
. | +2.021 |
Neg logit contributions | |
lor | -6.674 |
umm | -6.668 |
rol | -6.635 |
arians | -6.614 |
osity | -6.567 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.089 |
, | +0.887 |
the | +0.840 |
a | +0.822 |
. | +0.675 |
Neg logit contributions | |
umm | -8.171 |
rol | -7.897 |
ocol | -7.767 |
lor | -7.759 |
osity | -7.703 |
Token | neighborhood |
Token ID | 6232 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.275 |
, | +5.128 |
the | +5.123 |
a | +4.985 |
. | +4.969 |
Neg logit contributions | |
umm | -4.155 |
rol | -3.952 |
lor | -3.928 |
bek | -3.794 |
osity | -3.785 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.354 |
the | +2.247 |
, | +2.168 |
a | +2.113 |
. | +1.952 |
Neg logit contributions | |
umm | -6.994 |
rol | -6.825 |
lor | -6.707 |
arians | -6.657 |
osity | -6.640 |
Token | He |
Token ID | 679 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.027 |
, | +3.885 |
the | +3.812 |
. | +3.699 |
a | +3.679 |
Neg logit contributions | |
umm | -5.523 |
rol | -5.367 |
lor | -5.315 |
osity | -5.139 |
bek | -5.074 |
Token | had |
Token ID | 550 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.645 |
, | +3.562 |
the | +3.556 |
. | +3.500 |
a | +3.441 |
Neg logit contributions | |
rol | -5.478 |
umm | -5.432 |
lor | -5.412 |
bek | -5.324 |
arians | -5.315 |
Token | never |
Token ID | 1239 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.780 |
, | +2.700 |
. | +2.506 |
the | +2.429 |
a | +2.176 |
Neg logit contributions | |
rol | -6.477 |
lor | -6.454 |
umm | -6.378 |
bek | -6.218 |
arians | -6.155 |
Token | seen |
Token ID | 1775 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.481 |
, | +5.277 |
the | +5.209 |
. | +5.121 |
a | +5.016 |
Neg logit contributions | |
umm | -3.907 |
rol | -3.763 |
lor | -3.735 |
bek | -3.702 |
osity | -3.680 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.152 |
, | +3.985 |
. | +3.820 |
the | +3.720 |
a | +3.552 |
Neg logit contributions | |
umm | -5.160 |
rol | -5.141 |
lor | -5.034 |
osity | -4.812 |
rob | -4.807 |
Token | world |
Token ID | 995 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.815 |
, | +5.659 |
the | +5.643 |
. | +5.474 |
a | +5.464 |
Neg logit contributions | |
umm | -3.717 |
rol | -3.450 |
lor | -3.371 |
arians | -3.305 |
bek | -3.299 |
Token | from |
Token ID | 422 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.574 |
, | +3.400 |
the | +3.395 |
a | +3.282 |
. | +3.246 |
Neg logit contributions | |
umm | -5.763 |
rol | -5.642 |
lor | -5.636 |
osity | -5.436 |
bek | -5.370 |
Token | so |
Token ID | 523 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.796 |
, | +2.615 |
. | +2.439 |
the | +2.313 |
a | +2.241 |
Neg logit contributions | |
umm | -6.503 |
rol | -6.354 |
ocol | -6.202 |
arians | -6.168 |
lor | -6.159 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.022 |
, | +2.848 |
. | +2.676 |
the | +2.616 |
a | +2.496 |
Neg logit contributions | |
umm | -6.314 |
lor | -6.157 |
rol | -6.025 |
rob | -6.004 |
bek | -5.950 |
Token | farm |
Token ID | 5318 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.881 |
, | +4.707 |
the | +4.681 |
. | +4.508 |
a | +4.463 |
Neg logit contributions | |
umm | -4.734 |
lor | -4.435 |
rol | -4.357 |
bek | -4.258 |
arians | -4.242 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.116 |
the | +2.054 |
a | +1.975 |
, | +1.937 |
. | +1.725 |
Neg logit contributions | |
umm | -7.084 |
lor | -6.997 |
rol | -6.935 |
arians | -6.775 |
osity | -6.669 |
Token | they |
Token ID | 484 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.131 |
, | +3.968 |
. | +3.931 |
a | +3.826 |
the | +3.803 |
Neg logit contributions | |
umm | -5.054 |
osity | -4.986 |
rol | -4.986 |
lor | -4.928 |
bek | -4.884 |
Token | were |
Token ID | 547 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.871 |
, | +3.684 |
the | +3.659 |
a | +3.585 |
. | +3.566 |
Neg logit contributions | |
rol | -5.390 |
umm | -5.365 |
lor | -5.356 |
bek | -5.217 |
osity | -5.202 |
Token | always |
Token ID | 1464 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.992 |
, | +3.783 |
. | +3.665 |
the | +3.645 |
a | +3.556 |
Neg logit contributions | |
rol | -5.340 |
umm | -5.304 |
lor | -5.271 |
osity | -5.049 |
bek | -5.011 |
Token | sure |
Token ID | 1654 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.420 |
, | +4.227 |
. | +4.072 |
the | +4.066 |
a | +3.927 |
Neg logit contributions | |
umm | -4.844 |
rol | -4.811 |
bek | -4.747 |
lor | -4.659 |
beh | -4.614 |
Token | to |
Token ID | 284 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.507 |
, | +2.260 |
. | +2.105 |
the | +2.082 |
a | +2.004 |
Neg logit contributions | |
lor | -6.847 |
umm | -6.826 |
rol | -6.768 |
osity | -6.692 |
bek | -6.616 |
Token | share |
Token ID | 2648 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.319 |
, | +4.075 |
the | +3.929 |
. | +3.906 |
a | +3.836 |
Neg logit contributions | |
umm | -4.957 |
lor | -4.843 |
osity | -4.800 |
bek | -4.769 |
ocol | -4.769 |
Token | some |
Token ID | 617 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.111 |
, | +2.064 |
the | +1.934 |
a | +1.830 |
. | +1.774 |
Neg logit contributions | |
lor | -6.750 |
umm | -6.708 |
rol | -6.611 |
bek | -6.512 |
ocol | -6.496 |
Token | cocoa |
Token ID | 35845 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.891 |
the | +3.843 |
, | +3.759 |
a | +3.697 |
. | +3.546 |
Neg logit contributions | |
umm | -5.494 |
rol | -5.213 |
lor | -5.190 |
ocol | -5.032 |
unn | -4.995 |
Token | play |
Token ID | 711 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.690 |
, | +3.468 |
the | +3.358 |
. | +3.326 |
a | +3.285 |
Neg logit contributions | |
umm | -5.464 |
rol | -5.383 |
lor | -5.365 |
vation | -5.208 |
arians | -5.200 |
Token | in |
Token ID | 287 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.817 |
the | +1.635 |
, | +1.633 |
. | +1.466 |
a | +1.447 |
Neg logit contributions | |
lor | -7.371 |
rol | -7.369 |
umm | -7.367 |
rob | -7.230 |
arians | -7.103 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.660 |
, | +0.524 |
. | +0.303 |
the | +0.292 |
a | +0.263 |
Neg logit contributions | |
lor | -8.317 |
rol | -8.281 |
umm | -8.180 |
rob | -8.122 |
arians | -8.031 |
Token | sandbox |
Token ID | 35204 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.244 |
, | +4.098 |
the | +4.016 |
. | +3.937 |
a | +3.835 |
Neg logit contributions | |
umm | -5.185 |
rol | -5.073 |
lor | -5.045 |
rob | -4.891 |
bek | -4.812 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.139 |
the | +1.060 |
, | +0.959 |
a | +0.883 |
. | +0.746 |
Neg logit contributions | |
umm | -8.077 |
rol | -8.021 |
lor | -8.008 |
arians | -7.748 |
bek | -7.731 |
Token | |
Token ID | 220 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.380 |
the | +2.214 |
, | +2.209 |
. | +2.082 |
a | +2.080 |
Neg logit contributions | |
umm | -6.942 |
lor | -6.877 |
rol | -6.864 |
osity | -6.691 |
bek | -6.616 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.496 |
, | +1.348 |
the | +1.337 |
a | +1.175 |
. | +1.143 |
Neg logit contributions | |
lor | -7.765 |
rol | -7.753 |
umm | -7.711 |
osity | -7.478 |
bek | -7.467 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.404 |
the | +1.236 |
, | +1.229 |
. | +1.087 |
a | +1.082 |
Neg logit contributions | |
lor | -7.883 |
umm | -7.880 |
rol | -7.837 |
bek | -7.635 |
osity | -7.609 |
Token | " |
Token ID | 1 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.854 |
the | +4.704 |
, | +4.685 |
. | +4.550 |
a | +4.528 |
Neg logit contributions | |
umm | -4.562 |
lor | -4.541 |
rol | -4.490 |
bek | -4.337 |
osity | -4.299 |
Token | Mom |
Token ID | 29252 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.554 |
the | +4.374 |
, | +4.373 |
. | +4.238 |
a | +4.216 |
Neg logit contributions | |
umm | -4.893 |
lor | -4.813 |
rol | -4.776 |
bek | -4.610 |
osity | -4.609 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.184 |
the | +3.029 |
, | +2.922 |
a | +2.901 |
. | +2.882 |
Neg logit contributions | |
umm | -6.129 |
lor | -6.013 |
rol | -5.999 |
osity | -5.849 |
bek | -5.845 |
Token | sandbox |
Token ID | 35204 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.766 |
, | +5.587 |
the | +5.545 |
. | +5.458 |
a | +5.374 |
Neg logit contributions | |
umm | -3.664 |
lor | -3.543 |
rol | -3.533 |
rob | -3.342 |
bek | -3.306 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.405 |
the | +3.312 |
, | +3.200 |
a | +3.152 |
. | +3.128 |
Neg logit contributions | |
umm | -5.811 |
rol | -5.746 |
lor | -5.743 |
bek | -5.515 |
rob | -5.494 |
Token | asked |
Token ID | 1965 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.342 |
, | +2.091 |
the | +2.074 |
. | +1.968 |
a | +1.947 |
Neg logit contributions | |
umm | -6.919 |
rol | -6.842 |
lor | -6.825 |
arians | -6.643 |
rob | -6.636 |
Token | Lily |
Token ID | 20037 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.181 |
, | +1.929 |
the | +1.870 |
. | +1.778 |
a | +1.732 |
Neg logit contributions | |
umm | -7.078 |
rol | -7.043 |
lor | -6.977 |
bek | -6.822 |
arians | -6.809 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.671 |
the | +1.540 |
, | +1.479 |
a | +1.381 |
. | +1.288 |
Neg logit contributions | |
umm | -7.541 |
lor | -7.496 |
rol | -7.476 |
osity | -7.322 |
bek | -7.315 |
Token | |
Token ID | 220 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.637 |
the | +3.483 |
, | +3.421 |
a | +3.333 |
. | +3.325 |
Neg logit contributions | |
umm | -5.515 |
lor | -5.502 |
rol | -5.479 |
osity | -5.357 |
bek | -5.286 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.509 |
the | +1.348 |
, | +1.334 |
a | +1.197 |
. | +1.143 |
Neg logit contributions | |
lor | -7.735 |
rol | -7.731 |
umm | -7.695 |
osity | -7.468 |
arians | -7.439 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.505 |
the | +1.325 |
, | +1.296 |
a | +1.197 |
. | +1.178 |
Neg logit contributions | |
lor | -7.762 |
umm | -7.692 |
rol | -7.689 |
bek | -7.488 |
osity | -7.464 |
Token | " |
Token ID | 1 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.023 |
the | +2.877 |
, | +2.819 |
a | +2.728 |
. | +2.722 |
Neg logit contributions | |
lor | -6.310 |
umm | -6.293 |
rol | -6.188 |
bek | -6.128 |
osity | -6.077 |
Token | Sure |
Token ID | 19457 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.685 |
the | +5.505 |
, | +5.492 |
. | +5.362 |
a | +5.360 |
Neg logit contributions | |
umm | -3.731 |
lor | -3.661 |
rol | -3.612 |
osity | -3.455 |
arians | -3.439 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.735 |
the | +0.548 |
, | +0.409 |
a | +0.399 |
. | +0.353 |
Neg logit contributions | |
umm | -8.606 |
lor | -8.530 |
rol | -8.416 |
bek | -8.367 |
arians | -8.288 |
Token | was |
Token ID | 373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.033 |
the | +1.876 |
, | +1.864 |
. | +1.751 |
a | +1.745 |
Neg logit contributions | |
umm | -7.231 |
lor | -7.157 |
rol | -7.153 |
bek | -6.996 |
osity | -6.956 |
Token | white |
Token ID | 2330 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.030 |
, | +2.871 |
the | +2.825 |
. | +2.764 |
a | +2.634 |
Neg logit contributions | |
umm | -6.202 |
rol | -6.187 |
lor | -6.052 |
bek | -5.936 |
osity | -5.919 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.186 |
the | +0.076 |
, | +0.031 |
. | -0.096 |
a | -0.103 |
Neg logit contributions | |
umm | -9.155 |
lor | -9.033 |
rol | -9.015 |
osity | -8.816 |
arians | -8.812 |
Token | wide |
Token ID | 3094 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.651 |
, | +3.451 |
. | +3.365 |
the | +3.239 |
a | +3.178 |
Neg logit contributions | |
umm | -5.628 |
rol | -5.505 |
bek | -5.432 |
lor | -5.361 |
rob | -5.333 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.815 |
the | +0.774 |
, | +0.641 |
a | +0.564 |
. | +0.455 |
Neg logit contributions | |
umm | -8.363 |
rol | -8.176 |
lor | -8.160 |
osity | -8.013 |
arians | -7.964 |
Token | |
Token ID | 220 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.241 |
, | +3.089 |
the | +2.995 |
. | +2.971 |
a | +2.860 |
Neg logit contributions | |
umm | -6.176 |
lor | -6.093 |
rol | -6.045 |
osity | -5.896 |
plets | -5.836 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.601 |
, | +1.468 |
the | +1.422 |
a | +1.255 |
. | +1.225 |
Neg logit contributions | |
lor | -7.690 |
rol | -7.660 |
umm | -7.568 |
osity | -7.381 |
arians | -7.349 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.421 |
, | +1.258 |
the | +1.250 |
. | +1.114 |
a | +1.093 |
Neg logit contributions | |
lor | -7.884 |
umm | -7.859 |
rol | -7.826 |
bek | -7.636 |
osity | -7.606 |
Token | The |
Token ID | 464 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.806 |
, | +4.654 |
the | +4.624 |
. | +4.521 |
a | +4.454 |
Neg logit contributions | |
umm | -4.609 |
lor | -4.589 |
rol | -4.542 |
bek | -4.420 |
osity | -4.372 |
Token | m |
Token ID | 285 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.083 |
, | +3.919 |
the | +3.895 |
. | +3.791 |
a | +3.734 |
Neg logit contributions | |
umm | -5.417 |
lor | -5.171 |
rol | -5.135 |
arians | -5.065 |
bek | -5.033 |
Token | ama |
Token ID | 1689 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +7.101 |
, | +6.924 |
the | +6.904 |
. | +6.786 |
a | +6.746 |
Neg logit contributions | |
umm | -2.291 |
lor | -2.214 |
rol | -2.172 |
bek | -2.024 |
osity | -2.019 |
Token | special |
Token ID | 2041 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.341 |
the | +4.219 |
, | +4.125 |
a | +4.054 |
. | +4.007 |
Neg logit contributions | |
umm | -4.989 |
osity | -4.750 |
rol | -4.749 |
lor | -4.723 |
bek | -4.662 |
Token | place |
Token ID | 1295 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.393 |
the | +4.390 |
, | +4.198 |
a | +4.192 |
. | +4.058 |
Neg logit contributions | |
umm | -4.915 |
lor | -4.634 |
rol | -4.593 |
bek | -4.573 |
osity | -4.536 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.921 |
the | +1.828 |
, | +1.736 |
a | +1.668 |
. | +1.518 |
Neg logit contributions | |
umm | -7.180 |
rol | -7.166 |
lor | -7.142 |
osity | -6.959 |
bek | -6.956 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.142 |
, | +1.974 |
the | +1.942 |
. | +1.824 |
a | +1.805 |
Neg logit contributions | |
umm | -7.292 |
lor | -7.211 |
rol | -7.154 |
osity | -6.978 |
bek | -6.965 |
Token | Once |
Token ID | 7454 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.507 |
, | +3.337 |
the | +3.318 |
a | +3.162 |
. | +3.126 |
Neg logit contributions | |
lor | -5.806 |
umm | -5.749 |
rol | -5.729 |
rob | -5.547 |
arians | -5.432 |
Token | upon |
Token ID | 2402 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.308 |
the | +4.107 |
, | +4.089 |
a | +3.988 |
. | +3.973 |
Neg logit contributions | |
umm | -4.983 |
lor | -4.936 |
rol | -4.922 |
osity | -4.751 |
bek | -4.729 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.547 |
, | +0.456 |
the | +0.327 |
. | +0.204 |
a | +0.016 |
Neg logit contributions | |
lor | -8.623 |
rol | -8.541 |
umm | -8.519 |
rob | -8.345 |
bek | -8.335 |
Token | time |
Token ID | 640 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.643 |
the | +2.531 |
, | +2.475 |
. | +2.331 |
a | +2.323 |
Neg logit contributions | |
umm | -6.667 |
lor | -6.605 |
rol | -6.542 |
bek | -6.403 |
ides | -6.338 |
Token | there |
Token ID | 612 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.323 |
the | +0.153 |
, | +0.017 |
. | +0.009 |
a | -0.004 |
Neg logit contributions | |
umm | -8.901 |
lor | -8.894 |
rol | -8.875 |
osity | -8.689 |
bek | -8.654 |
Token | was |
Token ID | 373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.693 |
the | +1.454 |
, | +1.442 |
. | +1.365 |
a | +1.357 |
Neg logit contributions | |
umm | -7.507 |
rol | -7.493 |
lor | -7.487 |
rob | -7.247 |
bek | -7.216 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.572 |
, | +0.430 |
the | +0.367 |
. | +0.269 |
a | +0.106 |
Neg logit contributions | |
umm | -8.701 |
rol | -8.638 |
lor | -8.602 |
rob | -8.428 |
bek | -8.410 |
Token | new |
Token ID | 649 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.754 |
the | +3.582 |
, | +3.563 |
a | +3.428 |
. | +3.362 |
Neg logit contributions | |
umm | -5.582 |
lor | -5.365 |
osity | -5.280 |
bek | -5.265 |
arians | -5.263 |
Token | lamp |
Token ID | 20450 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.311 |
the | +5.165 |
, | +5.114 |
a | +4.981 |
. | +4.964 |
Neg logit contributions | |
umm | -4.039 |
lor | -3.926 |
rol | -3.866 |
osity | -3.767 |
arians | -3.719 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.674 |
the | +1.653 |
, | +1.528 |
a | +1.481 |
. | +1.267 |
Neg logit contributions | |
umm | -7.475 |
lor | -7.461 |
rol | -7.310 |
arians | -7.243 |
osity | -7.233 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.829 |
the | +1.661 |
, | +1.630 |
. | +1.516 |
a | +1.485 |
Neg logit contributions | |
umm | -7.607 |
lor | -7.517 |
rol | -7.517 |
arians | -7.375 |
bek | -7.348 |
Token | Once |
Token ID | 7454 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.448 |
, | +1.291 |
the | +1.263 |
. | +1.104 |
a | +1.103 |
Neg logit contributions | |
lor | -7.823 |
umm | -7.800 |
rol | -7.735 |
rob | -7.559 |
bek | -7.502 |
Token | upon |
Token ID | 2402 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.281 |
the | +4.098 |
, | +4.094 |
. | +3.965 |
a | +3.949 |
Neg logit contributions | |
umm | -5.075 |
lor | -5.000 |
rol | -4.968 |
osity | -4.802 |
bek | -4.797 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.484 |
, | +0.369 |
the | +0.285 |
. | +0.153 |
a | +0.025 |
Neg logit contributions | |
lor | -8.712 |
umm | -8.673 |
rol | -8.632 |
bek | -8.442 |
rob | -8.440 |
Token | time |
Token ID | 640 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.595 |
the | +2.470 |
, | +2.425 |
. | +2.292 |
a | +2.278 |
Neg logit contributions | |
umm | -6.732 |
lor | -6.661 |
rol | -6.598 |
bek | -6.454 |
osity | -6.405 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.258 |
the | +0.085 |
, | +0.018 |
. | -0.048 |
a | -0.074 |
Neg logit contributions | |
umm | -9.056 |
lor | -9.008 |
rol | -8.967 |
osity | -8.792 |
bek | -8.777 |
Token | there |
Token ID | 612 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.952 |
the | +1.754 |
, | +1.754 |
. | +1.643 |
a | +1.587 |
Neg logit contributions | |
umm | -7.393 |
lor | -7.322 |
rol | -7.303 |
bek | -7.137 |
osity | -7.129 |
Token | was |
Token ID | 373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.533 |
the | +1.322 |
, | +1.295 |
. | +1.232 |
a | +1.205 |
Neg logit contributions | |
umm | -7.714 |
lor | -7.671 |
rol | -7.639 |
bek | -7.407 |
osity | -7.403 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.160 |
the | +2.138 |
, | +2.008 |
a | +2.000 |
. | +1.782 |
Neg logit contributions | |
umm | -6.874 |
rol | -6.856 |
lor | -6.828 |
ides | -6.555 |
osity | -6.517 |
Token | She |
Token ID | 1375 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.200 |
, | +4.047 |
the | +4.030 |
. | +3.898 |
a | +3.813 |
Neg logit contributions | |
umm | -5.314 |
lor | -5.130 |
rol | -5.051 |
osity | -5.033 |
arians | -4.888 |
Token | smiled |
Token ID | 13541 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.101 |
, | +4.082 |
the | +4.028 |
. | +4.008 |
a | +3.886 |
Neg logit contributions | |
lor | -4.978 |
rol | -4.966 |
umm | -4.945 |
bek | -4.858 |
arians | -4.724 |
Token | happily |
Token ID | 18177 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.604 |
the | +1.551 |
, | +1.461 |
. | +1.394 |
a | +1.344 |
Neg logit contributions | |
umm | -7.593 |
lor | -7.454 |
rol | -7.413 |
osity | -7.378 |
bek | -7.187 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
the | +1.542 |
and | +1.536 |
, | +1.371 |
a | +1.350 |
. | +1.250 |
Neg logit contributions | |
umm | -7.673 |
lor | -7.595 |
rol | -7.512 |
bek | -7.439 |
osity | -7.389 |
Token | glad |
Token ID | 9675 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
, | +4.310 |
and | +4.253 |
. | +4.242 |
the | +4.205 |
a | +4.078 |
Neg logit contributions | |
umm | -4.720 |
lor | -4.668 |
rol | -4.667 |
osity | -4.612 |
bek | -4.584 |
Token | that |
Token ID | 326 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.697 |
the | +1.565 |
, | +1.535 |
a | +1.443 |
. | +1.382 |
Neg logit contributions | |
umm | -7.549 |
lor | -7.379 |
osity | -7.307 |
rol | -7.276 |
bek | -7.134 |
Token | she |
Token ID | 673 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.882 |
, | +2.600 |
. | +2.503 |
the | +2.481 |
a | +2.410 |
Neg logit contributions | |
umm | -6.404 |
lor | -6.273 |
rol | -6.134 |
osity | -6.098 |
arians | -6.066 |
Token | had |
Token ID | 550 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.169 |
, | +3.020 |
the | +3.005 |
. | +2.882 |
a | +2.855 |
Neg logit contributions | |
umm | -6.215 |
lor | -6.178 |
rol | -6.110 |
bek | -6.016 |
osity | -5.947 |
Token | found |
Token ID | 1043 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.415 |
, | +4.209 |
the | +4.078 |
. | +4.039 |
a | +3.889 |
Neg logit contributions | |
lor | -4.910 |
umm | -4.792 |
rol | -4.755 |
bek | -4.695 |
beh | -4.604 |
Token | something |
Token ID | 1223 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.997 |
, | +2.857 |
the | +2.636 |
. | +2.634 |
a | +2.472 |
Neg logit contributions | |
rol | -6.189 |
lor | -6.182 |
umm | -6.131 |
ocol | -5.884 |
rob | -5.807 |
Token | she |
Token ID | 673 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.915 |
, | +3.628 |
the | +3.559 |
. | +3.503 |
a | +3.479 |
Neg logit contributions | |
umm | -5.412 |
osity | -5.198 |
rol | -5.142 |
lor | -5.120 |
ocol | -5.101 |
Token | painted |
Token ID | 13055 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.389 |
the | +4.296 |
, | +4.272 |
a | +4.136 |
. | +4.062 |
Neg logit contributions | |
umm | -4.898 |
rol | -4.707 |
lor | -4.704 |
bek | -4.653 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.008 |
, | +2.846 |
the | +2.744 |
. | +2.635 |
a | +2.622 |
Neg logit contributions | |
umm | -6.201 |
rol | -6.095 |
lor | -5.961 |
ocol | -5.817 |
arians | -5.802 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.320 |
the | +2.151 |
, | +2.131 |
. | +2.017 |
a | +1.981 |
Neg logit contributions | |
umm | -7.092 |
lor | -7.022 |
rol | -7.015 |
arians | -6.865 |
bek | -6.854 |
Token | Once |
Token ID | 7454 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.419 |
, | +1.258 |
the | +1.236 |
. | +1.078 |
a | +1.075 |
Neg logit contributions | |
lor | -7.851 |
umm | -7.848 |
rol | -7.776 |
rob | -7.582 |
bek | -7.555 |
Token | upon |
Token ID | 2402 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.172 |
the | +3.993 |
, | +3.993 |
. | +3.859 |
a | +3.838 |
Neg logit contributions | |
umm | -5.193 |
lor | -5.116 |
rol | -5.080 |
bek | -4.914 |
osity | -4.912 |
Token | a |
Token ID | 257 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.482 |
, | +0.360 |
the | +0.283 |
. | +0.151 |
a | +0.033 |
Neg logit contributions | |
lor | -8.728 |
umm | -8.691 |
rol | -8.639 |
bek | -8.456 |
rob | -8.443 |
Token | time |
Token ID | 640 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.574 |
the | +2.431 |
, | +2.401 |
. | +2.265 |
a | +2.254 |
Neg logit contributions | |
umm | -6.780 |
lor | -6.705 |
rol | -6.650 |
bek | -6.500 |
osity | -6.469 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.261 |
the | +0.093 |
, | +0.013 |
. | -0.046 |
a | -0.060 |
Neg logit contributions | |
umm | -9.020 |
lor | -8.975 |
rol | -8.940 |
osity | -8.774 |
bek | -8.749 |
Token | there |
Token ID | 612 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.980 |
, | +1.782 |
the | +1.779 |
. | +1.671 |
a | +1.608 |
Neg logit contributions | |
umm | -7.311 |
lor | -7.243 |
rol | -7.240 |
bek | -7.074 |
osity | -7.062 |
Token | was |
Token ID | 373 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.500 |
the | +1.293 |
, | +1.278 |
. | +1.196 |
a | +1.170 |
Neg logit contributions | |
umm | -7.779 |
lor | -7.727 |
rol | -7.692 |
bek | -7.478 |
rob | -7.468 |
Token | path |
Token ID | 3108 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +5.168 |
the | +5.020 |
, | +5.009 |
a | +4.885 |
. | +4.871 |
Neg logit contributions | |
umm | -4.279 |
lor | -4.167 |
rol | -4.100 |
arians | -3.935 |
osity | -3.927 |
Token | towards |
Token ID | 3371 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.680 |
the | +1.609 |
, | +1.490 |
a | +1.459 |
. | +1.311 |
Neg logit contributions | |
rol | -7.504 |
umm | -7.483 |
lor | -7.370 |
osity | -7.223 |
bek | -7.195 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.987 |
, | +1.757 |
. | +1.585 |
the | +1.568 |
a | +1.470 |
Neg logit contributions | |
umm | -7.251 |
rol | -7.227 |
lor | -7.212 |
arians | -6.954 |
osity | -6.938 |
Token | party |
Token ID | 2151 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.392 |
the | +4.281 |
, | +4.250 |
a | +4.090 |
. | +4.073 |
Neg logit contributions | |
umm | -5.172 |
lor | -4.857 |
rol | -4.837 |
arians | -4.747 |
osity | -4.635 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.079 |
the | +1.035 |
, | +0.883 |
a | +0.881 |
. | +0.587 |
Neg logit contributions | |
umm | -8.216 |
lor | -8.133 |
rol | -8.087 |
arians | -7.907 |
osity | -7.830 |
Token | |
Token ID | 220 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.991 |
, | +3.814 |
the | +3.812 |
. | +3.677 |
a | +3.653 |
Neg logit contributions | |
umm | -5.430 |
lor | -5.352 |
rol | -5.328 |
osity | -5.151 |
bek | -5.140 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.572 |
, | +1.425 |
the | +1.398 |
a | +1.220 |
. | +1.209 |
Neg logit contributions | |
lor | -7.770 |
rol | -7.731 |
umm | -7.653 |
osity | -7.455 |
arians | -7.428 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.391 |
, | +1.219 |
the | +1.217 |
. | +1.080 |
a | +1.061 |
Neg logit contributions | |
umm | -7.938 |
lor | -7.917 |
rol | -7.878 |
bek | -7.686 |
osity | -7.673 |
Token | Along |
Token ID | 24035 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.816 |
the | +4.634 |
, | +4.629 |
. | +4.496 |
a | +4.480 |
Neg logit contributions | |
umm | -4.638 |
lor | -4.509 |
rol | -4.467 |
osity | -4.327 |
bek | -4.310 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.304 |
, | +2.063 |
the | +1.989 |
. | +1.974 |
a | +1.957 |
Neg logit contributions | |
rol | -7.027 |
lor | -6.995 |
umm | -6.922 |
osity | -6.756 |
bek | -6.702 |
Token | way |
Token ID | 835 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.167 |
the | +3.983 |
, | +3.945 |
a | +3.848 |
. | +3.842 |
Neg logit contributions | |
umm | -5.321 |
lor | -5.227 |
rol | -5.152 |
arians | -4.961 |
osity | -4.927 |
Token | friend |
Token ID | 1545 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.865 |
the | +2.672 |
, | +2.648 |
. | +2.555 |
a | +2.522 |
Neg logit contributions | |
umm | -6.411 |
lor | -6.243 |
arians | -6.204 |
bek | -6.167 |
rol | -6.136 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.594 |
the | +1.406 |
. | +1.327 |
a | +1.311 |
, | +1.278 |
Neg logit contributions | |
rol | -7.437 |
umm | -7.383 |
lor | -7.345 |
osity | -7.314 |
arians | -7.200 |
Token | Tim |
Token ID | 5045 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.151 |
, | +3.003 |
. | +2.861 |
the | +2.840 |
a | +2.653 |
Neg logit contributions | |
rol | -5.884 |
lor | -5.823 |
osity | -5.766 |
umm | -5.734 |
bek | -5.702 |
Token | my |
Token ID | 1820 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.852 |
the | +3.691 |
, | +3.654 |
a | +3.586 |
. | +3.520 |
Neg logit contributions | |
umm | -5.366 |
lor | -5.305 |
rol | -5.296 |
osity | -5.219 |
bek | -5.164 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.726 |
the | +0.573 |
, | +0.510 |
a | +0.475 |
. | +0.376 |
Neg logit contributions | |
umm | -8.450 |
lor | -8.410 |
rol | -8.327 |
osity | -8.314 |
bek | -8.237 |
Token | |
Token ID | 220 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.412 |
the | +2.229 |
, | +2.193 |
a | +2.120 |
. | +2.076 |
Neg logit contributions | |
umm | -6.924 |
rol | -6.826 |
lor | -6.750 |
osity | -6.654 |
bek | -6.567 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.507 |
, | +1.357 |
the | +1.337 |
a | +1.175 |
. | +1.144 |
Neg logit contributions | |
lor | -7.783 |
rol | -7.779 |
umm | -7.758 |
osity | -7.525 |
bek | -7.481 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.425 |
the | +1.257 |
, | +1.254 |
a | +1.115 |
. | +1.106 |
Neg logit contributions | |
lor | -7.842 |
umm | -7.841 |
rol | -7.811 |
bek | -7.596 |
rob | -7.593 |
Token | Tim |
Token ID | 14967 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.778 |
the | +3.621 |
, | +3.607 |
a | +3.477 |
. | +3.473 |
Neg logit contributions | |
umm | -5.627 |
lor | -5.526 |
rol | -5.519 |
bek | -5.377 |
osity | -5.337 |
Token | my |
Token ID | 1820 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.880 |
the | +3.756 |
, | +3.727 |
a | +3.625 |
. | +3.604 |
Neg logit contributions | |
umm | -5.369 |
lor | -5.317 |
rol | -5.306 |
bek | -5.183 |
osity | -5.165 |
Token | said |
Token ID | 531 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.097 |
the | +2.965 |
, | +2.928 |
. | +2.826 |
a | +2.824 |
Neg logit contributions | |
umm | -6.142 |
lor | -6.091 |
rol | -6.041 |
osity | -5.929 |
bek | -5.925 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.491 |
the | +2.342 |
, | +2.285 |
a | +2.166 |
. | +2.103 |
Neg logit contributions | |
rol | -6.677 |
lor | -6.641 |
umm | -6.604 |
rob | -6.466 |
arians | -6.452 |
Token | She |
Token ID | 1375 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.616 |
the | +3.440 |
, | +3.436 |
a | +3.297 |
. | +3.297 |
Neg logit contributions | |
umm | -5.781 |
lor | -5.641 |
rol | -5.603 |
osity | -5.501 |
bek | -5.423 |
Token | looked |
Token ID | 3114 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +3.568 |
, | +3.412 |
the | +3.394 |
. | +3.273 |
a | +3.232 |
Neg logit contributions | |
umm | -5.744 |
lor | -5.729 |
rol | -5.684 |
bek | -5.536 |
arians | -5.504 |
Token | out |
Token ID | 503 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.809 |
the | +2.624 |
, | +2.624 |
. | +2.473 |
a | +2.458 |
Neg logit contributions | |
umm | -6.664 |
lor | -6.599 |
rol | -6.522 |
bek | -6.369 |
osity | -6.363 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.582 |
, | +1.413 |
the | +1.380 |
. | +1.288 |
a | +1.253 |
Neg logit contributions | |
umm | -7.750 |
rol | -7.669 |
lor | -7.650 |
osity | -7.495 |
bek | -7.476 |
Token | window |
Token ID | 4324 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.469 |
, | +4.316 |
the | +4.310 |
. | +4.188 |
a | +4.160 |
Neg logit contributions | |
umm | -4.967 |
lor | -4.863 |
rol | -4.830 |
osity | -4.673 |
bek | -4.656 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +0.714 |
the | +0.709 |
, | +0.580 |
a | +0.557 |
. | +0.517 |
Neg logit contributions | |
umm | -8.424 |
rol | -8.272 |
lor | -8.232 |
osity | -8.146 |
bek | -8.032 |
Token | saw |
Token ID | 2497 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +2.813 |
, | +2.616 |
. | +2.552 |
the | +2.541 |
a | +2.452 |
Neg logit contributions | |
umm | -6.390 |
rol | -6.379 |
lor | -6.312 |
bek | -6.250 |
osity | -6.249 |
Token | cherry |
Token ID | 23612 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.554 |
, | +1.391 |
. | +1.268 |
the | +1.150 |
a | +0.930 |
Neg logit contributions | |
rol | -7.690 |
umm | -7.633 |
lor | -7.612 |
rob | -7.439 |
osity | -7.434 |
Token | trees |
Token ID | 7150 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +4.317 |
the | +4.172 |
, | +4.142 |
a | +4.066 |
. | +4.001 |
Neg logit contributions | |
umm | -5.042 |
lor | -4.879 |
rol | -4.876 |
rob | -4.714 |
arians | -4.695 |
Token | growing |
Token ID | 3957 |
Feature activation | -4.23e+02 |
Pos logit contributions | |
and | +1.195 |
the | +1.094 |
, | +1.021 |
a | +0.979 |
. | +0.889 |
Neg logit contributions | |
umm | -8.013 |
rol | -7.939 |
lor | -7.910 |
osity | -7.741 |
arians | -7.706 |