Token | happy |
Token ID | 3772 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.788 |
, | +3.676 |
. | +3.611 |
the | +3.403 |
a | +3.303 |
Neg logit contributions | |
umm | -5.641 |
rol | -5.450 |
lor | -5.416 |
rim | -5.400 |
ubb | -5.391 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.378 |
, | +1.326 |
. | +1.241 |
the | +1.148 |
a | +1.054 |
Neg logit contributions | |
umm | -7.810 |
lor | -7.549 |
rol | -7.538 |
osity | -7.514 |
rim | -7.492 |
Token | loved |
Token ID | 6151 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.806 |
, | +3.710 |
. | +3.634 |
the | +3.429 |
a | +3.335 |
Neg logit contributions | |
umm | -5.611 |
lor | -5.414 |
rol | -5.401 |
vation | -5.330 |
rim | -5.308 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.446 |
, | +2.376 |
. | +2.244 |
the | +2.021 |
a | +1.952 |
Neg logit contributions | |
umm | -6.923 |
rol | -6.723 |
lor | -6.715 |
rim | -6.659 |
osity | -6.644 |
Token | fly |
Token ID | 6129 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.960 |
, | +3.842 |
. | +3.762 |
the | +3.574 |
a | +3.476 |
Neg logit contributions | |
umm | -5.401 |
lor | -5.237 |
rol | -5.179 |
vation | -5.173 |
rim | -5.165 |
Token | high |
Token ID | 1029 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.489 |
, | +2.438 |
. | +2.299 |
the | +2.162 |
a | +2.053 |
Neg logit contributions | |
umm | -6.653 |
rol | -6.620 |
lor | -6.555 |
rim | -6.445 |
ubb | -6.393 |
Token | up |
Token ID | 510 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.793 |
, | +1.737 |
. | +1.613 |
the | +1.514 |
a | +1.396 |
Neg logit contributions | |
umm | -7.455 |
rol | -7.273 |
lor | -7.270 |
arians | -7.129 |
rim | -7.122 |
Token | in |
Token ID | 287 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.189 |
, | +2.128 |
. | +2.021 |
the | +1.840 |
a | +1.767 |
Neg logit contributions | |
umm | -7.001 |
rol | -6.881 |
lor | -6.765 |
ubb | -6.741 |
rim | -6.715 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.385 |
, | +1.295 |
. | +1.152 |
the | +0.775 |
a | +0.757 |
Neg logit contributions | |
umm | -7.951 |
lor | -7.722 |
rol | -7.694 |
ubb | -7.685 |
ocol | -7.640 |
Token | sky |
Token ID | 6766 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.544 |
, | +4.459 |
. | +4.373 |
the | +4.157 |
a | +4.064 |
Neg logit contributions | |
umm | -4.900 |
lor | -4.715 |
rol | -4.660 |
vation | -4.605 |
ubb | -4.560 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.534 |
, | +0.478 |
the | +0.297 |
. | +0.283 |
a | +0.182 |
Neg logit contributions | |
umm | -8.622 |
lor | -8.483 |
rol | -8.456 |
rim | -8.312 |
vation | -8.272 |
Token | saw |
Token ID | 2497 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.086 |
. | +3.050 |
, | +3.042 |
the | +2.847 |
a | +2.753 |
Neg logit contributions | |
umm | -6.020 |
lor | -5.936 |
arians | -5.867 |
rol | -5.844 |
vation | -5.820 |
Token | that |
Token ID | 326 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.528 |
, | +2.391 |
. | +2.366 |
the | +1.959 |
a | +1.864 |
Neg logit contributions | |
umm | -6.726 |
rol | -6.603 |
lor | -6.529 |
rim | -6.495 |
osity | -6.490 |
Token | Tim |
Token ID | 5045 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.798 |
, | +2.651 |
. | +2.639 |
the | +2.274 |
a | +2.234 |
Neg logit contributions | |
umm | -6.504 |
rol | -6.325 |
lor | -6.228 |
ubb | -6.223 |
osity | -6.217 |
Token | my |
Token ID | 1820 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.826 |
, | +3.747 |
. | +3.681 |
the | +3.506 |
a | +3.418 |
Neg logit contributions | |
umm | -5.403 |
rol | -5.267 |
lor | -5.245 |
rim | -5.198 |
osity | -5.188 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.621 |
, | +2.539 |
. | +2.488 |
the | +2.343 |
a | +2.229 |
Neg logit contributions | |
umm | -6.435 |
lor | -6.343 |
vation | -6.291 |
arians | -6.288 |
osity | -6.244 |
Token | struggling |
Token ID | 9648 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.868 |
, | +3.763 |
. | +3.696 |
the | +3.457 |
a | +3.290 |
Neg logit contributions | |
umm | -5.429 |
rol | -5.283 |
ubb | -5.255 |
lor | -5.242 |
rim | -5.201 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.015 |
, | +0.996 |
. | +0.891 |
the | +0.816 |
a | +0.650 |
Neg logit contributions | |
umm | -7.962 |
rol | -7.823 |
lor | -7.760 |
rim | -7.729 |
osity | -7.698 |
Token | offered |
Token ID | 4438 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.507 |
, | +3.400 |
. | +3.357 |
the | +3.060 |
a | +3.026 |
Neg logit contributions | |
umm | -5.643 |
rol | -5.586 |
osity | -5.518 |
lor | -5.489 |
rim | -5.481 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.692 |
, | +1.595 |
. | +1.492 |
the | +1.161 |
a | +1.111 |
Neg logit contributions | |
umm | -7.454 |
rol | -7.350 |
osity | -7.178 |
ocol | -7.161 |
lor | -7.144 |
Token | help |
Token ID | 1037 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.926 |
, | +3.835 |
. | +3.756 |
the | +3.455 |
a | +3.377 |
Neg logit contributions | |
umm | -5.411 |
rol | -5.249 |
lor | -5.228 |
rim | -5.219 |
vation | -5.179 |
Token | him |
Token ID | 683 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.173 |
, | +2.021 |
. | +1.778 |
the | +1.702 |
a | +1.687 |
Neg logit contributions | |
umm | -6.995 |
rim | -6.840 |
rol | -6.836 |
beh | -6.778 |
ocol | -6.771 |
Token | " |
Token ID | 366 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.478 |
, | +2.428 |
. | +2.366 |
the | +2.162 |
a | +2.053 |
Neg logit contributions | |
umm | -6.613 |
osity | -6.478 |
rol | -6.458 |
lor | -6.452 |
arians | -6.410 |
Token | Okay |
Token ID | 16454 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.672 |
, | +5.620 |
. | +5.507 |
the | +5.305 |
a | +5.201 |
Neg logit contributions | |
umm | -3.849 |
lor | -3.642 |
rol | -3.633 |
vation | -3.568 |
rim | -3.521 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.911 |
. | +0.685 |
, | +0.677 |
the | +0.495 |
a | +0.437 |
Neg logit contributions | |
umm | -8.453 |
lor | -8.194 |
arians | -8.150 |
vation | -8.119 |
rol | -8.118 |
Token | but |
Token ID | 475 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.495 |
, | +3.413 |
. | +3.390 |
the | +3.085 |
a | +3.029 |
Neg logit contributions | |
umm | -5.874 |
lor | -5.588 |
rol | -5.577 |
osity | -5.557 |
ubb | -5.542 |
Token | be |
Token ID | 307 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.214 |
, | +3.073 |
. | +3.072 |
the | +2.761 |
a | +2.722 |
Neg logit contributions | |
umm | -6.156 |
lor | -5.881 |
osity | -5.872 |
ubb | -5.861 |
arians | -5.842 |
Token | careful |
Token ID | 8161 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.695 |
, | +4.618 |
. | +4.526 |
the | +4.274 |
a | +4.145 |
Neg logit contributions | |
umm | -4.535 |
rol | -4.471 |
rim | -4.415 |
lor | -4.398 |
ubb | -4.358 |
Token | not |
Token ID | 407 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.488 |
, | +2.381 |
. | +2.272 |
the | +2.154 |
a | +2.068 |
Neg logit contributions | |
umm | -6.812 |
lor | -6.627 |
rol | -6.625 |
rim | -6.568 |
vation | -6.559 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.071 |
, | +1.954 |
. | +1.838 |
the | +1.677 |
a | +1.600 |
Neg logit contributions | |
umm | -7.239 |
rol | -7.068 |
osity | -7.040 |
lor | -7.013 |
rim | -6.988 |
Token | hurt |
Token ID | 5938 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.326 |
, | +4.186 |
. | +4.068 |
the | +3.913 |
a | +3.858 |
Neg logit contributions | |
umm | -4.992 |
rol | -4.804 |
rim | -4.792 |
lor | -4.757 |
ubb | -4.739 |
Token | me |
Token ID | 502 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.445 |
, | +4.300 |
. | +4.166 |
a | +3.891 |
the | +3.890 |
Neg logit contributions | |
umm | -4.758 |
ubb | -4.633 |
rol | -4.626 |
lor | -4.624 |
arians | -4.612 |
Token | ." |
Token ID | 526 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.612 |
, | +2.518 |
. | +2.348 |
the | +2.324 |
a | +2.244 |
Neg logit contributions | |
umm | -6.550 |
lor | -6.457 |
rol | -6.447 |
rim | -6.379 |
vation | -6.325 |
Token | big |
Token ID | 1263 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.538 |
, | +4.441 |
. | +4.389 |
the | +4.218 |
a | +4.054 |
Neg logit contributions | |
umm | -4.831 |
lor | -4.604 |
rol | -4.562 |
vation | -4.535 |
ubb | -4.512 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.770 |
, | +4.637 |
. | +4.630 |
the | +4.462 |
a | +4.371 |
Neg logit contributions | |
umm | -4.584 |
lor | -4.270 |
rol | -4.256 |
ocol | -4.238 |
ubb | -4.228 |
Token | mean |
Token ID | 1612 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.627 |
, | +3.600 |
. | +3.516 |
the | +3.286 |
a | +3.141 |
Neg logit contributions | |
umm | -5.667 |
rol | -5.440 |
lor | -5.359 |
rim | -5.357 |
vation | -5.350 |
Token | dog |
Token ID | 3290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.673 |
, | +4.564 |
. | +4.486 |
the | +4.367 |
a | +4.236 |
Neg logit contributions | |
umm | -4.699 |
lor | -4.475 |
rol | -4.454 |
rim | -4.412 |
ubb | -4.378 |
Token | who |
Token ID | 508 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.195 |
, | +2.095 |
. | +1.965 |
the | +1.893 |
a | +1.799 |
Neg logit contributions | |
umm | -7.001 |
rol | -6.939 |
lor | -6.914 |
rim | -6.827 |
arians | -6.806 |
Token | didn |
Token ID | 1422 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.605 |
, | +4.524 |
. | +4.434 |
the | +4.240 |
a | +4.145 |
Neg logit contributions | |
umm | -4.787 |
rol | -4.596 |
lor | -4.596 |
vation | -4.513 |
rim | -4.497 |
Token | 't |
Token ID | 470 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.578 |
, | +4.490 |
. | +4.388 |
the | +4.197 |
a | +4.091 |
Neg logit contributions | |
umm | -4.810 |
lor | -4.641 |
rol | -4.636 |
vation | -4.566 |
rim | -4.527 |
Token | like |
Token ID | 588 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.310 |
, | +4.218 |
. | +4.103 |
the | +3.929 |
a | +3.833 |
Neg logit contributions | |
umm | -5.091 |
rol | -4.933 |
lor | -4.891 |
rim | -4.877 |
vation | -4.866 |
Token | Tim |
Token ID | 5045 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.605 |
, | +3.514 |
. | +3.393 |
the | +3.142 |
a | +3.099 |
Neg logit contributions | |
umm | -5.748 |
lor | -5.525 |
rol | -5.518 |
ubb | -5.475 |
rim | -5.469 |
Token | my |
Token ID | 1820 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.507 |
, | +3.436 |
. | +3.275 |
the | +3.211 |
a | +3.125 |
Neg logit contributions | |
umm | -5.698 |
rol | -5.632 |
lor | -5.550 |
rim | -5.518 |
vation | -5.469 |
Token | or |
Token ID | 393 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.519 |
, | +2.433 |
. | +2.271 |
the | +2.217 |
a | +2.128 |
Neg logit contributions | |
umm | -6.660 |
rol | -6.548 |
lor | -6.508 |
vation | -6.445 |
rim | -6.442 |
Token | save |
Token ID | 3613 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.055 |
, | +3.964 |
. | +3.793 |
the | +3.718 |
a | +3.596 |
Neg logit contributions | |
umm | -5.194 |
vation | -5.080 |
lor | -5.004 |
arians | -4.964 |
rol | -4.961 |
Token | them |
Token ID | 606 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.464 |
, | +3.343 |
. | +3.189 |
the | +2.905 |
a | +2.871 |
Neg logit contributions | |
umm | -5.758 |
rol | -5.651 |
ocol | -5.640 |
arians | -5.637 |
ubb | -5.575 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.560 |
, | +1.456 |
. | +1.285 |
the | +1.256 |
a | +1.166 |
Neg logit contributions | |
umm | -7.571 |
rol | -7.486 |
lor | -7.437 |
vation | -7.371 |
arians | -7.358 |
Token | She |
Token ID | 1375 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.537 |
, | +3.435 |
. | +3.330 |
the | +3.154 |
a | +3.036 |
Neg logit contributions | |
umm | -5.868 |
lor | -5.703 |
rol | -5.658 |
arians | -5.582 |
osity | -5.568 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.456 |
, | +3.403 |
. | +3.303 |
the | +3.122 |
a | +3.012 |
Neg logit contributions | |
umm | -5.865 |
rol | -5.719 |
lor | -5.716 |
vation | -5.618 |
arians | -5.610 |
Token | scared |
Token ID | 12008 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.996 |
, | +3.927 |
. | +3.818 |
the | +3.571 |
a | +3.452 |
Neg logit contributions | |
umm | -5.343 |
rol | -5.232 |
lor | -5.149 |
ubb | -5.138 |
rim | -5.108 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.132 |
, | +1.073 |
. | +0.914 |
the | +0.888 |
a | +0.847 |
Neg logit contributions | |
umm | -7.965 |
rol | -7.784 |
ubb | -7.666 |
rim | -7.645 |
osity | -7.628 |
Token | sad |
Token ID | 6507 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.457 |
, | +4.352 |
. | +4.244 |
the | +4.000 |
a | +3.919 |
Neg logit contributions | |
umm | -4.831 |
rol | -4.761 |
ubb | -4.687 |
osity | -4.653 |
lor | -4.635 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.573 |
, | +0.482 |
the | +0.344 |
. | +0.275 |
a | +0.238 |
Neg logit contributions | |
umm | -8.588 |
rol | -8.328 |
lor | -8.295 |
arians | -8.276 |
osity | -8.243 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.235 |
, | +3.112 |
. | +3.010 |
the | +2.825 |
a | +2.707 |
Neg logit contributions | |
umm | -6.149 |
lor | -5.984 |
rol | -5.937 |
osity | -5.881 |
arians | -5.845 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.698 |
. | +1.529 |
the | +1.356 |
a | +1.255 |
Neg logit contributions | |
lor | -7.425 |
umm | -7.327 |
rol | -7.319 |
rim | -7.295 |
reetings | -7.266 |
Token | anything |
Token ID | 1997 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.646 |
, | +4.489 |
. | +4.416 |
the | +4.223 |
a | +4.120 |
Neg logit contributions | |
umm | -4.725 |
lor | -4.604 |
rol | -4.525 |
vation | -4.491 |
ubb | -4.484 |
Token | either |
Token ID | 2035 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.225 |
, | +2.130 |
. | +2.005 |
the | +1.902 |
a | +1.829 |
Neg logit contributions | |
umm | -6.998 |
lor | -6.845 |
rol | -6.830 |
vation | -6.777 |
rim | -6.759 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.075 |
, | +0.962 |
. | +0.841 |
the | +0.802 |
a | +0.727 |
Neg logit contributions | |
umm | -8.105 |
lor | -7.950 |
rol | -7.921 |
rim | -7.860 |
vation | -7.860 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.415 |
, | +3.341 |
. | +3.212 |
the | +3.011 |
a | +2.908 |
Neg logit contributions | |
umm | -5.953 |
lor | -5.830 |
rol | -5.779 |
osity | -5.673 |
vation | -5.661 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.420 |
, | +3.376 |
. | +3.309 |
the | +3.130 |
a | +3.028 |
Neg logit contributions | |
umm | -5.819 |
lor | -5.686 |
rol | -5.662 |
vation | -5.605 |
rim | -5.576 |
Token | scared |
Token ID | 12008 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.176 |
, | +4.105 |
. | +4.002 |
the | +3.785 |
a | +3.653 |
Neg logit contributions | |
umm | -5.148 |
rol | -5.021 |
lor | -4.973 |
ubb | -4.938 |
rim | -4.923 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.574 |
, | +0.502 |
. | +0.371 |
the | +0.359 |
a | +0.325 |
Neg logit contributions | |
umm | -8.536 |
rol | -8.270 |
ubb | -8.238 |
rim | -8.231 |
ocol | -8.173 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.514 |
, | +3.428 |
. | +3.300 |
the | +3.111 |
a | +3.006 |
Neg logit contributions | |
umm | -5.911 |
lor | -5.709 |
rol | -5.687 |
vation | -5.584 |
osity | -5.580 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.565 |
, | +1.480 |
. | +1.336 |
the | +1.149 |
a | +1.070 |
Neg logit contributions | |
umm | -7.691 |
lor | -7.668 |
rol | -7.610 |
rim | -7.544 |
vation | -7.513 |
Token | Tom |
Token ID | 13787 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.079 |
, | +3.987 |
. | +3.889 |
the | +3.700 |
a | +3.602 |
Neg logit contributions | |
umm | -5.360 |
lor | -5.233 |
rol | -5.184 |
vation | -5.140 |
rim | -5.113 |
Token | went |
Token ID | 1816 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.365 |
, | +3.321 |
. | +3.268 |
the | +3.091 |
a | +2.989 |
Neg logit contributions | |
umm | -5.841 |
lor | -5.741 |
rol | -5.713 |
vation | -5.648 |
rim | -5.618 |
Token | animals |
Token ID | 4695 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.565 |
, | +4.505 |
. | +4.411 |
the | +4.196 |
a | +4.095 |
Neg logit contributions | |
umm | -4.866 |
rol | -4.612 |
rim | -4.577 |
ubb | -4.568 |
lor | -4.566 |
Token | in |
Token ID | 287 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.414 |
, | +3.332 |
. | +3.265 |
the | +3.096 |
a | +3.047 |
Neg logit contributions | |
umm | -5.799 |
rol | -5.726 |
lor | -5.646 |
vation | -5.600 |
rim | -5.600 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.388 |
, | +2.284 |
. | +2.217 |
the | +1.903 |
a | +1.864 |
Neg logit contributions | |
umm | -6.874 |
rol | -6.708 |
lor | -6.683 |
ubb | -6.680 |
ocol | -6.637 |
Token | jungle |
Token ID | 20712 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.976 |
, | +5.873 |
. | +5.784 |
the | +5.576 |
a | +5.483 |
Neg logit contributions | |
umm | -3.524 |
rol | -3.251 |
lor | -3.251 |
vation | -3.212 |
rim | -3.177 |
Token | were |
Token ID | 547 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.262 |
, | +3.158 |
. | +3.073 |
the | +2.971 |
a | +2.880 |
Neg logit contributions | |
umm | -5.973 |
rol | -5.870 |
lor | -5.807 |
vation | -5.756 |
rim | -5.712 |
Token | afraid |
Token ID | 7787 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.097 |
, | +3.993 |
. | +3.912 |
the | +3.685 |
a | +3.600 |
Neg logit contributions | |
umm | -5.250 |
rol | -5.133 |
lor | -5.054 |
rim | -5.013 |
ubb | -5.001 |
Token | of |
Token ID | 286 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.131 |
, | +2.041 |
. | +1.941 |
the | +1.824 |
a | +1.767 |
Neg logit contributions | |
umm | -7.107 |
rol | -6.901 |
lor | -6.786 |
osity | -6.779 |
ubb | -6.774 |
Token | him |
Token ID | 683 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.198 |
, | +4.090 |
. | +3.978 |
the | +3.694 |
a | +3.650 |
Neg logit contributions | |
umm | -5.095 |
rol | -4.898 |
lor | -4.866 |
ubb | -4.863 |
ocol | -4.829 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.560 |
, | +1.454 |
. | +1.335 |
the | +1.316 |
a | +1.218 |
Neg logit contributions | |
umm | -7.538 |
lor | -7.438 |
rol | -7.421 |
osity | -7.335 |
vation | -7.328 |
Token | One |
Token ID | 1881 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.889 |
, | +3.815 |
. | +3.693 |
the | +3.506 |
a | +3.409 |
Neg logit contributions | |
umm | -5.514 |
rol | -5.364 |
lor | -5.348 |
arians | -5.236 |
osity | -5.194 |
Token | day |
Token ID | 1110 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.355 |
, | +3.250 |
. | +3.193 |
the | +2.969 |
a | +2.876 |
Neg logit contributions | |
umm | -6.005 |
rol | -5.789 |
lor | -5.754 |
rim | -5.736 |
ubb | -5.711 |
Token | roared |
Token ID | 45615 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.864 |
, | +3.810 |
. | +3.779 |
the | +3.582 |
a | +3.504 |
Neg logit contributions | |
umm | -5.332 |
lor | -5.234 |
rol | -5.157 |
vation | -5.135 |
arians | -5.123 |
Token | again |
Token ID | 757 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.054 |
, | +2.998 |
. | +2.971 |
the | +2.794 |
a | +2.647 |
Neg logit contributions | |
umm | -5.946 |
rol | -5.879 |
lor | -5.786 |
ubb | -5.766 |
osity | -5.753 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.923 |
, | +0.833 |
. | +0.808 |
the | +0.698 |
a | +0.654 |
Neg logit contributions | |
umm | -8.057 |
lor | -7.897 |
osity | -7.896 |
ubb | -7.887 |
former | -7.857 |
Token | this |
Token ID | 428 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
, | +3.267 |
and | +3.254 |
. | +3.224 |
the | +2.931 |
a | +2.914 |
Neg logit contributions | |
umm | -5.853 |
rol | -5.743 |
osity | -5.667 |
ubb | -5.646 |
lor | -5.644 |
Token | time |
Token ID | 640 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.198 |
, | +3.125 |
. | +3.037 |
the | +2.876 |
a | +2.772 |
Neg logit contributions | |
umm | -6.169 |
lor | -5.984 |
vation | -5.927 |
rol | -5.921 |
rim | -5.910 |
Token | louder |
Token ID | 27089 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.078 |
, | +1.937 |
. | +1.905 |
the | +1.656 |
a | +1.596 |
Neg logit contributions | |
umm | -7.109 |
rol | -6.960 |
lor | -6.929 |
ubb | -6.892 |
osity | -6.882 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.482 |
, | +2.385 |
. | +2.324 |
the | +2.194 |
a | +2.141 |
Neg logit contributions | |
umm | -6.749 |
lor | -6.515 |
ubb | -6.502 |
rim | -6.476 |
vation | -6.464 |
Token | more |
Token ID | 517 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.341 |
, | +4.220 |
. | +4.176 |
the | +3.821 |
a | +3.785 |
Neg logit contributions | |
umm | -5.061 |
rol | -4.850 |
ubb | -4.835 |
lor | -4.801 |
vation | -4.800 |
Token | fiercely |
Token ID | 33285 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.258 |
, | +5.170 |
. | +5.046 |
the | +4.875 |
a | +4.805 |
Neg logit contributions | |
umm | -4.141 |
ubb | -3.900 |
ocol | -3.852 |
rol | -3.843 |
rim | -3.829 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.732 |
, | +4.616 |
. | +4.520 |
the | +4.359 |
a | +4.306 |
Neg logit contributions | |
umm | -4.581 |
ubb | -4.346 |
rol | -4.333 |
lor | -4.328 |
vation | -4.323 |
Token | He |
Token ID | 679 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.280 |
, | +4.225 |
. | +4.105 |
the | +3.892 |
a | +3.772 |
Neg logit contributions | |
umm | -5.233 |
rol | -4.981 |
lor | -4.961 |
osity | -4.885 |
arians | -4.863 |
Token | Eventually |
Token ID | 28724 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.006 |
, | +3.980 |
. | +3.865 |
the | +3.655 |
a | +3.528 |
Neg logit contributions | |
lor | -5.353 |
umm | -5.269 |
rol | -5.262 |
rim | -5.196 |
vation | -5.172 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.433 |
. | +1.244 |
, | +1.164 |
the | +0.931 |
a | +0.890 |
Neg logit contributions | |
umm | -7.897 |
lor | -7.675 |
ubb | -7.630 |
ocol | -7.616 |
rol | -7.614 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.702 |
. | +3.603 |
, | +3.597 |
the | +3.176 |
a | +3.153 |
Neg logit contributions | |
umm | -5.653 |
vation | -5.349 |
lor | -5.336 |
ubb | -5.317 |
osity | -5.284 |
Token | snake |
Token ID | 17522 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.455 |
, | +5.368 |
. | +5.271 |
the | +5.090 |
a | +4.952 |
Neg logit contributions | |
umm | -4.077 |
lor | -3.779 |
rol | -3.776 |
vation | -3.754 |
ubb | -3.738 |
Token | went |
Token ID | 1816 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.497 |
, | +4.412 |
. | +4.347 |
the | +4.170 |
a | +4.085 |
Neg logit contributions | |
umm | -4.814 |
lor | -4.670 |
rol | -4.661 |
vation | -4.577 |
rim | -4.553 |
Token | far |
Token ID | 1290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.224 |
, | +3.128 |
. | +3.035 |
the | +2.864 |
a | +2.782 |
Neg logit contributions | |
umm | -6.072 |
rol | -6.012 |
lor | -5.903 |
rim | -5.810 |
ubb | -5.808 |
Token | away |
Token ID | 1497 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.236 |
, | +3.194 |
. | +3.099 |
a | +3.020 |
the | +2.993 |
Neg logit contributions | |
umm | -5.847 |
lor | -5.668 |
rol | -5.664 |
ubb | -5.560 |
rim | -5.559 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.218 |
, | +1.137 |
. | +1.017 |
the | +0.946 |
a | +0.876 |
Neg logit contributions | |
umm | -7.852 |
rol | -7.730 |
lor | -7.695 |
ubb | -7.648 |
vation | -7.591 |
Token | Harry |
Token ID | 5850 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.291 |
, | +4.164 |
. | +4.128 |
the | +3.741 |
a | +3.733 |
Neg logit contributions | |
umm | -5.150 |
rol | -4.935 |
lor | -4.874 |
ubb | -4.854 |
osity | -4.835 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.735 |
, | +3.661 |
. | +3.579 |
the | +3.396 |
a | +3.315 |
Neg logit contributions | |
umm | -5.483 |
lor | -5.448 |
rol | -5.397 |
vation | -5.313 |
ubb | -5.251 |
Token | sad |
Token ID | 6507 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.285 |
, | +4.201 |
. | +4.112 |
the | +3.881 |
a | +3.773 |
Neg logit contributions | |
umm | -5.048 |
rol | -4.982 |
lor | -4.937 |
ubb | -4.840 |
vation | -4.830 |
Token | |
Token ID | 220 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.208 |
, | +3.173 |
. | +3.069 |
the | +2.865 |
a | +2.800 |
Neg logit contributions | |
umm | -6.014 |
rol | -5.912 |
lor | -5.892 |
vation | -5.778 |
rim | -5.751 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.648 |
, | +1.561 |
. | +1.383 |
the | +1.264 |
a | +1.168 |
Neg logit contributions | |
umm | -7.647 |
lor | -7.633 |
rol | -7.609 |
vation | -7.429 |
rim | -7.427 |
Token | S |
Token ID | 50 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.983 |
, | +3.937 |
. | +3.800 |
the | +3.587 |
a | +3.488 |
Neg logit contributions | |
lor | -5.356 |
umm | -5.331 |
rol | -5.279 |
rim | -5.219 |
vation | -5.204 |
Token | ally |
Token ID | 453 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +6.838 |
, | +6.729 |
. | +6.645 |
the | +6.517 |
a | +6.428 |
Neg logit contributions | |
umm | -2.730 |
lor | -2.526 |
rol | -2.479 |
rim | -2.421 |
vation | -2.410 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.046 |
, | +3.992 |
. | +3.939 |
the | +3.754 |
a | +3.674 |
Neg logit contributions | |
umm | -5.163 |
rol | -5.049 |
lor | -5.042 |
vation | -4.940 |
rim | -4.936 |
Token | scared |
Token ID | 12008 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.139 |
, | +4.054 |
. | +3.976 |
the | +3.750 |
a | +3.636 |
Neg logit contributions | |
umm | -5.231 |
rol | -5.104 |
lor | -5.047 |
ubb | -4.984 |
rim | -4.978 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.104 |
, | +1.008 |
. | +0.936 |
the | +0.908 |
a | +0.861 |
Neg logit contributions | |
umm | -8.047 |
rol | -7.773 |
ubb | -7.746 |
osity | -7.703 |
rim | -7.702 |
Token | ran |
Token ID | 4966 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.108 |
, | +4.006 |
. | +3.938 |
the | +3.663 |
a | +3.616 |
Neg logit contributions | |
umm | -5.135 |
rol | -5.063 |
ubb | -4.974 |
lor | -4.961 |
osity | -4.945 |
Token | away |
Token ID | 1497 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.131 |
, | +3.056 |
. | +2.954 |
the | +2.777 |
a | +2.680 |
Neg logit contributions | |
umm | -6.141 |
rol | -6.042 |
lor | -5.942 |
vation | -5.900 |
ubb | -5.865 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.602 |
, | +1.450 |
. | +1.319 |
the | +1.218 |
a | +1.203 |
Neg logit contributions | |
umm | -7.521 |
rol | -7.392 |
ubb | -7.374 |
rim | -7.315 |
lor | -7.287 |
Token | She |
Token ID | 1375 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.906 |
, | +3.822 |
. | +3.757 |
the | +3.545 |
a | +3.471 |
Neg logit contributions | |
umm | -5.562 |
rol | -5.329 |
lor | -5.282 |
osity | -5.261 |
ubb | -5.166 |
Token | nearby |
Token ID | 6716 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.398 |
, | +4.326 |
. | +4.239 |
the | +4.076 |
a | +3.981 |
Neg logit contributions | |
umm | -4.944 |
ocol | -4.724 |
rol | -4.708 |
ubb | -4.657 |
vation | -4.565 |
Token | leaves |
Token ID | 5667 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.789 |
, | +1.717 |
. | +1.568 |
the | +1.546 |
a | +1.484 |
Neg logit contributions | |
umm | -7.443 |
rol | -7.221 |
lor | -7.129 |
arians | -7.060 |
ubb | -7.053 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.535 |
, | +1.485 |
. | +1.371 |
the | +1.292 |
a | +1.256 |
Neg logit contributions | |
umm | -7.534 |
rol | -7.510 |
lor | -7.333 |
ubb | -7.307 |
osity | -7.285 |
Token | Rabbit |
Token ID | 25498 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.362 |
, | +4.315 |
. | +4.216 |
the | +3.972 |
a | +3.875 |
Neg logit contributions | |
umm | -5.090 |
rol | -4.919 |
lor | -4.900 |
osity | -4.786 |
vation | -4.747 |
Token | then |
Token ID | 788 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.000 |
, | +3.942 |
. | +3.918 |
the | +3.688 |
a | +3.619 |
Neg logit contributions | |
umm | -5.220 |
lor | -5.113 |
rol | -5.109 |
vation | -5.022 |
ubb | -4.977 |
Token | began |
Token ID | 2540 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.427 |
, | +4.350 |
. | +4.314 |
the | +4.047 |
a | +3.980 |
Neg logit contributions | |
umm | -4.837 |
rol | -4.705 |
lor | -4.648 |
ubb | -4.619 |
vation | -4.603 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.804 |
, | +2.720 |
. | +2.648 |
the | +2.420 |
a | +2.358 |
Neg logit contributions | |
umm | -6.419 |
rol | -6.298 |
lor | -6.251 |
ubb | -6.249 |
osity | -6.211 |
Token | fan |
Token ID | 4336 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.642 |
, | +4.531 |
. | +4.465 |
the | +4.215 |
a | +4.141 |
Neg logit contributions | |
umm | -4.705 |
rol | -4.515 |
ubb | -4.503 |
rim | -4.458 |
vation | -4.440 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.907 |
, | +4.800 |
. | +4.738 |
the | +4.559 |
a | +4.517 |
Neg logit contributions | |
umm | -4.341 |
rol | -4.275 |
lor | -4.176 |
rim | -4.126 |
arians | -4.115 |
Token | handle |
Token ID | 5412 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.238 |
, | +5.159 |
. | +5.058 |
the | +4.899 |
a | +4.782 |
Neg logit contributions | |
umm | -4.373 |
arians | -3.961 |
rol | -3.955 |
ubb | -3.950 |
vation | -3.929 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.432 |
, | +4.360 |
. | +4.265 |
the | +4.142 |
a | +4.077 |
Neg logit contributions | |
umm | -4.822 |
rol | -4.714 |
osity | -4.536 |
lor | -4.533 |
ubb | -4.523 |
Token | weeks |
Token ID | 2745 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.970 |
, | +4.836 |
. | +4.777 |
the | +4.567 |
a | +4.480 |
Neg logit contributions | |
umm | -4.337 |
rol | -4.153 |
ubb | -4.099 |
ocol | -4.086 |
lor | -4.082 |
Token | ago |
Token ID | 2084 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.281 |
, | +2.166 |
. | +2.100 |
the | +2.004 |
a | +1.948 |
Neg logit contributions | |
umm | -6.978 |
rol | -6.782 |
lor | -6.776 |
vation | -6.727 |
arians | -6.676 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.717 |
, | +2.595 |
. | +2.508 |
the | +2.437 |
a | +2.311 |
Neg logit contributions | |
umm | -6.458 |
lor | -6.368 |
rol | -6.294 |
vation | -6.248 |
arians | -6.219 |
Token | but |
Token ID | 475 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.324 |
, | +3.317 |
. | +3.241 |
the | +2.950 |
a | +2.845 |
Neg logit contributions | |
umm | -5.828 |
rol | -5.752 |
lor | -5.708 |
arians | -5.641 |
osity | -5.619 |
Token | she |
Token ID | 673 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.136 |
. | +4.014 |
, | +3.979 |
the | +3.652 |
a | +3.598 |
Neg logit contributions | |
umm | -5.229 |
lor | -5.029 |
rol | -5.008 |
osity | -4.941 |
ubb | -4.941 |
Token | didn |
Token ID | 1422 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.723 |
, | +3.619 |
. | +3.570 |
the | +3.384 |
a | +3.270 |
Neg logit contributions | |
umm | -5.630 |
lor | -5.483 |
rol | -5.419 |
vation | -5.367 |
ubb | -5.339 |
Token | 't |
Token ID | 470 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.642 |
, | +4.549 |
. | +4.453 |
the | +4.273 |
a | +4.129 |
Neg logit contributions | |
umm | -4.707 |
lor | -4.593 |
rol | -4.552 |
vation | -4.500 |
ubb | -4.435 |
Token | have |
Token ID | 423 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.569 |
, | +4.468 |
. | +4.343 |
the | +4.228 |
a | +4.125 |
Neg logit contributions | |
umm | -4.758 |
vation | -4.561 |
ubb | -4.542 |
rol | -4.538 |
lor | -4.532 |
Token | any |
Token ID | 597 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.854 |
, | +3.759 |
. | +3.629 |
the | +3.378 |
a | +3.258 |
Neg logit contributions | |
umm | -5.469 |
rol | -5.319 |
lor | -5.311 |
ubb | -5.238 |
vation | -5.196 |
Token | friends |
Token ID | 2460 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.869 |
, | +4.746 |
. | +4.630 |
the | +4.564 |
a | +4.431 |
Neg logit contributions | |
umm | -4.506 |
ocol | -4.226 |
rol | -4.218 |
ubb | -4.205 |
lor | -4.154 |
Token | yet |
Token ID | 1865 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.166 |
, | +2.079 |
. | +1.919 |
the | +1.838 |
a | +1.777 |
Neg logit contributions | |
umm | -7.033 |
rol | -6.935 |
lor | -6.930 |
vation | -6.830 |
osity | -6.813 |
Token | paint |
Token ID | 7521 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.622 |
, | +4.537 |
. | +4.433 |
the | +4.245 |
a | +4.139 |
Neg logit contributions | |
umm | -4.866 |
vation | -4.587 |
rol | -4.558 |
lor | -4.556 |
ubb | -4.538 |
Token | had |
Token ID | 550 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.444 |
, | +4.369 |
. | +4.295 |
the | +4.112 |
a | +4.027 |
Neg logit contributions | |
umm | -4.932 |
rol | -4.729 |
lor | -4.705 |
vation | -4.660 |
ubb | -4.598 |
Token | dried |
Token ID | 16577 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.741 |
, | +4.686 |
. | +4.575 |
the | +4.334 |
a | +4.211 |
Neg logit contributions | |
umm | -4.627 |
rol | -4.475 |
lor | -4.442 |
ubb | -4.353 |
osity | -4.349 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.304 |
, | +3.221 |
. | +3.133 |
the | +2.918 |
a | +2.900 |
Neg logit contributions | |
umm | -6.036 |
rol | -5.805 |
ubb | -5.685 |
lor | -5.683 |
osity | -5.650 |
Token | it |
Token ID | 340 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.975 |
, | +3.889 |
. | +3.805 |
the | +3.453 |
a | +3.421 |
Neg logit contributions | |
umm | -5.423 |
rol | -5.246 |
ubb | -5.188 |
osity | -5.134 |
lor | -5.126 |
Token | wouldn |
Token ID | 3636 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.195 |
, | +4.115 |
. | +4.019 |
the | +3.820 |
a | +3.732 |
Neg logit contributions | |
umm | -5.210 |
rol | -5.015 |
lor | -5.000 |
vation | -4.931 |
ubb | -4.911 |
Token | 't |
Token ID | 470 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.640 |
, | +4.547 |
. | +4.447 |
the | +4.258 |
a | +4.174 |
Neg logit contributions | |
umm | -4.717 |
rol | -4.568 |
lor | -4.548 |
vation | -4.494 |
ubb | -4.452 |
Token | come |
Token ID | 1282 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.248 |
, | +4.148 |
. | +4.036 |
the | +3.862 |
a | +3.771 |
Neg logit contributions | |
umm | -5.093 |
rol | -4.911 |
vation | -4.859 |
osity | -4.852 |
lor | -4.828 |
Token | off |
Token ID | 572 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.811 |
, | +4.722 |
. | +4.574 |
the | +4.490 |
a | +4.365 |
Neg logit contributions | |
umm | -4.436 |
rol | -4.351 |
osity | -4.274 |
lor | -4.182 |
ubb | -4.149 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.592 |
, | +1.503 |
. | +1.302 |
the | +1.197 |
a | +1.158 |
Neg logit contributions | |
umm | -7.683 |
rol | -7.500 |
lor | -7.381 |
ubb | -7.369 |
vation | -7.354 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.894 |
, | +2.793 |
. | +2.687 |
the | +2.489 |
a | +2.413 |
Neg logit contributions | |
umm | -6.589 |
lor | -6.386 |
rol | -6.371 |
osity | -6.191 |
vation | -6.182 |
Token | walked |
Token ID | 6807 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.475 |
, | +4.384 |
. | +4.343 |
the | +4.148 |
a | +4.056 |
Neg logit contributions | |
umm | -4.735 |
rol | -4.704 |
lor | -4.621 |
vation | -4.577 |
ubb | -4.559 |
Token | through |
Token ID | 832 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.086 |
, | +3.025 |
. | +2.985 |
the | +2.765 |
a | +2.685 |
Neg logit contributions | |
umm | -6.060 |
rol | -6.008 |
lor | -5.852 |
vation | -5.830 |
arians | -5.796 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.375 |
, | +1.260 |
. | +1.208 |
the | +0.845 |
a | +0.820 |
Neg logit contributions | |
umm | -7.722 |
rol | -7.556 |
ubb | -7.545 |
lor | -7.544 |
arians | -7.506 |
Token | maze |
Token ID | 31237 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +6.012 |
, | +5.905 |
. | +5.834 |
the | +5.614 |
a | +5.523 |
Neg logit contributions | |
umm | -3.435 |
rol | -3.133 |
lor | -3.133 |
vation | -3.128 |
osity | -3.067 |
Token | together |
Token ID | 1978 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.817 |
, | +2.720 |
. | +2.648 |
the | +2.582 |
a | +2.496 |
Neg logit contributions | |
umm | -6.349 |
rol | -6.220 |
lor | -6.176 |
vation | -6.124 |
arians | -6.080 |
Token | trying |
Token ID | 2111 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.953 |
, | +0.827 |
. | +0.736 |
the | +0.664 |
a | +0.631 |
Neg logit contributions | |
umm | -8.017 |
rol | -7.836 |
vation | -7.802 |
ubb | -7.802 |
lor | -7.796 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.034 |
, | +1.945 |
. | +1.843 |
the | +1.693 |
a | +1.585 |
Neg logit contributions | |
umm | -6.921 |
lor | -6.881 |
rol | -6.836 |
osity | -6.778 |
arians | -6.745 |
Token | find |
Token ID | 1064 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.912 |
, | +3.830 |
. | +3.692 |
the | +3.420 |
a | +3.345 |
Neg logit contributions | |
umm | -5.291 |
vation | -5.207 |
lor | -5.172 |
arians | -5.162 |
rol | -5.137 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.443 |
, | +3.316 |
. | +3.232 |
the | +2.880 |
a | +2.780 |
Neg logit contributions | |
umm | -5.851 |
rol | -5.696 |
lor | -5.665 |
ubb | -5.557 |
ocol | -5.534 |
Token | exit |
Token ID | 8420 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.947 |
, | +4.872 |
. | +4.746 |
the | +4.581 |
a | +4.420 |
Neg logit contributions | |
umm | -4.537 |
rol | -4.231 |
lor | -4.206 |
ubb | -4.185 |
vation | -4.182 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.987 |
, | +2.884 |
. | +2.751 |
the | +2.692 |
a | +2.635 |
Neg logit contributions | |
umm | -6.217 |
rol | -6.070 |
lor | -5.986 |
arians | -5.953 |
osity | -5.926 |
Token | wished |
Token ID | 16555 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.250 |
, | +4.160 |
. | +4.065 |
the | +3.829 |
a | +3.762 |
Neg logit contributions | |
umm | -5.147 |
rol | -4.942 |
lor | -4.901 |
rim | -4.881 |
ubb | -4.869 |
Token | she |
Token ID | 673 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.543 |
, | +2.460 |
. | +2.347 |
the | +2.116 |
a | +2.082 |
Neg logit contributions | |
umm | -6.670 |
osity | -6.467 |
rol | -6.454 |
lor | -6.440 |
ubb | -6.410 |
Token | had |
Token ID | 550 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.309 |
, | +3.221 |
. | +3.134 |
the | +2.942 |
a | +2.843 |
Neg logit contributions | |
umm | -6.153 |
lor | -5.953 |
rol | -5.942 |
vation | -5.866 |
ubb | -5.842 |
Token | been |
Token ID | 587 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.699 |
, | +4.622 |
. | +4.496 |
the | +4.240 |
a | +4.118 |
Neg logit contributions | |
umm | -4.665 |
lor | -4.536 |
rol | -4.475 |
vation | -4.430 |
osity | -4.404 |
Token | more |
Token ID | 517 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.797 |
, | +4.701 |
. | +4.609 |
the | +4.403 |
a | +4.298 |
Neg logit contributions | |
umm | -4.645 |
rol | -4.441 |
lor | -4.440 |
vation | -4.369 |
ubb | -4.359 |
Token | careful |
Token ID | 8161 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.636 |
, | +4.553 |
. | +4.459 |
the | +4.282 |
a | +4.180 |
Neg logit contributions | |
umm | -4.829 |
lor | -4.607 |
rol | -4.593 |
vation | -4.539 |
ubb | -4.534 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.729 |
, | +1.682 |
. | +1.488 |
the | +1.472 |
a | +1.344 |
Neg logit contributions | |
umm | -7.527 |
rol | -7.344 |
lor | -7.315 |
osity | -7.251 |
vation | -7.234 |
Token | From |
Token ID | 3574 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.379 |
, | +4.298 |
. | +4.195 |
the | +4.029 |
a | +3.932 |
Neg logit contributions | |
umm | -5.056 |
lor | -4.830 |
rol | -4.771 |
osity | -4.769 |
vation | -4.662 |
Token | then |
Token ID | 788 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.890 |
, | +1.816 |
. | +1.769 |
the | +1.467 |
a | +1.418 |
Neg logit contributions | |
umm | -7.352 |
lor | -7.163 |
vation | -7.135 |
rim | -7.119 |
rol | -7.090 |
Token | on |
Token ID | 319 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.734 |
, | +1.629 |
. | +1.577 |
the | +1.370 |
a | +1.284 |
Neg logit contributions | |
umm | -7.651 |
lor | -7.460 |
rol | -7.432 |
vation | -7.383 |
ubb | -7.340 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.326 |
. | +0.168 |
, | +0.083 |
a | -0.074 |
the | -0.086 |
Neg logit contributions | |
umm | -8.957 |
lor | -8.769 |
vation | -8.685 |
arians | -8.665 |
rol | -8.654 |
Token | she |
Token ID | 673 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.896 |
, | +1.821 |
. | +1.751 |
the | +1.457 |
a | +1.401 |
Neg logit contributions | |
umm | -7.313 |
lor | -7.237 |
osity | -7.171 |
rol | -7.088 |
ubb | -7.063 |
Token | had |
Token ID | 550 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.749 |
, | +3.670 |
. | +3.580 |
the | +3.393 |
a | +3.293 |
Neg logit contributions | |
umm | -5.682 |
lor | -5.484 |
rol | -5.470 |
vation | -5.398 |
ubb | -5.372 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.825 |
, | +2.752 |
. | +2.662 |
the | +2.373 |
a | +2.234 |
Neg logit contributions | |
umm | -6.528 |
lor | -6.325 |
osity | -6.282 |
rol | -6.280 |
ubb | -6.234 |
Token | be |
Token ID | 307 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.156 |
, | +4.042 |
. | +3.948 |
the | +3.840 |
a | +3.722 |
Neg logit contributions | |
umm | -5.160 |
rim | -4.890 |
lor | -4.884 |
vation | -4.865 |
former | -4.840 |
Token | more |
Token ID | 517 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.540 |
, | +4.463 |
. | +4.364 |
the | +4.127 |
a | +3.999 |
Neg logit contributions | |
umm | -4.820 |
rol | -4.641 |
lor | -4.618 |
ubb | -4.577 |
rim | -4.557 |
Token | careful |
Token ID | 8161 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.622 |
, | +4.557 |
. | +4.462 |
the | +4.281 |
a | +4.174 |
Neg logit contributions | |
umm | -4.810 |
lor | -4.579 |
rol | -4.569 |
ubb | -4.525 |
rim | -4.522 |
Token | when |
Token ID | 618 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.955 |
, | +1.928 |
. | +1.800 |
the | +1.721 |
a | +1.608 |
Neg logit contributions | |
umm | -7.262 |
rol | -7.019 |
lor | -7.012 |
osity | -6.989 |
vation | -6.949 |
Token | she |
Token ID | 673 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.854 |
, | +3.702 |
. | +3.623 |
the | +3.381 |
a | +3.330 |
Neg logit contributions | |
umm | -5.538 |
ubb | -5.283 |
osity | -5.253 |
vation | -5.244 |
rol | -5.237 |
Token | painted |
Token ID | 13055 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.433 |
, | +4.373 |
. | +4.253 |
the | +4.104 |
a | +4.006 |
Neg logit contributions | |
umm | -4.950 |
rol | -4.705 |
lor | -4.696 |
vation | -4.677 |
ubb | -4.653 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.104 |
, | +3.026 |
. | +2.893 |
the | +2.679 |
a | +2.606 |
Neg logit contributions | |
umm | -6.209 |
rol | -6.004 |
lor | -5.905 |
ubb | -5.885 |
ocol | -5.856 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.431 |
, | +2.351 |
. | +2.250 |
the | +2.057 |
a | +1.967 |
Neg logit contributions | |
umm | -7.013 |
lor | -6.805 |
rol | -6.774 |
osity | -6.690 |
vation | -6.681 |
Token | arms |
Token ID | 5101 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.942 |
, | +4.865 |
. | +4.767 |
the | +4.601 |
a | +4.532 |
Neg logit contributions | |
umm | -4.451 |
lor | -4.245 |
rol | -4.193 |
arians | -4.162 |
vation | -4.136 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
, | +0.639 |
and | +0.625 |
. | +0.545 |
the | +0.498 |
a | +0.324 |
Neg logit contributions | |
rol | -8.315 |
umm | -8.274 |
osity | -8.140 |
lor | -8.113 |
ubb | -8.065 |
Token | said |
Token ID | 531 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.424 |
, | +4.365 |
. | +4.283 |
the | +3.953 |
a | +3.910 |
Neg logit contributions | |
umm | -4.712 |
rol | -4.608 |
lor | -4.570 |
arians | -4.569 |
rim | -4.508 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.823 |
. | +0.635 |
, | +0.602 |
the | +0.443 |
a | +0.362 |
Neg logit contributions | |
umm | -8.448 |
lor | -8.313 |
rol | -8.283 |
osity | -8.271 |
ubb | -8.246 |
Token | " |
Token ID | 366 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.502 |
, | +2.422 |
. | +2.373 |
the | +2.181 |
a | +2.117 |
Neg logit contributions | |
umm | -6.608 |
osity | -6.508 |
lor | -6.494 |
arians | -6.479 |
rol | -6.446 |
Token | Fine |
Token ID | 34389 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.844 |
, | +5.764 |
. | +5.670 |
the | +5.469 |
a | +5.375 |
Neg logit contributions | |
umm | -3.664 |
lor | -3.460 |
rol | -3.442 |
vation | -3.380 |
ubb | -3.348 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.852 |
, | +0.621 |
. | +0.592 |
the | +0.516 |
a | +0.434 |
Neg logit contributions | |
umm | -8.379 |
lor | -8.179 |
arians | -8.129 |
vation | -8.049 |
rol | -8.042 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.397 |
, | +3.293 |
. | +3.277 |
the | +2.975 |
a | +2.914 |
Neg logit contributions | |
umm | -5.926 |
lor | -5.682 |
vation | -5.647 |
arians | -5.647 |
osity | -5.636 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.661 |
, | +1.506 |
. | +1.427 |
the | +1.320 |
a | +1.239 |
Neg logit contributions | |
umm | -7.651 |
lor | -7.476 |
rol | -7.406 |
rim | -7.364 |
arians | -7.344 |
Token | be |
Token ID | 307 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.763 |
, | +3.688 |
. | +3.654 |
the | +3.364 |
a | +3.288 |
Neg logit contributions | |
umm | -5.548 |
lor | -5.347 |
rol | -5.307 |
ubb | -5.285 |
osity | -5.278 |
Token | gr |
Token ID | 1036 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.973 |
, | +4.861 |
. | +4.750 |
the | +4.532 |
a | +4.385 |
Neg logit contributions | |
umm | -4.345 |
lor | -4.283 |
rol | -4.239 |
rim | -4.215 |
vation | -4.190 |
Token | It |
Token ID | 632 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.188 |
, | +4.099 |
. | +4.001 |
the | +3.820 |
a | +3.720 |
Neg logit contributions | |
umm | -5.172 |
rol | -5.048 |
lor | -5.014 |
osity | -4.910 |
arians | -4.867 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.938 |
, | +3.869 |
. | +3.774 |
the | +3.578 |
a | +3.484 |
Neg logit contributions | |
umm | -5.424 |
rol | -5.261 |
lor | -5.251 |
vation | -5.174 |
ubb | -5.141 |
Token | paint |
Token ID | 7521 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.604 |
, | +3.534 |
. | +3.447 |
the | +3.159 |
a | +3.020 |
Neg logit contributions | |
umm | -5.718 |
rol | -5.599 |
ubb | -5.494 |
rim | -5.463 |
ocol | -5.452 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.588 |
, | +3.496 |
. | +3.400 |
the | +3.303 |
a | +3.183 |
Neg logit contributions | |
umm | -5.819 |
rol | -5.574 |
lor | -5.546 |
vation | -5.473 |
ubb | -5.386 |
Token | It |
Token ID | 632 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.254 |
, | +4.185 |
. | +4.076 |
the | +3.859 |
a | +3.753 |
Neg logit contributions | |
umm | -5.114 |
rol | -4.993 |
lor | -4.968 |
osity | -4.850 |
ocol | -4.846 |
Token | spl |
Token ID | 4328 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.309 |
, | +3.250 |
. | +3.148 |
the | +2.953 |
a | +2.855 |
Neg logit contributions | |
umm | -6.056 |
rol | -5.886 |
lor | -5.861 |
vation | -5.793 |
rim | -5.757 |
Token | ashed |
Token ID | 5263 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +7.454 |
, | +7.394 |
. | +7.290 |
the | +7.140 |
a | +7.018 |
Neg logit contributions | |
umm | -2.075 |
rol | -1.917 |
lor | -1.818 |
rim | -1.754 |
osity | -1.753 |
Token | on |
Token ID | 319 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.374 |
, | +2.341 |
. | +2.222 |
the | +2.020 |
a | +1.972 |
Neg logit contributions | |
umm | -6.827 |
rol | -6.689 |
ubb | -6.491 |
rim | -6.440 |
ocol | -6.434 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.266 |
, | +1.237 |
. | +1.128 |
the | +0.772 |
a | +0.764 |
Neg logit contributions | |
umm | -7.930 |
rol | -7.665 |
ocol | -7.661 |
ubb | -7.647 |
lor | -7.623 |
Token | walls |
Token ID | 7714 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.069 |
, | +5.026 |
. | +4.900 |
the | +4.736 |
a | +4.653 |
Neg logit contributions | |
umm | -4.330 |
vation | -4.073 |
lor | -4.054 |
rol | -4.045 |
rim | -4.013 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.276 |
, | +1.206 |
. | +1.109 |
the | +1.022 |
a | +0.942 |
Neg logit contributions | |
umm | -7.948 |
rol | -7.781 |
lor | -7.664 |
vation | -7.651 |
ubb | -7.629 |
Token | this |
Token ID | 428 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
, | +3.267 |
and | +3.254 |
. | +3.224 |
the | +2.931 |
a | +2.914 |
Neg logit contributions | |
umm | -5.853 |
rol | -5.743 |
osity | -5.667 |
ubb | -5.646 |
lor | -5.644 |
Token | time |
Token ID | 640 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.198 |
, | +3.125 |
. | +3.037 |
the | +2.876 |
a | +2.772 |
Neg logit contributions | |
umm | -6.169 |
lor | -5.984 |
vation | -5.927 |
rol | -5.921 |
rim | -5.910 |
Token | louder |
Token ID | 27089 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.078 |
, | +1.937 |
. | +1.905 |
the | +1.656 |
a | +1.596 |
Neg logit contributions | |
umm | -7.109 |
rol | -6.960 |
lor | -6.929 |
ubb | -6.892 |
osity | -6.882 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.482 |
, | +2.385 |
. | +2.324 |
the | +2.194 |
a | +2.141 |
Neg logit contributions | |
umm | -6.749 |
lor | -6.515 |
ubb | -6.502 |
rim | -6.476 |
vation | -6.464 |
Token | more |
Token ID | 517 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.341 |
, | +4.220 |
. | +4.176 |
the | +3.821 |
a | +3.785 |
Neg logit contributions | |
umm | -5.061 |
rol | -4.850 |
ubb | -4.835 |
lor | -4.801 |
vation | -4.800 |
Token | fiercely |
Token ID | 33285 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.258 |
, | +5.170 |
. | +5.046 |
the | +4.875 |
a | +4.805 |
Neg logit contributions | |
umm | -4.141 |
ubb | -3.900 |
ocol | -3.852 |
rol | -3.843 |
rim | -3.829 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.732 |
, | +4.616 |
. | +4.520 |
the | +4.359 |
a | +4.306 |
Neg logit contributions | |
umm | -4.581 |
ubb | -4.346 |
rol | -4.333 |
lor | -4.328 |
vation | -4.323 |
Token | He |
Token ID | 679 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.280 |
, | +4.225 |
. | +4.105 |
the | +3.892 |
a | +3.772 |
Neg logit contributions | |
umm | -5.233 |
rol | -4.981 |
lor | -4.961 |
osity | -4.885 |
arians | -4.863 |
Token | yelled |
Token ID | 22760 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.159 |
, | +4.114 |
. | +4.045 |
the | +3.819 |
a | +3.735 |
Neg logit contributions | |
umm | -5.106 |
lor | -4.982 |
rol | -4.972 |
arians | -4.896 |
vation | -4.895 |
Token | that |
Token ID | 326 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.312 |
, | +2.214 |
. | +2.203 |
the | +2.015 |
a | +1.900 |
Neg logit contributions | |
umm | -6.845 |
rol | -6.707 |
lor | -6.651 |
osity | -6.640 |
ubb | -6.633 |
Token | he |
Token ID | 339 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.648 |
, | +2.524 |
. | +2.464 |
the | +2.139 |
a | +2.100 |
Neg logit contributions | |
umm | -6.684 |
rol | -6.497 |
ubb | -6.479 |
lor | -6.477 |
osity | -6.438 |
Token | were |
Token ID | 547 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.961 |
, | +3.887 |
. | +3.842 |
the | +3.628 |
a | +3.583 |
Neg logit contributions | |
umm | -5.226 |
rol | -5.159 |
lor | -5.081 |
vation | -5.073 |
ubb | -5.051 |
Token | very |
Token ID | 845 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.062 |
, | +3.984 |
. | +3.901 |
the | +3.669 |
a | +3.562 |
Neg logit contributions | |
umm | -5.239 |
rol | -5.141 |
lor | -5.070 |
ubb | -5.033 |
rim | -5.019 |
Token | scared |
Token ID | 12008 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.235 |
, | +4.136 |
. | +4.055 |
the | +3.857 |
a | +3.763 |
Neg logit contributions | |
umm | -5.181 |
rol | -4.987 |
ubb | -4.936 |
lor | -4.927 |
rim | -4.926 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.854 |
, | +0.781 |
. | +0.711 |
the | +0.611 |
a | +0.579 |
Neg logit contributions | |
umm | -8.293 |
rol | -8.082 |
ubb | -7.975 |
osity | -7.960 |
rim | -7.960 |
Token | kept |
Token ID | 4030 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.404 |
, | +4.291 |
. | +4.211 |
the | +3.947 |
a | +3.902 |
Neg logit contributions | |
umm | -4.921 |
rol | -4.819 |
ubb | -4.732 |
lor | -4.720 |
osity | -4.698 |
Token | quiet |
Token ID | 5897 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.514 |
, | +4.449 |
. | +4.334 |
the | +4.045 |
a | +3.982 |
Neg logit contributions | |
umm | -4.734 |
rol | -4.639 |
ubb | -4.578 |
lor | -4.574 |
rim | -4.565 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.127 |
, | +2.041 |
. | +1.915 |
the | +1.872 |
a | +1.775 |
Neg logit contributions | |
umm | -7.190 |
rol | -6.916 |
lor | -6.885 |
ubb | -6.841 |
vation | -6.814 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.474 |
, | +4.413 |
. | +4.295 |
the | +4.083 |
a | +3.997 |
Neg logit contributions | |
umm | -4.983 |
rol | -4.781 |
lor | -4.770 |
arians | -4.690 |
vation | -4.665 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.781 |
, | +1.724 |
. | +1.604 |
the | +1.385 |
a | +1.305 |
Neg logit contributions | |
lor | -7.491 |
umm | -7.486 |
rol | -7.429 |
vation | -7.380 |
rim | -7.358 |
Token | Then |
Token ID | 6423 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.277 |
, | +5.220 |
. | +5.121 |
the | +4.892 |
a | +4.796 |
Neg logit contributions | |
umm | -4.177 |
lor | -4.060 |
rol | -4.016 |
vation | -3.977 |
rim | -3.935 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.748 |
. | +1.557 |
, | +1.500 |
the | +1.239 |
a | +1.158 |
Neg logit contributions | |
umm | -7.529 |
lor | -7.313 |
arians | -7.280 |
rol | -7.268 |
ubb | -7.262 |
Token | table |
Token ID | 3084 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.922 |
, | +4.842 |
. | +4.720 |
the | +4.532 |
a | +4.419 |
Neg logit contributions | |
umm | -4.565 |
lor | -4.296 |
rol | -4.284 |
vation | -4.210 |
ubb | -4.185 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.433 |
, | +1.377 |
. | +1.229 |
the | +1.207 |
a | +1.081 |
Neg logit contributions | |
umm | -7.767 |
lor | -7.627 |
rol | -7.619 |
vation | -7.508 |
ubb | -7.443 |
Token | broke |
Token ID | 6265 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.217 |
, | +4.116 |
. | +4.031 |
the | +3.740 |
a | +3.684 |
Neg logit contributions | |
umm | -5.133 |
rol | -5.005 |
lor | -4.943 |
vation | -4.887 |
ubb | -4.873 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.184 |
, | +2.135 |
. | +1.871 |
the | +1.742 |
a | +1.663 |
Neg logit contributions | |
umm | -7.075 |
rol | -6.969 |
lor | -6.819 |
ubb | -6.810 |
ocol | -6.729 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.479 |
, | +3.391 |
. | +3.275 |
the | +3.003 |
a | +2.928 |
Neg logit contributions | |
umm | -5.976 |
lor | -5.759 |
rol | -5.751 |
vation | -5.627 |
ubb | -5.615 |
Token | woman |
Token ID | 2415 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.973 |
, | +3.960 |
. | +3.838 |
the | +3.633 |
a | +3.497 |
Neg logit contributions | |
umm | -5.434 |
lor | -5.135 |
vation | -5.129 |
ubb | -5.109 |
arians | -5.098 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.951 |
, | +2.901 |
. | +2.825 |
the | +2.634 |
a | +2.554 |
Neg logit contributions | |
umm | -6.261 |
rol | -6.158 |
lor | -6.123 |
vation | -6.066 |
rim | -6.032 |
Token | very |
Token ID | 845 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.256 |
, | +3.174 |
. | +3.091 |
the | +2.859 |
a | +2.738 |
Neg logit contributions | |
umm | -6.103 |
rol | -5.972 |
lor | -5.926 |
ubb | -5.862 |
rim | -5.856 |
Token | sad |
Token ID | 6507 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.864 |
, | +3.732 |
. | +3.661 |
the | +3.460 |
a | +3.364 |
Neg logit contributions | |
umm | -5.553 |
rol | -5.381 |
ubb | -5.352 |
rim | -5.332 |
lor | -5.314 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.337 |
, | +0.329 |
the | +0.268 |
. | +0.128 |
a | +0.124 |
Neg logit contributions | |
umm | -8.594 |
rol | -8.290 |
lor | -8.288 |
osity | -8.253 |
rim | -8.219 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.225 |
, | +3.133 |
. | +3.019 |
the | +2.805 |
a | +2.758 |
Neg logit contributions | |
umm | -6.174 |
rol | -5.932 |
lor | -5.929 |
osity | -5.815 |
vation | -5.767 |
Token | toy |
Token ID | 13373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.523 |
, | +4.514 |
. | +4.390 |
the | +4.183 |
a | +4.044 |
Neg logit contributions | |
umm | -4.872 |
lor | -4.592 |
arians | -4.552 |
vation | -4.547 |
ubb | -4.526 |
Token | fell |
Token ID | 3214 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.987 |
, | +3.910 |
. | +3.835 |
the | +3.655 |
a | +3.546 |
Neg logit contributions | |
umm | -5.359 |
lor | -5.209 |
rol | -5.164 |
vation | -5.105 |
arians | -5.081 |
Token | from |
Token ID | 422 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.979 |
, | +2.951 |
. | +2.836 |
the | +2.732 |
a | +2.601 |
Neg logit contributions | |
umm | -6.167 |
rol | -6.124 |
lor | -5.976 |
osity | -5.941 |
ubb | -5.876 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.946 |
, | +2.897 |
. | +2.744 |
the | +2.427 |
a | +2.351 |
Neg logit contributions | |
umm | -6.261 |
ocol | -6.076 |
rol | -6.073 |
ubb | -6.032 |
former | -5.985 |
Token | table |
Token ID | 3084 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.922 |
, | +4.842 |
. | +4.720 |
the | +4.532 |
a | +4.419 |
Neg logit contributions | |
umm | -4.565 |
lor | -4.296 |
rol | -4.284 |
vation | -4.210 |
ubb | -4.185 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.433 |
, | +1.377 |
. | +1.229 |
the | +1.207 |
a | +1.081 |
Neg logit contributions | |
umm | -7.767 |
lor | -7.627 |
rol | -7.619 |
vation | -7.508 |
ubb | -7.443 |
Token | broke |
Token ID | 6265 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.217 |
, | +4.116 |
. | +4.031 |
the | +3.740 |
a | +3.684 |
Neg logit contributions | |
umm | -5.133 |
rol | -5.005 |
lor | -4.943 |
vation | -4.887 |
ubb | -4.873 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.184 |
, | +2.135 |
. | +1.871 |
the | +1.742 |
a | +1.663 |
Neg logit contributions | |
umm | -7.075 |
rol | -6.969 |
lor | -6.819 |
ubb | -6.810 |
ocol | -6.729 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.479 |
, | +3.391 |
. | +3.275 |
the | +3.003 |
a | +2.928 |
Neg logit contributions | |
umm | -5.976 |
lor | -5.759 |
rol | -5.751 |
vation | -5.627 |
ubb | -5.615 |
Token | woman |
Token ID | 2415 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.973 |
, | +3.960 |
. | +3.838 |
the | +3.633 |
a | +3.497 |
Neg logit contributions | |
umm | -5.434 |
lor | -5.135 |
vation | -5.129 |
ubb | -5.109 |
arians | -5.098 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.951 |
, | +2.901 |
. | +2.825 |
the | +2.634 |
a | +2.554 |
Neg logit contributions | |
umm | -6.261 |
rol | -6.158 |
lor | -6.123 |
vation | -6.066 |
rim | -6.032 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.228 |
, | +0.099 |
. | +0.060 |
the | -0.133 |
a | -0.212 |
Neg logit contributions | |
umm | -9.158 |
lor | -8.916 |
rol | -8.915 |
vation | -8.838 |
ubb | -8.815 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.274 |
, | +2.179 |
. | +2.108 |
the | +1.857 |
a | +1.782 |
Neg logit contributions | |
umm | -7.107 |
rol | -6.888 |
lor | -6.848 |
vation | -6.833 |
ubb | -6.792 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.192 |
, | +3.144 |
. | +3.099 |
the | +2.930 |
a | +2.838 |
Neg logit contributions | |
umm | -5.989 |
lor | -5.853 |
rol | -5.801 |
vation | -5.758 |
arians | -5.750 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.739 |
, | +0.637 |
. | +0.561 |
the | +0.207 |
a | +0.192 |
Neg logit contributions | |
umm | -8.672 |
rol | -8.399 |
vation | -8.379 |
ubb | -8.375 |
osity | -8.352 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.688 |
, | +3.593 |
. | +3.503 |
the | +3.290 |
a | +3.190 |
Neg logit contributions | |
umm | -5.779 |
lor | -5.561 |
rol | -5.543 |
vation | -5.491 |
ubb | -5.486 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.140 |
, | +4.036 |
. | +3.949 |
the | +3.768 |
a | +3.682 |
Neg logit contributions | |
umm | -5.299 |
lor | -5.068 |
rol | -5.057 |
ubb | -5.011 |
vation | -4.991 |
Token | fixed |
Token ID | 5969 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.024 |
, | +3.941 |
. | +3.852 |
the | +3.673 |
a | +3.584 |
Neg logit contributions | |
umm | -5.341 |
rol | -5.152 |
lor | -5.141 |
vation | -5.075 |
ubb | -5.050 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.190 |
, | +2.131 |
. | +2.047 |
a | +1.714 |
the | +1.662 |
Neg logit contributions | |
umm | -6.945 |
rol | -6.782 |
arians | -6.778 |
ocol | -6.735 |
ubb | -6.728 |
Token | bike |
Token ID | 7161 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.406 |
, | +4.334 |
. | +4.240 |
the | +4.034 |
a | +3.924 |
Neg logit contributions | |
umm | -5.027 |
lor | -4.744 |
ubb | -4.722 |
rol | -4.694 |
vation | -4.683 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.045 |
, | +2.012 |
the | +1.844 |
. | +1.811 |
a | +1.737 |
Neg logit contributions | |
umm | -7.039 |
rol | -6.962 |
lor | -6.852 |
arians | -6.827 |
vation | -6.806 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.646 |
, | +3.564 |
. | +3.478 |
the | +3.275 |
a | +3.179 |
Neg logit contributions | |
umm | -5.798 |
rol | -5.576 |
lor | -5.567 |
vation | -5.496 |
osity | -5.468 |
Token | The |
Token ID | 464 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.503 |
, | +4.396 |
. | +4.298 |
the | +4.114 |
a | +4.008 |
Neg logit contributions | |
umm | -4.806 |
lor | -4.799 |
vation | -4.720 |
rim | -4.701 |
rol | -4.699 |
Token | end |
Token ID | 886 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.651 |
, | +4.568 |
. | +4.459 |
the | +4.274 |
a | +4.144 |
Neg logit contributions | |
umm | -4.798 |
lor | -4.525 |
ubb | -4.521 |
vation | -4.513 |
rol | -4.500 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.522 |
, | +0.392 |
. | +0.228 |
the | +0.177 |
a | +0.075 |
Neg logit contributions | |
umm | -8.848 |
lor | -8.638 |
rol | -8.607 |
rim | -8.573 |
vation | -8.571 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.970 |
, | +2.886 |
. | +2.778 |
the | +2.566 |
a | +2.471 |
Neg logit contributions | |
umm | -6.485 |
lor | -6.344 |
rol | -6.280 |
osity | -6.199 |
vation | -6.192 |
Token | A |
Token ID | 32 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.300 |
, | +4.211 |
. | +4.092 |
the | +3.923 |
a | +3.828 |
Neg logit contributions | |
umm | -5.071 |
lor | -4.935 |
rol | -4.889 |
vation | -4.809 |
rim | -4.778 |
Token | woman |
Token ID | 2415 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.164 |
, | +4.041 |
. | +3.982 |
the | +3.818 |
a | +3.724 |
Neg logit contributions | |
umm | -5.275 |
lor | -5.051 |
vation | -4.991 |
rol | -4.977 |
rim | -4.964 |
Token | had |
Token ID | 550 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.259 |
, | +3.205 |
. | +3.142 |
the | +2.962 |
a | +2.886 |
Neg logit contributions | |
umm | -5.955 |
lor | -5.829 |
rol | -5.804 |
vation | -5.741 |
rim | -5.728 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.272 |
, | +3.208 |
. | +3.108 |
the | +2.887 |
a | +2.699 |
Neg logit contributions | |
umm | -6.001 |
rol | -5.970 |
lor | -5.969 |
rim | -5.822 |
ocol | -5.788 |
Token | broken |
Token ID | 5445 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.588 |
, | +4.458 |
. | +4.429 |
the | +4.241 |
a | +4.094 |
Neg logit contributions | |
umm | -4.823 |
lor | -4.561 |
rol | -4.549 |
vation | -4.499 |
ubb | -4.497 |
Token | toy |
Token ID | 13373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.216 |
, | +5.079 |
. | +5.052 |
the | +4.926 |
a | +4.794 |
Neg logit contributions | |
umm | -4.086 |
lor | -3.878 |
rol | -3.822 |
rim | -3.798 |
ocol | -3.787 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.382 |
, | +3.289 |
. | +3.158 |
the | +3.140 |
a | +3.009 |
Neg logit contributions | |
umm | -5.857 |
lor | -5.693 |
rol | -5.649 |
arians | -5.613 |
vation | -5.560 |
Token | ! |
Token ID | 0 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.110 |
, | +2.038 |
the | +1.939 |
. | +1.875 |
a | +1.815 |
Neg logit contributions | |
umm | -7.137 |
lor | -7.046 |
rol | -6.911 |
arians | -6.834 |
vation | -6.813 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.408 |
, | +3.345 |
. | +3.232 |
the | +2.999 |
a | +2.890 |
Neg logit contributions | |
umm | -6.014 |
lor | -5.851 |
rol | -5.809 |
osity | -5.702 |
vation | -5.700 |
Token | opened |
Token ID | 4721 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.472 |
, | +3.416 |
. | +3.363 |
the | +3.171 |
a | +3.068 |
Neg logit contributions | |
umm | -5.762 |
lor | -5.674 |
rol | -5.630 |
vation | -5.565 |
rim | -5.535 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.330 |
, | +1.244 |
. | +1.161 |
the | +0.873 |
a | +0.843 |
Neg logit contributions | |
umm | -7.941 |
lor | -7.798 |
rol | -7.789 |
ubb | -7.675 |
ocol | -7.656 |
Token | closet |
Token ID | 21615 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.887 |
, | +4.806 |
. | +4.686 |
the | +4.545 |
a | +4.432 |
Neg logit contributions | |
umm | -4.501 |
lor | -4.340 |
rol | -4.260 |
vation | -4.229 |
osity | -4.176 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.513 |
, | +2.478 |
. | +2.388 |
the | +2.330 |
a | +2.249 |
Neg logit contributions | |
umm | -6.658 |
lor | -6.565 |
rol | -6.461 |
vation | -6.374 |
osity | -6.329 |
Token | saw |
Token ID | 2497 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.319 |
, | +3.255 |
. | +3.188 |
the | +2.899 |
a | +2.823 |
Neg logit contributions | |
umm | -5.935 |
rol | -5.839 |
lor | -5.839 |
vation | -5.756 |
ubb | -5.702 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.397 |
, | +2.280 |
. | +2.161 |
the | +1.848 |
a | +1.735 |
Neg logit contributions | |
umm | -7.031 |
rol | -6.861 |
ubb | -6.799 |
lor | -6.791 |
ocol | -6.716 |
Token | big |
Token ID | 1263 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.095 |
, | +3.990 |
. | +3.928 |
the | +3.746 |
a | +3.630 |
Neg logit contributions | |
umm | -5.301 |
lor | -5.095 |
vation | -5.025 |
rol | -5.022 |
rim | -4.989 |
Token | monster |
Token ID | 9234 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.667 |
, | +4.553 |
. | +4.542 |
the | +4.334 |
a | +4.260 |
Neg logit contributions | |
umm | -4.692 |
lor | -4.394 |
rol | -4.369 |
ocol | -4.365 |
vation | -4.352 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.960 |
, | +2.878 |
. | +2.739 |
the | +2.642 |
a | +2.543 |
Neg logit contributions | |
umm | -6.343 |
lor | -6.205 |
rol | -6.186 |
vation | -6.119 |
rim | -6.092 |
Token | Tom |
Token ID | 13787 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.079 |
, | +3.987 |
. | +3.889 |
the | +3.700 |
a | +3.602 |
Neg logit contributions | |
umm | -5.360 |
lor | -5.233 |
rol | -5.184 |
vation | -5.140 |
rim | -5.113 |
Token | went |
Token ID | 1816 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.365 |
, | +3.321 |
. | +3.268 |
the | +3.091 |
a | +2.989 |
Neg logit contributions | |
umm | -5.841 |
lor | -5.741 |
rol | -5.713 |
vation | -5.648 |
rim | -5.618 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.133 |
, | +2.052 |
. | +1.956 |
the | +1.772 |
a | +1.679 |
Neg logit contributions | |
umm | -7.220 |
rol | -7.081 |
lor | -7.066 |
vation | -6.994 |
rim | -6.962 |
Token | his |
Token ID | 465 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.813 |
, | +2.732 |
. | +2.609 |
the | +2.271 |
a | +2.239 |
Neg logit contributions | |
umm | -6.427 |
rol | -6.287 |
vation | -6.286 |
lor | -6.259 |
rim | -6.259 |
Token | bed |
Token ID | 3996 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.216 |
, | +4.139 |
. | +4.045 |
the | +3.876 |
a | +3.761 |
Neg logit contributions | |
umm | -5.137 |
lor | -4.878 |
arians | -4.837 |
vation | -4.819 |
rol | -4.778 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.409 |
, | +1.359 |
the | +1.245 |
. | +1.237 |
a | +1.117 |
Neg logit contributions | |
umm | -7.709 |
lor | -7.654 |
vation | -7.499 |
rol | -7.498 |
rim | -7.409 |
Token | hid |
Token ID | 24519 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.049 |
, | +3.980 |
. | +3.894 |
the | +3.634 |
a | +3.540 |
Neg logit contributions | |
umm | -5.162 |
lor | -5.095 |
rol | -5.058 |
vation | -5.021 |
rim | -4.955 |
Token | under |
Token ID | 739 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.355 |
, | +3.310 |
. | +3.059 |
the | +2.894 |
a | +2.869 |
Neg logit contributions | |
umm | -5.825 |
rol | -5.700 |
ocol | -5.663 |
ubb | -5.623 |
lor | -5.604 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.829 |
, | +1.744 |
. | +1.596 |
the | +1.250 |
a | +1.168 |
Neg logit contributions | |
umm | -7.444 |
lor | -7.254 |
ocol | -7.236 |
ubb | -7.221 |
rol | -7.189 |
Token | covers |
Token ID | 8698 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.848 |
, | +4.792 |
. | +4.658 |
the | +4.517 |
a | +4.440 |
Neg logit contributions | |
umm | -4.502 |
lor | -4.287 |
vation | -4.256 |
rol | -4.248 |
rim | -4.209 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.977 |
, | +0.917 |
. | +0.677 |
the | +0.646 |
a | +0.615 |
Neg logit contributions | |
umm | -8.254 |
lor | -8.136 |
rol | -8.122 |
vation | -7.973 |
rim | -7.938 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.347 |
, | +3.269 |
. | +3.161 |
the | +2.940 |
a | +2.845 |
Neg logit contributions | |
umm | -6.070 |
lor | -5.877 |
rol | -5.836 |
vation | -5.766 |
osity | -5.738 |
Token | monster |
Token ID | 9234 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.364 |
, | +5.271 |
. | +5.180 |
the | +4.987 |
a | +4.878 |
Neg logit contributions | |
umm | -4.115 |
lor | -3.903 |
rol | -3.881 |
vation | -3.826 |
ubb | -3.808 |
Token | looked |
Token ID | 3114 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.267 |
, | +3.183 |
. | +3.100 |
the | +2.918 |
a | +2.822 |
Neg logit contributions | |
umm | -6.110 |
lor | -5.929 |
rol | -5.915 |
vation | -5.847 |
rim | -5.824 |
Token | at |
Token ID | 379 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.763 |
, | +3.688 |
. | +3.609 |
the | +3.397 |
a | +3.285 |
Neg logit contributions | |
umm | -5.519 |
rol | -5.410 |
lor | -5.285 |
rim | -5.282 |
ubb | -5.275 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.963 |
, | +2.921 |
. | +2.809 |
the | +2.464 |
a | +2.461 |
Neg logit contributions | |
umm | -6.327 |
lor | -6.139 |
rol | -6.131 |
vation | -6.047 |
ocol | -6.014 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
, | +0.593 |
and | +0.591 |
. | +0.456 |
the | +0.429 |
a | +0.331 |
Neg logit contributions | |
umm | -8.375 |
lor | -8.350 |
rol | -8.319 |
vation | -8.246 |
rim | -8.193 |
Token | said |
Token ID | 531 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.922 |
, | +3.845 |
. | +3.772 |
the | +3.460 |
a | +3.393 |
Neg logit contributions | |
umm | -5.390 |
rol | -5.169 |
lor | -5.165 |
ubb | -5.131 |
vation | -5.106 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.169 |
, | +0.997 |
. | +0.969 |
the | +0.774 |
a | +0.686 |
Neg logit contributions | |
umm | -8.192 |
lor | -8.054 |
rol | -8.022 |
ubb | -7.948 |
osity | -7.938 |
Token | " |
Token ID | 366 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.473 |
, | +2.393 |
. | +2.325 |
the | +2.131 |
a | +2.068 |
Neg logit contributions | |
umm | -6.659 |
lor | -6.567 |
osity | -6.539 |
rol | -6.507 |
arians | -6.445 |
Token | I |
Token ID | 40 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +6.350 |
, | +6.275 |
. | +6.175 |
the | +5.969 |
a | +5.873 |
Neg logit contributions | |
umm | -3.150 |
lor | -2.953 |
rol | -2.940 |
vation | -2.876 |
ubb | -2.836 |
Token | will |
Token ID | 481 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.782 |
, | +4.699 |
. | +4.602 |
the | +4.403 |
a | +4.315 |
Neg logit contributions | |
umm | -4.734 |
lor | -4.514 |
rol | -4.498 |
vation | -4.428 |
ubb | -4.401 |
Token | scared |
Token ID | 12008 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.118 |
, | +4.018 |
. | +3.932 |
the | +3.665 |
a | +3.534 |
Neg logit contributions | |
umm | -5.084 |
rol | -5.024 |
lor | -4.966 |
ubb | -4.959 |
rim | -4.941 |
Token | in |
Token ID | 287 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.834 |
, | +1.776 |
. | +1.680 |
the | +1.536 |
a | +1.484 |
Neg logit contributions | |
umm | -7.372 |
rol | -7.173 |
ubb | -7.087 |
osity | -7.053 |
lor | -7.053 |
Token | his |
Token ID | 465 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.886 |
, | +3.773 |
. | +3.656 |
the | +3.347 |
a | +3.288 |
Neg logit contributions | |
umm | -5.416 |
ubb | -5.276 |
lor | -5.230 |
ocol | -5.221 |
rol | -5.193 |
Token | room |
Token ID | 2119 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.203 |
, | +5.053 |
. | +4.982 |
the | +4.829 |
a | +4.723 |
Neg logit contributions | |
umm | -4.227 |
lor | -3.960 |
ubb | -3.905 |
rim | -3.888 |
vation | -3.884 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.508 |
, | +1.439 |
. | +1.310 |
the | +1.277 |
a | +1.159 |
Neg logit contributions | |
umm | -7.626 |
lor | -7.499 |
rol | -7.465 |
arians | -7.387 |
vation | -7.371 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
, | +2.541 |
and | +2.529 |
. | +2.468 |
the | +2.216 |
a | +2.143 |
Neg logit contributions | |
umm | -6.649 |
rol | -6.499 |
lor | -6.451 |
rim | -6.402 |
ubb | -6.389 |
Token | he |
Token ID | 339 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.971 |
, | +2.899 |
. | +2.835 |
the | +2.553 |
a | +2.477 |
Neg logit contributions | |
umm | -6.350 |
rol | -6.178 |
lor | -6.164 |
osity | -6.078 |
ubb | -6.071 |
Token | never |
Token ID | 1239 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.863 |
, | +3.764 |
. | +3.677 |
the | +3.487 |
a | +3.388 |
Neg logit contributions | |
umm | -5.615 |
lor | -5.391 |
rol | -5.385 |
vation | -5.313 |
ubb | -5.286 |
Token | had |
Token ID | 550 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.339 |
, | +4.226 |
. | +4.143 |
the | +3.958 |
a | +3.861 |
Neg logit contributions | |
umm | -5.027 |
rol | -4.857 |
lor | -4.828 |
osity | -4.783 |
rim | -4.777 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.869 |
, | +2.758 |
. | +2.628 |
the | +2.378 |
a | +2.244 |
Neg logit contributions | |
umm | -6.449 |
lor | -6.332 |
rol | -6.330 |
ubb | -6.237 |
rim | -6.210 |
Token | good |
Token ID | 922 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.847 |
, | +5.721 |
. | +5.678 |
the | +5.513 |
a | +5.369 |
Neg logit contributions | |
umm | -3.551 |
lor | -3.369 |
rol | -3.297 |
vation | -3.282 |
ubb | -3.275 |
Token | went |
Token ID | 1816 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.405 |
, | +3.358 |
. | +3.300 |
the | +3.067 |
a | +2.954 |
Neg logit contributions | |
umm | -5.844 |
lor | -5.730 |
rol | -5.698 |
arians | -5.643 |
rim | -5.613 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.830 |
, | +1.762 |
. | +1.696 |
the | +1.480 |
a | +1.376 |
Neg logit contributions | |
umm | -7.449 |
rol | -7.324 |
lor | -7.299 |
vation | -7.244 |
osity | -7.199 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.132 |
, | +2.064 |
. | +1.945 |
the | +1.548 |
a | +1.523 |
Neg logit contributions | |
umm | -7.054 |
vation | -6.951 |
rol | -6.922 |
lor | -6.880 |
arians | -6.864 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.706 |
, | +4.601 |
. | +4.498 |
the | +4.249 |
a | +4.146 |
Neg logit contributions | |
umm | -4.814 |
lor | -4.580 |
rol | -4.505 |
vation | -4.489 |
osity | -4.464 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.173 |
, | +4.075 |
. | +3.981 |
the | +3.855 |
a | +3.784 |
Neg logit contributions | |
umm | -5.155 |
lor | -4.919 |
rol | -4.849 |
rim | -4.818 |
ubb | -4.812 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.918 |
, | +1.859 |
. | +1.790 |
the | +1.668 |
a | +1.619 |
Neg logit contributions | |
umm | -7.003 |
lor | -6.968 |
rol | -6.938 |
arians | -6.908 |
vation | -6.877 |
Token | said |
Token ID | 531 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.378 |
, | +3.287 |
. | +3.247 |
the | +2.868 |
a | +2.842 |
Neg logit contributions | |
umm | -5.818 |
vation | -5.681 |
arians | -5.664 |
lor | -5.662 |
rol | -5.658 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.791 |
. | +1.581 |
, | +1.577 |
the | +1.375 |
a | +1.275 |
Neg logit contributions | |
umm | -7.552 |
lor | -7.402 |
rol | -7.345 |
osity | -7.307 |
ubb | -7.292 |
Token | " |
Token ID | 366 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.554 |
, | +2.448 |
. | +2.401 |
the | +2.228 |
a | +2.116 |
Neg logit contributions | |
umm | -6.534 |
osity | -6.442 |
lor | -6.404 |
arians | -6.378 |
rol | -6.370 |
Token | I |
Token ID | 40 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.996 |
, | +5.974 |
. | +5.842 |
the | +5.615 |
a | +5.524 |
Neg logit contributions | |
umm | -3.541 |
lor | -3.350 |
rol | -3.300 |
vation | -3.287 |
rim | -3.215 |
Token | can |
Token ID | 460 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.389 |
, | +4.299 |
. | +4.214 |
the | +4.023 |
a | +3.923 |
Neg logit contributions | |
umm | -5.073 |
lor | -4.873 |
rol | -4.863 |
vation | -4.786 |
ubb | -4.764 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.585 |
, | +3.535 |
. | +3.392 |
the | +3.091 |
a | +2.923 |
Neg logit contributions | |
umm | -5.623 |
lor | -5.588 |
rol | -5.531 |
osity | -5.425 |
ubb | -5.409 |
Token | flat |
Token ID | 6228 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.308 |
, | +4.180 |
. | +4.149 |
the | +3.949 |
a | +3.787 |
Neg logit contributions | |
umm | -5.063 |
lor | -4.863 |
rol | -4.777 |
ubb | -4.770 |
vation | -4.766 |
Token | tire |
Token ID | 15867 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.155 |
. | +5.042 |
, | +5.033 |
the | +4.896 |
a | +4.767 |
Neg logit contributions | |
umm | -4.152 |
lor | -3.929 |
rol | -3.839 |
rim | -3.825 |
ocol | -3.809 |
Token | on |
Token ID | 319 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.823 |
, | +1.757 |
the | +1.617 |
. | +1.599 |
a | +1.473 |
Neg logit contributions | |
umm | -7.242 |
rol | -7.090 |
lor | -7.059 |
arians | -7.000 |
vation | -6.974 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.340 |
, | +2.239 |
. | +2.098 |
the | +1.743 |
a | +1.694 |
Neg logit contributions | |
umm | -6.829 |
lor | -6.682 |
ocol | -6.666 |
arians | -6.626 |
rol | -6.626 |
Token | bike |
Token ID | 7161 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.929 |
, | +4.823 |
. | +4.715 |
the | +4.575 |
a | +4.493 |
Neg logit contributions | |
umm | -4.357 |
lor | -4.237 |
vation | -4.089 |
rim | -4.071 |
arians | -4.047 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.787 |
, | +0.725 |
the | +0.580 |
. | +0.539 |
a | +0.485 |
Neg logit contributions | |
umm | -8.258 |
rol | -8.210 |
lor | -8.199 |
vation | -8.109 |
arians | -8.074 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.697 |
, | +2.621 |
. | +2.533 |
the | +2.312 |
a | +2.245 |
Neg logit contributions | |
umm | -6.666 |
lor | -6.470 |
rol | -6.467 |
vation | -6.392 |
arians | -6.345 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.452 |
, | +1.384 |
. | +1.270 |
the | +1.095 |
a | +1.014 |
Neg logit contributions | |
umm | -7.753 |
lor | -7.702 |
rol | -7.645 |
vation | -7.563 |
rim | -7.548 |
Token | Tom |
Token ID | 13787 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.656 |
, | +4.570 |
. | +4.483 |
the | +4.289 |
a | +4.190 |
Neg logit contributions | |
umm | -4.813 |
lor | -4.619 |
rol | -4.606 |
vation | -4.536 |
rim | -4.503 |
Token | wanted |
Token ID | 2227 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.152 |
, | +3.100 |
. | +3.077 |
the | +2.888 |
a | +2.778 |
Neg logit contributions | |
umm | -5.899 |
lor | -5.839 |
arians | -5.785 |
rol | -5.780 |
rim | -5.726 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.590 |
, | +2.474 |
. | +2.411 |
the | +2.155 |
a | +2.053 |
Neg logit contributions | |
umm | -6.778 |
rol | -6.550 |
lor | -6.525 |
vation | -6.504 |
osity | -6.463 |
Token | saw |
Token ID | 2497 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.197 |
, | +3.135 |
. | +3.079 |
the | +2.885 |
a | +2.785 |
Neg logit contributions | |
umm | -6.057 |
lor | -5.905 |
rol | -5.856 |
rim | -5.817 |
vation | -5.803 |
Token | an |
Token ID | 281 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.036 |
, | +0.936 |
. | +0.858 |
the | +0.482 |
a | +0.329 |
Neg logit contributions | |
umm | -8.285 |
rol | -8.113 |
lor | -8.099 |
rim | -8.033 |
osity | -8.027 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.566 |
, | +4.488 |
. | +4.420 |
the | +4.222 |
a | +4.100 |
Neg logit contributions | |
umm | -4.863 |
rol | -4.572 |
lor | -4.547 |
rim | -4.537 |
ubb | -4.531 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.897 |
, | +4.806 |
. | +4.719 |
the | +4.587 |
a | +4.474 |
Neg logit contributions | |
umm | -4.477 |
lor | -4.183 |
rim | -4.142 |
rol | -4.136 |
ubb | -4.107 |
Token | who |
Token ID | 508 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.373 |
, | +2.306 |
. | +2.155 |
the | +2.051 |
a | +1.985 |
Neg logit contributions | |
umm | -6.739 |
rol | -6.667 |
lor | -6.649 |
rim | -6.597 |
vation | -6.587 |
Token | needed |
Token ID | 2622 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.691 |
, | +3.617 |
. | +3.527 |
the | +3.308 |
a | +3.233 |
Neg logit contributions | |
umm | -5.604 |
rol | -5.450 |
lor | -5.419 |
vation | -5.366 |
rim | -5.353 |
Token | help |
Token ID | 1037 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.031 |
, | +2.887 |
. | +2.765 |
the | +2.475 |
a | +2.296 |
Neg logit contributions | |
umm | -6.160 |
ocol | -6.057 |
lor | -6.044 |
rol | -5.974 |
vation | -5.951 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.263 |
, | +1.129 |
. | +0.909 |
the | +0.846 |
a | +0.760 |
Neg logit contributions | |
umm | -7.627 |
rim | -7.561 |
ocol | -7.543 |
arians | -7.534 |
uries | -7.507 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.346 |
, | +3.271 |
. | +3.168 |
the | +2.931 |
a | +2.869 |
Neg logit contributions | |
umm | -6.021 |
lor | -5.824 |
rol | -5.800 |
vation | -5.730 |
osity | -5.693 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.262 |
, | +4.157 |
. | +4.055 |
the | +3.856 |
a | +3.757 |
Neg logit contributions | |
umm | -5.210 |
lor | -5.004 |
rol | -4.951 |
vation | -4.941 |
ubb | -4.920 |
Token | needed |
Token ID | 2622 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.691 |
, | +3.617 |
. | +3.527 |
the | +3.308 |
a | +3.233 |
Neg logit contributions | |
umm | -5.604 |
rol | -5.450 |
lor | -5.419 |
vation | -5.366 |
rim | -5.353 |
Token | help |
Token ID | 1037 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.031 |
, | +2.887 |
. | +2.765 |
the | +2.475 |
a | +2.296 |
Neg logit contributions | |
umm | -6.160 |
ocol | -6.057 |
lor | -6.044 |
rol | -5.974 |
vation | -5.951 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.263 |
, | +1.129 |
. | +0.909 |
the | +0.846 |
a | +0.760 |
Neg logit contributions | |
umm | -7.627 |
rim | -7.561 |
ocol | -7.543 |
arians | -7.534 |
uries | -7.507 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.346 |
, | +3.271 |
. | +3.168 |
the | +2.931 |
a | +2.869 |
Neg logit contributions | |
umm | -6.021 |
lor | -5.824 |
rol | -5.800 |
vation | -5.730 |
osity | -5.693 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.262 |
, | +4.157 |
. | +4.055 |
the | +3.856 |
a | +3.757 |
Neg logit contributions | |
umm | -5.210 |
lor | -5.004 |
rol | -4.951 |
vation | -4.941 |
ubb | -4.920 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.175 |
, | +4.064 |
. | +3.977 |
the | +3.817 |
a | +3.722 |
Neg logit contributions | |
umm | -5.188 |
lor | -4.975 |
vation | -4.929 |
rol | -4.911 |
ubb | -4.887 |
Token | had |
Token ID | 550 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.763 |
, | +3.664 |
. | +3.593 |
the | +3.407 |
a | +3.319 |
Neg logit contributions | |
umm | -5.478 |
rol | -5.353 |
lor | -5.324 |
vation | -5.266 |
osity | -5.253 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.585 |
, | +3.535 |
. | +3.392 |
the | +3.091 |
a | +2.923 |
Neg logit contributions | |
umm | -5.623 |
lor | -5.588 |
rol | -5.531 |
osity | -5.425 |
ubb | -5.409 |
Token | flat |
Token ID | 6228 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.308 |
, | +4.180 |
. | +4.149 |
the | +3.949 |
a | +3.787 |
Neg logit contributions | |
umm | -5.063 |
lor | -4.863 |
rol | -4.777 |
ubb | -4.770 |
vation | -4.766 |
Token | tire |
Token ID | 15867 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.155 |
. | +5.042 |
, | +5.033 |
the | +4.896 |
a | +4.767 |
Neg logit contributions | |
umm | -4.152 |
lor | -3.929 |
rol | -3.839 |
rim | -3.825 |
ocol | -3.809 |
Token | on |
Token ID | 319 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.823 |
, | +1.757 |
the | +1.617 |
. | +1.599 |
a | +1.473 |
Neg logit contributions | |
umm | -7.242 |
rol | -7.090 |
lor | -7.059 |
arians | -7.000 |
vation | -6.974 |
Token | your |
Token ID | 534 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.836 |
, | +2.686 |
. | +2.607 |
a | +2.254 |
the | +2.232 |
Neg logit contributions | |
umm | -6.323 |
lor | -6.239 |
ocol | -6.226 |
arians | -6.221 |
icians | -6.179 |
Token | bike |
Token ID | 7161 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.313 |
, | +5.212 |
. | +5.075 |
the | +4.949 |
a | +4.870 |
Neg logit contributions | |
umm | -4.033 |
ubb | -3.756 |
lor | -3.739 |
former | -3.722 |
arians | -3.714 |
Token | ." |
Token ID | 526 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.897 |
, | +2.758 |
. | +2.650 |
the | +2.623 |
a | +2.519 |
Neg logit contributions | |
umm | -6.301 |
lor | -6.160 |
rol | -6.110 |
arians | -6.096 |
vation | -6.068 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.154 |
, | +3.076 |
. | +2.981 |
the | +2.773 |
a | +2.687 |
Neg logit contributions | |
umm | -6.234 |
lor | -5.998 |
rol | -5.976 |
vation | -5.960 |
arians | -5.902 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.949 |
, | +3.853 |
. | +3.762 |
the | +3.558 |
a | +3.461 |
Neg logit contributions | |
umm | -5.517 |
lor | -5.313 |
rol | -5.287 |
vation | -5.235 |
ubb | -5.221 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.091 |
, | +3.981 |
. | +3.904 |
the | +3.726 |
a | +3.638 |
Neg logit contributions | |
umm | -5.301 |
lor | -5.089 |
rol | -5.049 |
ubb | -5.003 |
vation | -5.002 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.446 |
, | +3.360 |
. | +3.281 |
the | +3.094 |
a | +3.000 |
Neg logit contributions | |
umm | -5.924 |
rol | -5.732 |
lor | -5.732 |
vation | -5.659 |
ubb | -5.627 |
Token | happy |
Token ID | 3772 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.217 |
, | +3.118 |
. | +3.052 |
the | +2.791 |
a | +2.655 |
Neg logit contributions | |
umm | -6.060 |
rol | -5.953 |
lor | -5.907 |
ubb | -5.852 |
rim | -5.850 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.992 |
, | +0.935 |
. | +0.826 |
the | +0.700 |
a | +0.619 |
Neg logit contributions | |
umm | -8.233 |
lor | -8.022 |
rol | -7.977 |
osity | -7.936 |
rim | -7.917 |
Token | said |
Token ID | 531 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.611 |
, | +3.522 |
. | +3.462 |
the | +3.209 |
a | +3.137 |
Neg logit contributions | |
umm | -5.769 |
rol | -5.541 |
lor | -5.536 |
vation | -5.496 |
osity | -5.479 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.373 |
, | +1.166 |
. | +1.157 |
the | +0.953 |
a | +0.861 |
Neg logit contributions | |
umm | -8.004 |
lor | -7.825 |
rol | -7.795 |
ubb | -7.725 |
osity | -7.722 |
Token | can |
Token ID | 460 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.389 |
, | +4.299 |
. | +4.214 |
the | +4.023 |
a | +3.923 |
Neg logit contributions | |
umm | -5.073 |
lor | -4.873 |
rol | -4.863 |
vation | -4.786 |
ubb | -4.764 |
Token | help |
Token ID | 1037 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.383 |
, | +4.273 |
. | +4.201 |
the | +4.028 |
a | +3.919 |
Neg logit contributions | |
umm | -4.951 |
lor | -4.785 |
vation | -4.752 |
rol | -4.718 |
arians | -4.715 |
Token | you |
Token ID | 345 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.217 |
, | +3.046 |
. | +2.953 |
the | +2.705 |
a | +2.700 |
Neg logit contributions | |
umm | -5.917 |
arians | -5.879 |
vation | -5.807 |
lor | -5.773 |
rim | -5.769 |
Token | fix |
Token ID | 4259 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.077 |
, | +3.930 |
. | +3.838 |
the | +3.786 |
a | +3.669 |
Neg logit contributions | |
umm | -5.109 |
lor | -5.034 |
vation | -4.937 |
arians | -4.919 |
rim | -4.889 |
Token | your |
Token ID | 534 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.836 |
, | +2.686 |
. | +2.607 |
a | +2.254 |
the | +2.232 |
Neg logit contributions | |
umm | -6.323 |
lor | -6.239 |
ocol | -6.226 |
arians | -6.221 |
icians | -6.179 |
Token | bike |
Token ID | 7161 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.313 |
, | +5.212 |
. | +5.075 |
the | +4.949 |
a | +4.870 |
Neg logit contributions | |
umm | -4.033 |
ubb | -3.756 |
lor | -3.739 |
former | -3.722 |
arians | -3.714 |
Token | ." |
Token ID | 526 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.897 |
, | +2.758 |
. | +2.650 |
the | +2.623 |
a | +2.519 |
Neg logit contributions | |
umm | -6.301 |
lor | -6.160 |
rol | -6.110 |
arians | -6.096 |
vation | -6.068 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.154 |
, | +3.076 |
. | +2.981 |
the | +2.773 |
a | +2.687 |
Neg logit contributions | |
umm | -6.234 |
lor | -5.998 |
rol | -5.976 |
vation | -5.960 |
arians | -5.902 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.949 |
, | +3.853 |
. | +3.762 |
the | +3.558 |
a | +3.461 |
Neg logit contributions | |
umm | -5.517 |
lor | -5.313 |
rol | -5.287 |
vation | -5.235 |
ubb | -5.221 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.091 |
, | +3.981 |
. | +3.904 |
the | +3.726 |
a | +3.638 |
Neg logit contributions | |
umm | -5.301 |
lor | -5.089 |
rol | -5.049 |
ubb | -5.003 |
vation | -5.002 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.446 |
, | +3.360 |
. | +3.281 |
the | +3.094 |
a | +3.000 |
Neg logit contributions | |
umm | -5.924 |
rol | -5.732 |
lor | -5.732 |
vation | -5.659 |
ubb | -5.627 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.154 |
, | +3.076 |
. | +2.981 |
the | +2.773 |
a | +2.687 |
Neg logit contributions | |
umm | -6.234 |
lor | -5.998 |
rol | -5.976 |
vation | -5.960 |
arians | -5.902 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.949 |
, | +3.853 |
. | +3.762 |
the | +3.558 |
a | +3.461 |
Neg logit contributions | |
umm | -5.517 |
lor | -5.313 |
rol | -5.287 |
vation | -5.235 |
ubb | -5.221 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.091 |
, | +3.981 |
. | +3.904 |
the | +3.726 |
a | +3.638 |
Neg logit contributions | |
umm | -5.301 |
lor | -5.089 |
rol | -5.049 |
ubb | -5.003 |
vation | -5.002 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.446 |
, | +3.360 |
. | +3.281 |
the | +3.094 |
a | +3.000 |
Neg logit contributions | |
umm | -5.924 |
rol | -5.732 |
lor | -5.732 |
vation | -5.659 |
ubb | -5.627 |
Token | happy |
Token ID | 3772 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.217 |
, | +3.118 |
. | +3.052 |
the | +2.791 |
a | +2.655 |
Neg logit contributions | |
umm | -6.060 |
rol | -5.953 |
lor | -5.907 |
ubb | -5.852 |
rim | -5.850 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.992 |
, | +0.935 |
. | +0.826 |
the | +0.700 |
a | +0.619 |
Neg logit contributions | |
umm | -8.233 |
lor | -8.022 |
rol | -7.977 |
osity | -7.936 |
rim | -7.917 |
Token | said |
Token ID | 531 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.611 |
, | +3.522 |
. | +3.462 |
the | +3.209 |
a | +3.137 |
Neg logit contributions | |
umm | -5.769 |
rol | -5.541 |
lor | -5.536 |
vation | -5.496 |
osity | -5.479 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.373 |
, | +1.166 |
. | +1.157 |
the | +0.953 |
a | +0.861 |
Neg logit contributions | |
umm | -8.004 |
lor | -7.825 |
rol | -7.795 |
ubb | -7.725 |
osity | -7.722 |
Token | " |
Token ID | 366 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.418 |
, | +2.374 |
. | +2.312 |
the | +2.089 |
a | +2.009 |
Neg logit contributions | |
umm | -6.785 |
lor | -6.616 |
rol | -6.592 |
osity | -6.569 |
arians | -6.558 |
Token | Thank |
Token ID | 10449 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +5.742 |
, | +5.659 |
. | +5.569 |
the | +5.374 |
a | +5.276 |
Neg logit contributions | |
umm | -3.743 |
lor | -3.539 |
rol | -3.527 |
vation | -3.454 |
ubb | -3.425 |
Token | you |
Token ID | 345 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.283 |
, | +3.156 |
. | +3.067 |
the | +2.855 |
a | +2.775 |
Neg logit contributions | |
umm | -6.178 |
lor | -6.002 |
rol | -5.940 |
vation | -5.922 |
ubb | -5.869 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.160 |
, | +3.125 |
. | +3.023 |
the | +2.834 |
a | +2.742 |
Neg logit contributions | |
umm | -6.111 |
rol | -5.913 |
lor | -5.912 |
vation | -5.884 |
arians | -5.818 |
Token |
|
Token ID | 198 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.469 |
, | +1.409 |
. | +1.291 |
the | +1.115 |
a | +1.029 |
Neg logit contributions | |
umm | -7.749 |
lor | -7.712 |
rol | -7.644 |
vation | -7.584 |
rim | -7.563 |
Token | Together |
Token ID | 41631 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.799 |
, | +4.722 |
. | +4.633 |
the | +4.437 |
a | +4.336 |
Neg logit contributions | |
umm | -4.647 |
lor | -4.462 |
rol | -4.441 |
vation | -4.381 |
rim | -4.346 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.228 |
, | +0.099 |
. | +0.060 |
the | -0.133 |
a | -0.212 |
Neg logit contributions | |
umm | -9.158 |
lor | -8.916 |
rol | -8.915 |
vation | -8.838 |
ubb | -8.815 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.274 |
, | +2.179 |
. | +2.108 |
the | +1.857 |
a | +1.782 |
Neg logit contributions | |
umm | -7.107 |
rol | -6.888 |
lor | -6.848 |
vation | -6.833 |
ubb | -6.792 |
Token | and |
Token ID | 290 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.192 |
, | +3.144 |
. | +3.099 |
the | +2.930 |
a | +2.838 |
Neg logit contributions | |
umm | -5.989 |
lor | -5.853 |
rol | -5.801 |
vation | -5.758 |
arians | -5.750 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.739 |
, | +0.637 |
. | +0.561 |
the | +0.207 |
a | +0.192 |
Neg logit contributions | |
umm | -8.672 |
rol | -8.399 |
vation | -8.379 |
ubb | -8.375 |
osity | -8.352 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.688 |
, | +3.593 |
. | +3.503 |
the | +3.290 |
a | +3.190 |
Neg logit contributions | |
umm | -5.779 |
lor | -5.561 |
rol | -5.543 |
vation | -5.491 |
ubb | -5.486 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.140 |
, | +4.036 |
. | +3.949 |
the | +3.768 |
a | +3.682 |
Neg logit contributions | |
umm | -5.299 |
lor | -5.068 |
rol | -5.057 |
ubb | -5.011 |
vation | -4.991 |
Token | fixed |
Token ID | 5969 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.024 |
, | +3.941 |
. | +3.852 |
the | +3.673 |
a | +3.584 |
Neg logit contributions | |
umm | -5.341 |
rol | -5.152 |
lor | -5.141 |
vation | -5.075 |
ubb | -5.050 |
Token | the |
Token ID | 262 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.190 |
, | +2.131 |
. | +2.047 |
a | +1.714 |
the | +1.662 |
Neg logit contributions | |
umm | -6.945 |
rol | -6.782 |
arians | -6.778 |
ocol | -6.735 |
ubb | -6.728 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.155 |
, | +0.011 |
. | -0.029 |
the | -0.218 |
a | -0.315 |
Neg logit contributions | |
umm | -9.220 |
lor | -9.017 |
rol | -9.013 |
vation | -8.939 |
ubb | -8.913 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.590 |
, | +2.474 |
. | +2.411 |
the | +2.155 |
a | +2.053 |
Neg logit contributions | |
umm | -6.778 |
rol | -6.550 |
lor | -6.525 |
vation | -6.504 |
osity | -6.463 |
Token | saw |
Token ID | 2497 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.197 |
, | +3.135 |
. | +3.079 |
the | +2.885 |
a | +2.785 |
Neg logit contributions | |
umm | -6.057 |
lor | -5.905 |
rol | -5.856 |
rim | -5.817 |
vation | -5.803 |
Token | an |
Token ID | 281 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.036 |
, | +0.936 |
. | +0.858 |
the | +0.482 |
a | +0.329 |
Neg logit contributions | |
umm | -8.285 |
rol | -8.113 |
lor | -8.099 |
rim | -8.033 |
osity | -8.027 |
Token | unknown |
Token ID | 6439 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.566 |
, | +4.488 |
. | +4.420 |
the | +4.222 |
a | +4.100 |
Neg logit contributions | |
umm | -4.863 |
rol | -4.572 |
lor | -4.547 |
rim | -4.537 |
ubb | -4.531 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.897 |
, | +4.806 |
. | +4.719 |
the | +4.587 |
a | +4.474 |
Neg logit contributions | |
umm | -4.477 |
lor | -4.183 |
rim | -4.142 |
rol | -4.136 |
ubb | -4.107 |
Token | who |
Token ID | 508 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.373 |
, | +2.306 |
. | +2.155 |
the | +2.051 |
a | +1.985 |
Neg logit contributions | |
umm | -6.739 |
rol | -6.667 |
lor | -6.649 |
rim | -6.597 |
vation | -6.587 |
Token | needed |
Token ID | 2622 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.691 |
, | +3.617 |
. | +3.527 |
the | +3.308 |
a | +3.233 |
Neg logit contributions | |
umm | -5.604 |
rol | -5.450 |
lor | -5.419 |
vation | -5.366 |
rim | -5.353 |
Token | help |
Token ID | 1037 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.031 |
, | +2.887 |
. | +2.765 |
the | +2.475 |
a | +2.296 |
Neg logit contributions | |
umm | -6.160 |
ocol | -6.057 |
lor | -6.044 |
rol | -5.974 |
vation | -5.951 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.263 |
, | +1.129 |
. | +0.909 |
the | +0.846 |
a | +0.760 |
Neg logit contributions | |
umm | -7.627 |
rim | -7.561 |
ocol | -7.543 |
arians | -7.534 |
uries | -7.507 |
Token | The |
Token ID | 383 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.346 |
, | +3.271 |
. | +3.168 |
the | +2.931 |
a | +2.869 |
Neg logit contributions | |
umm | -6.021 |
lor | -5.824 |
rol | -5.800 |
vation | -5.730 |
osity | -5.693 |
Token | there |
Token ID | 612 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.979 |
, | +1.842 |
. | +1.810 |
the | +1.569 |
a | +1.451 |
Neg logit contributions | |
umm | -7.255 |
rol | -7.136 |
lor | -7.086 |
ubb | -7.028 |
osity | -7.025 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.628 |
, | +1.502 |
. | +1.457 |
the | +1.239 |
a | +1.170 |
Neg logit contributions | |
umm | -7.697 |
lor | -7.525 |
rol | -7.521 |
rim | -7.416 |
vation | -7.402 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.663 |
, | +0.602 |
. | +0.517 |
the | +0.260 |
a | +0.081 |
Neg logit contributions | |
umm | -8.684 |
rol | -8.487 |
lor | -8.455 |
rim | -8.378 |
ubb | -8.367 |
Token | kind |
Token ID | 1611 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.044 |
, | +2.954 |
. | +2.876 |
the | +2.681 |
a | +2.582 |
Neg logit contributions | |
umm | -6.353 |
lor | -6.127 |
rol | -6.101 |
vation | -6.052 |
rim | -6.046 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.299 |
, | +4.216 |
. | +4.157 |
the | +3.983 |
a | +3.895 |
Neg logit contributions | |
umm | -5.065 |
lor | -4.816 |
rol | -4.782 |
rim | -4.753 |
ubb | -4.729 |
Token | named |
Token ID | 3706 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.690 |
, | +3.598 |
. | +3.482 |
the | +3.355 |
a | +3.276 |
Neg logit contributions | |
umm | -5.572 |
lor | -5.431 |
rol | -5.416 |
rim | -5.386 |
vation | -5.305 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.352 |
, | +3.172 |
. | +3.105 |
the | +2.808 |
a | +2.708 |
Neg logit contributions | |
umm | -6.090 |
rol | -5.844 |
lor | -5.812 |
arians | -5.784 |
osity | -5.781 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.433 |
, | +0.376 |
. | +0.193 |
the | +0.134 |
a | +0.040 |
Neg logit contributions | |
lor | -8.543 |
umm | -8.529 |
rim | -8.479 |
rol | -8.453 |
osity | -8.361 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.945 |
, | +2.858 |
. | +2.770 |
the | +2.580 |
a | +2.481 |
Neg logit contributions | |
umm | -6.507 |
lor | -6.317 |
rol | -6.302 |
vation | -6.227 |
ubb | -6.207 |
Token | liked |
Token ID | 8288 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.369 |
, | +3.288 |
. | +3.207 |
the | +3.020 |
a | +2.918 |
Neg logit contributions | |
umm | -5.979 |
lor | -5.797 |
rol | -5.772 |
vation | -5.705 |
rim | -5.702 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.319 |
, | +1.250 |
. | +1.164 |
the | +0.934 |
a | +0.841 |
Neg logit contributions | |
umm | -8.076 |
lor | -7.843 |
rol | -7.839 |
rim | -7.769 |
osity | -7.763 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.520 |
, | +1.430 |
. | +1.345 |
the | +1.154 |
a | +1.056 |
Neg logit contributions | |
umm | -7.924 |
lor | -7.723 |
rol | -7.714 |
vation | -7.638 |
ubb | -7.615 |
Token | Once |
Token ID | 7454 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.981 |
, | +1.906 |
. | +1.778 |
the | +1.603 |
a | +1.511 |
Neg logit contributions | |
umm | -7.346 |
lor | -7.231 |
rol | -7.182 |
vation | -7.098 |
rim | -7.058 |
Token | upon |
Token ID | 2402 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.123 |
, | +3.990 |
. | +3.929 |
the | +3.735 |
a | +3.685 |
Neg logit contributions | |
umm | -5.160 |
rol | -5.012 |
lor | -5.009 |
osity | -4.909 |
ubb | -4.906 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.614 |
, | +0.596 |
. | +0.426 |
the | +0.225 |
a | +0.026 |
Neg logit contributions | |
umm | -8.560 |
lor | -8.487 |
rol | -8.429 |
vation | -8.368 |
rim | -8.325 |
Token | time |
Token ID | 640 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.018 |
, | +2.931 |
. | +2.849 |
the | +2.702 |
a | +2.572 |
Neg logit contributions | |
umm | -6.339 |
lor | -6.160 |
rol | -6.116 |
rim | -6.069 |
vation | -6.062 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.220 |
. | +0.048 |
, | +0.021 |
the | -0.139 |
a | -0.233 |
Neg logit contributions | |
umm | -9.065 |
lor | -8.921 |
rol | -8.914 |
ubb | -8.800 |
rim | -8.798 |
Token | there |
Token ID | 612 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.979 |
, | +1.842 |
. | +1.810 |
the | +1.569 |
a | +1.451 |
Neg logit contributions | |
umm | -7.255 |
rol | -7.136 |
lor | -7.086 |
ubb | -7.028 |
osity | -7.025 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.628 |
, | +1.502 |
. | +1.457 |
the | +1.239 |
a | +1.170 |
Neg logit contributions | |
umm | -7.697 |
lor | -7.525 |
rol | -7.521 |
rim | -7.416 |
vation | -7.402 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.663 |
, | +0.602 |
. | +0.517 |
the | +0.260 |
a | +0.081 |
Neg logit contributions | |
umm | -8.684 |
rol | -8.487 |
lor | -8.455 |
rim | -8.378 |
ubb | -8.367 |
Token | kind |
Token ID | 1611 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.044 |
, | +2.954 |
. | +2.876 |
the | +2.681 |
a | +2.582 |
Neg logit contributions | |
umm | -6.353 |
lor | -6.127 |
rol | -6.101 |
vation | -6.052 |
rim | -6.046 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.299 |
, | +4.216 |
. | +4.157 |
the | +3.983 |
a | +3.895 |
Neg logit contributions | |
umm | -5.065 |
lor | -4.816 |
rol | -4.782 |
rim | -4.753 |
ubb | -4.729 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.220 |
. | +0.048 |
, | +0.021 |
the | -0.139 |
a | -0.233 |
Neg logit contributions | |
umm | -9.065 |
lor | -8.921 |
rol | -8.914 |
ubb | -8.800 |
rim | -8.798 |
Token | there |
Token ID | 612 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.979 |
, | +1.842 |
. | +1.810 |
the | +1.569 |
a | +1.451 |
Neg logit contributions | |
umm | -7.255 |
rol | -7.136 |
lor | -7.086 |
ubb | -7.028 |
osity | -7.025 |
Token | was |
Token ID | 373 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +1.628 |
, | +1.502 |
. | +1.457 |
the | +1.239 |
a | +1.170 |
Neg logit contributions | |
umm | -7.697 |
lor | -7.525 |
rol | -7.521 |
rim | -7.416 |
vation | -7.402 |
Token | a |
Token ID | 257 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.663 |
, | +0.602 |
. | +0.517 |
the | +0.260 |
a | +0.081 |
Neg logit contributions | |
umm | -8.684 |
rol | -8.487 |
lor | -8.455 |
rim | -8.378 |
ubb | -8.367 |
Token | kind |
Token ID | 1611 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.044 |
, | +2.954 |
. | +2.876 |
the | +2.681 |
a | +2.582 |
Neg logit contributions | |
umm | -6.353 |
lor | -6.127 |
rol | -6.101 |
vation | -6.052 |
rim | -6.046 |
Token | person |
Token ID | 1048 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +4.299 |
, | +4.216 |
. | +4.157 |
the | +3.983 |
a | +3.895 |
Neg logit contributions | |
umm | -5.065 |
lor | -4.816 |
rol | -4.782 |
rim | -4.753 |
ubb | -4.729 |
Token | named |
Token ID | 3706 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.690 |
, | +3.598 |
. | +3.482 |
the | +3.355 |
a | +3.276 |
Neg logit contributions | |
umm | -5.572 |
lor | -5.431 |
rol | -5.416 |
rim | -5.386 |
vation | -5.305 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.352 |
, | +3.172 |
. | +3.105 |
the | +2.808 |
a | +2.708 |
Neg logit contributions | |
umm | -6.090 |
rol | -5.844 |
lor | -5.812 |
arians | -5.784 |
osity | -5.781 |
Token | . |
Token ID | 13 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +0.433 |
, | +0.376 |
. | +0.193 |
the | +0.134 |
a | +0.040 |
Neg logit contributions | |
lor | -8.543 |
umm | -8.529 |
rim | -8.479 |
rol | -8.453 |
osity | -8.361 |
Token | Tom |
Token ID | 4186 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +2.945 |
, | +2.858 |
. | +2.770 |
the | +2.580 |
a | +2.481 |
Neg logit contributions | |
umm | -6.507 |
lor | -6.317 |
rol | -6.302 |
vation | -6.227 |
ubb | -6.207 |
Token | liked |
Token ID | 8288 |
Feature activation | -9.84e+01 |
Pos logit contributions | |
and | +3.369 |
, | +3.288 |
. | +3.207 |
the | +3.020 |
a | +2.918 |
Neg logit contributions | |
umm | -5.979 |
lor | -5.797 |
rol | -5.772 |
vation | -5.705 |
rim | -5.702 |