Token | he |
Token ID | 339 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.629 |
, | +2.598 |
. | +2.489 |
the | +2.312 |
a | +2.097 |
Neg logit contributions | |
umm | -6.098 |
lor | -6.088 |
former | -6.076 |
osity | -6.013 |
rol | -6.007 |
Token | had |
Token ID | 550 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.558 |
and | +3.541 |
. | +3.430 |
the | +3.360 |
a | +3.141 |
Neg logit contributions | |
lor | -5.324 |
former | -5.217 |
umm | -5.163 |
rol | -5.133 |
osity | -5.098 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.704 |
and | +1.701 |
. | +1.570 |
the | +1.451 |
a | +1.194 |
Neg logit contributions | |
lor | -7.242 |
former | -7.122 |
rol | -7.035 |
umm | -7.030 |
osity | -6.983 |
Token | take |
Token ID | 1011 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.789 |
, | +3.773 |
. | +3.633 |
the | +3.562 |
a | +3.325 |
Neg logit contributions | |
lor | -5.075 |
former | -5.033 |
umm | -4.929 |
ocol | -4.892 |
rol | -4.851 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.370 |
, | +2.337 |
. | +2.229 |
the | +2.087 |
a | +1.838 |
Neg logit contributions | |
lor | -6.506 |
former | -6.422 |
umm | -6.373 |
ocol | -6.339 |
rol | -6.309 |
Token | bath |
Token ID | 7837 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.338 |
, | +4.300 |
. | +4.185 |
the | +4.118 |
a | +3.871 |
Neg logit contributions | |
lor | -4.593 |
former | -4.459 |
umm | -4.426 |
rol | -4.369 |
bek | -4.363 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.666 |
, | +2.663 |
the | +2.555 |
. | +2.502 |
a | +2.315 |
Neg logit contributions | |
lor | -6.196 |
umm | -6.071 |
former | -6.048 |
rol | -6.041 |
arians | -5.905 |
Token | Even |
Token ID | 3412 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.645 |
and | +3.633 |
. | +3.484 |
the | +3.422 |
a | +3.188 |
Neg logit contributions | |
lor | -5.256 |
umm | -5.215 |
former | -5.208 |
rol | -5.115 |
osity | -5.095 |
Token | though |
Token ID | 996 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.131 |
and | +4.122 |
. | +4.011 |
the | +3.863 |
a | +3.688 |
Neg logit contributions | |
lor | -4.637 |
former | -4.620 |
umm | -4.594 |
rol | -4.551 |
osity | -4.548 |
Token | he |
Token ID | 339 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.122 |
, | +2.067 |
. | +1.966 |
the | +1.819 |
a | +1.635 |
Neg logit contributions | |
lor | -6.658 |
former | -6.621 |
umm | -6.566 |
ocol | -6.534 |
osity | -6.488 |
Token | didn |
Token ID | 1422 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.269 |
and | +3.252 |
. | +3.143 |
the | +3.072 |
a | +2.855 |
Neg logit contributions | |
lor | -5.616 |
former | -5.528 |
umm | -5.457 |
rol | -5.438 |
ocol | -5.394 |
Token | until |
Token ID | 1566 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.099 |
, | +2.081 |
the | +1.971 |
. | +1.958 |
a | +1.760 |
Neg logit contributions | |
lor | -6.616 |
former | -6.544 |
rol | -6.474 |
umm | -6.451 |
arians | -6.405 |
Token | they |
Token ID | 484 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.372 |
, | +2.269 |
. | +2.188 |
the | +2.039 |
a | +1.850 |
Neg logit contributions | |
lor | -6.429 |
former | -6.389 |
umm | -6.359 |
rol | -6.319 |
ocol | -6.294 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.432 |
, | +3.405 |
. | +3.295 |
the | +3.205 |
a | +2.997 |
Neg logit contributions | |
lor | -5.523 |
former | -5.352 |
umm | -5.349 |
rol | -5.341 |
bek | -5.281 |
Token | something |
Token ID | 1223 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.034 |
, | +1.991 |
. | +1.866 |
the | +1.698 |
a | +1.442 |
Neg logit contributions | |
lor | -6.848 |
former | -6.795 |
umm | -6.729 |
rol | -6.675 |
osity | -6.633 |
Token | gl |
Token ID | 1278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.355 |
, | +3.315 |
. | +3.152 |
the | +3.126 |
a | +2.896 |
Neg logit contributions | |
lor | -5.426 |
umm | -5.337 |
former | -5.305 |
rol | -5.298 |
ocol | -5.280 |
Token | immer |
Token ID | 10957 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +8.012 |
, | +7.998 |
. | +7.857 |
the | +7.825 |
a | +7.588 |
Neg logit contributions | |
lor | -1.023 |
former | -0.867 |
umm | -0.864 |
rol | -0.837 |
osity | -0.791 |
Token | ing |
Token ID | 278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.709 |
and | +4.706 |
the | +4.559 |
. | +4.531 |
a | +4.321 |
Neg logit contributions | |
lor | -4.156 |
umm | -4.085 |
rol | -4.037 |
osity | -3.946 |
former | -3.945 |
Token | in |
Token ID | 287 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.757 |
and | +2.753 |
. | +2.590 |
the | +2.544 |
a | +2.350 |
Neg logit contributions | |
lor | -6.030 |
rol | -5.925 |
umm | -5.911 |
former | -5.878 |
ocol | -5.853 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.868 |
and | +0.867 |
. | +0.707 |
the | +0.540 |
a | +0.359 |
Neg logit contributions | |
lor | -7.966 |
former | -7.919 |
umm | -7.878 |
ocol | -7.854 |
rol | -7.800 |
Token | distance |
Token ID | 5253 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.733 |
, | +4.720 |
. | +4.585 |
the | +4.507 |
a | +4.289 |
Neg logit contributions | |
lor | -4.191 |
umm | -4.123 |
former | -4.098 |
rol | -3.989 |
ocol | -3.954 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.315 |
, | +0.299 |
the | +0.116 |
. | +0.076 |
a | -0.021 |
Neg logit contributions | |
lor | -8.403 |
umm | -8.350 |
former | -8.273 |
rol | -8.272 |
ocol | -8.227 |
Token | I |
Token ID | 314 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.064 |
, | +2.984 |
. | +2.871 |
the | +2.723 |
a | +2.545 |
Neg logit contributions | |
lor | -5.861 |
ocol | -5.659 |
former | -5.658 |
umm | -5.640 |
osity | -5.613 |
Token | can |
Token ID | 460 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.770 |
, | +3.740 |
. | +3.611 |
the | +3.573 |
a | +3.330 |
Neg logit contributions | |
lor | -5.184 |
former | -5.018 |
umm | -4.982 |
ocol | -4.964 |
rol | -4.957 |
Token | find |
Token ID | 1064 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.970 |
, | +3.948 |
. | +3.817 |
the | +3.800 |
a | +3.552 |
Neg logit contributions | |
lor | -4.949 |
former | -4.796 |
umm | -4.781 |
rol | -4.721 |
ocol | -4.697 |
Token | something |
Token ID | 1223 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.782 |
, | +2.718 |
. | +2.601 |
the | +2.487 |
a | +2.251 |
Neg logit contributions | |
lor | -6.155 |
ocol | -5.991 |
umm | -5.934 |
former | -5.933 |
rol | -5.909 |
Token | gl |
Token ID | 1278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.238 |
, | +3.153 |
. | +3.032 |
the | +3.005 |
a | +2.774 |
Neg logit contributions | |
lor | -5.653 |
umm | -5.541 |
former | -5.532 |
rol | -5.466 |
ocol | -5.458 |
Token | immer |
Token ID | 10957 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +8.064 |
, | +8.053 |
. | +7.914 |
the | +7.912 |
a | +7.652 |
Neg logit contributions | |
lor | -0.979 |
former | -0.814 |
umm | -0.808 |
rol | -0.769 |
ocol | -0.744 |
Token | ing |
Token ID | 278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.610 |
, | +3.586 |
the | +3.465 |
. | +3.451 |
a | +3.222 |
Neg logit contributions | |
lor | -5.274 |
umm | -5.218 |
rol | -5.120 |
former | -5.084 |
ocol | -5.044 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.191 |
, | +3.181 |
. | +3.057 |
the | +2.979 |
a | +2.784 |
Neg logit contributions | |
lor | -5.649 |
umm | -5.522 |
former | -5.514 |
rol | -5.479 |
ocol | -5.471 |
Token | |
Token ID | 220 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.847 |
, | +2.842 |
. | +2.705 |
the | +2.611 |
a | +2.423 |
Neg logit contributions | |
lor | -5.976 |
former | -5.803 |
umm | -5.782 |
rol | -5.755 |
osity | -5.724 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.397 |
, | +1.385 |
. | +1.191 |
the | +1.169 |
a | +0.976 |
Neg logit contributions | |
lor | -7.543 |
rol | -7.305 |
former | -7.297 |
umm | -7.287 |
ocol | -7.200 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.409 |
, | +1.400 |
. | +1.256 |
the | +1.177 |
a | +0.980 |
Neg logit contributions | |
lor | -7.559 |
former | -7.285 |
rol | -7.271 |
umm | -7.236 |
bek | -7.221 |
Token | my |
Token ID | 1820 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.431 |
and | +3.421 |
. | +3.327 |
the | +3.251 |
a | +3.044 |
Neg logit contributions | |
lor | -5.461 |
rol | -5.280 |
former | -5.277 |
umm | -5.275 |
osity | -5.230 |
Token | brought |
Token ID | 3181 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.408 |
and | +3.396 |
. | +3.308 |
the | +3.234 |
a | +3.018 |
Neg logit contributions | |
lor | -5.476 |
former | -5.305 |
umm | -5.278 |
rol | -5.272 |
osity | -5.241 |
Token | her |
Token ID | 607 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.824 |
and | +1.808 |
. | +1.670 |
the | +1.564 |
a | +1.314 |
Neg logit contributions | |
lor | -7.076 |
former | -6.953 |
umm | -6.937 |
rol | -6.922 |
ocol | -6.879 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.502 |
and | +2.491 |
. | +2.353 |
the | +2.258 |
a | +1.995 |
Neg logit contributions | |
lor | -6.398 |
former | -6.312 |
umm | -6.246 |
rol | -6.207 |
ocol | -6.174 |
Token | special |
Token ID | 2041 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.483 |
, | +4.457 |
. | +4.349 |
the | +4.267 |
a | +4.020 |
Neg logit contributions | |
lor | -4.451 |
former | -4.327 |
umm | -4.304 |
rol | -4.240 |
bek | -4.228 |
Token | lunch |
Token ID | 9965 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.962 |
, | +4.932 |
. | +4.829 |
the | +4.791 |
a | +4.517 |
Neg logit contributions | |
lor | -3.932 |
former | -3.819 |
umm | -3.800 |
ocol | -3.719 |
bek | -3.692 |
Token | that |
Token ID | 326 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.502 |
and | +4.497 |
the | +4.407 |
. | +4.327 |
a | +4.135 |
Neg logit contributions | |
lor | -4.406 |
umm | -4.274 |
former | -4.175 |
rol | -4.170 |
bek | -4.081 |
Token | Car |
Token ID | 1879 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.067 |
, | +3.052 |
. | +2.923 |
the | +2.806 |
a | +2.594 |
Neg logit contributions | |
lor | -5.869 |
umm | -5.749 |
former | -5.705 |
rol | -5.670 |
bek | -5.633 |
Token | a |
Token ID | 64 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +5.727 |
, | +5.713 |
. | +5.567 |
the | +5.527 |
a | +5.292 |
Neg logit contributions | |
lor | -3.303 |
umm | -3.094 |
former | -3.093 |
rol | -3.058 |
osity | -3.030 |
Token | had |
Token ID | 550 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.591 |
, | +3.590 |
. | +3.439 |
the | +3.428 |
a | +3.185 |
Neg logit contributions | |
lor | -5.312 |
former | -5.154 |
umm | -5.123 |
rol | -5.088 |
ocol | -5.035 |
Token | never |
Token ID | 1239 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.277 |
and | +4.258 |
. | +4.093 |
the | +4.030 |
a | +3.775 |
Neg logit contributions | |
lor | -4.720 |
former | -4.550 |
umm | -4.489 |
rol | -4.488 |
ocol | -4.418 |
Token | They |
Token ID | 1119 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.065 |
and | +4.051 |
. | +3.917 |
the | +3.842 |
a | +3.619 |
Neg logit contributions | |
lor | -4.822 |
umm | -4.738 |
former | -4.712 |
rol | -4.674 |
osity | -4.632 |
Token | were |
Token ID | 547 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.563 |
and | +3.559 |
. | +3.443 |
the | +3.351 |
a | +3.140 |
Neg logit contributions | |
lor | -5.289 |
former | -5.188 |
rol | -5.169 |
umm | -5.149 |
osity | -5.122 |
Token | going |
Token ID | 1016 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.172 |
, | +3.164 |
. | +3.064 |
the | +2.898 |
a | +2.685 |
Neg logit contributions | |
lor | -5.688 |
rol | -5.641 |
former | -5.595 |
umm | -5.593 |
osity | -5.529 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.351 |
and | +1.344 |
. | +1.234 |
the | +1.138 |
a | +0.903 |
Neg logit contributions | |
lor | -7.519 |
former | -7.388 |
rol | -7.366 |
umm | -7.364 |
osity | -7.309 |
Token | go |
Token ID | 467 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.581 |
, | +3.568 |
. | +3.438 |
the | +3.244 |
a | +3.030 |
Neg logit contributions | |
lor | -5.324 |
former | -5.276 |
umm | -5.146 |
rol | -5.115 |
ocol | -5.100 |
Token | camping |
Token ID | 22498 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.068 |
and | +2.065 |
. | +1.941 |
the | +1.880 |
a | +1.657 |
Neg logit contributions | |
lor | -6.758 |
former | -6.615 |
rol | -6.603 |
umm | -6.549 |
osity | -6.505 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.886 |
, | +2.886 |
. | +2.747 |
the | +2.721 |
a | +2.489 |
Neg logit contributions | |
lor | -5.945 |
former | -5.826 |
umm | -5.736 |
rol | -5.728 |
arians | -5.699 |
Token | have |
Token ID | 423 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.884 |
, | +3.854 |
. | +3.758 |
the | +3.552 |
a | +3.348 |
Neg logit contributions | |
former | -4.985 |
lor | -4.981 |
rol | -4.861 |
umm | -4.856 |
osity | -4.839 |
Token | lots |
Token ID | 6041 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.351 |
and | +3.336 |
. | +3.201 |
the | +3.067 |
a | +2.800 |
Neg logit contributions | |
lor | -5.601 |
former | -5.467 |
rol | -5.418 |
umm | -5.414 |
osity | -5.286 |
Token | of |
Token ID | 286 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.269 |
and | +2.262 |
the | +2.117 |
. | +2.113 |
a | +1.880 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.516 |
former | -6.490 |
rol | -6.459 |
ocol | -6.438 |
Token | fun |
Token ID | 1257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.229 |
and | +3.222 |
. | +3.068 |
the | +2.999 |
a | +2.747 |
Neg logit contributions | |
lor | -5.610 |
former | -5.601 |
ocol | -5.517 |
rol | -5.506 |
umm | -5.502 |
Token | Inside |
Token ID | 14384 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.160 |
and | +3.158 |
. | +3.042 |
the | +2.917 |
a | +2.703 |
Neg logit contributions | |
lor | -5.731 |
umm | -5.610 |
former | -5.586 |
rol | -5.568 |
osity | -5.542 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.158 |
, | +1.096 |
. | +1.022 |
the | +0.878 |
a | +0.747 |
Neg logit contributions | |
lor | -7.734 |
rol | -7.550 |
umm | -7.537 |
former | -7.469 |
ocol | -7.459 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.000 |
, | +0.987 |
. | +0.860 |
the | +0.714 |
a | +0.442 |
Neg logit contributions | |
lor | -7.906 |
former | -7.819 |
umm | -7.786 |
rol | -7.769 |
ocol | -7.692 |
Token | y |
Token ID | 331 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.968 |
, | +3.927 |
. | +3.836 |
the | +3.769 |
a | +3.524 |
Neg logit contributions | |
lor | -4.913 |
umm | -4.848 |
former | -4.847 |
bek | -4.736 |
ocol | -4.722 |
Token | ummy |
Token ID | 13513 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +5.854 |
, | +5.792 |
. | +5.702 |
the | +5.695 |
a | +5.480 |
Neg logit contributions | |
umm | -3.132 |
lor | -3.080 |
former | -2.979 |
ocol | -2.967 |
rol | -2.931 |
Token | drink |
Token ID | 4144 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.462 |
, | +4.415 |
. | +4.351 |
the | +4.335 |
a | +4.084 |
Neg logit contributions | |
umm | -4.319 |
lor | -4.298 |
ocol | -4.213 |
former | -4.185 |
rol | -4.132 |
Token | ! |
Token ID | 0 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.512 |
, | +2.490 |
the | +2.371 |
. | +2.336 |
a | +2.135 |
Neg logit contributions | |
lor | -6.288 |
umm | -6.270 |
rol | -6.170 |
former | -6.098 |
ocol | -6.062 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.812 |
, | +2.808 |
. | +2.677 |
the | +2.559 |
a | +2.355 |
Neg logit contributions | |
lor | -6.116 |
umm | -5.993 |
former | -5.963 |
rol | -5.961 |
osity | -5.895 |
Token | baby |
Token ID | 5156 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.224 |
, | +3.217 |
. | +3.079 |
the | +3.001 |
a | +2.756 |
Neg logit contributions | |
lor | -5.699 |
umm | -5.685 |
former | -5.649 |
rol | -5.525 |
ocol | -5.484 |
Token | drank |
Token ID | 24070 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.676 |
and | +2.664 |
. | +2.580 |
the | +2.489 |
a | +2.278 |
Neg logit contributions | |
lor | -6.175 |
umm | -6.084 |
former | -6.041 |
rol | -6.018 |
bek | -5.934 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.927 |
, | +1.925 |
. | +1.821 |
the | +1.693 |
a | +1.495 |
Neg logit contributions | |
lor | -6.830 |
umm | -6.801 |
rol | -6.744 |
former | -6.737 |
ocol | -6.666 |
Token | drink |
Token ID | 4144 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.118 |
, | +4.063 |
. | +3.922 |
the | +3.827 |
a | +3.645 |
Neg logit contributions | |
lor | -4.723 |
former | -4.690 |
ocol | -4.605 |
umm | -4.604 |
rol | -4.569 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.652 |
, | +1.624 |
. | +1.446 |
the | +1.418 |
a | +1.216 |
Neg logit contributions | |
lor | -7.136 |
umm | -7.071 |
rol | -7.032 |
ocol | -6.997 |
former | -6.992 |
Token | He |
Token ID | 679 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.066 |
and | +3.064 |
. | +2.924 |
the | +2.850 |
a | +2.624 |
Neg logit contributions | |
lor | -5.873 |
former | -5.737 |
umm | -5.732 |
rol | -5.705 |
osity | -5.619 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.618 |
and | +3.604 |
. | +3.501 |
the | +3.401 |
a | +3.177 |
Neg logit contributions | |
lor | -5.297 |
former | -5.179 |
rol | -5.130 |
umm | -5.119 |
bek | -5.078 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.938 |
and | +1.931 |
. | +1.821 |
the | +1.632 |
a | +1.375 |
Neg logit contributions | |
lor | -6.979 |
former | -6.828 |
rol | -6.806 |
umm | -6.802 |
ocol | -6.731 |
Token | glass |
Token ID | 5405 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.212 |
, | +4.186 |
. | +4.094 |
the | +4.025 |
a | +3.784 |
Neg logit contributions | |
lor | -4.673 |
umm | -4.580 |
former | -4.570 |
bek | -4.474 |
rol | -4.466 |
Token | on |
Token ID | 319 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.170 |
, | +3.168 |
. | +3.044 |
the | +3.037 |
a | +2.817 |
Neg logit contributions | |
lor | -5.672 |
umm | -5.601 |
rol | -5.500 |
former | -5.445 |
ocol | -5.426 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.589 |
, | +0.583 |
. | +0.462 |
the | +0.280 |
a | +0.105 |
Neg logit contributions | |
lor | -8.227 |
former | -8.134 |
umm | -8.129 |
ocol | -8.069 |
rol | -8.047 |
Token | sidewalk |
Token ID | 24058 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.818 |
and | +4.798 |
. | +4.647 |
the | +4.602 |
a | +4.379 |
Neg logit contributions | |
lor | -4.099 |
umm | -4.036 |
former | -3.999 |
rol | -3.889 |
arians | -3.861 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.967 |
and | +1.961 |
the | +1.847 |
. | +1.837 |
a | +1.619 |
Neg logit contributions | |
lor | -6.865 |
umm | -6.756 |
rol | -6.702 |
former | -6.666 |
osity | -6.639 |
Token | he |
Token ID | 339 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.181 |
and | +3.162 |
. | +3.067 |
the | +2.903 |
a | +2.673 |
Neg logit contributions | |
lor | -5.699 |
former | -5.579 |
rol | -5.522 |
umm | -5.519 |
bek | -5.484 |
Token | day |
Token ID | 1110 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.856 |
, | +2.831 |
. | +2.727 |
the | +2.633 |
a | +2.425 |
Neg logit contributions | |
lor | -5.969 |
umm | -5.943 |
former | -5.916 |
rol | -5.824 |
osity | -5.815 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.572 |
, | +0.480 |
. | +0.424 |
the | +0.327 |
a | +0.112 |
Neg logit contributions | |
lor | -8.270 |
umm | -8.163 |
rol | -8.104 |
ocol | -8.100 |
former | -8.091 |
Token | Tommy |
Token ID | 19919 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.271 |
, | +3.242 |
. | +3.142 |
the | +3.005 |
a | +2.782 |
Neg logit contributions | |
lor | -5.546 |
umm | -5.487 |
former | -5.444 |
rol | -5.418 |
bek | -5.399 |
Token | got |
Token ID | 1392 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.915 |
and | +2.888 |
. | +2.804 |
the | +2.744 |
a | +2.515 |
Neg logit contributions | |
lor | -5.951 |
former | -5.805 |
umm | -5.769 |
rol | -5.737 |
osity | -5.713 |
Token | very |
Token ID | 845 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.985 |
, | +2.977 |
. | +2.832 |
the | +2.703 |
a | +2.448 |
Neg logit contributions | |
lor | -5.894 |
former | -5.858 |
rol | -5.811 |
umm | -5.795 |
ocol | -5.750 |
Token | thirsty |
Token ID | 47124 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.077 |
, | +4.057 |
. | +3.917 |
the | +3.827 |
a | +3.586 |
Neg logit contributions | |
former | -4.798 |
lor | -4.780 |
umm | -4.746 |
rol | -4.696 |
ocol | -4.687 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.614 |
and | +0.597 |
the | +0.499 |
. | +0.435 |
a | +0.262 |
Neg logit contributions | |
umm | -8.051 |
lor | -8.020 |
former | -7.937 |
rol | -7.914 |
ocol | -7.838 |
Token | but |
Token ID | 475 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.685 |
and | +1.594 |
. | +1.550 |
the | +1.428 |
a | +1.188 |
Neg logit contributions | |
lor | -7.088 |
former | -7.024 |
rol | -7.018 |
umm | -7.002 |
osity | -6.906 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.355 |
, | +2.327 |
. | +2.252 |
the | +2.062 |
a | +1.872 |
Neg logit contributions | |
lor | -6.469 |
former | -6.379 |
umm | -6.370 |
bek | -6.315 |
rol | -6.305 |
Token | too |
Token ID | 1165 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.104 |
, | +3.091 |
. | +2.952 |
the | +2.807 |
a | +2.548 |
Neg logit contributions | |
lor | -5.755 |
former | -5.685 |
rol | -5.654 |
umm | -5.608 |
osity | -5.569 |
Token | tired |
Token ID | 10032 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.973 |
, | +3.965 |
. | +3.803 |
the | +3.747 |
a | +3.506 |
Neg logit contributions | |
former | -4.824 |
lor | -4.820 |
umm | -4.763 |
ocol | -4.710 |
rol | -4.696 |
Token | when |
Token ID | 618 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.696 |
, | +1.692 |
. | +1.556 |
the | +1.536 |
a | +1.304 |
Neg logit contributions | |
lor | -7.035 |
former | -6.968 |
umm | -6.895 |
rol | -6.894 |
osity | -6.839 |
Token | she |
Token ID | 673 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.397 |
, | +2.320 |
. | +2.227 |
the | +2.084 |
a | +1.862 |
Neg logit contributions | |
lor | -6.475 |
former | -6.370 |
umm | -6.346 |
rol | -6.325 |
osity | -6.300 |
Token | noticed |
Token ID | 6810 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.666 |
, | +3.634 |
. | +3.524 |
the | +3.445 |
a | +3.224 |
Neg logit contributions | |
lor | -5.320 |
former | -5.112 |
umm | -5.099 |
rol | -5.097 |
bek | -5.027 |
Token | something |
Token ID | 1223 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.674 |
, | +1.638 |
. | +1.513 |
the | +1.357 |
a | +1.089 |
Neg logit contributions | |
lor | -7.241 |
former | -7.102 |
rol | -7.031 |
umm | -7.031 |
ocol | -6.987 |
Token | gl |
Token ID | 1278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.589 |
, | +3.561 |
. | +3.398 |
the | +3.361 |
a | +3.125 |
Neg logit contributions | |
lor | -5.221 |
umm | -5.127 |
former | -5.087 |
rol | -5.083 |
ocol | -5.076 |
Token | immer |
Token ID | 10957 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +7.812 |
, | +7.798 |
. | +7.661 |
the | +7.616 |
a | +7.385 |
Neg logit contributions | |
lor | -1.215 |
former | -1.063 |
umm | -1.061 |
rol | -1.028 |
osity | -0.989 |
Token | ing |
Token ID | 278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.803 |
and | +4.794 |
the | +4.640 |
. | +4.627 |
a | +4.398 |
Neg logit contributions | |
lor | -4.087 |
umm | -4.006 |
rol | -3.961 |
former | -3.877 |
osity | -3.874 |
Token | in |
Token ID | 287 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.831 |
and | +2.817 |
. | +2.668 |
the | +2.609 |
a | +2.405 |
Neg logit contributions | |
lor | -5.995 |
rol | -5.882 |
umm | -5.865 |
former | -5.830 |
ocol | -5.823 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.083 |
and | +1.074 |
. | +0.921 |
the | +0.747 |
a | +0.551 |
Neg logit contributions | |
lor | -7.779 |
former | -7.714 |
umm | -7.684 |
ocol | -7.663 |
rol | -7.604 |
Token | corner |
Token ID | 5228 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.682 |
, | +4.673 |
. | +4.527 |
the | +4.453 |
a | +4.229 |
Neg logit contributions | |
lor | -4.287 |
umm | -4.188 |
former | -4.179 |
rol | -4.084 |
ocol | -4.020 |
Token | of |
Token ID | 286 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.830 |
and | +1.825 |
the | +1.645 |
. | +1.619 |
a | +1.432 |
Neg logit contributions | |
lor | -7.017 |
umm | -6.887 |
rol | -6.878 |
former | -6.861 |
ocol | -6.803 |
Token | little |
Token ID | 1310 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.866 |
and | +2.837 |
. | +2.702 |
the | +2.634 |
a | +2.344 |
Neg logit contributions | |
lor | -6.023 |
umm | -5.972 |
former | -5.954 |
osity | -5.850 |
arians | -5.815 |
Token | sister |
Token ID | 6621 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.056 |
, | +4.011 |
. | +3.905 |
the | +3.864 |
a | +3.630 |
Neg logit contributions | |
umm | -4.795 |
lor | -4.756 |
former | -4.722 |
ocol | -4.638 |
osity | -4.620 |
Token | Lily |
Token ID | 20037 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.411 |
, | +2.328 |
. | +2.266 |
the | +2.195 |
a | +1.971 |
Neg logit contributions | |
lor | -6.420 |
umm | -6.310 |
former | -6.295 |
rol | -6.234 |
osity | -6.206 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.291 |
, | +2.280 |
. | +2.159 |
the | +2.102 |
a | +1.884 |
Neg logit contributions | |
lor | -6.509 |
umm | -6.413 |
former | -6.375 |
rol | -6.367 |
ocol | -6.317 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.798 |
, | +0.785 |
. | +0.640 |
the | +0.488 |
a | +0.230 |
Neg logit contributions | |
lor | -8.119 |
former | -7.972 |
umm | -7.961 |
rol | -7.917 |
ocol | -7.907 |
Token | glow |
Token ID | 19634 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.978 |
, | +3.960 |
. | +3.861 |
the | +3.772 |
a | +3.535 |
Neg logit contributions | |
lor | -4.909 |
umm | -4.818 |
former | -4.807 |
bek | -4.731 |
osity | -4.721 |
Token | in |
Token ID | 287 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.172 |
and | +3.169 |
the | +3.012 |
. | +2.989 |
a | +2.763 |
Neg logit contributions | |
lor | -5.694 |
umm | -5.622 |
former | -5.544 |
rol | -5.482 |
ocol | -5.481 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.875 |
and | +0.866 |
. | +0.697 |
the | +0.494 |
a | +0.325 |
Neg logit contributions | |
lor | -7.985 |
former | -7.927 |
ocol | -7.885 |
umm | -7.872 |
rol | -7.771 |
Token | sky |
Token ID | 6766 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.241 |
, | +4.234 |
. | +4.088 |
the | +4.002 |
a | +3.780 |
Neg logit contributions | |
lor | -4.714 |
umm | -4.619 |
former | -4.616 |
rol | -4.491 |
osity | -4.479 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.260 |
and | +0.259 |
the | +0.114 |
. | +0.030 |
a | -0.100 |
Neg logit contributions | |
lor | -8.523 |
umm | -8.403 |
former | -8.382 |
rol | -8.341 |
ocol | -8.302 |
Token | It |
Token ID | 632 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.033 |
, | +3.020 |
. | +2.902 |
the | +2.804 |
a | +2.605 |
Neg logit contributions | |
lor | -5.812 |
umm | -5.733 |
former | -5.666 |
rol | -5.645 |
osity | -5.638 |
Token | necklace |
Token ID | 38987 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.585 |
, | +4.568 |
. | +4.479 |
the | +4.431 |
a | +4.198 |
Neg logit contributions | |
lor | -4.265 |
umm | -4.187 |
former | -4.187 |
bek | -4.037 |
osity | -4.036 |
Token | made |
Token ID | 925 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.135 |
, | +2.129 |
the | +2.038 |
. | +1.974 |
a | +1.791 |
Neg logit contributions | |
lor | -6.782 |
umm | -6.588 |
rol | -6.535 |
former | -6.493 |
osity | -6.471 |
Token | out |
Token ID | 503 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.771 |
and | +2.766 |
. | +2.626 |
the | +2.515 |
a | +2.310 |
Neg logit contributions | |
lor | -6.081 |
umm | -6.003 |
rol | -5.982 |
former | -5.955 |
osity | -5.924 |
Token | of |
Token ID | 286 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.773 |
and | +2.743 |
. | +2.593 |
the | +2.553 |
a | +2.318 |
Neg logit contributions | |
lor | -6.123 |
former | -6.050 |
umm | -6.016 |
rol | -6.013 |
osity | -5.964 |
Token | gl |
Token ID | 1278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.512 |
and | +4.500 |
. | +4.360 |
the | +4.205 |
a | +3.981 |
Neg logit contributions | |
lor | -4.356 |
former | -4.356 |
umm | -4.293 |
ocol | -4.260 |
rol | -4.181 |
Token | immer |
Token ID | 10957 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +7.850 |
, | +7.843 |
. | +7.696 |
the | +7.677 |
a | +7.435 |
Neg logit contributions | |
lor | -1.224 |
former | -1.085 |
umm | -1.070 |
rol | -1.025 |
ocol | -0.994 |
Token | ing |
Token ID | 278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.517 |
and | +4.512 |
the | +4.373 |
. | +4.359 |
a | +4.140 |
Neg logit contributions | |
lor | -4.339 |
umm | -4.314 |
rol | -4.205 |
former | -4.159 |
osity | -4.128 |
Token | jewels |
Token ID | 42701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.016 |
and | +3.000 |
. | +2.873 |
the | +2.817 |
a | +2.628 |
Neg logit contributions | |
lor | -5.806 |
umm | -5.763 |
former | -5.715 |
rol | -5.672 |
ocol | -5.644 |
Token | ! |
Token ID | 0 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.217 |
and | +2.217 |
the | +2.125 |
. | +2.068 |
a | +1.879 |
Neg logit contributions | |
lor | -6.629 |
umm | -6.479 |
former | -6.424 |
rol | -6.414 |
osity | -6.382 |
Token | Sarah |
Token ID | 10490 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.968 |
, | +3.955 |
. | +3.826 |
the | +3.750 |
a | +3.531 |
Neg logit contributions | |
lor | -4.946 |
umm | -4.851 |
former | -4.832 |
osity | -4.796 |
rol | -4.757 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.110 |
and | +3.098 |
. | +3.010 |
the | +2.919 |
a | +2.713 |
Neg logit contributions | |
lor | -5.828 |
former | -5.664 |
umm | -5.635 |
rol | -5.607 |
bek | -5.579 |
Token | until |
Token ID | 1566 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.211 |
, | +2.194 |
. | +2.077 |
the | +2.076 |
a | +1.869 |
Neg logit contributions | |
lor | -6.659 |
former | -6.437 |
rol | -6.387 |
umm | -6.372 |
osity | -6.370 |
Token | he |
Token ID | 339 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.168 |
, | +2.075 |
. | +1.991 |
the | +1.828 |
a | +1.633 |
Neg logit contributions | |
lor | -6.741 |
umm | -6.628 |
former | -6.605 |
ocol | -6.558 |
rol | -6.552 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.162 |
, | +3.139 |
. | +3.026 |
the | +2.953 |
a | +2.732 |
Neg logit contributions | |
lor | -5.811 |
umm | -5.626 |
former | -5.622 |
rol | -5.589 |
osity | -5.518 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.726 |
, | +1.692 |
. | +1.562 |
the | +1.369 |
a | +1.114 |
Neg logit contributions | |
lor | -7.190 |
former | -7.112 |
umm | -7.058 |
rol | -7.003 |
ocol | -6.955 |
Token | gl |
Token ID | 1278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.648 |
, | +3.614 |
. | +3.519 |
the | +3.440 |
a | +3.209 |
Neg logit contributions | |
lor | -5.252 |
former | -5.175 |
umm | -5.165 |
bek | -5.074 |
osity | -5.028 |
Token | immer |
Token ID | 10957 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +7.924 |
, | +7.910 |
. | +7.771 |
the | +7.748 |
a | +7.505 |
Neg logit contributions | |
lor | -1.127 |
former | -0.956 |
umm | -0.954 |
rol | -0.912 |
ocol | -0.878 |
Token | of |
Token ID | 286 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.589 |
the | +3.440 |
. | +3.437 |
a | +3.200 |
Neg logit contributions | |
lor | -5.303 |
umm | -5.273 |
rol | -5.152 |
former | -5.095 |
osity | -5.082 |
Token | light |
Token ID | 1657 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.509 |
, | +4.509 |
. | +4.382 |
the | +4.247 |
a | +4.038 |
Neg logit contributions | |
lor | -4.364 |
umm | -4.326 |
former | -4.322 |
ocol | -4.274 |
rol | -4.231 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.505 |
and | +2.495 |
the | +2.334 |
. | +2.320 |
a | +2.120 |
Neg logit contributions | |
lor | -6.373 |
umm | -6.292 |
former | -6.201 |
rol | -6.186 |
ocol | -6.149 |
Token | |
Token ID | 220 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.978 |
, | +2.972 |
. | +2.847 |
the | +2.735 |
a | +2.517 |
Neg logit contributions | |
lor | -6.005 |
umm | -5.838 |
former | -5.797 |
rol | -5.767 |
osity | -5.748 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.418 |
and | +1.401 |
. | +1.228 |
the | +1.195 |
a | +0.969 |
Neg logit contributions | |
lor | -7.538 |
rol | -7.337 |
former | -7.292 |
umm | -7.278 |
osity | -7.222 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.595 |
, | +1.438 |
. | +1.427 |
the | +1.298 |
a | +1.085 |
Neg logit contributions | |
lor | -7.233 |
umm | -7.098 |
former | -7.089 |
bek | -7.014 |
rol | -7.006 |
Token | she |
Token ID | 673 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.257 |
, | +2.187 |
. | +2.096 |
the | +1.928 |
a | +1.695 |
Neg logit contributions | |
lor | -6.599 |
former | -6.508 |
umm | -6.463 |
rol | -6.440 |
bek | -6.425 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.350 |
, | +3.338 |
. | +3.229 |
the | +3.170 |
a | +2.919 |
Neg logit contributions | |
lor | -5.589 |
former | -5.450 |
umm | -5.385 |
rol | -5.358 |
bek | -5.339 |
Token | something |
Token ID | 1223 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.551 |
, | +1.507 |
. | +1.386 |
the | +1.219 |
a | +0.944 |
Neg logit contributions | |
lor | -7.407 |
former | -7.249 |
umm | -7.186 |
rol | -7.182 |
ocol | -7.136 |
Token | gl |
Token ID | 1278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.226 |
, | +3.192 |
. | +3.033 |
the | +3.002 |
a | +2.763 |
Neg logit contributions | |
lor | -5.583 |
umm | -5.478 |
rol | -5.457 |
former | -5.442 |
ocol | -5.438 |
Token | immer |
Token ID | 10957 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +7.823 |
, | +7.811 |
. | +7.674 |
the | +7.628 |
a | +7.396 |
Neg logit contributions | |
lor | -1.208 |
umm | -1.056 |
former | -1.054 |
rol | -1.022 |
osity | -0.981 |
Token | ing |
Token ID | 278 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.598 |
and | +4.581 |
the | +4.435 |
. | +4.421 |
a | +4.192 |
Neg logit contributions | |
lor | -4.289 |
umm | -4.209 |
rol | -4.164 |
osity | -4.069 |
former | -4.066 |
Token | in |
Token ID | 287 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.425 |
and | +2.405 |
. | +2.259 |
the | +2.208 |
a | +2.009 |
Neg logit contributions | |
lor | -6.384 |
rol | -6.271 |
umm | -6.250 |
former | -6.202 |
ocol | -6.187 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.685 |
and | +0.670 |
. | +0.525 |
the | +0.352 |
a | +0.176 |
Neg logit contributions | |
lor | -8.175 |
former | -8.096 |
umm | -8.075 |
ocol | -8.054 |
rol | -8.012 |
Token | corner |
Token ID | 5228 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.391 |
, | +4.385 |
. | +4.243 |
the | +4.166 |
a | +3.946 |
Neg logit contributions | |
lor | -4.569 |
umm | -4.475 |
former | -4.437 |
rol | -4.370 |
osity | -4.327 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.676 |
and | +1.664 |
the | +1.499 |
. | +1.463 |
a | +1.291 |
Neg logit contributions | |
lor | -7.151 |
umm | -7.026 |
rol | -7.015 |
former | -6.989 |
osity | -6.920 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.165 |
, | +1.109 |
. | +1.036 |
the | +0.890 |
a | +0.755 |
Neg logit contributions | |
lor | -7.746 |
rol | -7.559 |
umm | -7.558 |
former | -7.491 |
ocol | -7.463 |
Token | cooler |
Token ID | 19346 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.737 |
, | +4.704 |
. | +4.604 |
the | +4.579 |
a | +4.339 |
Neg logit contributions | |
lor | -4.204 |
umm | -4.124 |
former | -4.072 |
rol | -4.009 |
ocol | -3.938 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.510 |
, | +2.462 |
. | +2.400 |
the | +2.333 |
a | +2.151 |
Neg logit contributions | |
lor | -6.381 |
umm | -6.198 |
rol | -6.161 |
former | -6.157 |
osity | -6.119 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.894 |
, | +1.884 |
. | +1.753 |
the | +1.644 |
a | +1.386 |
Neg logit contributions | |
lor | -7.036 |
former | -6.929 |
umm | -6.895 |
rol | -6.891 |
osity | -6.784 |
Token | cool |
Token ID | 3608 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.785 |
, | +3.754 |
. | +3.659 |
the | +3.585 |
a | +3.340 |
Neg logit contributions | |
lor | -5.113 |
former | -5.047 |
umm | -5.029 |
bek | -4.933 |
rol | -4.903 |
Token | drink |
Token ID | 4144 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.337 |
, | +4.307 |
. | +4.240 |
the | +4.195 |
a | +3.963 |
Neg logit contributions | |
lor | -4.468 |
umm | -4.436 |
former | -4.395 |
ocol | -4.309 |
rol | -4.307 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.567 |
, | +2.553 |
the | +2.435 |
. | +2.383 |
a | +2.196 |
Neg logit contributions | |
lor | -6.279 |
umm | -6.217 |
rol | -6.129 |
former | -6.074 |
ocol | -6.014 |
Token | " |
Token ID | 366 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.146 |
and | +3.144 |
. | +3.032 |
the | +2.909 |
a | +2.705 |
Neg logit contributions | |
lor | -5.809 |
umm | -5.649 |
former | -5.594 |
rol | -5.591 |
osity | -5.581 |
Token | Wow |
Token ID | 22017 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +5.206 |
and | +5.192 |
. | +5.060 |
the | +4.975 |
a | +4.744 |
Neg logit contributions | |
lor | -3.802 |
umm | -3.678 |
former | -3.664 |
rol | -3.614 |
bek | -3.567 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.857 |
, | +2.702 |
. | +2.650 |
the | +2.583 |
a | +2.412 |
Neg logit contributions | |
lor | -6.045 |
umm | -5.937 |
ocol | -5.834 |
rol | -5.834 |
osity | -5.811 |
Token | this |
Token ID | 428 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.346 |
, | +3.279 |
. | +3.264 |
the | +3.018 |
a | +2.810 |
Neg logit contributions | |
lor | -5.627 |
umm | -5.466 |
former | -5.433 |
osity | -5.408 |
ocol | -5.391 |
Token | It |
Token ID | 632 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.540 |
, | +3.523 |
. | +3.407 |
the | +3.312 |
a | +3.069 |
Neg logit contributions | |
lor | -5.406 |
umm | -5.271 |
former | -5.241 |
osity | -5.203 |
rol | -5.199 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.583 |
, | +1.571 |
. | +1.458 |
the | +1.351 |
a | +1.135 |
Neg logit contributions | |
lor | -7.336 |
umm | -7.156 |
rol | -7.154 |
former | -7.146 |
osity | -7.060 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.368 |
, | +1.366 |
. | +1.248 |
the | +1.116 |
a | +0.862 |
Neg logit contributions | |
lor | -7.513 |
former | -7.439 |
umm | -7.395 |
rol | -7.370 |
ocol | -7.327 |
Token | tall |
Token ID | 7331 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.146 |
, | +4.116 |
. | +4.021 |
the | +3.942 |
a | +3.696 |
Neg logit contributions | |
lor | -4.764 |
former | -4.668 |
umm | -4.659 |
bek | -4.580 |
osity | -4.535 |
Token | pink |
Token ID | 11398 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.492 |
, | +4.457 |
. | +4.407 |
the | +4.343 |
a | +4.164 |
Neg logit contributions | |
lor | -4.279 |
umm | -4.264 |
former | -4.192 |
ocol | -4.133 |
bek | -4.094 |
Token | drink |
Token ID | 4144 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.805 |
, | +4.790 |
. | +4.688 |
the | +4.669 |
a | +4.425 |
Neg logit contributions | |
lor | -4.070 |
umm | -3.974 |
former | -3.924 |
ocol | -3.840 |
osity | -3.829 |
Token | ! |
Token ID | 0 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.538 |
, | +2.518 |
the | +2.398 |
. | +2.379 |
a | +2.163 |
Neg logit contributions | |
lor | -6.306 |
umm | -6.243 |
rol | -6.153 |
former | -6.077 |
osity | -6.044 |
Token | She |
Token ID | 1375 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.237 |
, | +3.223 |
. | +3.100 |
the | +3.004 |
a | +2.786 |
Neg logit contributions | |
lor | -5.747 |
umm | -5.597 |
former | -5.552 |
rol | -5.530 |
osity | -5.503 |
Token | had |
Token ID | 550 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.362 |
and | +3.330 |
. | +3.254 |
the | +3.153 |
a | +2.925 |
Neg logit contributions | |
lor | -5.567 |
former | -5.444 |
umm | -5.390 |
rol | -5.366 |
bek | -5.363 |
Token | never |
Token ID | 1239 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.305 |
and | +3.255 |
. | +3.146 |
the | +3.012 |
a | +2.747 |
Neg logit contributions | |
lor | -5.720 |
former | -5.545 |
rol | -5.457 |
umm | -5.413 |
osity | -5.401 |
Token | seen |
Token ID | 1775 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +5.374 |
and | +5.374 |
. | +5.228 |
the | +5.146 |
a | +4.913 |
Neg logit contributions | |
lor | -3.537 |
former | -3.409 |
umm | -3.370 |
osity | -3.339 |
rol | -3.336 |
Token | best |
Token ID | 1266 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.499 |
, | +3.462 |
. | +3.330 |
the | +3.317 |
a | +3.047 |
Neg logit contributions | |
lor | -5.419 |
former | -5.357 |
umm | -5.343 |
osity | -5.190 |
ocol | -5.184 |
Token | friend |
Token ID | 1545 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.449 |
, | +3.416 |
the | +3.282 |
. | +3.270 |
a | +3.003 |
Neg logit contributions | |
lor | -5.471 |
umm | -5.359 |
former | -5.342 |
osity | -5.267 |
rol | -5.246 |
Token | Sal |
Token ID | 4849 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.152 |
, | +3.102 |
. | +3.016 |
the | +2.935 |
a | +2.728 |
Neg logit contributions | |
lor | -5.710 |
umm | -5.553 |
rol | -5.527 |
former | -5.522 |
osity | -5.505 |
Token | brought |
Token ID | 3181 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.046 |
, | +4.016 |
. | +3.871 |
the | +3.815 |
a | +3.626 |
Neg logit contributions | |
lor | -4.850 |
former | -4.661 |
bek | -4.641 |
ocol | -4.634 |
umm | -4.631 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.111 |
and | +2.099 |
. | +1.929 |
the | +1.884 |
a | +1.644 |
Neg logit contributions | |
lor | -6.692 |
former | -6.596 |
umm | -6.587 |
rol | -6.581 |
ocol | -6.531 |
Token | pill |
Token ID | 9582 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.215 |
, | +4.184 |
. | +4.076 |
the | +3.995 |
a | +3.745 |
Neg logit contributions | |
lor | -4.716 |
former | -4.621 |
umm | -4.585 |
rol | -4.515 |
bek | -4.504 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.762 |
and | +2.750 |
the | +2.650 |
. | +2.571 |
a | +2.370 |
Neg logit contributions | |
lor | -6.148 |
rol | -5.982 |
umm | -5.967 |
former | -5.945 |
osity | -5.886 |
Token | show |
Token ID | 905 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.664 |
, | +3.624 |
. | +3.473 |
the | +3.304 |
a | +3.106 |
Neg logit contributions | |
former | -5.243 |
lor | -5.210 |
ocol | -5.123 |
umm | -5.063 |
rol | -5.037 |
Token | her |
Token ID | 607 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.469 |
, | +2.423 |
. | +2.236 |
the | +2.160 |
a | +1.960 |
Neg logit contributions | |
lor | -6.480 |
rol | -6.312 |
former | -6.272 |
ocol | -6.256 |
umm | -6.252 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.812 |
, | +1.799 |
. | +1.597 |
the | +1.562 |
a | +1.349 |
Neg logit contributions | |
lor | -7.111 |
former | -7.001 |
rol | -6.911 |
umm | -6.894 |
osity | -6.853 |
Token | Joe |
Token ID | 5689 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.323 |
, | +3.313 |
. | +3.186 |
the | +3.104 |
a | +2.916 |
Neg logit contributions | |
lor | -5.576 |
umm | -5.479 |
former | -5.424 |
rol | -5.422 |
osity | -5.393 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | you |
Token ID | 345 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.403 |
and | +3.402 |
. | +3.289 |
the | +3.217 |
a | +3.026 |
Neg logit contributions | |
lor | -5.435 |
former | -5.294 |
umm | -5.283 |
rol | -5.268 |
osity | -5.241 |
Token | talking |
Token ID | 3375 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.889 |
, | +3.845 |
. | +3.712 |
the | +3.687 |
a | +3.450 |
Neg logit contributions | |
lor | -5.000 |
former | -4.889 |
rol | -4.812 |
umm | -4.795 |
osity | -4.775 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | talking |
Token ID | 3375 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.889 |
, | +3.845 |
. | +3.712 |
the | +3.687 |
a | +3.450 |
Neg logit contributions | |
lor | -5.000 |
former | -4.889 |
rol | -4.812 |
umm | -4.795 |
osity | -4.775 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.601 |
, | +1.591 |
. | +1.410 |
the | +1.216 |
a | +1.010 |
Neg logit contributions | |
lor | -7.244 |
former | -7.150 |
ocol | -7.140 |
umm | -7.100 |
rol | -7.005 |
Token | covers |
Token ID | 8698 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.583 |
and | +4.563 |
. | +4.404 |
the | +4.384 |
a | +4.187 |
Neg logit contributions | |
lor | -4.297 |
umm | -4.177 |
former | -4.141 |
ocol | -4.119 |
rol | -4.072 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.794 |
and | +0.792 |
the | +0.595 |
. | +0.576 |
a | +0.415 |
Neg logit contributions | |
lor | -8.100 |
umm | -7.919 |
rol | -7.903 |
former | -7.860 |
ocol | -7.823 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.601 |
, | +1.591 |
. | +1.410 |
the | +1.216 |
a | +1.010 |
Neg logit contributions | |
lor | -7.244 |
former | -7.150 |
ocol | -7.140 |
umm | -7.100 |
rol | -7.005 |
Token | covers |
Token ID | 8698 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.583 |
and | +4.563 |
. | +4.404 |
the | +4.384 |
a | +4.187 |
Neg logit contributions | |
lor | -4.297 |
umm | -4.177 |
former | -4.141 |
ocol | -4.119 |
rol | -4.072 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.601 |
, | +1.591 |
. | +1.410 |
the | +1.216 |
a | +1.010 |
Neg logit contributions | |
lor | -7.244 |
former | -7.150 |
ocol | -7.140 |
umm | -7.100 |
rol | -7.005 |
Token | talking |
Token ID | 3375 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.889 |
, | +3.845 |
. | +3.712 |
the | +3.687 |
a | +3.450 |
Neg logit contributions | |
lor | -5.000 |
former | -4.889 |
rol | -4.812 |
umm | -4.795 |
osity | -4.775 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | you |
Token ID | 345 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.403 |
and | +3.402 |
. | +3.289 |
the | +3.217 |
a | +3.026 |
Neg logit contributions | |
lor | -5.435 |
former | -5.294 |
umm | -5.283 |
rol | -5.268 |
osity | -5.241 |
Token | talking |
Token ID | 3375 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.889 |
, | +3.845 |
. | +3.712 |
the | +3.687 |
a | +3.450 |
Neg logit contributions | |
lor | -5.000 |
former | -4.889 |
rol | -4.812 |
umm | -4.795 |
osity | -4.775 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | The |
Token ID | 383 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.377 |
and | +3.367 |
. | +3.279 |
the | +3.203 |
a | +3.006 |
Neg logit contributions | |
lor | -5.505 |
former | -5.368 |
umm | -5.313 |
rol | -5.284 |
osity | -5.262 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.258 |
, | +4.243 |
. | +4.142 |
the | +3.956 |
a | +3.798 |
Neg logit contributions | |
lor | -4.688 |
umm | -4.574 |
former | -4.574 |
osity | -4.493 |
bek | -4.492 |
Token | Professor |
Token ID | 8129 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.499 |
, | +3.488 |
. | +3.347 |
the | +3.243 |
a | +2.986 |
Neg logit contributions | |
lor | -5.475 |
former | -5.395 |
umm | -5.365 |
ocol | -5.259 |
osity | -5.236 |
Token | became |
Token ID | 2627 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +6.040 |
, | +6.019 |
. | +5.884 |
the | +5.835 |
a | +5.621 |
Neg logit contributions | |
lor | -2.939 |
umm | -2.810 |
former | -2.753 |
osity | -2.708 |
rol | -2.705 |
Token | good |
Token ID | 922 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.532 |
, | +3.492 |
. | +3.377 |
the | +3.225 |
a | +3.026 |
Neg logit contributions | |
lor | -5.360 |
former | -5.305 |
umm | -5.273 |
rol | -5.227 |
bek | -5.193 |
Token | friends |
Token ID | 2460 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.905 |
and | +2.893 |
. | +2.775 |
the | +2.754 |
a | +2.522 |
Neg logit contributions | |
lor | -5.960 |
umm | -5.945 |
former | -5.934 |
rol | -5.825 |
ocol | -5.795 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.250 |
and | +1.247 |
the | +1.111 |
. | +1.091 |
a | +0.922 |
Neg logit contributions | |
lor | -7.576 |
umm | -7.401 |
former | -7.391 |
rol | -7.376 |
osity | -7.328 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.759 |
and | +2.703 |
. | +2.651 |
the | +2.525 |
a | +2.330 |
Neg logit contributions | |
lor | -6.098 |
former | -6.023 |
umm | -5.994 |
rol | -5.972 |
osity | -5.940 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.723 |
, | +2.707 |
. | +2.632 |
the | +2.426 |
a | +2.276 |
Neg logit contributions | |
lor | -6.143 |
former | -6.082 |
umm | -6.053 |
osity | -5.996 |
bek | -5.975 |
Token | little |
Token ID | 1310 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.291 |
, | +3.283 |
. | +3.146 |
the | +3.045 |
a | +2.788 |
Neg logit contributions | |
lor | -5.666 |
former | -5.597 |
umm | -5.567 |
ocol | -5.462 |
osity | -5.417 |
Token | frog |
Token ID | 21264 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.904 |
, | +3.880 |
. | +3.755 |
the | +3.665 |
a | +3.449 |
Neg logit contributions | |
umm | -4.994 |
lor | -4.986 |
former | -4.886 |
ocol | -4.827 |
rol | -4.814 |
Token | showed |
Token ID | 3751 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.884 |
and | +3.879 |
. | +3.757 |
the | +3.701 |
a | +3.491 |
Neg logit contributions | |
lor | -4.993 |
former | -4.841 |
umm | -4.814 |
rol | -4.814 |
arians | -4.773 |
Token | it |
Token ID | 340 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.692 |
, | +2.684 |
. | +2.535 |
the | +2.403 |
a | +2.206 |
Neg logit contributions | |
lor | -6.244 |
rol | -6.081 |
umm | -6.073 |
former | -6.042 |
osity | -5.997 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +1.566 |
, | +1.562 |
. | +1.393 |
the | +1.328 |
a | +1.094 |
Neg logit contributions | |
lor | -7.316 |
former | -7.201 |
umm | -7.153 |
rol | -7.150 |
osity | -7.126 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.487 |
, | +4.483 |
. | +4.322 |
the | +4.160 |
a | +3.982 |
Neg logit contributions | |
lor | -4.432 |
former | -4.360 |
umm | -4.310 |
rol | -4.260 |
arians | -4.256 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.480 |
, | +3.467 |
. | +3.329 |
the | +3.260 |
a | +3.030 |
Neg logit contributions | |
former | -5.409 |
lor | -5.390 |
umm | -5.336 |
arians | -5.252 |
bek | -5.229 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.668 |
and | +1.662 |
the | +1.507 |
. | +1.502 |
a | +1.315 |
Neg logit contributions | |
lor | -7.097 |
former | -7.001 |
umm | -6.982 |
rol | -6.981 |
osity | -6.948 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.446 |
, | +3.436 |
. | +3.297 |
the | +3.216 |
a | +3.005 |
Neg logit contributions | |
lor | -5.530 |
umm | -5.391 |
former | -5.374 |
rol | -5.348 |
osity | -5.314 |
Token |
|
Token ID | 198 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.356 |
and | +2.355 |
. | +2.209 |
the | +2.123 |
a | +1.915 |
Neg logit contributions | |
lor | -6.652 |
rol | -6.443 |
former | -6.426 |
umm | -6.411 |
ocol | -6.362 |
Token | " |
Token ID | 1 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +5.293 |
, | +5.288 |
. | +5.155 |
the | +5.074 |
a | +4.856 |
Neg logit contributions | |
lor | -3.711 |
umm | -3.551 |
former | -3.548 |
rol | -3.515 |
osity | -3.466 |
Token | I |
Token ID | 40 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +5.408 |
and | +5.404 |
. | +5.266 |
the | +5.177 |
a | +4.951 |
Neg logit contributions | |
lor | -3.607 |
umm | -3.482 |
former | -3.459 |
rol | -3.414 |
osity | -3.371 |
Token | decorated |
Token ID | 24789 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.392 |
, | +4.373 |
. | +4.255 |
the | +4.204 |
a | +3.955 |
Neg logit contributions | |
lor | -4.551 |
former | -4.458 |
umm | -4.405 |
rol | -4.364 |
bek | -4.350 |
Token | in |
Token ID | 287 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.032 |
and | +1.008 |
the | +0.927 |
. | +0.881 |
a | +0.690 |
Neg logit contributions | |
lor | -7.720 |
former | -7.590 |
osity | -7.546 |
umm | -7.540 |
rol | -7.468 |
Token | his |
Token ID | 465 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.783 |
and | +2.782 |
. | +2.613 |
the | +2.471 |
a | +2.272 |
Neg logit contributions | |
lor | -6.124 |
ocol | -6.023 |
former | -6.003 |
umm | -5.964 |
bek | -5.918 |
Token | head |
Token ID | 1182 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.644 |
, | +4.611 |
. | +4.470 |
the | +4.385 |
a | +4.174 |
Neg logit contributions | |
lor | -4.319 |
former | -4.282 |
umm | -4.236 |
ocol | -4.163 |
bek | -4.133 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +1.472 |
and | +1.463 |
. | +1.311 |
the | +1.310 |
a | +1.096 |
Neg logit contributions | |
lor | -7.390 |
former | -7.212 |
rol | -7.171 |
umm | -7.154 |
osity | -7.139 |
Token | He |
Token ID | 679 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.163 |
, | +3.152 |
. | +2.995 |
the | +2.923 |
a | +2.697 |
Neg logit contributions | |
lor | -5.801 |
former | -5.688 |
umm | -5.654 |
osity | -5.584 |
rol | -5.544 |
Token | wishes |
Token ID | 12802 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.567 |
and | +4.552 |
. | +4.428 |
the | +4.358 |
a | +4.128 |
Neg logit contributions | |
lor | -4.384 |
former | -4.255 |
umm | -4.213 |
rol | -4.168 |
ocol | -4.131 |
Token | he |
Token ID | 339 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.284 |
, | +2.262 |
. | +2.121 |
the | +2.001 |
a | +1.817 |
Neg logit contributions | |
lor | -6.598 |
former | -6.433 |
umm | -6.413 |
osity | -6.382 |
rol | -6.367 |
Token | did |
Token ID | 750 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.366 |
and | +3.339 |
. | +3.209 |
the | +3.134 |
a | +2.909 |
Neg logit contributions | |
lor | -5.628 |
former | -5.440 |
umm | -5.425 |
rol | -5.376 |
bek | -5.363 |
Token | not |
Token ID | 407 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.821 |
, | +2.811 |
. | +2.640 |
the | +2.529 |
a | +2.283 |
Neg logit contributions | |
lor | -6.118 |
former | -6.007 |
umm | -5.836 |
osity | -5.832 |
ocol | -5.829 |
Token | write |
Token ID | 3551 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.202 |
, | +4.175 |
. | +4.003 |
the | +3.959 |
a | +3.730 |
Neg logit contributions | |
lor | -4.686 |
former | -4.668 |
umm | -4.584 |
osity | -4.543 |
ocol | -4.533 |
Token | with |
Token ID | 351 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.734 |
, | +2.731 |
. | +2.557 |
the | +2.493 |
a | +2.271 |
Neg logit contributions | |
lor | -6.139 |
former | -5.990 |
umm | -5.951 |
ocol | -5.929 |
rol | -5.914 |
Token | better |
Token ID | 1365 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.784 |
, | +3.762 |
. | +3.638 |
the | +3.528 |
a | +3.297 |
Neg logit contributions | |
lor | -5.109 |
former | -5.057 |
umm | -5.001 |
rol | -4.968 |
osity | -4.928 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.384 |
and | +2.373 |
the | +2.279 |
. | +2.258 |
a | +2.052 |
Neg logit contributions | |
lor | -6.452 |
former | -6.389 |
umm | -6.305 |
osity | -6.242 |
bek | -6.189 |
Token | He |
Token ID | 679 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.849 |
and | +3.833 |
. | +3.709 |
the | +3.601 |
a | +3.392 |
Neg logit contributions | |
lor | -5.171 |
former | -5.086 |
umm | -5.073 |
rol | -4.980 |
osity | -4.968 |
Token | sw |
Token ID | 1509 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.658 |
and | +3.638 |
. | +3.549 |
the | +3.455 |
a | +3.247 |
Neg logit contributions | |
lor | -5.244 |
former | -5.140 |
umm | -5.047 |
rol | -5.037 |
bek | -4.999 |
Token | am |
Token ID | 321 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +5.920 |
, | +5.910 |
. | +5.788 |
the | +5.714 |
a | +5.498 |
Neg logit contributions | |
lor | -3.093 |
former | -2.963 |
umm | -2.952 |
rol | -2.909 |
osity | -2.866 |
Token | with |
Token ID | 351 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.743 |
and | +2.739 |
. | +2.647 |
the | +2.545 |
a | +2.341 |
Neg logit contributions | |
lor | -6.134 |
rol | -6.023 |
former | -5.994 |
umm | -5.958 |
osity | -5.926 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.087 |
, | +3.062 |
. | +2.934 |
the | +2.732 |
a | +2.540 |
Neg logit contributions | |
lor | -5.848 |
former | -5.764 |
umm | -5.754 |
rol | -5.741 |
ocol | -5.713 |
Token | duck |
Token ID | 22045 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.406 |
and | +4.400 |
. | +4.259 |
the | +4.162 |
a | +3.945 |
Neg logit contributions | |
lor | -4.519 |
former | -4.508 |
umm | -4.485 |
ocol | -4.379 |
rol | -4.365 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.126 |
, | +3.114 |
. | +3.021 |
the | +2.957 |
a | +2.761 |
Neg logit contributions | |
lor | -5.716 |
former | -5.594 |
rol | -5.556 |
osity | -5.523 |
umm | -5.522 |
Token | the |
Token ID | 262 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.022 |
and | +3.974 |
. | +3.930 |
the | +3.761 |
a | +3.587 |
Neg logit contributions | |
lor | -4.850 |
former | -4.769 |
rol | -4.730 |
osity | -4.709 |
umm | -4.699 |
Token | leaves |
Token ID | 5667 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +4.457 |
and | +4.452 |
. | +4.311 |
the | +4.198 |
a | +3.978 |
Neg logit contributions | |
lor | -4.452 |
former | -4.446 |
umm | -4.413 |
ocol | -4.300 |
rol | -4.274 |
Token | knew |
Token ID | 2993 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.812 |
and | +3.804 |
. | +3.677 |
the | +3.588 |
a | +3.374 |
Neg logit contributions | |
lor | -5.078 |
former | -4.995 |
umm | -4.946 |
rol | -4.931 |
bek | -4.916 |
Token | it |
Token ID | 340 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.208 |
, | +2.176 |
. | +2.039 |
the | +1.873 |
a | +1.690 |
Neg logit contributions | |
lor | -6.701 |
former | -6.610 |
umm | -6.535 |
bek | -6.481 |
osity | -6.476 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.319 |
, | +2.316 |
. | +2.177 |
the | +2.121 |
a | +1.891 |
Neg logit contributions | |
lor | -6.615 |
umm | -6.472 |
former | -6.454 |
rol | -6.406 |
bek | -6.391 |
Token | unique |
Token ID | 3748 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +3.242 |
, | +3.233 |
. | +3.061 |
the | +2.937 |
a | +2.714 |
Neg logit contributions | |
lor | -5.594 |
former | -5.578 |
umm | -5.544 |
ocol | -5.476 |
bek | -5.435 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +0.971 |
and | +0.958 |
the | +0.863 |
. | +0.806 |
a | +0.630 |
Neg logit contributions | |
lor | -7.786 |
umm | -7.775 |
former | -7.696 |
rol | -7.590 |
arians | -7.565 |
Token | It |
Token ID | 632 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.600 |
and | +2.594 |
. | +2.445 |
the | +2.366 |
a | +2.150 |
Neg logit contributions | |
lor | -6.385 |
former | -6.254 |
umm | -6.228 |
rol | -6.172 |
osity | -6.139 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.488 |
and | +2.467 |
. | +2.337 |
the | +2.256 |
a | +2.036 |
Neg logit contributions | |
lor | -6.470 |
former | -6.352 |
umm | -6.344 |
rol | -6.284 |
bek | -6.251 |
Token | their |
Token ID | 511 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +3.090 |
and | +3.082 |
. | +2.934 |
the | +2.786 |
a | +2.559 |
Neg logit contributions | |
former | -5.751 |
lor | -5.742 |
umm | -5.693 |
ocol | -5.660 |
rol | -5.624 |
Token | cake |
Token ID | 12187 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +4.337 |
, | +4.328 |
. | +4.193 |
the | +4.117 |
a | +3.888 |
Neg logit contributions | |
former | -4.562 |
lor | -4.553 |
umm | -4.541 |
ocol | -4.396 |
bek | -4.377 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
and | +2.170 |
, | +2.167 |
the | +2.037 |
. | +1.999 |
a | +1.818 |
Neg logit contributions | |
lor | -6.695 |
umm | -6.601 |
former | -6.540 |
rol | -6.444 |
arians | -6.441 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
, | +2.917 |
and | +2.912 |
. | +2.762 |
the | +2.673 |
a | +2.447 |
Neg logit contributions | |
lor | -6.081 |
former | -5.931 |
umm | -5.917 |
rol | -5.867 |
ocol | -5.837 |