Token | share |
Token ID | 2648 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.186 |
the | +3.072 |
, | +3.054 |
. | +2.943 |
a | +2.914 |
Neg logit contributions | |
lor | -5.870 |
arians | -5.792 |
rol | -5.704 |
umm | -5.682 |
ides | -5.638 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.182 |
, | +2.121 |
the | +2.085 |
. | +1.958 |
a | +1.942 |
Neg logit contributions | |
lor | -6.713 |
arians | -6.577 |
rol | -6.488 |
ocol | -6.425 |
ides | -6.385 |
Token | have |
Token ID | 423 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.984 |
, | +3.845 |
the | +3.827 |
. | +3.737 |
a | +3.693 |
Neg logit contributions | |
lor | -4.932 |
arians | -4.909 |
umm | -4.810 |
ocol | -4.792 |
rol | -4.762 |
Token | fun |
Token ID | 1257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.793 |
, | +2.658 |
the | +2.643 |
. | +2.521 |
a | +2.420 |
Neg logit contributions | |
lor | -6.325 |
arians | -6.168 |
umm | -6.127 |
rol | -6.105 |
ides | -6.020 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.495 |
the | +0.461 |
, | +0.355 |
a | +0.273 |
. | +0.179 |
Neg logit contributions | |
lor | -8.545 |
arians | -8.450 |
umm | -8.368 |
rol | -8.332 |
ides | -8.300 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.225 |
the | +3.121 |
, | +3.117 |
. | +2.957 |
a | +2.895 |
Neg logit contributions | |
lor | -5.877 |
arians | -5.768 |
umm | -5.739 |
osity | -5.630 |
rol | -5.612 |
Token | Anna |
Token ID | 31160 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.242 |
the | +4.128 |
, | +4.103 |
a | +3.948 |
. | +3.925 |
Neg logit contributions | |
lor | -4.928 |
rol | -4.649 |
umm | -4.642 |
arians | -4.614 |
ocol | -4.579 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.688 |
the | +2.677 |
, | +2.589 |
. | +2.509 |
a | +2.503 |
Neg logit contributions | |
lor | -6.325 |
arians | -6.150 |
umm | -6.113 |
rol | -6.076 |
ides | -6.025 |
Token | Ben |
Token ID | 3932 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.711 |
, | +2.564 |
the | +2.559 |
. | +2.482 |
a | +2.379 |
Neg logit contributions | |
lor | -6.397 |
arians | -6.227 |
umm | -6.192 |
rol | -6.185 |
osity | -6.124 |
Token | are |
Token ID | 389 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.124 |
the | +3.036 |
, | +2.992 |
. | +2.894 |
a | +2.853 |
Neg logit contributions | |
lor | -5.986 |
arians | -5.820 |
umm | -5.801 |
rol | -5.781 |
ides | -5.693 |
Token | twins |
Token ID | 20345 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.602 |
the | +3.513 |
, | +3.463 |
. | +3.369 |
a | +3.295 |
Neg logit contributions | |
lor | -5.502 |
rol | -5.369 |
arians | -5.355 |
umm | -5.333 |
ocol | -5.288 |
Token | careful |
Token ID | 8161 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.333 |
the | +4.299 |
, | +4.249 |
. | +4.127 |
a | +4.094 |
Neg logit contributions | |
lor | -4.717 |
arians | -4.601 |
umm | -4.594 |
osity | -4.509 |
beh | -4.508 |
Token | when |
Token ID | 618 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.857 |
and | +1.856 |
, | +1.764 |
a | +1.662 |
. | +1.629 |
Neg logit contributions | |
lor | -7.141 |
arians | -7.001 |
umm | -6.986 |
rol | -6.938 |
osity | -6.894 |
Token | she |
Token ID | 673 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.617 |
, | +3.411 |
the | +3.406 |
. | +3.314 |
a | +3.272 |
Neg logit contributions | |
lor | -5.388 |
arians | -5.342 |
umm | -5.333 |
ocol | -5.284 |
osity | -5.248 |
Token | painted |
Token ID | 13055 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.215 |
the | +4.195 |
, | +4.134 |
a | +4.010 |
. | +3.963 |
Neg logit contributions | |
lor | -4.764 |
arians | -4.736 |
umm | -4.677 |
ides | -4.624 |
rol | -4.586 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.884 |
, | +2.760 |
the | +2.720 |
. | +2.599 |
a | +2.565 |
Neg logit contributions | |
lor | -6.030 |
umm | -5.962 |
rol | -5.946 |
arians | -5.907 |
ocol | -5.872 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.213 |
the | +2.107 |
, | +2.088 |
. | +1.965 |
a | +1.933 |
Neg logit contributions | |
lor | -6.976 |
umm | -6.797 |
arians | -6.741 |
rol | -6.734 |
osity | -6.670 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.338 |
, | +1.240 |
the | +1.228 |
a | +1.039 |
. | +1.028 |
Neg logit contributions | |
lor | -7.760 |
rol | -7.455 |
umm | -7.372 |
arians | -7.369 |
ides | -7.310 |
Token | upon |
Token ID | 2402 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.101 |
the | +3.988 |
, | +3.936 |
. | +3.842 |
a | +3.837 |
Neg logit contributions | |
lor | -5.002 |
rol | -4.805 |
umm | -4.794 |
arians | -4.785 |
ocol | -4.709 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.436 |
, | +0.362 |
the | +0.314 |
. | +0.176 |
a | +0.029 |
Neg logit contributions | |
lor | -8.630 |
rol | -8.358 |
arians | -8.334 |
umm | -8.311 |
ides | -8.270 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.451 |
the | +2.403 |
, | +2.320 |
. | +2.214 |
a | +2.192 |
Neg logit contributions | |
lor | -6.684 |
umm | -6.491 |
arians | -6.470 |
rol | -6.446 |
ides | -6.394 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.211 |
the | +0.121 |
, | +0.011 |
. | -0.024 |
a | -0.057 |
Neg logit contributions | |
lor | -8.900 |
rol | -8.690 |
arians | -8.689 |
umm | -8.682 |
ocol | -8.608 |
Token | toys |
Token ID | 14958 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.051 |
the | +4.982 |
, | +4.943 |
. | +4.836 |
a | +4.783 |
Neg logit contributions | |
lor | -4.019 |
arians | -3.891 |
ocol | -3.842 |
umm | -3.833 |
isher | -3.761 |
Token | with |
Token ID | 351 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.039 |
the | +1.023 |
, | +0.930 |
a | +0.850 |
. | +0.818 |
Neg logit contributions | |
lor | -8.002 |
arians | -7.815 |
umm | -7.775 |
rol | -7.765 |
ides | -7.642 |
Token | her |
Token ID | 607 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.852 |
, | +2.695 |
the | +2.627 |
. | +2.514 |
a | +2.487 |
Neg logit contributions | |
lor | -6.177 |
arians | -6.107 |
rol | -6.011 |
ocol | -5.997 |
umm | -5.988 |
Token | friend |
Token ID | 1545 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.652 |
the | +3.564 |
, | +3.506 |
a | +3.450 |
. | +3.358 |
Neg logit contributions | |
arians | -5.371 |
lor | -5.288 |
umm | -5.175 |
ocol | -5.145 |
isher | -5.098 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.503 |
the | +1.452 |
, | +1.346 |
a | +1.327 |
. | +1.216 |
Neg logit contributions | |
lor | -7.381 |
arians | -7.343 |
rol | -7.218 |
umm | -7.114 |
osity | -7.062 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.588 |
the | +3.489 |
, | +3.466 |
. | +3.341 |
a | +3.337 |
Neg logit contributions | |
lor | -5.550 |
rol | -5.372 |
arians | -5.341 |
umm | -5.338 |
osity | -5.253 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.469 |
, | +1.364 |
the | +1.337 |
a | +1.182 |
. | +1.144 |
Neg logit contributions | |
lor | -7.652 |
rol | -7.337 |
arians | -7.230 |
umm | -7.217 |
ides | -7.161 |
Token | upon |
Token ID | 2402 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.292 |
the | +4.163 |
, | +4.112 |
. | +4.026 |
a | +4.025 |
Neg logit contributions | |
lor | -4.809 |
rol | -4.627 |
umm | -4.588 |
arians | -4.575 |
ocol | -4.532 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.480 |
, | +0.441 |
the | +0.358 |
. | +0.214 |
a | +0.010 |
Neg logit contributions | |
lor | -8.540 |
rol | -8.271 |
arians | -8.220 |
umm | -8.199 |
ides | -8.171 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.500 |
the | +2.473 |
, | +2.368 |
. | +2.278 |
a | +2.250 |
Neg logit contributions | |
lor | -6.612 |
umm | -6.426 |
arians | -6.390 |
rol | -6.371 |
ides | -6.339 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.236 |
the | +0.149 |
, | +0.017 |
. | +0.003 |
a | -0.038 |
Neg logit contributions | |
lor | -8.890 |
rol | -8.683 |
arians | -8.669 |
umm | -8.668 |
ocol | -8.580 |
Token | with |
Token ID | 351 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.039 |
the | +1.023 |
, | +0.930 |
a | +0.850 |
. | +0.818 |
Neg logit contributions | |
lor | -8.002 |
arians | -7.815 |
umm | -7.775 |
rol | -7.765 |
ides | -7.642 |
Token | her |
Token ID | 607 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.852 |
, | +2.695 |
the | +2.627 |
. | +2.514 |
a | +2.487 |
Neg logit contributions | |
lor | -6.177 |
arians | -6.107 |
rol | -6.011 |
ocol | -5.997 |
umm | -5.988 |
Token | friend |
Token ID | 1545 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.652 |
the | +3.564 |
, | +3.506 |
a | +3.450 |
. | +3.358 |
Neg logit contributions | |
arians | -5.371 |
lor | -5.288 |
umm | -5.175 |
ocol | -5.145 |
isher | -5.098 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.503 |
the | +1.452 |
, | +1.346 |
a | +1.327 |
. | +1.216 |
Neg logit contributions | |
lor | -7.381 |
arians | -7.343 |
rol | -7.218 |
umm | -7.114 |
osity | -7.062 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.588 |
the | +3.489 |
, | +3.466 |
. | +3.341 |
a | +3.337 |
Neg logit contributions | |
lor | -5.550 |
rol | -5.372 |
arians | -5.341 |
umm | -5.338 |
osity | -5.253 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.469 |
, | +1.364 |
the | +1.337 |
a | +1.182 |
. | +1.144 |
Neg logit contributions | |
lor | -7.652 |
rol | -7.337 |
arians | -7.230 |
umm | -7.217 |
ides | -7.161 |
Token | upon |
Token ID | 2402 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.292 |
the | +4.163 |
, | +4.112 |
. | +4.026 |
a | +4.025 |
Neg logit contributions | |
lor | -4.809 |
rol | -4.627 |
umm | -4.588 |
arians | -4.575 |
ocol | -4.532 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.480 |
, | +0.441 |
the | +0.358 |
. | +0.214 |
a | +0.010 |
Neg logit contributions | |
lor | -8.540 |
rol | -8.271 |
arians | -8.220 |
umm | -8.199 |
ides | -8.171 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.500 |
the | +2.473 |
, | +2.368 |
. | +2.278 |
a | +2.250 |
Neg logit contributions | |
lor | -6.612 |
umm | -6.426 |
arians | -6.390 |
rol | -6.371 |
ides | -6.339 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.236 |
the | +0.149 |
, | +0.017 |
. | +0.003 |
a | -0.038 |
Neg logit contributions | |
lor | -8.890 |
rol | -8.683 |
arians | -8.669 |
umm | -8.668 |
ocol | -8.580 |
Token | there |
Token ID | 612 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.894 |
the | +1.762 |
, | +1.734 |
. | +1.663 |
a | +1.549 |
Neg logit contributions | |
lor | -7.186 |
rol | -7.012 |
arians | -6.939 |
umm | -6.924 |
osity | -6.888 |
Token |
|
Token ID | 198 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.008 |
the | +2.866 |
, | +2.833 |
. | +2.711 |
a | +2.658 |
Neg logit contributions | |
lor | -6.162 |
arians | -5.991 |
umm | -5.930 |
rol | -5.905 |
osity | -5.865 |
Token |
|
Token ID | 198 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.487 |
the | +1.350 |
, | +1.350 |
. | +1.192 |
a | +1.164 |
Neg logit contributions | |
lor | -7.691 |
arians | -7.440 |
rol | -7.414 |
ocol | -7.355 |
ides | -7.337 |
Token | The |
Token ID | 464 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.219 |
the | +4.114 |
, | +4.076 |
. | +3.967 |
a | +3.926 |
Neg logit contributions | |
lor | -5.013 |
arians | -4.828 |
rol | -4.766 |
umm | -4.752 |
ocol | -4.702 |
Token | end |
Token ID | 886 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.307 |
the | +4.197 |
, | +4.179 |
. | +4.042 |
a | +3.967 |
Neg logit contributions | |
lor | -4.799 |
arians | -4.733 |
umm | -4.712 |
ocol | -4.604 |
isher | -4.573 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.507 |
the | +0.433 |
, | +0.329 |
a | +0.244 |
. | +0.148 |
Neg logit contributions | |
lor | -8.608 |
umm | -8.427 |
arians | -8.420 |
rol | -8.373 |
ides | -8.324 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.806 |
, | +2.678 |
the | +2.644 |
. | +2.534 |
a | +2.463 |
Neg logit contributions | |
lor | -6.520 |
umm | -6.219 |
arians | -6.216 |
rol | -6.205 |
osity | -6.163 |
Token | A |
Token ID | 32 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.261 |
the | +4.145 |
, | +4.123 |
a | +3.966 |
. | +3.959 |
Neg logit contributions | |
lor | -4.940 |
rol | -4.659 |
umm | -4.631 |
arians | -4.575 |
ocol | -4.552 |
Token | woman |
Token ID | 2415 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.780 |
the | +3.712 |
, | +3.599 |
a | +3.532 |
. | +3.530 |
Neg logit contributions | |
lor | -5.371 |
umm | -5.211 |
arians | -5.157 |
rol | -5.073 |
ides | -5.065 |
Token | had |
Token ID | 550 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +2.974 |
and | +2.971 |
, | +2.884 |
a | +2.822 |
. | +2.814 |
Neg logit contributions | |
lor | -6.019 |
arians | -5.838 |
rol | -5.783 |
umm | -5.723 |
ocol | -5.699 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.024 |
, | +2.913 |
the | +2.911 |
. | +2.795 |
a | +2.633 |
Neg logit contributions | |
lor | -6.170 |
rol | -5.966 |
ocol | -5.852 |
arians | -5.820 |
umm | -5.802 |
Token | broken |
Token ID | 5445 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.361 |
the | +4.289 |
, | +4.177 |
. | +4.139 |
a | +4.047 |
Neg logit contributions | |
lor | -4.729 |
umm | -4.613 |
arians | -4.568 |
rol | -4.513 |
ocol | -4.504 |
Token | night |
Token ID | 1755 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.624 |
the | +4.618 |
, | +4.489 |
. | +4.398 |
a | +4.367 |
Neg logit contributions | |
lor | -4.484 |
umm | -4.334 |
arians | -4.278 |
rol | -4.245 |
ides | -4.228 |
Token | 's |
Token ID | 338 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +3.013 |
and | +3.013 |
, | +2.877 |
a | +2.839 |
. | +2.687 |
Neg logit contributions | |
lor | -6.047 |
umm | -5.912 |
arians | -5.782 |
rol | -5.752 |
ides | -5.743 |
Token | sleep |
Token ID | 3993 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.281 |
the | +5.265 |
, | +5.151 |
a | +4.997 |
. | +4.961 |
Neg logit contributions | |
lor | -3.748 |
umm | -3.609 |
arians | -3.592 |
ides | -3.528 |
ocol | -3.502 |
Token | again |
Token ID | 757 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +3.241 |
and | +3.236 |
, | +3.105 |
a | +3.038 |
. | +2.858 |
Neg logit contributions | |
lor | -5.942 |
arians | -5.678 |
umm | -5.618 |
ides | -5.557 |
rol | -5.553 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.567 |
and | +0.563 |
a | +0.432 |
, | +0.429 |
. | +0.081 |
Neg logit contributions | |
lor | -8.359 |
arians | -8.103 |
ides | -8.076 |
umm | -8.041 |
beh | -7.976 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.481 |
, | +1.381 |
the | +1.349 |
. | +1.234 |
a | +1.167 |
Neg logit contributions | |
lor | -7.699 |
umm | -7.485 |
arians | -7.433 |
rol | -7.427 |
osity | -7.351 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.947 |
, | +1.842 |
the | +1.821 |
a | +1.651 |
. | +1.633 |
Neg logit contributions | |
lor | -7.213 |
rol | -6.899 |
umm | -6.809 |
arians | -6.802 |
ides | -6.725 |
Token | upon |
Token ID | 2402 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.125 |
the | +4.009 |
, | +3.949 |
a | +3.868 |
. | +3.868 |
Neg logit contributions | |
lor | -4.970 |
rol | -4.768 |
umm | -4.738 |
arians | -4.736 |
osity | -4.674 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.449 |
, | +0.394 |
the | +0.326 |
. | +0.193 |
a | +0.024 |
Neg logit contributions | |
lor | -8.589 |
rol | -8.319 |
arians | -8.277 |
umm | -8.251 |
ides | -8.223 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.474 |
the | +2.431 |
, | +2.340 |
. | +2.240 |
a | +2.213 |
Neg logit contributions | |
lor | -6.656 |
umm | -6.446 |
arians | -6.431 |
rol | -6.406 |
ides | -6.366 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.231 |
the | +0.139 |
, | +0.017 |
. | -0.007 |
a | -0.042 |
Neg logit contributions | |
lor | -8.890 |
rol | -8.679 |
arians | -8.673 |
umm | -8.663 |
ocol | -8.584 |
Token | mighty |
Token ID | 18680 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.940 |
the | +4.825 |
, | +4.799 |
. | +4.671 |
a | +4.518 |
Neg logit contributions | |
lor | -4.249 |
arians | -4.224 |
umm | -4.068 |
ides | -3.952 |
ocol | -3.940 |
Token | lion |
Token ID | 18744 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.792 |
the | +4.765 |
, | +4.619 |
. | +4.549 |
a | +4.526 |
Neg logit contributions | |
lor | -4.330 |
arians | -4.261 |
umm | -4.192 |
ocol | -4.114 |
ides | -4.113 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.837 |
the | +2.720 |
, | +2.708 |
. | +2.557 |
a | +2.491 |
Neg logit contributions | |
lor | -6.301 |
rol | -6.052 |
arians | -6.049 |
umm | -5.964 |
osity | -5.938 |
Token | shiny |
Token ID | 22441 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.857 |
the | +4.777 |
, | +4.664 |
. | +4.616 |
a | +4.462 |
Neg logit contributions | |
lor | -4.333 |
bek | -4.059 |
umm | -4.055 |
arians | -4.045 |
rol | -3.996 |
Token | red |
Token ID | 2266 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.014 |
the | +4.972 |
, | +4.855 |
. | +4.786 |
a | +4.743 |
Neg logit contributions | |
lor | -4.090 |
umm | -3.938 |
arians | -3.906 |
ocol | -3.859 |
rol | -3.852 |
Token | apple |
Token ID | 17180 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.819 |
the | +4.780 |
, | +4.669 |
. | +4.576 |
a | +4.552 |
Neg logit contributions | |
lor | -4.316 |
umm | -4.146 |
arians | -4.124 |
rol | -4.073 |
ocol | -4.034 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.979 |
and | +1.962 |
, | +1.841 |
a | +1.751 |
. | +1.660 |
Neg logit contributions | |
lor | -7.073 |
umm | -6.894 |
arians | -6.855 |
rol | -6.842 |
ides | -6.749 |
Token | The |
Token ID | 383 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.828 |
, | +3.751 |
the | +3.717 |
. | +3.636 |
a | +3.551 |
Neg logit contributions | |
lor | -5.371 |
arians | -5.216 |
umm | -5.205 |
rol | -5.167 |
osity | -5.087 |
Token | lion |
Token ID | 18744 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.900 |
, | +4.768 |
the | +4.721 |
. | +4.661 |
a | +4.482 |
Neg logit contributions | |
arians | -4.245 |
lor | -4.148 |
umm | -4.119 |
icians | -3.985 |
ocol | -3.975 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.555 |
the | +3.551 |
, | +3.469 |
. | +3.428 |
a | +3.372 |
Neg logit contributions | |
lor | -5.482 |
arians | -5.341 |
rol | -5.231 |
umm | -5.182 |
ides | -5.141 |
Token | very |
Token ID | 845 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.242 |
, | +3.132 |
. | +3.087 |
the | +3.053 |
a | +2.808 |
Neg logit contributions | |
lor | -5.764 |
rol | -5.714 |
arians | -5.541 |
icians | -5.446 |
beh | -5.443 |
Token | they |
Token ID | 484 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.096 |
, | +4.993 |
the | +4.963 |
. | +4.895 |
a | +4.852 |
Neg logit contributions | |
lor | -3.939 |
arians | -3.854 |
umm | -3.765 |
rol | -3.717 |
osity | -3.679 |
Token | all |
Token ID | 477 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.634 |
the | +3.522 |
, | +3.501 |
. | +3.391 |
a | +3.359 |
Neg logit contributions | |
lor | -5.487 |
arians | -5.346 |
rol | -5.294 |
umm | -5.290 |
ides | -5.211 |
Token | have |
Token ID | 423 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.735 |
the | +3.593 |
, | +3.591 |
. | +3.468 |
a | +3.452 |
Neg logit contributions | |
lor | -5.394 |
rol | -5.230 |
arians | -5.204 |
umm | -5.202 |
osity | -5.134 |
Token | fun |
Token ID | 1257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.025 |
, | +2.904 |
the | +2.852 |
. | +2.767 |
a | +2.600 |
Neg logit contributions | |
lor | -6.065 |
arians | -5.850 |
rol | -5.835 |
umm | -5.776 |
ides | -5.747 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.298 |
the | +2.249 |
, | +2.157 |
a | +2.059 |
. | +2.017 |
Neg logit contributions | |
lor | -6.781 |
arians | -6.668 |
umm | -6.618 |
rol | -6.585 |
ocol | -6.548 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.798 |
, | +2.721 |
the | +2.643 |
. | +2.584 |
a | +2.461 |
Neg logit contributions | |
lor | -6.301 |
umm | -6.157 |
rol | -6.075 |
arians | -6.068 |
osity | -6.034 |
Token | Anna |
Token ID | 31160 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.084 |
the | +2.960 |
, | +2.946 |
a | +2.781 |
. | +2.780 |
Neg logit contributions | |
lor | -6.055 |
rol | -5.756 |
umm | -5.703 |
arians | -5.699 |
ides | -5.597 |
Token | is |
Token ID | 318 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.236 |
the | +3.198 |
, | +3.120 |
. | +3.056 |
a | +3.038 |
Neg logit contributions | |
lor | -5.800 |
arians | -5.599 |
umm | -5.561 |
rol | -5.544 |
ocol | -5.478 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.217 |
the | +3.095 |
, | +3.080 |
. | +3.010 |
a | +2.867 |
Neg logit contributions | |
lor | -5.852 |
rol | -5.735 |
umm | -5.696 |
arians | -5.695 |
ocol | -5.656 |
Token | big |
Token ID | 1263 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.931 |
the | +2.838 |
, | +2.781 |
. | +2.703 |
a | +2.641 |
Neg logit contributions | |
lor | -6.092 |
umm | -5.989 |
arians | -5.960 |
bek | -5.856 |
ocol | -5.828 |
Token | girl |
Token ID | 2576 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.746 |
the | +3.678 |
, | +3.606 |
. | +3.548 |
a | +3.512 |
Neg logit contributions | |
lor | -5.279 |
umm | -5.180 |
arians | -5.158 |
rol | -5.059 |
ocol | -5.052 |
Token | coins |
Token ID | 10796 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.279 |
, | +3.121 |
the | +3.072 |
. | +3.032 |
a | +2.850 |
Neg logit contributions | |
lor | -5.745 |
rol | -5.615 |
arians | -5.591 |
ocol | -5.582 |
isher | -5.541 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.695 |
the | +1.679 |
, | +1.538 |
a | +1.519 |
. | +1.476 |
Neg logit contributions | |
lor | -7.283 |
arians | -7.138 |
rol | -7.100 |
umm | -7.033 |
ides | -7.031 |
Token | buttons |
Token ID | 12163 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.155 |
, | +4.103 |
the | +4.083 |
. | +4.049 |
a | +3.890 |
Neg logit contributions | |
lor | -4.748 |
arians | -4.728 |
rol | -4.673 |
ocol | -4.623 |
umm | -4.616 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.395 |
the | +1.381 |
, | +1.233 |
a | +1.218 |
. | +1.189 |
Neg logit contributions | |
lor | -7.597 |
arians | -7.497 |
rol | -7.449 |
umm | -7.390 |
ides | -7.376 |
Token | or |
Token ID | 393 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.085 |
the | +4.077 |
, | +4.032 |
. | +3.996 |
a | +3.872 |
Neg logit contributions | |
lor | -4.826 |
arians | -4.741 |
ocol | -4.650 |
rol | -4.644 |
umm | -4.604 |
Token | shells |
Token ID | 19679 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.164 |
, | +5.029 |
the | +5.001 |
. | +4.931 |
a | +4.778 |
Neg logit contributions | |
lor | -3.797 |
arians | -3.776 |
ocol | -3.710 |
umm | -3.650 |
rol | -3.623 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.116 |
the | +2.107 |
a | +1.964 |
, | +1.954 |
. | +1.830 |
Neg logit contributions | |
lor | -6.900 |
arians | -6.739 |
rol | -6.720 |
ides | -6.674 |
ocol | -6.652 |
Token | But |
Token ID | 887 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.997 |
the | +3.906 |
, | +3.870 |
. | +3.717 |
a | +3.708 |
Neg logit contributions | |
lor | -5.164 |
arians | -5.092 |
rol | -5.030 |
umm | -4.994 |
osity | -4.913 |
Token | today |
Token ID | 1909 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.201 |
. | +2.996 |
, | +2.948 |
the | +2.928 |
a | +2.807 |
Neg logit contributions | |
lor | -5.806 |
arians | -5.789 |
ocol | -5.738 |
umm | -5.687 |
osity | -5.679 |
Token | they |
Token ID | 484 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.127 |
the | +1.971 |
, | +1.886 |
a | +1.842 |
. | +1.837 |
Neg logit contributions | |
lor | -7.038 |
umm | -6.815 |
arians | -6.798 |
rol | -6.750 |
ides | -6.647 |
Token | found |
Token ID | 1043 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.466 |
the | +3.362 |
, | +3.326 |
. | +3.230 |
a | +3.193 |
Neg logit contributions | |
lor | -5.688 |
arians | -5.537 |
rol | -5.489 |
umm | -5.488 |
ides | -5.413 |
Token | single |
Token ID | 2060 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.368 |
the | +4.290 |
, | +4.227 |
. | +4.123 |
a | +4.046 |
Neg logit contributions | |
lor | -4.736 |
umm | -4.556 |
arians | -4.525 |
rol | -4.497 |
bek | -4.476 |
Token | day |
Token ID | 1110 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.021 |
the | +3.978 |
, | +3.864 |
a | +3.766 |
. | +3.736 |
Neg logit contributions | |
lor | -5.064 |
umm | -4.960 |
arians | -4.900 |
rol | -4.829 |
ocol | -4.810 |
Token | spent |
Token ID | 3377 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.026 |
the | +2.014 |
, | +1.882 |
a | +1.853 |
. | +1.746 |
Neg logit contributions | |
lor | -6.989 |
arians | -6.878 |
umm | -6.809 |
rol | -6.772 |
ides | -6.725 |
Token | together |
Token ID | 1978 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.425 |
, | +3.303 |
the | +3.283 |
. | +3.203 |
a | +3.161 |
Neg logit contributions | |
lor | -5.598 |
arians | -5.399 |
umm | -5.287 |
rol | -5.249 |
icians | -5.219 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.757 |
the | +2.741 |
, | +2.617 |
a | +2.581 |
. | +2.498 |
Neg logit contributions | |
lor | -6.261 |
arians | -6.121 |
umm | -6.051 |
rol | -6.047 |
ides | -5.975 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.056 |
, | +3.945 |
the | +3.939 |
. | +3.828 |
a | +3.776 |
Neg logit contributions | |
lor | -5.241 |
arians | -5.016 |
rol | -4.913 |
umm | -4.879 |
osity | -4.822 |
Token | M |
Token ID | 44 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.915 |
the | +3.815 |
, | +3.782 |
a | +3.638 |
. | +3.607 |
Neg logit contributions | |
lor | -5.257 |
rol | -5.005 |
arians | -4.911 |
umm | -4.900 |
ides | -4.790 |
Token | um |
Token ID | 388 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +6.193 |
the | +6.096 |
, | +6.033 |
. | +5.939 |
a | +5.910 |
Neg logit contributions | |
lor | -3.064 |
umm | -2.862 |
arians | -2.859 |
rol | -2.822 |
ocol | -2.737 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.160 |
the | +2.113 |
, | +2.053 |
. | +1.996 |
a | +1.970 |
Neg logit contributions | |
lor | -6.871 |
arians | -6.690 |
rol | -6.682 |
umm | -6.627 |
ocol | -6.557 |
Token | Dad |
Token ID | 17415 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.377 |
, | +4.250 |
the | +4.205 |
. | +4.187 |
a | +4.040 |
Neg logit contributions | |
lor | -4.672 |
rol | -4.567 |
umm | -4.520 |
arians | -4.511 |
ocol | -4.458 |
Token | were |
Token ID | 547 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.313 |
the | +3.233 |
, | +3.175 |
. | +3.094 |
a | +3.071 |
Neg logit contributions | |
lor | -5.767 |
arians | -5.615 |
rol | -5.610 |
umm | -5.585 |
osity | -5.491 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.500 |
the | +4.499 |
, | +4.384 |
a | +4.296 |
. | +4.275 |
Neg logit contributions | |
lor | -4.529 |
arians | -4.360 |
rol | -4.352 |
isher | -4.310 |
umm | -4.293 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.836 |
, | +3.748 |
. | +3.688 |
the | +3.673 |
a | +3.536 |
Neg logit contributions | |
lor | -5.176 |
arians | -5.095 |
osity | -5.071 |
umm | -5.015 |
bek | -4.962 |
Token | very |
Token ID | 845 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.029 |
, | +3.900 |
the | +3.823 |
. | +3.773 |
a | +3.605 |
Neg logit contributions | |
lor | -5.060 |
rol | -4.869 |
arians | -4.842 |
osity | -4.796 |
beh | -4.795 |
Token | happy |
Token ID | 3772 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.416 |
the | +4.243 |
, | +4.242 |
. | +4.123 |
a | +4.048 |
Neg logit contributions | |
lor | -4.606 |
osity | -4.558 |
beh | -4.558 |
umm | -4.549 |
ocol | -4.538 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.502 |
the | +1.451 |
, | +1.377 |
a | +1.279 |
. | +1.233 |
Neg logit contributions | |
lor | -7.583 |
umm | -7.473 |
arians | -7.433 |
rol | -7.356 |
osity | -7.318 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.234 |
, | +2.110 |
the | +2.103 |
. | +1.976 |
a | +1.947 |
Neg logit contributions | |
lor | -7.001 |
umm | -6.780 |
rol | -6.724 |
arians | -6.718 |
osity | -6.680 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.900 |
, | +2.784 |
the | +2.780 |
a | +2.618 |
. | +2.580 |
Neg logit contributions | |
lor | -6.267 |
rol | -5.992 |
umm | -5.890 |
arians | -5.871 |
ides | -5.787 |
Token | upon |
Token ID | 2402 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.199 |
the | +4.073 |
, | +4.023 |
a | +3.939 |
. | +3.934 |
Neg logit contributions | |
lor | -4.896 |
rol | -4.705 |
umm | -4.673 |
arians | -4.671 |
osity | -4.614 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.453 |
, | +0.397 |
the | +0.330 |
. | +0.192 |
a | +0.010 |
Neg logit contributions | |
lor | -8.599 |
rol | -8.326 |
arians | -8.290 |
umm | -8.240 |
ides | -8.229 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.469 |
the | +2.432 |
, | +2.341 |
. | +2.239 |
a | +2.212 |
Neg logit contributions | |
lor | -6.653 |
umm | -6.459 |
arians | -6.440 |
rol | -6.410 |
ides | -6.369 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.235 |
the | +0.138 |
, | +0.019 |
. | -0.000 |
a | -0.039 |
Neg logit contributions | |
lor | -8.879 |
rol | -8.679 |
arians | -8.669 |
umm | -8.665 |
ocol | -8.585 |
Token | mission |
Token ID | 4365 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.892 |
the | +4.807 |
, | +4.735 |
. | +4.660 |
a | +4.648 |
Neg logit contributions | |
umm | -4.145 |
lor | -4.145 |
arians | -4.108 |
isher | -4.009 |
ocol | -3.997 |
Token | had |
Token ID | 550 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.992 |
the | +2.953 |
, | +2.875 |
a | +2.791 |
. | +2.741 |
Neg logit contributions | |
lor | -6.096 |
arians | -5.882 |
rol | -5.838 |
ides | -5.770 |
umm | -5.761 |
Token | been |
Token ID | 587 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.691 |
, | +4.554 |
the | +4.476 |
. | +4.414 |
a | +4.286 |
Neg logit contributions | |
lor | -4.477 |
rol | -4.246 |
arians | -4.228 |
umm | -4.180 |
ides | -4.139 |
Token | accomplished |
Token ID | 13013 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.828 |
, | +4.652 |
the | +4.618 |
. | +4.517 |
a | +4.448 |
Neg logit contributions | |
lor | -4.273 |
arians | -4.090 |
rol | -4.084 |
umm | -4.003 |
isher | -3.959 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.909 |
the | +1.886 |
, | +1.792 |
a | +1.693 |
. | +1.632 |
Neg logit contributions | |
lor | -7.171 |
arians | -6.882 |
ides | -6.810 |
rol | -6.802 |
umm | -6.800 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.997 |
, | +1.899 |
the | +1.865 |
. | +1.772 |
a | +1.711 |
Neg logit contributions | |
lor | -7.299 |
umm | -7.007 |
rol | -7.005 |
arians | -7.001 |
osity | -6.898 |
Token | One |
Token ID | 3198 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.027 |
the | +3.922 |
, | +3.898 |
a | +3.755 |
. | +3.719 |
Neg logit contributions | |
lor | -5.151 |
rol | -4.903 |
umm | -4.811 |
arians | -4.792 |
ides | -4.688 |
Token | day |
Token ID | 1110 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.937 |
, | +2.768 |
the | +2.767 |
. | +2.649 |
a | +2.577 |
Neg logit contributions | |
lor | -6.050 |
rol | -5.940 |
umm | -5.925 |
osity | -5.822 |
ocol | -5.803 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.481 |
the | +0.373 |
, | +0.289 |
. | +0.225 |
a | +0.177 |
Neg logit contributions | |
lor | -8.675 |
rol | -8.467 |
arians | -8.465 |
umm | -8.449 |
ocol | -8.372 |
Token | Max |
Token ID | 5436 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.471 |
the | +1.341 |
, | +1.296 |
. | +1.224 |
a | +1.086 |
Neg logit contributions | |
lor | -7.566 |
rol | -7.444 |
arians | -7.353 |
umm | -7.342 |
osity | -7.288 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.196 |
the | +2.161 |
, | +2.103 |
. | +2.029 |
a | +1.967 |
Neg logit contributions | |
lor | -6.793 |
rol | -6.561 |
umm | -6.556 |
arians | -6.543 |
ides | -6.455 |
Token | see |
Token ID | 766 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.486 |
, | +3.417 |
the | +3.272 |
. | +3.264 |
a | +3.105 |
Neg logit contributions | |
lor | -5.626 |
arians | -5.489 |
umm | -5.333 |
osity | -5.299 |
ides | -5.273 |
Token | it |
Token ID | 340 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.401 |
, | +2.315 |
. | +2.150 |
the | +2.147 |
a | +2.000 |
Neg logit contributions | |
lor | -6.581 |
arians | -6.409 |
ocol | -6.343 |
umm | -6.343 |
rol | -6.341 |
Token | again |
Token ID | 757 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.104 |
the | +3.087 |
, | +2.992 |
a | +2.907 |
. | +2.862 |
Neg logit contributions | |
lor | -5.871 |
rol | -5.651 |
arians | -5.642 |
ides | -5.544 |
osity | -5.517 |
Token | soon |
Token ID | 2582 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +3.033 |
and | +3.024 |
, | +2.932 |
a | +2.896 |
. | +2.771 |
Neg logit contributions | |
lor | -5.802 |
arians | -5.669 |
bek | -5.565 |
umm | -5.525 |
ides | -5.503 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.132 |
the | +1.123 |
a | +1.024 |
, | +0.998 |
. | +0.838 |
Neg logit contributions | |
lor | -7.854 |
arians | -7.666 |
ides | -7.592 |
umm | -7.565 |
rol | -7.537 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.793 |
the | +2.684 |
, | +2.672 |
. | +2.582 |
a | +2.508 |
Neg logit contributions | |
lor | -6.417 |
umm | -6.180 |
arians | -6.143 |
rol | -6.137 |
osity | -6.076 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.662 |
the | +2.546 |
, | +2.536 |
a | +2.373 |
. | +2.345 |
Neg logit contributions | |
lor | -6.524 |
rol | -6.247 |
arians | -6.151 |
umm | -6.128 |
ides | -6.032 |
Token | upon |
Token ID | 2402 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.189 |
the | +4.064 |
, | +4.011 |
a | +3.928 |
. | +3.927 |
Neg logit contributions | |
lor | -4.925 |
rol | -4.729 |
arians | -4.704 |
umm | -4.685 |
osity | -4.626 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.433 |
, | +0.377 |
the | +0.321 |
. | +0.184 |
a | +0.012 |
Neg logit contributions | |
lor | -8.613 |
rol | -8.357 |
arians | -8.306 |
umm | -8.263 |
ides | -8.247 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.473 |
the | +2.436 |
, | +2.345 |
. | +2.239 |
a | +2.210 |
Neg logit contributions | |
lor | -6.658 |
umm | -6.440 |
arians | -6.433 |
rol | -6.415 |
ides | -6.365 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.250 |
the | +0.156 |
, | +0.017 |
. | +0.016 |
a | -0.026 |
Neg logit contributions | |
lor | -8.856 |
rol | -8.654 |
arians | -8.638 |
umm | -8.617 |
ocol | -8.561 |
Token | seen |
Token ID | 1775 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.261 |
, | +3.116 |
the | +3.017 |
. | +2.986 |
a | +2.804 |
Neg logit contributions | |
lor | -5.998 |
umm | -5.667 |
rol | -5.665 |
arians | -5.601 |
ides | -5.532 |
Token | the |
Token ID | 262 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.212 |
, | +2.075 |
. | +1.880 |
the | +1.863 |
a | +1.744 |
Neg logit contributions | |
lor | -6.874 |
umm | -6.689 |
rol | -6.686 |
ocol | -6.651 |
arians | -6.648 |
Token | beautiful |
Token ID | 4950 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.915 |
, | +3.814 |
the | +3.800 |
. | +3.655 |
a | +3.559 |
Neg logit contributions | |
lor | -5.291 |
umm | -5.161 |
arians | -5.082 |
rol | -5.001 |
osity | -4.936 |
Token | landscape |
Token ID | 10747 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.863 |
the | +3.809 |
, | +3.733 |
a | +3.643 |
. | +3.636 |
Neg logit contributions | |
lor | -5.273 |
umm | -5.100 |
arians | -5.007 |
rol | -4.973 |
ocol | -4.939 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.321 |
the | +2.240 |
, | +2.182 |
a | +2.103 |
. | +2.015 |
Neg logit contributions | |
lor | -6.778 |
rol | -6.610 |
umm | -6.605 |
arians | -6.546 |
osity | -6.435 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.401 |
, | +2.278 |
the | +2.271 |
. | +2.149 |
a | +2.120 |
Neg logit contributions | |
lor | -6.795 |
rol | -6.594 |
umm | -6.593 |
arians | -6.542 |
osity | -6.470 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.610 |
the | +1.486 |
, | +1.481 |
a | +1.314 |
. | +1.275 |
Neg logit contributions | |
lor | -7.530 |
rol | -7.247 |
umm | -7.144 |
arians | -7.134 |
ides | -7.046 |
Token | upon |
Token ID | 2402 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.189 |
the | +4.066 |
, | +4.012 |
a | +3.926 |
. | +3.925 |
Neg logit contributions | |
lor | -4.911 |
rol | -4.725 |
umm | -4.698 |
arians | -4.689 |
osity | -4.623 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.421 |
, | +0.348 |
the | +0.306 |
. | +0.164 |
a | +0.019 |
Neg logit contributions | |
lor | -8.652 |
rol | -8.397 |
arians | -8.356 |
umm | -8.334 |
ides | -8.292 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.456 |
the | +2.407 |
, | +2.325 |
. | +2.220 |
a | +2.192 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.478 |
arians | -6.463 |
rol | -6.442 |
ides | -6.388 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.225 |
the | +0.134 |
, | +0.012 |
. | -0.012 |
a | -0.050 |
Neg logit contributions | |
lor | -8.899 |
rol | -8.695 |
arians | -8.681 |
umm | -8.676 |
ocol | -8.595 |
Token | out |
Token ID | 503 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.583 |
the | +2.472 |
, | +2.432 |
. | +2.300 |
a | +2.276 |
Neg logit contributions | |
lor | -6.749 |
arians | -6.545 |
umm | -6.537 |
rol | -6.465 |
ides | -6.411 |
Token | the |
Token ID | 262 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.373 |
, | +1.247 |
the | +1.242 |
. | +1.157 |
a | +1.101 |
Neg logit contributions | |
lor | -7.689 |
rol | -7.552 |
umm | -7.529 |
arians | -7.522 |
ocol | -7.481 |
Token | window |
Token ID | 4324 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.489 |
the | +4.421 |
, | +4.392 |
. | +4.300 |
a | +4.252 |
Neg logit contributions | |
lor | -4.692 |
umm | -4.540 |
arians | -4.510 |
rol | -4.485 |
osity | -4.397 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.702 |
and | +0.639 |
, | +0.543 |
a | +0.523 |
. | +0.507 |
Neg logit contributions | |
lor | -8.201 |
umm | -8.113 |
rol | -8.057 |
arians | -8.039 |
osity | -7.990 |
Token | saw |
Token ID | 2497 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.693 |
, | +2.540 |
the | +2.515 |
. | +2.498 |
a | +2.391 |
Neg logit contributions | |
lor | -6.331 |
arians | -6.211 |
rol | -6.205 |
umm | -6.140 |
osity | -6.132 |
Token | cherry |
Token ID | 23612 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.381 |
, | +1.253 |
. | +1.158 |
the | +1.143 |
a | +0.921 |
Neg logit contributions | |
lor | -7.719 |
rol | -7.575 |
umm | -7.493 |
arians | -7.478 |
isher | -7.423 |
Token | trees |
Token ID | 7150 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.260 |
the | +4.186 |
, | +4.125 |
a | +4.040 |
. | +4.018 |
Neg logit contributions | |
lor | -4.842 |
umm | -4.714 |
arians | -4.697 |
rol | -4.653 |
ocol | -4.527 |
Token | growing |
Token ID | 3957 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.039 |
the | +1.015 |
, | +0.907 |
a | +0.874 |
. | +0.806 |
Neg logit contributions | |
lor | -7.940 |
rol | -7.789 |
arians | -7.784 |
umm | -7.773 |
osity | -7.656 |
Token | all |
Token ID | 477 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.181 |
the | +2.107 |
, | +2.062 |
a | +1.933 |
. | +1.894 |
Neg logit contributions | |
lor | -6.861 |
rol | -6.793 |
umm | -6.772 |
arians | -6.616 |
ocol | -6.589 |
Token | around |
Token ID | 1088 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.782 |
, | +2.630 |
the | +2.600 |
a | +2.529 |
. | +2.474 |
Neg logit contributions | |
lor | -6.261 |
rol | -6.233 |
umm | -6.203 |
arians | -6.056 |
osity | -6.038 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.468 |
, | +1.318 |
the | +1.235 |
a | +1.176 |
. | +1.107 |
Neg logit contributions | |
lor | -7.457 |
umm | -7.363 |
ocol | -7.360 |
arians | -7.319 |
rol | -7.297 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +3.396 |
and | +3.360 |
, | +3.305 |
a | +3.240 |
. | +3.237 |
Neg logit contributions | |
lor | -5.675 |
arians | -5.527 |
rol | -5.416 |
umm | -5.371 |
ides | -5.354 |
Token | Morris |
Token ID | 14433 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +6.320 |
, | +6.128 |
. | +6.086 |
the | +6.077 |
a | +5.965 |
Neg logit contributions | |
lor | -2.917 |
arians | -2.776 |
umm | -2.693 |
rol | -2.653 |
osity | -2.640 |
Token | became |
Token ID | 2627 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.142 |
the | +4.074 |
, | +4.007 |
. | +3.931 |
a | +3.922 |
Neg logit contributions | |
lor | -4.916 |
arians | -4.814 |
rol | -4.767 |
ides | -4.674 |
osity | -4.631 |
Token | friends |
Token ID | 2460 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.110 |
, | +2.906 |
the | +2.828 |
. | +2.805 |
a | +2.664 |
Neg logit contributions | |
lor | -5.889 |
arians | -5.841 |
rol | -5.828 |
umm | -5.781 |
beh | -5.702 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.892 |
the | +2.879 |
, | +2.778 |
a | +2.703 |
. | +2.642 |
Neg logit contributions | |
lor | -6.191 |
arians | -5.974 |
rol | -5.947 |
umm | -5.921 |
ides | -5.803 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.054 |
, | +3.923 |
the | +3.914 |
. | +3.811 |
a | +3.787 |
Neg logit contributions | |
lor | -5.225 |
rol | -5.011 |
umm | -4.966 |
arians | -4.947 |
osity | -4.865 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.743 |
the | +3.623 |
, | +3.608 |
a | +3.454 |
. | +3.425 |
Neg logit contributions | |
lor | -5.431 |
rol | -5.181 |
arians | -5.075 |
umm | -5.054 |
ides | -4.956 |
Token | upon |
Token ID | 2402 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.292 |
the | +4.155 |
, | +4.103 |
a | +4.029 |
. | +4.022 |
Neg logit contributions | |
lor | -4.806 |
rol | -4.625 |
arians | -4.575 |
umm | -4.566 |
osity | -4.531 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.474 |
, | +0.419 |
the | +0.355 |
. | +0.211 |
a | +0.009 |
Neg logit contributions | |
lor | -8.566 |
rol | -8.310 |
arians | -8.241 |
umm | -8.186 |
ides | -8.182 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.495 |
the | +2.473 |
, | +2.366 |
. | +2.264 |
a | +2.237 |
Neg logit contributions | |
lor | -6.618 |
umm | -6.406 |
arians | -6.384 |
rol | -6.378 |
ides | -6.332 |
Token | there |
Token ID | 612 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.254 |
the | +0.163 |
, | +0.024 |
. | +0.012 |
a | -0.026 |
Neg logit contributions | |
lor | -8.847 |
rol | -8.655 |
arians | -8.634 |
umm | -8.610 |
ocol | -8.553 |
Token | tree |
Token ID | 5509 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.070 |
the | +3.010 |
, | +2.947 |
a | +2.847 |
. | +2.836 |
Neg logit contributions | |
lor | -6.028 |
umm | -5.900 |
arians | -5.837 |
rol | -5.811 |
ocol | -5.711 |
Token | with |
Token ID | 351 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.036 |
the | +1.989 |
, | +1.922 |
a | +1.810 |
. | +1.796 |
Neg logit contributions | |
lor | -7.045 |
umm | -6.863 |
rol | -6.851 |
arians | -6.845 |
osity | -6.731 |
Token | lots |
Token ID | 6041 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.910 |
, | +2.803 |
the | +2.738 |
. | +2.676 |
a | +2.506 |
Neg logit contributions | |
lor | -6.210 |
umm | -6.098 |
rol | -6.086 |
arians | -5.990 |
ocol | -5.979 |
Token | of |
Token ID | 286 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.222 |
the | +2.190 |
, | +2.117 |
a | +2.022 |
. | +1.993 |
Neg logit contributions | |
lor | -6.833 |
umm | -6.748 |
rol | -6.685 |
ocol | -6.641 |
arians | -6.636 |
Token | cher |
Token ID | 21382 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.239 |
the | +5.132 |
, | +5.114 |
. | +5.000 |
a | +4.947 |
Neg logit contributions | |
lor | -3.860 |
umm | -3.748 |
rol | -3.714 |
arians | -3.700 |
ocol | -3.636 |
Token | ries |
Token ID | 1678 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +7.142 |
the | +7.039 |
, | +7.010 |
. | +6.904 |
a | +6.839 |
Neg logit contributions | |
lor | -2.023 |
arians | -1.856 |
umm | -1.828 |
rol | -1.801 |
osity | -1.725 |
Token | on |
Token ID | 319 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.172 |
the | +1.139 |
, | +1.058 |
a | +0.963 |
. | +0.896 |
Neg logit contributions | |
lor | -7.855 |
umm | -7.722 |
rol | -7.712 |
arians | -7.700 |
ides | -7.597 |
Token | it |
Token ID | 340 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.893 |
, | +2.773 |
the | +2.714 |
. | +2.597 |
a | +2.570 |
Neg logit contributions | |
lor | -6.177 |
umm | -5.985 |
arians | -5.969 |
rol | -5.887 |
ocol | -5.845 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.454 |
the | +0.449 |
, | +0.329 |
a | +0.265 |
. | +0.031 |
Neg logit contributions | |
lor | -8.488 |
rol | -8.288 |
arians | -8.274 |
umm | -8.249 |
ides | -8.209 |
Token | She |
Token ID | 1375 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.912 |
the | +2.807 |
, | +2.783 |
. | +2.684 |
a | +2.654 |
Neg logit contributions | |
lor | -6.221 |
umm | -6.049 |
arians | -6.000 |
rol | -5.998 |
osity | -5.895 |
Token | wanted |
Token ID | 2227 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.032 |
the | +2.937 |
, | +2.901 |
. | +2.802 |
a | +2.753 |
Neg logit contributions | |
lor | -6.149 |
arians | -5.983 |
umm | -5.961 |
rol | -5.940 |
ides | -5.839 |
Token | cherry |
Token ID | 23612 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.620 |
the | +3.545 |
, | +3.463 |
. | +3.422 |
a | +3.339 |
Neg logit contributions | |
lor | -5.484 |
umm | -5.341 |
arians | -5.309 |
bek | -5.211 |
rol | -5.197 |
Token | tree |
Token ID | 5509 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.070 |
the | +3.010 |
, | +2.947 |
a | +2.847 |
. | +2.836 |
Neg logit contributions | |
lor | -6.028 |
umm | -5.900 |
arians | -5.837 |
rol | -5.811 |
ocol | -5.711 |
Token | with |
Token ID | 351 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.036 |
the | +1.989 |
, | +1.922 |
a | +1.810 |
. | +1.796 |
Neg logit contributions | |
lor | -7.045 |
umm | -6.863 |
rol | -6.851 |
arians | -6.845 |
osity | -6.731 |
Token | lots |
Token ID | 6041 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.910 |
, | +2.803 |
the | +2.738 |
. | +2.676 |
a | +2.506 |
Neg logit contributions | |
lor | -6.210 |
umm | -6.098 |
rol | -6.086 |
arians | -5.990 |
ocol | -5.979 |
Token | of |
Token ID | 286 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.222 |
the | +2.190 |
, | +2.117 |
a | +2.022 |
. | +1.993 |
Neg logit contributions | |
lor | -6.833 |
umm | -6.748 |
rol | -6.685 |
ocol | -6.641 |
arians | -6.636 |
Token | cher |
Token ID | 21382 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.239 |
the | +5.132 |
, | +5.114 |
. | +5.000 |
a | +4.947 |
Neg logit contributions | |
lor | -3.860 |
umm | -3.748 |
rol | -3.714 |
arians | -3.700 |
ocol | -3.636 |
Token | ries |
Token ID | 1678 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +7.142 |
the | +7.039 |
, | +7.010 |
. | +6.904 |
a | +6.839 |
Neg logit contributions | |
lor | -2.023 |
arians | -1.856 |
umm | -1.828 |
rol | -1.801 |
osity | -1.725 |
Token | on |
Token ID | 319 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.172 |
the | +1.139 |
, | +1.058 |
a | +0.963 |
. | +0.896 |
Neg logit contributions | |
lor | -7.855 |
umm | -7.722 |
rol | -7.712 |
arians | -7.700 |
ides | -7.597 |
Token | it |
Token ID | 340 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.893 |
, | +2.773 |
the | +2.714 |
. | +2.597 |
a | +2.570 |
Neg logit contributions | |
lor | -6.177 |
umm | -5.985 |
arians | -5.969 |
rol | -5.887 |
ocol | -5.845 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.454 |
the | +0.449 |
, | +0.329 |
a | +0.265 |
. | +0.031 |
Neg logit contributions | |
lor | -8.488 |
rol | -8.288 |
arians | -8.274 |
umm | -8.249 |
ides | -8.209 |
Token | She |
Token ID | 1375 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.912 |
the | +2.807 |
, | +2.783 |
. | +2.684 |
a | +2.654 |
Neg logit contributions | |
lor | -6.221 |
umm | -6.049 |
arians | -6.000 |
rol | -5.998 |
osity | -5.895 |
Token | the |
Token ID | 262 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.130 |
, | +4.034 |
. | +3.971 |
the | +3.922 |
a | +3.776 |
Neg logit contributions | |
lor | -4.903 |
rol | -4.712 |
arians | -4.702 |
umm | -4.691 |
osity | -4.686 |
Token | care |
Token ID | 1337 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.466 |
, | +4.350 |
the | +4.333 |
. | +4.198 |
a | +4.109 |
Neg logit contributions | |
lor | -4.706 |
arians | -4.620 |
umm | -4.586 |
rol | -4.530 |
ocol | -4.386 |
Token | it |
Token ID | 340 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.614 |
the | +5.483 |
, | +5.462 |
a | +5.326 |
. | +5.317 |
Neg logit contributions | |
lor | -3.532 |
rol | -3.404 |
umm | -3.320 |
arians | -3.303 |
osity | -3.301 |
Token | provided |
Token ID | 2810 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.555 |
, | +3.469 |
the | +3.421 |
. | +3.287 |
a | +3.253 |
Neg logit contributions | |
lor | -5.579 |
arians | -5.351 |
rol | -5.330 |
umm | -5.256 |
beh | -5.216 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.813 |
, | +2.706 |
the | +2.685 |
a | +2.500 |
. | +2.483 |
Neg logit contributions | |
lor | -6.246 |
rol | -6.060 |
umm | -6.001 |
arians | -5.994 |
isher | -5.925 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.233 |
the | +3.114 |
, | +3.103 |
. | +2.985 |
a | +2.950 |
Neg logit contributions | |
lor | -6.009 |
umm | -5.789 |
rol | -5.766 |
arians | -5.718 |
osity | -5.671 |
Token | Once |
Token ID | 7454 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.821 |
the | +1.698 |
, | +1.684 |
a | +1.524 |
. | +1.491 |
Neg logit contributions | |
lor | -7.320 |
rol | -7.035 |
arians | -6.936 |
umm | -6.928 |
ides | -6.835 |
Token | upon |
Token ID | 2402 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.256 |
the | +4.131 |
, | +4.073 |
a | +3.994 |
. | +3.990 |
Neg logit contributions | |
lor | -4.835 |
rol | -4.654 |
umm | -4.619 |
arians | -4.607 |
osity | -4.552 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.450 |
, | +0.386 |
the | +0.328 |
. | +0.184 |
a | +0.015 |
Neg logit contributions | |
lor | -8.601 |
rol | -8.343 |
arians | -8.293 |
umm | -8.265 |
ides | -8.238 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.471 |
the | +2.437 |
, | +2.341 |
. | +2.240 |
a | +2.216 |
Neg logit contributions | |
lor | -6.649 |
umm | -6.447 |
arians | -6.427 |
rol | -6.406 |
ides | -6.361 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.238 |
the | +0.150 |
, | +0.013 |
. | +0.004 |
a | -0.038 |
Neg logit contributions | |
lor | -8.870 |
rol | -8.669 |
arians | -8.653 |
umm | -8.650 |
ocol | -8.575 |
Token | day |
Token ID | 1110 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.977 |
the | +2.918 |
, | +2.855 |
. | +2.773 |
a | +2.721 |
Neg logit contributions | |
lor | -5.894 |
umm | -5.861 |
rol | -5.751 |
bek | -5.689 |
osity | -5.688 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.137 |
the | +0.039 |
, | +0.006 |
. | -0.103 |
a | -0.145 |
Neg logit contributions | |
lor | -9.076 |
arians | -8.903 |
umm | -8.891 |
rol | -8.864 |
ides | -8.763 |
Token | she |
Token ID | 673 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.248 |
the | +2.091 |
, | +2.078 |
. | +2.008 |
a | +1.915 |
Neg logit contributions | |
lor | -6.796 |
arians | -6.660 |
umm | -6.660 |
rol | -6.625 |
ocol | -6.578 |
Token | saw |
Token ID | 2497 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.777 |
the | +2.749 |
, | +2.689 |
. | +2.618 |
a | +2.551 |
Neg logit contributions | |
lor | -6.276 |
rol | -6.063 |
arians | -6.055 |
umm | -6.049 |
isher | -5.949 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.806 |
, | +0.670 |
the | +0.610 |
. | +0.574 |
a | +0.383 |
Neg logit contributions | |
lor | -8.326 |
rol | -8.121 |
umm | -8.085 |
arians | -8.060 |
ocol | -8.007 |
Token | cherry |
Token ID | 23612 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.620 |
the | +3.545 |
, | +3.463 |
. | +3.422 |
a | +3.339 |
Neg logit contributions | |
lor | -5.484 |
umm | -5.341 |
arians | -5.309 |
bek | -5.211 |
rol | -5.197 |
Token | tree |
Token ID | 5509 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.070 |
the | +3.010 |
, | +2.947 |
a | +2.847 |
. | +2.836 |
Neg logit contributions | |
lor | -6.028 |
umm | -5.900 |
arians | -5.837 |
rol | -5.811 |
ocol | -5.711 |
Token | with |
Token ID | 351 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.036 |
the | +1.989 |
, | +1.922 |
a | +1.810 |
. | +1.796 |
Neg logit contributions | |
lor | -7.045 |
umm | -6.863 |
rol | -6.851 |
arians | -6.845 |
osity | -6.731 |
Token | lots |
Token ID | 6041 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.910 |
, | +2.803 |
the | +2.738 |
. | +2.676 |
a | +2.506 |
Neg logit contributions | |
lor | -6.210 |
umm | -6.098 |
rol | -6.086 |
arians | -5.990 |
ocol | -5.979 |
Token | of |
Token ID | 286 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.222 |
the | +2.190 |
, | +2.117 |
a | +2.022 |
. | +1.993 |
Neg logit contributions | |
lor | -6.833 |
umm | -6.748 |
rol | -6.685 |
ocol | -6.641 |
arians | -6.636 |
Token | cher |
Token ID | 21382 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.239 |
the | +5.132 |
, | +5.114 |
. | +5.000 |
a | +4.947 |
Neg logit contributions | |
lor | -3.860 |
umm | -3.748 |
rol | -3.714 |
arians | -3.700 |
ocol | -3.636 |
Token | animals |
Token ID | 4695 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.072 |
, | +3.964 |
the | +3.948 |
. | +3.883 |
a | +3.766 |
Neg logit contributions | |
arians | -5.078 |
lor | -4.942 |
umm | -4.905 |
icians | -4.842 |
ocol | -4.825 |
Token | were |
Token ID | 547 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.687 |
the | +3.630 |
, | +3.567 |
. | +3.509 |
a | +3.506 |
Neg logit contributions | |
lor | -5.285 |
arians | -5.185 |
rol | -5.170 |
ides | -5.052 |
osity | -5.043 |
Token | very |
Token ID | 845 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.689 |
, | +3.573 |
the | +3.540 |
. | +3.477 |
a | +3.336 |
Neg logit contributions | |
lor | -5.277 |
rol | -5.230 |
arians | -5.219 |
beh | -5.071 |
osity | -5.039 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.930 |
the | +3.803 |
, | +3.761 |
. | +3.673 |
a | +3.628 |
Neg logit contributions | |
rol | -4.989 |
arians | -4.982 |
lor | -4.978 |
beh | -4.964 |
umm | -4.956 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.788 |
and | +0.785 |
, | +0.661 |
a | +0.656 |
. | +0.569 |
Neg logit contributions | |
lor | -8.067 |
umm | -7.986 |
arians | -7.980 |
rol | -7.961 |
osity | -7.850 |
Token | kept |
Token ID | 4030 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.156 |
, | +3.979 |
the | +3.909 |
. | +3.884 |
a | +3.815 |
Neg logit contributions | |
lor | -4.845 |
arians | -4.812 |
rol | -4.812 |
osity | -4.696 |
beh | -4.691 |
Token | quiet |
Token ID | 5897 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.270 |
, | +4.156 |
the | +4.079 |
. | +4.024 |
a | +3.927 |
Neg logit contributions | |
lor | -4.782 |
arians | -4.670 |
rol | -4.638 |
ocol | -4.587 |
beh | -4.567 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +2.025 |
and | +2.007 |
, | +1.873 |
a | +1.840 |
. | +1.729 |
Neg logit contributions | |
lor | -6.960 |
umm | -6.873 |
arians | -6.843 |
rol | -6.786 |
ides | -6.693 |
Token |
|
Token ID | 198 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.308 |
, | +4.206 |
the | +4.184 |
. | +4.061 |
a | +4.014 |
Neg logit contributions | |
lor | -4.888 |
arians | -4.791 |
umm | -4.712 |
rol | -4.698 |
ides | -4.585 |
Token |
|
Token ID | 198 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.649 |
, | +1.547 |
the | +1.522 |
. | +1.406 |
a | +1.357 |
Neg logit contributions | |
lor | -7.581 |
arians | -7.311 |
rol | -7.309 |
ides | -7.200 |
umm | -7.165 |
Token | Then |
Token ID | 6423 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.207 |
, | +5.111 |
the | +5.089 |
. | +4.991 |
a | +4.907 |
Neg logit contributions | |
lor | -4.099 |
arians | -3.899 |
rol | -3.842 |
umm | -3.805 |
bek | -3.740 |
Token | roared |
Token ID | 45615 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +3.640 |
and | +3.616 |
, | +3.528 |
. | +3.502 |
a | +3.483 |
Neg logit contributions | |
lor | -5.390 |
arians | -5.260 |
rol | -5.080 |
umm | -5.054 |
ides | -5.047 |
Token | again |
Token ID | 757 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +2.899 |
and | +2.877 |
, | +2.776 |
. | +2.734 |
a | +2.661 |
Neg logit contributions | |
lor | -5.890 |
arians | -5.798 |
rol | -5.783 |
osity | -5.666 |
ides | -5.663 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.887 |
and | +0.825 |
a | +0.759 |
, | +0.686 |
. | +0.648 |
Neg logit contributions | |
lor | -7.917 |
arians | -7.842 |
ides | -7.730 |
osity | -7.727 |
umm | -7.677 |
Token | this |
Token ID | 428 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.025 |
, | +2.996 |
the | +2.978 |
. | +2.938 |
a | +2.878 |
Neg logit contributions | |
lor | -5.807 |
arians | -5.777 |
rol | -5.706 |
osity | -5.642 |
umm | -5.623 |
Token | time |
Token ID | 640 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.745 |
the | +2.734 |
, | +2.638 |
a | +2.538 |
. | +2.531 |
Neg logit contributions | |
lor | -6.334 |
umm | -6.110 |
arians | -6.078 |
ides | -6.042 |
rol | -6.020 |
Token | louder |
Token ID | 27089 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.862 |
the | +1.705 |
, | +1.665 |
. | +1.623 |
a | +1.563 |
Neg logit contributions | |
lor | -7.069 |
arians | -6.978 |
rol | -6.900 |
umm | -6.853 |
osity | -6.837 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.316 |
the | +2.291 |
, | +2.172 |
a | +2.144 |
. | +2.089 |
Neg logit contributions | |
lor | -6.668 |
arians | -6.530 |
umm | -6.505 |
ocol | -6.432 |
ides | -6.422 |
Token | more |
Token ID | 517 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.104 |
, | +3.916 |
. | +3.880 |
the | +3.767 |
a | +3.680 |
Neg logit contributions | |
lor | -4.921 |
arians | -4.891 |
umm | -4.820 |
rol | -4.797 |
bek | -4.768 |
Token | fiercely |
Token ID | 33285 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.920 |
the | +4.801 |
, | +4.785 |
a | +4.664 |
. | +4.613 |
Neg logit contributions | |
arians | -4.062 |
ocol | -4.042 |
umm | -4.006 |
lor | -3.965 |
osity | -3.862 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.391 |
the | +4.290 |
, | +4.226 |
a | +4.152 |
. | +4.111 |
Neg logit contributions | |
lor | -4.616 |
arians | -4.544 |
umm | -4.479 |
rol | -4.417 |
ocol | -4.408 |
Token | He |
Token ID | 679 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.107 |
, | +4.024 |
the | +3.982 |
. | +3.867 |
a | +3.762 |
Neg logit contributions | |
lor | -5.080 |
umm | -4.998 |
arians | -4.975 |
rol | -4.910 |
osity | -4.835 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.709 |
and | +1.613 |
, | +1.521 |
a | +1.481 |
. | +1.438 |
Neg logit contributions | |
lor | -7.177 |
rol | -7.123 |
arians | -7.105 |
osity | -7.048 |
ides | -7.017 |
Token | they |
Token ID | 484 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.806 |
the | +3.616 |
, | +3.592 |
. | +3.546 |
a | +3.495 |
Neg logit contributions | |
lor | -5.227 |
arians | -5.172 |
rol | -5.101 |
osity | -5.002 |
bek | -4.955 |
Token | were |
Token ID | 547 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.533 |
the | +3.409 |
, | +3.366 |
. | +3.278 |
a | +3.240 |
Neg logit contributions | |
lor | -5.546 |
arians | -5.471 |
rol | -5.471 |
ides | -5.315 |
umm | -5.310 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.120 |
, | +3.970 |
the | +3.954 |
. | +3.844 |
a | +3.743 |
Neg logit contributions | |
rol | -4.917 |
lor | -4.913 |
arians | -4.913 |
beh | -4.696 |
icians | -4.692 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.131 |
the | +1.080 |
, | +0.982 |
a | +0.936 |
. | +0.830 |
Neg logit contributions | |
lor | -7.773 |
umm | -7.717 |
arians | -7.702 |
rol | -7.699 |
osity | -7.596 |
Token | They |
Token ID | 1119 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.151 |
the | +3.029 |
, | +3.018 |
. | +2.925 |
a | +2.861 |
Neg logit contributions | |
lor | -5.996 |
arians | -5.898 |
rol | -5.791 |
umm | -5.767 |
osity | -5.666 |
Token | tried |
Token ID | 3088 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.779 |
the | +3.655 |
, | +3.640 |
. | +3.552 |
a | +3.486 |
Neg logit contributions | |
lor | -5.262 |
arians | -5.213 |
rol | -5.168 |
ides | -5.046 |
bek | -5.045 |
Token | to |
Token ID | 284 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.545 |
the | +1.467 |
, | +1.433 |
. | +1.396 |
a | +1.295 |
Neg logit contributions | |
lor | -7.363 |
arians | -7.263 |
rol | -7.165 |
osity | -7.146 |
bek | -7.071 |
Token | think |
Token ID | 892 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.319 |
, | +4.223 |
the | +4.183 |
. | +4.100 |
a | +3.995 |
Neg logit contributions | |
arians | -4.727 |
lor | -4.680 |
ides | -4.483 |
rol | -4.438 |
umm | -4.435 |
Token | of |
Token ID | 286 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.533 |
the | +2.492 |
, | +2.410 |
a | +2.351 |
. | +2.343 |
Neg logit contributions | |
lor | -6.344 |
arians | -6.206 |
rol | -6.156 |
ocol | -6.138 |
ides | -6.125 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.799 |
, | +2.655 |
. | +2.528 |
the | +2.510 |
a | +2.255 |
Neg logit contributions | |
lor | -6.339 |
arians | -6.238 |
umm | -6.026 |
icians | -5.983 |
ocol | -5.973 |
Token |
|
Token ID | 198 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.615 |
the | +1.528 |
, | +1.517 |
. | +1.382 |
a | +1.345 |
Neg logit contributions | |
lor | -7.626 |
arians | -7.359 |
rol | -7.330 |
ides | -7.225 |
umm | -7.168 |
Token | The |
Token ID | 464 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.710 |
, | +4.610 |
the | +4.608 |
. | +4.499 |
a | +4.413 |
Neg logit contributions | |
lor | -4.572 |
arians | -4.406 |
rol | -4.321 |
umm | -4.269 |
bek | -4.229 |
Token | monkey |
Token ID | 21657 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.884 |
, | +4.742 |
the | +4.711 |
. | +4.633 |
a | +4.480 |
Neg logit contributions | |
arians | -4.311 |
lor | -4.205 |
umm | -4.192 |
ocol | -4.046 |
Majesty | -4.028 |
Token | decided |
Token ID | 3066 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +3.510 |
and | +3.484 |
, | +3.391 |
. | +3.371 |
a | +3.327 |
Neg logit contributions | |
lor | -5.526 |
arians | -5.402 |
rol | -5.260 |
ides | -5.207 |
umm | -5.190 |
Token | to |
Token ID | 284 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.279 |
the | +1.185 |
, | +1.145 |
. | +1.063 |
a | +1.017 |
Neg logit contributions | |
lor | -7.843 |
arians | -7.656 |
rol | -7.556 |
umm | -7.523 |
osity | -7.521 |
Token | be |
Token ID | 307 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.204 |
the | +4.075 |
, | +4.043 |
. | +3.958 |
a | +3.894 |
Neg logit contributions | |
lor | -4.944 |
arians | -4.821 |
umm | -4.677 |
ides | -4.662 |
rol | -4.646 |
Token | brave |
Token ID | 14802 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.609 |
, | +3.428 |
the | +3.361 |
. | +3.300 |
a | +3.104 |
Neg logit contributions | |
lor | -5.521 |
arians | -5.382 |
rol | -5.338 |
beh | -5.310 |
icians | -5.272 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.255 |
and | +1.243 |
, | +1.136 |
a | +1.075 |
. | +1.022 |
Neg logit contributions | |
lor | -7.705 |
arians | -7.625 |
umm | -7.552 |
rol | -7.497 |
isher | -7.429 |
Token | gave |
Token ID | 2921 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.041 |
, | +3.887 |
. | +3.800 |
the | +3.792 |
a | +3.583 |
Neg logit contributions | |
lor | -4.990 |
arians | -4.943 |
bek | -4.875 |
beh | -4.854 |
osity | -4.806 |
Token | the |
Token ID | 262 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.397 |
, | +2.256 |
. | +2.110 |
the | +2.055 |
a | +1.953 |
Neg logit contributions | |
lor | -6.783 |
rol | -6.637 |
arians | -6.600 |
isher | -6.559 |
umm | -6.510 |
Token | mighty |
Token ID | 18680 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.940 |
the | +4.825 |
, | +4.799 |
. | +4.671 |
a | +4.518 |
Neg logit contributions | |
lor | -4.249 |
arians | -4.224 |
umm | -4.068 |
ides | -3.952 |
ocol | -3.940 |
Token | heard |
Token ID | 2982 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.679 |
, | +3.618 |
the | +3.601 |
. | +3.505 |
a | +3.412 |
Neg logit contributions | |
lor | -5.401 |
arians | -5.216 |
rol | -5.124 |
ides | -5.039 |
bek | -5.035 |
Token | the |
Token ID | 262 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.246 |
, | +2.166 |
. | +2.014 |
the | +1.978 |
a | +1.760 |
Neg logit contributions | |
lor | -6.759 |
rol | -6.612 |
ocol | -6.544 |
umm | -6.527 |
arians | -6.511 |
Token | sound |
Token ID | 2128 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.225 |
the | +4.164 |
, | +4.153 |
. | +3.958 |
a | +3.921 |
Neg logit contributions | |
lor | -4.872 |
umm | -4.751 |
arians | -4.731 |
rol | -4.658 |
ocol | -4.611 |
Token | again |
Token ID | 757 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.041 |
and | +1.007 |
, | +0.948 |
a | +0.916 |
. | +0.800 |
Neg logit contributions | |
lor | -7.716 |
rol | -7.581 |
arians | -7.518 |
umm | -7.509 |
ides | -7.490 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.452 |
and | +0.361 |
a | +0.359 |
, | +0.267 |
. | +0.074 |
Neg logit contributions | |
lor | -8.264 |
ides | -8.142 |
ocol | -8.138 |
arians | -8.137 |
umm | -8.086 |
Token | It |
Token ID | 632 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.388 |
, | +3.273 |
the | +3.244 |
. | +3.124 |
a | +3.010 |
Neg logit contributions | |
lor | -5.795 |
umm | -5.582 |
arians | -5.536 |
rol | -5.500 |
osity | -5.471 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.554 |
, | +3.458 |
the | +3.428 |
. | +3.330 |
a | +3.242 |
Neg logit contributions | |
lor | -5.526 |
rol | -5.332 |
arians | -5.300 |
umm | -5.269 |
ides | -5.158 |
Token | coming |
Token ID | 2406 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.682 |
, | +2.578 |
the | +2.407 |
. | +2.377 |
a | +2.186 |
Neg logit contributions | |
ocol | -6.143 |
lor | -6.141 |
rol | -6.102 |
umm | -6.031 |
arians | -6.017 |
Token | from |
Token ID | 422 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.280 |
the | +2.239 |
, | +2.183 |
a | +2.032 |
. | +2.032 |
Neg logit contributions | |
lor | -6.652 |
rol | -6.575 |
umm | -6.566 |
arians | -6.513 |
ides | -6.420 |
Token | his |
Token ID | 465 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.546 |
, | +2.479 |
the | +2.333 |
. | +2.268 |
a | +2.166 |
Neg logit contributions | |
lor | -6.320 |
ocol | -6.259 |
arians | -6.236 |
umm | -6.201 |
isher | -6.170 |
Token | closet |
Token ID | 21615 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.344 |
the | +4.311 |
, | +4.198 |
a | +4.079 |
. | +4.065 |
Neg logit contributions | |
lor | -4.701 |
arians | -4.631 |
umm | -4.589 |
ocol | -4.435 |
rol | -4.411 |
Token | table |
Token ID | 3084 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.877 |
the | +3.825 |
, | +3.797 |
. | +3.738 |
a | +3.664 |
Neg logit contributions | |
lor | -5.072 |
arians | -4.996 |
umm | -4.929 |
rol | -4.873 |
osity | -4.853 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +2.418 |
and | +2.400 |
, | +2.267 |
a | +2.210 |
. | +2.162 |
Neg logit contributions | |
lor | -6.640 |
umm | -6.442 |
arians | -6.439 |
rol | -6.383 |
ides | -6.305 |
Token | The |
Token ID | 383 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.238 |
, | +3.084 |
the | +3.069 |
. | +2.977 |
a | +2.929 |
Neg logit contributions | |
lor | -5.794 |
arians | -5.628 |
rol | -5.581 |
ocol | -5.555 |
umm | -5.545 |
Token | table |
Token ID | 3084 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.448 |
the | +4.340 |
, | +4.332 |
. | +4.194 |
a | +4.133 |
Neg logit contributions | |
lor | -4.612 |
umm | -4.527 |
arians | -4.524 |
ocol | -4.451 |
isher | -4.411 |
Token | did |
Token ID | 750 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.991 |
the | +3.975 |
, | +3.864 |
a | +3.772 |
. | +3.769 |
Neg logit contributions | |
lor | -5.076 |
rol | -4.849 |
arians | -4.843 |
umm | -4.838 |
ides | -4.770 |
Token | not |
Token ID | 407 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.502 |
the | +2.409 |
, | +2.348 |
. | +2.230 |
a | +2.200 |
Neg logit contributions | |
lor | -6.549 |
arians | -6.345 |
ides | -6.288 |
rol | -6.270 |
umm | -6.241 |
Token | say |
Token ID | 910 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.025 |
the | +3.967 |
, | +3.894 |
. | +3.755 |
a | +3.746 |
Neg logit contributions | |
lor | -4.921 |
ides | -4.875 |
arians | -4.843 |
umm | -4.828 |
ocol | -4.797 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.523 |
the | +4.299 |
, | +4.230 |
. | +4.156 |
a | +4.102 |
Neg logit contributions | |
lor | -4.699 |
arians | -4.379 |
ocol | -4.348 |
osity | -4.330 |
rol | -4.326 |
Token | either |
Token ID | 2035 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.034 |
the | +2.004 |
, | +1.888 |
a | +1.854 |
. | +1.729 |
Neg logit contributions | |
lor | -6.922 |
arians | -6.773 |
rol | -6.700 |
umm | -6.662 |
ides | -6.642 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.020 |
and | +0.995 |
a | +0.863 |
, | +0.827 |
. | +0.678 |
Neg logit contributions | |
lor | -7.927 |
ides | -7.706 |
arians | -7.688 |
rol | -7.687 |
umm | -7.677 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.143 |
, | +3.028 |
the | +2.994 |
. | +2.860 |
a | +2.802 |
Neg logit contributions | |
lor | -6.068 |
arians | -5.816 |
rol | -5.790 |
umm | -5.758 |
osity | -5.698 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.607 |
and | +0.539 |
, | +0.475 |
a | +0.421 |
. | +0.330 |
Neg logit contributions | |
lor | -8.418 |
arians | -8.222 |
rol | -8.187 |
ides | -8.163 |
umm | -8.088 |
Token | said |
Token ID | 531 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.659 |
, | +3.541 |
. | +3.458 |
the | +3.412 |
a | +3.277 |
Neg logit contributions | |
lor | -5.277 |
arians | -5.194 |
umm | -5.123 |
bek | -5.119 |
ocol | -5.099 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.020 |
the | +0.900 |
, | +0.815 |
. | +0.758 |
a | +0.723 |
Neg logit contributions | |
lor | -8.166 |
arians | -7.944 |
rol | -7.934 |
umm | -7.926 |
ocol | -7.868 |
Token | " |
Token ID | 366 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.302 |
the | +2.231 |
, | +2.174 |
. | +2.087 |
a | +2.080 |
Neg logit contributions | |
lor | -6.700 |
arians | -6.545 |
osity | -6.473 |
rol | -6.437 |
umm | -6.405 |
Token | I |
Token ID | 40 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.982 |
the | +5.873 |
, | +5.856 |
. | +5.740 |
a | +5.690 |
Neg logit contributions | |
lor | -3.274 |
arians | -3.090 |
umm | -3.083 |
rol | -3.057 |
ocol | -2.954 |
Token | will |
Token ID | 481 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.513 |
the | +4.463 |
, | +4.347 |
. | +4.287 |
a | +4.235 |
Neg logit contributions | |
lor | -4.625 |
rol | -4.437 |
arians | -4.406 |
umm | -4.356 |
ides | -4.350 |
Token | scare |
Token ID | 19437 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.803 |
the | +3.693 |
, | +3.606 |
. | +3.505 |
a | +3.486 |
Neg logit contributions | |
lor | -5.307 |
arians | -5.177 |
ides | -5.036 |
rol | -5.020 |
umm | -4.983 |
Token | you |
Token ID | 345 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.132 |
, | +2.992 |
the | +2.922 |
. | +2.877 |
a | +2.808 |
Neg logit contributions | |
lor | -5.956 |
arians | -5.788 |
rol | -5.771 |
umm | -5.733 |
ocol | -5.708 |
Token | every |
Token ID | 790 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +2.926 |
and | +2.925 |
, | +2.778 |
a | +2.701 |
. | +2.649 |
Neg logit contributions | |
lor | -6.136 |
rol | -5.938 |
arians | -5.918 |
ides | -5.821 |
umm | -5.788 |
Token | night |
Token ID | 1755 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.592 |
the | +3.509 |
, | +3.439 |
. | +3.314 |
a | +3.283 |
Neg logit contributions | |
lor | -5.548 |
umm | -5.320 |
rol | -5.284 |
arians | -5.265 |
ides | -5.197 |
Token | !" |
Token ID | 2474 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +2.334 |
and | +2.328 |
, | +2.171 |
a | +2.160 |
. | +1.997 |
Neg logit contributions | |
lor | -6.716 |
arians | -6.531 |
umm | -6.528 |
ides | -6.440 |
rol | -6.408 |
Token | day |
Token ID | 1110 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.889 |
the | +2.811 |
, | +2.707 |
. | +2.671 |
a | +2.644 |
Neg logit contributions | |
lor | -6.186 |
umm | -5.956 |
arians | -5.909 |
rol | -5.872 |
ides | -5.840 |
Token | on |
Token ID | 319 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.931 |
the | +1.831 |
, | +1.757 |
. | +1.682 |
a | +1.656 |
Neg logit contributions | |
lor | -7.236 |
arians | -7.043 |
umm | -7.014 |
rol | -7.014 |
ides | -6.928 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.346 |
the | +0.205 |
. | +0.112 |
a | +0.108 |
, | +0.102 |
Neg logit contributions | |
lor | -8.769 |
arians | -8.563 |
umm | -8.519 |
rol | -8.435 |
ocol | -8.409 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.713 |
, | +2.559 |
. | +2.507 |
the | +2.427 |
a | +2.318 |
Neg logit contributions | |
arians | -6.135 |
lor | -6.092 |
umm | -6.079 |
rol | -5.991 |
osity | -5.968 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.074 |
the | +3.070 |
, | +2.984 |
. | +2.937 |
a | +2.905 |
Neg logit contributions | |
lor | -5.959 |
arians | -5.776 |
rol | -5.679 |
umm | -5.601 |
osity | -5.593 |
Token | always |
Token ID | 1464 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.340 |
, | +3.188 |
the | +3.077 |
. | +3.068 |
a | +2.852 |
Neg logit contributions | |
lor | -5.821 |
rol | -5.614 |
arians | -5.593 |
beh | -5.518 |
icians | -5.510 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.759 |
, | +3.603 |
the | +3.534 |
. | +3.500 |
a | +3.296 |
Neg logit contributions | |
lor | -5.178 |
beh | -5.084 |
rol | -5.065 |
arians | -5.033 |
icians | -4.967 |
Token | in |
Token ID | 287 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.594 |
the | +1.581 |
, | +1.493 |
a | +1.450 |
. | +1.377 |
Neg logit contributions | |
lor | -7.184 |
umm | -7.130 |
rol | -7.120 |
arians | -7.087 |
ocol | -7.026 |
Token | his |
Token ID | 465 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.582 |
, | +3.405 |
. | +3.251 |
the | +3.216 |
a | +3.092 |
Neg logit contributions | |
lor | -5.402 |
ocol | -5.355 |
arians | -5.234 |
umm | -5.179 |
rol | -5.139 |
Token | room |
Token ID | 2119 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.031 |
the | +4.928 |
, | +4.784 |
a | +4.729 |
. | +4.707 |
Neg logit contributions | |
lor | -4.002 |
umm | -3.924 |
arians | -3.852 |
ocol | -3.799 |
former | -3.794 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.470 |
and | +1.382 |
, | +1.272 |
a | +1.257 |
. | +1.109 |
Neg logit contributions | |
lor | -7.513 |
arians | -7.379 |
rol | -7.264 |
umm | -7.221 |
ides | -7.194 |
Token | not |
Token ID | 407 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.464 |
the | +2.317 |
, | +2.304 |
. | +2.181 |
a | +2.138 |
Neg logit contributions | |
lor | -6.621 |
arians | -6.475 |
umm | -6.359 |
rol | -6.353 |
ides | -6.342 |
Token | work |
Token ID | 670 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.486 |
the | +3.405 |
, | +3.343 |
a | +3.215 |
. | +3.211 |
Neg logit contributions | |
lor | -5.573 |
arians | -5.462 |
umm | -5.430 |
ides | -5.425 |
osity | -5.370 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.072 |
the | +2.006 |
, | +1.910 |
a | +1.838 |
. | +1.722 |
Neg logit contributions | |
lor | -6.889 |
arians | -6.741 |
rol | -6.706 |
ides | -6.688 |
umm | -6.686 |
Token | It |
Token ID | 632 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.549 |
, | +3.450 |
the | +3.420 |
. | +3.282 |
a | +3.212 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.518 |
arians | -5.407 |
rol | -5.384 |
osity | -5.282 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.107 |
, | +3.017 |
the | +3.003 |
. | +2.860 |
a | +2.804 |
Neg logit contributions | |
lor | -5.952 |
rol | -5.848 |
arians | -5.806 |
umm | -5.784 |
isher | -5.702 |
Token | still |
Token ID | 991 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.193 |
, | +3.061 |
the | +2.951 |
. | +2.918 |
a | +2.734 |
Neg logit contributions | |
rol | -5.649 |
ocol | -5.641 |
lor | -5.631 |
arians | -5.601 |
umm | -5.600 |
Token | broken |
Token ID | 5445 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.755 |
the | +3.631 |
, | +3.619 |
. | +3.468 |
a | +3.395 |
Neg logit contributions | |
lor | -5.145 |
umm | -5.103 |
ocol | -5.076 |
rol | -5.057 |
arians | -5.045 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.548 |
and | +0.488 |
, | +0.372 |
a | +0.354 |
. | +0.187 |
Neg logit contributions | |
lor | -8.251 |
arians | -8.220 |
umm | -8.206 |
rol | -8.094 |
ides | -8.072 |
Token | The |
Token ID | 383 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.241 |
, | +3.116 |
the | +3.090 |
. | +2.965 |
a | +2.904 |
Neg logit contributions | |
lor | -5.910 |
umm | -5.770 |
arians | -5.721 |
rol | -5.709 |
ocol | -5.571 |
Token | woman |
Token ID | 2415 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.420 |
, | +4.371 |
the | +4.369 |
. | +4.224 |
a | +4.156 |
Neg logit contributions | |
lor | -4.648 |
arians | -4.574 |
umm | -4.543 |
isher | -4.475 |
ocol | -4.420 |
Token | cried |
Token ID | 16896 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.988 |
the | +2.972 |
, | +2.904 |
. | +2.818 |
a | +2.815 |
Neg logit contributions | |
lor | -6.003 |
arians | -5.901 |
rol | -5.812 |
isher | -5.753 |
umm | -5.742 |
Token | toy |
Token ID | 13373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.709 |
, | +3.650 |
the | +3.648 |
. | +3.494 |
a | +3.404 |
Neg logit contributions | |
lor | -5.342 |
arians | -5.267 |
umm | -5.256 |
isher | -5.212 |
ocol | -5.110 |
Token | did |
Token ID | 750 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.581 |
the | +3.538 |
, | +3.468 |
. | +3.378 |
a | +3.348 |
Neg logit contributions | |
lor | -5.520 |
arians | -5.392 |
umm | -5.279 |
rol | -5.273 |
isher | -5.224 |
Token | not |
Token ID | 407 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.464 |
the | +2.317 |
, | +2.304 |
. | +2.181 |
a | +2.138 |
Neg logit contributions | |
lor | -6.621 |
arians | -6.475 |
umm | -6.359 |
rol | -6.353 |
ides | -6.342 |
Token | work |
Token ID | 670 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.486 |
the | +3.405 |
, | +3.343 |
a | +3.215 |
. | +3.211 |
Neg logit contributions | |
lor | -5.573 |
arians | -5.462 |
umm | -5.430 |
ides | -5.425 |
osity | -5.370 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.072 |
the | +2.006 |
, | +1.910 |
a | +1.838 |
. | +1.722 |
Neg logit contributions | |
lor | -6.889 |
arians | -6.741 |
rol | -6.706 |
ides | -6.688 |
umm | -6.686 |
Token | It |
Token ID | 632 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.549 |
, | +3.450 |
the | +3.420 |
. | +3.282 |
a | +3.212 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.518 |
arians | -5.407 |
rol | -5.384 |
osity | -5.282 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.107 |
, | +3.017 |
the | +3.003 |
. | +2.860 |
a | +2.804 |
Neg logit contributions | |
lor | -5.952 |
rol | -5.848 |
arians | -5.806 |
umm | -5.784 |
isher | -5.702 |
Token | still |
Token ID | 991 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.193 |
, | +3.061 |
the | +2.951 |
. | +2.918 |
a | +2.734 |
Neg logit contributions | |
rol | -5.649 |
ocol | -5.641 |
lor | -5.631 |
arians | -5.601 |
umm | -5.600 |
Token | broken |
Token ID | 5445 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.755 |
the | +3.631 |
, | +3.619 |
. | +3.468 |
a | +3.395 |
Neg logit contributions | |
lor | -5.145 |
umm | -5.103 |
ocol | -5.076 |
rol | -5.057 |
arians | -5.045 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.548 |
and | +0.488 |
, | +0.372 |
a | +0.354 |
. | +0.187 |
Neg logit contributions | |
lor | -8.251 |
arians | -8.220 |
umm | -8.206 |
rol | -8.094 |
ides | -8.072 |
Token | The |
Token ID | 383 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.241 |
, | +3.116 |
the | +3.090 |
. | +2.965 |
a | +2.904 |
Neg logit contributions | |
lor | -5.910 |
umm | -5.770 |
arians | -5.721 |
rol | -5.709 |
ocol | -5.571 |
Token | the |
Token ID | 262 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.222 |
, | +2.126 |
the | +2.061 |
. | +2.016 |
a | +1.915 |
Neg logit contributions | |
lor | -6.788 |
arians | -6.687 |
umm | -6.681 |
rol | -6.635 |
ocol | -6.634 |
Token | toy |
Token ID | 13373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.770 |
the | +4.694 |
, | +4.664 |
. | +4.533 |
a | +4.447 |
Neg logit contributions | |
lor | -4.318 |
umm | -4.262 |
arians | -4.181 |
rol | -4.140 |
isher | -4.113 |
Token | very |
Token ID | 845 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.302 |
the | +3.295 |
, | +3.176 |
a | +3.101 |
. | +3.054 |
Neg logit contributions | |
lor | -5.663 |
arians | -5.609 |
rol | -5.494 |
umm | -5.489 |
isher | -5.385 |
Token | much |
Token ID | 881 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.025 |
the | +2.942 |
, | +2.863 |
. | +2.722 |
a | +2.718 |
Neg logit contributions | |
lor | -6.117 |
umm | -5.939 |
rol | -5.931 |
arians | -5.916 |
ocol | -5.848 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.482 |
and | +0.410 |
a | +0.336 |
, | +0.300 |
. | +0.117 |
Neg logit contributions | |
lor | -8.327 |
arians | -8.274 |
umm | -8.239 |
rol | -8.105 |
isher | -8.068 |
Token | It |
Token ID | 632 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.569 |
, | +3.467 |
the | +3.443 |
. | +3.311 |
a | +3.274 |
Neg logit contributions | |
lor | -5.538 |
umm | -5.485 |
arians | -5.377 |
rol | -5.376 |
ocol | -5.347 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.106 |
the | +3.008 |
, | +3.007 |
. | +2.861 |
a | +2.822 |
Neg logit contributions | |
lor | -5.931 |
rol | -5.813 |
arians | -5.796 |
umm | -5.688 |
isher | -5.629 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.783 |
, | +2.638 |
. | +2.549 |
the | +2.545 |
a | +2.299 |
Neg logit contributions | |
lor | -6.057 |
rol | -6.055 |
ocol | -6.050 |
arians | -5.929 |
umm | -5.912 |
Token | red |
Token ID | 2266 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.465 |
the | +3.390 |
, | +3.296 |
. | +3.235 |
a | +3.154 |
Neg logit contributions | |
lor | -5.566 |
umm | -5.499 |
arians | -5.411 |
bek | -5.406 |
ocol | -5.331 |
Token | car |
Token ID | 1097 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.226 |
the | +4.198 |
, | +4.093 |
. | +4.001 |
a | +3.986 |
Neg logit contributions | |
lor | -4.860 |
umm | -4.716 |
arians | -4.697 |
rol | -4.647 |
ocol | -4.593 |
Token | that |
Token ID | 326 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.404 |
and | +1.401 |
, | +1.267 |
a | +1.203 |
. | +1.121 |
Neg logit contributions | |
lor | -7.565 |
arians | -7.479 |
rol | -7.378 |
umm | -7.341 |
ides | -7.259 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.930 |
the | +1.907 |
, | +1.797 |
a | +1.737 |
. | +1.655 |
Neg logit contributions | |
lor | -6.983 |
rol | -6.886 |
arians | -6.808 |
ides | -6.778 |
osity | -6.754 |
Token | But |
Token ID | 887 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.529 |
the | +3.437 |
, | +3.435 |
. | +3.304 |
a | +3.255 |
Neg logit contributions | |
umm | -5.484 |
lor | -5.454 |
arians | -5.432 |
rol | -5.333 |
osity | -5.303 |
Token | the |
Token ID | 262 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.830 |
. | +1.667 |
, | +1.617 |
the | +1.568 |
a | +1.513 |
Neg logit contributions | |
lor | -6.998 |
arians | -6.984 |
ocol | -6.955 |
umm | -6.919 |
rol | -6.899 |
Token | toy |
Token ID | 13373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.709 |
, | +3.650 |
the | +3.648 |
. | +3.494 |
a | +3.404 |
Neg logit contributions | |
lor | -5.342 |
arians | -5.267 |
umm | -5.256 |
isher | -5.212 |
ocol | -5.110 |
Token | did |
Token ID | 750 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.581 |
the | +3.538 |
, | +3.468 |
. | +3.378 |
a | +3.348 |
Neg logit contributions | |
lor | -5.520 |
arians | -5.392 |
umm | -5.279 |
rol | -5.273 |
isher | -5.224 |
Token | not |
Token ID | 407 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.464 |
the | +2.317 |
, | +2.304 |
. | +2.181 |
a | +2.138 |
Neg logit contributions | |
lor | -6.621 |
arians | -6.475 |
umm | -6.359 |
rol | -6.353 |
ides | -6.342 |
Token | work |
Token ID | 670 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.486 |
the | +3.405 |
, | +3.343 |
a | +3.215 |
. | +3.211 |
Neg logit contributions | |
lor | -5.573 |
arians | -5.462 |
umm | -5.430 |
ides | -5.425 |
osity | -5.370 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.072 |
the | +2.006 |
, | +1.910 |
a | +1.838 |
. | +1.722 |
Neg logit contributions | |
lor | -6.889 |
arians | -6.741 |
rol | -6.706 |
ides | -6.688 |
umm | -6.686 |
Token | It |
Token ID | 632 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.549 |
, | +3.450 |
the | +3.420 |
. | +3.282 |
a | +3.212 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.518 |
arians | -5.407 |
rol | -5.384 |
osity | -5.282 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.107 |
, | +3.017 |
the | +3.003 |
. | +2.860 |
a | +2.804 |
Neg logit contributions | |
lor | -5.952 |
rol | -5.848 |
arians | -5.806 |
umm | -5.784 |
isher | -5.702 |
Token | still |
Token ID | 991 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.193 |
, | +3.061 |
the | +2.951 |
. | +2.918 |
a | +2.734 |
Neg logit contributions | |
rol | -5.649 |
ocol | -5.641 |
lor | -5.631 |
arians | -5.601 |
umm | -5.600 |
Token | toy |
Token ID | 13373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.595 |
the | +4.544 |
, | +4.464 |
. | +4.337 |
a | +4.278 |
Neg logit contributions | |
lor | -4.536 |
arians | -4.427 |
umm | -4.426 |
ocol | -4.307 |
isher | -4.307 |
Token | is |
Token ID | 318 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.276 |
the | +3.195 |
, | +3.140 |
. | +3.036 |
a | +3.006 |
Neg logit contributions | |
lor | -5.891 |
arians | -5.729 |
umm | -5.690 |
rol | -5.661 |
ides | -5.572 |
Token | broken |
Token ID | 5445 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.766 |
, | +3.596 |
the | +3.578 |
. | +3.480 |
a | +3.361 |
Neg logit contributions | |
lor | -5.229 |
arians | -5.120 |
umm | -5.070 |
rol | -5.067 |
ocol | -5.067 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.888 |
and | +0.843 |
, | +0.710 |
a | +0.669 |
. | +0.557 |
Neg logit contributions | |
lor | -7.986 |
arians | -7.897 |
umm | -7.862 |
rol | -7.777 |
isher | -7.760 |
Token | I |
Token ID | 314 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.898 |
the | +4.778 |
, | +4.769 |
. | +4.664 |
a | +4.580 |
Neg logit contributions | |
lor | -4.333 |
arians | -4.181 |
umm | -4.165 |
rol | -4.095 |
osity | -4.090 |
Token | can |
Token ID | 460 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.919 |
the | +3.878 |
, | +3.804 |
. | +3.691 |
a | +3.666 |
Neg logit contributions | |
lor | -5.165 |
arians | -5.001 |
rol | -4.990 |
umm | -4.936 |
ides | -4.920 |
Token | 't |
Token ID | 470 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.042 |
the | +3.950 |
, | +3.906 |
. | +3.797 |
a | +3.762 |
Neg logit contributions | |
lor | -5.115 |
arians | -4.973 |
umm | -4.907 |
rol | -4.882 |
ides | -4.827 |
Token | fix |
Token ID | 4259 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.958 |
the | +3.896 |
, | +3.832 |
a | +3.706 |
. | +3.695 |
Neg logit contributions | |
lor | -5.150 |
arians | -5.022 |
umm | -4.971 |
ides | -4.924 |
rol | -4.912 |
Token | it |
Token ID | 340 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.638 |
, | +1.472 |
the | +1.375 |
. | +1.322 |
a | +1.274 |
Neg logit contributions | |
lor | -7.426 |
arians | -7.283 |
ocol | -7.233 |
umm | -7.184 |
rol | -7.136 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +2.448 |
and | +2.418 |
, | +2.260 |
a | +2.247 |
. | +2.035 |
Neg logit contributions | |
lor | -6.476 |
arians | -6.379 |
rol | -6.322 |
umm | -6.311 |
ides | -6.302 |
Token | I |
Token ID | 314 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.978 |
the | +4.893 |
, | +4.870 |
. | +4.752 |
a | +4.665 |
Neg logit contributions | |
lor | -4.225 |
arians | -4.115 |
umm | -4.087 |
rol | -3.993 |
osity | -3.989 |
Token | said |
Token ID | 531 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.362 |
the | +3.337 |
, | +3.264 |
. | +3.197 |
a | +3.168 |
Neg logit contributions | |
lor | -5.674 |
arians | -5.508 |
rol | -5.430 |
umm | -5.381 |
isher | -5.359 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.343 |
the | +0.231 |
, | +0.156 |
. | +0.088 |
a | +0.053 |
Neg logit contributions | |
lor | -8.837 |
arians | -8.659 |
umm | -8.637 |
rol | -8.619 |
ocol | -8.544 |
Token | " |
Token ID | 366 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.308 |
the | +2.215 |
, | +2.164 |
. | +2.081 |
a | +2.049 |
Neg logit contributions | |
lor | -6.702 |
arians | -6.582 |
osity | -6.463 |
rol | -6.445 |
umm | -6.436 |
Token | My |
Token ID | 3666 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.682 |
the | +4.578 |
, | +4.578 |
. | +4.447 |
a | +4.394 |
Neg logit contributions | |
lor | -4.590 |
arians | -4.403 |
umm | -4.376 |
rol | -4.357 |
osity | -4.255 |
Token | toy |
Token ID | 13373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.595 |
the | +4.544 |
, | +4.464 |
. | +4.337 |
a | +4.278 |
Neg logit contributions | |
lor | -4.536 |
arians | -4.427 |
umm | -4.426 |
ocol | -4.307 |
isher | -4.307 |
Token | is |
Token ID | 318 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.276 |
the | +3.195 |
, | +3.140 |
. | +3.036 |
a | +3.006 |
Neg logit contributions | |
lor | -5.891 |
arians | -5.729 |
umm | -5.690 |
rol | -5.661 |
ides | -5.572 |
Token | broken |
Token ID | 5445 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.766 |
, | +3.596 |
the | +3.578 |
. | +3.480 |
a | +3.361 |
Neg logit contributions | |
lor | -5.229 |
arians | -5.120 |
umm | -5.070 |
rol | -5.067 |
ocol | -5.067 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +0.888 |
and | +0.843 |
, | +0.710 |
a | +0.669 |
. | +0.557 |
Neg logit contributions | |
lor | -7.986 |
arians | -7.897 |
umm | -7.862 |
rol | -7.777 |
isher | -7.760 |
Token | I |
Token ID | 314 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.898 |
the | +4.778 |
, | +4.769 |
. | +4.664 |
a | +4.580 |
Neg logit contributions | |
lor | -4.333 |
arians | -4.181 |
umm | -4.165 |
rol | -4.095 |
osity | -4.090 |
Token | can |
Token ID | 460 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.919 |
the | +3.878 |
, | +3.804 |
. | +3.691 |
a | +3.666 |
Neg logit contributions | |
lor | -5.165 |
arians | -5.001 |
rol | -4.990 |
umm | -4.936 |
ides | -4.920 |
Token | 't |
Token ID | 470 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.042 |
the | +3.950 |
, | +3.906 |
. | +3.797 |
a | +3.762 |
Neg logit contributions | |
lor | -5.115 |
arians | -4.973 |
umm | -4.907 |
rol | -4.882 |
ides | -4.827 |
Token | 't |
Token ID | 470 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.057 |
the | +3.946 |
, | +3.915 |
. | +3.813 |
a | +3.774 |
Neg logit contributions | |
lor | -5.145 |
arians | -4.964 |
umm | -4.941 |
rol | -4.909 |
ides | -4.815 |
Token | cry |
Token ID | 3960 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.731 |
the | +4.634 |
, | +4.568 |
. | +4.464 |
a | +4.457 |
Neg logit contributions | |
lor | -4.417 |
umm | -4.283 |
arians | -4.283 |
rol | -4.198 |
ides | -4.169 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.111 |
the | +1.100 |
a | +0.926 |
, | +0.882 |
. | +0.800 |
Neg logit contributions | |
lor | -7.874 |
arians | -7.791 |
umm | -7.758 |
rol | -7.700 |
osity | -7.658 |
Token | woman |
Token ID | 2415 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.035 |
, | +3.925 |
the | +3.913 |
. | +3.862 |
a | +3.785 |
Neg logit contributions | |
lor | -5.095 |
arians | -4.937 |
umm | -4.908 |
ocol | -4.804 |
rol | -4.771 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.756 |
the | +0.685 |
, | +0.569 |
a | +0.527 |
. | +0.429 |
Neg logit contributions | |
lor | -8.331 |
arians | -8.196 |
rol | -8.096 |
umm | -8.090 |
osity | -8.040 |
Token | I |
Token ID | 314 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.544 |
the | +4.433 |
, | +4.396 |
. | +4.300 |
a | +4.244 |
Neg logit contributions | |
lor | -4.663 |
arians | -4.505 |
umm | -4.482 |
rol | -4.432 |
osity | -4.395 |
Token | have |
Token ID | 423 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.318 |
the | +4.286 |
, | +4.188 |
. | +4.087 |
a | +4.070 |
Neg logit contributions | |
lor | -4.815 |
arians | -4.652 |
rol | -4.617 |
umm | -4.594 |
ides | -4.547 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.734 |
, | +2.589 |
the | +2.582 |
. | +2.478 |
a | +2.376 |
Neg logit contributions | |
lor | -6.444 |
arians | -6.248 |
umm | -6.218 |
rol | -6.195 |
ocol | -6.151 |
Token | gift |
Token ID | 6979 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.237 |
the | +4.166 |
, | +4.063 |
. | +4.006 |
a | +3.917 |
Neg logit contributions | |
lor | -4.895 |
umm | -4.717 |
arians | -4.696 |
rol | -4.597 |
isher | -4.594 |
Token | for |
Token ID | 329 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.971 |
the | +1.938 |
, | +1.840 |
a | +1.724 |
. | +1.697 |
Neg logit contributions | |
lor | -7.103 |
arians | -6.941 |
rol | -6.911 |
umm | -6.871 |
ides | -6.767 |
Token | you |
Token ID | 345 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.463 |
, | +3.245 |
. | +3.134 |
the | +3.125 |
a | +2.973 |
Neg logit contributions | |
arians | -5.677 |
lor | -5.617 |
ocol | -5.606 |
umm | -5.468 |
icians | -5.416 |
Token | cry |
Token ID | 3960 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.731 |
the | +4.634 |
, | +4.568 |
. | +4.464 |
a | +4.457 |
Neg logit contributions | |
lor | -4.417 |
umm | -4.283 |
arians | -4.283 |
rol | -4.198 |
ides | -4.169 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.111 |
the | +1.100 |
a | +0.926 |
, | +0.882 |
. | +0.800 |
Neg logit contributions | |
lor | -7.874 |
arians | -7.791 |
umm | -7.758 |
rol | -7.700 |
osity | -7.658 |
Token | woman |
Token ID | 2415 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.035 |
, | +3.925 |
the | +3.913 |
. | +3.862 |
a | +3.785 |
Neg logit contributions | |
lor | -5.095 |
arians | -4.937 |
umm | -4.908 |
ocol | -4.804 |
rol | -4.771 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +0.756 |
the | +0.685 |
, | +0.569 |
a | +0.527 |
. | +0.429 |
Neg logit contributions | |
lor | -8.331 |
arians | -8.196 |
rol | -8.096 |
umm | -8.090 |
osity | -8.040 |
Token | I |
Token ID | 314 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.544 |
the | +4.433 |
, | +4.396 |
. | +4.300 |
a | +4.244 |
Neg logit contributions | |
lor | -4.663 |
arians | -4.505 |
umm | -4.482 |
rol | -4.432 |
osity | -4.395 |
Token | have |
Token ID | 423 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.318 |
the | +4.286 |
, | +4.188 |
. | +4.087 |
a | +4.070 |
Neg logit contributions | |
lor | -4.815 |
arians | -4.652 |
rol | -4.617 |
umm | -4.594 |
ides | -4.547 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.734 |
, | +2.589 |
the | +2.582 |
. | +2.478 |
a | +2.376 |
Neg logit contributions | |
lor | -6.444 |
arians | -6.248 |
umm | -6.218 |
rol | -6.195 |
ocol | -6.151 |
Token | gift |
Token ID | 6979 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.237 |
the | +4.166 |
, | +4.063 |
. | +4.006 |
a | +3.917 |
Neg logit contributions | |
lor | -4.895 |
umm | -4.717 |
arians | -4.696 |
rol | -4.597 |
isher | -4.594 |
Token | for |
Token ID | 329 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.971 |
the | +1.938 |
, | +1.840 |
a | +1.724 |
. | +1.697 |
Neg logit contributions | |
lor | -7.103 |
arians | -6.941 |
rol | -6.911 |
umm | -6.871 |
ides | -6.767 |
Token | you |
Token ID | 345 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.463 |
, | +3.245 |
. | +3.134 |
the | +3.125 |
a | +2.973 |
Neg logit contributions | |
arians | -5.677 |
lor | -5.617 |
ocol | -5.606 |
umm | -5.468 |
icians | -5.416 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.412 |
and | +1.350 |
, | +1.216 |
a | +1.158 |
. | +1.023 |
Neg logit contributions | |
lor | -7.535 |
arians | -7.446 |
ides | -7.379 |
rol | -7.331 |
osity | -7.294 |
Token | the |
Token ID | 262 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.497 |
, | +2.356 |
the | +2.303 |
. | +2.224 |
a | +2.214 |
Neg logit contributions | |
lor | -6.502 |
ocol | -6.376 |
arians | -6.372 |
rol | -6.354 |
isher | -6.281 |
Token | door |
Token ID | 3420 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.810 |
the | +4.717 |
, | +4.678 |
. | +4.559 |
a | +4.535 |
Neg logit contributions | |
lor | -4.308 |
umm | -4.171 |
arians | -4.156 |
ocol | -4.108 |
rol | -4.099 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.891 |
and | +1.834 |
a | +1.740 |
, | +1.675 |
. | +1.546 |
Neg logit contributions | |
lor | -7.001 |
rol | -6.895 |
arians | -6.883 |
umm | -6.848 |
ides | -6.771 |
Token | She |
Token ID | 1375 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.448 |
the | +3.340 |
, | +3.308 |
. | +3.192 |
a | +3.137 |
Neg logit contributions | |
lor | -5.722 |
arians | -5.561 |
umm | -5.498 |
rol | -5.495 |
ocol | -5.446 |
Token | could |
Token ID | 714 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.321 |
the | +3.287 |
, | +3.254 |
. | +3.132 |
a | +3.090 |
Neg logit contributions | |
lor | -5.721 |
arians | -5.624 |
rol | -5.535 |
ides | -5.440 |
umm | -5.437 |
Token | not |
Token ID | 407 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.768 |
, | +2.645 |
the | +2.613 |
. | +2.519 |
a | +2.427 |
Neg logit contributions | |
lor | -6.283 |
arians | -6.170 |
rol | -6.068 |
ides | -6.020 |
umm | -6.011 |
Token | save |
Token ID | 3613 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.776 |
the | +3.710 |
, | +3.637 |
a | +3.502 |
. | +3.454 |
Neg logit contributions | |
lor | -5.250 |
arians | -5.171 |
ides | -5.114 |
umm | -5.049 |
rol | -5.004 |
Token | them |
Token ID | 606 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.308 |
, | +3.142 |
the | +3.041 |
. | +2.976 |
a | +2.913 |
Neg logit contributions | |
arians | -5.715 |
lor | -5.699 |
ocol | -5.610 |
rol | -5.566 |
umm | -5.496 |
Token | . |
Token ID | 13 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.455 |
the | +1.419 |
, | +1.305 |
a | +1.240 |
. | +1.123 |
Neg logit contributions | |
lor | -7.518 |
arians | -7.401 |
rol | -7.356 |
ides | -7.279 |
umm | -7.264 |
Token | She |
Token ID | 1375 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.300 |
the | +3.189 |
, | +3.148 |
. | +3.022 |
a | +2.980 |
Neg logit contributions | |
lor | -5.895 |
arians | -5.743 |
umm | -5.661 |
rol | -5.638 |
ocol | -5.573 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.218 |
the | +3.180 |
, | +3.144 |
. | +3.015 |
a | +2.974 |
Neg logit contributions | |
lor | -5.859 |
arians | -5.749 |
rol | -5.667 |
umm | -5.578 |
ides | -5.562 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +2.058 |
and | +2.052 |
, | +1.940 |
a | +1.915 |
. | +1.851 |
Neg logit contributions | |
lor | -6.838 |
arians | -6.734 |
rol | -6.605 |
isher | -6.572 |
osity | -6.544 |
Token | said |
Token ID | 531 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.171 |
, | +3.030 |
. | +2.980 |
the | +2.908 |
a | +2.807 |
Neg logit contributions | |
lor | -5.786 |
arians | -5.782 |
bek | -5.683 |
isher | -5.612 |
rol | -5.577 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.636 |
the | +1.504 |
, | +1.411 |
. | +1.371 |
a | +1.319 |
Neg logit contributions | |
lor | -7.527 |
arians | -7.341 |
umm | -7.304 |
rol | -7.281 |
osity | -7.229 |
Token | " |
Token ID | 366 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.312 |
the | +2.246 |
, | +2.162 |
. | +2.087 |
a | +2.052 |
Neg logit contributions | |
lor | -6.673 |
arians | -6.583 |
osity | -6.471 |
rol | -6.440 |
umm | -6.431 |
Token | I |
Token ID | 40 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.568 |
the | +5.465 |
, | +5.459 |
. | +5.336 |
a | +5.283 |
Neg logit contributions | |
lor | -3.696 |
arians | -3.514 |
umm | -3.504 |
rol | -3.466 |
ocol | -3.357 |
Token | can |
Token ID | 460 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.120 |
the | +4.068 |
, | +3.965 |
. | +3.889 |
a | +3.839 |
Neg logit contributions | |
lor | -5.030 |
arians | -4.842 |
rol | -4.813 |
umm | -4.812 |
ides | -4.762 |
Token | help |
Token ID | 1037 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.035 |
the | +3.946 |
, | +3.882 |
. | +3.789 |
a | +3.754 |
Neg logit contributions | |
lor | -5.108 |
arians | -4.986 |
umm | -4.894 |
rol | -4.851 |
ides | -4.823 |
Token | you |
Token ID | 345 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.047 |
the | +2.857 |
, | +2.856 |
. | +2.746 |
a | +2.733 |
Neg logit contributions | |
lor | -5.992 |
arians | -5.980 |
umm | -5.763 |
ocol | -5.759 |
ides | -5.724 |
Token | fix |
Token ID | 4259 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.769 |
the | +3.730 |
, | +3.590 |
a | +3.531 |
. | +3.482 |
Neg logit contributions | |
lor | -5.334 |
arians | -5.179 |
ides | -5.063 |
umm | -5.051 |
rol | -5.014 |
Token | your |
Token ID | 534 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.579 |
, | +2.388 |
. | +2.291 |
the | +2.280 |
a | +2.198 |
Neg logit contributions | |
lor | -6.472 |
arians | -6.404 |
ocol | -6.301 |
isher | -6.209 |
umm | -6.176 |
Token | bike |
Token ID | 7161 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.133 |
the | +5.042 |
, | +4.986 |
a | +4.872 |
. | +4.840 |
Neg logit contributions | |
lor | -3.910 |
arians | -3.832 |
umm | -3.794 |
ocol | -3.721 |
isher | -3.705 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.074 |
the | +3.070 |
, | +2.984 |
. | +2.937 |
a | +2.905 |
Neg logit contributions | |
lor | -5.959 |
arians | -5.776 |
rol | -5.679 |
umm | -5.601 |
osity | -5.593 |
Token | always |
Token ID | 1464 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.340 |
, | +3.188 |
the | +3.077 |
. | +3.068 |
a | +2.852 |
Neg logit contributions | |
lor | -5.821 |
rol | -5.614 |
arians | -5.593 |
beh | -5.518 |
icians | -5.510 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.759 |
, | +3.603 |
the | +3.534 |
. | +3.500 |
a | +3.296 |
Neg logit contributions | |
lor | -5.178 |
beh | -5.084 |
rol | -5.065 |
arians | -5.033 |
icians | -4.967 |
Token | in |
Token ID | 287 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +1.594 |
the | +1.581 |
, | +1.493 |
a | +1.450 |
. | +1.377 |
Neg logit contributions | |
lor | -7.184 |
umm | -7.130 |
rol | -7.120 |
arians | -7.087 |
ocol | -7.026 |
Token | his |
Token ID | 465 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.582 |
, | +3.405 |
. | +3.251 |
the | +3.216 |
a | +3.092 |
Neg logit contributions | |
lor | -5.402 |
ocol | -5.355 |
arians | -5.234 |
umm | -5.179 |
rol | -5.139 |
Token | room |
Token ID | 2119 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.031 |
the | +4.928 |
, | +4.784 |
a | +4.729 |
. | +4.707 |
Neg logit contributions | |
lor | -4.002 |
umm | -3.924 |
arians | -3.852 |
ocol | -3.799 |
former | -3.794 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.470 |
and | +1.382 |
, | +1.272 |
a | +1.257 |
. | +1.109 |
Neg logit contributions | |
lor | -7.513 |
arians | -7.379 |
rol | -7.264 |
umm | -7.221 |
ides | -7.194 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
, | +2.419 |
and | +2.404 |
the | +2.391 |
. | +2.334 |
a | +2.244 |
Neg logit contributions | |
lor | -6.401 |
arians | -6.323 |
rol | -6.272 |
umm | -6.203 |
osity | -6.168 |
Token | he |
Token ID | 339 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.762 |
, | +2.665 |
. | +2.610 |
the | +2.552 |
a | +2.418 |
Neg logit contributions | |
lor | -6.190 |
arians | -6.062 |
rol | -6.028 |
umm | -5.963 |
osity | -5.960 |
Token | never |
Token ID | 1239 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.624 |
the | +3.584 |
, | +3.542 |
. | +3.444 |
a | +3.401 |
Neg logit contributions | |
lor | -5.479 |
arians | -5.322 |
rol | -5.246 |
umm | -5.162 |
ides | -5.121 |
Token | had |
Token ID | 550 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.098 |
the | +3.979 |
, | +3.919 |
. | +3.819 |
a | +3.795 |
Neg logit contributions | |
lor | -4.960 |
rol | -4.813 |
arians | -4.798 |
beh | -4.787 |
osity | -4.782 |
Token | his |
Token ID | 465 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.582 |
, | +3.405 |
. | +3.251 |
the | +3.216 |
a | +3.092 |
Neg logit contributions | |
lor | -5.402 |
ocol | -5.355 |
arians | -5.234 |
umm | -5.179 |
rol | -5.139 |
Token | room |
Token ID | 2119 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.031 |
the | +4.928 |
, | +4.784 |
a | +4.729 |
. | +4.707 |
Neg logit contributions | |
lor | -4.002 |
umm | -3.924 |
arians | -3.852 |
ocol | -3.799 |
former | -3.794 |
Token | , |
Token ID | 11 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +1.470 |
and | +1.382 |
, | +1.272 |
a | +1.257 |
. | +1.109 |
Neg logit contributions | |
lor | -7.513 |
arians | -7.379 |
rol | -7.264 |
umm | -7.221 |
ides | -7.194 |
Token | and |
Token ID | 290 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
, | +2.419 |
and | +2.404 |
the | +2.391 |
. | +2.334 |
a | +2.244 |
Neg logit contributions | |
lor | -6.401 |
arians | -6.323 |
rol | -6.272 |
umm | -6.203 |
osity | -6.168 |
Token | he |
Token ID | 339 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.762 |
, | +2.665 |
. | +2.610 |
the | +2.552 |
a | +2.418 |
Neg logit contributions | |
lor | -6.190 |
arians | -6.062 |
rol | -6.028 |
umm | -5.963 |
osity | -5.960 |
Token | never |
Token ID | 1239 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +3.624 |
the | +3.584 |
, | +3.542 |
. | +3.444 |
a | +3.401 |
Neg logit contributions | |
lor | -5.479 |
arians | -5.322 |
rol | -5.246 |
umm | -5.162 |
ides | -5.121 |
Token | had |
Token ID | 550 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.098 |
the | +3.979 |
, | +3.919 |
. | +3.819 |
a | +3.795 |
Neg logit contributions | |
lor | -4.960 |
rol | -4.813 |
arians | -4.798 |
beh | -4.787 |
osity | -4.782 |
Token | a |
Token ID | 257 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +2.655 |
, | +2.493 |
the | +2.416 |
. | +2.337 |
a | +2.189 |
Neg logit contributions | |
lor | -6.492 |
rol | -6.285 |
arians | -6.263 |
umm | -6.203 |
beh | -6.197 |
Token | good |
Token ID | 922 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +5.545 |
the | +5.518 |
, | +5.333 |
. | +5.317 |
a | +5.239 |
Neg logit contributions | |
lor | -3.595 |
arians | -3.393 |
umm | -3.363 |
osity | -3.287 |
bek | -3.278 |
Token | night |
Token ID | 1755 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
and | +4.624 |
the | +4.618 |
, | +4.489 |
. | +4.398 |
a | +4.367 |
Neg logit contributions | |
lor | -4.484 |
umm | -4.334 |
arians | -4.278 |
rol | -4.245 |
ides | -4.228 |
Token | 's |
Token ID | 338 |
Feature activation | +5.40e+02 |
Pos logit contributions | |
the | +3.013 |
and | +3.013 |
, | +2.877 |
a | +2.839 |
. | +2.687 |
Neg logit contributions | |
lor | -6.047 |
umm | -5.912 |
arians | -5.782 |
rol | -5.752 |
ides | -5.743 |