Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | under |
Token ID | 739 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.979 |
, | +2.932 |
the | +2.691 |
. | +2.671 |
a | +2.539 |
Neg logit contributions | |
umm | -5.514 |
lor | -5.502 |
ocol | -5.462 |
arians | -5.382 |
former | -5.375 |
Token | the |
Token ID | 262 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.522 |
, | +1.455 |
. | +1.240 |
the | +1.145 |
a | +0.965 |
Neg logit contributions | |
lor | -7.000 |
umm | -6.994 |
ocol | -6.941 |
former | -6.897 |
arians | -6.814 |
Token | covers |
Token ID | 8698 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.470 |
, | +4.430 |
the | +4.264 |
. | +4.212 |
a | +4.092 |
Neg logit contributions | |
umm | -4.070 |
lor | -4.055 |
ocol | -3.938 |
former | -3.901 |
arians | -3.855 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.786 |
, | +0.733 |
the | +0.569 |
. | +0.470 |
a | +0.416 |
Neg logit contributions | |
lor | -7.755 |
umm | -7.709 |
ocol | -7.545 |
former | -7.513 |
arians | -7.512 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | under |
Token ID | 739 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.979 |
, | +2.932 |
the | +2.691 |
. | +2.671 |
a | +2.539 |
Neg logit contributions | |
umm | -5.514 |
lor | -5.502 |
ocol | -5.462 |
arians | -5.382 |
former | -5.375 |
Token | the |
Token ID | 262 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.522 |
, | +1.455 |
. | +1.240 |
the | +1.145 |
a | +0.965 |
Neg logit contributions | |
lor | -7.000 |
umm | -6.994 |
ocol | -6.941 |
former | -6.897 |
arians | -6.814 |
Token | covers |
Token ID | 8698 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.470 |
, | +4.430 |
the | +4.264 |
. | +4.212 |
a | +4.092 |
Neg logit contributions | |
umm | -4.070 |
lor | -4.055 |
ocol | -3.938 |
former | -3.901 |
arians | -3.855 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | under |
Token ID | 739 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.979 |
, | +2.932 |
the | +2.691 |
. | +2.671 |
a | +2.539 |
Neg logit contributions | |
umm | -5.514 |
lor | -5.502 |
ocol | -5.462 |
arians | -5.382 |
former | -5.375 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | under |
Token ID | 739 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.979 |
, | +2.932 |
the | +2.691 |
. | +2.671 |
a | +2.539 |
Neg logit contributions | |
umm | -5.514 |
lor | -5.502 |
ocol | -5.462 |
arians | -5.382 |
former | -5.375 |
Token | the |
Token ID | 262 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.522 |
, | +1.455 |
. | +1.240 |
the | +1.145 |
a | +0.965 |
Neg logit contributions | |
lor | -7.000 |
umm | -6.994 |
ocol | -6.941 |
former | -6.897 |
arians | -6.814 |
Token | talking |
Token ID | 3375 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.747 |
, | +3.641 |
the | +3.525 |
. | +3.464 |
a | +3.313 |
Neg logit contributions | |
lor | -4.784 |
umm | -4.701 |
former | -4.678 |
arians | -4.632 |
ocol | -4.603 |
Token | , |
Token ID | 11 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.797 |
, | +2.754 |
the | +2.622 |
. | +2.545 |
a | +2.407 |
Neg logit contributions | |
lor | -5.717 |
umm | -5.661 |
former | -5.592 |
arians | -5.549 |
osity | -5.504 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.712 |
, | +3.680 |
. | +3.535 |
the | +3.501 |
a | +3.327 |
Neg logit contributions | |
umm | -4.769 |
lor | -4.735 |
former | -4.696 |
arians | -4.645 |
ocol | -4.630 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | you |
Token ID | 345 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.218 |
, | +3.173 |
the | +3.031 |
. | +3.026 |
a | +2.883 |
Neg logit contributions | |
lor | -5.200 |
umm | -5.170 |
arians | -5.158 |
former | -5.056 |
osity | -5.025 |
Token | talking |
Token ID | 3375 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.747 |
, | +3.641 |
the | +3.525 |
. | +3.464 |
a | +3.313 |
Neg logit contributions | |
lor | -4.784 |
umm | -4.701 |
former | -4.678 |
arians | -4.632 |
ocol | -4.603 |
Token | , |
Token ID | 11 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.797 |
, | +2.754 |
the | +2.622 |
. | +2.545 |
a | +2.407 |
Neg logit contributions | |
lor | -5.717 |
umm | -5.661 |
former | -5.592 |
arians | -5.549 |
osity | -5.504 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.712 |
, | +3.680 |
. | +3.535 |
the | +3.501 |
a | +3.327 |
Neg logit contributions | |
umm | -4.769 |
lor | -4.735 |
former | -4.696 |
arians | -4.645 |
ocol | -4.630 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | , |
Token ID | 11 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.797 |
, | +2.754 |
the | +2.622 |
. | +2.545 |
a | +2.407 |
Neg logit contributions | |
lor | -5.717 |
umm | -5.661 |
former | -5.592 |
arians | -5.549 |
osity | -5.504 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.712 |
, | +3.680 |
. | +3.535 |
the | +3.501 |
a | +3.327 |
Neg logit contributions | |
umm | -4.769 |
lor | -4.735 |
former | -4.696 |
arians | -4.645 |
ocol | -4.630 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.712 |
, | +3.680 |
. | +3.535 |
the | +3.501 |
a | +3.327 |
Neg logit contributions | |
umm | -4.769 |
lor | -4.735 |
former | -4.696 |
arians | -4.645 |
ocol | -4.630 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | under |
Token ID | 739 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.979 |
, | +2.932 |
the | +2.691 |
. | +2.671 |
a | +2.539 |
Neg logit contributions | |
umm | -5.514 |
lor | -5.502 |
ocol | -5.462 |
arians | -5.382 |
former | -5.375 |
Token | the |
Token ID | 262 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.522 |
, | +1.455 |
. | +1.240 |
the | +1.145 |
a | +0.965 |
Neg logit contributions | |
lor | -7.000 |
umm | -6.994 |
ocol | -6.941 |
former | -6.897 |
arians | -6.814 |
Token | covers |
Token ID | 8698 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.470 |
, | +4.430 |
the | +4.264 |
. | +4.212 |
a | +4.092 |
Neg logit contributions | |
umm | -4.070 |
lor | -4.055 |
ocol | -3.938 |
former | -3.901 |
arians | -3.855 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.786 |
, | +0.733 |
the | +0.569 |
. | +0.470 |
a | +0.416 |
Neg logit contributions | |
lor | -7.755 |
umm | -7.709 |
ocol | -7.545 |
former | -7.513 |
arians | -7.512 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | under |
Token ID | 739 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.979 |
, | +2.932 |
the | +2.691 |
. | +2.671 |
a | +2.539 |
Neg logit contributions | |
umm | -5.514 |
lor | -5.502 |
ocol | -5.462 |
arians | -5.382 |
former | -5.375 |
Token | the |
Token ID | 262 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.522 |
, | +1.455 |
. | +1.240 |
the | +1.145 |
a | +0.965 |
Neg logit contributions | |
lor | -7.000 |
umm | -6.994 |
ocol | -6.941 |
former | -6.897 |
arians | -6.814 |
Token | covers |
Token ID | 8698 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.470 |
, | +4.430 |
the | +4.264 |
. | +4.212 |
a | +4.092 |
Neg logit contributions | |
umm | -4.070 |
lor | -4.055 |
ocol | -3.938 |
former | -3.901 |
arians | -3.855 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | under |
Token ID | 739 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.979 |
, | +2.932 |
the | +2.691 |
. | +2.671 |
a | +2.539 |
Neg logit contributions | |
umm | -5.514 |
lor | -5.502 |
ocol | -5.462 |
arians | -5.382 |
former | -5.375 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | under |
Token ID | 739 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.979 |
, | +2.932 |
the | +2.691 |
. | +2.671 |
a | +2.539 |
Neg logit contributions | |
umm | -5.514 |
lor | -5.502 |
ocol | -5.462 |
arians | -5.382 |
former | -5.375 |
Token | the |
Token ID | 262 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.522 |
, | +1.455 |
. | +1.240 |
the | +1.145 |
a | +0.965 |
Neg logit contributions | |
lor | -7.000 |
umm | -6.994 |
ocol | -6.941 |
former | -6.897 |
arians | -6.814 |
Token | talking |
Token ID | 3375 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.747 |
, | +3.641 |
the | +3.525 |
. | +3.464 |
a | +3.313 |
Neg logit contributions | |
lor | -4.784 |
umm | -4.701 |
former | -4.678 |
arians | -4.632 |
ocol | -4.603 |
Token | , |
Token ID | 11 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.797 |
, | +2.754 |
the | +2.622 |
. | +2.545 |
a | +2.407 |
Neg logit contributions | |
lor | -5.717 |
umm | -5.661 |
former | -5.592 |
arians | -5.549 |
osity | -5.504 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.712 |
, | +3.680 |
. | +3.535 |
the | +3.501 |
a | +3.327 |
Neg logit contributions | |
umm | -4.769 |
lor | -4.735 |
former | -4.696 |
arians | -4.645 |
ocol | -4.630 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | you |
Token ID | 345 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.218 |
, | +3.173 |
the | +3.031 |
. | +3.026 |
a | +2.883 |
Neg logit contributions | |
lor | -5.200 |
umm | -5.170 |
arians | -5.158 |
former | -5.056 |
osity | -5.025 |
Token | talking |
Token ID | 3375 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.747 |
, | +3.641 |
the | +3.525 |
. | +3.464 |
a | +3.313 |
Neg logit contributions | |
lor | -4.784 |
umm | -4.701 |
former | -4.678 |
arians | -4.632 |
ocol | -4.603 |
Token | , |
Token ID | 11 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.797 |
, | +2.754 |
the | +2.622 |
. | +2.545 |
a | +2.407 |
Neg logit contributions | |
lor | -5.717 |
umm | -5.661 |
former | -5.592 |
arians | -5.549 |
osity | -5.504 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.712 |
, | +3.680 |
. | +3.535 |
the | +3.501 |
a | +3.327 |
Neg logit contributions | |
umm | -4.769 |
lor | -4.735 |
former | -4.696 |
arians | -4.645 |
ocol | -4.630 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | , |
Token ID | 11 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.797 |
, | +2.754 |
the | +2.622 |
. | +2.545 |
a | +2.407 |
Neg logit contributions | |
lor | -5.717 |
umm | -5.661 |
former | -5.592 |
arians | -5.549 |
osity | -5.504 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.712 |
, | +3.680 |
. | +3.535 |
the | +3.501 |
a | +3.327 |
Neg logit contributions | |
umm | -4.769 |
lor | -4.735 |
former | -4.696 |
arians | -4.645 |
ocol | -4.630 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.712 |
, | +3.680 |
. | +3.535 |
the | +3.501 |
a | +3.327 |
Neg logit contributions | |
umm | -4.769 |
lor | -4.735 |
former | -4.696 |
arians | -4.645 |
ocol | -4.630 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.383 |
, | +1.315 |
the | +1.114 |
. | +1.106 |
a | +0.935 |
Neg logit contributions | |
lor | -7.234 |
umm | -7.128 |
former | -7.036 |
ocol | -7.012 |
arians | -7.001 |
Token | Tom |
Token ID | 13787 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.722 |
, | +3.648 |
the | +3.469 |
. | +3.459 |
a | +3.279 |
Neg logit contributions | |
lor | -4.973 |
umm | -4.889 |
arians | -4.775 |
former | -4.765 |
ocol | -4.742 |
Token | went |
Token ID | 1816 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.927 |
, | +2.916 |
the | +2.810 |
. | +2.786 |
a | +2.616 |
Neg logit contributions | |
lor | -5.511 |
umm | -5.380 |
arians | -5.377 |
former | -5.303 |
ides | -5.258 |
Token | to |
Token ID | 284 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.848 |
, | +1.794 |
the | +1.622 |
. | +1.601 |
a | +1.441 |
Neg logit contributions | |
lor | -6.669 |
umm | -6.581 |
former | -6.508 |
arians | -6.506 |
ocol | -6.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.369 |
, | +2.305 |
. | +2.102 |
the | +1.996 |
a | +1.856 |
Neg logit contributions | |
lor | -6.126 |
umm | -6.102 |
former | -6.073 |
ocol | -6.058 |
arians | -6.011 |
Token | bed |
Token ID | 3996 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.835 |
, | +3.775 |
the | +3.617 |
. | +3.593 |
a | +3.413 |
Neg logit contributions | |
umm | -4.721 |
former | -4.675 |
lor | -4.675 |
arians | -4.597 |
ocol | -4.498 |
Token | and |
Token ID | 290 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.133 |
, | +1.086 |
the | +1.013 |
. | +0.890 |
a | +0.805 |
Neg logit contributions | |
lor | -7.376 |
umm | -7.292 |
former | -7.225 |
arians | -7.161 |
ides | -7.064 |
Token | hid |
Token ID | 24519 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.593 |
, | +3.543 |
. | +3.368 |
the | +3.304 |
a | +3.118 |
Neg logit contributions | |
lor | -4.928 |
former | -4.828 |
umm | -4.792 |
arians | -4.754 |
ocol | -4.704 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token |
|
Token ID | 198 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.084 |
, | +3.016 |
the | +2.812 |
. | +2.803 |
a | +2.615 |
Neg logit contributions | |
umm | -5.523 |
lor | -5.520 |
former | -5.382 |
arians | -5.346 |
ocol | -5.324 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.491 |
, | +0.432 |
the | +0.344 |
. | +0.229 |
a | +0.192 |
Neg logit contributions | |
umm | -7.942 |
lor | -7.831 |
ocol | -7.786 |
arians | -7.716 |
former | -7.705 |
Token | ?" |
Token ID | 1701 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.158 |
, | +2.092 |
the | +2.021 |
. | +1.916 |
a | +1.810 |
Neg logit contributions | |
lor | -6.318 |
umm | -6.313 |
former | -6.163 |
arians | -6.139 |
ocol | -6.126 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | The |
Token ID | 383 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.131 |
, | +3.049 |
. | +2.872 |
the | +2.839 |
a | +2.681 |
Neg logit contributions | |
lor | -5.368 |
umm | -5.329 |
former | -5.269 |
ocol | -5.258 |
arians | -5.220 |
Token | table |
Token ID | 3084 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.219 |
, | +4.165 |
the | +3.971 |
. | +3.966 |
a | +3.766 |
Neg logit contributions | |
umm | -4.374 |
lor | -4.297 |
former | -4.247 |
ocol | -4.242 |
arians | -4.204 |
Token | did |
Token ID | 750 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.742 |
, | +3.681 |
the | +3.577 |
. | +3.515 |
a | +3.371 |
Neg logit contributions | |
lor | -4.756 |
umm | -4.712 |
former | -4.565 |
ocol | -4.549 |
arians | -4.546 |
Token | not |
Token ID | 407 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.394 |
, | +2.310 |
the | +2.157 |
. | +2.124 |
a | +1.947 |
Neg logit contributions | |
lor | -6.103 |
umm | -6.006 |
former | -6.004 |
ocol | -5.932 |
arians | -5.923 |
Token | say |
Token ID | 910 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.909 |
, | +3.843 |
the | +3.693 |
. | +3.645 |
a | +3.480 |
Neg logit contributions | |
umm | -4.622 |
lor | -4.556 |
ocol | -4.515 |
former | -4.502 |
arians | -4.463 |
Token | anything |
Token ID | 1997 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +4.176 |
, | +4.008 |
the | +3.856 |
. | +3.853 |
a | +3.658 |
Neg logit contributions | |
lor | -4.458 |
umm | -4.343 |
ocol | -4.271 |
arians | -4.211 |
former | -4.209 |
Token | either |
Token ID | 2035 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +1.833 |
, | +1.756 |
the | +1.639 |
. | +1.542 |
a | +1.475 |
Neg logit contributions | |
lor | -6.610 |
umm | -6.563 |
arians | -6.473 |
former | -6.463 |
ocol | -6.441 |
Token | . |
Token ID | 13 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +0.887 |
, | +0.799 |
the | +0.719 |
. | +0.597 |
a | +0.547 |
Neg logit contributions | |
lor | -7.568 |
umm | -7.535 |
ocol | -7.396 |
arians | -7.374 |
ides | -7.353 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.964 |
, | +2.905 |
. | +2.699 |
the | +2.697 |
a | +2.504 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.598 |
former | -5.505 |
arians | -5.461 |
ocol | -5.458 |
Token | was |
Token ID | 373 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +2.969 |
, | +2.967 |
the | +2.847 |
. | +2.823 |
a | +2.651 |
Neg logit contributions | |
lor | -5.452 |
umm | -5.350 |
arians | -5.325 |
former | -5.295 |
ides | -5.204 |
Token | scared |
Token ID | 12008 |
Feature activation | +5.47e+00 |
Pos logit contributions | |
and | +3.689 |
, | +3.647 |
. | +3.446 |
the | +3.415 |
a | +3.173 |
Neg logit contributions | |
lor | -4.789 |
former | -4.755 |
umm | -4.751 |
ocol | -4.683 |
arians | -4.661 |