Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | hid |
Token ID | 24519 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.485 |
, | +3.462 |
. | +3.277 |
the | +3.180 |
a | +3.024 |
Neg logit contributions | |
lor | -4.871 |
former | -4.818 |
umm | -4.776 |
ocol | -4.726 |
arians | -4.710 |
Token | under |
Token ID | 739 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.879 |
, | +2.857 |
. | +2.609 |
the | +2.575 |
a | +2.443 |
Neg logit contributions | |
umm | -5.473 |
lor | -5.457 |
ocol | -5.448 |
former | -5.383 |
arians | -5.336 |
Token | the |
Token ID | 262 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.456 |
, | +1.420 |
. | +1.206 |
the | +1.091 |
a | +0.939 |
Neg logit contributions | |
umm | -6.918 |
lor | -6.914 |
ocol | -6.888 |
former | -6.856 |
arians | -6.745 |
Token | covers |
Token ID | 8698 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.343 |
, | +4.330 |
. | +4.109 |
the | +4.103 |
a | +3.960 |
Neg logit contributions | |
umm | -4.028 |
lor | -4.008 |
ocol | -3.948 |
former | -3.912 |
arians | -3.823 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.721 |
, | +0.694 |
the | +0.467 |
. | +0.454 |
a | +0.332 |
Neg logit contributions | |
lor | -7.660 |
umm | -7.640 |
ocol | -7.531 |
former | -7.513 |
arians | -7.458 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | hid |
Token ID | 24519 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.485 |
, | +3.462 |
. | +3.277 |
the | +3.180 |
a | +3.024 |
Neg logit contributions | |
lor | -4.871 |
former | -4.818 |
umm | -4.776 |
ocol | -4.726 |
arians | -4.710 |
Token | under |
Token ID | 739 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.879 |
, | +2.857 |
. | +2.609 |
the | +2.575 |
a | +2.443 |
Neg logit contributions | |
umm | -5.473 |
lor | -5.457 |
ocol | -5.448 |
former | -5.383 |
arians | -5.336 |
Token | the |
Token ID | 262 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.456 |
, | +1.420 |
. | +1.206 |
the | +1.091 |
a | +0.939 |
Neg logit contributions | |
umm | -6.918 |
lor | -6.914 |
ocol | -6.888 |
former | -6.856 |
arians | -6.745 |
Token | covers |
Token ID | 8698 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.343 |
, | +4.330 |
. | +4.109 |
the | +4.103 |
a | +3.960 |
Neg logit contributions | |
umm | -4.028 |
lor | -4.008 |
ocol | -3.948 |
former | -3.912 |
arians | -3.823 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | hid |
Token ID | 24519 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.485 |
, | +3.462 |
. | +3.277 |
the | +3.180 |
a | +3.024 |
Neg logit contributions | |
lor | -4.871 |
former | -4.818 |
umm | -4.776 |
ocol | -4.726 |
arians | -4.710 |
Token | under |
Token ID | 739 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.879 |
, | +2.857 |
. | +2.609 |
the | +2.575 |
a | +2.443 |
Neg logit contributions | |
umm | -5.473 |
lor | -5.457 |
ocol | -5.448 |
former | -5.383 |
arians | -5.336 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | hid |
Token ID | 24519 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.485 |
, | +3.462 |
. | +3.277 |
the | +3.180 |
a | +3.024 |
Neg logit contributions | |
lor | -4.871 |
former | -4.818 |
umm | -4.776 |
ocol | -4.726 |
arians | -4.710 |
Token | under |
Token ID | 739 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.879 |
, | +2.857 |
. | +2.609 |
the | +2.575 |
a | +2.443 |
Neg logit contributions | |
umm | -5.473 |
lor | -5.457 |
ocol | -5.448 |
former | -5.383 |
arians | -5.336 |
Token | the |
Token ID | 262 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.456 |
, | +1.420 |
. | +1.206 |
the | +1.091 |
a | +0.939 |
Neg logit contributions | |
umm | -6.918 |
lor | -6.914 |
ocol | -6.888 |
former | -6.856 |
arians | -6.745 |
Token | talking |
Token ID | 3375 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.632 |
, | +3.569 |
. | +3.383 |
the | +3.378 |
a | +3.203 |
Neg logit contributions | |
lor | -4.728 |
umm | -4.678 |
former | -4.668 |
ocol | -4.616 |
arians | -4.584 |
Token | , |
Token ID | 11 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.690 |
, | +2.673 |
the | +2.471 |
. | +2.462 |
a | +2.293 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.621 |
former | -5.582 |
ocol | -5.509 |
arians | -5.499 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.617 |
, | +3.607 |
. | +3.444 |
the | +3.371 |
a | +3.223 |
Neg logit contributions | |
umm | -4.713 |
lor | -4.680 |
former | -4.671 |
ocol | -4.623 |
arians | -4.581 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | you |
Token ID | 345 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.147 |
, | +3.126 |
. | +2.959 |
the | +2.914 |
a | +2.783 |
Neg logit contributions | |
lor | -5.146 |
umm | -5.134 |
arians | -5.074 |
former | -5.059 |
ocol | -5.030 |
Token | talking |
Token ID | 3375 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.632 |
, | +3.569 |
. | +3.383 |
the | +3.378 |
a | +3.203 |
Neg logit contributions | |
lor | -4.728 |
umm | -4.678 |
former | -4.668 |
ocol | -4.616 |
arians | -4.584 |
Token | , |
Token ID | 11 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.690 |
, | +2.673 |
the | +2.471 |
. | +2.462 |
a | +2.293 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.621 |
former | -5.582 |
ocol | -5.509 |
arians | -5.499 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.617 |
, | +3.607 |
. | +3.444 |
the | +3.371 |
a | +3.223 |
Neg logit contributions | |
umm | -4.713 |
lor | -4.680 |
former | -4.671 |
ocol | -4.623 |
arians | -4.581 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | , |
Token ID | 11 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.690 |
, | +2.673 |
the | +2.471 |
. | +2.462 |
a | +2.293 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.621 |
former | -5.582 |
ocol | -5.509 |
arians | -5.499 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.617 |
, | +3.607 |
. | +3.444 |
the | +3.371 |
a | +3.223 |
Neg logit contributions | |
umm | -4.713 |
lor | -4.680 |
former | -4.671 |
ocol | -4.623 |
arians | -4.581 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.617 |
, | +3.607 |
. | +3.444 |
the | +3.371 |
a | +3.223 |
Neg logit contributions | |
umm | -4.713 |
lor | -4.680 |
former | -4.671 |
ocol | -4.623 |
arians | -4.581 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | hid |
Token ID | 24519 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.485 |
, | +3.462 |
. | +3.277 |
the | +3.180 |
a | +3.024 |
Neg logit contributions | |
lor | -4.871 |
former | -4.818 |
umm | -4.776 |
ocol | -4.726 |
arians | -4.710 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.234 |
, | +2.113 |
the | +1.937 |
. | +1.924 |
a | +1.796 |
Neg logit contributions | |
umm | -6.091 |
lor | -6.080 |
ocol | -6.013 |
arians | -5.991 |
former | -5.967 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.586 |
, | +4.539 |
. | +4.379 |
the | +4.314 |
a | +4.154 |
Neg logit contributions | |
lor | -3.866 |
umm | -3.850 |
former | -3.751 |
arians | -3.745 |
ocol | -3.716 |
Token | more |
Token ID | 517 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.433 |
, | +4.391 |
. | +4.207 |
the | +4.153 |
a | +3.969 |
Neg logit contributions | |
umm | -4.013 |
former | -3.959 |
lor | -3.957 |
ocol | -3.913 |
arians | -3.877 |
Token | , |
Token ID | 11 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.928 |
, | +3.861 |
. | +3.693 |
the | +3.673 |
a | +3.522 |
Neg logit contributions | |
umm | -4.455 |
lor | -4.415 |
former | -4.369 |
ocol | -4.363 |
arians | -4.304 |
Token | the |
Token ID | 262 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.623 |
, | +3.614 |
. | +3.463 |
the | +3.326 |
a | +3.187 |
Neg logit contributions | |
umm | -4.763 |
former | -4.684 |
lor | -4.681 |
ocol | -4.681 |
arians | -4.593 |
Token | mer |
Token ID | 4017 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.291 |
, | +4.247 |
. | +4.059 |
the | +3.998 |
a | +3.810 |
Neg logit contributions | |
umm | -4.164 |
former | -4.110 |
lor | -4.090 |
ocol | -4.051 |
arians | -4.016 |
Token | rier |
Token ID | 5277 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +7.245 |
, | +7.220 |
the | +7.061 |
. | +7.043 |
a | +6.895 |
Neg logit contributions | |
umm | -1.236 |
lor | -1.226 |
former | -1.150 |
ocol | -1.127 |
arians | -1.083 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.130 |
, | +3.089 |
the | +2.934 |
. | +2.899 |
a | +2.770 |
Neg logit contributions | |
lor | -5.225 |
umm | -5.188 |
former | -5.104 |
ocol | -5.084 |
arians | -5.063 |
Token | Come |
Token ID | 7911 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.032 |
, | +3.997 |
. | +3.801 |
the | +3.742 |
a | +3.579 |
Neg logit contributions | |
umm | -4.451 |
lor | -4.435 |
former | -4.353 |
ocol | -4.331 |
arians | -4.273 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.062 |
, | +2.015 |
. | +1.873 |
the | +1.839 |
a | +1.680 |
Neg logit contributions | |
lor | -6.296 |
umm | -6.247 |
arians | -6.162 |
ocol | -6.151 |
former | -6.142 |
Token | my |
Token ID | 616 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.857 |
, | +2.797 |
. | +2.627 |
the | +2.454 |
a | +2.334 |
Neg logit contributions | |
lor | -5.552 |
former | -5.548 |
umm | -5.535 |
ocol | -5.509 |
arians | -5.408 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | hid |
Token ID | 24519 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.485 |
, | +3.462 |
. | +3.277 |
the | +3.180 |
a | +3.024 |
Neg logit contributions | |
lor | -4.871 |
former | -4.818 |
umm | -4.776 |
ocol | -4.726 |
arians | -4.710 |
Token | under |
Token ID | 739 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.879 |
, | +2.857 |
. | +2.609 |
the | +2.575 |
a | +2.443 |
Neg logit contributions | |
umm | -5.473 |
lor | -5.457 |
ocol | -5.448 |
former | -5.383 |
arians | -5.336 |
Token | the |
Token ID | 262 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.456 |
, | +1.420 |
. | +1.206 |
the | +1.091 |
a | +0.939 |
Neg logit contributions | |
umm | -6.918 |
lor | -6.914 |
ocol | -6.888 |
former | -6.856 |
arians | -6.745 |
Token | covers |
Token ID | 8698 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.343 |
, | +4.330 |
. | +4.109 |
the | +4.103 |
a | +3.960 |
Neg logit contributions | |
umm | -4.028 |
lor | -4.008 |
ocol | -3.948 |
former | -3.912 |
arians | -3.823 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | hid |
Token ID | 24519 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.485 |
, | +3.462 |
. | +3.277 |
the | +3.180 |
a | +3.024 |
Neg logit contributions | |
lor | -4.871 |
former | -4.818 |
umm | -4.776 |
ocol | -4.726 |
arians | -4.710 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | hid |
Token ID | 24519 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.485 |
, | +3.462 |
. | +3.277 |
the | +3.180 |
a | +3.024 |
Neg logit contributions | |
lor | -4.871 |
former | -4.818 |
umm | -4.776 |
ocol | -4.726 |
arians | -4.710 |
Token | under |
Token ID | 739 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.879 |
, | +2.857 |
. | +2.609 |
the | +2.575 |
a | +2.443 |
Neg logit contributions | |
umm | -5.473 |
lor | -5.457 |
ocol | -5.448 |
former | -5.383 |
arians | -5.336 |
Token | the |
Token ID | 262 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.456 |
, | +1.420 |
. | +1.206 |
the | +1.091 |
a | +0.939 |
Neg logit contributions | |
umm | -6.918 |
lor | -6.914 |
ocol | -6.888 |
former | -6.856 |
arians | -6.745 |
Token | talking |
Token ID | 3375 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.632 |
, | +3.569 |
. | +3.383 |
the | +3.378 |
a | +3.203 |
Neg logit contributions | |
lor | -4.728 |
umm | -4.678 |
former | -4.668 |
ocol | -4.616 |
arians | -4.584 |
Token | , |
Token ID | 11 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.690 |
, | +2.673 |
the | +2.471 |
. | +2.462 |
a | +2.293 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.621 |
former | -5.582 |
ocol | -5.509 |
arians | -5.499 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.617 |
, | +3.607 |
. | +3.444 |
the | +3.371 |
a | +3.223 |
Neg logit contributions | |
umm | -4.713 |
lor | -4.680 |
former | -4.671 |
ocol | -4.623 |
arians | -4.581 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | you |
Token ID | 345 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.147 |
, | +3.126 |
. | +2.959 |
the | +2.914 |
a | +2.783 |
Neg logit contributions | |
lor | -5.146 |
umm | -5.134 |
arians | -5.074 |
former | -5.059 |
ocol | -5.030 |
Token | talking |
Token ID | 3375 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.632 |
, | +3.569 |
. | +3.383 |
the | +3.378 |
a | +3.203 |
Neg logit contributions | |
lor | -4.728 |
umm | -4.678 |
former | -4.668 |
ocol | -4.616 |
arians | -4.584 |
Token | , |
Token ID | 11 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.690 |
, | +2.673 |
the | +2.471 |
. | +2.462 |
a | +2.293 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.621 |
former | -5.582 |
ocol | -5.509 |
arians | -5.499 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.617 |
, | +3.607 |
. | +3.444 |
the | +3.371 |
a | +3.223 |
Neg logit contributions | |
umm | -4.713 |
lor | -4.680 |
former | -4.671 |
ocol | -4.623 |
arians | -4.581 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | , |
Token ID | 11 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.690 |
, | +2.673 |
the | +2.471 |
. | +2.462 |
a | +2.293 |
Neg logit contributions | |
lor | -5.655 |
umm | -5.621 |
former | -5.582 |
ocol | -5.509 |
arians | -5.499 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.617 |
, | +3.607 |
. | +3.444 |
the | +3.371 |
a | +3.223 |
Neg logit contributions | |
umm | -4.713 |
lor | -4.680 |
former | -4.671 |
ocol | -4.623 |
arians | -4.581 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | hid |
Token ID | 24519 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.485 |
, | +3.462 |
. | +3.277 |
the | +3.180 |
a | +3.024 |
Neg logit contributions | |
lor | -4.871 |
former | -4.818 |
umm | -4.776 |
ocol | -4.726 |
arians | -4.710 |
Token | under |
Token ID | 739 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.879 |
, | +2.857 |
. | +2.609 |
the | +2.575 |
a | +2.443 |
Neg logit contributions | |
umm | -5.473 |
lor | -5.457 |
ocol | -5.448 |
former | -5.383 |
arians | -5.336 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | to |
Token ID | 284 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.787 |
, | +1.760 |
. | +1.562 |
the | +1.528 |
a | +1.375 |
Neg logit contributions | |
lor | -6.580 |
umm | -6.527 |
former | -6.482 |
ocol | -6.451 |
arians | -6.428 |
Token | his |
Token ID | 465 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.282 |
, | +2.249 |
. | +2.041 |
the | +1.910 |
a | +1.790 |
Neg logit contributions | |
lor | -6.056 |
umm | -6.045 |
former | -6.040 |
ocol | -6.032 |
arians | -5.941 |
Token | bed |
Token ID | 3996 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.694 |
, | +3.665 |
. | +3.474 |
the | +3.445 |
a | +3.274 |
Neg logit contributions | |
umm | -4.693 |
former | -4.681 |
lor | -4.647 |
arians | -4.565 |
ocol | -4.536 |
Token | and |
Token ID | 290 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.096 |
, | +1.073 |
the | +0.906 |
. | +0.874 |
a | +0.735 |
Neg logit contributions | |
lor | -7.260 |
umm | -7.214 |
former | -7.169 |
arians | -7.074 |
ocol | -7.051 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.992 |
, | +2.955 |
. | +2.740 |
the | +2.699 |
a | +2.534 |
Neg logit contributions | |
umm | -5.440 |
lor | -5.430 |
former | -5.347 |
ocol | -5.304 |
arians | -5.268 |
Token |
|
Token ID | 198 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.358 |
, | +1.322 |
. | +1.102 |
the | +1.061 |
a | +0.913 |
Neg logit contributions | |
lor | -7.070 |
umm | -6.971 |
former | -6.928 |
ocol | -6.912 |
arians | -6.845 |
Token | Tom |
Token ID | 13787 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.613 |
, | +3.572 |
. | +3.374 |
the | +3.334 |
a | +3.174 |
Neg logit contributions | |
lor | -4.887 |
umm | -4.823 |
former | -4.745 |
ocol | -4.730 |
arians | -4.703 |
Token | went |
Token ID | 1816 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.868 |
and | +2.864 |
. | +2.715 |
the | +2.684 |
a | +2.522 |
Neg logit contributions | |
lor | -5.440 |
umm | -5.354 |
arians | -5.308 |
former | -5.307 |
ocol | -5.243 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.478 |
, | +0.447 |
the | +0.272 |
. | +0.243 |
a | +0.138 |
Neg logit contributions | |
umm | -7.848 |
lor | -7.766 |
ocol | -7.746 |
former | -7.691 |
arians | -7.646 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.617 |
, | +3.607 |
. | +3.444 |
the | +3.371 |
a | +3.223 |
Neg logit contributions | |
umm | -4.713 |
lor | -4.680 |
former | -4.671 |
ocol | -4.623 |
arians | -4.581 |
Token | ?" |
Token ID | 1701 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.056 |
, | +2.020 |
the | +1.860 |
. | +1.835 |
a | +1.686 |
Neg logit contributions | |
umm | -6.270 |
lor | -6.266 |
former | -6.171 |
ocol | -6.146 |
arians | -6.102 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | The |
Token ID | 383 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.038 |
, | +2.992 |
. | +2.806 |
the | +2.737 |
a | +2.598 |
Neg logit contributions | |
lor | -5.312 |
umm | -5.295 |
former | -5.254 |
ocol | -5.246 |
arians | -5.169 |
Token | table |
Token ID | 3084 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.103 |
, | +4.077 |
. | +3.873 |
the | +3.829 |
a | +3.657 |
Neg logit contributions | |
umm | -4.311 |
lor | -4.243 |
former | -4.229 |
ocol | -4.228 |
arians | -4.144 |
Token | did |
Token ID | 750 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.665 |
, | +3.632 |
. | +3.453 |
the | +3.443 |
a | +3.274 |
Neg logit contributions | |
lor | -4.683 |
umm | -4.664 |
former | -4.567 |
ocol | -4.556 |
arians | -4.502 |
Token | not |
Token ID | 407 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.268 |
, | +2.221 |
. | +2.029 |
the | +2.002 |
a | +1.829 |
Neg logit contributions | |
lor | -6.089 |
umm | -6.036 |
former | -6.032 |
ocol | -5.985 |
arians | -5.927 |
Token | say |
Token ID | 910 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.793 |
, | +3.758 |
. | +3.557 |
the | +3.542 |
a | +3.366 |
Neg logit contributions | |
umm | -4.589 |
lor | -4.535 |
ocol | -4.522 |
former | -4.512 |
arians | -4.432 |
Token | anything |
Token ID | 1997 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +4.064 |
, | +3.968 |
. | +3.795 |
the | +3.748 |
a | +3.585 |
Neg logit contributions | |
lor | -4.377 |
umm | -4.318 |
ocol | -4.264 |
former | -4.230 |
arians | -4.176 |
Token | either |
Token ID | 2035 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +1.779 |
, | +1.737 |
the | +1.538 |
. | +1.530 |
a | +1.393 |
Neg logit contributions | |
lor | -6.547 |
umm | -6.529 |
former | -6.460 |
ocol | -6.444 |
arians | -6.411 |
Token | . |
Token ID | 13 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +0.833 |
, | +0.783 |
the | +0.612 |
. | +0.580 |
a | +0.464 |
Neg logit contributions | |
lor | -7.493 |
umm | -7.479 |
ocol | -7.387 |
former | -7.354 |
arians | -7.321 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +2.864 |
, | +2.834 |
. | +2.627 |
the | +2.577 |
a | +2.416 |
Neg logit contributions | |
lor | -5.563 |
umm | -5.531 |
former | -5.472 |
ocol | -5.440 |
arians | -5.389 |
Token | was |
Token ID | 373 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
, | +2.908 |
and | +2.902 |
. | +2.743 |
the | +2.710 |
a | +2.547 |
Neg logit contributions | |
lor | -5.398 |
umm | -5.341 |
former | -5.304 |
arians | -5.269 |
ocol | -5.231 |
Token | scared |
Token ID | 12008 |
Feature activation | +4.96e+01 |
Pos logit contributions | |
and | +3.567 |
, | +3.548 |
. | +3.345 |
the | +3.276 |
a | +3.081 |
Neg logit contributions | |
lor | -4.770 |
former | -4.758 |
umm | -4.752 |
ocol | -4.709 |
arians | -4.641 |