Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token | the |
Token ID | 262 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.601 |
, | +1.591 |
. | +1.410 |
the | +1.216 |
a | +1.010 |
Neg logit contributions | |
lor | -7.244 |
former | -7.150 |
ocol | -7.140 |
umm | -7.100 |
rol | -7.005 |
Token | covers |
Token ID | 8698 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +4.583 |
and | +4.563 |
. | +4.404 |
the | +4.384 |
a | +4.187 |
Neg logit contributions | |
lor | -4.297 |
umm | -4.177 |
former | -4.141 |
ocol | -4.119 |
rol | -4.072 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.794 |
and | +0.792 |
the | +0.595 |
. | +0.576 |
a | +0.415 |
Neg logit contributions | |
lor | -8.100 |
umm | -7.919 |
rol | -7.903 |
former | -7.860 |
ocol | -7.823 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token | the |
Token ID | 262 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.601 |
, | +1.591 |
. | +1.410 |
the | +1.216 |
a | +1.010 |
Neg logit contributions | |
lor | -7.244 |
former | -7.150 |
ocol | -7.140 |
umm | -7.100 |
rol | -7.005 |
Token | covers |
Token ID | 8698 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +4.583 |
and | +4.563 |
. | +4.404 |
the | +4.384 |
a | +4.187 |
Neg logit contributions | |
lor | -4.297 |
umm | -4.177 |
former | -4.141 |
ocol | -4.119 |
rol | -4.072 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token | the |
Token ID | 262 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.601 |
, | +1.591 |
. | +1.410 |
the | +1.216 |
a | +1.010 |
Neg logit contributions | |
lor | -7.244 |
former | -7.150 |
ocol | -7.140 |
umm | -7.100 |
rol | -7.005 |
Token | talking |
Token ID | 3375 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.889 |
, | +3.845 |
. | +3.712 |
the | +3.687 |
a | +3.450 |
Neg logit contributions | |
lor | -5.000 |
former | -4.889 |
rol | -4.812 |
umm | -4.795 |
osity | -4.775 |
Token | , |
Token ID | 11 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | you |
Token ID | 345 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.403 |
and | +3.402 |
. | +3.289 |
the | +3.217 |
a | +3.026 |
Neg logit contributions | |
lor | -5.435 |
former | -5.294 |
umm | -5.283 |
rol | -5.268 |
osity | -5.241 |
Token | talking |
Token ID | 3375 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.889 |
, | +3.845 |
. | +3.712 |
the | +3.687 |
a | +3.450 |
Neg logit contributions | |
lor | -5.000 |
former | -4.889 |
rol | -4.812 |
umm | -4.795 |
osity | -4.775 |
Token | , |
Token ID | 11 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | , |
Token ID | 11 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token | the |
Token ID | 262 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.601 |
, | +1.591 |
. | +1.410 |
the | +1.216 |
a | +1.010 |
Neg logit contributions | |
lor | -7.244 |
former | -7.150 |
ocol | -7.140 |
umm | -7.100 |
rol | -7.005 |
Token | covers |
Token ID | 8698 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +4.583 |
and | +4.563 |
. | +4.404 |
the | +4.384 |
a | +4.187 |
Neg logit contributions | |
lor | -4.297 |
umm | -4.177 |
former | -4.141 |
ocol | -4.119 |
rol | -4.072 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.794 |
and | +0.792 |
the | +0.595 |
. | +0.576 |
a | +0.415 |
Neg logit contributions | |
lor | -8.100 |
umm | -7.919 |
rol | -7.903 |
former | -7.860 |
ocol | -7.823 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token | the |
Token ID | 262 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.601 |
, | +1.591 |
. | +1.410 |
the | +1.216 |
a | +1.010 |
Neg logit contributions | |
lor | -7.244 |
former | -7.150 |
ocol | -7.140 |
umm | -7.100 |
rol | -7.005 |
Token | covers |
Token ID | 8698 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +4.583 |
and | +4.563 |
. | +4.404 |
the | +4.384 |
a | +4.187 |
Neg logit contributions | |
lor | -4.297 |
umm | -4.177 |
former | -4.141 |
ocol | -4.119 |
rol | -4.072 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | under |
Token ID | 739 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.113 |
and | +3.098 |
. | +2.874 |
the | +2.820 |
a | +2.649 |
Neg logit contributions | |
lor | -5.690 |
ocol | -5.615 |
umm | -5.567 |
former | -5.567 |
rol | -5.564 |
Token | the |
Token ID | 262 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.601 |
, | +1.591 |
. | +1.410 |
the | +1.216 |
a | +1.010 |
Neg logit contributions | |
lor | -7.244 |
former | -7.150 |
ocol | -7.140 |
umm | -7.100 |
rol | -7.005 |
Token | talking |
Token ID | 3375 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.889 |
, | +3.845 |
. | +3.712 |
the | +3.687 |
a | +3.450 |
Neg logit contributions | |
lor | -5.000 |
former | -4.889 |
rol | -4.812 |
umm | -4.795 |
osity | -4.775 |
Token | , |
Token ID | 11 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | you |
Token ID | 345 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.403 |
and | +3.402 |
. | +3.289 |
the | +3.217 |
a | +3.026 |
Neg logit contributions | |
lor | -5.435 |
former | -5.294 |
umm | -5.283 |
rol | -5.268 |
osity | -5.241 |
Token | talking |
Token ID | 3375 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.889 |
, | +3.845 |
. | +3.712 |
the | +3.687 |
a | +3.450 |
Neg logit contributions | |
lor | -5.000 |
former | -4.889 |
rol | -4.812 |
umm | -4.795 |
osity | -4.775 |
Token | , |
Token ID | 11 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | , |
Token ID | 11 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +2.924 |
and | +2.916 |
. | +2.766 |
the | +2.752 |
a | +2.514 |
Neg logit contributions | |
lor | -5.960 |
former | -5.833 |
umm | -5.779 |
rol | -5.761 |
osity | -5.744 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.859 |
and | +3.838 |
. | +3.756 |
the | +3.647 |
a | +3.443 |
Neg logit contributions | |
lor | -4.970 |
former | -4.924 |
umm | -4.866 |
osity | -4.805 |
ocol | -4.792 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.420 |
, | +1.408 |
. | +1.235 |
the | +1.167 |
a | +0.963 |
Neg logit contributions | |
lor | -7.544 |
former | -7.334 |
rol | -7.314 |
umm | -7.280 |
bek | -7.252 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.836 |
, | +3.819 |
. | +3.678 |
the | +3.609 |
a | +3.390 |
Neg logit contributions | |
lor | -5.197 |
former | -5.012 |
umm | -5.005 |
bek | -4.980 |
rol | -4.972 |
Token | went |
Token ID | 1816 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.109 |
and | +3.089 |
. | +3.005 |
the | +2.944 |
a | +2.723 |
Neg logit contributions | |
lor | -5.777 |
former | -5.598 |
rol | -5.569 |
umm | -5.566 |
bek | -5.528 |
Token | to |
Token ID | 284 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.942 |
and | +1.942 |
. | +1.795 |
the | +1.736 |
a | +1.526 |
Neg logit contributions | |
lor | -6.940 |
rol | -6.788 |
former | -6.782 |
umm | -6.727 |
osity | -6.698 |
Token | his |
Token ID | 465 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.454 |
, | +2.446 |
. | +2.284 |
the | +2.091 |
a | +1.927 |
Neg logit contributions | |
lor | -6.377 |
former | -6.332 |
ocol | -6.251 |
umm | -6.214 |
rol | -6.212 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.927 |
, | +3.923 |
. | +3.785 |
the | +3.732 |
a | +3.500 |
Neg logit contributions | |
former | -4.933 |
lor | -4.929 |
umm | -4.840 |
arians | -4.740 |
bek | -4.713 |
Token | and |
Token ID | 290 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +1.251 |
and | +1.242 |
the | +1.146 |
. | +1.099 |
a | +0.910 |
Neg logit contributions | |
lor | -7.614 |
former | -7.463 |
umm | -7.392 |
rol | -7.332 |
arians | -7.284 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.741 |
and | +3.739 |
. | +3.610 |
the | +3.482 |
a | +3.267 |
Neg logit contributions | |
lor | -5.150 |
former | -5.043 |
bek | -4.937 |
rol | -4.933 |
umm | -4.906 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token |
|
Token ID | 198 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.138 |
, | +3.125 |
. | +2.959 |
the | +2.890 |
a | +2.665 |
Neg logit contributions | |
lor | -5.817 |
umm | -5.684 |
former | -5.679 |
rol | -5.612 |
osity | -5.588 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +0.454 |
and | +0.454 |
the | +0.363 |
. | +0.287 |
a | +0.196 |
Neg logit contributions | |
umm | -8.109 |
lor | -8.097 |
ocol | -8.027 |
rol | -8.004 |
osity | -7.979 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.237 |
, | +2.226 |
the | +2.109 |
. | +2.094 |
a | +1.873 |
Neg logit contributions | |
lor | -6.601 |
umm | -6.462 |
former | -6.449 |
rol | -6.374 |
ocol | -6.346 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | The |
Token ID | 383 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.233 |
, | +3.208 |
. | +3.076 |
the | +2.969 |
a | +2.780 |
Neg logit contributions | |
lor | -5.627 |
former | -5.524 |
umm | -5.457 |
ocol | -5.443 |
rol | -5.434 |
Token | table |
Token ID | 3084 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.334 |
, | +4.333 |
. | +4.181 |
the | +4.109 |
a | +3.877 |
Neg logit contributions | |
lor | -4.540 |
former | -4.481 |
umm | -4.474 |
ocol | -4.406 |
bek | -4.354 |
Token | did |
Token ID | 750 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.950 |
, | +3.941 |
. | +3.818 |
the | +3.785 |
a | +3.556 |
Neg logit contributions | |
lor | -4.924 |
umm | -4.759 |
former | -4.749 |
rol | -4.722 |
ocol | -4.663 |
Token | not |
Token ID | 407 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +2.348 |
, | +2.322 |
. | +2.181 |
the | +2.133 |
a | +1.897 |
Neg logit contributions | |
lor | -6.513 |
former | -6.411 |
umm | -6.291 |
ocol | -6.275 |
rol | -6.271 |
Token | say |
Token ID | 910 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.039 |
, | +4.029 |
. | +3.873 |
the | +3.848 |
a | +3.604 |
Neg logit contributions | |
lor | -4.751 |
former | -4.710 |
umm | -4.689 |
ocol | -4.659 |
osity | -4.635 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +4.267 |
, | +4.164 |
. | +4.051 |
the | +3.976 |
a | +3.751 |
Neg logit contributions | |
lor | -4.715 |
former | -4.478 |
umm | -4.477 |
ocol | -4.463 |
osity | -4.461 |
Token | either |
Token ID | 2035 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +1.919 |
, | +1.899 |
the | +1.740 |
. | +1.736 |
a | +1.543 |
Neg logit contributions | |
lor | -6.901 |
former | -6.756 |
umm | -6.726 |
rol | -6.702 |
osity | -6.698 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +0.915 |
, | +0.885 |
the | +0.763 |
. | +0.730 |
a | +0.560 |
Neg logit contributions | |
lor | -7.906 |
umm | -7.741 |
rol | -7.698 |
former | -7.692 |
osity | -7.687 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
and | +3.040 |
, | +3.034 |
. | +2.879 |
the | +2.801 |
a | +2.581 |
Neg logit contributions | |
lor | -5.924 |
former | -5.777 |
umm | -5.745 |
rol | -5.706 |
osity | -5.679 |
Token | was |
Token ID | 373 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.158 |
and | +3.137 |
. | +3.044 |
the | +2.981 |
a | +2.760 |
Neg logit contributions | |
lor | -5.722 |
former | -5.575 |
umm | -5.536 |
rol | -5.517 |
bek | -5.474 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.24e+01 |
Pos logit contributions | |
, | +3.785 |
and | +3.776 |
. | +3.633 |
the | +3.529 |
a | +3.266 |
Neg logit contributions | |
lor | -5.072 |
former | -5.025 |
rol | -4.952 |
umm | -4.904 |
ocol | -4.890 |