Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | under |
Token ID | 739 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.006 |
and | +2.967 |
. | +2.739 |
the | +2.702 |
a | +2.475 |
Neg logit contributions | |
lor | -5.547 |
umm | -5.465 |
former | -5.434 |
rol | -5.372 |
ocol | -5.369 |
Token | the |
Token ID | 262 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.514 |
and | +1.489 |
. | +1.278 |
the | +1.159 |
a | +0.913 |
Neg logit contributions | |
lor | -7.052 |
umm | -6.958 |
former | -6.957 |
ocol | -6.863 |
rol | -6.813 |
Token | covers |
Token ID | 8698 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.448 |
and | +4.399 |
. | +4.203 |
the | +4.197 |
a | +3.960 |
Neg logit contributions | |
lor | -4.120 |
umm | -4.043 |
former | -3.986 |
ocol | -3.898 |
rol | -3.884 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.757 |
and | +0.723 |
the | +0.507 |
. | +0.491 |
a | +0.280 |
Neg logit contributions | |
lor | -7.826 |
umm | -7.705 |
former | -7.635 |
rol | -7.611 |
arians | -7.538 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | under |
Token ID | 739 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.006 |
and | +2.967 |
. | +2.739 |
the | +2.702 |
a | +2.475 |
Neg logit contributions | |
lor | -5.547 |
umm | -5.465 |
former | -5.434 |
rol | -5.372 |
ocol | -5.369 |
Token | the |
Token ID | 262 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.514 |
and | +1.489 |
. | +1.278 |
the | +1.159 |
a | +0.913 |
Neg logit contributions | |
lor | -7.052 |
umm | -6.958 |
former | -6.957 |
ocol | -6.863 |
rol | -6.813 |
Token | covers |
Token ID | 8698 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.448 |
and | +4.399 |
. | +4.203 |
the | +4.197 |
a | +3.960 |
Neg logit contributions | |
lor | -4.120 |
umm | -4.043 |
former | -3.986 |
ocol | -3.898 |
rol | -3.884 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | under |
Token ID | 739 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.006 |
and | +2.967 |
. | +2.739 |
the | +2.702 |
a | +2.475 |
Neg logit contributions | |
lor | -5.547 |
umm | -5.465 |
former | -5.434 |
rol | -5.372 |
ocol | -5.369 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | under |
Token ID | 739 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.006 |
and | +2.967 |
. | +2.739 |
the | +2.702 |
a | +2.475 |
Neg logit contributions | |
lor | -5.547 |
umm | -5.465 |
former | -5.434 |
rol | -5.372 |
ocol | -5.369 |
Token | the |
Token ID | 262 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.514 |
and | +1.489 |
. | +1.278 |
the | +1.159 |
a | +0.913 |
Neg logit contributions | |
lor | -7.052 |
umm | -6.958 |
former | -6.957 |
ocol | -6.863 |
rol | -6.813 |
Token | talking |
Token ID | 3375 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +3.675 |
, | +3.671 |
. | +3.463 |
the | +3.457 |
a | +3.188 |
Neg logit contributions | |
lor | -4.856 |
former | -4.759 |
umm | -4.707 |
rol | -4.649 |
arians | -4.630 |
Token | , |
Token ID | 11 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.796 |
and | +2.754 |
the | +2.569 |
. | +2.566 |
a | +2.298 |
Neg logit contributions | |
lor | -5.767 |
former | -5.656 |
umm | -5.639 |
rol | -5.551 |
arians | -5.530 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.722 |
and | +3.672 |
. | +3.538 |
the | +3.462 |
a | +3.220 |
Neg logit contributions | |
lor | -4.798 |
former | -4.750 |
umm | -4.733 |
arians | -4.617 |
rol | -4.593 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | you |
Token ID | 345 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.248 |
and | +3.209 |
. | +3.060 |
the | +3.014 |
a | +2.789 |
Neg logit contributions | |
lor | -5.253 |
umm | -5.143 |
former | -5.128 |
arians | -5.101 |
rol | -5.069 |
Token | talking |
Token ID | 3375 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +3.675 |
, | +3.671 |
. | +3.463 |
the | +3.457 |
a | +3.188 |
Neg logit contributions | |
lor | -4.856 |
former | -4.759 |
umm | -4.707 |
rol | -4.649 |
arians | -4.630 |
Token | , |
Token ID | 11 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.796 |
and | +2.754 |
the | +2.569 |
. | +2.566 |
a | +2.298 |
Neg logit contributions | |
lor | -5.767 |
former | -5.656 |
umm | -5.639 |
rol | -5.551 |
arians | -5.530 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.722 |
and | +3.672 |
. | +3.538 |
the | +3.462 |
a | +3.220 |
Neg logit contributions | |
lor | -4.798 |
former | -4.750 |
umm | -4.733 |
arians | -4.617 |
rol | -4.593 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | , |
Token ID | 11 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.796 |
and | +2.754 |
the | +2.569 |
. | +2.566 |
a | +2.298 |
Neg logit contributions | |
lor | -5.767 |
former | -5.656 |
umm | -5.639 |
rol | -5.551 |
arians | -5.530 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.722 |
and | +3.672 |
. | +3.538 |
the | +3.462 |
a | +3.220 |
Neg logit contributions | |
lor | -4.798 |
former | -4.750 |
umm | -4.733 |
arians | -4.617 |
rol | -4.593 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.722 |
and | +3.672 |
. | +3.538 |
the | +3.462 |
a | +3.220 |
Neg logit contributions | |
lor | -4.798 |
former | -4.750 |
umm | -4.733 |
arians | -4.617 |
rol | -4.593 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | under |
Token ID | 739 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.006 |
and | +2.967 |
. | +2.739 |
the | +2.702 |
a | +2.475 |
Neg logit contributions | |
lor | -5.547 |
umm | -5.465 |
former | -5.434 |
rol | -5.372 |
ocol | -5.369 |
Token | the |
Token ID | 262 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.514 |
and | +1.489 |
. | +1.278 |
the | +1.159 |
a | +0.913 |
Neg logit contributions | |
lor | -7.052 |
umm | -6.958 |
former | -6.957 |
ocol | -6.863 |
rol | -6.813 |
Token | covers |
Token ID | 8698 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.448 |
and | +4.399 |
. | +4.203 |
the | +4.197 |
a | +3.960 |
Neg logit contributions | |
lor | -4.120 |
umm | -4.043 |
former | -3.986 |
ocol | -3.898 |
rol | -3.884 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.757 |
and | +0.723 |
the | +0.507 |
. | +0.491 |
a | +0.280 |
Neg logit contributions | |
lor | -7.826 |
umm | -7.705 |
former | -7.635 |
rol | -7.611 |
arians | -7.538 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | under |
Token ID | 739 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.006 |
and | +2.967 |
. | +2.739 |
the | +2.702 |
a | +2.475 |
Neg logit contributions | |
lor | -5.547 |
umm | -5.465 |
former | -5.434 |
rol | -5.372 |
ocol | -5.369 |
Token | the |
Token ID | 262 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.514 |
and | +1.489 |
. | +1.278 |
the | +1.159 |
a | +0.913 |
Neg logit contributions | |
lor | -7.052 |
umm | -6.958 |
former | -6.957 |
ocol | -6.863 |
rol | -6.813 |
Token | covers |
Token ID | 8698 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.448 |
and | +4.399 |
. | +4.203 |
the | +4.197 |
a | +3.960 |
Neg logit contributions | |
lor | -4.120 |
umm | -4.043 |
former | -3.986 |
ocol | -3.898 |
rol | -3.884 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | under |
Token ID | 739 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.006 |
and | +2.967 |
. | +2.739 |
the | +2.702 |
a | +2.475 |
Neg logit contributions | |
lor | -5.547 |
umm | -5.465 |
former | -5.434 |
rol | -5.372 |
ocol | -5.369 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | under |
Token ID | 739 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.006 |
and | +2.967 |
. | +2.739 |
the | +2.702 |
a | +2.475 |
Neg logit contributions | |
lor | -5.547 |
umm | -5.465 |
former | -5.434 |
rol | -5.372 |
ocol | -5.369 |
Token | the |
Token ID | 262 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.514 |
and | +1.489 |
. | +1.278 |
the | +1.159 |
a | +0.913 |
Neg logit contributions | |
lor | -7.052 |
umm | -6.958 |
former | -6.957 |
ocol | -6.863 |
rol | -6.813 |
Token | talking |
Token ID | 3375 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +3.675 |
, | +3.671 |
. | +3.463 |
the | +3.457 |
a | +3.188 |
Neg logit contributions | |
lor | -4.856 |
former | -4.759 |
umm | -4.707 |
rol | -4.649 |
arians | -4.630 |
Token | , |
Token ID | 11 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.796 |
and | +2.754 |
the | +2.569 |
. | +2.566 |
a | +2.298 |
Neg logit contributions | |
lor | -5.767 |
former | -5.656 |
umm | -5.639 |
rol | -5.551 |
arians | -5.530 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.722 |
and | +3.672 |
. | +3.538 |
the | +3.462 |
a | +3.220 |
Neg logit contributions | |
lor | -4.798 |
former | -4.750 |
umm | -4.733 |
arians | -4.617 |
rol | -4.593 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | you |
Token ID | 345 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.248 |
and | +3.209 |
. | +3.060 |
the | +3.014 |
a | +2.789 |
Neg logit contributions | |
lor | -5.253 |
umm | -5.143 |
former | -5.128 |
arians | -5.101 |
rol | -5.069 |
Token | talking |
Token ID | 3375 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +3.675 |
, | +3.671 |
. | +3.463 |
the | +3.457 |
a | +3.188 |
Neg logit contributions | |
lor | -4.856 |
former | -4.759 |
umm | -4.707 |
rol | -4.649 |
arians | -4.630 |
Token | , |
Token ID | 11 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.796 |
and | +2.754 |
the | +2.569 |
. | +2.566 |
a | +2.298 |
Neg logit contributions | |
lor | -5.767 |
former | -5.656 |
umm | -5.639 |
rol | -5.551 |
arians | -5.530 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.722 |
and | +3.672 |
. | +3.538 |
the | +3.462 |
a | +3.220 |
Neg logit contributions | |
lor | -4.798 |
former | -4.750 |
umm | -4.733 |
arians | -4.617 |
rol | -4.593 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | , |
Token ID | 11 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.796 |
and | +2.754 |
the | +2.569 |
. | +2.566 |
a | +2.298 |
Neg logit contributions | |
lor | -5.767 |
former | -5.656 |
umm | -5.639 |
rol | -5.551 |
arians | -5.530 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.722 |
and | +3.672 |
. | +3.538 |
the | +3.462 |
a | +3.220 |
Neg logit contributions | |
lor | -4.798 |
former | -4.750 |
umm | -4.733 |
arians | -4.617 |
rol | -4.593 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.722 |
and | +3.672 |
. | +3.538 |
the | +3.462 |
a | +3.220 |
Neg logit contributions | |
lor | -4.798 |
former | -4.750 |
umm | -4.733 |
arians | -4.617 |
rol | -4.593 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.384 |
and | +1.358 |
. | +1.141 |
the | +1.098 |
a | +0.856 |
Neg logit contributions | |
lor | -7.241 |
former | -7.059 |
umm | -7.042 |
rol | -6.998 |
arians | -6.933 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.676 |
and | +3.657 |
. | +3.457 |
the | +3.415 |
a | +3.160 |
Neg logit contributions | |
lor | -5.016 |
umm | -4.853 |
former | -4.835 |
rol | -4.764 |
arians | -4.750 |
Token | went |
Token ID | 1816 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.975 |
and | +2.915 |
. | +2.796 |
the | +2.761 |
a | +2.505 |
Neg logit contributions | |
lor | -5.578 |
former | -5.414 |
umm | -5.407 |
arians | -5.363 |
rol | -5.351 |
Token | to |
Token ID | 284 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.864 |
and | +1.832 |
. | +1.647 |
the | +1.609 |
a | +1.361 |
Neg logit contributions | |
lor | -6.723 |
former | -6.589 |
umm | -6.583 |
rol | -6.538 |
arians | -6.489 |
Token | his |
Token ID | 465 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.339 |
and | +2.311 |
. | +2.108 |
the | +1.968 |
a | +1.757 |
Neg logit contributions | |
lor | -6.191 |
former | -6.142 |
umm | -6.080 |
ocol | -6.007 |
rol | -6.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.788 |
and | +3.758 |
. | +3.576 |
the | +3.543 |
a | +3.280 |
Neg logit contributions | |
lor | -4.768 |
former | -4.751 |
umm | -4.712 |
arians | -4.597 |
rol | -4.503 |
Token | and |
Token ID | 290 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.168 |
and | +1.130 |
the | +0.980 |
. | +0.948 |
a | +0.715 |
Neg logit contributions | |
lor | -7.395 |
former | -7.265 |
umm | -7.249 |
arians | -7.126 |
rol | -7.125 |
Token | hid |
Token ID | 24519 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.581 |
and | +3.545 |
. | +3.374 |
the | +3.282 |
a | +3.031 |
Neg logit contributions | |
lor | -4.994 |
former | -4.898 |
umm | -4.815 |
rol | -4.762 |
arians | -4.753 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token |
|
Token ID | 198 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.049 |
and | +3.025 |
. | +2.815 |
the | +2.771 |
a | +2.513 |
Neg logit contributions | |
lor | -5.571 |
umm | -5.483 |
former | -5.450 |
rol | -5.350 |
arians | -5.328 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.493 |
and | +0.460 |
the | +0.310 |
. | +0.261 |
a | +0.090 |
Neg logit contributions | |
umm | -7.892 |
lor | -7.886 |
former | -7.776 |
rol | -7.738 |
ocol | -7.726 |
Token | ?" |
Token ID | 1701 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.125 |
and | +2.100 |
the | +1.940 |
. | +1.918 |
a | +1.672 |
Neg logit contributions | |
lor | -6.394 |
umm | -6.301 |
former | -6.262 |
rol | -6.156 |
arians | -6.150 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | The |
Token ID | 383 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.096 |
and | +3.083 |
. | +2.888 |
the | +2.812 |
a | +2.583 |
Neg logit contributions | |
lor | -5.426 |
former | -5.335 |
umm | -5.306 |
rol | -5.214 |
ocol | -5.202 |
Token | table |
Token ID | 3084 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +4.191 |
and | +4.157 |
. | +3.967 |
the | +3.920 |
a | +3.655 |
Neg logit contributions | |
lor | -4.365 |
umm | -4.332 |
former | -4.309 |
arians | -4.182 |
ocol | -4.181 |
Token | did |
Token ID | 750 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.748 |
and | +3.719 |
. | +3.547 |
the | +3.537 |
a | +3.274 |
Neg logit contributions | |
lor | -4.796 |
umm | -4.678 |
former | -4.641 |
rol | -4.575 |
arians | -4.532 |
Token | not |
Token ID | 407 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.360 |
and | +2.348 |
. | +2.144 |
the | +2.120 |
a | +1.850 |
Neg logit contributions | |
lor | -6.159 |
former | -6.070 |
umm | -5.991 |
arians | -5.910 |
rol | -5.903 |
Token | say |
Token ID | 910 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.854 |
and | +3.828 |
. | +3.627 |
the | +3.619 |
a | +3.344 |
Neg logit contributions | |
lor | -4.635 |
umm | -4.604 |
former | -4.591 |
ocol | -4.482 |
rol | -4.473 |
Token | anything |
Token ID | 1997 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
and | +4.112 |
, | +4.068 |
. | +3.875 |
the | +3.826 |
a | +3.568 |
Neg logit contributions | |
lor | -4.501 |
umm | -4.334 |
former | -4.306 |
ocol | -4.222 |
rol | -4.221 |
Token | either |
Token ID | 2035 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +1.831 |
and | +1.812 |
the | +1.610 |
. | +1.600 |
a | +1.372 |
Neg logit contributions | |
lor | -6.679 |
umm | -6.561 |
former | -6.553 |
rol | -6.463 |
arians | -6.462 |
Token | . |
Token ID | 13 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +0.840 |
and | +0.832 |
the | +0.658 |
. | +0.612 |
a | +0.418 |
Neg logit contributions | |
lor | -7.641 |
umm | -7.525 |
former | -7.453 |
rol | -7.417 |
arians | -7.382 |
Token | Tom |
Token ID | 4186 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +2.925 |
and | +2.895 |
. | +2.698 |
the | +2.646 |
a | +2.391 |
Neg logit contributions | |
lor | -5.703 |
umm | -5.577 |
former | -5.575 |
rol | -5.471 |
arians | -5.450 |
Token | was |
Token ID | 373 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.018 |
and | +2.954 |
. | +2.830 |
the | +2.794 |
a | +2.538 |
Neg logit contributions | |
lor | -5.525 |
former | -5.394 |
umm | -5.376 |
arians | -5.314 |
rol | -5.301 |
Token | scared |
Token ID | 12008 |
Feature activation | -4.33e+01 |
Pos logit contributions | |
, | +3.665 |
and | +3.627 |
. | +3.444 |
the | +3.378 |
a | +3.096 |
Neg logit contributions | |
lor | -4.904 |
former | -4.839 |
umm | -4.794 |
rol | -4.738 |
arians | -4.690 |