Token | lie |
Token ID | 6486 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
at | +30.945 |
, | +30.939 |
in | +30.512 |
and | +30.282 |
with | +29.792 |
Neg logit contributions | |
exting | -9.370 |
龍� | -7.777 |
| -7.719 |
� | -7.697 |
� | -7.668 |
Token | � |
Token ID | 447 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
S | +31.739 |
J | +30.822 |
E | +30.800 |
Super | +30.693 |
R | +30.648 |
Neg logit contributions | |
exting | -3.130 |
perpetrated | -2.976 |
� | -2.761 |
� | -2.575 |
teasp | -2.463 |
Token | � |
Token ID | 251 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
the | +31.550 |
, | +31.483 |
( | +31.400 |
' | +30.993 |
in | +30.794 |
Neg logit contributions | |
� | -6.849 |
�� | -6.664 |
� | -5.391 |
�� | -5.248 |
�� | -4.574 |
Token | that |
Token ID | 326 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
control | +22.897 |
- | +22.677 |
stuff | +22.346 |
/ | +22.341 |
' | +22.287 |
Neg logit contributions | |
� | -15.218 |
RandomRedditor | -15.192 |
� | -15.102 |
| -15.093 |
| -15.092 |
Token | was |
Token ID | 373 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
. | +31.386 |
- | +30.832 |
( | +30.378 |
and | +29.859 |
/ | +29.510 |
Neg logit contributions | |
Palestin | -9.372 |
cumbers | -8.904 |
undermin | -8.681 |
millenn | -7.463 |
misunder | -6.193 |
Token | used |
Token ID | 973 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
- | +35.488 |
and | +34.600 |
( | +34.245 |
( | +34.219 |
. | +33.672 |
Neg logit contributions | |
perpetrated | -3.239 |
exting | -0.587 |
��� | -0.430 |
untrue | -0.030 |
unworthy | +0.141 |
Token | as |
Token ID | 355 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
- | +17.867 |
G | +17.713 |
C | +17.509 |
P | +17.286 |
( | +17.207 |
Neg logit contributions | |
exting | -16.916 |
eleph | -16.279 |
embedreportprint | -15.206 |
� | -15.162 |
� | -15.137 |
Token | a |
Token ID | 257 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
. | +32.940 |
, | +31.933 |
and | +30.932 |
+ | +30.734 |
( | +30.546 |
Neg logit contributions | |
PDATE | -3.987 |
| -3.871 |
� | -3.770 |
| -3.765 |
| -3.752 |
Token | pretext |
Token ID | 35097 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
, | +38.871 |
and | +38.061 |
. | +37.964 |
at | +37.463 |
with | +37.334 |
Neg logit contributions | |
pretext | -0.855 |
exting | +0.694 |
� | +2.646 |
| +2.715 |
cumbers | +2.722 |
Token | for |
Token ID | 329 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
, | +7.601 |
the | +7.544 |
and | +7.082 |
a | +6.982 |
( | +6.611 |
Neg logit contributions | |
RandomRedditor | -19.965 |
| -19.960 |
| -19.949 |
� | -19.947 |
� | -19.922 |
Token | the |
Token ID | 262 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
. | +36.754 |
, | +36.378 |
- | +34.788 |
and | +34.585 |
/ | +34.558 |
Neg logit contributions | |
persecut | -5.315 |
Palestin | -4.737 |
exting | -3.959 |
repression | -3.178 |
assass | -3.054 |
Token | to |
Token ID | 284 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
to | +6.476 |
, | +5.528 |
in | +4.690 |
and | +4.681 |
the | +4.446 |
Neg logit contributions | |
| -17.702 |
| -17.696 |
| -17.692 |
� | -17.691 |
RandomRedditor | -17.691 |
Token | divide |
Token ID | 14083 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
. | +32.802 |
and | +32.293 |
, | +32.141 |
of | +31.445 |
- | +31.349 |
Neg logit contributions | |
consolidate | -2.741 |
undermine | -2.168 |
discredit | -2.115 |
weaken | -2.080 |
intimidate | -1.741 |
Token | , |
Token ID | 11 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
| +22.668 |
for | +21.991 |
: | +21.679 |
. | +21.637 |
to | +21.277 |
Neg logit contributions | |
aditional | -10.317 |
� | -9.989 |
citiz | -9.928 |
practition | -9.821 |
� | -8.909 |
Token | destabil |
Token ID | 27397 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
, | +37.728 |
. | +36.781 |
: | +36.498 |
- | +35.450 |
Made | +34.815 |
Neg logit contributions | |
weaken | -1.460 |
discredit | +0.031 |
intimidate | +0.040 |
degrade | +0.209 |
infiltrate | +0.775 |
Token | ize |
Token ID | 1096 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
... | +40.261 |
a | +39.723 |
" | +39.631 |
- | +39.351 |
on | +39.301 |
Neg logit contributions | |
ize | -0.006 |
IZE | +1.190 |
strate | +5.239 |
ise | +5.246 |
imize | +5.372 |
Token | , |
Token ID | 11 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
in | +7.188 |
. | +7.028 |
to | +6.901 |
, | +6.784 |
the | +6.769 |
Neg logit contributions | |
� | -19.351 |
| -19.339 |
� | -19.338 |
RandomRedditor | -19.329 |
| -19.327 |
Token | and |
Token ID | 290 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
. | +28.627 |
: | +28.144 |
, | +26.969 |
P | +26.482 |
| +26.399 |
Neg logit contributions | |
exting | -9.179 |
teasp | -6.814 |
� | -6.194 |
| -6.188 |
pione | -6.093 |
Token | demoral |
Token ID | 49077 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
Fresh | +31.616 |
The | +31.573 |
Canary | +31.571 |
P | +31.408 |
On | +31.178 |
Neg logit contributions | |
topple | -2.778 |
intimidate | -2.234 |
weaken | -1.646 |
assassinate | -1.572 |
degrade | -1.504 |
Token | ize |
Token ID | 1096 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
, | +14.454 |
and | +14.066 |
in | +13.604 |
the | +13.576 |
to | +13.118 |
Neg logit contributions | |
� | -10.931 |
RandomRedditor | -10.926 |
� | -10.918 |
| -10.911 |
| -10.902 |
Token | its |
Token ID | 663 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
I | +28.320 |
QC | +27.992 |
show | +27.403 |
- | +27.334 |
| +27.315 |
Neg logit contributions | |
adversaries | -5.509 |
citiz | -4.401 |
democracies | -3.924 |
millenn | -3.611 |
dissidents | -2.905 |
Token | geopolitical |
Token ID | 35493 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
. | +32.960 |
, | +32.953 |
: | +31.749 |
the | +31.567 |
| +31.357 |
Neg logit contributions | |
adversaries | -2.236 |
millenn | -0.604 |
populace | -0.526 |
citiz | -0.166 |
adversary | +0.111 |
Token | , |
Token ID | 11 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
P | +37.221 |
N | +36.835 |
A | +36.818 |
C | +36.668 |
Experiment | +36.482 |
Neg logit contributions | |
denouncing | -2.834 |
condem | -1.521 |
condemning | -0.572 |
criticizing | +0.937 |
exting | +1.228 |
Token | declaring |
Token ID | 18684 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
, | +42.175 |
- | +42.058 |
. | +41.032 |
/ | +39.967 |
( | +38.650 |
Neg logit contributions | |
denouncing | -3.407 |
condem | -1.066 |
exting | -1.065 |
accusing | -0.437 |
condemning | -0.279 |
Token | that |
Token ID | 326 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
and | +21.266 |
- | +20.842 |
. | +20.545 |
& | +20.129 |
but | +19.805 |
Neg logit contributions | |
senal | -11.782 |
millenn | -10.843 |
ThumbnailImage | -10.534 |
� | -10.442 |
exting | -9.492 |
Token | all |
Token ID | 477 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
- | +32.005 |
and | +31.630 |
( | +31.228 |
& | +30.707 |
. | +30.406 |
Neg logit contributions | |
Palestin | -8.453 |
millenn | -5.936 |
senal | -4.541 |
Tehran | -4.151 |
Iranians | -3.619 |
Token | protesters |
Token ID | 9584 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
, | +33.172 |
. | +32.855 |
… | +32.796 |
( | +31.750 |
and | +31.739 |
Neg logit contributions | |
Palestin | -3.645 |
millenn | -3.383 |
zbollah | -3.181 |
Iranians | -3.158 |
mosqu | -2.717 |
Token | would |
Token ID | 561 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
Mystery | +25.513 |
Complex | +25.288 |
Open | +24.909 |
Odyssey | +24.350 |
R | +24.312 |
Neg logit contributions | |
besie | -6.276 |
detained | -5.220 |
belonged | -5.116 |
exting | -5.089 |
risked | -4.995 |
Token | be |
Token ID | 307 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
Creat | +27.899 |
Worth | +27.860 |
Dickens | +27.650 |
Third | +27.371 |
New | +27.229 |
Neg logit contributions | |
disperse | -6.824 |
evacuate | -4.683 |
retaliate | -4.228 |
exting | -4.197 |
obey | -4.093 |
Token | treated |
Token ID | 5716 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
which | +29.896 |
, | +29.746 |
. | +29.198 |
that | +28.672 |
and | +28.624 |
Neg logit contributions | |
exting | -7.607 |
� | -4.522 |
oreAnd | -4.503 |
��� | -4.054 |
� | -3.210 |
Token | as |
Token ID | 355 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
- | +28.066 |
Back | +27.327 |
Research | +27.246 |
, | +26.939 |
Elm | +26.845 |
Neg logit contributions | |
exting | -8.787 |
pione | -7.112 |
� | -5.463 |
rawdownload | -5.141 |
| -5.136 |
Token | Israeli |
Token ID | 6085 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
. | +31.970 |
, | +31.667 |
& | +30.741 |
and | +30.510 |
( | +30.329 |
Neg logit contributions | |
Palestin | -4.395 |
undermin | -3.478 |
gobl | -3.354 |
ikuman | -3.214 |
combatants | -2.873 |
Token | spies |
Token ID | 28801 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
the | +27.131 |
a | +26.411 |
I | +25.357 |
( | +25.353 |
that | +25.191 |
Neg logit contributions | |
practition | -6.137 |
citiz | -6.033 |
isSpecial | -5.139 |
exting | -4.910 |
undermin | -4.807 |
Token | that |
Token ID | 326 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
and | +12.705 |
- | +11.599 |
. | +11.544 |
| +11.366 |
( | +11.178 |
Neg logit contributions | |
� | -16.128 |
|