Token | It |
Token ID | 632 |
Feature activation | +1.50e-04 |
Pos logit contributions | |
enny | +0.001 |
uddy | +0.001 |
unn | +0.001 |
� | +0.001 |
driver | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
away | -0.001 |
things | -0.001 |
Token | 's |
Token ID | 338 |
Feature activation | +4.08e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
things | +0.000 |
everything | +0.000 |
Neg logit contributions | |
enny | -0.000 |
oured | -0.000 |
seek | -0.000 |
ipop | -0.000 |
uddy | -0.000 |
Token | important |
Token ID | 1593 |
Feature activation | -8.03e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
things | +0.004 |
away | +0.004 |
Neg logit contributions | |
enny | -0.007 |
ache | -0.007 |
drop | -0.007 |
unn | -0.007 |
oured | -0.007 |
Token | to |
Token ID | 284 |
Feature activation | -8.84e-04 |
Pos logit contributions | |
enny | +0.019 |
opus | +0.018 |
oured | +0.018 |
uddy | +0.018 |
� | +0.018 |
Neg logit contributions | |
its | -0.009 |
their | -0.008 |
them | -0.008 |
things | -0.008 |
her | -0.007 |
Token | stay |
Token ID | 2652 |
Feature activation | +3.64e-04 |
Pos logit contributions | |
enny | +0.002 |
oured | +0.002 |
driver | +0.002 |
uddy | +0.002 |
ipop | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
everything | -0.001 |
Token | hyd |
Token ID | 7409 |
Feature activation | +5.33e-02 |
Pos logit contributions | |
its | +0.000 |
them | +0.000 |
their | +0.000 |
fog | +0.000 |
Wow | +0.000 |
Neg logit contributions | |
enny | -0.001 |
ache | -0.001 |
oured | -0.001 |
coat | -0.001 |
ipop | -0.001 |
Token | rated |
Token ID | 4111 |
Feature activation | +6.52e-03 |
Pos logit contributions | |
its | +0.100 |
their | +0.088 |
them | +0.080 |
fog | +0.079 |
it | +0.078 |
Neg logit contributions | |
ache | -0.076 |
enny | -0.075 |
ave | -0.073 |
oured | -0.073 |
drop | -0.072 |
Token | and |
Token ID | 290 |
Feature activation | -7.45e-04 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
things | +0.005 |
her | +0.005 |
Neg logit contributions | |
enny | -0.015 |
oured | -0.014 |
ipop | -0.014 |
drop | -0.014 |
uddy | -0.014 |
Token | healthy |
Token ID | 5448 |
Feature activation | +2.20e-03 |
Pos logit contributions | |
enny | +0.001 |
oured | +0.001 |
ache | +0.001 |
drop | +0.001 |
unn | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
everything | -0.001 |
Token | ," |
Token ID | 553 |
Feature activation | -6.20e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
things | +0.001 |
her | +0.001 |
Neg logit contributions | |
enny | -0.005 |
oured | -0.005 |
uddy | -0.005 |
drop | -0.005 |
driver | -0.005 |
Token | mom |
Token ID | 1995 |
Feature activation | +8.41e-03 |
Pos logit contributions | |
enny | +0.012 |
ipop | +0.012 |
ache | +0.012 |
uddy | +0.011 |
coach | +0.011 |
Neg logit contributions | |
its | -0.007 |
them | -0.006 |
away | -0.006 |
their | -0.005 |
fires | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -2.31e-03 |
Pos logit contributions | |
enny | +0.013 |
seek | +0.013 |
oured | +0.013 |
unn | +0.013 |
uddy | +0.013 |
Neg logit contributions | |
its | -0.007 |
their | -0.006 |
them | -0.006 |
things | -0.005 |
her | -0.005 |
Token | It |
Token ID | 632 |
Feature activation | +8.93e-04 |
Pos logit contributions | |
enny | +0.005 |
ache | +0.004 |
oured | +0.004 |
drop | +0.004 |
unn | +0.004 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
them | -0.002 |
things | -0.002 |
her | -0.002 |
Token | will |
Token ID | 481 |
Feature activation | -6.28e-04 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
it | +0.001 |
Neg logit contributions | |
enny | -0.002 |
seek | -0.002 |
oured | -0.002 |
uddy | -0.002 |
ipop | -0.002 |
Token | keep |
Token ID | 1394 |
Feature activation | -9.31e-03 |
Pos logit contributions | |
enny | +0.001 |
oured | +0.001 |
unn | +0.001 |
ipop | +0.001 |
uddy | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
everything | -0.001 |
Token | you |
Token ID | 345 |
Feature activation | +3.65e-03 |
Pos logit contributions | |
enny | +0.021 |
drop | +0.021 |
ache | +0.021 |
unn | +0.021 |
oured | +0.021 |
Neg logit contributions | |
its | -0.008 |
their | -0.006 |
them | -0.006 |
fog | -0.004 |
away | -0.004 |
Token | hyd |
Token ID | 7409 |
Feature activation | +5.17e-02 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
things | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.008 |
unn | -0.008 |
oured | -0.008 |
uddy | -0.008 |
drop | -0.008 |
Token | rated |
Token ID | 4111 |
Feature activation | +5.73e-03 |
Pos logit contributions | |
its | +0.096 |
their | +0.085 |
fog | +0.078 |
them | +0.078 |
things | +0.075 |
Neg logit contributions | |
ache | -0.074 |
enny | -0.074 |
oured | -0.072 |
ave | -0.071 |
drop | -0.070 |
Token | . |
Token ID | 13 |
Feature activation | -2.25e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
her | +0.003 |
Neg logit contributions | |
enny | -0.013 |
oured | -0.013 |
ache | -0.013 |
unn | -0.013 |
drop | -0.013 |
Token | You |
Token ID | 921 |
Feature activation | +3.71e-03 |
Pos logit contributions | |
enny | +0.004 |
oured | +0.004 |
unn | +0.004 |
drop | +0.004 |
ache | +0.004 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
them | -0.003 |
things | -0.002 |
everything | -0.002 |
Token | have |
Token ID | 423 |
Feature activation | -6.10e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
it | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.008 |
seek | -0.008 |
oured | -0.008 |
drop | -0.008 |
ipop | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | -1.44e-03 |
Pos logit contributions | |
uddy | +0.015 |
opus | +0.014 |
enny | +0.014 |
� | +0.014 |
drop | +0.014 |
Neg logit contributions | |
its | -0.009 |
their | -0.008 |
them | -0.007 |
it | -0.007 |
everything | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +1.03e-03 |
Pos logit contributions | |
its | +0.009 |
away | +0.006 |
their | +0.005 |
them | +0.005 |
south | +0.005 |
Neg logit contributions | |
driver | -0.028 |
enny | -0.028 |
chip | -0.027 |
drop | -0.027 |
oured | -0.027 |
Token | car |
Token ID | 1097 |
Feature activation | -5.78e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.001 |
them | +0.001 |
her | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.002 |
ache | -0.002 |
drop | -0.002 |
driver | -0.002 |
oured | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | -2.85e-03 |
Pos logit contributions | |
enny | +0.015 |
unn | +0.014 |
oured | +0.014 |
ipop | +0.014 |
opus | +0.014 |
Neg logit contributions | |
its | -0.005 |
their | -0.004 |
them | -0.004 |
things | -0.003 |
everything | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +8.79e-04 |
Pos logit contributions | |
enny | +0.007 |
oured | +0.006 |
unn | +0.006 |
ache | +0.006 |
drop | +0.006 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
things | -0.002 |
everything | -0.001 |
Token | fire |
Token ID | 2046 |
Feature activation | +7.73e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.002 |
oured | -0.002 |
unn | -0.002 |
ipop | -0.002 |
uddy | -0.002 |
Token | hyd |
Token ID | 7409 |
Feature activation | +5.16e-02 |
Pos logit contributions | |
its | +0.006 |
their | +0.006 |
them | +0.005 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.020 |
unn | -0.019 |
oured | -0.019 |
ipop | -0.018 |
olly | -0.018 |
Token | rant |
Token ID | 5250 |
Feature activation | +8.18e-03 |
Pos logit contributions | |
its | +0.099 |
her | +0.083 |
their | +0.082 |
fant | +0.080 |
it | +0.076 |
Neg logit contributions | |
ache | -0.068 |
drop | -0.068 |
oured | -0.067 |
ucker | -0.066 |
driver | -0.066 |
Token | . |
Token ID | 13 |
Feature activation | -2.94e-04 |
Pos logit contributions | |
its | +0.007 |
their | +0.005 |
them | +0.005 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.020 |
oured | -0.019 |
unn | -0.019 |
ache | -0.019 |
drop | -0.019 |
Token | They |
Token ID | 1119 |
Feature activation | +3.53e-03 |
Pos logit contributions | |
enny | +0.001 |
oured | +0.001 |
driver | +0.001 |
uddy | +0.001 |
unn | +0.001 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
things | -0.000 |
fog | -0.000 |
Token | take |
Token ID | 1011 |
Feature activation | -1.43e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
her | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.008 |
unn | -0.008 |
uddy | -0.007 |
seek | -0.007 |
va | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | +6.48e-04 |
Pos logit contributions | |
enny | +0.003 |
driver | +0.003 |
oured | +0.003 |
drop | +0.003 |
unn | +0.003 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
fog | -0.001 |
fant | -0.001 |
Token | car |
Token ID | 1097 |
Feature activation | -7.09e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
fog | +0.002 |
Neg logit contributions | |
enny | -0.004 |
oured | -0.004 |
unn | -0.004 |
olly | -0.004 |
seek | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -1.64e-03 |
Pos logit contributions | |
enny | +0.017 |
unn | +0.016 |
oured | +0.016 |
va | +0.016 |
scar | +0.016 |
Neg logit contributions | |
its | -0.009 |
their | -0.007 |
them | -0.007 |
things | -0.006 |
it | -0.006 |
Token | and |
Token ID | 290 |
Feature activation | -3.96e-04 |
Pos logit contributions | |
driver | +0.004 |
enny | +0.004 |
drop | +0.004 |
ache | +0.004 |
ipop | +0.004 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
away | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +1.92e-03 |
Pos logit contributions | |
enny | +0.001 |
drop | +0.001 |
driver | +0.001 |
ache | +0.001 |
ipop | +0.001 |
Neg logit contributions | |
its | -0.000 |
them | -0.000 |
their | -0.000 |
things | -0.000 |
away | -0.000 |
Token | fire |
Token ID | 2046 |
Feature activation | +5.70e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
everything | +0.002 |
Neg logit contributions | |
enny | -0.004 |
oured | -0.004 |
unn | -0.004 |
olly | -0.004 |
seek | -0.004 |
Token | hyd |
Token ID | 7409 |
Feature activation | +5.12e-02 |
Pos logit contributions | |
its | +0.007 |
their | +0.007 |
them | +0.006 |
things | +0.005 |
down | +0.005 |
Neg logit contributions | |
enny | -0.013 |
va | -0.012 |
olly | -0.012 |
oured | -0.012 |
seek | -0.012 |
Token | rant |
Token ID | 5250 |
Feature activation | +5.23e-03 |
Pos logit contributions | |
its | +0.098 |
their | +0.083 |
her | +0.083 |
fant | +0.082 |
fog | +0.076 |
Neg logit contributions | |
ache | -0.068 |
drop | -0.067 |
ucker | -0.065 |
oured | -0.065 |
driver | -0.065 |
Token | are |
Token ID | 389 |
Feature activation | +5.14e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.013 |
uddy | -0.012 |
unn | -0.012 |
oured | -0.012 |
ipop | -0.012 |
Token | wet |
Token ID | 9583 |
Feature activation | +4.52e-03 |
Pos logit contributions | |
its | +0.008 |
their | +0.007 |
them | +0.006 |
everything | +0.005 |
things | +0.005 |
Neg logit contributions | |
enny | -0.010 |
unn | -0.010 |
oured | -0.010 |
seek | -0.010 |
uddy | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | +1.91e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
her | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.010 |
ache | -0.010 |
drop | -0.010 |
driver | -0.010 |
unn | -0.010 |
Token | Lily |
Token ID | 20037 |
Feature activation | +1.37e-03 |
Pos logit contributions | |
its | +0.003 |
them | +0.002 |
their | +0.002 |
away | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.003 |
uddy | -0.003 |
� | -0.003 |
driver | -0.003 |
unn | -0.003 |
Token | hyd |
Token ID | 7409 |
Feature activation | +4.92e-02 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
down | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.007 |
unn | -0.007 |
oured | -0.007 |
olly | -0.006 |
va | -0.006 |
Token | rant |
Token ID | 5250 |
Feature activation | +2.73e-03 |
Pos logit contributions | |
its | +0.094 |
her | +0.084 |
fant | +0.083 |
their | +0.083 |
them | +0.076 |
Neg logit contributions | |
ache | -0.064 |
driver | -0.064 |
ave | -0.062 |
drop | -0.060 |
oured | -0.059 |
Token | . |
Token ID | 13 |
Feature activation | +3.13e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.006 |
oured | -0.006 |
ache | -0.006 |
drop | -0.006 |
unn | -0.006 |
Token | The |
Token ID | 383 |
Feature activation | -1.11e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
away | +0.003 |
Neg logit contributions | |
enny | -0.006 |
driver | -0.006 |
uddy | -0.005 |
� | -0.005 |
oured | -0.005 |
Token | fire |
Token ID | 2046 |
Feature activation | +4.56e-03 |
Pos logit contributions | |
enny | +0.002 |
oured | +0.002 |
unn | +0.002 |
seek | +0.002 |
ipop | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
everything | -0.001 |
Token | hyd |
Token ID | 7409 |
Feature activation | +5.10e-02 |
Pos logit contributions | |
its | +0.006 |
their | +0.006 |
them | +0.005 |
things | +0.005 |
fires | +0.005 |
Neg logit contributions | |
enny | -0.010 |
seek | -0.009 |
unn | -0.009 |
va | -0.009 |
olly | -0.009 |
Token | rant |
Token ID | 5250 |
Feature activation | +4.12e-03 |
Pos logit contributions | |
its | +0.097 |
fant | +0.086 |
her | +0.086 |
their | +0.084 |
fog | +0.077 |
Neg logit contributions | |
ache | -0.067 |
driver | -0.066 |
ave | -0.063 |
drop | -0.062 |
ucker | -0.062 |
Token | breaks |
Token ID | 9457 |
Feature activation | +4.38e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.009 |
unn | -0.008 |
uddy | -0.008 |
oured | -0.008 |
ipop | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +2.44e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
things | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.010 |
ache | -0.010 |
driver | -0.010 |
drop | -0.010 |
oured | -0.010 |
Token | Water |
Token ID | 5638 |
Feature activation | -2.66e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
away | +0.003 |
things | +0.003 |
Neg logit contributions | |
enny | -0.004 |
� | -0.004 |
driver | -0.004 |
uddy | -0.004 |
drop | -0.004 |
Token | spr |
Token ID | 7500 |
Feature activation | +4.99e-03 |
Pos logit contributions | |
enny | +0.006 |
seek | +0.005 |
unn | +0.005 |
oured | +0.005 |
va | +0.005 |
Neg logit contributions | |
its | -0.004 |
their | -0.003 |
them | -0.003 |
it | -0.003 |
everything | -0.003 |
Token | it |
Token ID | 340 |
Feature activation | -4.20e-04 |
Pos logit contributions | |
its | +0.010 |
their | +0.008 |
them | +0.008 |
things | +0.007 |
everything | +0.007 |
Neg logit contributions | |
enny | -0.016 |
oured | -0.016 |
ipop | -0.015 |
ache | -0.015 |
drop | -0.015 |
Token | 's |
Token ID | 338 |
Feature activation | +1.44e-03 |
Pos logit contributions | |
coat | +0.001 |
seek | +0.001 |
oured | +0.001 |
ipop | +0.001 |
enny | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.000 |
them | -0.000 |
things | -0.000 |
it | -0.000 |
Token | important |
Token ID | 1593 |
Feature activation | -7.96e-03 |
Pos logit contributions | |
its | +0.002 |
them | +0.002 |
their | +0.002 |
away | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.002 |
ache | -0.002 |
drop | -0.002 |
unn | -0.002 |
ipop | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -1.45e-03 |
Pos logit contributions | |
oured | +0.019 |
opus | +0.018 |
ache | +0.018 |
enny | +0.018 |
pper | +0.018 |
Neg logit contributions | |
its | -0.010 |
their | -0.008 |
things | -0.008 |
it | -0.008 |
them | -0.007 |
Token | stay |
Token ID | 2652 |
Feature activation | -4.63e-04 |
Pos logit contributions | |
enny | +0.003 |
driver | +0.003 |
oured | +0.003 |
uddy | +0.002 |
ache | +0.002 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
her | -0.002 |
everything | -0.002 |
Token | hyd |
Token ID | 7409 |
Feature activation | +5.09e-02 |
Pos logit contributions | |
enny | +0.001 |
oured | +0.001 |
ache | +0.001 |
ucker | +0.001 |
unn | +0.001 |
Neg logit contributions | |
its | -0.001 |
them | -0.000 |
their | -0.000 |
fog | -0.000 |
Wow | -0.000 |
Token | rated |
Token ID | 4111 |
Feature activation | +5.69e-03 |
Pos logit contributions | |
its | +0.085 |
their | +0.075 |
them | +0.070 |
her | +0.065 |
fog | +0.064 |
Neg logit contributions | |
enny | -0.083 |
ache | -0.079 |
oured | -0.079 |
drop | -0.079 |
seek | -0.078 |
Token | and |
Token ID | 290 |
Feature activation | +7.05e-04 |
Pos logit contributions | |
its | +0.007 |
them | +0.006 |
their | +0.006 |
things | +0.005 |
it | +0.005 |
Neg logit contributions | |
ipop | -0.013 |
uddy | -0.012 |
oured | -0.012 |
enny | -0.012 |
drop | -0.012 |
Token | drink |
Token ID | 4144 |
Feature activation | +4.31e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.001 |
oured | -0.001 |
unn | -0.001 |
ache | -0.001 |
drop | -0.001 |
Token | water |
Token ID | 1660 |
Feature activation | -6.62e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
her | +0.003 |
things | +0.003 |
Neg logit contributions | |
enny | -0.009 |
unn | -0.008 |
ache | -0.008 |
drop | -0.008 |
oured | -0.008 |
Token | when |
Token ID | 618 |
Feature activation | +3.49e-04 |
Pos logit contributions | |
enny | +0.016 |
oured | +0.016 |
unn | +0.015 |
uddy | +0.015 |
drop | +0.015 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
things | -0.003 |
her | -0.003 |
Token | me |
Token ID | 502 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
enny | +0.001 |
ache | +0.001 |
oured | +0.001 |
drop | +0.001 |
ipop | +0.001 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
her | -0.000 |
things | -0.000 |
Token | to |
Token ID | 284 |
Feature activation | -7.15e-04 |
Pos logit contributions | |
its | +0.009 |
out | +0.008 |
them | +0.008 |
their | +0.007 |
down | +0.007 |
Neg logit contributions | |
enny | -0.027 |
� | -0.026 |
va | -0.026 |
uddy | -0.026 |
istent | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | +1.81e-03 |
Pos logit contributions | |
enny | +0.002 |
unn | +0.002 |
oured | +0.002 |
ache | +0.002 |
drop | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.000 |
them | -0.000 |
things | -0.000 |
everything | -0.000 |
Token | nearest |
Token ID | 16936 |
Feature activation | +3.10e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
everything | +0.002 |
Neg logit contributions | |
enny | -0.003 |
unn | -0.003 |
oured | -0.003 |
ipop | -0.003 |
driver | -0.003 |
Token | fire |
Token ID | 2046 |
Feature activation | +9.96e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.005 |
oured | -0.005 |
unn | -0.005 |
drop | -0.005 |
ipop | -0.005 |
Token | hyd |
Token ID | 7409 |
Feature activation | +5.08e-02 |
Pos logit contributions | |
its | +0.008 |
their | +0.006 |
them | +0.006 |
down | +0.005 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.025 |
unn | -0.025 |
oured | -0.024 |
seek | -0.024 |
drop | -0.024 |
Token | rant |
Token ID | 5250 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
its | +0.098 |
their | +0.087 |
things | +0.083 |
her | +0.081 |
fant | +0.081 |
Neg logit contributions | |
oured | -0.063 |
ucker | -0.062 |
zag | -0.062 |
drop | -0.061 |
ache | -0.061 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
its | +0.014 |
their | +0.011 |
them | +0.011 |
everything | +0.009 |
things | +0.008 |
Neg logit contributions | |
enny | -0.032 |
unn | -0.031 |
uddy | -0.031 |
oured | -0.031 |
drop | -0.031 |
Token | |
Token ID | 220 |
Feature activation | -7.58e-03 |
Pos logit contributions | |
enny | +0.031 |
ipop | +0.029 |
oured | +0.029 |
drop | +0.029 |
driver | +0.029 |
Neg logit contributions | |
its | -0.018 |
their | -0.016 |
them | -0.015 |
things | -0.013 |
fog | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | -2.05e-03 |
Pos logit contributions | |
enny | +0.014 |
uddy | +0.013 |
driver | +0.013 |
unn | +0.013 |
olly | +0.013 |
Neg logit contributions | |
its | -0.010 |
their | -0.009 |
them | -0.009 |
fires | -0.008 |
fog | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -2.27e-03 |
Pos logit contributions | |
enny | +0.003 |
uddy | +0.003 |
va | +0.003 |
olly | +0.003 |
t | +0.003 |
Neg logit contributions | |
its | -0.003 |
fires | -0.003 |
their | -0.003 |
fog | -0.003 |
things | -0.003 |
Token | to |
Token ID | 284 |
Feature activation | -1.10e-03 |
Pos logit contributions | |
enny | +0.011 |
uddy | +0.011 |
driver | +0.011 |
opus | +0.011 |
ache | +0.011 |
Neg logit contributions | |
its | -0.007 |
them | -0.006 |
their | -0.006 |
it | -0.006 |
everything | -0.005 |
Token | drink |
Token ID | 4144 |
Feature activation | +4.33e-03 |
Pos logit contributions | |
enny | +0.002 |
driver | +0.002 |
ipop | +0.002 |
uddy | +0.002 |
unn | +0.002 |
Neg logit contributions | |
its | -0.002 |
them | -0.001 |
their | -0.001 |
her | -0.001 |
everything | -0.001 |
Token | it |
Token ID | 340 |
Feature activation | -1.04e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
fog | +0.003 |
things | +0.003 |
Neg logit contributions | |
enny | -0.009 |
oured | -0.009 |
drop | -0.009 |
ipop | -0.009 |
unn | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | -1.16e-03 |
Pos logit contributions | |
enny | +0.002 |
unn | +0.002 |
uddy | +0.002 |
oured | +0.002 |
drop | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
everything | -0.001 |
Token | stay |
Token ID | 2652 |
Feature activation | -4.15e-04 |
Pos logit contributions | |
enny | +0.002 |
drop | +0.002 |
oured | +0.002 |
ache | +0.002 |
unn | +0.002 |
Neg logit contributions | |
its | -0.002 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
fog | -0.001 |
Token | hyd |
Token ID | 7409 |
Feature activation | +5.08e-02 |
Pos logit contributions | |
oured | +0.001 |
enny | +0.001 |
ache | +0.001 |
drop | +0.001 |
ipop | +0.001 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
fog | -0.000 |
her | -0.000 |
Token | rated |
Token ID | 4111 |
Feature activation | +6.61e-03 |
Pos logit contributions | |
its | +0.089 |
their | +0.080 |
them | +0.074 |
things | +0.072 |
fog | +0.070 |
Neg logit contributions | |
ache | -0.076 |
oured | -0.075 |
enny | -0.075 |
drop | -0.073 |
seek | -0.071 |
Token | !" |
Token ID | 2474 |
Feature activation | -4.70e-03 |
Pos logit contributions | |
its | +0.007 |
them | +0.006 |
their | +0.005 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.015 |
ipop | -0.015 |
oured | -0.015 |
uddy | -0.015 |
drop | -0.015 |
Token | Billy |
Token ID | 15890 |
Feature activation | +6.16e-04 |
Pos logit contributions | |
enny | +0.009 |
oured | +0.009 |
ipop | +0.009 |
unn | +0.009 |
drop | +0.009 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
things | -0.004 |
fog | -0.004 |
Token | drank |
Token ID | 24070 |
Feature activation | +9.15e-04 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
his | +0.001 |
her | +0.001 |
the | +0.001 |
Neg logit contributions | |
ider | -0.001 |
driver | -0.001 |
unn | -0.001 |
seek | -0.001 |
supervision | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +7.12e-04 |
Pos logit contributions | |
its | +0.001 |
south | +0.001 |
fires | +0.001 |
away | +0.001 |
fant | +0.001 |
Neg logit contributions | |
oured | -0.002 |
enny | -0.002 |
� | -0.002 |
ipop | -0.002 |
chip | -0.002 |
Token | The |
Token ID | 383 |
Feature activation | +1.18e-04 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.009 |
oured | -0.009 |
drop | -0.009 |
driver | -0.009 |
unn | -0.009 |
Token | car |
Token ID | 1097 |
Feature activation | -9.86e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
things | +0.000 |
everything | +0.000 |
Neg logit contributions | |
enny | -0.000 |
oured | -0.000 |
unn | -0.000 |
seek | -0.000 |
olly | -0.000 |
Token | hits |
Token ID | 7127 |
Feature activation | -2.70e-03 |
Pos logit contributions | |
enny | +0.021 |
unn | +0.020 |
oured | +0.019 |
olly | +0.019 |
� | +0.019 |
Neg logit contributions | |
its | -0.014 |
their | -0.012 |
them | -0.012 |
things | -0.011 |
it | -0.011 |
Token | a |
Token ID | 257 |
Feature activation | -8.82e-04 |
Pos logit contributions | |
driver | +0.006 |
enny | +0.006 |
drop | +0.006 |
uddy | +0.006 |
oured | +0.006 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
away | -0.001 |
fant | -0.001 |
Token | fire |
Token ID | 2046 |
Feature activation | +3.03e-03 |
Pos logit contributions | |
enny | +0.001 |
ache | +0.001 |
driver | +0.001 |
drop | +0.001 |
uddy | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
things | -0.001 |
Token | hyd |
Token ID | 7409 |
Feature activation | +4.92e-02 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
down | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.007 |
unn | -0.007 |
oured | -0.007 |
olly | -0.006 |
va | -0.006 |
Token | rant |
Token ID | 5250 |
Feature activation | +2.73e-03 |
Pos logit contributions | |
its | +0.094 |
her | +0.084 |
fant | +0.083 |
their | +0.083 |
them | +0.076 |
Neg logit contributions | |
ache | -0.064 |
driver | -0.064 |
ave | -0.062 |
drop | -0.060 |
oured | -0.059 |
Token | . |
Token ID | 13 |
Feature activation | +3.13e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.006 |
oured | -0.006 |
ache | -0.006 |
drop | -0.006 |
unn | -0.006 |
Token | The |
Token ID | 383 |
Feature activation | -1.11e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
away | +0.003 |
Neg logit contributions | |
enny | -0.006 |
driver | -0.006 |
uddy | -0.005 |
� | -0.005 |
oured | -0.005 |
Token | fire |
Token ID | 2046 |
Feature activation | +4.56e-03 |
Pos logit contributions | |
enny | +0.002 |
oured | +0.002 |
unn | +0.002 |
seek | +0.002 |
ipop | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
everything | -0.001 |
Token | hyd |
Token ID | 7409 |
Feature activation | +5.10e-02 |
Pos logit contributions | |
its | +0.006 |
their | +0.006 |
them | +0.005 |
things | +0.005 |
fires | +0.005 |
Neg logit contributions | |
enny | -0.010 |
seek | -0.009 |
unn | -0.009 |
va | -0.009 |
olly | -0.009 |
Token | turned |
Token ID | 2900 |
Feature activation | +1.13e-03 |
Pos logit contributions | |
enny | +0.007 |
oured | +0.007 |
unn | +0.007 |
� | +0.007 |
seek | +0.007 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
her | -0.005 |
it | -0.005 |
Token | out |
Token ID | 503 |
Feature activation | -5.61e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
her | +0.001 |
Neg logit contributions | |
enny | -0.003 |
unn | -0.003 |
oured | -0.003 |
drop | -0.003 |
ache | -0.003 |
Token | that |
Token ID | 326 |
Feature activation | +1.23e-02 |
Pos logit contributions | |
enny | +0.011 |
oured | +0.011 |
ache | +0.011 |
driver | +0.011 |
drop | +0.011 |
Neg logit contributions | |
its | -0.007 |
their | -0.006 |
them | -0.006 |
things | -0.005 |
everything | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | +3.47e-03 |
Pos logit contributions | |
its | +0.010 |
their | +0.007 |
them | +0.007 |
things | +0.005 |
everything | +0.005 |
Neg logit contributions | |
enny | -0.031 |
oured | -0.030 |
unn | -0.030 |
ache | -0.030 |
drop | -0.030 |
Token | av |
Token ID | 1196 |
Feature activation | +1.88e-02 |
Pos logit contributions | |
its | +0.004 |
things | +0.004 |
fog | +0.004 |
them | +0.004 |
their | +0.003 |
Neg logit contributions | |
enny | -0.008 |
seek | -0.007 |
oured | -0.007 |
ucker | -0.007 |
unn | -0.007 |
Token | oc |
Token ID | 420 |
Feature activation | +4.91e-02 |
Pos logit contributions | |
its | +0.021 |
their | +0.017 |
them | +0.017 |
things | +0.013 |
everything | +0.013 |
Neg logit contributions | |
enny | -0.041 |
oured | -0.039 |
drop | -0.039 |
ipop | -0.039 |
unn | -0.039 |
Token | ados |
Token ID | 22484 |
Feature activation | -1.55e-03 |
Pos logit contributions | |
its | +0.067 |
them | +0.056 |
their | +0.055 |
things | +0.052 |
him | +0.048 |
Neg logit contributions | |
enny | -0.095 |
drop | -0.089 |
coat | -0.089 |
uddy | -0.088 |
oured | -0.087 |
Token | were |
Token ID | 547 |
Feature activation | +3.96e-03 |
Pos logit contributions | |
enny | +0.003 |
unn | +0.003 |
seek | +0.003 |
uddy | +0.003 |
coach | +0.003 |
Neg logit contributions | |
its | -0.002 |
them | -0.002 |
their | -0.002 |
it | -0.002 |
her | -0.001 |
Token | bad |
Token ID | 2089 |
Feature activation | +2.27e-03 |
Pos logit contributions | |
its | +0.006 |
them | +0.005 |
their | +0.005 |
her | +0.005 |
everything | +0.005 |
Neg logit contributions | |
enny | -0.009 |
opus | -0.008 |
unn | -0.008 |
seek | -0.008 |
uddy | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | +1.63e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
it | +0.001 |
Neg logit contributions | |
enny | -0.006 |
oured | -0.006 |
� | -0.006 |
opus | -0.006 |
scar | -0.005 |
Token | made |
Token ID | 925 |
Feature activation | -9.98e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
it | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.004 |
seek | -0.003 |
uddy | -0.003 |
oured | -0.003 |
unn | -0.003 |
Token | am |
Token ID | 716 |
Feature activation | +1.81e-02 |
Pos logit contributions | |
enny | +0.005 |
uddy | +0.005 |
unn | +0.005 |
driver | +0.005 |
seek | +0.005 |
Neg logit contributions | |
its | -0.003 |
them | -0.003 |
their | -0.003 |
it | -0.002 |
her | -0.002 |
Token | taking |
Token ID | 2263 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
its | +0.023 |
their | +0.020 |
them | +0.019 |
it | +0.017 |
her | +0.016 |
Neg logit contributions | |
enny | -0.042 |
uddy | -0.041 |
unn | -0.041 |
driver | -0.041 |
seek | -0.041 |
Token | the |
Token ID | 262 |
Feature activation | +3.68e-03 |
Pos logit contributions | |
enny | +0.028 |
drop | +0.027 |
uddy | +0.027 |
oured | +0.027 |
unn | +0.027 |
Neg logit contributions | |
its | -0.012 |
them | -0.010 |
their | -0.010 |
things | -0.008 |
her | -0.007 |
Token | rh |
Token ID | 9529 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
its | +0.005 |
things | +0.005 |
their | +0.005 |
them | +0.005 |
fog | +0.005 |
Neg logit contributions | |
enny | -0.007 |
seek | -0.007 |
ucker | -0.007 |
oured | -0.007 |
uddy | -0.006 |
Token | in |
Token ID | 259 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
enny | +0.043 |
oured | +0.043 |
drop | +0.042 |
seek | +0.042 |
coat | +0.042 |
Neg logit contributions | |
its | -0.045 |
them | -0.041 |
their | -0.040 |
things | -0.037 |
away | -0.036 |
Token | oc |
Token ID | 420 |
Feature activation | +4.89e-02 |
Pos logit contributions | |
enny | +0.025 |
oured | +0.024 |
ucker | +0.024 |
unn | +0.024 |
drop | +0.024 |
Neg logit contributions | |
its | -0.010 |
their | -0.008 |
them | -0.007 |
things | -0.007 |
away | -0.006 |
Token | eros |
Token ID | 27498 |
Feature activation | -1.69e-02 |
Pos logit contributions | |
its | +0.076 |
them | +0.065 |
their | +0.062 |
things | +0.062 |
him | +0.060 |
Neg logit contributions | |
enny | -0.087 |
coat | -0.082 |
drop | -0.080 |
uddy | -0.077 |
seek | -0.076 |
Token | to |
Token ID | 284 |
Feature activation | -1.32e-03 |
Pos logit contributions | |
enny | +0.039 |
ucker | +0.038 |
unn | +0.038 |
oured | +0.037 |
ipop | +0.037 |
Neg logit contributions | |
its | -0.019 |
their | -0.016 |
them | -0.016 |
out | -0.013 |
things | -0.013 |
Token | a |
Token ID | 257 |
Feature activation | -2.95e-03 |
Pos logit contributions | |
enny | +0.003 |
oured | +0.003 |
ipop | +0.003 |
unn | +0.003 |
drop | +0.003 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
everything | -0.001 |
her | -0.001 |
Token | new |
Token ID | 649 |
Feature activation | +3.47e-04 |
Pos logit contributions | |
enny | +0.006 |
unn | +0.006 |
ipop | +0.006 |
driver | +0.006 |
oured | +0.006 |
Neg logit contributions | |
its | -0.004 |
their | -0.003 |
them | -0.003 |
everything | -0.003 |
things | -0.003 |
Token | home |
Token ID | 1363 |
Feature activation | -1.94e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
things | +0.000 |
everything | +0.000 |
Neg logit contributions | |
enny | -0.001 |
ipop | -0.001 |
unn | -0.001 |
oured | -0.001 |
drop | -0.001 |
Token | it |
Token ID | 340 |
Feature activation | +1.24e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
her | +0.001 |
things | +0.001 |
Neg logit contributions | |
enny | -0.011 |
ache | -0.011 |
drop | -0.011 |
uddy | -0.011 |
unn | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | +2.13e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.001 |
them | +0.001 |
her | +0.001 |
things | +0.001 |
Neg logit contributions | |
enny | -0.003 |
� | -0.003 |
unn | -0.003 |
opus | -0.003 |
istent | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +3.43e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
her | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.005 |
unn | -0.005 |
oured | -0.005 |
ache | -0.005 |
driver | -0.005 |
Token | rh |
Token ID | 9529 |
Feature activation | -2.76e-02 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
things | +0.004 |
fog | +0.004 |
Neg logit contributions | |
enny | -0.007 |
unn | -0.007 |
oured | -0.007 |
seek | -0.006 |
uddy | -0.006 |
Token | in |
Token ID | 259 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
drop | +0.044 |
oured | +0.044 |
seek | +0.043 |
enny | +0.043 |
coat | +0.043 |
Neg logit contributions | |
its | -0.045 |
them | -0.040 |
their | -0.039 |
things | -0.037 |
away | -0.036 |
Token | oc |
Token ID | 420 |
Feature activation | +4.87e-02 |
Pos logit contributions | |
enny | +0.029 |
drop | +0.028 |
coat | +0.028 |
driver | +0.028 |
unn | +0.028 |
Neg logit contributions | |
its | -0.009 |
their | -0.006 |
them | -0.006 |
things | -0.005 |
his | -0.005 |
Token | eros |
Token ID | 27498 |
Feature activation | -1.72e-02 |
Pos logit contributions | |
its | +0.075 |
them | +0.064 |
their | +0.061 |
him | +0.061 |
things | +0.060 |
Neg logit contributions | |
enny | -0.087 |
coat | -0.085 |
drop | -0.083 |
uddy | -0.079 |
olly | -0.078 |
Token | . |
Token ID | 13 |
Feature activation | +3.65e-03 |
Pos logit contributions | |
enny | +0.045 |
unn | +0.045 |
drop | +0.044 |
driver | +0.044 |
coat | +0.043 |
Neg logit contributions | |
its | -0.014 |
their | -0.011 |
them | -0.010 |
his | -0.007 |
her | -0.007 |
Token | When |
Token ID | 1649 |
Feature activation | -2.70e-04 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.003 |
her | +0.003 |
it | +0.003 |
Neg logit contributions | |
ache | -0.008 |
drop | -0.008 |
enny | -0.008 |
unn | -0.008 |
oured | -0.008 |
Token | he |
Token ID | 339 |
Feature activation | -6.44e-03 |
Pos logit contributions | |
enny | +0.001 |
unn | +0.001 |
oured | +0.001 |
ache | +0.001 |
drop | +0.001 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
her | -0.000 |
things | -0.000 |
Token | tasted |
Token ID | 29187 |
Feature activation | -2.11e-03 |
Pos logit contributions | |
unn | +0.014 |
ider | +0.013 |
uddy | +0.013 |
driver | +0.013 |
seek | +0.013 |
Neg logit contributions | |
its | -0.009 |
their | -0.008 |
them | -0.008 |
his | -0.007 |
it | -0.007 |
Token | spray |
Token ID | 11662 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
its | +0.001 |
their | +0.000 |
them | +0.000 |
things | +0.000 |
fog | +0.000 |
Neg logit contributions | |
enny | -0.001 |
oured | -0.001 |
ipop | -0.001 |
unn | -0.001 |
uddy | -0.001 |
Token | from |
Token ID | 422 |
Feature activation | +6.11e-03 |
Pos logit contributions | |
its | +0.016 |
their | +0.014 |
them | +0.014 |
things | +0.011 |
her | +0.011 |
Neg logit contributions | |
enny | -0.025 |
unn | -0.024 |
seek | -0.023 |
oured | -0.023 |
ache | -0.023 |
Token | a |
Token ID | 257 |
Feature activation | +3.00e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.002 |
things | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.016 |
oured | -0.015 |
drop | -0.015 |
ache | -0.015 |
driver | -0.015 |
Token | nearby |
Token ID | 6716 |
Feature activation | +7.77e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
things | +0.003 |
fog | +0.003 |
Neg logit contributions | |
enny | -0.006 |
unn | -0.006 |
oured | -0.006 |
seek | -0.006 |
ipop | -0.006 |
Token | fire |
Token ID | 2046 |
Feature activation | +8.27e-03 |
Pos logit contributions | |
its | +0.012 |
their | +0.010 |
them | +0.010 |
things | +0.009 |
everything | +0.008 |
Neg logit contributions | |
enny | -0.014 |
unn | -0.013 |
oured | -0.013 |
ipop | -0.013 |
ache | -0.013 |
Token | hyd |
Token ID | 7409 |
Feature activation | +4.84e-02 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
out | +0.003 |
down | +0.003 |
Neg logit contributions | |
enny | -0.022 |
unn | -0.022 |
ucker | -0.021 |
va | -0.021 |
olly | -0.021 |
Token | rant |
Token ID | 5250 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
its | +0.099 |
their | +0.088 |
things | +0.082 |
her | +0.081 |
it | +0.080 |
Neg logit contributions | |
drop | -0.059 |
oured | -0.059 |
ave | -0.058 |
ache | -0.057 |
coat | -0.055 |
Token | to |
Token ID | 284 |
Feature activation | -1.21e-03 |
Pos logit contributions | |
its | +0.013 |
their | +0.011 |
them | +0.011 |
things | +0.008 |
everything | +0.008 |
Neg logit contributions | |
enny | -0.029 |
unn | -0.027 |
oured | -0.027 |
ipop | -0.027 |
uddy | -0.027 |
Token | keep |
Token ID | 1394 |
Feature activation | -1.11e-02 |
Pos logit contributions | |
enny | +0.002 |
drop | +0.002 |
oured | +0.002 |
ache | +0.002 |
driver | +0.002 |
Neg logit contributions | |
its | -0.002 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
fog | -0.001 |
Token | her |
Token ID | 607 |
Feature activation | -1.82e-03 |
Pos logit contributions | |
drop | +0.025 |
enny | +0.025 |
driver | +0.025 |
ache | +0.025 |
oured | +0.025 |
Neg logit contributions | |
its | -0.008 |
their | -0.006 |
them | -0.005 |
away | -0.005 |
Wow | -0.004 |
Token | dry |
Token ID | 5894 |
Feature activation | +1.58e-03 |
Pos logit contributions | |
enny | +0.004 |
unn | +0.004 |
oured | +0.004 |
drop | +0.004 |
ache | +0.004 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
things | -0.001 |
everything | -0.001 |
Token | couldn |
Token ID | 3521 |
Feature activation | +5.51e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
her | +0.003 |
it | +0.003 |
them | +0.003 |
Neg logit contributions | |
unn | -0.005 |
uddy | -0.005 |
enny | -0.005 |
driver | -0.005 |
oured | -0.005 |
Token | 't |
Token ID | 470 |
Feature activation | -6.90e-03 |
Pos logit contributions | |
its | +0.011 |
them | +0.010 |
their | +0.010 |
it | +0.010 |
her | +0.009 |
Neg logit contributions | |
enny | -0.007 |
oured | -0.007 |
unn | -0.007 |
ache | -0.007 |
ipop | -0.007 |
Token | find |
Token ID | 1064 |
Feature activation | +7.55e-03 |
Pos logit contributions | |
enny | +0.011 |
ache | +0.011 |
drop | +0.010 |
driver | +0.010 |
oured | +0.010 |
Neg logit contributions | |
its | -0.011 |
their | -0.010 |
them | -0.010 |
things | -0.009 |
everything | -0.008 |
Token | any |
Token ID | 597 |
Feature activation | +5.17e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.004 |
away | +0.003 |
things | +0.003 |
Neg logit contributions | |
enny | -0.017 |
ipop | -0.017 |
driver | -0.017 |
oured | -0.017 |
drop | -0.017 |
Token | av |
Token ID | 1196 |
Feature activation | +1.88e-02 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
things | +0.005 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.011 |
oured | -0.011 |
seek | -0.011 |
uddy | -0.011 |
drop | -0.011 |
Token | oc |
Token ID | 420 |
Feature activation | +4.84e-02 |
Pos logit contributions | |
its | +0.023 |
their | +0.020 |
them | +0.019 |
things | +0.015 |
her | +0.015 |
Neg logit contributions | |
enny | -0.038 |
unn | -0.037 |
oured | -0.037 |
ache | -0.037 |
drop | -0.037 |
Token | ados |
Token ID | 22484 |
Feature activation | -1.27e-03 |
Pos logit contributions | |
its | +0.061 |
them | +0.053 |
things | +0.048 |
their | +0.048 |
him | +0.045 |
Neg logit contributions | |
enny | -0.098 |
coat | -0.093 |
drop | -0.093 |
uddy | -0.092 |
ipop | -0.090 |
Token | . |
Token ID | 13 |
Feature activation | +5.62e-03 |
Pos logit contributions | |
enny | +0.003 |
unn | +0.003 |
uddy | +0.003 |
oured | +0.003 |
drop | +0.003 |
Neg logit contributions | |
its | -0.001 |
them | -0.001 |
their | -0.001 |
her | -0.001 |
it | -0.001 |
Token | Finally |
Token ID | 9461 |
Feature activation | +2.47e-03 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
her | +0.005 |
everything | +0.005 |
Neg logit contributions | |
ache | -0.012 |
unn | -0.011 |
enny | -0.011 |
drop | -0.011 |
oured | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | +1.95e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
her | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.005 |
unn | -0.005 |
oured | -0.005 |
ache | -0.005 |
drop | -0.005 |
Token | she |
Token ID | 673 |
Feature activation | -1.21e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
her | +0.002 |
everything | +0.002 |
Neg logit contributions | |
enny | -0.004 |
unn | -0.004 |
ache | -0.004 |
oured | -0.004 |
driver | -0.004 |
Token | ," |
Token ID | 553 |
Feature activation | +7.30e-03 |
Pos logit contributions | |
enny | +0.014 |
ache | +0.013 |
driver | +0.013 |
drop | +0.013 |
oured | +0.013 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
things | -0.004 |
everything | -0.004 |
Token | said |
Token ID | 531 |
Feature activation | -4.39e-03 |
Pos logit contributions | |
its | +0.009 |
their | +0.008 |
them | +0.008 |
her | +0.007 |
it | +0.006 |
Neg logit contributions | |
enny | -0.015 |
unn | -0.015 |
oured | -0.015 |
drop | -0.015 |
ache | -0.015 |
Token | the |
Token ID | 262 |
Feature activation | +4.97e-03 |
Pos logit contributions | |
enny | +0.009 |
oured | +0.008 |
ipop | +0.008 |
ache | +0.008 |
drop | +0.008 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
things | -0.004 |
everything | -0.004 |
Token | rh |
Token ID | 9529 |
Feature activation | -2.67e-02 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
things | +0.006 |
them | +0.006 |
fog | +0.006 |
Neg logit contributions | |
enny | -0.010 |
oured | -0.010 |
seek | -0.010 |
unn | -0.009 |
uddy | -0.009 |
Token | in |
Token ID | 259 |
Feature activation | -7.02e-03 |
Pos logit contributions | |
oured | +0.043 |
enny | +0.042 |
drop | +0.042 |
coat | +0.041 |
seek | +0.041 |
Neg logit contributions | |
its | -0.044 |
them | -0.039 |
their | -0.039 |
things | -0.036 |
away | -0.034 |
Token | oc |
Token ID | 420 |
Feature activation | +4.84e-02 |
Pos logit contributions | |
unn | +0.017 |
oured | +0.017 |
enny | +0.017 |
� | +0.017 |
drop | +0.017 |
Neg logit contributions | |
its | -0.006 |
their | -0.004 |
them | -0.004 |
his | -0.004 |
things | -0.003 |
Token | eros |
Token ID | 27498 |
Feature activation | -1.56e-02 |
Pos logit contributions | |
its | +0.080 |
them | +0.070 |
their | +0.068 |
things | +0.065 |
him | +0.064 |
Neg logit contributions | |
enny | -0.079 |
coat | -0.074 |
drop | -0.074 |
uddy | -0.072 |
oured | -0.071 |
Token | . |
Token ID | 13 |
Feature activation | +4.71e-03 |
Pos logit contributions | |
unn | +0.040 |
enny | +0.039 |
� | +0.039 |
drop | +0.038 |
ucker | +0.038 |
Neg logit contributions | |
its | -0.013 |
their | -0.010 |
them | -0.010 |
his | -0.008 |
her | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | +9.65e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
her | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.010 |
unn | -0.009 |
oured | -0.009 |
drop | -0.009 |
ache | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | +9.10e-03 |
Pos logit contributions | |
its | +0.011 |
their | +0.009 |
them | +0.009 |
things | +0.007 |
everything | +0.007 |
Neg logit contributions | |
enny | -0.020 |
oured | -0.020 |
unn | -0.020 |
ache | -0.020 |
drop | -0.019 |
Token | The |
Token ID | 464 |
Feature activation | +6.42e-04 |
Pos logit contributions | |
its | +0.012 |
their | +0.010 |
them | +0.010 |
her | +0.008 |
his | +0.008 |
Neg logit contributions | |
oured | -0.018 |
unn | -0.018 |
ipop | -0.018 |
drop | -0.018 |
sed | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | +1.36e-03 |
Pos logit contributions | |
driver | +0.018 |
enny | +0.018 |
drop | +0.018 |
ache | +0.018 |
� | +0.018 |
Neg logit contributions | |
its | -0.007 |
their | -0.005 |
them | -0.005 |
away | -0.004 |
things | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +9.10e-04 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
everything | +0.000 |
her | +0.000 |
Neg logit contributions | |
enny | -0.004 |
unn | -0.003 |
oured | -0.003 |
uddy | -0.003 |
ipop | -0.003 |
Token | lightning |
Token ID | 14357 |
Feature activation | -1.20e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.002 |
oured | -0.002 |
unn | -0.002 |
ipop | -0.002 |
ache | -0.002 |
Token | struck |
Token ID | 7425 |
Feature activation | +9.29e-04 |
Pos logit contributions | |
enny | +0.002 |
unn | +0.002 |
ipop | +0.002 |
oured | +0.002 |
uddy | +0.002 |
Neg logit contributions | |
its | -0.002 |
them | -0.002 |
their | -0.002 |
it | -0.002 |
everything | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | +4.73e-04 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
away | +0.001 |
them | +0.001 |
fant | +0.001 |
Neg logit contributions | |
seek | -0.002 |
drop | -0.002 |
driver | -0.002 |
oured | -0.002 |
ache | -0.002 |
Token | hyd |
Token ID | 7409 |
Feature activation | +4.81e-02 |
Pos logit contributions | |
its | +0.001 |
their | +0.000 |
them | +0.000 |
things | +0.000 |
fog | +0.000 |
Neg logit contributions | |
enny | -0.001 |
ipop | -0.001 |
oured | -0.001 |
unn | -0.001 |
seek | -0.001 |
Token | rant |
Token ID | 5250 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
its | +0.089 |
their | +0.078 |
her | +0.075 |
them | +0.072 |
things | +0.071 |
Neg logit contributions | |
drop | -0.067 |
ache | -0.066 |
oured | -0.064 |
zag | -0.062 |
seek | -0.061 |
Token | . |
Token ID | 13 |
Feature activation | -1.99e-03 |
Pos logit contributions | |
its | +0.010 |
their | +0.009 |
them | +0.008 |
things | +0.006 |
everything | +0.006 |
Neg logit contributions | |
enny | -0.023 |
oured | -0.022 |
unn | -0.022 |
ache | -0.022 |
drop | -0.022 |
Token | Suddenly |
Token ID | 24975 |
Feature activation | -6.09e-03 |
Pos logit contributions | |
enny | +0.004 |
uddy | +0.004 |
oured | +0.004 |
driver | +0.004 |
drop | +0.004 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
things | -0.002 |
her | -0.002 |
Token | water |
Token ID | 1660 |
Feature activation | -7.44e-03 |
Pos logit contributions | |
enny | +0.011 |
ache | +0.011 |
driver | +0.011 |
oured | +0.011 |
unn | +0.011 |
Neg logit contributions | |
its | -0.009 |
their | -0.007 |
them | -0.007 |
things | -0.006 |
her | -0.006 |
Token | was |
Token ID | 373 |
Feature activation | +1.93e-04 |
Pos logit contributions | |
enny | +0.015 |
unn | +0.014 |
seek | +0.013 |
uddy | +0.013 |
oured | +0.013 |
Neg logit contributions | |
its | -0.011 |
them | -0.010 |
their | -0.010 |
everything | -0.009 |
it | -0.008 |
Token | They |
Token ID | 1119 |
Feature activation | -5.12e-04 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.011 |
unn | -0.010 |
uddy | -0.010 |
oured | -0.010 |
ipop | -0.010 |
Token | saw |
Token ID | 2497 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
enny | +0.001 |
unn | +0.001 |
uddy | +0.001 |
driver | +0.001 |
seek | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
it | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +3.35e-03 |
Pos logit contributions | |
its | +0.009 |
their | +0.009 |
them | +0.008 |
her | +0.005 |
everything | +0.005 |
Neg logit contributions | |
enny | -0.030 |
ider | -0.029 |
� | -0.029 |
unn | -0.029 |
seek | -0.028 |
Token | rh |
Token ID | 9529 |
Feature activation | -2.75e-02 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
things | +0.004 |
fog | +0.004 |
Neg logit contributions | |
enny | -0.007 |
seek | -0.007 |
unn | -0.007 |
oured | -0.007 |
uddy | -0.006 |
Token | in |
Token ID | 259 |
Feature activation | -8.21e-03 |
Pos logit contributions | |
enny | +0.042 |
oured | +0.041 |
seek | +0.041 |
drop | +0.040 |
ipop | +0.040 |
Neg logit contributions | |
its | -0.048 |
them | -0.043 |
their | -0.043 |
things | -0.039 |
everything | -0.037 |
Token | oc |
Token ID | 420 |
Feature activation | +4.81e-02 |
Pos logit contributions | |
enny | +0.019 |
oured | +0.018 |
unn | +0.018 |
seek | +0.018 |
coat | +0.018 |
Neg logit contributions | |
its | -0.008 |
their | -0.007 |
them | -0.007 |
things | -0.006 |
everything | -0.005 |
Token | eros |
Token ID | 27498 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
its | +0.075 |
them | +0.065 |
their | +0.064 |
things | +0.062 |
him | +0.061 |
Neg logit contributions | |
enny | -0.087 |
coat | -0.081 |
drop | -0.077 |
uddy | -0.076 |
olly | -0.076 |
Token | . |
Token ID | 13 |
Feature activation | +4.05e-03 |
Pos logit contributions | |
enny | +0.035 |
unn | +0.034 |
uddy | +0.032 |
driver | +0.032 |
oured | +0.032 |
Neg logit contributions | |
its | -0.018 |
their | -0.016 |
them | -0.015 |
things | -0.012 |
it | -0.012 |
Token | They |
Token ID | 1119 |
Feature activation | +1.43e-03 |
Pos logit contributions | |
its | +0.005 |
them | +0.005 |
things | +0.005 |
away | +0.005 |
fog | +0.004 |
Neg logit contributions | |
enny | -0.007 |
� | -0.007 |
uddy | -0.007 |
coach | -0.007 |
driver | -0.006 |
Token | thanked |
Token ID | 26280 |
Feature activation | +2.56e-04 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
his | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.003 |
unn | -0.003 |
seek | -0.003 |
olly | -0.003 |
uddy | -0.003 |
Token | Mom |
Token ID | 11254 |
Feature activation | +3.67e-03 |
Pos logit contributions | |
its | +0.000 |
fog | +0.000 |
away | +0.000 |
south | +0.000 |
fant | +0.000 |
Neg logit contributions | |
coach | -0.001 |
ipop | -0.001 |
chip | -0.001 |
enny | -0.000 |
oured | -0.000 |
Token | 't |
Token ID | 470 |
Feature activation | -2.58e-02 |
Pos logit contributions | |
enny | +0.012 |
seek | +0.011 |
unn | +0.011 |
oured | +0.011 |
uddy | +0.011 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
it | -0.004 |
her | -0.004 |
Token | know |
Token ID | 760 |
Feature activation | +9.09e-04 |
Pos logit contributions | |
enny | +0.053 |
oured | +0.052 |
� | +0.051 |
opus | +0.050 |
ucker | +0.050 |
Neg logit contributions | |
its | -0.038 |
their | -0.034 |
them | -0.032 |
her | -0.029 |
his | -0.028 |
Token | the |
Token ID | 262 |
Feature activation | +1.89e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
her | +0.001 |
Neg logit contributions | |
enny | -0.002 |
oured | -0.002 |
unn | -0.002 |
drop | -0.002 |
uddy | -0.002 |
Token | rh |
Token ID | 9529 |
Feature activation | -3.06e-02 |
Pos logit contributions | |
its | +0.003 |
things | +0.002 |
their | +0.002 |
them | +0.002 |
fog | +0.002 |
Neg logit contributions | |
enny | -0.004 |
oured | -0.004 |
seek | -0.004 |
unn | -0.004 |
uddy | -0.004 |
Token | in |
Token ID | 259 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
oured | +0.050 |
enny | +0.049 |
drop | +0.049 |
seek | +0.049 |
coat | +0.049 |
Neg logit contributions | |
its | -0.048 |
them | -0.044 |
their | -0.042 |
things | -0.041 |
away | -0.039 |
Token | oc |
Token ID | 420 |
Feature activation | +4.80e-02 |
Pos logit contributions | |
enny | +0.039 |
unn | +0.037 |
oured | +0.037 |
ucker | +0.037 |
coat | +0.036 |
Neg logit contributions | |
its | -0.013 |
their | -0.009 |
things | -0.009 |
them | -0.009 |
it | -0.008 |
Token | eros |
Token ID | 27498 |
Feature activation | -2.15e-02 |
Pos logit contributions | |
its | +0.074 |
them | +0.066 |
things | +0.062 |
their | +0.061 |
him | +0.061 |
Neg logit contributions | |
enny | -0.084 |
coat | -0.080 |
uddy | -0.078 |
drop | -0.078 |
olly | -0.075 |
Token | was |
Token ID | 373 |
Feature activation | +4.97e-03 |
Pos logit contributions | |
enny | +0.047 |
unn | +0.046 |
ucker | +0.045 |
oured | +0.045 |
coat | +0.045 |
Neg logit contributions | |
its | -0.027 |
their | -0.023 |
them | -0.022 |
it | -0.019 |
things | -0.019 |
Token | wild |
Token ID | 4295 |
Feature activation | -1.64e-03 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
his | +0.006 |
her | +0.005 |
Neg logit contributions | |
unn | -0.011 |
enny | -0.011 |
opus | -0.010 |
uddy | -0.010 |
olly | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | +4.93e-03 |
Pos logit contributions | |
enny | +0.004 |
oured | +0.004 |
ipop | +0.004 |
� | +0.004 |
va | +0.004 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
down | -0.001 |
Token | Can |
Token ID | 1680 |
Feature activation | +5.55e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
her | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.010 |
ache | -0.010 |
unn | -0.010 |
oured | -0.010 |
drop | -0.010 |
Token | s |
Token ID | 82 |
Feature activation | +2.31e-03 |
Pos logit contributions | |
unn | +0.031 |
seek | +0.031 |
sed | +0.031 |
drop | +0.031 |
oured | +0.031 |
Neg logit contributions | |
its | -0.038 |
them | -0.035 |
their | -0.035 |
everything | -0.032 |
it | -0.031 |
Token | wrong |
Token ID | 2642 |
Feature activation | +1.40e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.002 |
things | +0.002 |
everything | +0.002 |
Neg logit contributions | |
enny | -0.005 |
ache | -0.004 |
oured | -0.004 |
unn | -0.004 |
drop | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | +7.98e-04 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.003 |
oured | -0.003 |
unn | -0.003 |
seek | -0.003 |
drop | -0.003 |
Token | rh |
Token ID | 9529 |
Feature activation | -3.04e-02 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.002 |
seek | -0.002 |
oured | -0.002 |
unn | -0.001 |
drop | -0.001 |
Token | in |
Token ID | 259 |
Feature activation | -9.99e-03 |
Pos logit contributions | |
oured | +0.052 |
enny | +0.050 |
seek | +0.049 |
sed | +0.049 |
uddy | +0.049 |
Neg logit contributions | |
its | -0.047 |
them | -0.043 |
things | -0.040 |
their | -0.040 |
fog | -0.038 |
Token | oc |
Token ID | 420 |
Feature activation | +4.79e-02 |
Pos logit contributions | |
oured | +0.025 |
unn | +0.025 |
seek | +0.025 |
enny | +0.024 |
driver | +0.024 |
Neg logit contributions | |
its | -0.008 |
their | -0.006 |
them | -0.006 |
it | -0.005 |
things | -0.005 |
Token | eros |
Token ID | 27498 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
its | +0.074 |
them | +0.066 |
things | +0.064 |
him | +0.062 |
their | +0.060 |
Neg logit contributions | |
enny | -0.082 |
coat | -0.078 |
drop | -0.075 |
oured | -0.074 |
uddy | -0.074 |
Token | ? |
Token ID | 30 |
Feature activation | -9.24e-03 |
Pos logit contributions | |
enny | +0.049 |
unn | +0.049 |
seek | +0.048 |
oured | +0.048 |
driver | +0.048 |
Neg logit contributions | |
its | -0.015 |
their | -0.011 |
them | -0.010 |
it | -0.009 |
his | -0.008 |
Token | â |
Token ID | 22940 |
Feature activation | -4.00e-03 |
Pos logit contributions | |
drop | +0.018 |
ache | +0.018 |
unn | +0.017 |
enny | +0.017 |
seek | +0.017 |
Neg logit contributions | |
its | -0.012 |
their | -0.010 |
them | -0.010 |
it | -0.008 |
everything | -0.008 |
Token | € |
Token ID | 26391 |
Feature activation | +4.90e-03 |
Pos logit contributions | |
enny | +0.007 |
unn | +0.007 |
driver | +0.007 |
uddy | +0.007 |
oured | +0.007 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
her | -0.004 |
things | -0.004 |
Token | said |
Token ID | 531 |
Feature activation | -2.96e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
it | +0.005 |
everything | +0.004 |
Neg logit contributions | |
unn | -0.010 |
oured | -0.010 |
ipop | -0.009 |
enny | -0.009 |
driver | -0.009 |
Token | hurt |
Token ID | 5938 |
Feature activation | -4.20e-03 |
Pos logit contributions | |
its | +0.002 |
them | +0.002 |
their | +0.002 |
her | +0.001 |
it | +0.001 |
Neg logit contributions | |
enny | -0.005 |
uddy | -0.005 |
drop | -0.005 |
unn | -0.005 |
seek | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +3.86e-03 |
Pos logit contributions | |
enny | +0.010 |
ache | +0.010 |
drop | +0.010 |
unn | +0.010 |
driver | +0.010 |
Neg logit contributions | |
its | -0.004 |
their | -0.003 |
them | -0.003 |
things | -0.002 |
everything | -0.002 |
Token | The |
Token ID | 383 |
Feature activation | -2.07e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
his | +0.003 |
her | +0.003 |
Neg logit contributions | |
ache | -0.009 |
drop | -0.009 |
unn | -0.008 |
oured | -0.008 |
ipop | -0.008 |
Token | rh |
Token ID | 9529 |
Feature activation | -2.70e-02 |
Pos logit contributions | |
enny | +0.005 |
seek | +0.004 |
ucker | +0.004 |
oured | +0.004 |
unn | +0.004 |
Neg logit contributions | |
its | -0.003 |
things | -0.003 |
fog | -0.002 |
them | -0.002 |
their | -0.002 |
Token | in |
Token ID | 259 |
Feature activation | -7.02e-03 |
Pos logit contributions | |
enny | +0.042 |
oured | +0.042 |
coat | +0.041 |
drop | +0.041 |
seek | +0.041 |
Neg logit contributions | |
its | -0.046 |
them | -0.041 |
their | -0.040 |
things | -0.037 |
everything | -0.035 |
Token | oc |
Token ID | 420 |
Feature activation | +4.78e-02 |
Pos logit contributions | |
enny | +0.020 |
oured | +0.019 |
unn | +0.019 |
� | +0.019 |
seek | +0.019 |
Neg logit contributions | |
its | -0.004 |
their | -0.003 |
things | -0.003 |
his | -0.002 |
them | -0.002 |
Token | eros |
Token ID | 27498 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
its | +0.084 |
them | +0.074 |
their | +0.073 |
things | +0.068 |
him | +0.066 |
Neg logit contributions | |
enny | -0.076 |
coat | -0.069 |
drop | -0.068 |
oured | -0.068 |
uddy | -0.068 |
Token | kept |
Token ID | 4030 |
Feature activation | -4.62e-03 |
Pos logit contributions | |
enny | +0.030 |
unn | +0.029 |
� | +0.029 |
igsaw | +0.028 |
ucker | +0.028 |
Neg logit contributions | |
its | -0.018 |
their | -0.016 |
them | -0.015 |
his | -0.014 |
it | -0.014 |
Token | sn |
Token ID | 3013 |
Feature activation | -1.02e-03 |
Pos logit contributions | |
enny | +0.010 |
unn | +0.009 |
oured | +0.009 |
uddy | +0.009 |
ipop | +0.009 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
her | -0.004 |
everything | -0.004 |
Token | orting |
Token ID | 24707 |
Feature activation | +8.42e-03 |
Pos logit contributions | |
enny | +0.001 |
drop | +0.001 |
ipop | +0.001 |
sed | +0.001 |
ache | +0.001 |
Neg logit contributions | |
its | -0.002 |
them | -0.002 |
their | -0.002 |
down | -0.002 |
away | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | +2.61e-03 |
Pos logit contributions | |
its | +0.010 |
their | +0.009 |
them | +0.008 |
things | +0.007 |
her | +0.007 |
Neg logit contributions | |
enny | -0.019 |
unn | -0.018 |
oured | -0.018 |
ipop | -0.018 |
uddy | -0.018 |
Token | would |
Token ID | 561 |
Feature activation | +3.07e-03 |
Pos logit contributions | |
oured | +0.012 |
enny | +0.012 |
unn | +0.012 |
uddy | +0.012 |
ucker | +0.012 |
Neg logit contributions | |
its | -0.010 |
their | -0.009 |
them | -0.008 |
her | -0.008 |
things | -0.008 |
Token | take |
Token ID | 1011 |
Feature activation | -2.36e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
her | +0.004 |
them | +0.004 |
everything | +0.003 |
Neg logit contributions | |
unn | -0.006 |
enny | -0.006 |
ucker | -0.006 |
uddy | -0.006 |
oured | -0.006 |
Token | out |
Token ID | 503 |
Feature activation | -7.02e-03 |
Pos logit contributions | |
driver | +0.005 |
enny | +0.005 |
seek | +0.005 |
oured | +0.005 |
ache | +0.005 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
fog | -0.001 |
away | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +1.63e-03 |
Pos logit contributions | |
enny | +0.018 |
drop | +0.018 |
unn | +0.017 |
ache | +0.017 |
uddy | +0.017 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
things | -0.004 |
her | -0.003 |
Token | j |
Token ID | 474 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.003 |
unn | -0.003 |
oured | -0.003 |
drop | -0.003 |
seek | -0.003 |
Token | igsaw |
Token ID | 45636 |
Feature activation | -6.84e-02 |
Pos logit contributions | |
drop | +0.015 |
sed | +0.015 |
ache | +0.014 |
driver | +0.013 |
oured | +0.013 |
Neg logit contributions | |
its | -0.065 |
their | -0.061 |
away | -0.060 |
them | -0.059 |
things | -0.058 |
Token | puzzle |
Token ID | 15027 |
Feature activation | -1.05e-03 |
Pos logit contributions | |
oured | +0.092 |
enny | +0.091 |
drop | +0.090 |
ache | +0.090 |
sed | +0.089 |
Neg logit contributions | |
its | -0.126 |
their | -0.116 |
them | -0.112 |
things | -0.109 |
everything | -0.103 |
Token | and |
Token ID | 290 |
Feature activation | -1.42e-04 |
Pos logit contributions | |
oured | +0.003 |
unn | +0.002 |
ucker | +0.002 |
drop | +0.002 |
enny | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
her | -0.001 |
Token | try |
Token ID | 1949 |
Feature activation | +2.66e-03 |
Pos logit contributions | |
enny | +0.000 |
unn | +0.000 |
uddy | +0.000 |
ache | +0.000 |
drop | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
her | -0.000 |
it | -0.000 |
Token | to |
Token ID | 284 |
Feature activation | -1.19e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
fog | +0.003 |
away | +0.003 |
Neg logit contributions | |
driver | -0.005 |
enny | -0.005 |
ache | -0.004 |
seek | -0.004 |
oured | -0.004 |
Token | solve |
Token ID | 8494 |
Feature activation | +5.68e-03 |
Pos logit contributions | |
enny | +0.002 |
unn | +0.002 |
ipop | +0.002 |
oured | +0.002 |
uddy | +0.002 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
her | -0.001 |
things | -0.001 |
Token | It |
Token ID | 632 |
Feature activation | -2.96e-03 |
Pos logit contributions | |
ache | +0.001 |
drop | +0.000 |
driver | +0.000 |
unn | +0.000 |
seek | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
her | -0.000 |
everything | -0.000 |
Token | was |
Token ID | 373 |
Feature activation | +6.56e-04 |
Pos logit contributions | |
unn | +0.007 |
oured | +0.007 |
enny | +0.007 |
driver | +0.007 |
ider | +0.007 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
her | -0.002 |
them | -0.002 |
it | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | +1.52e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
her | +0.000 |
them | +0.000 |
his | +0.000 |
Neg logit contributions | |
unn | -0.002 |
opus | -0.002 |
enny | -0.002 |
uddy | -0.002 |
seek | -0.002 |
Token | big |
Token ID | 1263 |
Feature activation | -1.34e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.001 |
fog | +0.001 |
them | +0.001 |
her | +0.001 |
Neg logit contributions | |
unn | -0.004 |
seek | -0.004 |
enny | -0.004 |
ives | -0.004 |
oured | -0.004 |
Token | j |
Token ID | 474 |
Feature activation | -2.47e-02 |
Pos logit contributions | |
unn | +0.003 |
enny | +0.003 |
seek | +0.003 |
ives | +0.003 |
uts | +0.003 |
Neg logit contributions | |
its | -0.002 |
their | -0.001 |
things | -0.001 |
fog | -0.001 |
it | -0.001 |
Token | igsaw |
Token ID | 45636 |
Feature activation | -6.69e-02 |
Pos logit contributions | |
ache | +0.017 |
sed | +0.016 |
driver | +0.015 |
drop | +0.014 |
seek | +0.014 |
Neg logit contributions | |
its | -0.062 |
away | -0.057 |
their | -0.057 |
them | -0.056 |
things | -0.055 |
Token | puzzle |
Token ID | 15027 |
Feature activation | -3.67e-04 |
Pos logit contributions | |
sed | +0.114 |
ucker | +0.113 |
oured | +0.113 |
unn | +0.111 |
enny | +0.110 |
Neg logit contributions | |
its | -0.100 |
their | -0.091 |
things | -0.089 |
them | -0.086 |
it | -0.084 |
Token | and |
Token ID | 290 |
Feature activation | -1.19e-04 |
Pos logit contributions | |
unn | +0.001 |
ucker | +0.001 |
oured | +0.001 |
enny | +0.001 |
sed | +0.001 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
her | -0.000 |
things | -0.000 |
them | -0.000 |
Token | she |
Token ID | 673 |
Feature activation | -1.15e-03 |
Pos logit contributions | |
unn | +0.000 |
ache | +0.000 |
uddy | +0.000 |
driver | +0.000 |
enny | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
it | -0.000 |
her | -0.000 |
them | -0.000 |
Token | wanted |
Token ID | 2227 |
Feature activation | -2.46e-03 |
Pos logit contributions | |
unn | +0.003 |
uddy | +0.003 |
oured | +0.003 |
� | +0.003 |
ucker | +0.003 |
Neg logit contributions | |
its | -0.001 |
it | -0.001 |
their | -0.001 |
her | -0.001 |
them | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | -1.49e-03 |
Pos logit contributions | |
unn | +0.005 |
uddy | +0.005 |
opus | +0.005 |
enny | +0.005 |
drop | +0.005 |
Neg logit contributions | |
its | -0.004 |
them | -0.003 |
their | -0.003 |
it | -0.003 |
her | -0.003 |
Token | box |
Token ID | 3091 |
Feature activation | -4.06e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
everything | +0.003 |
her | +0.003 |
Neg logit contributions | |
enny | -0.003 |
driver | -0.003 |
oured | -0.003 |
ipop | -0.003 |
drop | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +2.89e-03 |
Pos logit contributions | |
unn | +0.008 |
enny | +0.008 |
ache | +0.008 |
drop | +0.008 |
uddy | +0.008 |
Neg logit contributions | |
its | -0.005 |
their | -0.005 |
them | -0.004 |
her | -0.004 |
it | -0.004 |
Token | saw |
Token ID | 2497 |
Feature activation | +7.48e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.005 |
oured | -0.004 |
ipop | -0.004 |
driver | -0.004 |
drop | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | +3.92e-03 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.018 |
drop | -0.018 |
unn | -0.018 |
uddy | -0.017 |
ache | -0.017 |
Token | j |
Token ID | 474 |
Feature activation | -2.28e-02 |
Pos logit contributions | |
its | +0.005 |
their | +0.005 |
them | +0.004 |
things | +0.004 |
it | +0.004 |
Neg logit contributions | |
unn | -0.008 |
enny | -0.008 |
seek | -0.008 |
oured | -0.008 |
uddy | -0.007 |
Token | igsaw |
Token ID | 45636 |
Feature activation | -6.56e-02 |
Pos logit contributions | |
ache | +0.016 |
drop | +0.015 |
seek | +0.014 |
driver | +0.014 |
sed | +0.014 |
Neg logit contributions | |
its | -0.057 |
their | -0.053 |
away | -0.053 |
them | -0.052 |
things | -0.050 |
Token | puzzle |
Token ID | 15027 |
Feature activation | +1.10e-04 |
Pos logit contributions | |
enny | +0.110 |
unn | +0.110 |
oured | +0.109 |
ache | +0.108 |
uddy | +0.106 |
Neg logit contributions | |
its | -0.102 |
their | -0.093 |
them | -0.089 |
things | -0.086 |
it | -0.082 |
Token | inside |
Token ID | 2641 |
Feature activation | +4.94e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
it | +0.000 |
things | +0.000 |
Neg logit contributions | |
unn | -0.000 |
enny | -0.000 |
oured | -0.000 |
uddy | -0.000 |
ugg | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | -7.35e-04 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.003 |
fog | +0.003 |
things | +0.003 |
Neg logit contributions | |
enny | -0.011 |
oured | -0.011 |
drop | -0.011 |
driver | -0.011 |
ipop | -0.011 |
Token | He |
Token ID | 679 |
Feature activation | +1.23e-03 |
Pos logit contributions | |
enny | +0.001 |
ache | +0.001 |
drop | +0.001 |
unn | +0.001 |
oured | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
everything | -0.001 |
things | -0.001 |
Token | paused |
Token ID | 24487 |
Feature activation | +2.24e-03 |
Pos logit contributions | |
its | +0.001 |
it | +0.001 |
their | +0.001 |
his | +0.001 |
them | +0.001 |
Neg logit contributions | |
unn | -0.003 |
fault | -0.003 |
ache | -0.003 |
supervision | -0.003 |
uddy | -0.003 |
Token | gray |
Token ID | 12768 |
Feature activation | -8.99e-03 |
Pos logit contributions | |
enny | +0.023 |
oured | +0.021 |
unn | +0.021 |
ucker | +0.020 |
scar | +0.020 |
Neg logit contributions | |
its | -0.014 |
their | -0.012 |
things | -0.011 |
them | -0.011 |
fog | -0.010 |
Token | bird |
Token ID | 6512 |
Feature activation | -6.26e-03 |
Pos logit contributions | |
enny | +0.019 |
ucker | +0.018 |
seek | +0.018 |
oured | +0.018 |
unn | +0.018 |
Neg logit contributions | |
its | -0.012 |
their | -0.011 |
things | -0.010 |
them | -0.010 |
fog | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +7.67e-04 |
Pos logit contributions | |
enny | +0.016 |
unn | +0.015 |
coach | +0.015 |
oured | +0.015 |
ipop | +0.015 |
Neg logit contributions | |
its | -0.007 |
their | -0.005 |
them | -0.005 |
it | -0.004 |
her | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +9.97e-04 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
her | +0.001 |
it | +0.001 |
Neg logit contributions | |
enny | -0.002 |
unn | -0.002 |
olly | -0.002 |
� | -0.002 |
uddy | -0.002 |
Token | brave |
Token ID | 14802 |
Feature activation | -9.74e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
things | +0.001 |
them | +0.001 |
fog | +0.001 |
Neg logit contributions | |
enny | -0.002 |
seek | -0.002 |
unn | -0.002 |
ucker | -0.002 |
oured | -0.002 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.56e-02 |
Pos logit contributions | |
seek | +0.021 |
enny | +0.020 |
scar | +0.020 |
ll | +0.020 |
oured | +0.020 |
Neg logit contributions | |
its | -0.014 |
them | -0.011 |
their | -0.011 |
things | -0.010 |
it | -0.010 |
Token | m |
Token ID | 76 |
Feature activation | -4.06e-04 |
Pos logit contributions | |
enny | +0.124 |
seek | +0.119 |
oured | +0.118 |
ider | +0.114 |
driver | +0.114 |
Neg logit contributions | |
its | -0.098 |
their | -0.093 |
them | -0.093 |
things | -0.082 |
everything | -0.078 |
Token | unk |
Token ID | 2954 |
Feature activation | -1.47e-02 |
Pos logit contributions | |
enny | +0.001 |
seek | +0.001 |
rook | +0.001 |
oured | +0.001 |
� | +0.001 |
Neg logit contributions | |
its | -0.001 |
them | -0.001 |
their | -0.001 |
things | -0.001 |
her | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +2.13e-03 |
Pos logit contributions | |
unn | +0.033 |
enny | +0.033 |
seek | +0.032 |
driver | +0.032 |
� | +0.032 |
Neg logit contributions | |
its | -0.018 |
their | -0.015 |
them | -0.015 |
it | -0.012 |
her | -0.012 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.63e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
her | +0.002 |
it | +0.002 |
Neg logit contributions | |
ache | -0.005 |
drop | -0.005 |
unn | -0.005 |
enny | -0.005 |
driver | -0.005 |
Token | Once |
Token ID | 7454 |
Feature activation | +9.87e-03 |
Pos logit contributions | |
enny | +0.003 |
� | +0.003 |
uddy | +0.003 |
seek | +0.003 |
drop | +0.003 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
away | -0.002 |
things | -0.002 |
Token | , |
Token ID | 11 |
Feature activation | +2.25e-03 |
Pos logit contributions | |
uddy | +0.024 |
enny | +0.024 |
unn | +0.024 |
scar | +0.023 |
seek | +0.023 |
Neg logit contributions | |
its | -0.007 |
them | -0.005 |
their | -0.005 |
it | -0.004 |
her | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | +2.83e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
it | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.005 |
unn | -0.005 |
uddy | -0.005 |
ipop | -0.005 |
seek | -0.005 |
Token | had |
Token ID | 550 |
Feature activation | +5.93e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
it | +0.003 |
her | +0.003 |
Neg logit contributions | |
enny | -0.007 |
uddy | -0.007 |
unn | -0.006 |
� | -0.006 |
seek | -0.006 |
Token | a |
Token ID | 257 |
Feature activation | -1.05e-04 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
her | +0.005 |
it | +0.005 |
Neg logit contributions | |
uddy | -0.016 |
enny | -0.015 |
ider | -0.015 |
unn | -0.015 |
ipop | -0.015 |
Token | chocolate |
Token ID | 11311 |
Feature activation | -6.35e-03 |
Pos logit contributions | |
unn | +0.000 |
seek | +0.000 |
enny | +0.000 |
driver | +0.000 |
uddy | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
it | -0.000 |
things | -0.000 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.15e-02 |
Pos logit contributions | |
enny | +0.013 |
unn | +0.012 |
seek | +0.012 |
uddy | +0.012 |
oured | +0.012 |
Neg logit contributions | |
its | -0.009 |
their | -0.008 |
them | -0.008 |
things | -0.007 |
it | -0.007 |
Token | to |
Token ID | 284 |
Feature activation | -2.11e-03 |
Pos logit contributions | |
enny | +0.111 |
seek | +0.109 |
oured | +0.108 |
uddy | +0.105 |
ider | +0.104 |
Neg logit contributions | |
its | -0.090 |
their | -0.089 |
them | -0.089 |
things | -0.084 |
her | -0.077 |
Token | top |
Token ID | 1353 |
Feature activation | -3.11e-03 |
Pos logit contributions | |
enny | +0.004 |
unn | +0.004 |
oured | +0.004 |
uddy | +0.004 |
ache | +0.004 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
them | -0.003 |
her | -0.003 |
everything | -0.002 |
Token | it |
Token ID | 340 |
Feature activation | -2.85e-03 |
Pos logit contributions | |
sed | +0.007 |
enny | +0.007 |
oured | +0.007 |
unn | +0.007 |
uddy | +0.007 |
Neg logit contributions | |
its | -0.003 |
them | -0.003 |
their | -0.003 |
her | -0.002 |
it | -0.002 |
Token | off |
Token ID | 572 |
Feature activation | -2.01e-03 |
Pos logit contributions | |
enny | +0.007 |
unn | +0.007 |
uddy | +0.007 |
oured | +0.007 |
driver | +0.006 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
her | -0.002 |
everything | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +2.62e-03 |
Pos logit contributions | |
unn | +0.005 |
enny | +0.005 |
ache | +0.005 |
oured | +0.005 |
drop | +0.005 |
Neg logit contributions | |
its | -0.002 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
it | -0.001 |
Token | corner |
Token ID | 5228 |
Feature activation | +4.98e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
things | +0.004 |
fog | +0.003 |
Neg logit contributions | |
enny | -0.007 |
unn | -0.007 |
uddy | -0.007 |
ipop | -0.006 |
driver | -0.006 |
Token | and |
Token ID | 290 |
Feature activation | +5.86e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
her | +0.004 |
things | +0.004 |
Neg logit contributions | |
unn | -0.011 |
ache | -0.011 |
enny | -0.011 |
opus | -0.011 |
ipop | -0.011 |
Token | saw |
Token ID | 2497 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
its | +0.010 |
their | +0.009 |
them | +0.009 |
things | +0.008 |
everything | +0.008 |
Neg logit contributions | |
enny | -0.009 |
oured | -0.008 |
drop | -0.008 |
ipop | -0.008 |
ache | -0.008 |
Token | a |
Token ID | 257 |
Feature activation | +1.32e-03 |
Pos logit contributions | |
its | +0.011 |
their | +0.009 |
them | +0.009 |
her | +0.007 |
things | +0.006 |
Neg logit contributions | |
enny | -0.024 |
unn | -0.024 |
ache | -0.023 |
uddy | -0.023 |
drop | -0.023 |
Token | little |
Token ID | 1310 |
Feature activation | -8.28e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
fog | +0.001 |
Neg logit contributions | |
unn | -0.003 |
enny | -0.003 |
seek | -0.003 |
oured | -0.003 |
driver | -0.003 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.15e-02 |
Pos logit contributions | |
enny | +0.016 |
seek | +0.016 |
unn | +0.016 |
uddy | +0.015 |
scar | +0.015 |
Neg logit contributions | |
its | -0.012 |
their | -0.011 |
them | -0.010 |
things | -0.010 |
it | -0.009 |
Token | m |
Token ID | 76 |
Feature activation | +2.41e-03 |
Pos logit contributions | |
enny | +0.092 |
oured | +0.090 |
seek | +0.089 |
driver | +0.086 |
ache | +0.084 |
Neg logit contributions | |
its | -0.109 |
their | -0.107 |
them | -0.106 |
things | -0.096 |
her | -0.093 |
Token | unk |
Token ID | 2954 |
Feature activation | -9.96e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
her | +0.004 |
things | +0.004 |
Neg logit contributions | |
seek | -0.004 |
oured | -0.003 |
enny | -0.003 |
unn | -0.003 |
Indians | -0.003 |
Token | running |
Token ID | 2491 |
Feature activation | -5.21e-03 |
Pos logit contributions | |
unn | +0.026 |
enny | +0.025 |
seek | +0.025 |
ipop | +0.024 |
oured | +0.024 |
Neg logit contributions | |
its | -0.008 |
their | -0.007 |
them | -0.007 |
her | -0.005 |
it | -0.005 |
Token | away |
Token ID | 1497 |
Feature activation | +4.61e-03 |
Pos logit contributions | |
enny | +0.010 |
oured | +0.010 |
driver | +0.010 |
seek | +0.010 |
drop | +0.010 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
things | -0.004 |
everything | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +3.52e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
her | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.012 |
unn | -0.012 |
oured | -0.012 |
ipop | -0.012 |
ache | -0.011 |
Token | time |
Token ID | 640 |
Feature activation | +1.33e-03 |
Pos logit contributions | |
oured | +0.024 |
driver | +0.024 |
enny | +0.024 |
seek | +0.023 |
ache | +0.023 |
Neg logit contributions | |
its | -0.009 |
their | -0.008 |
them | -0.007 |
her | -0.006 |
everything | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +2.32e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
things | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.002 |
uddy | -0.002 |
unn | -0.002 |
drop | -0.002 |
ipop | -0.002 |
Token | there |
Token ID | 612 |
Feature activation | +9.18e-04 |
Pos logit contributions | |
its | +0.002 |
them | +0.002 |
their | +0.002 |
things | +0.002 |
away | +0.002 |
Neg logit contributions | |
enny | -0.005 |
drop | -0.005 |
driver | -0.005 |
ipop | -0.005 |
uddy | -0.005 |
Token | was |
Token ID | 373 |
Feature activation | +2.22e-03 |
Pos logit contributions | |
its | +0.001 |
them | +0.001 |
their | +0.001 |
away | +0.001 |
fires | +0.001 |
Neg logit contributions | |
enny | -0.001 |
uddy | -0.001 |
drop | -0.001 |
seek | -0.001 |
ipop | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | -5.41e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
everything | +0.002 |
Neg logit contributions | |
enny | -0.005 |
drop | -0.004 |
oured | -0.004 |
unn | -0.004 |
ache | -0.004 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.13e-02 |
Pos logit contributions | |
enny | +0.008 |
ache | +0.008 |
drop | +0.008 |
opus | +0.007 |
uddy | +0.007 |
Neg logit contributions | |
its | -0.010 |
them | -0.008 |
their | -0.008 |
things | -0.007 |
everything | -0.007 |
Token | m |
Token ID | 76 |
Feature activation | +2.33e-03 |
Pos logit contributions | |
oured | +0.093 |
enny | +0.091 |
seek | +0.087 |
driver | +0.086 |
unn | +0.083 |
Neg logit contributions | |
its | -0.110 |
their | -0.103 |
them | -0.099 |
things | -0.092 |
her | -0.090 |
Token | unk |
Token ID | 2954 |
Feature activation | -1.37e-02 |
Pos logit contributions | |
its | +0.005 |
their | +0.005 |
them | +0.005 |
things | +0.004 |
her | +0.004 |
Neg logit contributions | |
oured | -0.003 |
seek | -0.003 |
enny | -0.002 |
driver | -0.002 |
drop | -0.002 |
Token | who |
Token ID | 508 |
Feature activation | -6.13e-03 |
Pos logit contributions | |
oured | +0.031 |
enny | +0.030 |
driver | +0.030 |
unn | +0.030 |
seek | +0.029 |
Neg logit contributions | |
its | -0.016 |
their | -0.013 |
them | -0.012 |
her | -0.011 |
his | -0.010 |
Token | lived |
Token ID | 5615 |
Feature activation | +2.70e-02 |
Pos logit contributions | |
enny | +0.012 |
oured | +0.012 |
unn | +0.012 |
ipop | +0.011 |
driver | +0.011 |
Neg logit contributions | |
its | -0.009 |
their | -0.008 |
them | -0.007 |
her | -0.006 |
everything | -0.006 |
Token | in |
Token ID | 287 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
its | +0.022 |
their | +0.017 |
them | +0.016 |
things | +0.011 |
her | +0.011 |
Neg logit contributions | |
enny | -0.066 |
oured | -0.064 |
unn | -0.064 |
ache | -0.064 |
drop | -0.064 |
Token | floor |
Token ID | 4314 |
Feature activation | -1.88e-02 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
things | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.004 |
driver | -0.004 |
unn | -0.004 |
uddy | -0.004 |
oured | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +2.60e-03 |
Pos logit contributions | |
unn | +0.060 |
enny | +0.059 |
uddy | +0.058 |
opus | +0.057 |
ipop | +0.057 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.004 |
. | -0.001 |
it | +0.000 |
Token |
|
Token ID | 198 |
Feature activation | +3.63e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.002 |
everything | +0.002 |
her | +0.002 |
Neg logit contributions | |
ache | -0.005 |
enny | -0.005 |
unn | -0.005 |
drop | -0.005 |
driver | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | +3.56e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
things | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.008 |
oured | -0.007 |
unn | -0.007 |
ache | -0.007 |
drop | -0.007 |
Token | The |
Token ID | 464 |
Feature activation | -1.27e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
her | +0.004 |
it | +0.004 |
Neg logit contributions | |
unn | -0.007 |
oured | -0.007 |
ache | -0.007 |
ipop | -0.007 |
drop | -0.007 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.10e-02 |
Pos logit contributions | |
seek | +0.003 |
enny | +0.003 |
ucker | +0.003 |
driver | +0.003 |
uts | +0.003 |
Neg logit contributions | |
things | -0.002 |
its | -0.001 |
fog | -0.001 |
ash | -0.001 |
their | -0.001 |
Token | mun |
Token ID | 6199 |
Feature activation | +7.80e-03 |
Pos logit contributions | |
seek | +0.113 |
oured | +0.110 |
enny | +0.108 |
driver | +0.107 |
powers | +0.105 |
Neg logit contributions | |
its | -0.086 |
their | -0.085 |
them | -0.082 |
things | -0.080 |
her | -0.075 |
Token | ks |
Token ID | 591 |
Feature activation | -6.38e-03 |
Pos logit contributions | |
its | +0.012 |
their | +0.011 |
them | +0.011 |
her | +0.009 |
things | +0.009 |
Neg logit contributions | |
enny | -0.014 |
� | -0.013 |
oured | -0.013 |
ipop | -0.013 |
ache | -0.013 |
Token | were |
Token ID | 547 |
Feature activation | +3.99e-03 |
Pos logit contributions | |
unn | +0.013 |
supervision | +0.012 |
ucker | +0.012 |
uddy | +0.012 |
salon | +0.012 |
Neg logit contributions | |
its | -0.009 |
them | -0.009 |
their | -0.008 |
her | -0.007 |
it | -0.007 |
Token | very |
Token ID | 845 |
Feature activation | +4.66e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
her | +0.003 |
his | +0.003 |
Neg logit contributions | |
enny | -0.010 |
unn | -0.010 |
driver | -0.010 |
opus | -0.010 |
ipop | -0.010 |
Token | curious |
Token ID | 11040 |
Feature activation | +5.61e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.006 |
them | +0.005 |
her | +0.004 |
things | +0.004 |
Neg logit contributions | |
driver | -0.009 |
enny | -0.009 |
drop | -0.009 |
ache | -0.009 |
seek | -0.009 |
Token | very |
Token ID | 845 |
Feature activation | +3.35e-03 |
Pos logit contributions | |
its | +0.008 |
their | +0.008 |
them | +0.007 |
her | +0.006 |
out | +0.006 |
Neg logit contributions | |
enny | -0.012 |
driver | -0.011 |
unn | -0.011 |
seek | -0.011 |
opus | -0.011 |
Token | excited |
Token ID | 6568 |
Feature activation | -4.30e-03 |
Pos logit contributions | |
their | +0.004 |
its | +0.004 |
them | +0.004 |
her | +0.003 |
things | +0.003 |
Neg logit contributions | |
enny | -0.007 |
driver | -0.007 |
seek | -0.007 |
drop | -0.007 |
ache | -0.007 |
Token | to |
Token ID | 284 |
Feature activation | +9.66e-04 |
Pos logit contributions | |
enny | +0.009 |
driver | +0.009 |
oured | +0.009 |
unn | +0.009 |
ipop | +0.009 |
Neg logit contributions | |
its | -0.005 |
their | -0.005 |
them | -0.005 |
things | -0.004 |
her | -0.004 |
Token | bake |
Token ID | 28450 |
Feature activation | +1.85e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
her | +0.001 |
things | +0.001 |
Neg logit contributions | |
enny | -0.002 |
unn | -0.002 |
ache | -0.002 |
drop | -0.002 |
oured | -0.002 |
Token | chocolate |
Token ID | 11311 |
Feature activation | -6.03e-03 |
Pos logit contributions | |
its | +0.002 |
away | +0.002 |
Wow | +0.002 |
south | +0.002 |
them | +0.002 |
Neg logit contributions | |
chip | -0.003 |
drop | -0.003 |
oured | -0.003 |
ipop | -0.003 |
ache | -0.003 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.07e-02 |
Pos logit contributions | |
enny | +0.012 |
drop | +0.012 |
ache | +0.012 |
oured | +0.012 |
ipop | +0.012 |
Neg logit contributions | |
its | -0.007 |
their | -0.006 |
them | -0.006 |
things | -0.005 |
everything | -0.005 |
Token | cookies |
Token ID | 14746 |
Feature activation | -5.11e-03 |
Pos logit contributions | |
enny | +0.102 |
oured | +0.096 |
driver | +0.095 |
uddy | +0.095 |
seek | +0.094 |
Neg logit contributions | |
its | -0.096 |
their | -0.093 |
them | -0.092 |
things | -0.083 |
her | -0.080 |
Token | . |
Token ID | 13 |
Feature activation | +4.62e-03 |
Pos logit contributions | |
enny | +0.013 |
unn | +0.012 |
uddy | +0.012 |
oured | +0.012 |
ache | +0.012 |
Neg logit contributions | |
its | -0.004 |
their | -0.004 |
them | -0.003 |
her | -0.002 |
everything | -0.002 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.72e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
her | +0.003 |
everything | +0.003 |
Neg logit contributions | |
ache | -0.010 |
unn | -0.010 |
enny | -0.010 |
drop | -0.010 |
driver | -0.010 |
Token | helped |
Token ID | 4193 |
Feature activation | -1.79e-03 |
Pos logit contributions | |
unn | +0.006 |
seek | +0.006 |
uddy | +0.006 |
igsaw | +0.006 |
coach | +0.006 |
Neg logit contributions | |
its | -0.003 |
her | -0.003 |
their | -0.003 |
it | -0.002 |
them | -0.002 |
Token | her |
Token ID | 607 |
Feature activation | -5.38e-03 |
Pos logit contributions | |
enny | +0.005 |
unn | +0.005 |
oured | +0.005 |
ache | +0.005 |
seek | +0.005 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
her | -0.000 |
things | -0.000 |
Token | was |
Token ID | 373 |
Feature activation | +3.55e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
it | +0.004 |
things | +0.004 |
Neg logit contributions | |
enny | -0.008 |
� | -0.007 |
ipop | -0.007 |
seek | -0.007 |
unn | -0.007 |
Token | so |
Token ID | 523 |
Feature activation | +3.05e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.003 |
her | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.008 |
unn | -0.008 |
oured | -0.008 |
ipop | -0.008 |
driver | -0.008 |
Token | clever |
Token ID | 14169 |
Feature activation | -5.95e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
her | +0.002 |
everything | +0.002 |
Neg logit contributions | |
enny | -0.007 |
oured | -0.007 |
driver | -0.007 |
ache | -0.007 |
seek | -0.007 |
Token | of |
Token ID | 286 |
Feature activation | -6.89e-03 |
Pos logit contributions | |
oured | +0.015 |
enny | +0.015 |
� | +0.015 |
ucker | +0.014 |
salon | +0.014 |
Neg logit contributions | |
its | -0.006 |
them | -0.004 |
their | -0.004 |
it | -0.004 |
things | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +3.01e-03 |
Pos logit contributions | |
enny | +0.017 |
ache | +0.016 |
oured | +0.016 |
unn | +0.016 |
ipop | +0.016 |
Neg logit contributions | |
its | -0.007 |
their | -0.005 |
them | -0.005 |
things | -0.004 |
everything | -0.004 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.03e-02 |
Pos logit contributions | |
things | +0.005 |
their | +0.004 |
them | +0.004 |
its | +0.004 |
ash | +0.004 |
Neg logit contributions | |
enny | -0.006 |
driver | -0.006 |
seek | -0.005 |
oured | -0.005 |
enna | -0.005 |
Token | m |
Token ID | 76 |
Feature activation | +3.68e-03 |
Pos logit contributions | |
oured | +0.097 |
enny | +0.096 |
seek | +0.093 |
driver | +0.089 |
sed | +0.089 |
Neg logit contributions | |
its | -0.100 |
their | -0.098 |
them | -0.098 |
things | -0.095 |
her | -0.086 |
Token | unk |
Token ID | 2954 |
Feature activation | -5.69e-03 |
Pos logit contributions | |
its | +0.007 |
them | +0.006 |
their | +0.006 |
things | +0.006 |
it | +0.006 |
Neg logit contributions | |
seek | -0.006 |
enny | -0.005 |
oured | -0.005 |
rook | -0.005 |
bars | -0.005 |
Token | to |
Token ID | 284 |
Feature activation | -5.59e-04 |
Pos logit contributions | |
enny | +0.014 |
� | +0.014 |
ucker | +0.014 |
oured | +0.014 |
seek | +0.014 |
Neg logit contributions | |
its | -0.005 |
their | -0.004 |
them | -0.004 |
it | -0.004 |
down | -0.003 |
Token | hide |
Token ID | 7808 |
Feature activation | +6.55e-03 |
Pos logit contributions | |
enny | +0.001 |
driver | +0.001 |
unn | +0.001 |
ipop | +0.001 |
ider | +0.001 |
Neg logit contributions | |
its | -0.001 |
them | -0.001 |
their | -0.001 |
her | -0.001 |
him | -0.001 |
Token | from |
Token ID | 422 |
Feature activation | +7.04e-03 |
Pos logit contributions | |
its | +0.008 |
their | +0.007 |
them | +0.006 |
things | +0.005 |
everything | +0.005 |
Neg logit contributions | |
enny | -0.013 |
driver | -0.013 |
oured | -0.013 |
ache | -0.013 |
unn | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | +2.46e-03 |
Pos logit contributions | |
enny | +0.031 |
unn | +0.030 |
ipop | +0.030 |
oured | +0.029 |
driver | +0.029 |
Neg logit contributions | |
its | -0.008 |
their | -0.006 |
them | -0.005 |
her | -0.003 |
it | -0.003 |
Token | It |
Token ID | 632 |
Feature activation | -3.12e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
her | +0.002 |
it | +0.002 |
Neg logit contributions | |
ache | -0.005 |
enny | -0.005 |
unn | -0.005 |
drop | -0.005 |
driver | -0.005 |
Token | was |
Token ID | 373 |
Feature activation | +2.07e-03 |
Pos logit contributions | |
enny | +0.006 |
unn | +0.006 |
ipop | +0.006 |
driver | +0.006 |
oured | +0.006 |
Neg logit contributions | |
its | -0.004 |
their | -0.004 |
them | -0.004 |
her | -0.003 |
everything | -0.003 |
Token | a |
Token ID | 257 |
Feature activation | +1.90e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
her | +0.001 |
his | +0.001 |
Neg logit contributions | |
enny | -0.005 |
unn | -0.005 |
ipop | -0.005 |
opus | -0.005 |
driver | -0.005 |
Token | small |
Token ID | 1402 |
Feature activation | -3.12e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
fog | +0.002 |
them | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.004 |
unn | -0.004 |
seek | -0.004 |
oured | -0.004 |
driver | -0.004 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.03e-02 |
Pos logit contributions | |
enny | +0.007 |
seek | +0.007 |
scar | +0.006 |
ll | +0.006 |
ave | +0.006 |
Neg logit contributions | |
its | -0.004 |
their | -0.003 |
things | -0.003 |
fog | -0.003 |
ash | -0.003 |
Token | m |
Token ID | 76 |
Feature activation | +4.54e-03 |
Pos logit contributions | |
seek | +0.103 |
oured | +0.102 |
enny | +0.101 |
driver | +0.098 |
sed | +0.097 |
Neg logit contributions | |
its | -0.096 |
their | -0.088 |
them | -0.087 |
things | -0.080 |
her | -0.079 |
Token | unk |
Token ID | 2954 |
Feature activation | -5.15e-03 |
Pos logit contributions | |
its | +0.009 |
their | +0.008 |
them | +0.008 |
her | +0.007 |
things | +0.007 |
Neg logit contributions | |
seek | -0.007 |
enny | -0.006 |
salon | -0.006 |
oured | -0.006 |
coach | -0.006 |
Token | ! |
Token ID | 0 |
Feature activation | -3.84e-03 |
Pos logit contributions | |
seek | +0.013 |
unn | +0.013 |
enny | +0.013 |
oured | +0.012 |
ucker | +0.012 |
Neg logit contributions | |
its | -0.005 |
their | -0.003 |
them | -0.003 |
it | -0.003 |
her | -0.003 |
Token | The |
Token ID | 383 |
Feature activation | -5.25e-03 |
Pos logit contributions | |
ache | +0.008 |
unn | +0.008 |
drop | +0.008 |
driver | +0.008 |
seek | +0.008 |
Neg logit contributions | |
its | -0.004 |
their | -0.004 |
them | -0.003 |
her | -0.003 |
it | -0.003 |
Token | princess |
Token ID | 21752 |
Feature activation | +7.42e-03 |
Pos logit contributions | |
enny | +0.012 |
seek | +0.012 |
driver | +0.011 |
unn | +0.011 |
enna | +0.011 |
Neg logit contributions | |
things | -0.006 |
its | -0.005 |
people | -0.005 |
their | -0.005 |
ash | -0.005 |
Token | a |
Token ID | 257 |
Feature activation | +2.38e-03 |
Pos logit contributions | |
enny | +0.014 |
oured | +0.013 |
ache | +0.013 |
drop | +0.013 |
unn | +0.013 |
Neg logit contributions | |
its | -0.005 |
their | -0.004 |
them | -0.004 |
things | -0.003 |
everything | -0.003 |
Token | special |
Token ID | 2041 |
Feature activation | -1.86e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
things | +0.003 |
it | +0.003 |
Neg logit contributions | |
enny | -0.004 |
unn | -0.004 |
seek | -0.004 |
uddy | -0.004 |
oured | -0.004 |
Token | treat |
Token ID | 2190 |
Feature activation | +8.29e-03 |
Pos logit contributions | |
enny | +0.004 |
unn | +0.004 |
seek | +0.003 |
uddy | +0.003 |
ucker | +0.003 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
things | -0.002 |
it | -0.002 |
Token | for |
Token ID | 329 |
Feature activation | +9.41e-04 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
her | +0.003 |
it | +0.003 |
Neg logit contributions | |
enny | -0.021 |
unn | -0.021 |
oured | -0.021 |
seek | -0.021 |
uddy | -0.020 |
Token | the |
Token ID | 262 |
Feature activation | +1.24e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.000 |
them | +0.000 |
things | +0.000 |
everything | +0.000 |
Neg logit contributions | |
enny | -0.002 |
oured | -0.002 |
drop | -0.002 |
ache | -0.002 |
ipop | -0.002 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.00e-02 |
Pos logit contributions | |
things | +0.002 |
ash | +0.001 |
people | +0.001 |
its | +0.001 |
them | +0.001 |
Neg logit contributions | |
enny | -0.003 |
driver | -0.002 |
enna | -0.002 |
oured | -0.002 |
ucker | -0.002 |
Token | m |
Token ID | 76 |
Feature activation | +3.25e-03 |
Pos logit contributions | |
oured | +0.092 |
enny | +0.091 |
seek | +0.089 |
driver | +0.088 |
sed | +0.088 |
Neg logit contributions | |
its | -0.099 |
them | -0.098 |
their | -0.098 |
things | -0.094 |
her | -0.090 |
Token | unk |
Token ID | 2954 |
Feature activation | -4.17e-03 |
Pos logit contributions | |
its | +0.006 |
them | +0.005 |
their | +0.005 |
things | +0.005 |
her | +0.005 |
Neg logit contributions | |
seek | -0.005 |
oured | -0.005 |
enny | -0.005 |
rook | -0.005 |
Indians | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -8.05e-04 |
Pos logit contributions | |
unn | +0.011 |
� | +0.011 |
opus | +0.011 |
seek | +0.011 |
enny | +0.011 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
her | -0.002 |
them | -0.002 |
it | -0.002 |
Token | She |
Token ID | 1375 |
Feature activation | +1.84e-03 |
Pos logit contributions | |
ache | +0.002 |
drop | +0.002 |
unn | +0.002 |
enny | +0.002 |
opus | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
it | -0.001 |
Token | said |
Token ID | 531 |
Feature activation | -5.66e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
it | +0.002 |
her | +0.002 |
them | +0.002 |
Neg logit contributions | |
unn | -0.004 |
seek | -0.004 |
uddy | -0.004 |
fault | -0.004 |
ider | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | +1.85e-04 |
Pos logit contributions | |
enny | +0.011 |
unn | +0.010 |
uddy | +0.010 |
oured | +0.010 |
ache | +0.010 |
Neg logit contributions | |
its | -0.006 |
their | -0.006 |
them | -0.006 |
things | -0.005 |
her | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | +2.91e-03 |
Pos logit contributions | |
its | +0.000 |
them | +0.000 |
their | +0.000 |
her | +0.000 |
it | +0.000 |
Neg logit contributions | |
enny | -0.000 |
seek | -0.000 |
uddy | -0.000 |
unn | -0.000 |
opus | -0.000 |
Token | even |
Token ID | 772 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
her | +0.004 |
it | +0.004 |
Neg logit contributions | |
uddy | -0.006 |
enny | -0.006 |
seek | -0.005 |
unn | -0.005 |
opus | -0.005 |
Token | mint |
Token ID | 21043 |
Feature activation | -5.82e-03 |
Pos logit contributions | |
its | +0.019 |
their | +0.018 |
them | +0.018 |
her | +0.017 |
his | +0.016 |
Neg logit contributions | |
uddy | -0.029 |
enny | -0.028 |
opus | -0.028 |
sed | -0.027 |
seek | -0.027 |
Token | chocolate |
Token ID | 11311 |
Feature activation | -2.93e-03 |
Pos logit contributions | |
enny | +0.011 |
sed | +0.011 |
uddy | +0.011 |
rivals | +0.011 |
coach | +0.011 |
Neg logit contributions | |
its | -0.008 |
them | -0.008 |
their | -0.007 |
things | -0.007 |
her | -0.007 |
Token | chip |
Token ID | 11594 |
Feature activation | -6.00e-02 |
Pos logit contributions | |
enny | +0.007 |
unn | +0.006 |
uddy | +0.006 |
oured | +0.006 |
seek | +0.006 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
them | -0.003 |
things | -0.002 |
her | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +2.15e-03 |
Pos logit contributions | |
enny | +0.100 |
uddy | +0.096 |
sed | +0.094 |
oured | +0.094 |
driver | +0.094 |
Neg logit contributions | |
its | -0.097 |
them | -0.096 |
their | -0.095 |
things | -0.088 |
her | -0.084 |
Token | But |
Token ID | 887 |
Feature activation | -2.52e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
her | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.004 |
ache | -0.004 |
unn | -0.004 |
drop | -0.004 |
oured | -0.004 |
Token | her |
Token ID | 607 |
Feature activation | -2.82e-03 |
Pos logit contributions | |
unn | +0.005 |
enny | +0.005 |
ache | +0.005 |
seek | +0.005 |
uddy | +0.005 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
them | -0.003 |
her | -0.003 |
it | -0.003 |
Token | favorite |
Token ID | 4004 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
enny | +0.007 |
driver | +0.006 |
seek | +0.006 |
ives | +0.006 |
unn | +0.006 |
Neg logit contributions | |
things | -0.003 |
its | -0.003 |
their | -0.003 |
it | -0.003 |
everything | -0.003 |
Token | was |
Token ID | 373 |
Feature activation | +1.77e-03 |
Pos logit contributions | |
its | +0.020 |
their | +0.018 |
them | +0.018 |
things | +0.017 |
it | +0.017 |
Neg logit contributions | |
enny | -0.028 |
unn | -0.027 |
driver | -0.027 |
uddy | -0.027 |
seek | -0.026 |
Token | place |
Token ID | 1295 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
enny | +0.014 |
oured | +0.014 |
unn | +0.014 |
ache | +0.014 |
drop | +0.014 |
Neg logit contributions | |
its | -0.004 |
their | -0.003 |
them | -0.003 |
things | -0.002 |
everything | -0.002 |
Token | ! |
Token ID | 0 |
Feature activation | -3.30e-03 |
Pos logit contributions | |
its | +0.013 |
their | +0.012 |
them | +0.011 |
it | +0.009 |
everything | +0.009 |
Neg logit contributions | |
unn | -0.025 |
enny | -0.025 |
ache | -0.024 |
opus | -0.024 |
uddy | -0.024 |
Token |
|
Token ID | 198 |
Feature activation | +2.11e-04 |
Pos logit contributions | |
ache | +0.008 |
drop | +0.008 |
unn | +0.008 |
ipop | +0.008 |
driver | +0.007 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
them | -0.003 |
it | -0.002 |
everything | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | +1.71e-04 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
everything | +0.000 |
it | +0.000 |
Neg logit contributions | |
ache | -0.000 |
oured | -0.000 |
enny | -0.000 |
ipop | -0.000 |
drop | -0.000 |
Token | The |
Token ID | 464 |
Feature activation | -2.44e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
everything | +0.000 |
it | +0.000 |
Neg logit contributions | |
unn | -0.000 |
ipop | -0.000 |
sed | -0.000 |
oured | -0.000 |
ache | -0.000 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.96e-02 |
Pos logit contributions | |
enny | +0.006 |
enna | +0.005 |
seek | +0.005 |
ives | +0.005 |
uts | +0.005 |
Neg logit contributions | |
things | -0.003 |
their | -0.003 |
ash | -0.003 |
people | -0.003 |
fog | -0.003 |
Token | mun |
Token ID | 6199 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
seek | +0.111 |
oured | +0.109 |
enny | +0.107 |
driver | +0.106 |
sed | +0.105 |
Neg logit contributions | |
their | -0.082 |
its | -0.081 |
them | -0.079 |
things | -0.078 |
her | -0.072 |
Token | ks |
Token ID | 591 |
Feature activation | -3.52e-03 |
Pos logit contributions | |
its | +0.016 |
their | +0.014 |
them | +0.013 |
her | +0.011 |
things | +0.011 |
Neg logit contributions | |
enny | -0.019 |
� | -0.019 |
ipop | -0.018 |
oured | -0.018 |
seek | -0.018 |
Token | didn |
Token ID | 1422 |
Feature activation | -3.58e-04 |
Pos logit contributions | |
unn | +0.007 |
ucker | +0.007 |
supervision | +0.007 |
enny | +0.007 |
salon | +0.007 |
Neg logit contributions | |
its | -0.005 |
them | -0.005 |
their | -0.005 |
it | -0.004 |
her | -0.004 |
Token | 't |
Token ID | 470 |
Feature activation | -8.04e-03 |
Pos logit contributions | |
unn | +0.000 |
enny | +0.000 |
ipop | +0.000 |
oured | +0.000 |
ache | +0.000 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
it | -0.001 |
Token | know |
Token ID | 760 |
Feature activation | +1.20e-03 |
Pos logit contributions | |
enny | +0.014 |
oured | +0.013 |
unn | +0.013 |
uddy | +0.013 |
ipop | +0.013 |
Neg logit contributions | |
its | -0.013 |
their | -0.012 |
them | -0.011 |
her | -0.010 |
things | -0.010 |
Token | The |
Token ID | 464 |
Feature activation | -1.98e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
his | +0.001 |
her | +0.001 |
Neg logit contributions | |
sed | -0.006 |
unn | -0.006 |
ipop | -0.006 |
oured | -0.006 |
drop | -0.006 |
Token | boy |
Token ID | 2933 |
Feature activation | -6.10e-03 |
Pos logit contributions | |
enny | +0.004 |
seek | +0.004 |
oured | +0.004 |
driver | +0.004 |
ives | +0.004 |
Neg logit contributions | |
things | -0.003 |
their | -0.002 |
ash | -0.002 |
its | -0.002 |
people | -0.002 |
Token | understood |
Token ID | 7247 |
Feature activation | -3.70e-03 |
Pos logit contributions | |
unn | +0.014 |
enny | +0.013 |
uddy | +0.013 |
igsaw | +0.013 |
driver | +0.013 |
Neg logit contributions | |
its | -0.007 |
their | -0.006 |
them | -0.006 |
it | -0.006 |
his | -0.006 |
Token | that |
Token ID | 326 |
Feature activation | +9.03e-03 |
Pos logit contributions | |
enny | +0.007 |
unn | +0.007 |
oured | +0.007 |
drop | +0.007 |
uddy | +0.007 |
Neg logit contributions | |
its | -0.005 |
their | -0.004 |
them | -0.004 |
her | -0.003 |
things | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +2.55e-03 |
Pos logit contributions | |
its | +0.009 |
their | +0.008 |
them | +0.007 |
it | +0.006 |
things | +0.006 |
Neg logit contributions | |
oured | -0.023 |
enny | -0.023 |
unn | -0.022 |
uddy | -0.022 |
drop | -0.022 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.95e-02 |
Pos logit contributions | |
things | +0.005 |
its | +0.004 |
their | +0.004 |
ash | +0.004 |
them | +0.004 |
Neg logit contributions | |
enny | -0.004 |
oured | -0.004 |
seek | -0.003 |
driver | -0.003 |
enna | -0.003 |
Token | m |
Token ID | 76 |
Feature activation | +3.97e-03 |
Pos logit contributions | |
oured | +0.092 |
seek | +0.091 |
enny | +0.091 |
sed | +0.086 |
ider | +0.086 |
Neg logit contributions | |
its | -0.097 |
them | -0.096 |
their | -0.095 |
things | -0.092 |
everything | -0.085 |
Token | unk |
Token ID | 2954 |
Feature activation | -5.40e-03 |
Pos logit contributions | |
its | +0.007 |
things | +0.007 |
them | +0.007 |
their | +0.006 |
his | +0.006 |
Neg logit contributions | |
seek | -0.006 |
oured | -0.006 |
enny | -0.006 |
rook | -0.006 |
tournament | -0.006 |
Token | was |
Token ID | 373 |
Feature activation | +4.42e-04 |
Pos logit contributions | |
seek | +0.012 |
unn | +0.012 |
coat | +0.011 |
oured | +0.011 |
enny | +0.011 |
Neg logit contributions | |
its | -0.007 |
their | -0.006 |
them | -0.006 |
it | -0.006 |
things | -0.006 |
Token | boss |
Token ID | 6478 |
Feature activation | +4.87e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
her | +0.000 |
his | +0.000 |
Neg logit contributions | |
enny | -0.001 |
unn | -0.001 |
uddy | -0.001 |
opus | -0.001 |
ipop | -0.001 |
Token | y |
Token ID | 88 |
Feature activation | -8.96e-03 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
down | +0.006 |
by | +0.006 |
Neg logit contributions | |
� | -0.010 |
seek | -0.009 |
sed | -0.009 |
ider | -0.009 |
coach | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | -1.14e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.000 |
them | +0.000 |
her | +0.000 |
everything | +0.000 |
Neg logit contributions | |
enny | -0.001 |
unn | -0.001 |
driver | -0.001 |
ache | -0.001 |
ipop | -0.001 |
Token | she |
Token ID | 673 |
Feature activation | +7.91e-04 |
Pos logit contributions | |
enny | +0.003 |
unn | +0.003 |
oured | +0.003 |
ache | +0.003 |
drop | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
her | -0.001 |
Token | noticed |
Token ID | 6810 |
Feature activation | +8.39e-03 |
Pos logit contributions | |
its | +0.001 |
them | +0.001 |
their | +0.001 |
it | +0.001 |
everything | +0.001 |
Neg logit contributions | |
unn | -0.002 |
uddy | -0.002 |
driver | -0.002 |
enny | -0.002 |
� | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | +3.81e-03 |
Pos logit contributions | |
its | +0.009 |
their | +0.008 |
them | +0.007 |
her | +0.006 |
everything | +0.006 |
Neg logit contributions | |
enny | -0.020 |
uddy | -0.019 |
unn | -0.019 |
ipop | -0.019 |
driver | -0.019 |
Token | little |
Token ID | 1310 |
Feature activation | -4.62e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
things | +0.004 |
fog | +0.004 |
Neg logit contributions | |
enny | -0.008 |
unn | -0.008 |
seek | -0.008 |
driver | -0.008 |
oured | -0.008 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.92e-02 |
Pos logit contributions | |
enny | +0.009 |
seek | +0.009 |
scar | +0.009 |
driver | +0.009 |
uddy | +0.009 |
Neg logit contributions | |
its | -0.007 |
their | -0.006 |
them | -0.006 |
things | -0.005 |
down | -0.005 |
Token | m |
Token ID | 76 |
Feature activation | +4.21e-03 |
Pos logit contributions | |
enny | +0.096 |
seek | +0.094 |
driver | +0.092 |
oured | +0.092 |
powers | +0.088 |
Neg logit contributions | |
its | -0.100 |
them | -0.095 |
their | -0.094 |
things | -0.085 |
her | -0.084 |
Token | unk |
Token ID | 2954 |
Feature activation | -9.94e-04 |
Pos logit contributions | |
its | +0.008 |
them | +0.008 |
their | +0.007 |
her | +0.007 |
things | +0.006 |
Neg logit contributions | |
seek | -0.006 |
enny | -0.006 |
oured | -0.006 |
rook | -0.006 |
driver | -0.006 |
Token | sc |
Token ID | 629 |
Feature activation | -8.33e-03 |
Pos logit contributions | |
unn | +0.002 |
enny | +0.002 |
seek | +0.002 |
ipop | +0.002 |
uddy | +0.002 |
Neg logit contributions | |
its | -0.001 |
them | -0.001 |
their | -0.001 |
it | -0.001 |
her | -0.001 |
Token | ur |
Token ID | 333 |
Feature activation | -2.64e-03 |
Pos logit contributions | |
va | +0.009 |
drop | +0.009 |
omo | +0.009 |
driver | +0.008 |
ache | +0.008 |
Neg logit contributions | |
its | -0.016 |
them | -0.014 |
their | -0.014 |
out | -0.014 |
down | -0.013 |
Token | rying |
Token ID | 14992 |
Feature activation | +8.67e-03 |
Pos logit contributions | |
enny | +0.004 |
unn | +0.004 |
ache | +0.004 |
oured | +0.004 |
drop | +0.004 |
Neg logit contributions | |
its | -0.004 |
their | -0.004 |
them | -0.004 |
things | -0.003 |
her | -0.003 |
Token | upon |
Token ID | 2402 |
Feature activation | -3.55e-05 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
out | +0.001 |
down | +0.001 |
Neg logit contributions | |
unn | -0.003 |
ipop | -0.003 |
ache | -0.003 |
opus | -0.003 |
drop | -0.003 |
Token | a |
Token ID | 257 |
Feature activation | +7.33e-04 |
Pos logit contributions | |
enny | +0.000 |
unn | +0.000 |
uddy | +0.000 |
oured | +0.000 |
ache | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
her | -0.000 |
things | -0.000 |
Token | very |
Token ID | 845 |
Feature activation | +3.83e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
it | +0.001 |
Neg logit contributions | |
unn | -0.002 |
seek | -0.002 |
driver | -0.002 |
enny | -0.001 |
ives | -0.001 |
Token | boss |
Token ID | 6478 |
Feature activation | +3.11e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.005 |
them | +0.004 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.007 |
driver | -0.007 |
drop | -0.007 |
unn | -0.007 |
seek | -0.007 |
Token | y |
Token ID | 88 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
its | +0.005 |
their | +0.005 |
them | +0.004 |
it | +0.004 |
his | +0.004 |
Neg logit contributions | |
seek | -0.005 |
sed | -0.005 |
ider | -0.005 |
� | -0.005 |
oured | -0.005 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.90e-02 |
Pos logit contributions | |
seek | +0.022 |
unn | +0.022 |
enny | +0.021 |
ucker | +0.021 |
driver | +0.021 |
Neg logit contributions | |
its | -0.015 |
their | -0.013 |
things | -0.013 |
them | -0.013 |
fog | -0.012 |
Token | m |
Token ID | 76 |
Feature activation | +4.71e-03 |
Pos logit contributions | |
enny | +0.088 |
oured | +0.087 |
seek | +0.087 |
sed | +0.085 |
driver | +0.084 |
Neg logit contributions | |
its | -0.100 |
their | -0.098 |
them | -0.097 |
things | -0.091 |
him | -0.086 |
Token | unk |
Token ID | 2954 |
Feature activation | -7.41e-03 |
Pos logit contributions | |
their | +0.008 |
its | +0.008 |
them | +0.008 |
things | +0.008 |
at | +0.007 |
Neg logit contributions | |
seventy | -0.007 |
seek | -0.007 |
oured | -0.007 |
enny | -0.007 |
rook | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +3.04e-03 |
Pos logit contributions | |
unn | +0.021 |
seek | +0.021 |
powers | +0.020 |
enny | +0.020 |
driver | +0.020 |
Neg logit contributions | |
its | -0.004 |
them | -0.003 |
their | -0.003 |
it | -0.002 |
. | -0.002 |
Token | The |
Token ID | 383 |
Feature activation | -2.37e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
his | +0.002 |
it | +0.002 |
Neg logit contributions | |
unn | -0.007 |
enny | -0.007 |
drop | -0.007 |
ache | -0.007 |
seek | -0.007 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.89e-02 |
Pos logit contributions | |
enny | +0.004 |
driver | +0.003 |
oured | +0.003 |
seek | +0.003 |
uddy | +0.003 |
Neg logit contributions | |
things | -0.004 |
its | -0.004 |
their | -0.004 |
them | -0.004 |
ash | -0.004 |
Token | |
Token ID | 220 |
Feature activation | -4.99e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
fires | +0.003 |
Neg logit contributions | |
enny | -0.006 |
oured | -0.006 |
uddy | -0.006 |
ipop | -0.006 |
unn | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +4.93e-03 |
Pos logit contributions | |
enny | +0.009 |
uddy | +0.009 |
driver | +0.008 |
ipop | +0.008 |
olly | +0.008 |
Neg logit contributions | |
its | -0.007 |
their | -0.006 |
them | -0.006 |
away | -0.005 |
fog | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | +4.49e-03 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
fires | +0.005 |
things | +0.005 |
Neg logit contributions | |
enny | -0.009 |
uddy | -0.009 |
seek | -0.009 |
unn | -0.008 |
olly | -0.008 |
Token | When |
Token ID | 2215 |
Feature activation | -7.39e-04 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
her | +0.005 |
things | +0.005 |
Neg logit contributions | |
enny | -0.008 |
oured | -0.008 |
unn | -0.008 |
ipop | -0.008 |
drop | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +1.75e-03 |
Pos logit contributions | |
� | +0.001 |
ipop | +0.001 |
enny | +0.001 |
drop | +0.001 |
va | +0.001 |
Neg logit contributions | |
its | -0.001 |
them | -0.001 |
away | -0.001 |
fires | -0.001 |
their | -0.001 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.90e-02 |
Pos logit contributions | |
things | +0.002 |
its | +0.002 |
ash | +0.002 |
fog | +0.002 |
their | +0.002 |
Neg logit contributions | |
enny | -0.003 |
oured | -0.003 |
driver | -0.003 |
seek | -0.003 |
rivals | -0.003 |
Token | m |
Token ID | 76 |
Feature activation | +5.16e-03 |
Pos logit contributions | |
enny | +0.084 |
oured | +0.081 |
driver | +0.079 |
seek | +0.078 |
ache | +0.076 |
Neg logit contributions | |
its | -0.107 |
their | -0.102 |
them | -0.100 |
things | -0.095 |
everything | -0.092 |
Token | unk |
Token ID | 2954 |
Feature activation | -5.33e-03 |
Pos logit contributions | |
its | +0.009 |
things | +0.009 |
their | +0.009 |
ash | +0.008 |
them | +0.008 |
Neg logit contributions | |
seek | -0.007 |
oured | -0.007 |
rook | -0.007 |
seventy | -0.007 |
enny | -0.007 |
Token | reached |
Token ID | 4251 |
Feature activation | +1.26e-03 |
Pos logit contributions | |
unn | +0.010 |
driver | +0.010 |
ucker | +0.010 |
drop | +0.010 |
enny | +0.010 |
Neg logit contributions | |
its | -0.007 |
them | -0.006 |
their | -0.006 |
her | -0.006 |
everything | -0.006 |
Token | her |
Token ID | 607 |
Feature activation | -2.54e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.000 |
everything | +0.000 |
Neg logit contributions | |
enny | -0.003 |
oured | -0.003 |
ipop | -0.003 |
drop | -0.003 |
driver | -0.003 |
Token | home |
Token ID | 1363 |
Feature activation | -3.53e-03 |
Pos logit contributions | |
enny | +0.006 |
unn | +0.006 |
istent | +0.006 |
driver | +0.006 |
va | +0.006 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
down | -0.002 |
things | -0.002 |
out | -0.002 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.90e-02 |
Pos logit contributions | |
seek | +0.022 |
unn | +0.022 |
enny | +0.021 |
ucker | +0.021 |
driver | +0.021 |
Neg logit contributions | |
its | -0.015 |
their | -0.013 |
things | -0.013 |
them | -0.013 |
fog | -0.012 |
Token | m |
Token ID | 76 |
Feature activation | +4.71e-03 |
Pos logit contributions | |
enny | +0.088 |
oured | +0.087 |
seek | +0.087 |
sed | +0.085 |
driver | +0.084 |
Neg logit contributions | |
its | -0.100 |
their | -0.098 |
them | -0.097 |
things | -0.091 |
him | -0.086 |
Token | unk |
Token ID | 2954 |
Feature activation | -7.41e-03 |
Pos logit contributions | |
their | +0.008 |
its | +0.008 |
them | +0.008 |
things | +0.008 |
at | +0.007 |
Neg logit contributions | |
seventy | -0.007 |
seek | -0.007 |
oured | -0.007 |
enny | -0.007 |
rook | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +3.04e-03 |
Pos logit contributions | |
unn | +0.021 |
seek | +0.021 |
powers | +0.020 |
enny | +0.020 |
driver | +0.020 |
Neg logit contributions | |
its | -0.004 |
them | -0.003 |
their | -0.003 |
it | -0.002 |
. | -0.002 |
Token | The |
Token ID | 383 |
Feature activation | -2.37e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
his | +0.002 |
it | +0.002 |
Neg logit contributions | |
unn | -0.007 |
enny | -0.007 |
drop | -0.007 |
ache | -0.007 |
seek | -0.007 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.89e-02 |
Pos logit contributions | |
enny | +0.004 |
driver | +0.003 |
oured | +0.003 |
seek | +0.003 |
uddy | +0.003 |
Neg logit contributions | |
things | -0.004 |
its | -0.004 |
their | -0.004 |
them | -0.004 |
ash | -0.004 |
Token | m |
Token ID | 76 |
Feature activation | +4.75e-03 |
Pos logit contributions | |
seek | +0.092 |
enny | +0.092 |
oured | +0.091 |
ider | +0.087 |
driver | +0.087 |
Neg logit contributions | |
its | -0.097 |
them | -0.094 |
their | -0.094 |
things | -0.089 |
everything | -0.085 |
Token | unk |
Token ID | 2954 |
Feature activation | -6.84e-03 |
Pos logit contributions | |
its | +0.008 |
them | +0.008 |
their | +0.008 |
things | +0.007 |
everything | +0.007 |
Neg logit contributions | |
seek | -0.008 |
rook | -0.007 |
seventy | -0.007 |
tournament | -0.007 |
enny | -0.007 |
Token | wanted |
Token ID | 2227 |
Feature activation | -1.08e-03 |
Pos logit contributions | |
seek | +0.016 |
unn | +0.015 |
driver | +0.015 |
ider | +0.015 |
enny | +0.015 |
Neg logit contributions | |
its | -0.008 |
them | -0.007 |
their | -0.007 |
it | -0.007 |
her | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +2.46e-03 |
Pos logit contributions | |
ider | +0.002 |
enny | +0.002 |
unn | +0.002 |
oured | +0.002 |
opus | +0.002 |
Neg logit contributions | |
its | -0.001 |
them | -0.001 |
their | -0.001 |
it | -0.001 |
his | -0.001 |
Token | boy |
Token ID | 2933 |
Feature activation | -7.63e-03 |
Pos logit contributions | |
its | +0.004 |
things | +0.004 |
their | +0.004 |
them | +0.004 |
ash | +0.004 |
Neg logit contributions | |
enny | -0.004 |
driver | -0.004 |
ider | -0.004 |
seek | -0.003 |
unn | -0.003 |
Token | a |
Token ID | 257 |
Feature activation | -4.12e-04 |
Pos logit contributions | |
its | +0.008 |
their | +0.007 |
them | +0.007 |
her | +0.005 |
everything | +0.005 |
Neg logit contributions | |
enny | -0.020 |
opus | -0.019 |
ipop | -0.019 |
oured | -0.019 |
unn | -0.018 |
Token | shiny |
Token ID | 22441 |
Feature activation | -5.06e-03 |
Pos logit contributions | |
enny | +0.001 |
seek | +0.001 |
oured | +0.001 |
unn | +0.001 |
driver | +0.001 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
things | -0.000 |
fog | -0.000 |
Token | collar |
Token ID | 19908 |
Feature activation | -7.65e-03 |
Pos logit contributions | |
enny | +0.009 |
unn | +0.008 |
oured | +0.008 |
seek | +0.008 |
ache | +0.008 |
Neg logit contributions | |
its | -0.008 |
their | -0.007 |
them | -0.007 |
things | -0.006 |
her | -0.006 |
Token | and |
Token ID | 290 |
Feature activation | -4.01e-04 |
Pos logit contributions | |
unn | +0.019 |
enny | +0.018 |
omo | +0.018 |
ucker | +0.018 |
scar | +0.018 |
Neg logit contributions | |
its | -0.008 |
out | -0.006 |
her | -0.006 |
it | -0.006 |
them | -0.006 |
Token | a |
Token ID | 257 |
Feature activation | -4.64e-04 |
Pos logit contributions | |
enny | +0.001 |
oured | +0.001 |
opus | +0.001 |
uddy | +0.001 |
ache | +0.001 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
her | -0.000 |
them | -0.000 |
it | -0.000 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.89e-02 |
Pos logit contributions | |
enny | +0.001 |
unn | +0.001 |
seek | +0.001 |
oured | +0.001 |
uddy | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.000 |
things | -0.000 |
fog | -0.000 |
Token | in |
Token ID | 287 |
Feature activation | -9.76e-03 |
Pos logit contributions | |
enny | +0.100 |
oured | +0.097 |
seek | +0.093 |
driver | +0.092 |
ache | +0.092 |
Neg logit contributions | |
its | -0.095 |
their | -0.087 |
them | -0.085 |
things | -0.075 |
her | -0.074 |
Token | her |
Token ID | 607 |
Feature activation | -4.53e-03 |
Pos logit contributions | |
driver | +0.023 |
enny | +0.023 |
drop | +0.023 |
ipop | +0.023 |
ache | +0.023 |
Neg logit contributions | |
its | -0.005 |
their | -0.004 |
them | -0.004 |
away | -0.003 |
things | -0.003 |
Token | ear |
Token ID | 1027 |
Feature activation | -3.91e-03 |
Pos logit contributions | |
enny | +0.007 |
unn | +0.007 |
oured | +0.007 |
drop | +0.007 |
driver | +0.007 |
Neg logit contributions | |
its | -0.008 |
their | -0.007 |
them | -0.007 |
her | -0.006 |
things | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +1.91e-03 |
Pos logit contributions | |
enny | +0.011 |
va | +0.011 |
igsaw | +0.011 |
scar | +0.011 |
unn | +0.011 |
Neg logit contributions | |
its | -0.002 |
them | -0.001 |
their | -0.001 |
her | -0.001 |
it | -0.000 |
Token | |
Token ID | 220 |
Feature activation | -3.13e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
away | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.004 |
uddy | -0.003 |
unn | -0.003 |
oured | -0.003 |
� | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | +4.87e-03 |
Pos logit contributions | |
enny | +0.002 |
ache | +0.002 |
ipop | +0.002 |
driver | +0.002 |
oured | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
fog | -0.001 |
away | -0.001 |
Token | They |
Token ID | 1119 |
Feature activation | +2.58e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.004 |
her | +0.004 |
it | +0.003 |
Neg logit contributions | |
ache | -0.011 |
drop | -0.011 |
unn | -0.011 |
enny | -0.010 |
driver | -0.010 |
Token | lived |
Token ID | 5615 |
Feature activation | +2.48e-02 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
her | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.005 |
unn | -0.005 |
uddy | -0.005 |
seek | -0.004 |
ider | -0.004 |
Token | happily |
Token ID | 18177 |
Feature activation | +1.80e-02 |
Pos logit contributions | |
its | +0.033 |
their | +0.028 |
them | +0.027 |
things | +0.023 |
her | +0.023 |
Neg logit contributions | |
enny | -0.049 |
unn | -0.047 |
ache | -0.047 |
oured | -0.047 |
drop | -0.047 |
Token | ever |
Token ID | 1683 |
Feature activation | -7.44e-03 |
Pos logit contributions | |
its | +0.030 |
their | +0.028 |
them | +0.025 |
her | +0.023 |
his | +0.022 |
Neg logit contributions | |
enny | -0.033 |
driver | -0.033 |
bars | -0.031 |
opus | -0.031 |
icycle | -0.031 |
Token | after |
Token ID | 706 |
Feature activation | +2.41e-02 |
Pos logit contributions | |
driver | +0.020 |
enny | +0.019 |
uddy | +0.019 |
ipop | +0.019 |
drop | +0.019 |
Neg logit contributions | |
its | -0.005 |
their | -0.004 |
them | -0.004 |
things | -0.003 |
her | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +4.75e-03 |
Pos logit contributions | |
its | +0.020 |
their | +0.016 |
them | +0.015 |
her | +0.011 |
things | +0.011 |
Neg logit contributions | |
enny | -0.062 |
oured | -0.060 |
driver | -0.060 |
unn | -0.060 |
ache | -0.060 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.70e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.010 |
oured | -0.010 |
ache | -0.010 |
unn | -0.010 |
drop | -0.010 |
Token | Once |
Token ID | 7454 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
enny | +0.003 |
� | +0.003 |
uddy | +0.003 |
seek | +0.003 |
olly | +0.003 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
away | -0.002 |
fires | -0.002 |
Token | upon |
Token ID | 2402 |
Feature activation | -1.58e-03 |
Pos logit contributions | |
its | +0.021 |
their | +0.019 |
them | +0.018 |
things | +0.016 |
her | +0.016 |
Neg logit contributions | |
enny | -0.023 |
oured | -0.022 |
unn | -0.022 |
ipop | -0.022 |
uddy | -0.022 |
Token | a |
Token ID | 257 |
Feature activation | -2.08e-03 |
Pos logit contributions | |
enny | +0.003 |
seek | +0.003 |
ache | +0.003 |
drop | +0.003 |
driver | +0.003 |
Neg logit contributions | |
its | -0.002 |
them | -0.002 |
their | -0.002 |
away | -0.002 |
fog | -0.002 |
Token | an |
Token ID | 281 |
Feature activation | +4.21e-03 |
Pos logit contributions | |
enny | +0.002 |
drop | +0.002 |
oured | +0.002 |
� | +0.002 |
olly | +0.001 |
Neg logit contributions | |
its | -0.001 |
them | -0.001 |
their | -0.001 |
away | -0.001 |
things | -0.001 |
Token | old |
Token ID | 1468 |
Feature activation | -8.92e-03 |
Pos logit contributions | |
its | +0.008 |
them | +0.007 |
their | +0.007 |
everything | +0.006 |
it | +0.006 |
Neg logit contributions | |
enny | -0.006 |
unn | -0.006 |
ache | -0.006 |
olly | -0.006 |
oured | -0.006 |
Token | man |
Token ID | 582 |
Feature activation | -1.35e-02 |
Pos logit contributions | |
enny | +0.017 |
oured | +0.017 |
seek | +0.016 |
unn | +0.016 |
ives | +0.016 |
Neg logit contributions | |
its | -0.013 |
their | -0.012 |
things | -0.010 |
them | -0.010 |
fog | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | -9.00e-04 |
Pos logit contributions | |
enny | +0.030 |
unn | +0.029 |
oured | +0.029 |
ipop | +0.029 |
driver | +0.029 |
Neg logit contributions | |
its | -0.016 |
their | -0.013 |
them | -0.012 |
her | -0.011 |
his | -0.010 |
Token | He |
Token ID | 679 |
Feature activation | -2.78e-03 |
Pos logit contributions | |
enny | +0.002 |
driver | +0.002 |
uddy | +0.002 |
ipop | +0.001 |
seek | +0.001 |
Neg logit contributions | |
its | -0.001 |
them | -0.001 |
their | -0.001 |
things | -0.001 |
everything | -0.001 |
Token | lived |
Token ID | 5615 |
Feature activation | +2.40e-02 |
Pos logit contributions | |
enny | +0.005 |
oured | +0.005 |
unn | +0.005 |
driver | +0.005 |
ipop | +0.005 |
Neg logit contributions | |
its | -0.004 |
their | -0.004 |
them | -0.003 |
her | -0.003 |
his | -0.003 |
Token | in |
Token ID | 287 |
Feature activation | -9.26e-03 |
Pos logit contributions | |
its | +0.023 |
them | +0.019 |
their | +0.019 |
things | +0.014 |
fog | +0.013 |
Neg logit contributions | |
enny | -0.053 |
oured | -0.051 |
ipop | -0.051 |
ache | -0.051 |
seek | -0.051 |
Token | a |
Token ID | 257 |
Feature activation | +6.21e-04 |
Pos logit contributions | |
enny | +0.017 |
driver | +0.017 |
seek | +0.016 |
ache | +0.016 |
drop | +0.016 |
Neg logit contributions | |
its | -0.011 |
them | -0.010 |
their | -0.009 |
away | -0.008 |
fog | -0.008 |
Token | house |
Token ID | 2156 |
Feature activation | -1.37e-03 |
Pos logit contributions | |
its | +0.001 |
them | +0.001 |
their | +0.001 |
him | +0.001 |
things | +0.001 |
Neg logit contributions | |
enny | -0.001 |
opus | -0.001 |
ache | -0.001 |
coach | -0.001 |
olly | -0.001 |
Token | on |
Token ID | 319 |
Feature activation | -3.08e-03 |
Pos logit contributions | |
enny | +0.004 |
unn | +0.004 |
oured | +0.003 |
ache | +0.003 |
uddy | +0.003 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
things | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +3.86e-04 |
Pos logit contributions | |
seek | +0.006 |
driver | +0.006 |
ache | +0.006 |
enny | +0.006 |
drop | +0.006 |
Neg logit contributions | |
its | -0.003 |
them | -0.003 |
their | -0.003 |
away | -0.002 |
down | -0.002 |
Token | Brown |
Token ID | 4373 |
Feature activation | -7.46e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
things | +0.001 |
away | +0.001 |
Neg logit contributions | |
enny | -0.002 |
uddy | -0.002 |
ipop | -0.002 |
unn | -0.002 |
oured | -0.002 |
Token | ie |
Token ID | 494 |
Feature activation | +7.43e-03 |
Pos logit contributions | |
enny | +0.015 |
oured | +0.015 |
drop | +0.015 |
driver | +0.015 |
ipop | +0.015 |
Neg logit contributions | |
its | -0.009 |
their | -0.008 |
them | -0.008 |
her | -0.006 |
things | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | -1.92e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.004 |
things | +0.003 |
her | +0.003 |
Neg logit contributions | |
enny | -0.018 |
oured | -0.018 |
unn | -0.018 |
drop | -0.018 |
ache | -0.018 |
Token | Brown |
Token ID | 4373 |
Feature activation | -7.46e-03 |
Pos logit contributions | |
driver | +0.003 |
uddy | +0.003 |
chip | +0.002 |
unn | +0.002 |
� | +0.002 |
Neg logit contributions | |
its | -0.003 |
them | -0.003 |
their | -0.003 |
away | -0.003 |
fog | -0.003 |
Token | ie |
Token ID | 494 |
Feature activation | +7.60e-03 |
Pos logit contributions | |
enny | +0.015 |
oured | +0.015 |
drop | +0.015 |
driver | +0.015 |
ipop | +0.014 |
Neg logit contributions | |
its | -0.009 |
their | -0.008 |
them | -0.008 |
things | -0.006 |
everything | -0.006 |
Token | lived |
Token ID | 5615 |
Feature activation | +2.38e-02 |
Pos logit contributions | |
its | +0.008 |
their | +0.007 |
them | +0.006 |
it | +0.005 |
her | +0.005 |
Neg logit contributions | |
oured | -0.018 |
enny | -0.018 |
driver | -0.017 |
� | -0.017 |
ipop | -0.017 |
Token | in |
Token ID | 287 |
Feature activation | -9.73e-03 |
Pos logit contributions | |
its | +0.023 |
them | +0.020 |
their | +0.020 |
things | +0.016 |
away | +0.015 |
Neg logit contributions | |
enny | -0.051 |
oured | -0.048 |
seek | -0.048 |
ipop | -0.048 |
ache | -0.048 |
Token | a |
Token ID | 257 |
Feature activation | -2.35e-04 |
Pos logit contributions | |
seek | +0.015 |
driver | +0.015 |
chip | +0.015 |
ache | +0.014 |
drop | +0.014 |
Neg logit contributions | |
its | -0.012 |
them | -0.012 |
away | -0.011 |
their | -0.011 |
down | -0.010 |
Token | stable |
Token ID | 8245 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
opus | +0.000 |
ache | +0.000 |
enny | +0.000 |
olly | +0.000 |
uddy | +0.000 |
Neg logit contributions | |
its | -0.000 |
them | -0.000 |
their | -0.000 |
him | -0.000 |
things | -0.000 |
Token | with |
Token ID | 351 |
Feature activation | -4.54e-03 |
Pos logit contributions | |
its | +0.014 |
their | +0.011 |
them | +0.009 |
her | +0.008 |
things | +0.007 |
Neg logit contributions | |
enny | -0.037 |
unn | -0.036 |
oured | -0.036 |
driver | -0.036 |
ipop | -0.036 |
Token | his |
Token ID | 465 |
Feature activation | -6.89e-03 |
Pos logit contributions | |
enny | +0.011 |
unn | +0.010 |
ache | +0.010 |
driver | +0.010 |
seek | +0.010 |
Neg logit contributions | |
its | -0.004 |
their | -0.003 |
them | -0.003 |
things | -0.002 |
away | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -7.35e-04 |
Pos logit contributions | |
unn | +0.000 |
enny | +0.000 |
oured | +0.000 |
ache | +0.000 |
drop | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
her | -0.000 |
his | -0.000 |
Token | He |
Token ID | 679 |
Feature activation | +8.86e-04 |
Pos logit contributions | |
enny | +0.002 |
ache | +0.002 |
drop | +0.001 |
oured | +0.001 |
unn | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
her | -0.001 |
Token | did |
Token ID | 750 |
Feature activation | -2.81e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
his | +0.001 |
her | +0.001 |
Neg logit contributions | |
igsaw | -0.002 |
driver | -0.002 |
� | -0.002 |
unn | -0.002 |
ider | -0.002 |
Token | not |
Token ID | 407 |
Feature activation | -7.54e-03 |
Pos logit contributions | |
seek | +0.003 |
enny | +0.003 |
driver | +0.002 |
drop | +0.002 |
oured | +0.002 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
fog | -0.005 |
away | -0.005 |
Token | yell |
Token ID | 28946 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
enny | +0.013 |
oured | +0.013 |
unn | +0.012 |
ipop | +0.012 |
uddy | +0.012 |
Neg logit contributions | |
its | -0.012 |
their | -0.011 |
them | -0.011 |
her | -0.009 |
things | -0.009 |
Token | or |
Token ID | 393 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
its | +0.014 |
their | +0.011 |
them | +0.011 |
fog | +0.009 |
things | +0.009 |
Neg logit contributions | |
enny | -0.027 |
ache | -0.026 |
driver | -0.026 |
ipop | -0.025 |
uddy | -0.025 |
Token | run |
Token ID | 1057 |
Feature activation | +2.75e-03 |
Pos logit contributions | |
its | +0.034 |
their | +0.032 |
them | +0.030 |
her | +0.027 |
his | +0.026 |
Neg logit contributions | |
enny | -0.036 |
unn | -0.034 |
oured | -0.034 |
olly | -0.033 |
driver | -0.033 |
Token | too |
Token ID | 1165 |
Feature activation | -4.09e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
fog | +0.002 |
ash | +0.002 |
Neg logit contributions | |
enny | -0.006 |
driver | -0.006 |
seek | -0.006 |
uddy | -0.006 |
ache | -0.006 |
Token | fast |
Token ID | 3049 |
Feature activation | -4.98e-04 |
Pos logit contributions | |
enny | +0.008 |
ache | +0.007 |
uddy | +0.007 |
driver | +0.007 |
unn | +0.007 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
things | -0.004 |
her | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -1.73e-03 |
Pos logit contributions | |
enny | +0.001 |
oured | +0.001 |
ipop | +0.001 |
unn | +0.001 |
drop | +0.001 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
things | -0.000 |
her | -0.000 |
Token | The |
Token ID | 383 |
Feature activation | -5.00e-03 |
Pos logit contributions | |
enny | +0.003 |
oured | +0.003 |
unn | +0.003 |
ache | +0.003 |
uddy | +0.003 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
things | -0.002 |
her | -0.002 |
Token | And |
Token ID | 843 |
Feature activation | +3.37e-03 |
Pos logit contributions | |
enny | +0.004 |
uddy | +0.003 |
olly | +0.003 |
unn | +0.003 |
ugg | +0.003 |
Neg logit contributions | |
its | -0.003 |
them | -0.003 |
their | -0.003 |
fog | -0.002 |
away | -0.002 |
Token | Lily |
Token ID | 20037 |
Feature activation | +3.68e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
her | +0.003 |
Neg logit contributions | |
enny | -0.007 |
oured | -0.006 |
ache | -0.006 |
unn | -0.006 |
drop | -0.006 |
Token | and |
Token ID | 290 |
Feature activation | +2.86e-04 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
her | +0.004 |
it | +0.004 |
them | +0.004 |
Neg logit contributions | |
uddy | -0.008 |
ider | -0.008 |
unn | -0.007 |
ipop | -0.007 |
driver | -0.007 |
Token | her |
Token ID | 607 |
Feature activation | -7.16e-05 |
Pos logit contributions | |
its | +0.000 |
them | +0.000 |
their | +0.000 |
south | +0.000 |
away | +0.000 |
Neg logit contributions | |
enny | -0.001 |
ipop | -0.001 |
salon | -0.001 |
judge | -0.001 |
seek | -0.001 |
Token | toys |
Token ID | 14958 |
Feature activation | +8.31e-03 |
Pos logit contributions | |
enny | +0.000 |
driver | +0.000 |
ache | +0.000 |
oured | +0.000 |
unn | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
things | -0.000 |
her | -0.000 |
Token | lived |
Token ID | 5615 |
Feature activation | +2.14e-02 |
Pos logit contributions | |
its | +0.010 |
their | +0.009 |
them | +0.008 |
everything | +0.007 |
her | +0.007 |
Neg logit contributions | |
enny | -0.019 |
unn | -0.018 |
opus | -0.018 |
uddy | -0.018 |
oured | -0.018 |
Token | happily |
Token ID | 18177 |
Feature activation | +1.90e-02 |
Pos logit contributions | |
its | +0.032 |
them | +0.028 |
their | +0.027 |
fog | +0.024 |
things | +0.024 |
Neg logit contributions | |
enny | -0.035 |
oured | -0.033 |
seek | -0.033 |
drop | -0.032 |
driver | -0.032 |
Token | in |
Token ID | 287 |
Feature activation | -7.02e-03 |
Pos logit contributions | |
its | +0.032 |
their | +0.029 |
them | +0.027 |
things | +0.025 |
her | +0.024 |
Neg logit contributions | |
enny | -0.032 |
driver | -0.030 |
uddy | -0.030 |
ipop | -0.030 |
scar | -0.030 |
Token | " |
Token ID | 366 |
Feature activation | +5.82e-03 |
Pos logit contributions | |
enny | +0.017 |
oured | +0.017 |
drop | +0.017 |
ache | +0.017 |
unn | +0.017 |
Neg logit contributions | |
its | -0.006 |
their | -0.004 |
them | -0.004 |
things | -0.003 |
everything | -0.003 |
Token | Fun |
Token ID | 24629 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
its | +0.010 |
their | +0.009 |
them | +0.009 |
fog | +0.008 |
things | +0.008 |
Neg logit contributions | |
enny | -0.009 |
drop | -0.008 |
oured | -0.008 |
ache | -0.008 |
ipop | -0.008 |
Token | Land |
Token ID | 6379 |
Feature activation | -3.24e-03 |
Pos logit contributions | |
its | +0.018 |
them | +0.017 |
their | +0.016 |
things | +0.014 |
it | +0.014 |
Neg logit contributions | |
unn | -0.022 |
ache | -0.021 |
ipop | -0.021 |
ucker | -0.021 |
enny | -0.021 |
Token | snack |
Token ID | 26906 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
enny | +0.008 |
ipop | +0.008 |
oured | +0.008 |
ache | +0.008 |
driver | +0.008 |
Neg logit contributions | |
its | -0.012 |
their | -0.011 |
them | -0.010 |
her | -0.009 |
everything | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | -6.22e-04 |
Pos logit contributions | |
its | +0.008 |
their | +0.007 |
them | +0.006 |
things | +0.005 |
everything | +0.004 |
Neg logit contributions | |
unn | -0.027 |
enny | -0.026 |
drop | -0.026 |
uddy | -0.026 |
ache | -0.026 |
Token | t |
Token ID | 256 |
Feature activation | +6.26e-03 |
Pos logit contributions | |
enny | +0.001 |
uddy | +0.001 |
ache | +0.001 |
unn | +0.001 |
opus | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
his | -0.001 |
Token | eddy |
Token ID | 21874 |
Feature activation | +2.66e-03 |
Pos logit contributions | |
its | +0.010 |
them | +0.009 |
their | +0.009 |
things | +0.008 |
him | +0.007 |
Neg logit contributions | |
drop | -0.010 |
ache | -0.010 |
sed | -0.010 |
enny | -0.010 |
seek | -0.010 |
Token | bear |
Token ID | 6842 |
Feature activation | -2.16e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
her | +0.003 |
Neg logit contributions | |
enny | -0.004 |
ache | -0.004 |
oured | -0.004 |
drop | -0.004 |
unn | -0.004 |
Token | inside |
Token ID | 2641 |
Feature activation | +3.29e-03 |
Pos logit contributions | |
enny | +0.005 |
drop | +0.005 |
unn | +0.005 |
ucker | +0.005 |
uddy | +0.005 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
things | -0.001 |
her | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -1.27e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
fog | +0.002 |
away | +0.002 |
Neg logit contributions | |
enny | -0.007 |
oured | -0.007 |
ipop | -0.007 |
driver | -0.007 |
� | -0.007 |
Token | Max |
Token ID | 5436 |
Feature activation | +5.38e-03 |
Pos logit contributions | |
enny | +0.002 |
uddy | +0.002 |
driver | +0.002 |
oured | +0.002 |
� | +0.002 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.001 |
away | -0.001 |
things | -0.001 |
Token | was |
Token ID | 373 |
Feature activation | +2.68e-04 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
his | +0.005 |
it | +0.005 |
them | +0.005 |
Neg logit contributions | |
drop | -0.012 |
unn | -0.012 |
enny | -0.012 |
igsaw | -0.012 |
ider | -0.012 |
Token | so |
Token ID | 523 |
Feature activation | +1.17e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
her | +0.000 |
his | +0.000 |
Neg logit contributions | |
unn | -0.001 |
enny | -0.001 |
uddy | -0.001 |
opus | -0.001 |
drop | -0.001 |
Token | excited |
Token ID | 6568 |
Feature activation | -9.43e-04 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
her | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.002 |
drop | -0.002 |
driver | -0.002 |
oured | -0.002 |
ache | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -2.67e-03 |
Pos logit contributions | |
enny | +0.016 |
oured | +0.015 |
ache | +0.015 |
unn | +0.015 |
drop | +0.015 |
Neg logit contributions | |
its | -0.018 |
their | -0.016 |
them | -0.016 |
things | -0.014 |
her | -0.014 |
Token | explore |
Token ID | 7301 |
Feature activation | +9.03e-03 |
Pos logit contributions | |
enny | +0.005 |
oured | +0.005 |
unn | +0.005 |
uddy | +0.005 |
ache | +0.005 |
Neg logit contributions | |
its | -0.004 |
their | -0.003 |
them | -0.003 |
her | -0.003 |
things | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | +7.41e-04 |
Pos logit contributions | |
Wow | +0.012 |
Sorry | +0.012 |
Look | +0.011 |
RO | +0.011 |
inct | +0.010 |
Neg logit contributions | |
ents | -0.009 |
chip | -0.009 |
chewing | -0.009 |
olly | -0.009 |
enny | -0.009 |
Token | One |
Token ID | 1881 |
Feature activation | +1.43e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.001 |
away | +0.001 |
Neg logit contributions | |
enny | -0.001 |
uddy | -0.001 |
seek | -0.001 |
drop | -0.001 |
driver | -0.001 |
Token | day |
Token ID | 1110 |
Feature activation | +9.90e-03 |
Pos logit contributions | |
its | +0.002 |
them | +0.002 |
their | +0.002 |
fires | +0.002 |
things | +0.002 |
Neg logit contributions | |
enny | -0.002 |
uddy | -0.002 |
ipop | -0.002 |
drop | -0.002 |
olly | -0.002 |
Token | , |
Token ID | 11 |
Feature activation | +5.83e-05 |
Pos logit contributions | |
its | +0.016 |
them | +0.014 |
their | +0.014 |
away | +0.012 |
fires | +0.012 |
Neg logit contributions | |
enny | -0.016 |
ipop | -0.016 |
uddy | -0.015 |
unn | -0.015 |
drop | -0.015 |
Token | she |
Token ID | 673 |
Feature activation | -1.83e-03 |
Pos logit contributions | |
its | +0.000 |
them | +0.000 |
fires | +0.000 |
away | +0.000 |
their | +0.000 |
Neg logit contributions | |
ipop | -0.000 |
� | -0.000 |
enny | -0.000 |
drop | -0.000 |
coat | -0.000 |
Token | was |
Token ID | 373 |
Feature activation | +1.00e-03 |
Pos logit contributions | |
enny | +0.003 |
oured | +0.003 |
ache | +0.003 |
unn | +0.003 |
ipop | +0.003 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
her | -0.002 |
things | -0.002 |
Token | very |
Token ID | 845 |
Feature activation | +3.28e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
her | +0.001 |
things | +0.001 |
Neg logit contributions | |
enny | -0.002 |
unn | -0.002 |
oured | -0.002 |
ache | -0.002 |
ipop | -0.002 |
Token | hungry |
Token ID | 14720 |
Feature activation | +4.32e-04 |
Pos logit contributions | |
its | +0.005 |
their | +0.005 |
them | +0.005 |
things | +0.004 |
her | +0.004 |
Neg logit contributions | |
enny | -0.005 |
oured | -0.005 |
drop | -0.005 |
ache | -0.005 |
driver | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | -2.60e-04 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
things | +0.000 |
her | +0.000 |
Neg logit contributions | |
enny | -0.001 |
oured | -0.001 |
unn | -0.001 |
uddy | -0.001 |
ipop | -0.001 |
Token | in |
Token ID | 287 |
Feature activation | -7.22e-03 |
Pos logit contributions | |
unn | +0.012 |
enny | +0.011 |
uddy | +0.011 |
ucker | +0.011 |
oured | +0.011 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
her | -0.002 |
it | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +2.33e-03 |
Pos logit contributions | |
enny | +0.018 |
drop | +0.018 |
driver | +0.017 |
seek | +0.017 |
oured | +0.017 |
Neg logit contributions | |
its | -0.004 |
their | -0.003 |
them | -0.003 |
things | -0.002 |
away | -0.002 |
Token | grass |
Token ID | 8701 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
things | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.004 |
drop | -0.004 |
ache | -0.004 |
oured | -0.004 |
seek | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +4.03e-03 |
Pos logit contributions | |
unn | +0.051 |
enny | +0.050 |
uddy | +0.049 |
oured | +0.049 |
powers | +0.049 |
Neg logit contributions | |
its | -0.011 |
their | -0.007 |
them | -0.007 |
her | -0.004 |
it | -0.004 |
Token | She |
Token ID | 1375 |
Feature activation | +2.20e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
fires | +0.004 |
away | +0.004 |
Neg logit contributions | |
enny | -0.007 |
oured | -0.007 |
ipop | -0.007 |
uddy | -0.007 |
driver | -0.007 |
Token | picked |
Token ID | 6497 |
Feature activation | +4.00e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
her | +0.003 |
them | +0.003 |
it | +0.002 |
Neg logit contributions | |
uddy | -0.004 |
drop | -0.004 |
ache | -0.004 |
� | -0.004 |
unn | -0.004 |
Token | it |
Token ID | 340 |
Feature activation | -1.19e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
fires | +0.002 |
fog | +0.002 |
away | +0.002 |
Neg logit contributions | |
oured | -0.009 |
enny | -0.009 |
driver | -0.009 |
ipop | -0.009 |
drop | -0.008 |
Token | up |
Token ID | 510 |
Feature activation | +3.08e-03 |
Pos logit contributions | |
enny | +0.003 |
oured | +0.003 |
driver | +0.003 |
ipop | +0.003 |
uddy | +0.003 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
fires | -0.001 |
fog | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | +3.64e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.003 |
her | +0.003 |
it | +0.003 |
Neg logit contributions | |
enny | -0.006 |
unn | -0.006 |
uddy | -0.006 |
drop | -0.006 |
ache | -0.006 |
Token | decided |
Token ID | 3066 |
Feature activation | +1.75e-04 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
fires | +0.006 |
away | +0.006 |
Neg logit contributions | |
oured | -0.004 |
enny | -0.004 |
ipop | -0.004 |
driver | -0.004 |
drop | -0.004 |
Token | to |
Token ID | 284 |
Feature activation | -3.21e-04 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
things | +0.000 |
her | +0.000 |
Neg logit contributions | |
enny | -0.000 |
unn | -0.000 |
oured | -0.000 |
drop | -0.000 |
ache | -0.000 |
Token | ! |
Token ID | 0 |
Feature activation | -5.04e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.001 |
them | +0.001 |
her | +0.001 |
things | +0.001 |
Neg logit contributions | |
enny | -0.006 |
unn | -0.006 |
oured | -0.006 |
ipop | -0.006 |
uddy | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -4.38e-03 |
Pos logit contributions | |
enny | +0.010 |
unn | +0.010 |
oured | +0.010 |
uddy | +0.010 |
drop | +0.010 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
things | -0.004 |
her | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | -4.30e-03 |
Pos logit contributions | |
enny | +0.009 |
uddy | +0.009 |
unn | +0.009 |
drop | +0.009 |
oured | +0.009 |
Neg logit contributions | |
its | -0.005 |
their | -0.004 |
them | -0.004 |
things | -0.004 |
away | -0.003 |
Token | Bob |
Token ID | 18861 |
Feature activation | +2.48e-03 |
Pos logit contributions | |
enny | +0.008 |
oured | +0.007 |
unn | +0.007 |
ache | +0.007 |
drop | +0.007 |
Neg logit contributions | |
its | -0.006 |
their | -0.006 |
them | -0.005 |
things | -0.005 |
everything | -0.005 |
Token | thanked |
Token ID | 26280 |
Feature activation | +2.49e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.002 |
the | +0.002 |
by | +0.002 |
Neg logit contributions | |
driver | -0.006 |
seek | -0.006 |
ider | -0.006 |
salon | -0.005 |
� | -0.005 |
Token | Suz |
Token ID | 22691 |
Feature activation | -8.31e-03 |
Pos logit contributions | |
its | +0.003 |
south | +0.003 |
away | +0.003 |
fog | +0.003 |
fires | +0.003 |
Neg logit contributions | |
enny | -0.004 |
chip | -0.003 |
drop | -0.003 |
ipop | -0.003 |
uddy | -0.003 |
Token | ie |
Token ID | 494 |
Feature activation | +6.33e-03 |
Pos logit contributions | |
enny | +0.017 |
drop | +0.016 |
ache | +0.016 |
oured | +0.016 |
seek | +0.016 |
Neg logit contributions | |
its | -0.010 |
their | -0.009 |
them | -0.009 |
things | -0.007 |
her | -0.007 |
Token | for |
Token ID | 329 |
Feature activation | +2.24e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.004 |
her | +0.004 |
down | +0.004 |
Neg logit contributions | |
drop | -0.016 |
seek | -0.016 |
unn | -0.016 |
� | -0.016 |
coat | -0.015 |
Token | her |
Token ID | 607 |
Feature activation | -5.55e-05 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
things | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.003 |
drop | -0.003 |
driver | -0.003 |
oured | -0.003 |
ache | -0.003 |
Token | help |
Token ID | 1037 |
Feature activation | -4.68e-03 |
Pos logit contributions | |
enny | +0.000 |
unn | +0.000 |
ucker | +0.000 |
opus | +0.000 |
uddy | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
things | -0.000 |
her | -0.000 |
Token | and |
Token ID | 290 |
Feature activation | +3.81e-03 |
Pos logit contributions | |
enny | +0.010 |
unn | +0.010 |
ipop | +0.010 |
oured | +0.010 |
uddy | +0.009 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.005 |
her | -0.004 |
things | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | +1.24e-03 |
Pos logit contributions | |
its | +0.016 |
their | +0.014 |
them | +0.014 |
things | +0.013 |
fog | +0.012 |
Neg logit contributions | |
enny | -0.020 |
driver | -0.019 |
oured | -0.019 |
ipop | -0.019 |
drop | -0.019 |
Token | play |
Token ID | 711 |
Feature activation | +5.49e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
her | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.002 |
unn | -0.002 |
uddy | -0.002 |
driver | -0.002 |
ache | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +5.65e-05 |
Pos logit contributions | |
ost | +0.007 |
its | +0.007 |
volcan | +0.007 |
Wow | +0.007 |
fires | +0.007 |
Neg logit contributions | |
seek | -0.008 |
enny | -0.008 |
driver | -0.007 |
coat | -0.007 |
ider | -0.007 |
Token | She |
Token ID | 1375 |
Feature activation | +2.15e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
her | +0.000 |
things | +0.000 |
Neg logit contributions | |
enny | -0.000 |
ache | -0.000 |
unn | -0.000 |
ipop | -0.000 |
oured | -0.000 |
Token | w |
Token ID | 266 |
Feature activation | -4.13e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
her | +0.003 |
them | +0.003 |
it | +0.003 |
Neg logit contributions | |
uddy | -0.004 |
� | -0.004 |
enny | -0.004 |
igsaw | -0.004 |
driver | -0.004 |
Token | igg |
Token ID | 6950 |
Feature activation | -7.02e-03 |
Pos logit contributions | |
ache | +0.006 |
enny | +0.006 |
drop | +0.006 |
ipop | +0.006 |
driver | +0.006 |
Neg logit contributions | |
its | -0.007 |
them | -0.006 |
their | -0.006 |
things | -0.005 |
her | -0.005 |
Token | led |
Token ID | 992 |
Feature activation | -5.13e-03 |
Pos logit contributions | |
enny | +0.012 |
unn | +0.012 |
oured | +0.012 |
ipop | +0.012 |
ache | +0.011 |
Neg logit contributions | |
its | -0.011 |
their | -0.009 |
them | -0.009 |
things | -0.008 |
everything | -0.008 |
Token | her |
Token ID | 607 |
Feature activation | -2.93e-04 |
Pos logit contributions | |
oured | +0.012 |
ipop | +0.011 |
enny | +0.011 |
seek | +0.011 |
drop | +0.011 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
them | -0.002 |
away | -0.002 |
fires | -0.002 |
Token | toes |
Token ID | 23932 |
Feature activation | +8.81e-03 |
Pos logit contributions | |
enny | +0.001 |
unn | +0.001 |
ache | +0.000 |
seek | +0.000 |
driver | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
things | -0.000 |
her | -0.000 |
Token | in |
Token ID | 287 |
Feature activation | -7.14e-03 |
Pos logit contributions | |
its | +0.008 |
their | +0.006 |
her | +0.006 |
down | +0.005 |
them | +0.005 |
Neg logit contributions | |
unn | -0.024 |
uddy | -0.023 |
enny | -0.023 |
ucker | -0.022 |
coach | -0.022 |
Token | the |
Token ID | 262 |
Feature activation | +8.04e-04 |
Pos logit contributions | |
enny | +0.016 |
oured | +0.015 |
drop | +0.015 |
driver | +0.015 |
coat | +0.015 |
Neg logit contributions | |
its | -0.005 |
their | -0.004 |
them | -0.004 |
away | -0.003 |
things | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +2.29e-03 |
Pos logit contributions | |
� | +0.041 |
unn | +0.040 |
seek | +0.039 |
enny | +0.039 |
oured | +0.039 |
Neg logit contributions | |
its | -0.013 |
their | -0.012 |
them | -0.010 |
his | -0.008 |
. | -0.008 |
Token | Sam |
Token ID | 3409 |
Feature activation | -1.74e-02 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
his | +0.003 |
her | +0.003 |
Neg logit contributions | |
� | -0.005 |
ider | -0.005 |
ucker | -0.005 |
ache | -0.005 |
oured | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +3.53e-03 |
Pos logit contributions | |
enny | +0.048 |
opus | +0.047 |
unn | +0.046 |
ipop | +0.046 |
ucker | +0.046 |
Neg logit contributions | |
its | -0.012 |
their | -0.011 |
them | -0.010 |
her | -0.007 |
him | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | +6.65e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.003 |
her | +0.003 |
everything | +0.003 |
Neg logit contributions | |
ache | -0.008 |
drop | -0.008 |
enny | -0.008 |
unn | -0.008 |
ipop | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | +6.37e-03 |
Pos logit contributions | |
its | +0.008 |
their | +0.006 |
them | +0.006 |
things | +0.005 |
everything | +0.005 |
Neg logit contributions | |
enny | -0.014 |
oured | -0.014 |
ache | -0.014 |
unn | -0.014 |
drop | -0.014 |
Token | Tony |
Token ID | 29387 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
its | +0.010 |
their | +0.009 |
them | +0.009 |
her | +0.007 |
everything | +0.007 |
Neg logit contributions | |
ache | -0.011 |
oured | -0.011 |
drop | -0.011 |
unn | -0.011 |
ipop | -0.011 |
Token | asked |
Token ID | 1965 |
Feature activation | +5.68e-03 |
Pos logit contributions | |
enny | +0.040 |
uddy | +0.040 |
unn | +0.040 |
driver | +0.040 |
� | +0.040 |
Neg logit contributions | |
its | -0.020 |
their | -0.018 |
them | -0.017 |
it | -0.015 |
the | -0.014 |
Token | Sam |
Token ID | 3409 |
Feature activation | -1.33e-02 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
her | +0.005 |
everything | +0.005 |
Neg logit contributions | |
enny | -0.012 |
drop | -0.012 |
ache | -0.012 |
unn | -0.012 |
oured | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | +1.32e-04 |
Pos logit contributions | |
unn | +0.032 |
drop | +0.032 |
ider | +0.031 |
� | +0.031 |
coat | +0.031 |
Neg logit contributions | |
its | -0.015 |
their | -0.013 |
them | -0.013 |
her | -0.011 |
his | -0.010 |
Token | listen |
Token ID | 6004 |
Feature activation | -6.19e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
her | +0.000 |
his | +0.000 |
Neg logit contributions | |
unn | -0.000 |
enny | -0.000 |
ache | -0.000 |
ucker | -0.000 |
ipop | -0.000 |
Token | very |
Token ID | 845 |
Feature activation | +4.56e-03 |
Pos logit contributions | |
unn | +0.013 |
enny | +0.013 |
drop | +0.013 |
oured | +0.013 |
uddy | +0.013 |
Neg logit contributions | |
its | -0.007 |
their | -0.007 |
them | -0.006 |
her | -0.005 |
it | -0.005 |
Token | liked |
Token ID | 8288 |
Feature activation | -7.55e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
her | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.003 |
unn | -0.002 |
uddy | -0.002 |
ipop | -0.002 |
driver | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -1.22e-03 |
Pos logit contributions | |
enny | +0.013 |
oured | +0.013 |
unn | +0.013 |
uddy | +0.013 |
ache | +0.013 |
Neg logit contributions | |
its | -0.012 |
their | -0.012 |
them | -0.011 |
her | -0.010 |
things | -0.010 |
Token | play |
Token ID | 711 |
Feature activation | +2.89e-03 |
Pos logit contributions | |
enny | +0.003 |
unn | +0.003 |
uddy | +0.003 |
ache | +0.003 |
oured | +0.003 |
Neg logit contributions | |
its | -0.002 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
his | -0.001 |
Token | in |
Token ID | 287 |
Feature activation | -7.98e-03 |
Pos logit contributions | |
its | +0.004 |
tranqu | +0.003 |
Wow | +0.003 |
Merry | +0.003 |
fant | +0.003 |
Neg logit contributions | |
coach | -0.005 |
� | -0.004 |
rook | -0.004 |
olly | -0.004 |
enny | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +3.82e-03 |
Pos logit contributions | |
enny | +0.017 |
� | +0.017 |
driver | +0.017 |
chip | +0.017 |
drop | +0.017 |
Neg logit contributions | |
its | -0.006 |
them | -0.004 |
away | -0.004 |
their | -0.004 |
south | -0.004 |
Token | park |
Token ID | 3952 |
Feature activation | -1.77e-02 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.005 |
things | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.006 |
drop | -0.006 |
oured | -0.006 |
unn | -0.006 |
ache | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +1.84e-03 |
Pos logit contributions | |
enny | +0.042 |
drop | +0.041 |
oured | +0.041 |
ache | +0.041 |
ipop | +0.041 |
Neg logit contributions | |
its | -0.015 |
their | -0.012 |
them | -0.011 |
things | -0.008 |
everything | -0.008 |
Token | They |
Token ID | 1119 |
Feature activation | +1.54e-03 |
Pos logit contributions | |
its | +0.003 |
away | +0.002 |
them | +0.002 |
their | +0.002 |
things | +0.002 |
Neg logit contributions | |
uddy | -0.003 |
enny | -0.003 |
coat | -0.003 |
� | -0.003 |
driver | -0.003 |
Token | liked |
Token ID | 8288 |
Feature activation | -7.34e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
her | +0.002 |
it | +0.002 |
Neg logit contributions | |
ache | -0.003 |
enny | -0.003 |
opus | -0.003 |
oured | -0.003 |
ider | -0.003 |
Token | to |
Token ID | 284 |
Feature activation | -1.10e-03 |
Pos logit contributions | |
enny | +0.015 |
ache | +0.014 |
oured | +0.014 |
ider | +0.014 |
unn | +0.014 |
Neg logit contributions | |
its | -0.011 |
their | -0.011 |
them | -0.010 |
her | -0.009 |
things | -0.009 |
Token | swing |
Token ID | 9628 |
Feature activation | +9.59e-03 |
Pos logit contributions | |
enny | +0.002 |
unn | +0.002 |
ache | +0.002 |
uddy | +0.002 |
oured | +0.002 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
her | -0.001 |
his | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | -2.68e-03 |
Pos logit contributions | |
enny | +0.033 |
unn | +0.032 |
oured | +0.031 |
drop | +0.031 |
opus | +0.031 |
Neg logit contributions | |
its | -0.018 |
their | -0.016 |
them | -0.015 |
things | -0.012 |
her | -0.012 |
Token | drive |
Token ID | 3708 |
Feature activation | +5.02e-03 |
Pos logit contributions | |
enny | +0.005 |
unn | +0.005 |
ache | +0.005 |
drop | +0.005 |
oured | +0.005 |
Neg logit contributions | |
its | -0.004 |
their | -0.004 |
them | -0.003 |
her | -0.003 |
everything | -0.003 |
Token | back |
Token ID | 736 |
Feature activation | +7.62e-04 |
Pos logit contributions | |
its | +0.004 |
fant | +0.003 |
fog | +0.003 |
ash | +0.003 |
Esk | +0.003 |
Neg logit contributions | |
driver | -0.010 |
enny | -0.010 |
seek | -0.010 |
ipop | -0.010 |
coach | -0.010 |
Token | to |
Token ID | 284 |
Feature activation | -1.17e-03 |
Pos logit contributions | |
its | +0.001 |
them | +0.001 |
their | +0.001 |
fog | +0.001 |
Wow | +0.001 |
Neg logit contributions | |
enny | -0.001 |
seek | -0.001 |
uddy | -0.001 |
unn | -0.001 |
driver | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +1.47e-03 |
Pos logit contributions | |
chip | +0.002 |
coach | +0.002 |
seek | +0.002 |
� | +0.002 |
sed | +0.002 |
Neg logit contributions | |
its | -0.001 |
brightly | -0.001 |
Wow | -0.001 |
fog | -0.001 |
away | -0.001 |
Token | farm |
Token ID | 5318 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
her | +0.002 |
everything | +0.002 |
Neg logit contributions | |
ache | -0.002 |
drop | -0.002 |
enny | -0.002 |
oured | -0.002 |
uddy | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -7.57e-04 |
Pos logit contributions | |
enny | +0.048 |
unn | +0.047 |
oured | +0.046 |
drop | +0.046 |
ipop | +0.046 |
Neg logit contributions | |
its | -0.011 |
their | -0.009 |
them | -0.008 |
things | -0.005 |
everything | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | -1.97e-03 |
Pos logit contributions | |
enny | +0.002 |
oured | +0.002 |
uddy | +0.002 |
unn | +0.002 |
drop | +0.002 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
things | -0.001 |
everything | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -2.14e-03 |
Pos logit contributions | |
enny | +0.004 |
uddy | +0.003 |
unn | +0.003 |
driver | +0.003 |
seek | +0.003 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
things | -0.002 |
fog | -0.002 |
Token | They |
Token ID | 2990 |
Feature activation | +3.13e-04 |
Pos logit contributions | |
enny | +0.004 |
oured | +0.004 |
unn | +0.004 |
drop | +0.004 |
ache | +0.004 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
them | -0.003 |
everything | -0.002 |
things | -0.002 |
Token | un |
Token ID | 555 |
Feature activation | +3.87e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
everything | +0.000 |
her | +0.000 |
Neg logit contributions | |
enny | -0.001 |
unn | -0.001 |
drop | -0.001 |
ucker | -0.001 |
uddy | -0.001 |
Token | hopped |
Token ID | 45230 |
Feature activation | +3.08e-06 |
Pos logit contributions | |
enny | +0.017 |
unn | +0.016 |
seek | +0.016 |
ucker | +0.016 |
ipop | +0.016 |
Neg logit contributions | |
its | -0.011 |
them | -0.010 |
their | -0.009 |
it | -0.008 |
her | -0.008 |
Token | by |
Token ID | 416 |
Feature activation | +8.36e-03 |
Token | and |
Token ID | 290 |
Feature activation | +4.51e-03 |
Pos logit contributions | |
its | +0.011 |
their | +0.009 |
them | +0.009 |
her | +0.007 |
it | +0.007 |
Neg logit contributions | |
enny | -0.018 |
unn | -0.018 |
ache | -0.018 |
ipop | -0.018 |
opus | -0.017 |
Token | saw |
Token ID | 2497 |
Feature activation | +8.66e-03 |
Pos logit contributions | |
its | +0.008 |
their | +0.007 |
them | +0.007 |
it | +0.006 |
her | +0.006 |
Neg logit contributions | |
enny | -0.008 |
unn | -0.007 |
ucker | -0.007 |
driver | -0.007 |
olly | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | +3.60e-03 |
Pos logit contributions | |
its | +0.008 |
their | +0.006 |
them | +0.006 |
her | +0.004 |
things | +0.004 |
Neg logit contributions | |
enny | -0.021 |
unn | -0.021 |
drop | -0.021 |
oured | -0.021 |
ache | -0.021 |
Token | rh |
Token ID | 9529 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
its | +0.004 |
things | +0.004 |
them | +0.004 |
their | +0.004 |
dark | +0.003 |
Neg logit contributions | |
enny | -0.008 |
seek | -0.008 |
ugg | -0.008 |
unn | -0.007 |
driver | -0.007 |
Token | in |
Token ID | 259 |
Feature activation | -4.90e-03 |
Pos logit contributions | |
oured | +0.041 |
seek | +0.041 |
enny | +0.040 |
coat | +0.040 |
ipop | +0.040 |
Neg logit contributions | |
its | -0.041 |
them | -0.037 |
their | -0.035 |
things | -0.033 |
away | -0.032 |
Token | oc |
Token ID | 420 |
Feature activation | +4.55e-02 |
Pos logit contributions | |
enny | +0.013 |
coat | +0.013 |
unn | +0.013 |
seek | +0.013 |
oured | +0.013 |
Neg logit contributions | |
its | -0.004 |
their | -0.002 |
them | -0.002 |
things | -0.002 |
it | -0.002 |
Token | eros |
Token ID | 27498 |
Feature activation | -9.77e-03 |
Pos logit contributions | |
its | +0.073 |
them | +0.063 |
their | +0.061 |
things | +0.060 |
him | +0.057 |
Neg logit contributions | |
enny | -0.080 |
coat | -0.073 |
uddy | -0.070 |
drop | -0.070 |
ipop | -0.070 |
Token | trying |
Token ID | 2111 |
Feature activation | -1.60e-03 |
Pos logit contributions | |
unn | +0.026 |
enny | +0.026 |
seek | +0.024 |
ipop | +0.024 |
uddy | +0.024 |
Neg logit contributions | |
its | -0.009 |
their | -0.007 |
them | -0.006 |
it | -0.005 |
his | -0.005 |
Token | to |
Token ID | 284 |
Feature activation | +1.73e-04 |
Pos logit contributions | |
enny | +0.003 |
unn | +0.003 |
drop | +0.003 |
oured | +0.003 |
opus | +0.003 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
her | -0.002 |
it | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | +3.38e-03 |
Pos logit contributions | |
enny | +0.008 |
seek | +0.008 |
oured | +0.008 |
drop | +0.008 |
unn | +0.008 |
Neg logit contributions | |
its | -0.005 |
their | -0.004 |
them | -0.004 |
away | -0.004 |
things | -0.004 |
Token | nice |
Token ID | 3621 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
everything | +0.003 |
things | +0.003 |
Neg logit contributions | |
unn | -0.007 |
enny | -0.007 |
driver | -0.007 |
seek | -0.007 |
oured | -0.007 |
Token | time |
Token ID | 640 |
Feature activation | +3.42e-03 |
Pos logit contributions | |
driver | +0.026 |
ache | +0.026 |
enny | +0.026 |
ider | +0.026 |
unn | +0.025 |
Neg logit contributions | |
its | -0.016 |
their | -0.016 |
them | -0.014 |
everything | -0.013 |
things | -0.012 |
Token | at |
Token ID | 379 |
Feature activation | +9.05e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
things | +0.001 |
her | +0.001 |
Neg logit contributions | |
enny | -0.009 |
ipop | -0.009 |
ache | -0.009 |
uddy | -0.009 |
unn | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | +2.25e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.004 |
things | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.023 |
oured | -0.022 |
drop | -0.022 |
unn | -0.022 |
ipop | -0.022 |
Token | park |
Token ID | 3952 |
Feature activation | -1.76e-02 |
Pos logit contributions | |
its | +0.003 |
their | +0.003 |
them | +0.003 |
things | +0.002 |
fog | +0.002 |
Neg logit contributions | |
enny | -0.005 |
driver | -0.004 |
unn | -0.004 |
ipop | -0.004 |
ache | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +2.39e-03 |
Pos logit contributions | |
enny | +0.046 |
unn | +0.045 |
ache | +0.044 |
oured | +0.044 |
driver | +0.044 |
Neg logit contributions | |
its | -0.013 |
their | -0.011 |
them | -0.010 |
her | -0.006 |
everything | -0.006 |
Token | The |
Token ID | 383 |
Feature activation | -4.50e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
everything | +0.002 |
her | +0.002 |
Neg logit contributions | |
ache | -0.005 |
drop | -0.005 |
unn | -0.005 |
driver | -0.005 |
enny | -0.005 |
Token | twins |
Token ID | 20345 |
Feature activation | +8.19e-03 |
Pos logit contributions | |
enny | +0.010 |
driver | +0.010 |
unn | +0.010 |
ache | +0.010 |
ucker | +0.010 |
Neg logit contributions | |
its | -0.005 |
them | -0.005 |
their | -0.005 |
things | -0.004 |
fog | -0.004 |
Token | enjoyed |
Token ID | 8359 |
Feature activation | -3.63e-03 |
Pos logit contributions | |
its | +0.011 |
their | +0.011 |
them | +0.010 |
it | +0.009 |
her | +0.009 |
Neg logit contributions | |
uddy | -0.017 |
unn | -0.017 |
driver | -0.017 |
ucker | -0.017 |
seek | -0.016 |
Token | their |
Token ID | 511 |
Feature activation | +5.36e-04 |
Pos logit contributions | |
enny | +0.009 |
oured | +0.009 |
drop | +0.009 |
unn | +0.008 |
ache | +0.008 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
things | -0.002 |
everything | -0.002 |
Token | treats |
Token ID | 18432 |
Feature activation | +8.60e-03 |
Pos logit contributions | |
unn | +0.005 |
drop | +0.005 |
ache | +0.005 |
ipop | +0.005 |
enny | +0.005 |
Neg logit contributions | |
its | -0.004 |
their | -0.004 |
them | -0.004 |
her | -0.003 |
everything | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | -4.62e-04 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.004 |
her | +0.003 |
things | +0.003 |
Neg logit contributions | |
enny | -0.023 |
unn | -0.022 |
oured | -0.022 |
uddy | -0.022 |
drop | -0.021 |
Token | He |
Token ID | 679 |
Feature activation | -2.10e-03 |
Pos logit contributions | |
enny | +0.001 |
� | +0.001 |
uddy | +0.001 |
oured | +0.001 |
unn | +0.001 |
Neg logit contributions | |
its | -0.001 |
their | -0.001 |
them | -0.001 |
away | -0.001 |
things | -0.001 |
Token | saw |
Token ID | 2497 |
Feature activation | +6.39e-03 |
Pos logit contributions | |
enny | +0.004 |
� | +0.004 |
driver | +0.004 |
igsaw | +0.004 |
unn | +0.004 |
Neg logit contributions | |
its | -0.003 |
their | -0.002 |
them | -0.002 |
her | -0.002 |
it | -0.002 |
Token | chocolate |
Token ID | 11311 |
Feature activation | +2.78e-03 |
Pos logit contributions | |
its | +0.007 |
their | +0.006 |
them | +0.006 |
everything | +0.004 |
things | +0.004 |
Neg logit contributions | |
enny | -0.015 |
drop | -0.014 |
uddy | -0.014 |
oured | -0.014 |
unn | -0.014 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.63e-02 |
Pos logit contributions | |
its | +0.004 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
her | +0.003 |
Neg logit contributions | |
enny | -0.005 |
unn | -0.005 |
oured | -0.005 |
uddy | -0.005 |
seek | -0.005 |
Token | cookies |
Token ID | 14746 |
Feature activation | +7.91e-03 |
Pos logit contributions | |
enny | +0.103 |
oured | +0.097 |
driver | +0.094 |
ider | +0.093 |
seek | +0.093 |
Neg logit contributions | |
its | -0.083 |
them | -0.081 |
their | -0.080 |
things | -0.075 |
everything | -0.069 |
Token | , |
Token ID | 11 |
Feature activation | -1.63e-03 |
Pos logit contributions | |
its | +0.008 |
their | +0.007 |
them | +0.007 |
her | +0.006 |
it | +0.006 |
Neg logit contributions | |
enny | -0.019 |
unn | -0.019 |
powers | -0.018 |
uddy | -0.018 |
oured | -0.018 |
Token | cheese |
Token ID | 9891 |
Feature activation | +1.90e-03 |
Pos logit contributions | |
enny | +0.003 |
uddy | +0.003 |
unn | +0.003 |
seek | +0.003 |
olly | +0.003 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
her | -0.002 |
things | -0.002 |
Token | crack |
Token ID | 8469 |
Feature activation | +4.69e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.001 |
her | +0.001 |
it | +0.001 |
Neg logit contributions | |
enny | -0.005 |
oured | -0.005 |
istent | -0.005 |
seek | -0.005 |
unn | -0.005 |
Token | ers |
Token ID | 364 |
Feature activation | +9.47e-03 |
Pos logit contributions | |
its | +0.007 |
them | +0.006 |
their | +0.006 |
things | +0.005 |
her | +0.005 |
Neg logit contributions | |
enny | -0.009 |
unn | -0.009 |
oured | -0.009 |
coach | -0.009 |
ipop | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | +2.60e-03 |
Pos logit contributions | |
its | +0.018 |
them | +0.016 |
their | +0.015 |
away | +0.015 |
south | +0.014 |
Neg logit contributions | |
enny | -0.016 |
ipop | -0.016 |
driver | -0.015 |
drop | -0.015 |
uddy | -0.015 |
Token | tool |
Token ID | 2891 |
Feature activation | +2.03e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
her | +0.004 |
everything | +0.004 |
Neg logit contributions | |
enny | -0.004 |
ache | -0.003 |
oured | -0.003 |
drop | -0.003 |
driver | -0.003 |
Token | was |
Token ID | 373 |
Feature activation | +5.40e-04 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
things | +0.002 |
it | +0.002 |
them | +0.002 |
Neg logit contributions | |
unn | -0.005 |
ucker | -0.005 |
oured | -0.005 |
igsaw | -0.005 |
istent | -0.005 |
Token | used |
Token ID | 973 |
Feature activation | +8.36e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.000 |
his | +0.000 |
out | +0.000 |
Neg logit contributions | |
unn | -0.001 |
enny | -0.001 |
uddy | -0.001 |
opus | -0.001 |
pillar | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | -1.04e-03 |
Pos logit contributions | |
its | +0.012 |
their | +0.010 |
them | +0.009 |
things | +0.009 |
his | +0.008 |
Neg logit contributions | |
opus | -0.018 |
unn | -0.018 |
enny | -0.018 |
uddy | -0.018 |
ipop | -0.018 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.57e-02 |
Pos logit contributions | |
enny | +0.002 |
unn | +0.002 |
oured | +0.002 |
ipop | +0.002 |
uddy | +0.002 |
Neg logit contributions | |
its | -0.002 |
their | -0.001 |
them | -0.001 |
her | -0.001 |
things | -0.001 |
Token | away |
Token ID | 1497 |
Feature activation | +4.51e-03 |
Pos logit contributions | |
oured | +0.104 |
enny | +0.101 |
uddy | +0.101 |
sed | +0.101 |
drop | +0.101 |
Neg logit contributions | |
them | -0.077 |
its | -0.076 |
their | -0.076 |
things | -0.075 |
him | -0.066 |
Token | at |
Token ID | 379 |
Feature activation | +5.78e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
things | +0.002 |
her | +0.002 |
Neg logit contributions | |
enny | -0.011 |
oured | -0.010 |
ache | -0.010 |
unn | -0.010 |
drop | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | +2.11e-03 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
them | +0.004 |
everything | +0.003 |
her | +0.003 |
Neg logit contributions | |
enny | -0.014 |
unn | -0.014 |
oured | -0.014 |
ache | -0.014 |
ipop | -0.014 |
Token | strange |
Token ID | 6283 |
Feature activation | +3.72e-03 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
everything | +0.002 |
Neg logit contributions | |
unn | -0.004 |
enny | -0.004 |
oured | -0.004 |
ipop | -0.004 |
driver | -0.004 |
Token | object |
Token ID | 2134 |
Feature activation | -8.88e-03 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
things | +0.003 |
everything | +0.003 |
Neg logit contributions | |
enny | -0.008 |
unn | -0.007 |
oured | -0.007 |
uddy | -0.007 |
ipop | -0.007 |
Token | It |
Token ID | 632 |
Feature activation | -2.96e-03 |
Pos logit contributions | |
ache | +0.001 |
drop | +0.000 |
driver | +0.000 |
unn | +0.000 |
seek | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
them | -0.000 |
her | -0.000 |
everything | -0.000 |
Token | was |
Token ID | 373 |
Feature activation | +6.56e-04 |
Pos logit contributions | |
unn | +0.007 |
oured | +0.007 |
enny | +0.007 |
driver | +0.007 |
ider | +0.007 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
her | -0.002 |
them | -0.002 |
it | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | +1.52e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
her | +0.000 |
them | +0.000 |
his | +0.000 |
Neg logit contributions | |
unn | -0.002 |
opus | -0.002 |
enny | -0.002 |
uddy | -0.002 |
seek | -0.002 |
Token | big |
Token ID | 1263 |
Feature activation | -1.34e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.001 |
fog | +0.001 |
them | +0.001 |
her | +0.001 |
Neg logit contributions | |
unn | -0.004 |
seek | -0.004 |
enny | -0.004 |
ives | -0.004 |
oured | -0.004 |
Token | j |
Token ID | 474 |
Feature activation | -2.47e-02 |
Pos logit contributions | |
unn | +0.003 |
enny | +0.003 |
seek | +0.003 |
ives | +0.003 |
uts | +0.003 |
Neg logit contributions | |
its | -0.002 |
their | -0.001 |
things | -0.001 |
fog | -0.001 |
it | -0.001 |
Token | igsaw |
Token ID | 45636 |
Feature activation | -6.69e-02 |
Pos logit contributions | |
ache | +0.017 |
sed | +0.016 |
driver | +0.015 |
drop | +0.014 |
seek | +0.014 |
Neg logit contributions | |
its | -0.062 |
away | -0.057 |
their | -0.057 |
them | -0.056 |
things | -0.055 |
Token | puzzle |
Token ID | 15027 |
Feature activation | -3.67e-04 |
Pos logit contributions | |
sed | +0.114 |
ucker | +0.113 |
oured | +0.113 |
unn | +0.111 |
enny | +0.110 |
Neg logit contributions | |
its | -0.100 |
their | -0.091 |
things | -0.089 |
them | -0.086 |
it | -0.084 |
Token | and |
Token ID | 290 |
Feature activation | -1.19e-04 |
Pos logit contributions | |
unn | +0.001 |
ucker | +0.001 |
oured | +0.001 |
enny | +0.001 |
sed | +0.001 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
her | -0.000 |
things | -0.000 |
them | -0.000 |
Token | she |
Token ID | 673 |
Feature activation | -1.15e-03 |
Pos logit contributions | |
unn | +0.000 |
ache | +0.000 |
uddy | +0.000 |
driver | +0.000 |
enny | +0.000 |
Neg logit contributions | |
its | -0.000 |
their | -0.000 |
it | -0.000 |
her | -0.000 |
them | -0.000 |
Token | wanted |
Token ID | 2227 |
Feature activation | -2.46e-03 |
Pos logit contributions | |
unn | +0.003 |
uddy | +0.003 |
oured | +0.003 |
� | +0.003 |
ucker | +0.003 |
Neg logit contributions | |
its | -0.001 |
it | -0.001 |
their | -0.001 |
her | -0.001 |
them | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | -1.49e-03 |
Pos logit contributions | |
unn | +0.005 |
uddy | +0.005 |
opus | +0.005 |
enny | +0.005 |
drop | +0.005 |
Neg logit contributions | |
its | -0.004 |
them | -0.003 |
their | -0.003 |
it | -0.003 |
her | -0.003 |
Token | They |
Token ID | 1119 |
Feature activation | +4.94e-03 |
Pos logit contributions | |
ache | +0.013 |
drop | +0.012 |
opus | +0.012 |
driver | +0.012 |
ider | +0.012 |
Neg logit contributions | |
its | -0.006 |
their | -0.005 |
them | -0.004 |
her | -0.004 |
it | -0.003 |
Token | ran |
Token ID | 4966 |
Feature activation | +4.89e-03 |
Pos logit contributions | |
its | +0.008 |
their | +0.007 |
them | +0.007 |
her | +0.006 |
everything | +0.006 |
Neg logit contributions | |
enny | -0.009 |
ider | -0.009 |
ucker | -0.009 |
opus | -0.009 |
seek | -0.009 |
Token | together |
Token ID | 1978 |
Feature activation | +2.18e-04 |
Pos logit contributions | |
its | +0.005 |
their | +0.004 |
them | +0.004 |
everything | +0.003 |
her | +0.003 |
Neg logit contributions | |
enny | -0.011 |
ache | -0.011 |
unn | -0.011 |
ipop | -0.011 |
drop | -0.011 |
Token | towards |
Token ID | 3371 |
Feature activation | +1.60e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
her | +0.000 |
out | +0.000 |
Neg logit contributions | |
enny | -0.001 |
ache | -0.001 |
opus | -0.001 |
unn | -0.001 |
ucker | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +1.82e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.000 |
everything | +0.000 |
Neg logit contributions | |
enny | -0.004 |
oured | -0.004 |
unn | -0.004 |
drop | -0.004 |
ache | -0.004 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.45e-02 |
Pos logit contributions | |
its | +0.003 |
their | +0.002 |
them | +0.002 |
things | +0.002 |
everything | +0.002 |
Neg logit contributions | |
enny | -0.004 |
ipop | -0.003 |
driver | -0.003 |
oured | -0.003 |
unn | -0.003 |
Token | m |
Token ID | 76 |
Feature activation | +3.36e-03 |
Pos logit contributions | |
enny | +0.075 |
oured | +0.073 |
driver | +0.069 |
seek | +0.069 |
ache | +0.067 |
Neg logit contributions | |
its | -0.102 |
their | -0.098 |
them | -0.097 |
things | -0.091 |
everything | -0.087 |
Token | unk |
Token ID | 2954 |
Feature activation | +3.72e-04 |
Pos logit contributions | |
its | +0.006 |
them | +0.006 |
their | +0.006 |
things | +0.005 |
. | +0.005 |
Neg logit contributions | |
oured | -0.005 |
seek | -0.005 |
seventy | -0.005 |
enny | -0.005 |
rook | -0.005 |
Token | 's |
Token ID | 338 |
Feature activation | +1.92e-03 |
Pos logit contributions | |
its | +0.000 |
their | +0.000 |
them | +0.000 |
out | +0.000 |
down | +0.000 |
Neg logit contributions | |
unn | -0.001 |
va | -0.001 |
ucker | -0.001 |
enny | -0.001 |
opus | -0.001 |
Token | home |
Token ID | 1363 |
Feature activation | -2.92e-03 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
things | +0.001 |
them | +0.001 |
everything | +0.001 |
Neg logit contributions | |
enny | -0.005 |
ipop | -0.005 |
va | -0.005 |
oured | -0.005 |
driver | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -2.56e-03 |
Pos logit contributions | |
unn | +0.008 |
enny | +0.007 |
opus | +0.007 |
ipop | +0.007 |
ucker | +0.007 |
Neg logit contributions | |
its | -0.002 |
their | -0.002 |
them | -0.002 |
her | -0.001 |
it | -0.001 |
Token | again |
Token ID | 757 |
Feature activation | +8.80e-04 |
Pos logit contributions | |
its | +0.006 |
their | +0.005 |
ash | +0.005 |
them | +0.005 |
fog | +0.005 |
Neg logit contributions | |
seek | -0.009 |
enny | -0.009 |
� | -0.009 |
driver | -0.009 |
drop | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | -2.73e-03 |
Pos logit contributions | |
its | +0.001 |
their | +0.001 |
them | +0.001 |
things | +0.000 |
everything | +0.000 |
Neg logit contributions | |
enny | -0.002 |
ache | -0.002 |
drop | -0.002 |
oured | -0.002 |
unn | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -7.85e-03 |
Pos logit contributions | |
enny | +0.006 |
ache | +0.006 |
drop | +0.006 |
oured | +0.006 |
ipop | +0.006 |
Neg logit contributions | |
its | -0.003 |
their | -0.003 |
them | -0.003 |
everything | -0.002 |
her | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -7.67e-03 |
Pos logit contributions | |
enny | +0.017 |
oured | +0.017 |
drop | +0.017 |
ache | +0.017 |
unn | +0.017 |
Neg logit contributions | |
its | -0.008 |
their | -0.007 |
them | -0.007 |
everything | -0.005 |
her | -0.005 |
Token | The |
Token ID | 464 |
Feature activation | -4.15e-03 |
Pos logit contributions | |
enny | +0.014 |
oured | +0.014 |
ipop | +0.014 |
unn | +0.014 |
drop | +0.014 |
Neg logit contributions | |
its | -0.011 |
their | -0.010 |
them | -0.010 |
everything | -0.008 |
her | -0.008 |
Token | chip |
Token ID | 11594 |
Feature activation | -5.62e-02 |
Pos logit contributions | |
enny | +0.008 |
seek | +0.008 |
driver | +0.007 |
unn | +0.007 |
enna | +0.007 |
Neg logit contributions | |
things | -0.007 |
their | -0.006 |
ash | -0.006 |
its | -0.006 |
the | -0.006 |
Token | mun |
Token ID | 6199 |
Feature activation | +1.39e-02 |
Pos logit contributions | |
seek | +0.097 |
enny | +0.095 |
oured | +0.094 |
driver | +0.093 |
powers | +0.091 |
Neg logit contributions | |
its | -0.087 |
their | -0.084 |
them | -0.082 |
things | -0.076 |
her | -0.074 |
Token | ks |
Token ID | 591 |
Feature activation | +1.43e-03 |
Pos logit contributions | |
its | +0.021 |
their | +0.018 |
them | +0.018 |
her | +0.015 |
out | +0.015 |
Neg logit contributions | |
enny | -0.025 |
� | -0.025 |
oured | -0.024 |
ipop | -0.024 |
icycle | -0.024 |
Token | were |
Token ID | 547 |
Feature activation | +3.51e-03 |
Pos logit contributions | |
its | +0.002 |
them | +0.002 |
their | +0.002 |
it | +0.002 |
her | +0.002 |
Neg logit contributions | |
unn | -0.003 |
salon | -0.003 |
enny | -0.003 |
seek | -0.003 |
ucker | -0.003 |
Token | so |
Token ID | 523 |
Feature activation | +1.66e-03 |
Pos logit contributions | |
its | +0.004 |
their | +0.003 |
them | +0.003 |
her | +0.003 |
his | +0.002 |
Neg logit contributions | |
enny | -0.009 |
unn | -0.009 |
driver | -0.009 |
ipop | -0.009 |
opus | -0.009 |
Token | thankful |
Token ID | 25535 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
its | +0.002 |
their | +0.002 |
them | +0.002 |
her | +0.001 |
everything | +0.001 |
Neg logit contributions | |
driver | -0.004 |
enny | -0.004 |
ipop | -0.004 |
ache | -0.004 |
drop | -0.003 |