Token | shop |
Token ID | 6128 |
Feature activation | -4.23e-04 |
Pos logit contributions | |
sound | +0.037 |
listen | +0.029 |
do | +0.029 |
listened | +0.029 |
not | +0.028 |
Neg logit contributions | |
piping | -0.042 |
endant | -0.041 |
million | -0.040 |
ocol | -0.039 |
umm | -0.039 |
Token | keeper |
Token ID | 13884 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
million | +0.000 |
endant | +0.000 |
umm | +0.000 |
brand | +0.000 |
imet | +0.000 |
Neg logit contributions | |
sound | -0.001 |
inker | -0.001 |
listen | -0.001 |
communicate | -0.001 |
ani | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +4.14e-03 |
Pos logit contributions | |
sound | +0.016 |
inker | +0.014 |
ani | +0.012 |
music | +0.011 |
listened | +0.011 |
Neg logit contributions | |
piping | -0.021 |
million | -0.020 |
imet | -0.019 |
dark | -0.019 |
endant | -0.019 |
Token | When |
Token ID | 1649 |
Feature activation | +5.35e-02 |
Pos logit contributions | |
sound | +0.007 |
do | +0.006 |
not | +0.006 |
listen | +0.006 |
listened | +0.006 |
Neg logit contributions | |
endant | -0.007 |
piping | -0.007 |
ocol | -0.006 |
million | -0.006 |
irst | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +2.25e-02 |
Pos logit contributions | |
sound | +0.083 |
tails | +0.072 |
inker | +0.070 |
ably | +0.068 |
communicate | +0.067 |
Neg logit contributions | |
million | -0.089 |
piping | -0.086 |
umm | -0.082 |
igsaw | -0.081 |
pleasure | -0.080 |
Token | jobs |
Token ID | 3946 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
sound | +0.037 |
do | +0.029 |
listen | +0.029 |
listened | +0.028 |
not | +0.028 |
Neg logit contributions | |
piping | -0.038 |
endant | -0.037 |
million | -0.036 |
ocol | -0.035 |
umm | -0.035 |
Token | were |
Token ID | 547 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
sound | +0.163 |
tails | +0.147 |
inker | +0.140 |
listen | +0.135 |
communicate | +0.130 |
Neg logit contributions | |
million | -0.167 |
� | -0.156 |
piping | -0.155 |
imet | -0.151 |
ocol | -0.147 |
Token | done |
Token ID | 1760 |
Feature activation | +4.03e-02 |
Pos logit contributions | |
sound | +0.037 |
inker | +0.028 |
do | +0.028 |
listen | +0.028 |
communicate | +0.027 |
Neg logit contributions | |
piping | -0.044 |
endant | -0.044 |
million | -0.043 |
ocol | -0.042 |
freshly | -0.041 |
Token | , |
Token ID | 11 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
sound | +0.057 |
inker | +0.046 |
tails | +0.045 |
ani | +0.043 |
communicate | +0.043 |
Neg logit contributions | |
piping | -0.073 |
million | -0.073 |
imet | -0.072 |
ocol | -0.071 |
� | -0.070 |
Token | the |
Token ID | 262 |
Feature activation | +8.75e-03 |
Pos logit contributions | |
sound | +0.028 |
tails | +0.026 |
inker | +0.024 |
behave | +0.023 |
ani | +0.023 |
Neg logit contributions | |
million | -0.022 |
piping | -0.021 |
pleasure | -0.021 |
umm | -0.020 |
igsaw | -0.020 |
Token | shop |
Token ID | 6128 |
Feature activation | +9.01e-03 |
Pos logit contributions | |
sound | +0.014 |
do | +0.011 |
listen | +0.010 |
listened | +0.010 |
not | +0.010 |
Neg logit contributions | |
piping | -0.016 |
endant | -0.015 |
million | -0.015 |
ocol | -0.015 |
umm | -0.014 |
Token | !" |
Token ID | 2474 |
Feature activation | +4.63e-03 |
Pos logit contributions | |
endant | +0.029 |
piping | +0.029 |
million | +0.028 |
umm | +0.028 |
ocol | +0.028 |
Neg logit contributions | |
sound | -0.028 |
listened | -0.022 |
listen | -0.022 |
do | -0.022 |
behave | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | -8.40e-03 |
Pos logit contributions | |
sound | +0.010 |
do | +0.008 |
listen | +0.008 |
listened | +0.008 |
not | +0.008 |
Neg logit contributions | |
piping | -0.006 |
endant | -0.005 |
million | -0.005 |
ocol | -0.005 |
imet | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
umm | +0.020 |
ocol | +0.019 |
piping | +0.018 |
endant | +0.018 |
ifying | +0.018 |
Neg logit contributions | |
sound | -0.011 |
not | -0.009 |
do | -0.009 |
slowly | -0.008 |
listened | -0.007 |
Token | As |
Token ID | 1722 |
Feature activation | +6.36e-02 |
Pos logit contributions | |
endant | +0.017 |
piping | +0.017 |
million | +0.017 |
dark | +0.016 |
ocol | +0.016 |
Neg logit contributions | |
sound | -0.017 |
do | -0.013 |
listen | -0.013 |
listened | -0.013 |
not | -0.012 |
Token | the |
Token ID | 262 |
Feature activation | +3.84e-02 |
Pos logit contributions | |
sound | +0.080 |
inker | +0.062 |
do | +0.059 |
listen | +0.059 |
ably | +0.059 |
Neg logit contributions | |
million | -0.126 |
piping | -0.121 |
camps | -0.119 |
ocol | -0.116 |
imet | -0.115 |
Token | rac |
Token ID | 3444 |
Feature activation | +9.59e-02 |
Pos logit contributions | |
sound | +0.062 |
listen | +0.052 |
ably | +0.051 |
listened | +0.051 |
do | +0.051 |
Neg logit contributions | |
endant | -0.058 |
million | -0.057 |
piping | -0.057 |
ocol | -0.056 |
umm | -0.055 |
Token | coon |
Token ID | 20912 |
Feature activation | +4.50e-02 |
Pos logit contributions | |
sound | +0.194 |
listen | +0.168 |
do | +0.161 |
not | +0.161 |
tails | +0.158 |
Neg logit contributions | |
ocol | -0.112 |
� | -0.110 |
million | -0.108 |
pill | -0.106 |
igsaw | -0.105 |
Token | crawled |
Token ID | 45668 |
Feature activation | +7.57e-03 |
Pos logit contributions | |
sound | +0.074 |
ourselves | +0.067 |
inker | +0.062 |
ics | +0.060 |
ikes | +0.059 |
Neg logit contributions | |
camps | -0.063 |
million | -0.062 |
berry | -0.059 |
� | -0.059 |
endant | -0.058 |
Token | to |
Token ID | 284 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
sound | +0.012 |
do | +0.010 |
behave | +0.010 |
obey | +0.010 |
listen | +0.010 |
Neg logit contributions | |
camps | -0.012 |
endant | -0.011 |
imet | -0.011 |
piping | -0.011 |
million | -0.011 |
Token | explore |
Token ID | 7301 |
Feature activation | +1.91e-02 |
Pos logit contributions | |
sound | +0.018 |
listened | +0.015 |
ards | +0.015 |
ably | +0.015 |
tails | +0.015 |
Neg logit contributions | |
pleasure | -0.024 |
piping | -0.023 |
camps | -0.023 |
ocol | -0.023 |
freshly | -0.023 |
Token | the |
Token ID | 262 |
Feature activation | +1.03e-03 |
Pos logit contributions | |
sound | +0.022 |
inker | +0.016 |
tails | +0.016 |
listened | +0.015 |
behave | +0.015 |
Neg logit contributions | |
piping | -0.038 |
ocol | -0.038 |
endant | -0.038 |
million | -0.037 |
camps | -0.037 |
Token | |
Token ID | 220 |
Feature activation | -4.59e-04 |
Pos logit contributions | |
sound | +0.025 |
ably | +0.024 |
happening | +0.024 |
inker | +0.023 |
ising | +0.023 |
Neg logit contributions | |
There | -0.010 |
� | -0.009 |
imet | -0.009 |
Some | -0.009 |
million | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -1.32e-03 |
Pos logit contributions | |
piping | +0.001 |
endant | +0.001 |
ocol | +0.001 |
umm | +0.001 |
million | +0.001 |
Neg logit contributions | |
sound | -0.001 |
do | -0.001 |
not | -0.001 |
listen | -0.001 |
ics | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -3.03e-03 |
Pos logit contributions | |
endant | +0.002 |
piping | +0.002 |
ocol | +0.002 |
million | +0.002 |
umm | +0.002 |
Neg logit contributions | |
sound | -0.003 |
do | -0.002 |
listen | -0.002 |
listened | -0.002 |
not | -0.002 |
Token | So |
Token ID | 2396 |
Feature activation | +3.94e-02 |
Pos logit contributions | |
million | +0.003 |
camps | +0.003 |
br | +0.003 |
Mic | +0.003 |
ction | +0.003 |
Neg logit contributions | |
sound | -0.006 |
happening | -0.005 |
ably | -0.005 |
ics | -0.005 |
listening | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | +3.34e-02 |
Pos logit contributions | |
sound | +0.059 |
ics | +0.053 |
ably | +0.053 |
behave | +0.049 |
inker | +0.049 |
Neg logit contributions | |
million | -0.061 |
camps | -0.057 |
imet | -0.057 |
Once | -0.057 |
piping | -0.056 |
Token | Stri |
Token ID | 26137 |
Feature activation | +9.12e-02 |
Pos logit contributions | |
sound | +0.058 |
ably | +0.057 |
ics | +0.056 |
inker | +0.053 |
gging | +0.051 |
Neg logit contributions | |
camps | -0.040 |
million | -0.040 |
cel | -0.038 |
There | -0.037 |
imet | -0.036 |
Token | pe |
Token ID | 431 |
Feature activation | +5.18e-02 |
Pos logit contributions | |
sound | +0.163 |
her | +0.134 |
music | +0.131 |
inker | +0.126 |
loudly | +0.124 |
Neg logit contributions | |
� | -0.119 |
endant | -0.117 |
imet | -0.113 |
dark | -0.104 |
seventy | -0.104 |
Token | and |
Token ID | 290 |
Feature activation | +3.12e-02 |
Pos logit contributions | |
sound | +0.076 |
inker | +0.074 |
ourselves | +0.071 |
oa | +0.068 |
behave | +0.067 |
Neg logit contributions | |
dark | -0.074 |
pad | -0.072 |
endant | -0.068 |
camps | -0.068 |
imet | -0.065 |
Token | his |
Token ID | 465 |
Feature activation | +3.58e-02 |
Pos logit contributions | |
inker | +0.037 |
sound | +0.036 |
ably | +0.035 |
ics | +0.034 |
ising | +0.034 |
Neg logit contributions | |
million | -0.052 |
cuc | -0.050 |
camps | -0.050 |
piping | -0.049 |
bead | -0.049 |
Token | friends |
Token ID | 2460 |
Feature activation | +4.28e-02 |
Pos logit contributions | |
sound | +0.049 |
listen | +0.037 |
listened | +0.037 |
do | +0.037 |
behave | +0.035 |
Neg logit contributions | |
endant | -0.066 |
piping | -0.066 |
ocol | -0.063 |
million | -0.063 |
camps | -0.063 |
Token | got |
Token ID | 1392 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
sound | +0.078 |
inker | +0.066 |
ourselves | +0.063 |
ising | +0.063 |
yourself | +0.059 |
Neg logit contributions | |
imet | -0.054 |
camps | -0.052 |
pad | -0.051 |
million | -0.050 |
cuc | -0.048 |
Token | go |
Token ID | 467 |
Feature activation | -6.52e-03 |
Pos logit contributions | |
piping | +0.023 |
pleasure | +0.023 |
million | +0.022 |
endant | +0.022 |
impact | +0.022 |
Neg logit contributions | |
sound | -0.018 |
ards | -0.016 |
inker | -0.016 |
ics | -0.016 |
tails | -0.015 |
Token | away |
Token ID | 1497 |
Feature activation | -5.78e-03 |
Pos logit contributions | |
million | +0.010 |
brand | +0.010 |
camps | +0.010 |
oming | +0.010 |
freshly | +0.010 |
Neg logit contributions | |
sound | -0.009 |
ics | -0.008 |
gging | -0.008 |
listened | -0.008 |
communicate | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -1.57e-03 |
Pos logit contributions | |
million | +0.010 |
camps | +0.009 |
joy | +0.009 |
brand | +0.009 |
Once | +0.009 |
Neg logit contributions | |
sound | -0.008 |
inker | -0.007 |
tails | -0.007 |
ics | -0.007 |
ards | -0.007 |
Token | Max |
Token ID | 5436 |
Feature activation | +3.30e-02 |
Pos logit contributions | |
piping | +0.003 |
endant | +0.003 |
ocol | +0.003 |
umm | +0.003 |
million | +0.003 |
Neg logit contributions | |
sound | -0.002 |
do | -0.002 |
not | -0.002 |
listened | -0.002 |
listen | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | +2.65e-02 |
Pos logit contributions | |
sound | +0.051 |
inker | +0.046 |
ics | +0.046 |
communicate | +0.044 |
ourselves | +0.044 |
Neg logit contributions | |
million | -0.047 |
endant | -0.045 |
pad | -0.044 |
Wouldn | -0.044 |
imet | -0.042 |
Token | Scot |
Token ID | 7130 |
Feature activation | +9.11e-02 |
Pos logit contributions | |
sound | +0.050 |
ics | +0.044 |
ably | +0.043 |
ising | +0.041 |
loudly | +0.041 |
Neg logit contributions | |
ocol | -0.030 |
million | -0.030 |
camps | -0.029 |
imet | -0.029 |
piping | -0.028 |
Token | ty |
Token ID | 774 |
Feature activation | +5.14e-02 |
Pos logit contributions | |
sound | +0.146 |
music | +0.126 |
listen | +0.125 |
do | +0.125 |
poses | +0.124 |
Neg logit contributions | |
mo | -0.119 |
irst | -0.114 |
million | -0.110 |
dark | -0.105 |
ann | -0.104 |
Token | were |
Token ID | 547 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
sound | +0.084 |
inker | +0.069 |
not | +0.063 |
gging | +0.062 |
ikes | +0.062 |
Neg logit contributions | |
endant | -0.077 |
million | -0.075 |
irst | -0.072 |
camps | -0.071 |
piping | -0.070 |
Token | happy |
Token ID | 3772 |
Feature activation | +1.07e-03 |
Pos logit contributions | |
sound | +0.034 |
listen | +0.028 |
inker | +0.028 |
do | +0.027 |
ably | +0.026 |
Neg logit contributions | |
piping | -0.037 |
million | -0.037 |
pleasure | -0.036 |
endant | -0.036 |
brand | -0.034 |
Token | . |
Token ID | 13 |
Feature activation | +1.96e-03 |
Pos logit contributions | |
sound | +0.001 |
do | +0.001 |
listen | +0.001 |
behave | +0.001 |
inker | +0.001 |
Neg logit contributions | |
endant | -0.002 |
piping | -0.002 |
million | -0.002 |
imet | -0.002 |
umm | -0.002 |
Token | They |
Token ID | 1119 |
Feature activation | +2.45e-02 |
Pos logit contributions | |
sound | +0.003 |
do | +0.003 |
listen | +0.002 |
not | +0.002 |
listened | +0.002 |
Neg logit contributions | |
piping | -0.003 |
endant | -0.003 |
ocol | -0.003 |
million | -0.003 |
umm | -0.003 |
Token | that |
Token ID | 326 |
Feature activation | -4.64e-03 |
Pos logit contributions | |
igsaw | +0.006 |
piping | +0.006 |
endant | +0.006 |
million | +0.006 |
brand | +0.006 |
Neg logit contributions | |
sound | -0.006 |
inker | -0.005 |
tails | -0.005 |
ards | -0.005 |
communicate | -0.005 |
Token | if |
Token ID | 611 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
million | +0.008 |
piping | +0.007 |
imet | +0.007 |
endant | +0.007 |
freshly | +0.007 |
Neg logit contributions | |
sound | -0.007 |
inker | -0.006 |
tails | -0.006 |
gging | -0.005 |
ani | -0.005 |
Token | she |
Token ID | 673 |
Feature activation | +7.01e-03 |
Pos logit contributions | |
sound | +0.015 |
inker | +0.011 |
ards | +0.011 |
tails | +0.011 |
communicate | +0.011 |
Neg logit contributions | |
endant | -0.018 |
million | -0.018 |
ocol | -0.018 |
piping | -0.018 |
imet | -0.017 |
Token | did |
Token ID | 750 |
Feature activation | +5.25e-02 |
Pos logit contributions | |
sound | +0.011 |
tails | +0.008 |
inker | +0.008 |
ics | +0.008 |
listen | +0.007 |
Neg logit contributions | |
endant | -0.012 |
piping | -0.012 |
million | -0.012 |
dark | -0.012 |
imet | -0.012 |
Token | her |
Token ID | 607 |
Feature activation | +9.49e-03 |
Pos logit contributions | |
sound | +0.081 |
inker | +0.076 |
ani | +0.075 |
ards | +0.070 |
ics | +0.069 |
Neg logit contributions | |
million | -0.074 |
piping | -0.073 |
brand | -0.071 |
imet | -0.067 |
Which | -0.066 |
Token | chores |
Token ID | 46173 |
Feature activation | +8.96e-02 |
Pos logit contributions | |
sound | +0.017 |
ards | +0.016 |
ani | +0.015 |
w | +0.015 |
tails | +0.015 |
Neg logit contributions | |
pleasure | -0.012 |
piping | -0.010 |
imet | -0.010 |
igsaw | -0.010 |
brand | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | +9.08e-03 |
Pos logit contributions | |
sound | +0.121 |
tails | +0.114 |
inker | +0.096 |
communicate | +0.096 |
ram | +0.094 |
Neg logit contributions | |
� | -0.152 |
million | -0.150 |
imet | -0.149 |
igsaw | -0.148 |
piping | -0.143 |
Token | she |
Token ID | 673 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
sound | +0.013 |
inker | +0.011 |
tails | +0.010 |
ics | +0.010 |
ably | +0.010 |
Neg logit contributions | |
piping | -0.015 |
million | -0.015 |
freshly | -0.015 |
endant | -0.015 |
ocol | -0.015 |
Token | could |
Token ID | 714 |
Feature activation | +2.84e-03 |
Pos logit contributions | |
endant | +0.017 |
million | +0.016 |
piping | +0.015 |
dark | +0.015 |
imet | +0.015 |
Neg logit contributions | |
sound | -0.019 |
inker | -0.016 |
ics | -0.015 |
music | -0.014 |
listen | -0.014 |
Token | still |
Token ID | 991 |
Feature activation | +3.14e-02 |
Pos logit contributions | |
sound | +0.004 |
inker | +0.003 |
ards | +0.003 |
ably | +0.003 |
tails | +0.003 |
Neg logit contributions | |
� | -0.005 |
piping | -0.005 |
pleasure | -0.005 |
impact | -0.005 |
imet | -0.005 |
Token | get |
Token ID | 651 |
Feature activation | +1.66e-02 |
Pos logit contributions | |
sound | +0.043 |
inker | +0.037 |
tails | +0.035 |
ards | +0.034 |
loudly | +0.034 |
Neg logit contributions | |
piping | -0.052 |
pleasure | -0.051 |
freshly | -0.049 |
� | -0.049 |
impact | -0.049 |
Token | again |
Token ID | 757 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
sound | +0.020 |
do | +0.014 |
listened | +0.014 |
listen | +0.013 |
behave | +0.013 |
Neg logit contributions | |
piping | -0.039 |
endant | -0.039 |
million | -0.039 |
ocol | -0.038 |
umm | -0.037 |
Token | . |
Token ID | 13 |
Feature activation | +3.11e-03 |
Pos logit contributions | |
million | +0.020 |
endant | +0.019 |
joy | +0.019 |
ocol | +0.019 |
freshly | +0.019 |
Neg logit contributions | |
sound | -0.014 |
ics | -0.012 |
inker | -0.011 |
ably | -0.011 |
behave | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
sound | +0.006 |
do | +0.005 |
listen | +0.005 |
not | +0.005 |
listened | +0.005 |
Neg logit contributions | |
piping | -0.005 |
endant | -0.005 |
ocol | -0.005 |
million | -0.004 |
umm | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
endant | +0.017 |
piping | +0.016 |
umm | +0.016 |
ocol | +0.016 |
million | +0.015 |
Neg logit contributions | |
sound | -0.020 |
do | -0.017 |
not | -0.017 |
listen | -0.016 |
listened | -0.016 |
Token | R |
Token ID | 49 |
Feature activation | +3.89e-02 |
Pos logit contributions | |
million | +0.015 |
piping | +0.015 |
endant | +0.014 |
camps | +0.014 |
Wouldn | +0.014 |
Neg logit contributions | |
sound | -0.020 |
do | -0.015 |
listen | -0.015 |
listened | -0.015 |
inker | -0.015 |
Token | over |
Token ID | 2502 |
Feature activation | +8.94e-02 |
Pos logit contributions | |
sound | +0.063 |
do | +0.048 |
listen | +0.047 |
listened | +0.047 |
not | +0.045 |
Neg logit contributions | |
piping | -0.067 |
endant | -0.067 |
ocol | -0.065 |
million | -0.064 |
imet | -0.062 |
Token | wanted |
Token ID | 2227 |
Feature activation | -2.37e-02 |
Pos logit contributions | |
sound | +0.121 |
communicate | +0.110 |
tails | +0.110 |
inker | +0.109 |
listen | +0.103 |
Neg logit contributions | |
million | -0.143 |
endant | -0.137 |
dark | -0.131 |
There | -0.126 |
imet | -0.125 |
Token | to |
Token ID | 284 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
piping | +0.040 |
imet | +0.040 |
pleasure | +0.039 |
million | +0.038 |
camps | +0.038 |
Neg logit contributions | |
sound | -0.034 |
inker | -0.027 |
ising | -0.026 |
ics | -0.026 |
tails | -0.025 |
Token | go |
Token ID | 467 |
Feature activation | +3.70e-03 |
Pos logit contributions | |
sound | +0.016 |
ards | +0.014 |
ably | +0.013 |
inker | +0.013 |
ising | +0.013 |
Neg logit contributions | |
piping | -0.018 |
pleasure | -0.018 |
million | -0.017 |
endant | -0.017 |
tow | -0.017 |
Token | home |
Token ID | 1363 |
Feature activation | -1.06e-03 |
Pos logit contributions | |
sound | +0.006 |
do | +0.004 |
listen | +0.004 |
listened | +0.004 |
not | +0.004 |
Neg logit contributions | |
piping | -0.007 |
endant | -0.007 |
million | -0.006 |
ocol | -0.006 |
umm | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | -1.84e-04 |
Pos logit contributions | |
joy | +0.002 |
pleasure | +0.001 |
brand | +0.001 |
camps | +0.001 |
Once | +0.001 |
Neg logit contributions | |
sound | -0.002 |
w | -0.002 |
inker | -0.001 |
ards | -0.001 |
listened | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
endant | +0.021 |
ocol | +0.020 |
umm | +0.020 |
piping | +0.019 |
freshly | +0.018 |
Neg logit contributions | |
sound | -0.016 |
do | -0.014 |
not | -0.014 |
listen | -0.013 |
listened | -0.013 |
Token | " |
Token ID | 1 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
million | +0.018 |
piping | +0.017 |
dark | +0.017 |
endant | +0.017 |
imet | +0.016 |
Neg logit contributions | |
sound | -0.018 |
do | -0.014 |
listen | -0.014 |
listened | -0.013 |
tails | -0.013 |
Token | Hello |
Token ID | 15496 |
Feature activation | -5.57e-02 |
Pos logit contributions | |
sound | +0.040 |
do | +0.033 |
listen | +0.032 |
listened | +0.032 |
not | +0.031 |
Neg logit contributions | |
endant | -0.028 |
piping | -0.028 |
ocol | -0.026 |
million | -0.026 |
umm | -0.025 |
Token | !" |
Token ID | 2474 |
Feature activation | +2.09e-02 |
Pos logit contributions | |
piping | +0.117 |
endant | +0.116 |
ocol | +0.112 |
million | +0.112 |
umm | +0.109 |
Neg logit contributions | |
sound | -0.069 |
do | -0.051 |
listen | -0.048 |
listened | -0.047 |
not | -0.045 |
Token | the |
Token ID | 262 |
Feature activation | +2.85e-02 |
Pos logit contributions | |
sound | +0.026 |
inker | +0.026 |
ics | +0.025 |
ably | +0.024 |
behave | +0.024 |
Neg logit contributions | |
million | -0.036 |
There | -0.036 |
dark | -0.035 |
piping | -0.034 |
cuc | -0.033 |
Token | rac |
Token ID | 3444 |
Feature activation | +8.87e-02 |
Pos logit contributions | |
sound | +0.053 |
listen | +0.046 |
listened | +0.045 |
ably | +0.045 |
obey | +0.044 |
Neg logit contributions | |
piping | -0.037 |
million | -0.037 |
endant | -0.036 |
umm | -0.033 |
ocol | -0.033 |
Token | coon |
Token ID | 20912 |
Feature activation | +3.57e-02 |
Pos logit contributions | |
sound | +0.179 |
listen | +0.151 |
do | +0.148 |
tails | +0.145 |
not | +0.144 |
Neg logit contributions | |
ocol | -0.102 |
million | -0.099 |
� | -0.097 |
endant | -0.097 |
igsaw | -0.095 |
Token | said |
Token ID | 531 |
Feature activation | -1.17e-03 |
Pos logit contributions | |
sound | +0.043 |
inker | +0.042 |
ourselves | +0.040 |
ics | +0.039 |
behave | +0.038 |
Neg logit contributions | |
million | -0.060 |
endant | -0.059 |
dark | -0.058 |
piping | -0.056 |
berry | -0.055 |
Token | . |
Token ID | 13 |
Feature activation | -2.85e-03 |
Pos logit contributions | |
joy | +0.002 |
piping | +0.002 |
imet | +0.002 |
million | +0.002 |
pleasure | +0.002 |
Neg logit contributions | |
sound | -0.001 |
inker | -0.001 |
w | -0.001 |
behave | -0.001 |
ics | -0.001 |
Token | |
Token ID | 220 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
piping | +0.005 |
endant | +0.005 |
ocol | +0.005 |
umm | +0.005 |
million | +0.005 |
Neg logit contributions | |
sound | -0.004 |
not | -0.004 |
do | -0.003 |
listened | -0.003 |
listen | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -1.49e-02 |
Pos logit contributions | |
piping | +0.024 |
endant | +0.024 |
ocol | +0.023 |
umm | +0.023 |
million | +0.022 |
Neg logit contributions | |
sound | -0.023 |
not | -0.020 |
do | -0.020 |
listen | -0.018 |
loudly | -0.017 |
Token | a |
Token ID | 257 |
Feature activation | -2.42e-02 |
Pos logit contributions | |
endant | +0.016 |
piping | +0.016 |
million | +0.016 |
ocol | +0.016 |
camps | +0.016 |
Neg logit contributions | |
sound | -0.011 |
inker | -0.008 |
listen | -0.008 |
do | -0.008 |
listened | -0.008 |
Token | place |
Token ID | 1295 |
Feature activation | -1.11e-03 |
Pos logit contributions | |
piping | +0.039 |
endant | +0.039 |
million | +0.037 |
ocol | +0.037 |
umm | +0.036 |
Neg logit contributions | |
sound | -0.041 |
do | -0.032 |
listen | -0.032 |
listened | -0.032 |
not | -0.031 |
Token | where |
Token ID | 810 |
Feature activation | -6.25e-03 |
Pos logit contributions | |
endant | +0.002 |
brand | +0.002 |
piping | +0.002 |
freshly | +0.002 |
million | +0.002 |
Neg logit contributions | |
sound | -0.002 |
inker | -0.001 |
listened | -0.001 |
gging | -0.001 |
tails | -0.001 |
Token | scientists |
Token ID | 5519 |
Feature activation | +5.06e-02 |
Pos logit contributions | |
million | +0.011 |
endant | +0.010 |
There | +0.010 |
dark | +0.010 |
diamonds | +0.010 |
Neg logit contributions | |
sound | -0.008 |
ising | -0.007 |
gging | -0.007 |
ably | -0.007 |
inker | -0.007 |
Token | did |
Token ID | 750 |
Feature activation | +5.01e-02 |
Pos logit contributions | |
sound | +0.076 |
inker | +0.066 |
tails | +0.060 |
loudly | +0.059 |
ani | +0.057 |
Neg logit contributions | |
endant | -0.081 |
freshly | -0.080 |
piping | -0.078 |
million | -0.075 |
ocol | -0.075 |
Token | experiments |
Token ID | 10256 |
Feature activation | +8.86e-02 |
Pos logit contributions | |
sound | +0.064 |
ani | +0.058 |
inker | +0.058 |
tails | +0.055 |
ably | +0.051 |
Neg logit contributions | |
brand | -0.084 |
endant | -0.084 |
million | -0.082 |
freshly | -0.081 |
piping | -0.077 |
Token | . |
Token ID | 13 |
Feature activation | +4.95e-03 |
Pos logit contributions | |
sound | +0.121 |
inker | +0.106 |
ani | +0.105 |
tails | +0.105 |
listened | +0.093 |
Neg logit contributions | |
brand | -0.142 |
endant | -0.142 |
million | -0.140 |
dark | -0.138 |
imet | -0.137 |
Token | Jack |
Token ID | 3619 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
sound | +0.009 |
do | +0.007 |
listen | +0.007 |
listened | +0.007 |
not | +0.007 |
Neg logit contributions | |
piping | -0.007 |
endant | -0.007 |
ocol | -0.007 |
million | -0.007 |
umm | -0.007 |
Token | thought |
Token ID | 1807 |
Feature activation | -5.37e-03 |
Pos logit contributions | |
sound | +0.033 |
ourselves | +0.028 |
inker | +0.027 |
listen | +0.025 |
communicate | +0.024 |
Neg logit contributions | |
million | -0.027 |
camps | -0.025 |
endant | -0.025 |
piping | -0.025 |
berry | -0.025 |
Token | it |
Token ID | 340 |
Feature activation | -2.49e-02 |
Pos logit contributions | |
piping | +0.009 |
ocol | +0.009 |
imet | +0.009 |
brand | +0.008 |
igsaw | +0.008 |
Neg logit contributions | |
sound | -0.009 |
tails | -0.007 |
inker | -0.007 |
listened | -0.006 |
ising | -0.006 |
Token | was |
Token ID | 373 |
Feature activation | -7.49e-03 |
Pos logit contributions | |
brand | +0.034 |
million | +0.032 |
dark | +0.030 |
There | +0.029 |
Wouldn | +0.029 |
Neg logit contributions | |
ani | -0.040 |
sound | -0.039 |
obey | -0.038 |
inker | -0.037 |
ister | -0.037 |
Token | and |
Token ID | 290 |
Feature activation | -7.61e-03 |
Pos logit contributions | |
sound | +0.037 |
inker | +0.035 |
obey | +0.034 |
behave | +0.033 |
listen | +0.032 |
Neg logit contributions | |
berry | -0.047 |
million | -0.047 |
joy | -0.046 |
camps | -0.045 |
pad | -0.045 |
Token | listened |
Token ID | 16399 |
Feature activation | +1.88e-02 |
Pos logit contributions | |
million | +0.010 |
piping | +0.010 |
endant | +0.010 |
There | +0.009 |
camps | +0.009 |
Neg logit contributions | |
sound | -0.012 |
inker | -0.012 |
ics | -0.011 |
oo | -0.011 |
gg | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | +2.89e-03 |
Pos logit contributions | |
sound | +0.029 |
inker | +0.025 |
behave | +0.025 |
ards | +0.024 |
tails | +0.024 |
Neg logit contributions | |
brand | -0.030 |
imet | -0.029 |
million | -0.028 |
dark | -0.028 |
endant | -0.028 |
Token | When |
Token ID | 1649 |
Feature activation | +5.37e-02 |
Pos logit contributions | |
sound | +0.005 |
do | +0.004 |
listen | +0.004 |
her | +0.004 |
not | +0.004 |
Neg logit contributions | |
endant | -0.005 |
ocol | -0.005 |
piping | -0.005 |
umm | -0.004 |
camps | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +2.83e-02 |
Pos logit contributions | |
sound | +0.073 |
ably | +0.061 |
gging | +0.061 |
behave | +0.061 |
ards | +0.059 |
Neg logit contributions | |
million | -0.097 |
piping | -0.092 |
imet | -0.087 |
freshly | -0.087 |
brand | -0.086 |
Token | noises |
Token ID | 26782 |
Feature activation | +8.86e-02 |
Pos logit contributions | |
sound | +0.048 |
behave | +0.043 |
listen | +0.042 |
ics | +0.042 |
not | +0.042 |
Neg logit contributions | |
piping | -0.040 |
million | -0.039 |
endant | -0.039 |
umm | -0.038 |
igsaw | -0.037 |
Token | didn |
Token ID | 1422 |
Feature activation | +4.83e-02 |
Pos logit contributions | |
sound | +0.154 |
tails | +0.152 |
inker | +0.141 |
ourselves | +0.139 |
behave | +0.136 |
Neg logit contributions | |
million | -0.117 |
dark | -0.105 |
There | -0.103 |
imet | -0.101 |
omed | -0.099 |
Token | 't |
Token ID | 470 |
Feature activation | +4.54e-03 |
Pos logit contributions | |
sound | +0.073 |
listened | +0.056 |
listen | +0.053 |
do | +0.053 |
behave | +0.052 |
Neg logit contributions | |
piping | -0.085 |
million | -0.082 |
endant | -0.082 |
imet | -0.080 |
ocol | -0.080 |
Token | stop |
Token ID | 2245 |
Feature activation | +3.63e-02 |
Pos logit contributions | |
sound | +0.006 |
tails | +0.005 |
ards | +0.005 |
inker | +0.005 |
ics | +0.005 |
Neg logit contributions | |
million | -0.008 |
piping | -0.008 |
pleasure | -0.007 |
imet | -0.007 |
dark | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | -4.38e-03 |
Pos logit contributions | |
sound | +0.045 |
listened | +0.037 |
behave | +0.036 |
inker | +0.036 |
ics | +0.034 |
Neg logit contributions | |
ocol | -0.068 |
piping | -0.068 |
million | -0.068 |
freshly | -0.065 |
joy | -0.065 |
Token | she |
Token ID | 673 |
Feature activation | -9.60e-03 |
Pos logit contributions | |
million | +0.008 |
freshly | +0.007 |
brand | +0.007 |
piping | +0.007 |
endant | +0.007 |
Neg logit contributions | |
sound | -0.006 |
ics | -0.006 |
behave | -0.005 |
inker | -0.005 |
ably | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | -7.59e-03 |
Pos logit contributions | |
sound | +0.005 |
do | +0.004 |
listen | +0.004 |
listened | +0.004 |
not | +0.004 |
Neg logit contributions | |
endant | -0.005 |
piping | -0.004 |
ocol | -0.004 |
million | -0.004 |
umm | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | -7.32e-03 |
Pos logit contributions | |
endant | +0.014 |
umm | +0.013 |
ocol | +0.013 |
piping | +0.012 |
million | +0.012 |
Neg logit contributions | |
sound | -0.012 |
do | -0.011 |
not | -0.011 |
listened | -0.010 |
listen | -0.010 |
Token | After |
Token ID | 3260 |
Feature activation | +5.79e-02 |
Pos logit contributions | |
piping | +0.011 |
million | +0.011 |
endant | +0.011 |
ocol | +0.010 |
dark | +0.010 |
Neg logit contributions | |
sound | -0.013 |
do | -0.011 |
listen | -0.010 |
listened | -0.010 |
not | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | +3.50e-02 |
Pos logit contributions | |
sound | +0.087 |
ably | +0.072 |
inker | +0.068 |
ignore | +0.065 |
ising | +0.064 |
Neg logit contributions | |
piping | -0.099 |
million | -0.097 |
� | -0.096 |
ocol | -0.095 |
freshly | -0.093 |
Token | few |
Token ID | 1178 |
Feature activation | +5.50e-02 |
Pos logit contributions | |
sound | +0.053 |
do | +0.041 |
listen | +0.040 |
listened | +0.037 |
not | +0.036 |
Neg logit contributions | |
endant | -0.071 |
ocol | -0.068 |
piping | -0.067 |
umm | -0.064 |
dark | -0.062 |
Token | rounds |
Token ID | 9196 |
Feature activation | +8.84e-02 |
Pos logit contributions | |
sound | +0.135 |
do | +0.114 |
listen | +0.113 |
inker | +0.112 |
not | +0.111 |
Neg logit contributions | |
piping | -0.048 |
million | -0.045 |
ocol | -0.043 |
endant | -0.042 |
imet | -0.038 |
Token | , |
Token ID | 11 |
Feature activation | +2.05e-02 |
Pos logit contributions | |
sound | +0.160 |
listened | +0.133 |
tails | +0.132 |
listen | +0.132 |
inker | +0.131 |
Neg logit contributions | |
ocol | -0.118 |
imet | -0.115 |
million | -0.115 |
igsaw | -0.108 |
There | -0.107 |
Token | it |
Token ID | 340 |
Feature activation | -2.34e-04 |
Pos logit contributions | |
sound | +0.041 |
inker | +0.037 |
behave | +0.036 |
tails | +0.035 |
do | +0.034 |
Neg logit contributions | |
million | -0.024 |
piping | -0.022 |
pleasure | -0.022 |
lettuce | -0.021 |
cuc | -0.020 |
Token | was |
Token ID | 373 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
million | +0.000 |
camps | +0.000 |
endant | +0.000 |
dark | +0.000 |
transformed | +0.000 |
Neg logit contributions | |
sound | -0.000 |
listen | -0.000 |
tails | -0.000 |
inker | -0.000 |
obey | -0.000 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
sound | +0.019 |
do | +0.014 |
listen | +0.014 |
listened | +0.014 |
not | +0.013 |
Neg logit contributions | |
piping | -0.026 |
endant | -0.025 |
million | -0.025 |
ocol | -0.024 |
umm | -0.024 |
Token | One |
Token ID | 3198 |
Feature activation | +1.03e-03 |
Pos logit contributions | |
endant | +0.023 |
piping | +0.022 |
ocol | +0.021 |
umm | +0.020 |
brand | +0.020 |
Neg logit contributions | |
sound | -0.028 |
do | -0.025 |
her | -0.023 |
listened | -0.023 |
when | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | +3.26e-03 |
Pos logit contributions | |
sound | +0.035 |
tails | +0.033 |
listened | +0.031 |
listen | +0.029 |
obey | +0.029 |
Neg logit contributions | |
million | -0.050 |
camps | -0.049 |
ocol | -0.049 |
brand | -0.048 |
igsaw | -0.047 |
Token | |
Token ID | 220 |
Feature activation | -7.61e-03 |
Pos logit contributions | |
sound | +0.006 |
do | +0.005 |
not | +0.005 |
listen | +0.005 |
listened | +0.005 |
Neg logit contributions | |
endant | -0.005 |
piping | -0.005 |
ocol | -0.005 |
million | -0.005 |
dark | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | -7.90e-03 |
Pos logit contributions | |
piping | +0.012 |
endant | +0.012 |
ocol | +0.012 |
umm | +0.011 |
million | +0.011 |
Neg logit contributions | |
sound | -0.013 |
do | -0.011 |
not | -0.011 |
listen | -0.011 |
listened | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | -7.39e-03 |
Pos logit contributions | |
endant | +0.013 |
ocol | +0.012 |
piping | +0.012 |
umm | +0.012 |
igsaw | +0.011 |
Neg logit contributions | |
sound | -0.014 |
do | -0.012 |
not | -0.012 |
listen | -0.012 |
listened | -0.012 |
Token | R |
Token ID | 49 |
Feature activation | +3.72e-02 |
Pos logit contributions | |
piping | +0.011 |
million | +0.011 |
endant | +0.010 |
camps | +0.010 |
ocol | +0.010 |
Neg logit contributions | |
sound | -0.013 |
do | -0.010 |
listen | -0.010 |
listened | -0.010 |
not | -0.010 |
Token | over |
Token ID | 2502 |
Feature activation | +8.78e-02 |
Pos logit contributions | |
sound | +0.066 |
do | +0.051 |
listened | +0.050 |
listen | +0.050 |
not | +0.048 |
Neg logit contributions | |
piping | -0.057 |
ocol | -0.056 |
endant | -0.056 |
million | -0.054 |
camps | -0.054 |
Token | stayed |
Token ID | 9658 |
Feature activation | +2.12e-02 |
Pos logit contributions | |
sound | +0.127 |
inker | +0.114 |
tails | +0.113 |
communicate | +0.110 |
listen | +0.104 |
Neg logit contributions | |
million | -0.135 |
endant | -0.133 |
piping | -0.126 |
seventy | -0.125 |
dark | -0.125 |
Token | away |
Token ID | 1497 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
sound | +0.029 |
inker | +0.024 |
do | +0.023 |
listen | +0.023 |
ards | +0.023 |
Neg logit contributions | |
joy | -0.036 |
camps | -0.035 |
million | -0.035 |
piping | -0.035 |
brand | -0.035 |
Token | for |
Token ID | 329 |
Feature activation | +5.84e-02 |
Pos logit contributions | |
million | +0.021 |
camps | +0.021 |
joy | +0.020 |
asleep | +0.020 |
pleasure | +0.019 |
Neg logit contributions | |
sound | -0.016 |
inker | -0.015 |
tails | -0.015 |
ards | -0.015 |
communicate | -0.014 |
Token | a |
Token ID | 257 |
Feature activation | +9.67e-03 |
Pos logit contributions | |
sound | +0.078 |
ics | +0.060 |
inker | +0.060 |
do | +0.057 |
tails | +0.056 |
Neg logit contributions | |
piping | -0.107 |
million | -0.104 |
ocol | -0.104 |
pleasure | -0.102 |
camps | -0.101 |
Token | while |
Token ID | 981 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
sound | +0.014 |
do | +0.010 |
listen | +0.010 |
listened | +0.010 |
not | +0.009 |
Neg logit contributions | |
endant | -0.019 |
piping | -0.019 |
ocol | -0.019 |
umm | -0.018 |
million | -0.018 |
Token | home |
Token ID | 1363 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
endant | +0.073 |
piping | +0.070 |
million | +0.070 |
camps | +0.068 |
ocol | +0.067 |
Neg logit contributions | |
sound | -0.066 |
listened | -0.055 |
listen | -0.052 |
do | -0.052 |
communicate | -0.051 |
Token | . |
Token ID | 13 |
Feature activation | +1.91e-03 |
Pos logit contributions | |
million | +0.027 |
brand | +0.026 |
endant | +0.025 |
igsaw | +0.025 |
camps | +0.024 |
Neg logit contributions | |
sound | -0.022 |
listened | -0.020 |
inker | -0.020 |
listen | -0.019 |
communicate | -0.019 |
Token |
|
Token ID | 198 |
Feature activation | -9.77e-03 |
Pos logit contributions | |
sound | +0.003 |
do | +0.003 |
listen | +0.003 |
not | +0.003 |
listened | +0.003 |
Neg logit contributions | |
endant | -0.003 |
piping | -0.003 |
ocol | -0.003 |
million | -0.003 |
umm | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
endant | +0.016 |
umm | +0.015 |
ocol | +0.015 |
piping | +0.015 |
million | +0.014 |
Neg logit contributions | |
sound | -0.017 |
do | -0.015 |
not | -0.014 |
listen | -0.014 |
listened | -0.014 |
Token | R |
Token ID | 49 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
piping | +0.015 |
million | +0.015 |
endant | +0.014 |
ocol | +0.014 |
camps | +0.014 |
Neg logit contributions | |
sound | -0.018 |
do | -0.014 |
listen | -0.014 |
listened | -0.014 |
not | -0.014 |
Token | over |
Token ID | 2502 |
Feature activation | +8.75e-02 |
Pos logit contributions | |
sound | +0.059 |
do | +0.044 |
listen | +0.044 |
listened | +0.044 |
not | +0.043 |
Neg logit contributions | |
piping | -0.057 |
endant | -0.056 |
ocol | -0.055 |
million | -0.054 |
imet | -0.054 |
Token | was |
Token ID | 373 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
sound | +0.127 |
inker | +0.122 |
tails | +0.119 |
communicate | +0.117 |
listen | +0.111 |
Neg logit contributions | |
million | -0.132 |
endant | -0.120 |
dark | -0.119 |
piping | -0.116 |
seventy | -0.114 |
Token | very |
Token ID | 845 |
Feature activation | +2.75e-02 |
Pos logit contributions | |
sound | +0.032 |
inker | +0.026 |
listen | +0.026 |
do | +0.025 |
communicate | +0.024 |
Neg logit contributions | |
piping | -0.041 |
million | -0.039 |
endant | -0.039 |
pleasure | -0.038 |
brand | -0.037 |
Token | happy |
Token ID | 3772 |
Feature activation | +2.63e-03 |
Pos logit contributions | |
sound | +0.047 |
tails | +0.043 |
inker | +0.041 |
ards | +0.040 |
listen | +0.040 |
Neg logit contributions | |
piping | -0.039 |
million | -0.037 |
pleasure | -0.037 |
endant | -0.036 |
brand | -0.036 |
Token | and |
Token ID | 290 |
Feature activation | +5.09e-03 |
Pos logit contributions | |
sound | +0.003 |
tails | +0.003 |
communicate | +0.003 |
inker | +0.003 |
ards | +0.003 |
Neg logit contributions | |
joy | -0.005 |
million | -0.004 |
pleasure | -0.004 |
endant | -0.004 |
umm | -0.004 |
Token | excited |
Token ID | 6568 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
inker | +0.008 |
communicate | +0.008 |
sound | +0.008 |
ix | +0.007 |
ably | +0.007 |
Neg logit contributions | |
brand | -0.007 |
pleasure | -0.007 |
million | -0.007 |
freshly | -0.007 |
piping | -0.006 |
Token | she |
Token ID | 673 |
Feature activation | -3.50e-05 |
Pos logit contributions | |
sound | +0.014 |
inker | +0.011 |
communicate | +0.011 |
do | +0.011 |
behave | +0.010 |
Neg logit contributions | |
piping | -0.018 |
endant | -0.017 |
million | -0.017 |
freshly | -0.016 |
dark | -0.016 |
Token | said |
Token ID | 531 |
Feature activation | -8.99e-03 |
Pos logit contributions | |
endant | +0.000 |
piping | +0.000 |
million | +0.000 |
dark | +0.000 |
brand | +0.000 |
Neg logit contributions | |
sound | -0.000 |
ourselves | -0.000 |
inker | -0.000 |
ising | -0.000 |
communicate | -0.000 |
Token | ." |
Token ID | 526 |
Feature activation | +6.52e-03 |
Pos logit contributions | |
piping | +0.014 |
pleasure | +0.013 |
brand | +0.013 |
imet | +0.012 |
endant | +0.012 |
Neg logit contributions | |
inker | -0.013 |
sound | -0.013 |
communicate | -0.012 |
ani | -0.011 |
ards | -0.011 |
Token | But |
Token ID | 1537 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
sound | +0.012 |
do | +0.010 |
listen | +0.010 |
listened | +0.010 |
her | +0.010 |
Neg logit contributions | |
ocol | -0.011 |
endant | -0.010 |
piping | -0.010 |
umm | -0.010 |
igsaw | -0.010 |
Token | why |
Token ID | 1521 |
Feature activation | +4.57e-02 |
Pos logit contributions | |
sound | +0.023 |
inker | +0.021 |
communicate | +0.020 |
tails | +0.019 |
do | +0.019 |
Neg logit contributions | |
piping | -0.018 |
million | -0.017 |
pleasure | -0.017 |
endant | -0.016 |
irst | -0.016 |
Token | does |
Token ID | 857 |
Feature activation | +8.71e-02 |
Pos logit contributions | |
sound | +0.061 |
tails | +0.058 |
inker | +0.055 |
communicate | +0.052 |
ani | +0.049 |
Neg logit contributions | |
million | -0.078 |
piping | -0.076 |
freshly | -0.074 |
endant | -0.073 |
dark | -0.072 |
Token | it |
Token ID | 340 |
Feature activation | +1.97e-02 |
Pos logit contributions | |
sound | +0.135 |
ably | +0.129 |
inker | +0.118 |
heads | +0.116 |
k | +0.115 |
Neg logit contributions | |
million | -0.135 |
piping | -0.131 |
igsaw | -0.124 |
There | -0.119 |
brand | -0.116 |
Token | have |
Token ID | 423 |
Feature activation | -6.63e-03 |
Pos logit contributions | |
ably | +0.025 |
inker | +0.024 |
gging | +0.024 |
sound | +0.024 |
gg | +0.023 |
Neg logit contributions | |
dark | -0.031 |
million | -0.030 |
endant | -0.028 |
There | -0.027 |
run | -0.027 |
Token | a |
Token ID | 257 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
million | +0.012 |
endant | +0.011 |
piping | +0.011 |
pleasure | +0.010 |
freshly | +0.010 |
Neg logit contributions | |
sound | -0.009 |
inker | -0.008 |
ising | -0.008 |
ably | -0.008 |
ek | -0.007 |
Token | mask |
Token ID | 9335 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
sound | +0.015 |
listened | +0.011 |
do | +0.011 |
listen | +0.011 |
inker | +0.011 |
Neg logit contributions | |
piping | -0.019 |
endant | -0.018 |
million | -0.018 |
ocol | -0.017 |
imet | -0.017 |
Token | on |
Token ID | 319 |
Feature activation | -9.74e-03 |
Pos logit contributions | |
tails | +0.035 |
sound | +0.034 |
ani | +0.034 |
inker | +0.034 |
heads | +0.033 |
Neg logit contributions | |
brand | -0.035 |
dark | -0.033 |
million | -0.033 |
There | -0.033 |
endant | -0.032 |
Token |
|
Token ID | 198 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
sound | +0.014 |
not | +0.012 |
do | +0.012 |
each | +0.012 |
when | +0.011 |
Neg logit contributions | |
endant | -0.026 |
ocol | -0.026 |
umm | -0.025 |
igsaw | -0.025 |
brand | -0.024 |
Token |
|
Token ID | 198 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
umm | +0.031 |
ocol | +0.028 |
endant | +0.027 |
igsaw | +0.026 |
piping | +0.026 |
Neg logit contributions | |
sound | -0.017 |
not | -0.016 |
do | -0.015 |
listen | -0.014 |
each | -0.013 |
Token | When |
Token ID | 2215 |
Feature activation | +4.58e-02 |
Pos logit contributions | |
piping | +0.020 |
endant | +0.020 |
million | +0.019 |
ocol | +0.019 |
dark | +0.018 |
Neg logit contributions | |
sound | -0.018 |
do | -0.014 |
listen | -0.013 |
listened | -0.013 |
inker | -0.013 |
Token | Mom |
Token ID | 11254 |
Feature activation | +2.69e-02 |
Pos logit contributions | |
sound | +0.062 |
do | +0.045 |
listen | +0.043 |
listened | +0.043 |
inker | +0.042 |
Neg logit contributions | |
piping | -0.091 |
endant | -0.089 |
million | -0.087 |
ocol | -0.085 |
imet | -0.083 |
Token | is |
Token ID | 318 |
Feature activation | +3.33e-02 |
Pos logit contributions | |
sound | +0.045 |
do | +0.034 |
listen | +0.034 |
listened | +0.034 |
not | +0.033 |
Neg logit contributions | |
piping | -0.045 |
endant | -0.044 |
million | -0.043 |
ocol | -0.042 |
imet | -0.041 |
Token | busy |
Token ID | 8179 |
Feature activation | +8.70e-02 |
Pos logit contributions | |
sound | +0.041 |
do | +0.030 |
listen | +0.029 |
tails | +0.029 |
inker | +0.029 |
Neg logit contributions | |
piping | -0.067 |
endant | -0.064 |
million | -0.063 |
ocol | -0.061 |
freshly | -0.060 |
Token | in |
Token ID | 287 |
Feature activation | -7.46e-04 |
Pos logit contributions | |
sound | +0.129 |
inker | +0.104 |
tails | +0.101 |
ably | +0.098 |
communicate | +0.098 |
Neg logit contributions | |
� | -0.142 |
ocol | -0.142 |
piping | -0.142 |
million | -0.139 |
igsaw | -0.136 |
Token | the |
Token ID | 262 |
Feature activation | +1.95e-02 |
Pos logit contributions | |
piping | +0.002 |
million | +0.002 |
ocol | +0.002 |
endant | +0.002 |
freshly | +0.002 |
Neg logit contributions | |
sound | -0.001 |
listened | -0.001 |
listen | -0.001 |
do | -0.001 |
inker | -0.000 |
Token | kitchen |
Token ID | 9592 |
Feature activation | +4.59e-02 |
Pos logit contributions | |
sound | +0.036 |
do | +0.029 |
listen | +0.028 |
listened | +0.027 |
not | +0.027 |
Neg logit contributions | |
endant | -0.031 |
piping | -0.031 |
ocol | -0.030 |
million | -0.029 |
imet | -0.028 |
Token | , |
Token ID | 11 |
Feature activation | +6.28e-03 |
Pos logit contributions | |
sound | +0.069 |
communicate | +0.060 |
inker | +0.058 |
ably | +0.057 |
tails | +0.056 |
Neg logit contributions | |
piping | -0.076 |
million | -0.076 |
There | -0.071 |
� | -0.070 |
umm | -0.069 |
Token | they |
Token ID | 484 |
Feature activation | +2.93e-02 |
Pos logit contributions | |
sound | +0.011 |
inker | +0.010 |
tails | +0.009 |
communicate | +0.009 |
ably | +0.009 |
Neg logit contributions | |
piping | -0.009 |
freshly | -0.008 |
camps | -0.008 |
million | -0.008 |
endant | -0.008 |
Token | it |
Token ID | 340 |
Feature activation | -3.39e-02 |
Pos logit contributions | |
piping | +0.066 |
endant | +0.066 |
ocol | +0.064 |
million | +0.064 |
imet | +0.062 |
Neg logit contributions | |
sound | -0.033 |
do | -0.023 |
listen | -0.022 |
listened | -0.021 |
behave | -0.020 |
Token | ! |
Token ID | 0 |
Feature activation | +3.81e-03 |
Pos logit contributions | |
endant | +0.061 |
million | +0.059 |
camps | +0.058 |
piping | +0.056 |
brand | +0.056 |
Neg logit contributions | |
sound | -0.049 |
listen | -0.037 |
inker | -0.037 |
communicate | -0.036 |
do | -0.035 |
Token |
|
Token ID | 198 |
Feature activation | -8.59e-03 |
Pos logit contributions | |
sound | +0.005 |
not | +0.004 |
do | +0.004 |
listen | +0.004 |
each | +0.004 |
Neg logit contributions | |
endant | -0.007 |
ocol | -0.007 |
piping | -0.007 |
umm | -0.007 |
dark | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | -8.41e-03 |
Pos logit contributions | |
umm | +0.017 |
endant | +0.016 |
ocol | +0.016 |
piping | +0.015 |
igsaw | +0.015 |
Neg logit contributions | |
sound | -0.013 |
do | -0.012 |
not | -0.011 |
listen | -0.010 |
listened | -0.010 |
Token | R |
Token ID | 49 |
Feature activation | +3.79e-02 |
Pos logit contributions | |
piping | +0.014 |
endant | +0.014 |
million | +0.013 |
ocol | +0.013 |
umm | +0.013 |
Neg logit contributions | |
sound | -0.014 |
do | -0.011 |
listen | -0.011 |
listened | -0.011 |
not | -0.010 |
Token | over |
Token ID | 2502 |
Feature activation | +8.68e-02 |
Pos logit contributions | |
sound | +0.062 |
do | +0.047 |
listen | +0.046 |
listened | +0.046 |
not | +0.045 |
Neg logit contributions | |
endant | -0.064 |
piping | -0.064 |
ocol | -0.063 |
million | -0.061 |
imet | -0.060 |
Token | was |
Token ID | 373 |
Feature activation | +2.36e-02 |
Pos logit contributions | |
sound | +0.122 |
inker | +0.107 |
communicate | +0.105 |
tails | +0.105 |
listen | +0.102 |
Neg logit contributions | |
million | -0.143 |
endant | -0.139 |
piping | -0.133 |
dark | -0.130 |
seventy | -0.129 |
Token | so |
Token ID | 523 |
Feature activation | +2.17e-02 |
Pos logit contributions | |
sound | +0.031 |
listen | +0.023 |
do | +0.023 |
inker | +0.022 |
listened | +0.021 |
Neg logit contributions | |
piping | -0.047 |
endant | -0.046 |
million | -0.045 |
pleasure | -0.043 |
ocol | -0.043 |
Token | happy |
Token ID | 3772 |
Feature activation | +6.95e-03 |
Pos logit contributions | |
sound | +0.037 |
listen | +0.030 |
do | +0.029 |
tails | +0.029 |
inker | +0.029 |
Neg logit contributions | |
piping | -0.034 |
endant | -0.033 |
million | -0.032 |
pleasure | -0.030 |
dark | -0.029 |
Token | he |
Token ID | 339 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
sound | +0.010 |
communicate | +0.008 |
inker | +0.008 |
tails | +0.008 |
behave | +0.008 |
Neg logit contributions | |
joy | -0.012 |
endant | -0.011 |
imet | -0.011 |
million | -0.011 |
camps | -0.011 |
Token | had |
Token ID | 550 |
Feature activation | -4.33e-02 |
Pos logit contributions | |
million | +0.016 |
endant | +0.015 |
dark | +0.014 |
freshly | +0.014 |
piping | +0.014 |
Neg logit contributions | |
sound | -0.020 |
communicate | -0.017 |
inker | -0.016 |
listen | -0.016 |
ics | -0.016 |
Token | !" |
Token ID | 2474 |
Feature activation | +3.48e-02 |
Pos logit contributions | |
sound | +0.000 |
inker | +0.000 |
listened | +0.000 |
tails | +0.000 |
communicate | +0.000 |
Neg logit contributions | |
million | -0.000 |
piping | -0.000 |
endant | -0.000 |
camps | -0.000 |
pleasure | -0.000 |
Token | one |
Token ID | 530 |
Feature activation | +6.27e-02 |
Pos logit contributions | |
sound | +0.058 |
ably | +0.052 |
tails | +0.052 |
ics | +0.050 |
inker | +0.050 |
Neg logit contributions | |
There | -0.052 |
piping | -0.050 |
million | -0.048 |
endant | -0.048 |
Some | -0.046 |
Token | of |
Token ID | 286 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
sound | +0.125 |
behave | +0.110 |
listen | +0.109 |
communicate | +0.108 |
ics | +0.107 |
Neg logit contributions | |
piping | -0.073 |
million | -0.070 |
endant | -0.067 |
dark | -0.063 |
ocol | -0.061 |
Token | the |
Token ID | 262 |
Feature activation | +2.19e-02 |
Pos logit contributions | |
sound | +0.021 |
do | +0.015 |
listened | +0.015 |
listen | +0.014 |
behave | +0.013 |
Neg logit contributions | |
piping | -0.035 |
ocol | -0.034 |
endant | -0.034 |
million | -0.034 |
freshly | -0.032 |
Token | fire |
Token ID | 2046 |
Feature activation | +4.04e-02 |
Pos logit contributions | |
sound | +0.037 |
do | +0.030 |
listen | +0.030 |
listened | +0.030 |
inker | +0.029 |
Neg logit contributions | |
piping | -0.034 |
endant | -0.033 |
million | -0.033 |
ocol | -0.032 |
camps | -0.031 |
Token | men |
Token ID | 3653 |
Feature activation | +8.68e-02 |
Pos logit contributions | |
sound | +0.058 |
behave | +0.055 |
listen | +0.054 |
inker | +0.054 |
her | +0.053 |
Neg logit contributions | |
million | -0.060 |
piping | -0.058 |
endant | -0.058 |
camps | -0.056 |
dark | -0.056 |
Token | said |
Token ID | 531 |
Feature activation | -9.51e-03 |
Pos logit contributions | |
sound | +0.099 |
inker | +0.083 |
behave | +0.077 |
ising | +0.076 |
listen | +0.076 |
Neg logit contributions | |
million | -0.161 |
piping | -0.157 |
umbs | -0.152 |
berry | -0.149 |
There | -0.148 |
Token | . |
Token ID | 13 |
Feature activation | +1.64e-02 |
Pos logit contributions | |
piping | +0.016 |
imet | +0.016 |
endant | +0.016 |
joy | +0.016 |
ocol | +0.015 |
Neg logit contributions | |
sound | -0.013 |
inker | -0.011 |
behave | -0.010 |
do | -0.010 |
communicate | -0.010 |
Token | " |
Token ID | 366 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
sound | +0.028 |
do | +0.023 |
listened | +0.022 |
listen | +0.022 |
not | +0.022 |
Neg logit contributions | |
piping | -0.027 |
endant | -0.027 |
ocol | -0.026 |
million | -0.025 |
umm | -0.025 |
Token | Did |
Token ID | 11633 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
sound | +0.023 |
do | +0.018 |
listen | +0.017 |
listened | +0.017 |
not | +0.016 |
Neg logit contributions | |
piping | -0.028 |
endant | -0.028 |
million | -0.027 |
ocol | -0.027 |
dark | -0.026 |
Token | you |
Token ID | 345 |
Feature activation | +1.11e-03 |
Pos logit contributions | |
sound | +0.021 |
inker | +0.017 |
ably | +0.017 |
tails | +0.015 |
ising | +0.015 |
Neg logit contributions | |
endant | -0.021 |
ocol | -0.020 |
piping | -0.020 |
million | -0.020 |
imet | -0.020 |
Token | smile |
Token ID | 8212 |
Feature activation | -4.32e-02 |
Pos logit contributions | |
pleasure | +0.006 |
piping | +0.006 |
million | +0.006 |
freshly | +0.006 |
brand | +0.005 |
Neg logit contributions | |
inker | -0.005 |
ably | -0.004 |
sound | -0.004 |
ix | -0.004 |
gg | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -1.27e-03 |
Pos logit contributions | |
million | +0.061 |
brand | +0.059 |
ifying | +0.059 |
asleep | +0.058 |
joy | +0.057 |
Neg logit contributions | |
obey | -0.063 |
sound | -0.063 |
inker | -0.061 |
prove | -0.061 |
ics | -0.060 |
Token | As |
Token ID | 1081 |
Feature activation | +5.97e-02 |
Pos logit contributions | |
endant | +0.002 |
ocol | +0.002 |
piping | +0.002 |
million | +0.002 |
umm | +0.002 |
Neg logit contributions | |
sound | -0.002 |
do | -0.002 |
not | -0.002 |
listened | -0.002 |
listen | -0.002 |
Token | he |
Token ID | 339 |
Feature activation | +2.37e-02 |
Pos logit contributions | |
sound | +0.085 |
inker | +0.067 |
ics | +0.065 |
do | +0.065 |
behave | +0.064 |
Neg logit contributions | |
million | -0.106 |
piping | -0.105 |
camps | -0.101 |
ocol | -0.099 |
endant | -0.098 |
Token | r |
Token ID | 374 |
Feature activation | +4.96e-02 |
Pos logit contributions | |
sound | +0.036 |
inker | +0.029 |
not | +0.029 |
listen | +0.028 |
ics | +0.027 |
Neg logit contributions | |
endant | -0.038 |
million | -0.038 |
camps | -0.037 |
piping | -0.037 |
dark | -0.036 |
Token | ained |
Token ID | 1328 |
Feature activation | +8.65e-02 |
Pos logit contributions | |
sound | +0.092 |
do | +0.078 |
listen | +0.077 |
not | +0.071 |
listened | +0.070 |
Neg logit contributions | |
endant | -0.074 |
piping | -0.071 |
million | -0.069 |
ocol | -0.069 |
umm | -0.068 |
Token | he |
Token ID | 339 |
Feature activation | +4.81e-03 |
Pos logit contributions | |
sound | +0.105 |
tails | +0.086 |
inker | +0.081 |
listen | +0.080 |
communicate | +0.080 |
Neg logit contributions | |
million | -0.163 |
imet | -0.159 |
ocol | -0.156 |
piping | -0.155 |
� | -0.153 |
Token | said |
Token ID | 531 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
sound | +0.008 |
inker | +0.007 |
ics | +0.006 |
ising | +0.006 |
listen | +0.006 |
Neg logit contributions | |
million | -0.007 |
endant | -0.007 |
dark | -0.007 |
imet | -0.006 |
camps | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +8.12e-03 |
Pos logit contributions | |
piping | +0.029 |
million | +0.027 |
brand | +0.027 |
imet | +0.027 |
pleasure | +0.026 |
Neg logit contributions | |
sound | -0.028 |
tails | -0.025 |
inker | -0.024 |
ising | -0.023 |
ably | -0.023 |
Token | " |
Token ID | 366 |
Feature activation | -6.27e-03 |
Pos logit contributions | |
sound | +0.012 |
inker | +0.011 |
tails | +0.011 |
ics | +0.011 |
ably | +0.010 |
Neg logit contributions | |
million | -0.013 |
imet | -0.013 |
piping | -0.012 |
There | -0.012 |
joy | -0.012 |
Token | Hi |
Token ID | 17250 |
Feature activation | -5.47e-02 |
Pos logit contributions | |
piping | +0.010 |
endant | +0.009 |
million | +0.009 |
ocol | +0.009 |
umm | +0.009 |
Neg logit contributions | |
sound | -0.011 |
do | -0.009 |
listen | -0.009 |
listened | -0.009 |
not | -0.009 |
Token | keep |
Token ID | 1394 |
Feature activation | +2.15e-03 |
Pos logit contributions | |
million | +0.010 |
piping | +0.009 |
imet | +0.009 |
ocol | +0.009 |
camps | +0.009 |
Neg logit contributions | |
sound | -0.011 |
ably | -0.009 |
listened | -0.008 |
ising | -0.008 |
communicate | -0.008 |
Token | going |
Token ID | 1016 |
Feature activation | +1.80e-03 |
Pos logit contributions | |
sound | +0.003 |
ably | +0.003 |
inker | +0.002 |
communicate | +0.002 |
listened | +0.002 |
Neg logit contributions | |
ocol | -0.003 |
piping | -0.003 |
freshly | -0.003 |
million | -0.003 |
brand | -0.003 |
Token | ." |
Token ID | 526 |
Feature activation | +3.46e-03 |
Pos logit contributions | |
sound | +0.003 |
listened | +0.002 |
do | +0.002 |
communicate | +0.002 |
inker | +0.002 |
Neg logit contributions | |
endant | -0.003 |
million | -0.003 |
piping | -0.003 |
camps | -0.003 |
imet | -0.003 |
Token | Max |
Token ID | 5436 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
sound | +0.008 |
do | +0.006 |
listen | +0.006 |
listened | +0.006 |
behave | +0.006 |
Neg logit contributions | |
piping | -0.004 |
endant | -0.004 |
million | -0.003 |
imet | -0.003 |
ocol | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +1.68e-02 |
Pos logit contributions | |
sound | +0.049 |
ourselves | +0.048 |
inker | +0.047 |
ics | +0.046 |
communicate | +0.044 |
Neg logit contributions | |
berry | -0.049 |
imet | -0.048 |
endant | -0.048 |
pad | -0.048 |
million | -0.048 |
Token | Scot |
Token ID | 7130 |
Feature activation | +8.64e-02 |
Pos logit contributions | |
sound | +0.034 |
ably | +0.032 |
ising | +0.031 |
ics | +0.030 |
communicate | +0.030 |
Neg logit contributions | |
Bub | -0.015 |
camps | -0.014 |
imet | -0.014 |
run | -0.014 |
million | -0.014 |
Token | ty |
Token ID | 774 |
Feature activation | +4.97e-02 |
Pos logit contributions | |
sound | +0.136 |
music | +0.120 |
early | +0.114 |
do | +0.113 |
poses | +0.113 |
Neg logit contributions | |
mo | -0.110 |
irst | -0.107 |
million | -0.097 |
Em | -0.097 |
omed | -0.097 |
Token | kept |
Token ID | 4030 |
Feature activation | +1.77e-02 |
Pos logit contributions | |
sound | +0.083 |
inker | +0.070 |
ourselves | +0.064 |
yourself | +0.063 |
communicate | +0.063 |
Neg logit contributions | |
berry | -0.063 |
endant | -0.063 |
million | -0.063 |
camps | -0.062 |
� | -0.062 |
Token | walking |
Token ID | 6155 |
Feature activation | +6.79e-04 |
Pos logit contributions | |
sound | +0.030 |
ably | +0.026 |
inker | +0.025 |
ics | +0.024 |
do | +0.024 |
Neg logit contributions | |
joy | -0.024 |
freshly | -0.024 |
piping | -0.023 |
camps | -0.022 |
million | -0.022 |
Token | , |
Token ID | 11 |
Feature activation | +4.86e-03 |
Pos logit contributions | |
sound | +0.001 |
ics | +0.001 |
listened | +0.001 |
w | +0.001 |
disob | +0.001 |
Neg logit contributions | |
camps | -0.001 |
joy | -0.001 |
pleasure | -0.001 |
million | -0.001 |
brand | -0.001 |
Token | but |
Token ID | 475 |
Feature activation | +7.60e-03 |
Pos logit contributions | |
sound | +0.008 |
inker | +0.008 |
ics | +0.007 |
communicate | +0.007 |
ister | +0.007 |
Neg logit contributions | |
joy | -0.007 |
freshly | -0.006 |
brand | -0.006 |
Once | -0.006 |
imet | -0.006 |
Token | air |
Token ID | 1633 |
Feature activation | +3.36e-02 |
Pos logit contributions | |
sound | +0.008 |
do | +0.007 |
listen | +0.007 |
listened | +0.007 |
inker | +0.006 |
Neg logit contributions | |
piping | -0.007 |
endant | -0.007 |
million | -0.007 |
ocol | -0.007 |
umm | -0.007 |
Token | is |
Token ID | 318 |
Feature activation | +1.58e-02 |
Pos logit contributions | |
inker | +0.053 |
sound | +0.050 |
tails | +0.047 |
communicate | +0.045 |
ably | +0.045 |
Neg logit contributions | |
million | -0.052 |
freshly | -0.048 |
piping | -0.047 |
endant | -0.047 |
dark | -0.046 |
Token | so |
Token ID | 523 |
Feature activation | +6.75e-03 |
Pos logit contributions | |
sound | +0.022 |
inker | +0.018 |
do | +0.017 |
listen | +0.017 |
listened | +0.017 |
Neg logit contributions | |
piping | -0.029 |
million | -0.029 |
endant | -0.029 |
ocol | -0.027 |
freshly | -0.027 |
Token | cool |
Token ID | 3608 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
sound | +0.011 |
inker | +0.010 |
tails | +0.009 |
communicate | +0.009 |
ably | +0.009 |
Neg logit contributions | |
million | -0.011 |
piping | -0.011 |
endant | -0.011 |
freshly | -0.010 |
ocol | -0.010 |
Token | ." |
Token ID | 526 |
Feature activation | +6.39e-03 |
Pos logit contributions | |
million | +0.023 |
piping | +0.022 |
umm | +0.022 |
endant | +0.022 |
imet | +0.021 |
Neg logit contributions | |
sound | -0.019 |
communicate | -0.016 |
inker | -0.016 |
tails | -0.015 |
listened | -0.015 |
Token | Mut |
Token ID | 13859 |
Feature activation | +8.63e-02 |
Pos logit contributions | |
sound | +0.013 |
do | +0.011 |
listen | +0.011 |
listened | +0.011 |
not | +0.011 |
Neg logit contributions | |
piping | -0.008 |
endant | -0.008 |
ocol | -0.008 |
million | -0.008 |
umm | -0.007 |
Token | t |
Token ID | 83 |
Feature activation | +4.80e-02 |
Pos logit contributions | |
sound | +0.149 |
tails | +0.133 |
listen | +0.129 |
her | +0.128 |
heads | +0.127 |
Neg logit contributions | |
million | -0.120 |
piping | -0.108 |
dark | -0.106 |
oke | -0.102 |
endant | -0.100 |
Token | was |
Token ID | 373 |
Feature activation | +2.48e-02 |
Pos logit contributions | |
sound | +0.075 |
tails | +0.061 |
listen | +0.061 |
communicate | +0.061 |
ics | +0.059 |
Neg logit contributions | |
million | -0.077 |
ocol | -0.074 |
piping | -0.074 |
dark | -0.071 |
endant | -0.070 |
Token | then |
Token ID | 788 |
Feature activation | -6.98e-03 |
Pos logit contributions | |
sound | +0.036 |
inker | +0.031 |
listen | +0.029 |
tails | +0.028 |
ising | +0.028 |
Neg logit contributions | |
piping | -0.042 |
million | -0.041 |
endant | -0.040 |
freshly | -0.039 |
brand | -0.039 |
Token | more |
Token ID | 517 |
Feature activation | +5.08e-02 |
Pos logit contributions | |
piping | +0.011 |
million | +0.011 |
freshly | +0.011 |
brand | +0.010 |
joy | +0.010 |
Neg logit contributions | |
sound | -0.010 |
inker | -0.010 |
ics | -0.009 |
tails | -0.009 |
ably | -0.008 |
Token | relaxed |
Token ID | 18397 |
Feature activation | +3.75e-02 |
Pos logit contributions | |
sound | +0.074 |
listen | +0.061 |
inker | +0.061 |
tails | +0.060 |
ics | +0.059 |
Neg logit contributions | |
piping | -0.091 |
million | -0.087 |
ocol | -0.086 |
endant | -0.084 |
joy | -0.083 |
Token | , |
Token ID | 11 |
Feature activation | -3.73e-03 |
Pos logit contributions | |
sound | +0.022 |
behave | +0.020 |
obey | +0.020 |
listen | +0.018 |
disob | +0.018 |
Neg logit contributions | |
piping | -0.025 |
brand | -0.025 |
endant | -0.024 |
ocol | -0.024 |
million | -0.024 |
Token | drawing |
Token ID | 8263 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
piping | +0.006 |
endant | +0.006 |
brand | +0.006 |
There | +0.006 |
million | +0.006 |
Neg logit contributions | |
sound | -0.005 |
inker | -0.005 |
ek | -0.004 |
ably | -0.004 |
ising | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -4.62e-03 |
Pos logit contributions | |
sound | +0.024 |
behave | +0.021 |
obey | +0.021 |
listened | +0.021 |
listen | +0.021 |
Neg logit contributions | |
piping | -0.025 |
million | -0.025 |
dark | -0.024 |
brand | -0.024 |
endant | -0.024 |
Token | and |
Token ID | 290 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
piping | +0.008 |
endant | +0.008 |
million | +0.007 |
camps | +0.007 |
There | +0.007 |
Neg logit contributions | |
sound | -0.006 |
inker | -0.006 |
ek | -0.005 |
ably | -0.005 |
ising | -0.005 |
Token | doing |
Token ID | 1804 |
Feature activation | +4.65e-02 |
Pos logit contributions | |
sound | +0.015 |
inker | +0.013 |
ably | +0.013 |
oo | +0.012 |
ek | +0.012 |
Neg logit contributions | |
piping | -0.020 |
million | -0.019 |
endant | -0.018 |
freshly | -0.018 |
ocol | -0.018 |
Token | experiments |
Token ID | 10256 |
Feature activation | +8.58e-02 |
Pos logit contributions | |
w | +0.071 |
sound | +0.069 |
bye | +0.067 |
oo | +0.064 |
listened | +0.063 |
Neg logit contributions | |
brand | -0.070 |
piping | -0.065 |
igsaw | -0.061 |
million | -0.061 |
ocol | -0.060 |
Token | . |
Token ID | 13 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
sound | +0.130 |
w | +0.115 |
tails | +0.113 |
ani | +0.112 |
inker | +0.112 |
Neg logit contributions | |
piping | -0.117 |
dark | -0.117 |
brand | -0.117 |
million | -0.116 |
There | -0.115 |
Token | Lily |
Token ID | 20037 |
Feature activation | +7.61e-03 |
Pos logit contributions | |
sound | +0.013 |
not | +0.012 |
do | +0.011 |
when | +0.011 |
each | +0.011 |
Neg logit contributions | |
endant | -0.028 |
ocol | -0.027 |
tal | -0.025 |
piping | -0.025 |
million | -0.025 |
Token | and |
Token ID | 290 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
sound | +0.012 |
communicate | +0.008 |
inker | +0.008 |
oo | +0.008 |
tails | +0.008 |
Neg logit contributions | |
endant | -0.013 |
camps | -0.012 |
imet | -0.012 |
piping | -0.012 |
Wouldn | -0.012 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.01e-02 |
Pos logit contributions | |
sound | +0.047 |
inker | +0.041 |
ising | +0.041 |
ably | +0.040 |
izes | +0.039 |
Neg logit contributions | |
piping | -0.014 |
There | -0.014 |
berries | -0.014 |
joy | -0.013 |
imet | -0.013 |
Token | want |
Token ID | 765 |
Feature activation | +5.50e-04 |
Pos logit contributions | |
sound | +0.081 |
oo | +0.071 |
inker | +0.070 |
ister | +0.066 |
ggy | +0.061 |
Neg logit contributions | |
piping | -0.079 |
pleasure | -0.071 |
There | -0.070 |
dark | -0.068 |
freshly | -0.068 |
Token | . |
Token ID | 13 |
Feature activation | +3.10e-03 |
Pos logit contributions | |
endant | +0.030 |
piping | +0.029 |
million | +0.028 |
ocol | +0.028 |
freshly | +0.027 |
Neg logit contributions | |
sound | -0.016 |
inker | -0.011 |
listen | -0.011 |
listened | -0.011 |
communicate | -0.010 |
Token | Mom |
Token ID | 11254 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
sound | +0.005 |
do | +0.004 |
listen | +0.004 |
not | +0.003 |
listened | +0.003 |
Neg logit contributions | |
endant | -0.006 |
piping | -0.006 |
million | -0.005 |
ocol | -0.005 |
igsaw | -0.005 |
Token | says |
Token ID | 1139 |
Feature activation | -2.49e-02 |
Pos logit contributions | |
sound | +0.022 |
do | +0.016 |
listen | +0.016 |
listened | +0.015 |
inker | +0.015 |
Neg logit contributions | |
piping | -0.026 |
endant | -0.026 |
million | -0.025 |
ocol | -0.024 |
camps | -0.024 |
Token | they |
Token ID | 484 |
Feature activation | -2.12e-03 |
Pos logit contributions | |
piping | +0.057 |
endant | +0.057 |
million | +0.055 |
ocol | +0.055 |
imet | +0.053 |
Neg logit contributions | |
sound | -0.026 |
do | -0.017 |
listen | -0.016 |
listened | -0.016 |
inker | -0.015 |
Token | are |
Token ID | 389 |
Feature activation | +4.15e-03 |
Pos logit contributions | |
piping | +0.003 |
endant | +0.003 |
million | +0.003 |
ocol | +0.003 |
umm | +0.003 |
Neg logit contributions | |
sound | -0.004 |
do | -0.003 |
listen | -0.003 |
listened | -0.003 |
not | -0.003 |
Token | av |
Token ID | 1196 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
sound | +0.005 |
do | +0.004 |
listen | +0.004 |
listened | +0.004 |
not | +0.004 |
Neg logit contributions | |
piping | -0.009 |
endant | -0.008 |
million | -0.008 |
ocol | -0.008 |
umm | -0.008 |
Token | oc |
Token ID | 420 |
Feature activation | -4.89e-02 |
Pos logit contributions | |
piping | +0.130 |
endant | +0.129 |
dark | +0.118 |
imet | +0.118 |
ocol | +0.117 |
Neg logit contributions | |
sound | -0.231 |
tails | -0.196 |
do | -0.194 |
listen | -0.191 |
listened | -0.191 |
Token | ados |
Token ID | 22484 |
Feature activation | -2.80e-02 |
Pos logit contributions | |
ocol | +0.045 |
endant | +0.044 |
umm | +0.044 |
imet | +0.040 |
piping | +0.039 |
Neg logit contributions | |
sound | -0.121 |
do | -0.106 |
listen | -0.101 |
listened | -0.099 |
behave | -0.098 |
Token | . |
Token ID | 13 |
Feature activation | +4.52e-03 |
Pos logit contributions | |
endant | +0.049 |
camps | +0.045 |
piping | +0.044 |
million | +0.044 |
freshly | +0.044 |
Neg logit contributions | |
sound | -0.044 |
inker | -0.034 |
gging | -0.032 |
listened | -0.032 |
communicate | -0.031 |
Token | Sara |
Token ID | 24799 |
Feature activation | +1.64e-02 |
Pos logit contributions | |
sound | +0.007 |
do | +0.006 |
not | +0.005 |
listen | +0.005 |
her | +0.005 |
Neg logit contributions | |
endant | -0.008 |
piping | -0.008 |
ocol | -0.008 |
million | -0.008 |
igsaw | -0.008 |
Token | wants |
Token ID | 3382 |
Feature activation | -5.16e-03 |
Pos logit contributions | |
sound | +0.026 |
listen | +0.018 |
inker | +0.017 |
listened | +0.017 |
do | +0.017 |
Neg logit contributions | |
endant | -0.029 |
piping | -0.029 |
imet | -0.027 |
million | -0.027 |
camps | -0.027 |
Token | the |
Token ID | 262 |
Feature activation | -2.65e-02 |
Pos logit contributions | |
sound | +0.015 |
do | +0.010 |
not | +0.010 |
listen | +0.009 |
listened | +0.009 |
Neg logit contributions | |
endant | -0.032 |
piping | -0.032 |
ocol | -0.032 |
million | -0.031 |
imet | -0.030 |
Token | prett |
Token ID | 46442 |
Feature activation | -2.23e-02 |
Pos logit contributions | |
piping | +0.044 |
endant | +0.041 |
million | +0.040 |
umm | +0.040 |
pleasure | +0.039 |
Neg logit contributions | |
sound | -0.043 |
listened | -0.035 |
inker | -0.035 |
listen | -0.034 |
do | -0.034 |
Token | iest |
Token ID | 6386 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
piping | +0.037 |
endant | +0.037 |
ocol | +0.035 |
million | +0.035 |
umm | +0.034 |
Neg logit contributions | |
sound | -0.038 |
do | -0.030 |
listen | -0.029 |
listened | -0.029 |
not | -0.028 |
Token | a |
Token ID | 257 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
piping | +0.023 |
endant | +0.023 |
ocol | +0.022 |
million | +0.022 |
umm | +0.021 |
Neg logit contributions | |
sound | -0.025 |
do | -0.020 |
listen | -0.020 |
listened | -0.019 |
not | -0.019 |
Token | pron |
Token ID | 31186 |
Feature activation | -4.22e-03 |
Pos logit contributions | |
ocol | +0.023 |
endant | +0.023 |
umbs | +0.022 |
irst | +0.021 |
piping | +0.021 |
Neg logit contributions | |
sound | -0.018 |
do | -0.013 |
not | -0.012 |
listen | -0.012 |
music | -0.012 |
Token | I |
Token ID | 314 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
piping | +0.007 |
million | +0.007 |
endant | +0.007 |
umm | +0.007 |
dark | +0.007 |
Neg logit contributions | |
sound | -0.006 |
inker | -0.005 |
communicate | -0.005 |
listen | -0.005 |
listened | -0.005 |
Token | have |
Token ID | 423 |
Feature activation | -5.21e-02 |
Pos logit contributions | |
piping | +0.184 |
endant | +0.182 |
million | +0.176 |
ocol | +0.174 |
umm | +0.173 |
Neg logit contributions | |
sound | -0.174 |
do | -0.145 |
listen | -0.140 |
listened | -0.138 |
not | -0.131 |
Token | ever |
Token ID | 1683 |
Feature activation | -7.34e-02 |
Pos logit contributions | |
endant | +0.094 |
piping | +0.093 |
million | +0.090 |
ocol | +0.089 |
dark | +0.087 |
Neg logit contributions | |
sound | -0.079 |
do | -0.060 |
listen | -0.059 |
listened | -0.057 |
inker | -0.056 |
Token | seen |
Token ID | 1775 |
Feature activation | -3.66e-02 |
Pos logit contributions | |
piping | +0.124 |
endant | +0.124 |
ocol | +0.118 |
million | +0.118 |
umm | +0.115 |
Neg logit contributions | |
sound | -0.121 |
do | -0.095 |
listen | -0.093 |
listened | -0.092 |
not | -0.089 |
Token | !" |
Token ID | 2474 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
piping | +0.069 |
endant | +0.068 |
million | +0.066 |
ocol | +0.066 |
umm | +0.063 |
Neg logit contributions | |
sound | -0.052 |
do | -0.040 |
listen | -0.039 |
listened | -0.038 |
not | -0.037 |
Token | exclaimed |
Token ID | 33552 |
Feature activation | -2.64e-02 |
Pos logit contributions | |
sound | +0.016 |
do | +0.012 |
listen | +0.012 |
listened | +0.011 |
not | +0.011 |
Neg logit contributions | |
piping | -0.022 |
endant | -0.022 |
million | -0.021 |
ocol | -0.021 |
umm | -0.020 |
Token | is |
Token ID | 318 |
Feature activation | +9.88e-03 |
Pos logit contributions | |
sound | +0.006 |
inker | +0.005 |
loudly | +0.005 |
ably | +0.005 |
listened | +0.005 |
Neg logit contributions | |
piping | -0.006 |
endant | -0.006 |
million | -0.006 |
bead | -0.006 |
dark | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | -2.47e-02 |
Pos logit contributions | |
sound | +0.013 |
do | +0.009 |
listen | +0.009 |
listened | +0.009 |
inker | +0.008 |
Neg logit contributions | |
piping | -0.020 |
endant | -0.020 |
million | -0.019 |
ocol | -0.019 |
dark | -0.019 |
Token | most |
Token ID | 749 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
piping | +0.042 |
endant | +0.041 |
million | +0.040 |
ocol | +0.039 |
umm | +0.039 |
Neg logit contributions | |
sound | -0.039 |
do | -0.031 |
listened | -0.031 |
listen | -0.030 |
inker | -0.029 |
Token | beautiful |
Token ID | 4950 |
Feature activation | -3.07e-02 |
Pos logit contributions | |
sound | +0.033 |
do | +0.025 |
listen | +0.024 |
listened | +0.024 |
not | +0.023 |
Neg logit contributions | |
piping | -0.037 |
endant | -0.036 |
ocol | -0.035 |
million | -0.035 |
imet | -0.034 |
Token | card |
Token ID | 2657 |
Feature activation | +2.87e-03 |
Pos logit contributions | |
piping | +0.055 |
endant | +0.054 |
million | +0.052 |
ocol | +0.052 |
umm | +0.050 |
Neg logit contributions | |
sound | -0.046 |
do | -0.036 |
listened | -0.036 |
listen | -0.035 |
not | -0.035 |
Token | I |
Token ID | 314 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
sound | +0.004 |
inker | +0.003 |
tails | +0.003 |
listen | +0.003 |
ising | +0.003 |
Neg logit contributions | |
endant | -0.005 |
piping | -0.005 |
million | -0.005 |
dark | -0.005 |
bead | -0.005 |
Token | ever |
Token ID | 1683 |
Feature activation | -7.37e-02 |
Pos logit contributions | |
piping | +0.171 |
endant | +0.170 |
ocol | +0.163 |
million | +0.160 |
dark | +0.159 |
Neg logit contributions | |
sound | -0.183 |
inker | -0.135 |
loudly | -0.134 |
do | -0.133 |
tails | -0.132 |
Token | got |
Token ID | 1392 |
Feature activation | +1.35e-03 |
Pos logit contributions | |
piping | +0.133 |
endant | +0.133 |
million | +0.128 |
ocol | +0.125 |
dark | +0.123 |
Neg logit contributions | |
sound | -0.110 |
do | -0.082 |
listen | -0.080 |
inker | -0.079 |
not | -0.079 |
Token | . |
Token ID | 13 |
Feature activation | +3.32e-04 |
Pos logit contributions | |
sound | +0.002 |
do | +0.001 |
listen | +0.001 |
listened | +0.001 |
inker | +0.001 |
Neg logit contributions | |
endant | -0.003 |
piping | -0.003 |
million | -0.003 |
ocol | -0.002 |
dark | -0.002 |
Token | You |
Token ID | 921 |
Feature activation | -3.40e-02 |
Pos logit contributions | |
sound | +0.001 |
listen | +0.000 |
do | +0.000 |
not | +0.000 |
her | +0.000 |
Neg logit contributions | |
endant | -0.001 |
million | -0.001 |
ocol | -0.001 |
piping | -0.001 |
camps | -0.001 |
Token | are |
Token ID | 389 |
Feature activation | +9.67e-04 |
Pos logit contributions | |
endant | +0.053 |
million | +0.050 |
piping | +0.049 |
pleasure | +0.048 |
dark | +0.047 |
Neg logit contributions | |
sound | -0.058 |
inker | -0.048 |
loudly | -0.045 |
ably | -0.043 |
ising | -0.043 |
Token | is |
Token ID | 318 |
Feature activation | +1.39e-02 |
Pos logit contributions | |
sound | +0.017 |
do | +0.013 |
not | +0.011 |
listened | +0.011 |
listen | +0.011 |
Neg logit contributions | |
ocol | -0.028 |
piping | -0.028 |
umm | -0.027 |
million | -0.027 |
igsaw | -0.027 |
Token | the |
Token ID | 262 |
Feature activation | -2.15e-02 |
Pos logit contributions | |
sound | +0.014 |
not | +0.010 |
do | +0.010 |
listen | +0.009 |
listened | +0.008 |
Neg logit contributions | |
piping | -0.032 |
endant | -0.032 |
ocol | -0.032 |
million | -0.032 |
umm | -0.032 |
Token | most |
Token ID | 749 |
Feature activation | +2.38e-02 |
Pos logit contributions | |
ocol | +0.038 |
piping | +0.038 |
million | +0.037 |
endant | +0.037 |
igsaw | +0.036 |
Neg logit contributions | |
sound | -0.036 |
do | -0.028 |
not | -0.026 |
listen | -0.026 |
music | -0.024 |
Token | beautiful |
Token ID | 4950 |
Feature activation | -2.66e-02 |
Pos logit contributions | |
sound | +0.033 |
do | +0.024 |
music | +0.021 |
not | +0.021 |
when | +0.019 |
Neg logit contributions | |
� | -0.051 |
imet | -0.051 |
umbs | -0.050 |
piping | -0.049 |
ocol | -0.049 |
Token | necklace |
Token ID | 38987 |
Feature activation | -3.76e-02 |
Pos logit contributions | |
piping | +0.041 |
ocol | +0.039 |
imet | +0.038 |
million | +0.038 |
endant | +0.037 |
Neg logit contributions | |
sound | -0.053 |
do | -0.041 |
listen | -0.039 |
her | -0.038 |
music | -0.038 |
Token | I |
Token ID | 314 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
endant | +0.072 |
piping | +0.069 |
dark | +0.069 |
million | +0.068 |
bead | +0.065 |
Neg logit contributions | |
sound | -0.048 |
inker | -0.040 |
communicate | -0.037 |
listen | -0.037 |
listened | -0.035 |
Token | have |
Token ID | 423 |
Feature activation | -4.89e-02 |
Pos logit contributions | |
piping | +0.185 |
endant | +0.182 |
million | +0.177 |
umm | +0.176 |
ocol | +0.175 |
Neg logit contributions | |
sound | -0.170 |
do | -0.141 |
listen | -0.137 |
listened | -0.136 |
not | -0.130 |
Token | ever |
Token ID | 1683 |
Feature activation | -7.20e-02 |
Pos logit contributions | |
endant | +0.084 |
piping | +0.082 |
ocol | +0.079 |
million | +0.078 |
dark | +0.078 |
Neg logit contributions | |
sound | -0.079 |
do | -0.059 |
listen | -0.059 |
inker | -0.058 |
listened | -0.056 |
Token | seen |
Token ID | 1775 |
Feature activation | -3.17e-02 |
Pos logit contributions | |
piping | +0.109 |
endant | +0.106 |
ocol | +0.102 |
umm | +0.102 |
million | +0.102 |
Neg logit contributions | |
sound | -0.133 |
do | -0.107 |
listened | -0.106 |
listen | -0.105 |
not | -0.101 |
Token | . |
Token ID | 13 |
Feature activation | +1.61e-03 |
Pos logit contributions | |
endant | +0.067 |
piping | +0.067 |
million | +0.065 |
ocol | +0.065 |
dark | +0.063 |
Neg logit contributions | |
sound | -0.038 |
do | -0.026 |
listen | -0.026 |
listened | -0.026 |
not | -0.024 |
Token | You |
Token ID | 921 |
Feature activation | -3.60e-02 |
Pos logit contributions | |
sound | +0.002 |
listen | +0.002 |
do | +0.002 |
not | +0.002 |
say | +0.002 |
Neg logit contributions | |
million | -0.003 |
endant | -0.003 |
camps | -0.003 |
ocol | -0.003 |
igsaw | -0.002 |
Token | quiet |
Token ID | 5897 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
freshly | +0.016 |
pleasure | +0.016 |
endant | +0.016 |
million | +0.016 |
piping | +0.016 |
Neg logit contributions | |
inker | -0.012 |
ics | -0.011 |
sound | -0.011 |
oo | -0.011 |
ister | -0.010 |
Token | anymore |
Token ID | 7471 |
Feature activation | +8.22e-03 |
Pos logit contributions | |
sound | +0.015 |
inker | +0.014 |
listen | +0.013 |
behave | +0.013 |
listened | +0.013 |
Neg logit contributions | |
million | -0.022 |
piping | -0.022 |
umm | -0.021 |
endant | -0.021 |
ocol | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | +6.64e-03 |
Pos logit contributions | |
sound | +0.011 |
inker | +0.009 |
listen | +0.009 |
listened | +0.008 |
behave | +0.008 |
Neg logit contributions | |
million | -0.015 |
endant | -0.014 |
piping | -0.014 |
ocol | -0.014 |
imet | -0.013 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
sound | +0.010 |
her | +0.008 |
not | +0.008 |
do | +0.008 |
listen | +0.008 |
Neg logit contributions | |
ocol | -0.012 |
piping | -0.012 |
endant | -0.012 |
camps | -0.011 |
umm | -0.011 |
Token | " |
Token ID | 1 |
Feature activation | +3.84e-04 |
Pos logit contributions | |
endant | +0.027 |
ocol | +0.026 |
piping | +0.026 |
umm | +0.025 |
brand | +0.024 |
Neg logit contributions | |
sound | -0.028 |
do | -0.025 |
her | -0.023 |
listened | -0.022 |
did | -0.022 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
sound | +0.001 |
do | +0.001 |
listened | +0.001 |
listen | +0.001 |
not | +0.001 |
Neg logit contributions | |
endant | -0.001 |
piping | -0.001 |
ocol | -0.001 |
million | -0.001 |
igsaw | -0.001 |
Token | Mom |
Token ID | 11254 |
Feature activation | -4.49e-02 |
Pos logit contributions | |
piping | +0.260 |
million | +0.256 |
endant | +0.256 |
umm | +0.254 |
ocol | +0.248 |
Neg logit contributions | |
sound | -0.085 |
do | -0.059 |
listen | -0.052 |
not | -0.049 |
listened | -0.048 |
Token | my |
Token ID | 1820 |
Feature activation | -4.81e-02 |
Pos logit contributions | |
piping | +0.071 |
endant | +0.069 |
million | +0.066 |
ocol | +0.065 |
imet | +0.063 |
Neg logit contributions | |
sound | -0.079 |
do | -0.062 |
listen | -0.062 |
listened | -0.061 |
communicate | -0.059 |
Token | , |
Token ID | 11 |
Feature activation | -6.12e-02 |
Pos logit contributions | |
piping | +0.096 |
endant | +0.094 |
million | +0.092 |
ocol | +0.090 |
imet | +0.089 |
Neg logit contributions | |
sound | -0.064 |
do | -0.045 |
listen | -0.044 |
inker | -0.044 |
communicate | -0.044 |
Token | what |
Token ID | 644 |
Feature activation | -9.04e-03 |
Pos logit contributions | |
piping | +0.116 |
endant | +0.112 |
million | +0.108 |
ocol | +0.107 |
freshly | +0.104 |
Neg logit contributions | |
sound | -0.091 |
listened | -0.066 |
do | -0.066 |
listen | -0.065 |
inker | -0.064 |
Token | can |
Token ID | 460 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
piping | +0.019 |
endant | +0.018 |
million | +0.018 |
ocol | +0.017 |
dark | +0.017 |
Neg logit contributions | |
sound | -0.011 |
listen | -0.008 |
do | -0.008 |
listened | -0.008 |
behave | -0.007 |
Token | says |
Token ID | 1139 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
sound | +0.049 |
behave | +0.032 |
listen | +0.032 |
inker | +0.032 |
do | +0.032 |
Neg logit contributions | |
endant | -0.069 |
piping | -0.068 |
million | -0.065 |
imet | -0.065 |
dark | -0.064 |
Token | , |
Token ID | 11 |
Feature activation | -1.34e-03 |
Pos logit contributions | |
piping | +0.024 |
endant | +0.023 |
imet | +0.022 |
million | +0.022 |
ocol | +0.022 |
Neg logit contributions | |
sound | -0.016 |
inker | -0.012 |
ably | -0.011 |
behave | -0.011 |
ising | -0.011 |
Token | " |
Token ID | 366 |
Feature activation | +7.96e-03 |
Pos logit contributions | |
piping | +0.002 |
endant | +0.002 |
million | +0.002 |
ocol | +0.002 |
imet | +0.002 |
Neg logit contributions | |
sound | -0.003 |
do | -0.002 |
listen | -0.002 |
listened | -0.002 |
inker | -0.002 |
Token | They |
Token ID | 2990 |
Feature activation | +7.55e-03 |
Pos logit contributions | |
sound | +0.014 |
do | +0.012 |
listen | +0.011 |
listened | +0.011 |
not | +0.011 |
Neg logit contributions | |
piping | -0.012 |
endant | -0.012 |
ocol | -0.012 |
million | -0.012 |
umm | -0.011 |
Token | are |
Token ID | 389 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
sound | +0.013 |
inker | +0.011 |
ably | +0.010 |
loudly | +0.010 |
oo | +0.009 |
Neg logit contributions | |
endant | -0.012 |
pleasure | -0.011 |
freshly | -0.011 |
million | -0.011 |
piping | -0.010 |
Token | av |
Token ID | 1196 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
sound | +0.017 |
do | +0.013 |
listen | +0.012 |
listened | +0.012 |
not | +0.012 |
Neg logit contributions | |
piping | -0.026 |
endant | -0.026 |
million | -0.025 |
ocol | -0.025 |
umm | -0.024 |
Token | oc |
Token ID | 420 |
Feature activation | -3.82e-02 |
Pos logit contributions | |
piping | +0.110 |
endant | +0.109 |
ocol | +0.097 |
million | +0.096 |
dark | +0.096 |
Neg logit contributions | |
sound | -0.238 |
do | -0.202 |
listen | -0.198 |
listened | -0.197 |
tails | -0.194 |
Token | ados |
Token ID | 22484 |
Feature activation | -2.86e-02 |
Pos logit contributions | |
ocol | +0.034 |
umm | +0.033 |
endant | +0.032 |
imet | +0.030 |
piping | +0.028 |
Neg logit contributions | |
sound | -0.095 |
do | -0.083 |
listen | -0.080 |
listened | -0.079 |
not | -0.079 |
Token | . |
Token ID | 13 |
Feature activation | +3.46e-03 |
Pos logit contributions | |
million | +0.049 |
endant | +0.049 |
camps | +0.048 |
piping | +0.046 |
lettuce | +0.045 |
Neg logit contributions | |
sound | -0.043 |
inker | -0.035 |
communicate | -0.034 |
listened | -0.033 |
listen | -0.032 |
Token | My |
Token ID | 2011 |
Feature activation | +2.33e-04 |
Pos logit contributions | |
sound | +0.005 |
do | +0.004 |
listen | +0.004 |
each | +0.004 |
not | +0.004 |
Neg logit contributions | |
endant | -0.006 |
piping | -0.006 |
million | -0.006 |
ocol | -0.006 |
igsaw | -0.006 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
sound | +0.000 |
do | +0.000 |
listen | +0.000 |
not | +0.000 |
listened | +0.000 |
Neg logit contributions | |
piping | -0.000 |
endant | -0.000 |
million | -0.000 |
ocol | -0.000 |
dark | -0.000 |
Token | so |
Token ID | 523 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
sound | +0.004 |
do | +0.003 |
listen | +0.003 |
inker | +0.003 |
listened | +0.003 |
Neg logit contributions | |
piping | -0.005 |
endant | -0.005 |
million | -0.004 |
pleasure | -0.004 |
ocol | -0.004 |
Token | happy |
Token ID | 3772 |
Feature activation | +2.58e-03 |
Pos logit contributions | |
sound | +0.025 |
inker | +0.020 |
listen | +0.020 |
do | +0.020 |
behave | +0.019 |
Neg logit contributions | |
piping | -0.025 |
endant | -0.025 |
million | -0.024 |
pleasure | -0.023 |
freshly | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | +9.10e-04 |
Pos logit contributions | |
sound | +0.003 |
inker | +0.003 |
communicate | +0.003 |
behave | +0.003 |
tails | +0.003 |
Neg logit contributions | |
endant | -0.005 |
million | -0.005 |
freshly | -0.005 |
umm | -0.005 |
joy | -0.005 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
her | +0.001 |
each | +0.001 |
sound | +0.001 |
not | +0.001 |
when | +0.001 |
Neg logit contributions | |
ocol | -0.002 |
endant | -0.002 |
piping | -0.002 |
camps | -0.002 |
imet | -0.002 |
Token | " |
Token ID | 1 |
Feature activation | -1.61e-03 |
Pos logit contributions | |
endant | +0.027 |
ocol | +0.026 |
piping | +0.025 |
umm | +0.024 |
imet | +0.023 |
Neg logit contributions | |
sound | -0.027 |
do | -0.024 |
listened | -0.022 |
her | -0.022 |
did | -0.021 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
endant | +0.003 |
piping | +0.002 |
ocol | +0.002 |
igsaw | +0.002 |
million | +0.002 |
Neg logit contributions | |
sound | -0.003 |
do | -0.002 |
listened | -0.002 |
listen | -0.002 |
not | -0.002 |
Token | !" |
Token ID | 2474 |
Feature activation | +7.95e-04 |
Pos logit contributions | |
piping | +0.254 |
endant | +0.252 |
million | +0.252 |
umm | +0.250 |
ocol | +0.244 |
Neg logit contributions | |
sound | -0.086 |
do | -0.062 |
listen | -0.054 |
not | -0.053 |
her | -0.051 |
Token | Mary |
Token ID | 5335 |
Feature activation | +1.70e-02 |
Pos logit contributions | |
sound | +0.001 |
communicate | +0.001 |
inker | +0.001 |
behave | +0.001 |
ising | +0.001 |
Neg logit contributions | |
There | -0.001 |
piping | -0.001 |
million | -0.001 |
endant | -0.001 |
lettuce | -0.001 |
Token | said |
Token ID | 531 |
Feature activation | -9.70e-03 |
Pos logit contributions | |
sound | +0.024 |
inker | +0.017 |
listen | +0.017 |
do | +0.016 |
communicate | +0.016 |
Neg logit contributions | |
piping | -0.033 |
endant | -0.032 |
dark | -0.031 |
million | -0.031 |
imet | -0.031 |
Token | to |
Token ID | 284 |
Feature activation | -4.32e-03 |
Pos logit contributions | |
piping | +0.017 |
pleasure | +0.017 |
brand | +0.016 |
million | +0.016 |
igsaw | +0.016 |
Neg logit contributions | |
sound | -0.013 |
inker | -0.011 |
ards | -0.011 |
tails | -0.010 |
ani | -0.010 |
Token | her |
Token ID | 607 |
Feature activation | +4.20e-03 |
Pos logit contributions | |
piping | +0.010 |
ocol | +0.009 |
endant | +0.009 |
pleasure | +0.009 |
freshly | +0.009 |
Neg logit contributions | |
sound | -0.004 |
listened | -0.003 |
do | -0.003 |
ising | -0.003 |
inker | -0.003 |
Token | too |
Token ID | 1165 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
piping | +0.025 |
endant | +0.025 |
million | +0.024 |
ocol | +0.024 |
freshly | +0.023 |
Neg logit contributions | |
sound | -0.022 |
do | -0.017 |
listen | -0.017 |
listened | -0.016 |
inker | -0.016 |
Token | late |
Token ID | 2739 |
Feature activation | +1.70e-02 |
Pos logit contributions | |
sound | +0.022 |
communicate | +0.019 |
inker | +0.019 |
do | +0.019 |
listen | +0.018 |
Neg logit contributions | |
million | -0.018 |
piping | -0.017 |
endant | -0.017 |
freshly | -0.016 |
brand | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | -1.87e-03 |
Pos logit contributions | |
sound | +0.026 |
inker | +0.023 |
communicate | +0.022 |
behave | +0.021 |
listened | +0.021 |
Neg logit contributions | |
imet | -0.027 |
freshly | -0.025 |
endant | -0.025 |
joy | -0.024 |
piping | -0.024 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.77e-02 |
Pos logit contributions | |
endant | +0.004 |
ocol | +0.004 |
seventeen | +0.004 |
piping | +0.004 |
camps | +0.004 |
Neg logit contributions | |
sound | -0.002 |
her | -0.002 |
not | -0.002 |
when | -0.002 |
do | -0.002 |
Token | " |
Token ID | 1 |
Feature activation | -1.85e-03 |
Pos logit contributions | |
endant | +0.029 |
ocol | +0.028 |
piping | +0.027 |
umm | +0.026 |
brand | +0.025 |
Neg logit contributions | |
sound | -0.031 |
do | -0.028 |
listened | -0.025 |
her | -0.025 |
did | -0.025 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
endant | +0.003 |
piping | +0.003 |
ocol | +0.003 |
million | +0.003 |
imet | +0.003 |
Neg logit contributions | |
sound | -0.003 |
do | -0.003 |
listened | -0.003 |
listen | -0.003 |
not | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | -5.63e-02 |
Pos logit contributions | |
piping | +0.241 |
endant | +0.239 |
million | +0.237 |
umm | +0.233 |
ocol | +0.228 |
Neg logit contributions | |
sound | -0.100 |
do | -0.076 |
listen | -0.068 |
not | -0.066 |
listened | -0.064 |
Token | Mom |
Token ID | 11254 |
Feature activation | -3.72e-02 |
Pos logit contributions | |
piping | +0.090 |
endant | +0.086 |
million | +0.084 |
ocol | +0.083 |
imet | +0.082 |
Neg logit contributions | |
sound | -0.097 |
listened | -0.074 |
do | -0.074 |
inker | -0.073 |
listen | -0.073 |
Token | my |
Token ID | 1820 |
Feature activation | -3.93e-02 |
Pos logit contributions | |
piping | +0.053 |
endant | +0.051 |
million | +0.049 |
ocol | +0.048 |
freshly | +0.046 |
Neg logit contributions | |
sound | -0.071 |
do | -0.057 |
communicate | -0.056 |
listen | -0.056 |
listened | -0.056 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.72e-03 |
Pos logit contributions | |
piping | +0.076 |
endant | +0.074 |
million | +0.073 |
ocol | +0.072 |
imet | +0.070 |
Neg logit contributions | |
sound | -0.054 |
communicate | -0.040 |
inker | -0.039 |
do | -0.037 |
listen | -0.037 |
Token | exclaimed |
Token ID | 33552 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
piping | +0.003 |
million | +0.003 |
endant | +0.003 |
There | +0.003 |
dark | +0.003 |
Neg logit contributions | |
sound | -0.003 |
communicate | -0.002 |
inker | -0.002 |
behave | -0.002 |
listen | -0.002 |
Token | is |
Token ID | 318 |
Feature activation | +9.37e-03 |
Pos logit contributions | |
sound | +0.011 |
do | +0.008 |
listen | +0.008 |
listened | +0.008 |
not | +0.008 |
Neg logit contributions | |
endant | -0.013 |
piping | -0.012 |
ocol | -0.012 |
million | -0.012 |
umm | -0.012 |
Token | the |
Token ID | 262 |
Feature activation | -2.85e-02 |
Pos logit contributions | |
sound | +0.010 |
do | +0.007 |
not | +0.006 |
listen | +0.006 |
listened | +0.006 |
Neg logit contributions | |
endant | -0.022 |
piping | -0.022 |
ocol | -0.021 |
million | -0.021 |
umm | -0.020 |
Token | best |
Token ID | 1266 |
Feature activation | +3.18e-04 |
Pos logit contributions | |
endant | +0.051 |
piping | +0.050 |
ocol | +0.049 |
million | +0.048 |
imet | +0.047 |
Neg logit contributions | |
sound | -0.045 |
do | -0.035 |
listen | -0.034 |
listened | -0.033 |
not | -0.033 |
Token | yellow |
Token ID | 7872 |
Feature activation | -2.96e-02 |
Pos logit contributions | |
sound | +0.001 |
do | +0.000 |
listen | +0.000 |
not | +0.000 |
listened | +0.000 |
Neg logit contributions | |
endant | -0.001 |
ocol | -0.001 |
piping | -0.001 |
imet | -0.001 |
pill | -0.001 |
Token | cake |
Token ID | 12187 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
piping | +0.043 |
endant | +0.042 |
million | +0.040 |
ocol | +0.040 |
umm | +0.038 |
Neg logit contributions | |
sound | -0.056 |
do | -0.046 |
listen | -0.045 |
listened | -0.045 |
not | -0.044 |
Token | I |
Token ID | 314 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
piping | +0.022 |
million | +0.022 |
endant | +0.021 |
umm | +0.021 |
dark | +0.021 |
Neg logit contributions | |
sound | -0.022 |
inker | -0.019 |
communicate | -0.018 |
tails | -0.018 |
gging | -0.018 |
Token | ever |
Token ID | 1683 |
Feature activation | -7.52e-02 |
Pos logit contributions | |
endant | +0.157 |
piping | +0.156 |
ocol | +0.149 |
dark | +0.147 |
freshly | +0.147 |
Neg logit contributions | |
sound | -0.187 |
inker | -0.142 |
loudly | -0.140 |
tails | -0.138 |
music | -0.135 |
Token | saw |
Token ID | 2497 |
Feature activation | -3.16e-02 |
Pos logit contributions | |
piping | +0.130 |
endant | +0.130 |
million | +0.128 |
dark | +0.121 |
ocol | +0.119 |
Neg logit contributions | |
sound | -0.115 |
inker | -0.088 |
do | -0.088 |
listen | -0.086 |
not | -0.084 |
Token | ! |
Token ID | 0 |
Feature activation | -9.02e-03 |
Pos logit contributions | |
million | +0.058 |
piping | +0.057 |
endant | +0.057 |
ocol | +0.055 |
dark | +0.055 |
Neg logit contributions | |
sound | -0.045 |
do | -0.034 |
listen | -0.034 |
communicate | -0.034 |
tails | -0.033 |
Token | Thank |
Token ID | 6952 |
Feature activation | -3.34e-02 |
Pos logit contributions | |
endant | +0.015 |
ocol | +0.014 |
camps | +0.014 |
piping | +0.013 |
million | +0.013 |
Neg logit contributions | |
sound | -0.015 |
listen | -0.013 |
do | -0.013 |
not | -0.012 |
listened | -0.012 |
Token | you |
Token ID | 345 |
Feature activation | -2.59e-02 |
Pos logit contributions | |
piping | +0.060 |
ocol | +0.059 |
million | +0.056 |
endant | +0.055 |
umm | +0.055 |
Neg logit contributions | |
sound | -0.050 |
do | -0.036 |
ably | -0.036 |
communicate | -0.035 |
ignore | -0.035 |
Token | 's |
Token ID | 338 |
Feature activation | +7.30e-03 |
Pos logit contributions | |
endant | +0.064 |
million | +0.059 |
piping | +0.058 |
dark | +0.058 |
bead | +0.055 |
Neg logit contributions | |
sound | -0.063 |
inker | -0.054 |
listen | -0.051 |
ably | -0.050 |
ising | -0.048 |
Token | the |
Token ID | 262 |
Feature activation | -2.54e-02 |
Pos logit contributions | |
sound | +0.008 |
do | +0.005 |
not | +0.005 |
listen | +0.005 |
listened | +0.005 |
Neg logit contributions | |
piping | -0.017 |
endant | -0.016 |
million | -0.016 |
ocol | -0.016 |
umm | -0.016 |
Token | most |
Token ID | 749 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
piping | +0.046 |
endant | +0.046 |
ocol | +0.045 |
million | +0.045 |
igsaw | +0.043 |
Neg logit contributions | |
sound | -0.040 |
do | -0.031 |
listen | -0.029 |
not | -0.029 |
listened | -0.028 |
Token | beautiful |
Token ID | 4950 |
Feature activation | -3.18e-02 |
Pos logit contributions | |
sound | +0.024 |
do | +0.017 |
not | +0.016 |
music | +0.015 |
when | +0.014 |
Neg logit contributions | |
� | -0.033 |
piping | -0.033 |
umbs | -0.032 |
ocol | -0.032 |
imet | -0.031 |
Token | thing |
Token ID | 1517 |
Feature activation | +2.17e-03 |
Pos logit contributions | |
piping | +0.055 |
ocol | +0.054 |
endant | +0.053 |
million | +0.053 |
� | +0.052 |
Neg logit contributions | |
sound | -0.056 |
do | -0.042 |
listen | -0.040 |
listened | -0.038 |
not | -0.038 |
Token | I |
Token ID | 314 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
sound | +0.003 |
inker | +0.003 |
do | +0.003 |
listen | +0.002 |
ising | +0.002 |
Neg logit contributions | |
endant | -0.004 |
piping | -0.004 |
dark | -0.004 |
million | -0.004 |
ocol | -0.003 |
Token | ever |
Token ID | 1683 |
Feature activation | -7.08e-02 |
Pos logit contributions | |
endant | +0.184 |
piping | +0.183 |
ocol | +0.175 |
million | +0.172 |
dark | +0.170 |
Neg logit contributions | |
sound | -0.161 |
do | -0.114 |
listen | -0.114 |
listened | -0.113 |
inker | -0.112 |
Token | saw |
Token ID | 2497 |
Feature activation | -3.16e-02 |
Pos logit contributions | |
endant | +0.127 |
piping | +0.127 |
million | +0.121 |
ocol | +0.120 |
dark | +0.117 |
Neg logit contributions | |
sound | -0.108 |
do | -0.081 |
listen | -0.079 |
listened | -0.077 |
not | -0.077 |
Token | . |
Token ID | 13 |
Feature activation | +2.45e-03 |
Pos logit contributions | |
endant | +0.058 |
piping | +0.057 |
million | +0.056 |
ocol | +0.056 |
dark | +0.056 |
Neg logit contributions | |
sound | -0.045 |
listen | -0.034 |
do | -0.034 |
listened | -0.033 |
inker | -0.033 |
Token | You |
Token ID | 921 |
Feature activation | -3.48e-02 |
Pos logit contributions | |
sound | +0.004 |
do | +0.004 |
listen | +0.004 |
not | +0.003 |
say | +0.003 |
Neg logit contributions | |
endant | -0.004 |
million | -0.004 |
piping | -0.004 |
camps | -0.004 |
ocol | -0.004 |
Token | 're |
Token ID | 821 |
Feature activation | +7.20e-03 |
Pos logit contributions | |
endant | +0.050 |
million | +0.043 |
dark | +0.042 |
piping | +0.041 |
bead | +0.040 |
Neg logit contributions | |
sound | -0.069 |
inker | -0.057 |
ising | -0.053 |
ics | -0.052 |
ably | -0.052 |
Token | fish |
Token ID | 5916 |
Feature activation | +3.82e-02 |
Pos logit contributions | |
sound | +0.001 |
do | +0.000 |
listen | +0.000 |
listened | +0.000 |
not | +0.000 |
Neg logit contributions | |
piping | -0.001 |
endant | -0.001 |
million | -0.000 |
ocol | -0.000 |
umm | -0.000 |
Token | said |
Token ID | 531 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
sound | +0.052 |
inker | +0.047 |
tails | +0.043 |
listen | +0.042 |
ably | +0.042 |
Neg logit contributions | |
million | -0.066 |
endant | -0.063 |
lettuce | -0.060 |
piping | -0.059 |
dark | -0.059 |
Token | , |
Token ID | 11 |
Feature activation | -1.77e-02 |
Pos logit contributions | |
piping | +0.049 |
imet | +0.049 |
million | +0.048 |
cuc | +0.047 |
ocol | +0.047 |
Neg logit contributions | |
sound | -0.047 |
inker | -0.044 |
tails | -0.039 |
ising | -0.039 |
ably | -0.038 |
Token | " |
Token ID | 366 |
Feature activation | -2.11e-02 |
Pos logit contributions | |
piping | +0.019 |
imet | +0.019 |
million | +0.018 |
endant | +0.018 |
ocol | +0.017 |
Neg logit contributions | |
sound | -0.038 |
inker | -0.032 |
do | -0.031 |
ably | -0.031 |
listened | -0.031 |
Token | Hi |
Token ID | 17250 |
Feature activation | -6.52e-02 |
Pos logit contributions | |
piping | +0.031 |
million | +0.030 |
endant | +0.029 |
ocol | +0.028 |
dark | +0.028 |
Neg logit contributions | |
sound | -0.039 |
do | -0.032 |
not | -0.031 |
listen | -0.031 |
listened | -0.030 |
Token | Gab |
Token ID | 12300 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
piping | +0.142 |
endant | +0.140 |
million | +0.137 |
ocol | +0.136 |
umm | +0.132 |
Neg logit contributions | |
sound | -0.075 |
do | -0.051 |
listen | -0.050 |
listened | -0.050 |
not | -0.047 |
Token | ri |
Token ID | 380 |
Feature activation | +8.23e-03 |
Pos logit contributions | |
piping | +0.197 |
endant | +0.192 |
million | +0.189 |
ocol | +0.183 |
umm | +0.180 |
Neg logit contributions | |
sound | -0.147 |
do | -0.112 |
listen | -0.111 |
listened | -0.106 |
not | -0.101 |
Token | ella |
Token ID | 12627 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
sound | +0.014 |
inker | +0.011 |
do | +0.011 |
her | +0.011 |
communicate | +0.011 |
Neg logit contributions | |
ocol | -0.012 |
imet | -0.012 |
endant | -0.012 |
piping | -0.012 |
dark | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | -2.59e-02 |
Pos logit contributions | |
piping | +0.061 |
endant | +0.059 |
million | +0.059 |
ocol | +0.058 |
imet | +0.057 |
Neg logit contributions | |
sound | -0.042 |
listened | -0.029 |
listen | -0.029 |
do | -0.029 |
inker | -0.029 |
Token | would |
Token ID | 561 |
Feature activation | +5.27e-03 |
Pos logit contributions | |
piping | +0.045 |
endant | +0.044 |
million | +0.043 |
ocol | +0.043 |
imet | +0.041 |
Neg logit contributions | |
sound | -0.040 |
listened | -0.030 |
do | -0.030 |
listen | -0.030 |
inker | -0.029 |
Token | you |
Token ID | 345 |
Feature activation | -7.33e-03 |
Pos logit contributions | |
sound | +0.007 |
inker | +0.006 |
ably | +0.006 |
ics | +0.005 |
tails | +0.005 |
Neg logit contributions | |
piping | -0.009 |
pleasure | -0.009 |
freshly | -0.009 |
ocol | -0.009 |
endant | -0.009 |
Token | from |
Token ID | 422 |
Feature activation | -3.78e-02 |
Pos logit contributions | |
endant | +0.068 |
piping | +0.066 |
million | +0.064 |
dark | +0.063 |
ocol | +0.062 |
Neg logit contributions | |
sound | -0.041 |
listen | -0.030 |
do | -0.030 |
listened | -0.029 |
inker | -0.029 |
Token | the |
Token ID | 262 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
piping | +0.103 |
endant | +0.103 |
million | +0.100 |
umm | +0.099 |
ocol | +0.099 |
Neg logit contributions | |
sound | -0.025 |
do | -0.011 |
listen | -0.010 |
listened | -0.008 |
not | -0.008 |
Token | attic |
Token ID | 46113 |
Feature activation | -4.18e-02 |
Pos logit contributions | |
piping | +0.018 |
ocol | +0.018 |
endant | +0.018 |
imet | +0.017 |
igsaw | +0.017 |
Neg logit contributions | |
sound | -0.018 |
do | -0.015 |
not | -0.013 |
listen | -0.013 |
music | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
endant | +0.088 |
million | +0.085 |
piping | +0.084 |
dark | +0.082 |
umm | +0.081 |
Neg logit contributions | |
sound | -0.048 |
listen | -0.035 |
do | -0.035 |
listened | -0.034 |
inker | -0.034 |
Token | " |
Token ID | 366 |
Feature activation | +3.88e-04 |
Pos logit contributions | |
ocol | +0.031 |
endant | +0.029 |
umm | +0.028 |
piping | +0.027 |
tal | +0.027 |
Neg logit contributions | |
sound | -0.015 |
her | -0.015 |
do | -0.015 |
not | -0.012 |
when | -0.012 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
sound | +0.001 |
listened | +0.000 |
listen | +0.000 |
do | +0.000 |
her | +0.000 |
Neg logit contributions | |
endant | -0.001 |
ocol | -0.001 |
piping | -0.001 |
igsaw | -0.001 |
imet | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | -4.68e-02 |
Pos logit contributions | |
piping | +0.257 |
endant | +0.253 |
million | +0.250 |
umm | +0.248 |
ocol | +0.246 |
Neg logit contributions | |
sound | -0.086 |
do | -0.059 |
listen | -0.053 |
not | -0.049 |
listened | -0.048 |
Token | Lily |
Token ID | 20037 |
Feature activation | -4.08e-02 |
Pos logit contributions | |
piping | +0.070 |
endant | +0.069 |
ocol | +0.067 |
million | +0.066 |
umm | +0.065 |
Neg logit contributions | |
sound | -0.087 |
do | -0.074 |
listen | -0.071 |
not | -0.069 |
listened | -0.069 |
Token | ! |
Token ID | 0 |
Feature activation | -2.42e-02 |
Pos logit contributions | |
endant | +0.086 |
piping | +0.084 |
million | +0.084 |
ocol | +0.079 |
umm | +0.079 |
Neg logit contributions | |
sound | -0.047 |
listen | -0.033 |
do | -0.032 |
listened | -0.032 |
communicate | -0.032 |
Token | This |
Token ID | 770 |
Feature activation | -4.92e-04 |
Pos logit contributions | |
ocol | +0.039 |
piping | +0.036 |
freshly | +0.035 |
million | +0.033 |
endant | +0.033 |
Neg logit contributions | |
sound | -0.040 |
do | -0.039 |
listen | -0.035 |
when | -0.035 |
not | -0.034 |
Token | chest |
Token ID | 7721 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
piping | +0.001 |
endant | +0.001 |
ocol | +0.001 |
million | +0.001 |
umm | +0.001 |
Neg logit contributions | |
sound | -0.001 |
do | -0.001 |
listen | -0.001 |
listened | -0.001 |
not | -0.001 |
Token | for |
Token ID | 329 |
Feature activation | +4.58e-02 |
Pos logit contributions | |
endant | +0.012 |
million | +0.012 |
pleasure | +0.011 |
piping | +0.011 |
igsaw | +0.011 |
Neg logit contributions | |
sound | -0.012 |
listened | -0.010 |
argue | -0.010 |
listen | -0.009 |
behave | -0.009 |
Token | others |
Token ID | 1854 |
Feature activation | +1.81e-02 |
Pos logit contributions | |
sound | +0.063 |
inker | +0.049 |
ics | +0.048 |
do | +0.047 |
tails | +0.047 |
Neg logit contributions | |
ocol | -0.078 |
million | -0.077 |
piping | -0.077 |
freshly | -0.075 |
endant | -0.074 |
Token | . |
Token ID | 13 |
Feature activation | +7.04e-04 |
Pos logit contributions | |
sound | +0.026 |
inker | +0.021 |
ics | +0.019 |
ards | +0.018 |
oo | +0.017 |
Neg logit contributions | |
million | -0.031 |
pleasure | -0.031 |
endant | -0.030 |
piping | -0.029 |
ifying | -0.029 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
sound | +0.001 |
not | +0.001 |
do | +0.001 |
listen | +0.001 |
obey | +0.001 |
Neg logit contributions | |
endant | -0.001 |
camps | -0.001 |
ocol | -0.001 |
piping | -0.001 |
imet | -0.001 |
Token | " |
Token ID | 1 |
Feature activation | -2.64e-03 |
Pos logit contributions | |
endant | +0.030 |
ocol | +0.029 |
piping | +0.028 |
umm | +0.027 |
imet | +0.026 |
Neg logit contributions | |
sound | -0.031 |
do | -0.028 |
her | -0.025 |
listened | -0.024 |
when | -0.024 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
piping | +0.004 |
endant | +0.004 |
million | +0.004 |
ocol | +0.004 |
umm | +0.003 |
Neg logit contributions | |
sound | -0.005 |
do | -0.004 |
listen | -0.004 |
listened | -0.004 |
not | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -5.27e-02 |
Pos logit contributions | |
piping | +0.231 |
endant | +0.230 |
ocol | +0.222 |
million | +0.222 |
umm | +0.215 |
Neg logit contributions | |
sound | -0.112 |
do | -0.075 |
listen | -0.073 |
listened | -0.071 |
not | -0.067 |
Token | there |
Token ID | 612 |
Feature activation | -4.64e-02 |
Pos logit contributions | |
piping | +0.074 |
endant | +0.071 |
million | +0.069 |
pleasure | +0.069 |
imet | +0.068 |
Neg logit contributions | |
sound | -0.098 |
inker | -0.077 |
tails | -0.077 |
ising | -0.076 |
listened | -0.076 |
Token | 's |
Token ID | 338 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
piping | +0.063 |
endant | +0.063 |
million | +0.063 |
pleasure | +0.059 |
There | +0.059 |
Neg logit contributions | |
sound | -0.081 |
ably | -0.069 |
inker | -0.065 |
listen | -0.065 |
listened | -0.065 |
Token | a |
Token ID | 257 |
Feature activation | +1.42e-03 |
Pos logit contributions | |
sound | +0.026 |
inker | +0.020 |
listened | +0.020 |
ably | +0.019 |
tails | +0.019 |
Neg logit contributions | |
piping | -0.042 |
endant | -0.041 |
pleasure | -0.040 |
freshly | -0.040 |
dark | -0.040 |
Token | stand |
Token ID | 1302 |
Feature activation | -2.08e-03 |
Pos logit contributions | |
sound | +0.002 |
do | +0.002 |
listen | +0.002 |
music | +0.002 |
listened | +0.002 |
Neg logit contributions | |
endant | -0.003 |
piping | -0.003 |
ocol | -0.003 |
imet | -0.002 |
umbs | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -2.85e-02 |
Pos logit contributions | |
imet | +0.039 |
piping | +0.038 |
ocol | +0.038 |
endant | +0.038 |
pleasure | +0.037 |
Neg logit contributions | |
sound | -0.031 |
listened | -0.024 |
ards | -0.023 |
behave | -0.022 |
obey | -0.022 |
Token | her |
Token ID | 607 |
Feature activation | -2.70e-02 |
Pos logit contributions | |
piping | +0.071 |
endant | +0.069 |
ocol | +0.067 |
million | +0.067 |
imet | +0.066 |
Neg logit contributions | |
sound | -0.021 |
do | -0.011 |
listened | -0.011 |
inker | -0.010 |
ards | -0.010 |
Token | mom |
Token ID | 1995 |
Feature activation | -2.65e-02 |
Pos logit contributions | |
piping | +0.047 |
endant | +0.047 |
million | +0.045 |
ocol | +0.044 |
imet | +0.043 |
Neg logit contributions | |
sound | -0.042 |
do | -0.032 |
listen | -0.032 |
listened | -0.032 |
behave | -0.031 |
Token | , |
Token ID | 11 |
Feature activation | -3.39e-02 |
Pos logit contributions | |
piping | +0.034 |
endant | +0.031 |
imet | +0.030 |
million | +0.030 |
berry | +0.029 |
Neg logit contributions | |
sound | -0.052 |
inker | -0.043 |
do | -0.042 |
listened | -0.042 |
communicate | -0.041 |
Token | " |
Token ID | 366 |
Feature activation | -1.43e-02 |
Pos logit contributions | |
piping | +0.047 |
endant | +0.046 |
million | +0.044 |
ocol | +0.043 |
imet | +0.043 |
Neg logit contributions | |
sound | -0.065 |
do | -0.053 |
listen | -0.051 |
listened | -0.051 |
inker | -0.050 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
endant | +0.026 |
ocol | +0.025 |
igsaw | +0.025 |
piping | +0.024 |
imet | +0.023 |
Neg logit contributions | |
sound | -0.024 |
listened | -0.019 |
do | -0.018 |
listen | -0.018 |
her | -0.017 |
Token | , |
Token ID | 11 |
Feature activation | -4.89e-02 |
Pos logit contributions | |
piping | +0.243 |
endant | +0.241 |
million | +0.236 |
ocol | +0.233 |
umm | +0.231 |
Neg logit contributions | |
sound | -0.098 |
do | -0.067 |
listen | -0.062 |
listened | -0.059 |
not | -0.058 |
Token | Mom |
Token ID | 11254 |
Feature activation | -3.47e-02 |
Pos logit contributions | |
endant | +0.094 |
piping | +0.093 |
ocol | +0.093 |
umm | +0.091 |
million | +0.090 |
Neg logit contributions | |
sound | -0.071 |
do | -0.057 |
listen | -0.054 |
not | -0.053 |
listened | -0.051 |
Token | my |
Token ID | 1820 |
Feature activation | -3.77e-02 |
Pos logit contributions | |
piping | +0.049 |
endant | +0.048 |
million | +0.047 |
ocol | +0.044 |
umm | +0.044 |
Neg logit contributions | |
sound | -0.065 |
do | -0.053 |
listen | -0.053 |
listened | -0.052 |
communicate | -0.050 |
Token | ! |
Token ID | 0 |
Feature activation | -2.66e-02 |
Pos logit contributions | |
endant | +0.066 |
million | +0.066 |
piping | +0.066 |
pleasure | +0.063 |
imet | +0.061 |
Neg logit contributions | |
sound | -0.054 |
communicate | -0.043 |
inker | -0.041 |
ably | -0.041 |
ards | -0.040 |
Token | A |
Token ID | 317 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
ocol | +0.046 |
endant | +0.042 |
irst | +0.040 |
igsaw | +0.039 |
piping | +0.039 |
Neg logit contributions | |
sound | -0.043 |
do | -0.039 |
listen | -0.036 |
not | -0.035 |
listened | -0.034 |
Token | room |
Token ID | 2119 |
Feature activation | +2.16e-03 |
Pos logit contributions | |
sound | +0.007 |
listen | +0.006 |
listened | +0.006 |
inker | +0.006 |
loudly | +0.006 |
Neg logit contributions | |
piping | -0.007 |
endant | -0.007 |
million | -0.006 |
freshly | -0.006 |
dark | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | -5.19e-04 |
Pos logit contributions | |
sound | +0.003 |
inker | +0.003 |
communicate | +0.003 |
tails | +0.003 |
gging | +0.003 |
Neg logit contributions | |
endant | -0.003 |
freshly | -0.003 |
ago | -0.003 |
piping | -0.003 |
brand | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
endant | +0.001 |
umm | +0.001 |
million | +0.001 |
impact | +0.001 |
bead | +0.001 |
Neg logit contributions | |
do | -0.001 |
her | -0.001 |
sound | -0.000 |
not | -0.000 |
each | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
endant | +0.034 |
ocol | +0.034 |
umm | +0.033 |
piping | +0.030 |
imet | +0.030 |
Neg logit contributions | |
sound | -0.029 |
do | -0.026 |
not | -0.024 |
listen | -0.022 |
her | -0.022 |
Token | " |
Token ID | 1 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
piping | +0.031 |
endant | +0.031 |
million | +0.029 |
ocol | +0.029 |
umm | +0.028 |
Neg logit contributions | |
sound | -0.031 |
do | -0.024 |
listen | -0.024 |
listened | -0.023 |
not | -0.023 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
sound | +0.030 |
listened | +0.025 |
listen | +0.025 |
do | +0.024 |
her | +0.023 |
Neg logit contributions | |
endant | -0.035 |
ocol | -0.032 |
igsaw | -0.031 |
tal | -0.030 |
imet | -0.030 |
Token | , |
Token ID | 11 |
Feature activation | -4.26e-02 |
Pos logit contributions | |
piping | +0.238 |
endant | +0.237 |
million | +0.229 |
ocol | +0.228 |
umm | +0.223 |
Neg logit contributions | |
sound | -0.103 |
do | -0.067 |
listen | -0.064 |
listened | -0.063 |
not | -0.059 |
Token | L |
Token ID | 406 |
Feature activation | -7.26e-03 |
Pos logit contributions | |
piping | +0.072 |
endant | +0.071 |
million | +0.068 |
ocol | +0.067 |
imet | +0.064 |
Neg logit contributions | |
sound | -0.070 |
listened | -0.053 |
do | -0.053 |
listen | -0.053 |
inker | -0.052 |
Token | ila |
Token ID | 10102 |
Feature activation | -2.35e-02 |
Pos logit contributions | |
piping | +0.015 |
million | +0.015 |
endant | +0.015 |
umm | +0.014 |
ocol | +0.014 |
Neg logit contributions | |
sound | -0.009 |
do | -0.007 |
listen | -0.007 |
listened | -0.006 |
not | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | -2.95e-02 |
Pos logit contributions | |
endant | +0.046 |
piping | +0.044 |
million | +0.043 |
imet | +0.042 |
dark | +0.041 |
Neg logit contributions | |
sound | -0.031 |
communicate | -0.024 |
inker | -0.024 |
listen | -0.022 |
behave | -0.022 |
Token | I |
Token ID | 314 |
Feature activation | -8.21e-02 |
Pos logit contributions | |
piping | +0.052 |
endant | +0.050 |
million | +0.048 |
ocol | +0.047 |
pleasure | +0.046 |
Neg logit contributions | |
sound | -0.047 |
inker | -0.035 |
ably | -0.034 |
ising | -0.034 |
listened | -0.034 |
Token | is |
Token ID | 318 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
sound | +0.018 |
inker | +0.015 |
communicate | +0.015 |
loudly | +0.015 |
obey | +0.015 |
Neg logit contributions | |
piping | -0.018 |
million | -0.017 |
endant | -0.017 |
dark | -0.016 |
freshly | -0.016 |
Token | the |
Token ID | 262 |
Feature activation | -2.23e-02 |
Pos logit contributions | |
sound | +0.017 |
do | +0.012 |
listen | +0.012 |
listened | +0.011 |
not | +0.011 |
Neg logit contributions | |
piping | -0.030 |
endant | -0.030 |
million | -0.029 |
ocol | -0.029 |
umm | -0.028 |
Token | most |
Token ID | 749 |
Feature activation | +2.23e-02 |
Pos logit contributions | |
piping | +0.039 |
endant | +0.039 |
million | +0.037 |
ocol | +0.036 |
umm | +0.036 |
Neg logit contributions | |
sound | -0.034 |
listened | -0.027 |
do | -0.026 |
listen | -0.026 |
inker | -0.025 |
Token | special |
Token ID | 2041 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
sound | +0.035 |
do | +0.027 |
listen | +0.025 |
not | +0.025 |
listened | +0.025 |
Neg logit contributions | |
endant | -0.041 |
piping | -0.041 |
ocol | -0.039 |
million | -0.038 |
imet | -0.038 |
Token | doll |
Token ID | 3654 |
Feature activation | -3.47e-02 |
Pos logit contributions | |
piping | +0.023 |
endant | +0.023 |
million | +0.022 |
ocol | +0.022 |
umm | +0.021 |
Neg logit contributions | |
sound | -0.024 |
do | -0.019 |
listen | -0.019 |
listened | -0.019 |
not | -0.018 |
Token | I |
Token ID | 314 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
endant | +0.058 |
piping | +0.057 |
dark | +0.057 |
million | +0.057 |
bead | +0.052 |
Neg logit contributions | |
sound | -0.052 |
inker | -0.044 |
gging | -0.041 |
communicate | -0.040 |
ising | -0.040 |
Token | ever |
Token ID | 1683 |
Feature activation | -6.99e-02 |
Pos logit contributions | |
piping | +0.169 |
endant | +0.168 |
ocol | +0.160 |
million | +0.159 |
dark | +0.156 |
Neg logit contributions | |
sound | -0.170 |
do | -0.124 |
listen | -0.123 |
inker | -0.122 |
listened | -0.121 |
Token | had |
Token ID | 550 |
Feature activation | -5.76e-02 |
Pos logit contributions | |
piping | +0.124 |
endant | +0.123 |
million | +0.119 |
dark | +0.115 |
ocol | +0.114 |
Neg logit contributions | |
sound | -0.106 |
inker | -0.079 |
do | -0.078 |
listen | -0.076 |
not | -0.075 |
Token | . |
Token ID | 13 |
Feature activation | +7.45e-04 |
Pos logit contributions | |
endant | +0.099 |
piping | +0.096 |
million | +0.094 |
dark | +0.091 |
ocol | +0.091 |
Neg logit contributions | |
sound | -0.087 |
inker | -0.067 |
listen | -0.065 |
communicate | -0.064 |
do | -0.064 |
Token | Thank |
Token ID | 6952 |
Feature activation | -3.00e-02 |
Pos logit contributions | |
sound | +0.001 |
listen | +0.001 |
do | +0.001 |
not | +0.001 |
her | +0.001 |
Neg logit contributions | |
endant | -0.001 |
million | -0.001 |
piping | -0.001 |
ocol | -0.001 |
camps | -0.001 |
Token | you |
Token ID | 345 |
Feature activation | -2.35e-02 |
Pos logit contributions | |
piping | +0.055 |
ocol | +0.055 |
endant | +0.053 |
million | +0.052 |
umm | +0.051 |
Neg logit contributions | |
sound | -0.043 |
do | -0.031 |
ably | -0.030 |
listened | -0.030 |
listen | -0.029 |
Token | , |
Token ID | 11 |
Feature activation | +9.74e-03 |
Pos logit contributions | |
million | +0.056 |
endant | +0.056 |
piping | +0.054 |
dark | +0.054 |
camps | +0.052 |
Neg logit contributions | |
sound | -0.050 |
inker | -0.040 |
listened | -0.039 |
listen | -0.039 |
communicate | -0.038 |
Token | we |
Token ID | 356 |
Feature activation | -2.73e-02 |
Pos logit contributions | |
sound | +0.014 |
inker | +0.012 |
listened | +0.011 |
ably | +0.011 |
ising | +0.011 |
Neg logit contributions | |
piping | -0.017 |
million | -0.016 |
endant | -0.016 |
freshly | -0.016 |
ocol | -0.016 |
Token | found |
Token ID | 1043 |
Feature activation | -2.66e-02 |
Pos logit contributions | |
piping | +0.038 |
endant | +0.037 |
million | +0.037 |
ocol | +0.036 |
pleasure | +0.035 |
Neg logit contributions | |
sound | -0.051 |
inker | -0.041 |
ably | -0.039 |
tails | -0.038 |
ising | -0.038 |
Token | a |
Token ID | 257 |
Feature activation | -1.63e-02 |
Pos logit contributions | |
piping | +0.057 |
endant | +0.057 |
million | +0.055 |
ocol | +0.055 |
dark | +0.053 |
Neg logit contributions | |
sound | -0.031 |
do | -0.022 |
listen | -0.021 |
listened | -0.021 |
behave | -0.020 |
Token | rare |
Token ID | 4071 |
Feature activation | -4.39e-02 |
Pos logit contributions | |
ocol | +0.028 |
endant | +0.028 |
piping | +0.028 |
umm | +0.028 |
dark | +0.027 |
Neg logit contributions | |
sound | -0.027 |
do | -0.021 |
not | -0.020 |
listen | -0.020 |
behave | -0.018 |
Token | rad |
Token ID | 2511 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
piping | +0.064 |
endant | +0.063 |
million | +0.060 |
ocol | +0.060 |
umm | +0.058 |
Neg logit contributions | |
sound | -0.083 |
do | -0.068 |
listen | -0.066 |
listened | -0.064 |
not | -0.063 |
Token | ish |
Token ID | 680 |
Feature activation | -3.13e-02 |
Pos logit contributions | |
piping | +0.191 |
igsaw | +0.186 |
endant | +0.181 |
dark | +0.178 |
million | +0.178 |
Neg logit contributions | |
sound | -0.143 |
do | -0.112 |
each | -0.110 |
ising | -0.108 |
listen | -0.103 |
Token | !" |
Token ID | 2474 |
Feature activation | +2.06e-02 |
Pos logit contributions | |
endant | +0.062 |
piping | +0.061 |
million | +0.060 |
ocol | +0.060 |
dark | +0.058 |
Neg logit contributions | |
sound | -0.040 |
listened | -0.030 |
listen | -0.029 |
inker | -0.029 |
do | -0.028 |
Token | they |
Token ID | 484 |
Feature activation | +6.01e-02 |
Pos logit contributions | |
sound | +0.039 |
do | +0.032 |
inker | +0.031 |
listen | +0.031 |
communicate | +0.031 |
Neg logit contributions | |
piping | -0.029 |
million | -0.027 |
endant | -0.027 |
imet | -0.025 |
ocol | -0.025 |
Token | shouted |
Token ID | 17293 |
Feature activation | -7.01e-03 |
Pos logit contributions | |
sound | +0.080 |
inker | +0.075 |
ising | +0.066 |
ably | +0.063 |
cles | +0.061 |
Neg logit contributions | |
cuc | -0.105 |
lettuce | -0.100 |
piping | -0.100 |
million | -0.100 |
Grac | -0.090 |
Token | , |
Token ID | 11 |
Feature activation | +9.67e-03 |
Pos logit contributions | |
imet | +0.012 |
pleasure | +0.012 |
joy | +0.012 |
piping | +0.012 |
ocol | +0.011 |
Neg logit contributions | |
sound | -0.010 |
inker | -0.008 |
tails | -0.008 |
ics | -0.007 |
listened | -0.007 |
Token | big |
Token ID | 1263 |
Feature activation | -5.18e-02 |
Pos logit contributions | |
piping | +0.045 |
endant | +0.045 |
million | +0.043 |
ocol | +0.042 |
igsaw | +0.040 |
Neg logit contributions | |
sound | -0.048 |
do | -0.038 |
listen | -0.037 |
listened | -0.037 |
not | -0.036 |
Token | map |
Token ID | 3975 |
Feature activation | -2.44e-02 |
Pos logit contributions | |
piping | +0.072 |
endant | +0.071 |
million | +0.069 |
ocol | +0.067 |
igsaw | +0.065 |
Neg logit contributions | |
sound | -0.098 |
listened | -0.080 |
do | -0.080 |
listen | -0.079 |
not | -0.078 |
Token | and |
Token ID | 290 |
Feature activation | -2.46e-02 |
Pos logit contributions | |
endant | +0.049 |
piping | +0.047 |
million | +0.046 |
dark | +0.045 |
imet | +0.045 |
Neg logit contributions | |
sound | -0.030 |
inker | -0.024 |
listen | -0.022 |
communicate | -0.022 |
do | -0.021 |
Token | said |
Token ID | 531 |
Feature activation | -3.15e-02 |
Pos logit contributions | |
piping | +0.044 |
million | +0.044 |
brand | +0.043 |
endant | +0.043 |
lettuce | +0.041 |
Neg logit contributions | |
sound | -0.032 |
inker | -0.028 |
ics | -0.025 |
ising | -0.025 |
ards | -0.025 |
Token | " |
Token ID | 366 |
Feature activation | -2.34e-02 |
Pos logit contributions | |
piping | +0.061 |
imet | +0.059 |
endant | +0.057 |
ocol | +0.057 |
million | +0.056 |
Neg logit contributions | |
sound | -0.044 |
inker | -0.033 |
ably | -0.032 |
tails | -0.031 |
behave | -0.031 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
piping | +0.031 |
million | +0.030 |
endant | +0.029 |
dark | +0.029 |
umm | +0.028 |
Neg logit contributions | |
sound | -0.046 |
not | -0.039 |
do | -0.039 |
listen | -0.039 |
listened | -0.037 |
Token | , |
Token ID | 11 |
Feature activation | -3.76e-02 |
Pos logit contributions | |
piping | +0.219 |
endant | +0.218 |
ocol | +0.211 |
million | +0.210 |
umm | +0.204 |
Neg logit contributions | |
sound | -0.119 |
do | -0.083 |
listen | -0.080 |
listened | -0.080 |
not | -0.075 |
Token | this |
Token ID | 428 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
piping | +0.057 |
endant | +0.056 |
million | +0.054 |
ocol | +0.051 |
pleasure | +0.050 |
Neg logit contributions | |
sound | -0.066 |
inker | -0.053 |
listened | -0.052 |
ably | -0.052 |
ising | -0.051 |
Token | map |
Token ID | 3975 |
Feature activation | -2.84e-02 |
Pos logit contributions | |
endant | +0.033 |
piping | +0.032 |
million | +0.031 |
dark | +0.030 |
camps | +0.030 |
Neg logit contributions | |
sound | -0.030 |
listened | -0.023 |
listen | -0.023 |
behave | -0.022 |
do | -0.022 |
Token | is |
Token ID | 318 |
Feature activation | +6.54e-03 |
Pos logit contributions | |
endant | +0.044 |
million | +0.043 |
piping | +0.041 |
dark | +0.040 |
imet | +0.039 |
Neg logit contributions | |
sound | -0.049 |
listen | -0.039 |
listened | -0.038 |
inker | -0.038 |
communicate | -0.038 |
Token | very |
Token ID | 845 |
Feature activation | +6.83e-04 |
Pos logit contributions | |
sound | +0.008 |
listen | +0.006 |
do | +0.006 |
listened | +0.006 |
inker | +0.006 |
Neg logit contributions | |
endant | -0.013 |
piping | -0.013 |
million | -0.013 |
ocol | -0.012 |
imet | -0.012 |
Token | scared |
Token ID | 12008 |
Feature activation | +1.73e-02 |
Pos logit contributions | |
piping | +0.004 |
endant | +0.004 |
ocol | +0.004 |
million | +0.003 |
freshly | +0.003 |
Neg logit contributions | |
sound | -0.003 |
listened | -0.002 |
do | -0.002 |
inker | -0.002 |
listen | -0.002 |
Token | of |
Token ID | 286 |
Feature activation | +8.49e-03 |
Pos logit contributions | |
sound | +0.025 |
listened | +0.019 |
do | +0.019 |
listen | +0.019 |
behave | +0.018 |
Neg logit contributions | |
piping | -0.031 |
million | -0.031 |
endant | -0.031 |
ocol | -0.030 |
umm | -0.029 |
Token | the |
Token ID | 262 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
sound | +0.011 |
listened | +0.008 |
ably | +0.008 |
listen | +0.008 |
inker | +0.008 |
Neg logit contributions | |
ocol | -0.016 |
endant | -0.016 |
million | -0.016 |
piping | -0.016 |
imet | -0.015 |
Token | weird |
Token ID | 7650 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
piping | +0.028 |
endant | +0.027 |
million | +0.026 |
ocol | +0.026 |
umm | +0.025 |
Neg logit contributions | |
sound | -0.031 |
do | -0.025 |
listen | -0.024 |
listened | -0.024 |
not | -0.023 |
Token | thing |
Token ID | 1517 |
Feature activation | -4.66e-03 |
Pos logit contributions | |
piping | +0.030 |
endant | +0.029 |
million | +0.028 |
ocol | +0.027 |
umm | +0.026 |
Neg logit contributions | |
sound | -0.055 |
do | -0.046 |
listen | -0.045 |
listened | -0.045 |
not | -0.044 |
Token | I |
Token ID | 314 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
million | +0.007 |
endant | +0.007 |
piping | +0.007 |
dark | +0.007 |
imet | +0.006 |
Neg logit contributions | |
sound | -0.008 |
inker | -0.007 |
communicate | -0.006 |
listened | -0.006 |
listen | -0.006 |
Token | saw |
Token ID | 2497 |
Feature activation | -2.91e-02 |
Pos logit contributions | |
endant | +0.164 |
dark | +0.156 |
freshly | +0.153 |
Wouldn | +0.151 |
million | +0.150 |
Neg logit contributions | |
sound | -0.159 |
ably | -0.119 |
ising | -0.119 |
inker | -0.118 |
loudly | -0.116 |
Token | ," |
Token ID | 553 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
endant | +0.052 |
piping | +0.052 |
million | +0.052 |
ocol | +0.050 |
dark | +0.049 |
Neg logit contributions | |
sound | -0.042 |
listen | -0.033 |
do | -0.033 |
listened | -0.032 |
behave | -0.031 |
Token | the |
Token ID | 262 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
inker | +0.015 |
sound | +0.014 |
ics | +0.014 |
ably | +0.013 |
tails | +0.013 |
Neg logit contributions | |
million | -0.021 |
piping | -0.021 |
freshly | -0.020 |
dark | -0.020 |
imet | -0.020 |
Token | pig |
Token ID | 12967 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
sound | +0.021 |
do | +0.016 |
not | +0.015 |
listened | +0.015 |
listen | +0.015 |
Neg logit contributions | |
endant | -0.025 |
ocol | -0.024 |
igsaw | -0.024 |
piping | -0.024 |
imet | -0.023 |
Token | said |
Token ID | 531 |
Feature activation | -9.00e-03 |
Pos logit contributions | |
sound | +0.020 |
inker | +0.019 |
music | +0.019 |
communicate | +0.018 |
behave | +0.018 |
Neg logit contributions | |
endant | -0.025 |
million | -0.024 |
pad | -0.022 |
tal | -0.022 |
berry | -0.022 |
Token | lively |
Token ID | 29696 |
Feature activation | -4.26e-03 |
Pos logit contributions | |
sound | +0.000 |
listen | +0.000 |
listened | +0.000 |
do | +0.000 |
inker | +0.000 |
Neg logit contributions | |
piping | -0.000 |
endant | -0.000 |
ocol | -0.000 |
million | -0.000 |
umm | -0.000 |
Token | adventure |
Token ID | 8855 |
Feature activation | +7.98e-03 |
Pos logit contributions | |
piping | +0.007 |
ocol | +0.006 |
endant | +0.006 |
million | +0.006 |
umm | +0.006 |
Neg logit contributions | |
sound | -0.007 |
listened | -0.006 |
do | -0.006 |
listen | -0.006 |
not | -0.006 |
Token | ! |
Token ID | 0 |
Feature activation | -2.75e-05 |
Pos logit contributions | |
sound | +0.011 |
listen | +0.010 |
inker | +0.010 |
communicate | +0.009 |
ignore | +0.009 |
Neg logit contributions | |
million | -0.013 |
umm | -0.013 |
igsaw | -0.013 |
� | -0.013 |
pleasure | -0.013 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
ocol | +0.000 |
endant | +0.000 |
piping | +0.000 |
camps | +0.000 |
umm | +0.000 |
Neg logit contributions | |
sound | -0.000 |
not | -0.000 |
each | -0.000 |
do | -0.000 |
her | -0.000 |
Token | " |
Token ID | 1 |
Feature activation | -1.03e-03 |
Pos logit contributions | |
endant | +0.020 |
ocol | +0.019 |
piping | +0.019 |
umm | +0.018 |
imet | +0.017 |
Neg logit contributions | |
sound | -0.024 |
do | -0.022 |
listened | -0.020 |
her | -0.020 |
listen | -0.019 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
endant | +0.002 |
piping | +0.002 |
ocol | +0.002 |
million | +0.001 |
igsaw | +0.001 |
Neg logit contributions | |
sound | -0.002 |
do | -0.002 |
listened | -0.001 |
listen | -0.001 |
not | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | -5.44e-02 |
Pos logit contributions | |
piping | +0.230 |
endant | +0.228 |
million | +0.224 |
ocol | +0.220 |
umm | +0.219 |
Neg logit contributions | |
sound | -0.106 |
do | -0.075 |
listen | -0.070 |
listened | -0.068 |
not | -0.066 |
Token | Mom |
Token ID | 11254 |
Feature activation | -3.19e-02 |
Pos logit contributions | |
piping | +0.089 |
endant | +0.085 |
million | +0.083 |
ocol | +0.082 |
pleasure | +0.081 |
Neg logit contributions | |
sound | -0.091 |
listened | -0.069 |
do | -0.068 |
listen | -0.068 |
inker | -0.067 |
Token | ! |
Token ID | 0 |
Feature activation | -3.69e-02 |
Pos logit contributions | |
piping | +0.046 |
endant | +0.045 |
million | +0.043 |
ocol | +0.041 |
freshly | +0.041 |
Neg logit contributions | |
sound | -0.060 |
communicate | -0.048 |
do | -0.047 |
listen | -0.047 |
inker | -0.047 |
Token | It |
Token ID | 632 |
Feature activation | -4.84e-02 |
Pos logit contributions | |
endant | +0.068 |
ocol | +0.062 |
piping | +0.061 |
brand | +0.060 |
impact | +0.060 |
Neg logit contributions | |
sound | -0.050 |
do | -0.042 |
listen | -0.040 |
when | -0.040 |
her | -0.040 |
Token | 's |
Token ID | 338 |
Feature activation | +6.94e-03 |
Pos logit contributions | |
piping | +0.094 |
million | +0.093 |
endant | +0.091 |
dark | +0.088 |
freshly | +0.087 |
Neg logit contributions | |
sound | -0.066 |
listen | -0.049 |
do | -0.047 |
inker | -0.047 |
listened | -0.046 |
Token | " |
Token ID | 366 |
Feature activation | -7.90e-03 |
Pos logit contributions | |
piping | +0.018 |
imet | +0.018 |
million | +0.018 |
endant | +0.018 |
freshly | +0.017 |
Neg logit contributions | |
sound | -0.026 |
inker | -0.023 |
tails | -0.022 |
ics | -0.021 |
do | -0.021 |
Token | Thanks |
Token ID | 9690 |
Feature activation | -4.80e-02 |
Pos logit contributions | |
piping | +0.012 |
endant | +0.012 |
ocol | +0.012 |
million | +0.012 |
umm | +0.011 |
Neg logit contributions | |
sound | -0.014 |
do | -0.011 |
listen | -0.011 |
listened | -0.011 |
not | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | -2.38e-02 |
Pos logit contributions | |
endant | +0.086 |
pleasure | +0.085 |
piping | +0.083 |
imet | +0.082 |
umm | +0.081 |
Neg logit contributions | |
sound | -0.068 |
listened | -0.054 |
ards | -0.052 |
communicate | -0.052 |
ably | -0.049 |
Token | Dad |
Token ID | 17415 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
piping | +0.036 |
endant | +0.036 |
ocol | +0.034 |
million | +0.034 |
umm | +0.034 |
Neg logit contributions | |
sound | -0.042 |
listened | -0.033 |
do | -0.033 |
tails | -0.032 |
listen | -0.032 |
Token | , |
Token ID | 11 |
Feature activation | -1.41e-02 |
Pos logit contributions | |
piping | +0.025 |
million | +0.024 |
endant | +0.024 |
pleasure | +0.023 |
berry | +0.023 |
Neg logit contributions | |
sound | -0.027 |
communicate | -0.023 |
inker | -0.023 |
listen | -0.020 |
do | -0.020 |
Token | for |
Token ID | 329 |
Feature activation | +5.27e-02 |
Pos logit contributions | |
piping | +0.022 |
endant | +0.022 |
million | +0.021 |
ocol | +0.021 |
umm | +0.021 |
Neg logit contributions | |
sound | -0.024 |
listened | -0.018 |
do | -0.018 |
listen | -0.018 |
inker | -0.018 |
Token | attaching |
Token ID | 39550 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
sound | +0.075 |
ably | +0.061 |
inker | +0.059 |
tails | +0.057 |
listen | +0.057 |
Neg logit contributions | |
million | -0.089 |
piping | -0.087 |
ocol | -0.086 |
endant | -0.085 |
pleasure | -0.083 |
Token | my |
Token ID | 616 |
Feature activation | -1.86e-02 |
Pos logit contributions | |
sound | +0.032 |
listened | +0.025 |
do | +0.024 |
listen | +0.024 |
inker | +0.023 |
Neg logit contributions | |
piping | -0.046 |
endant | -0.046 |
ocol | -0.045 |
imet | -0.044 |
million | -0.044 |
Token | pedal |
Token ID | 26667 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
piping | +0.033 |
endant | +0.033 |
million | +0.032 |
ocol | +0.032 |
imet | +0.031 |
Neg logit contributions | |
sound | -0.028 |
do | -0.022 |
listen | -0.021 |
listened | -0.021 |
not | -0.020 |
Token | !" |
Token ID | 2474 |
Feature activation | +8.03e-03 |
Pos logit contributions | |
endant | +0.037 |
imet | +0.035 |
million | +0.035 |
piping | +0.034 |
brand | +0.034 |
Neg logit contributions | |
sound | -0.030 |
listened | -0.026 |
listen | -0.025 |
communicate | -0.025 |
inker | -0.024 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
sound | +0.017 |
do | +0.014 |
listen | +0.014 |
listened | +0.013 |
not | +0.013 |
Neg logit contributions | |
piping | -0.010 |
endant | -0.010 |
million | -0.010 |
ocol | -0.010 |
umm | -0.009 |
Token | what |
Token ID | 644 |
Feature activation | +2.39e-04 |
Pos logit contributions | |
endant | +0.059 |
piping | +0.058 |
umm | +0.056 |
million | +0.056 |
ocol | +0.056 |
Neg logit contributions | |
sound | -0.043 |
do | -0.033 |
listen | -0.032 |
not | -0.031 |
listened | -0.031 |
Token | was |
Token ID | 373 |
Feature activation | -5.10e-03 |
Pos logit contributions | |
sound | +0.000 |
listen | +0.000 |
do | +0.000 |
listened | +0.000 |
inker | +0.000 |
Neg logit contributions | |
piping | -0.000 |
endant | -0.000 |
million | -0.000 |
ocol | -0.000 |
dark | -0.000 |
Token | behind |
Token ID | 2157 |
Feature activation | -3.45e-02 |
Pos logit contributions | |
piping | +0.008 |
endant | +0.008 |
million | +0.008 |
ocol | +0.008 |
dark | +0.008 |
Neg logit contributions | |
sound | -0.009 |
do | -0.007 |
listen | -0.007 |
listened | -0.007 |
inker | -0.006 |
Token | it |
Token ID | 340 |
Feature activation | -2.86e-02 |
Pos logit contributions | |
piping | +0.062 |
ocol | +0.061 |
million | +0.060 |
endant | +0.057 |
freshly | +0.057 |
Neg logit contributions | |
sound | -0.051 |
listened | -0.040 |
listen | -0.039 |
behave | -0.039 |
inker | -0.038 |
Token | . |
Token ID | 13 |
Feature activation | +2.60e-03 |
Pos logit contributions | |
million | +0.049 |
piping | +0.048 |
endant | +0.047 |
� | +0.046 |
imet | +0.046 |
Neg logit contributions | |
sound | -0.040 |
listened | -0.034 |
inker | -0.032 |
behave | -0.032 |
listen | -0.032 |
Token | When |
Token ID | 1649 |
Feature activation | +5.39e-02 |
Pos logit contributions | |
sound | +0.005 |
do | +0.004 |
listen | +0.004 |
not | +0.004 |
listened | +0.004 |
Neg logit contributions | |
endant | -0.004 |
piping | -0.004 |
ocol | -0.004 |
million | -0.004 |
umm | -0.004 |
Token | he |
Token ID | 339 |
Feature activation | +4.23e-02 |
Pos logit contributions | |
sound | +0.096 |
inker | +0.083 |
tails | +0.082 |
ably | +0.082 |
communicate | +0.080 |
Neg logit contributions | |
million | -0.076 |
piping | -0.074 |
igsaw | -0.072 |
� | -0.071 |
imet | -0.071 |
Token | was |
Token ID | 373 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
sound | +0.064 |
do | +0.048 |
listen | +0.047 |
listened | +0.046 |
not | +0.045 |
Neg logit contributions | |
piping | -0.078 |
endant | -0.077 |
million | -0.075 |
ocol | -0.074 |
imet | -0.072 |
Token | close |
Token ID | 1969 |
Feature activation | +7.02e-04 |
Pos logit contributions | |
sound | +0.038 |
do | +0.028 |
listen | +0.028 |
inker | +0.027 |
tails | +0.027 |
Neg logit contributions | |
piping | -0.044 |
endant | -0.043 |
million | -0.042 |
ocol | -0.041 |
imet | -0.040 |
Token | , |
Token ID | 11 |
Feature activation | +6.12e-03 |
Pos logit contributions | |
sound | +0.001 |
behave | +0.001 |
communicate | +0.001 |
listen | +0.001 |
do | +0.001 |
Neg logit contributions | |
joy | -0.001 |
endant | -0.001 |
piping | -0.001 |
ocol | -0.001 |
imet | -0.001 |
Token | he |
Token ID | 339 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
sound | +0.011 |
tails | +0.009 |
inker | +0.009 |
behave | +0.009 |
ani | +0.009 |
Neg logit contributions | |
million | -0.009 |
piping | -0.008 |
brand | -0.008 |
igsaw | -0.008 |
pleasure | -0.008 |
Token | of |
Token ID | 286 |
Feature activation | +5.15e-04 |
Pos logit contributions | |
sound | +0.007 |
listened | +0.006 |
do | +0.006 |
listen | +0.006 |
inker | +0.006 |
Neg logit contributions | |
piping | -0.004 |
endant | -0.004 |
million | -0.004 |
ocol | -0.004 |
dark | -0.004 |
Token | it |
Token ID | 340 |
Feature activation | -3.79e-02 |
Pos logit contributions | |
sound | +0.001 |
listened | +0.001 |
inker | +0.001 |
ably | +0.001 |
do | +0.001 |
Neg logit contributions | |
ocol | -0.001 |
piping | -0.001 |
million | -0.001 |
freshly | -0.001 |
endant | -0.001 |
Token | ." |
Token ID | 526 |
Feature activation | -1.01e-03 |
Pos logit contributions | |
million | +0.057 |
camps | +0.054 |
dark | +0.051 |
piping | +0.050 |
umbs | +0.050 |
Neg logit contributions | |
sound | -0.063 |
inker | -0.054 |
communicate | -0.053 |
listened | -0.052 |
do | -0.051 |
Token |
|
Token ID | 198 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
ocol | +0.002 |
endant | +0.002 |
piping | +0.002 |
camps | +0.001 |
umm | +0.001 |
Neg logit contributions | |
sound | -0.002 |
do | -0.001 |
not | -0.001 |
listened | -0.001 |
listen | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
endant | +0.023 |
umm | +0.023 |
ocol | +0.023 |
piping | +0.022 |
imet | +0.020 |
Neg logit contributions | |
sound | -0.023 |
do | -0.020 |
not | -0.019 |
listen | -0.018 |
listened | -0.018 |
Token | After |
Token ID | 3260 |
Feature activation | +5.61e-02 |
Pos logit contributions | |
million | +0.024 |
piping | +0.023 |
endant | +0.022 |
igsaw | +0.021 |
ocol | +0.021 |
Neg logit contributions | |
sound | -0.023 |
do | -0.018 |
listen | -0.018 |
listened | -0.017 |
inker | -0.017 |
Token | breakfast |
Token ID | 12607 |
Feature activation | +5.28e-02 |
Pos logit contributions | |
sound | +0.084 |
inker | +0.067 |
ably | +0.066 |
ising | +0.062 |
do | +0.060 |
Neg logit contributions | |
piping | -0.102 |
million | -0.097 |
freshly | -0.096 |
ocol | -0.096 |
� | -0.096 |
Token | , |
Token ID | 11 |
Feature activation | +9.25e-03 |
Pos logit contributions | |
sound | +0.072 |
communicate | +0.062 |
tails | +0.061 |
inker | +0.061 |
listen | +0.057 |
Neg logit contributions | |
� | -0.096 |
million | -0.095 |
piping | -0.093 |
imet | -0.088 |
berry | -0.088 |
Token | Lily |
Token ID | 20037 |
Feature activation | +7.29e-03 |
Pos logit contributions | |
sound | +0.016 |
inker | +0.013 |
do | +0.013 |
listen | +0.013 |
communicate | +0.013 |
Neg logit contributions | |
piping | -0.014 |
million | -0.014 |
endant | -0.013 |
freshly | -0.013 |
ocol | -0.013 |
Token | was |
Token ID | 373 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
sound | +0.012 |
inker | +0.009 |
communicate | +0.009 |
ourselves | +0.009 |
listen | +0.009 |
Neg logit contributions | |
million | -0.012 |
piping | -0.011 |
endant | -0.011 |
camps | -0.011 |
imet | -0.011 |
Token | playing |
Token ID | 2712 |
Feature activation | +4.13e-02 |
Pos logit contributions | |
sound | +0.021 |
do | +0.016 |
listen | +0.015 |
inker | +0.015 |
listened | +0.015 |
Neg logit contributions | |
piping | -0.025 |
endant | -0.025 |
million | -0.024 |
ocol | -0.024 |
dark | -0.023 |
Token | Rena |
Token ID | 27694 |
Feature activation | +4.97e-02 |
Pos logit contributions | |
sound | +0.053 |
ards | +0.048 |
ics | +0.045 |
behave | +0.044 |
ably | +0.040 |
Neg logit contributions | |
Once | -0.042 |
By | -0.041 |
There | -0.040 |
million | -0.040 |
Which | -0.038 |
Token | used |
Token ID | 973 |
Feature activation | +4.85e-03 |
Pos logit contributions | |
sound | +0.085 |
inker | +0.065 |
ourselves | +0.065 |
ics | +0.063 |
ikes | +0.059 |
Neg logit contributions | |
dark | -0.072 |
imet | -0.071 |
There | -0.070 |
endant | -0.070 |
Wouldn | -0.066 |
Token | her |
Token ID | 607 |
Feature activation | -2.21e-02 |
Pos logit contributions | |
sound | +0.006 |
ising | +0.004 |
inker | +0.004 |
do | +0.004 |
listen | +0.004 |
Neg logit contributions | |
piping | -0.010 |
igsaw | -0.009 |
ocol | -0.009 |
million | -0.009 |
brand | -0.009 |
Token | hands |
Token ID | 2832 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
piping | +0.037 |
endant | +0.037 |
million | +0.035 |
ocol | +0.035 |
umm | +0.034 |
Neg logit contributions | |
sound | -0.037 |
do | -0.030 |
listen | -0.029 |
listened | -0.028 |
not | -0.028 |
Token | to |
Token ID | 284 |
Feature activation | +8.06e-03 |
Pos logit contributions | |
pad | +0.014 |
run | +0.014 |
imet | +0.014 |
endant | +0.014 |
nowhere | +0.013 |
Neg logit contributions | |
sound | -0.022 |
inker | -0.019 |
prove | -0.019 |
ising | -0.018 |
do | -0.018 |
Token | communicate |
Token ID | 10996 |
Feature activation | +7.44e-02 |
Pos logit contributions | |
w | +0.010 |
inker | +0.010 |
ics | +0.010 |
ards | +0.009 |
sound | +0.009 |
Neg logit contributions | |
tow | -0.011 |
pleasure | -0.011 |
piping | -0.011 |
freshly | -0.011 |
impact | -0.011 |
Token | with |
Token ID | 351 |
Feature activation | +3.51e-04 |
Pos logit contributions | |
sound | +0.091 |
w | +0.086 |
ics | +0.086 |
inker | +0.083 |
listened | +0.079 |
Neg logit contributions | |
brand | -0.110 |
igsaw | -0.106 |
run | -0.103 |
joy | -0.101 |
Some | -0.101 |
Token | Rose |
Token ID | 8049 |
Feature activation | -5.30e-03 |
Pos logit contributions | |
sound | +0.001 |
listened | +0.000 |
ics | +0.000 |
obey | +0.000 |
listen | +0.000 |
Neg logit contributions | |
ocol | -0.001 |
piping | -0.000 |
pill | -0.000 |
igsaw | -0.000 |
pleasure | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +2.83e-03 |
Pos logit contributions | |
pad | +0.009 |
endant | +0.008 |
million | +0.008 |
igsaw | +0.008 |
piping | +0.008 |
Neg logit contributions | |
sound | -0.008 |
inker | -0.007 |
listen | -0.006 |
w | -0.006 |
behave | -0.006 |
Token | She |
Token ID | 1375 |
Feature activation | -8.54e-03 |
Pos logit contributions | |
sound | +0.006 |
listened | +0.005 |
do | +0.005 |
listen | +0.005 |
behave | +0.005 |
Neg logit contributions | |
There | -0.003 |
imet | -0.003 |
igsaw | -0.003 |
piping | -0.003 |
By | -0.003 |
Token | showed |
Token ID | 3751 |
Feature activation | -3.42e-02 |
Pos logit contributions | |
endant | +0.012 |
million | +0.012 |
camps | +0.012 |
dark | +0.011 |
Wouldn | +0.011 |
Neg logit contributions | |
sound | -0.014 |
inker | -0.012 |
ourselves | -0.011 |
ics | -0.011 |
ising | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | -4.56e-03 |
Pos logit contributions | |
endant | +0.005 |
piping | +0.005 |
umm | +0.005 |
million | +0.004 |
� | +0.004 |
Neg logit contributions | |
sound | -0.013 |
listen | -0.012 |
do | -0.012 |
communicate | -0.011 |
listened | -0.011 |
Token | But |
Token ID | 887 |
Feature activation | +5.48e-03 |
Pos logit contributions | |
ocol | +0.010 |
endant | +0.010 |
piping | +0.009 |
million | +0.009 |
camps | +0.009 |
Neg logit contributions | |
sound | -0.006 |
do | -0.005 |
her | -0.005 |
not | -0.004 |
listen | -0.004 |
Token | while |
Token ID | 981 |
Feature activation | +3.04e-02 |
Pos logit contributions | |
sound | +0.006 |
inker | +0.004 |
listen | +0.004 |
do | +0.004 |
communicate | +0.004 |
Neg logit contributions | |
endant | -0.012 |
piping | -0.011 |
million | -0.011 |
ocol | -0.011 |
imet | -0.011 |
Token | she |
Token ID | 673 |
Feature activation | +1.45e-02 |
Pos logit contributions | |
sound | +0.030 |
do | +0.020 |
listen | +0.019 |
not | +0.019 |
listened | +0.019 |
Neg logit contributions | |
endant | -0.073 |
piping | -0.072 |
ocol | -0.070 |
umm | -0.070 |
million | -0.069 |
Token | was |
Token ID | 373 |
Feature activation | +2.18e-02 |
Pos logit contributions | |
sound | +0.018 |
listen | +0.012 |
do | +0.012 |
not | +0.011 |
listened | +0.011 |
Neg logit contributions | |
piping | -0.030 |
endant | -0.030 |
million | -0.029 |
ocol | -0.029 |
dark | -0.028 |
Token | playing |
Token ID | 2712 |
Feature activation | +6.11e-02 |
Pos logit contributions | |
sound | +0.035 |
do | +0.027 |
inker | +0.026 |
listen | +0.026 |
communicate | +0.025 |
Neg logit contributions | |
piping | -0.037 |
endant | -0.036 |
million | -0.035 |
ocol | -0.035 |
freshly | -0.033 |
Token | , |
Token ID | 11 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
sound | +0.065 |
listened | +0.044 |
tails | +0.043 |
listen | +0.042 |
inker | +0.042 |
Neg logit contributions | |
piping | -0.131 |
ocol | -0.128 |
million | -0.127 |
endant | -0.127 |
imet | -0.122 |
Token | the |
Token ID | 262 |
Feature activation | +6.31e-03 |
Pos logit contributions | |
sound | +0.014 |
inker | +0.011 |
obey | +0.011 |
listen | +0.011 |
ably | +0.011 |
Neg logit contributions | |
piping | -0.021 |
million | -0.020 |
endant | -0.020 |
ocol | -0.019 |
freshly | -0.019 |
Token | necklace |
Token ID | 38987 |
Feature activation | -1.00e-02 |
Pos logit contributions | |
sound | +0.011 |
do | +0.008 |
listen | +0.008 |
listened | +0.008 |
not | +0.008 |
Neg logit contributions | |
piping | -0.011 |
endant | -0.010 |
ocol | -0.010 |
million | -0.010 |
imet | -0.010 |
Token | slipped |
Token ID | 18859 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
million | +0.017 |
endant | +0.017 |
dark | +0.015 |
piping | +0.015 |
imet | +0.015 |
Neg logit contributions | |
sound | -0.015 |
listen | -0.013 |
inker | -0.012 |
obey | -0.012 |
behave | -0.012 |
Token | off |
Token ID | 572 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
million | +0.037 |
piping | +0.035 |
imet | +0.034 |
endant | +0.034 |
camps | +0.034 |
Neg logit contributions | |
sound | -0.022 |
communicate | -0.017 |
obey | -0.017 |
listened | -0.017 |
listen | -0.017 |
Token | looked |
Token ID | 3114 |
Feature activation | -3.95e-02 |
Pos logit contributions | |
sound | +0.038 |
inker | +0.034 |
ics | +0.032 |
loudly | +0.031 |
ably | +0.030 |
Neg logit contributions | |
piping | -0.037 |
endant | -0.037 |
million | -0.036 |
pleasure | -0.036 |
freshly | -0.035 |
Token | both |
Token ID | 1111 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
piping | +0.070 |
endant | +0.070 |
million | +0.068 |
ocol | +0.068 |
camps | +0.065 |
Neg logit contributions | |
sound | -0.059 |
do | -0.045 |
listened | -0.044 |
listen | -0.043 |
inker | -0.042 |
Token | ways |
Token ID | 2842 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
pleasure | +0.021 |
piping | +0.021 |
endant | +0.021 |
million | +0.020 |
joy | +0.020 |
Neg logit contributions | |
sound | -0.018 |
inker | -0.015 |
behave | -0.015 |
do | -0.015 |
listen | -0.015 |
Token | before |
Token ID | 878 |
Feature activation | +4.09e-02 |
Pos logit contributions | |
sound | +0.024 |
inker | +0.019 |
do | +0.018 |
listened | +0.018 |
tails | +0.017 |
Neg logit contributions | |
endant | -0.029 |
imet | -0.028 |
piping | -0.028 |
million | -0.028 |
ocol | -0.028 |
Token | he |
Token ID | 339 |
Feature activation | +8.72e-05 |
Pos logit contributions | |
sound | +0.060 |
ably | +0.048 |
behave | +0.047 |
listen | +0.047 |
inker | +0.047 |
Neg logit contributions | |
million | -0.069 |
piping | -0.069 |
endant | -0.067 |
camps | -0.066 |
freshly | -0.066 |
Token | started |
Token ID | 2067 |
Feature activation | +2.65e-02 |
Pos logit contributions | |
sound | +0.000 |
ics | +0.000 |
inker | +0.000 |
listen | +0.000 |
not | +0.000 |
Neg logit contributions | |
endant | -0.000 |
piping | -0.000 |
dark | -0.000 |
ocol | -0.000 |
imet | -0.000 |
Token | to |
Token ID | 284 |
Feature activation | +9.83e-03 |
Pos logit contributions | |
sound | +0.040 |
ably | +0.033 |
inker | +0.032 |
do | +0.032 |
behave | +0.031 |
Neg logit contributions | |
million | -0.042 |
joy | -0.042 |
piping | -0.041 |
endant | -0.040 |
imet | -0.039 |
Token | scrape |
Token ID | 42778 |
Feature activation | +7.77e-03 |
Pos logit contributions | |
sound | +0.013 |
inker | +0.012 |
ably | +0.012 |
ena | +0.012 |
ards | +0.011 |
Neg logit contributions | |
impact | -0.016 |
million | -0.015 |
piping | -0.015 |
pleasure | -0.014 |
camps | -0.014 |
Token | along |
Token ID | 1863 |
Feature activation | +2.79e-02 |
Pos logit contributions | |
sound | +0.010 |
do | +0.008 |
listen | +0.008 |
listened | +0.008 |
ics | +0.008 |
Neg logit contributions | |
ocol | -0.015 |
million | -0.015 |
piping | -0.014 |
imet | -0.014 |
endant | -0.014 |
Token | the |
Token ID | 262 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
sound | +0.032 |
listened | +0.028 |
listen | +0.028 |
inker | +0.027 |
ics | +0.027 |
Neg logit contributions | |
million | -0.052 |
ocol | -0.051 |
brand | -0.050 |
camps | -0.049 |
piping | -0.049 |
Token | ocean |
Token ID | 9151 |
Feature activation | +2.81e-02 |
Pos logit contributions | |
sound | +0.023 |
do | +0.019 |
listen | +0.019 |
listened | +0.018 |
not | +0.018 |
Neg logit contributions | |
piping | -0.021 |
endant | -0.020 |
million | -0.019 |
ocol | -0.019 |
umm | -0.019 |
Token | knew |
Token ID | 2993 |
Feature activation | -2.00e-02 |
Pos logit contributions | |
sound | +0.020 |
inker | +0.016 |
listen | +0.015 |
do | +0.015 |
behave | +0.014 |
Neg logit contributions | |
endant | -0.025 |
piping | -0.024 |
million | -0.024 |
dark | -0.023 |
imet | -0.023 |
Token | that |
Token ID | 326 |
Feature activation | -2.14e-03 |
Pos logit contributions | |
endant | +0.038 |
piping | +0.037 |
million | +0.036 |
ocol | +0.036 |
pleasure | +0.036 |
Neg logit contributions | |
sound | -0.026 |
inker | -0.020 |
tails | -0.019 |
do | -0.018 |
listen | -0.018 |
Token | no |
Token ID | 645 |
Feature activation | +3.61e-03 |
Pos logit contributions | |
million | +0.004 |
piping | +0.004 |
endant | +0.004 |
ocol | +0.004 |
pleasure | +0.004 |
Neg logit contributions | |
sound | -0.003 |
inker | -0.002 |
tails | -0.002 |
do | -0.002 |
listen | -0.002 |
Token | matter |
Token ID | 2300 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
sound | +0.005 |
do | +0.004 |
listen | +0.004 |
listened | +0.004 |
not | +0.004 |
Neg logit contributions | |
piping | -0.007 |
endant | -0.007 |
ocol | -0.006 |
million | -0.006 |
umm | -0.006 |
Token | how |
Token ID | 703 |
Feature activation | +4.19e-02 |
Pos logit contributions | |
sound | +0.028 |
do | +0.021 |
listen | +0.020 |
listened | +0.020 |
not | +0.019 |
Neg logit contributions | |
piping | -0.037 |
endant | -0.037 |
ocol | -0.036 |
million | -0.036 |
umm | -0.034 |
Token | confused |
Token ID | 10416 |
Feature activation | +4.46e-02 |
Pos logit contributions | |
sound | +0.072 |
listen | +0.056 |
do | +0.056 |
listened | +0.054 |
behave | +0.054 |
Neg logit contributions | |
million | -0.068 |
endant | -0.066 |
piping | -0.065 |
ocol | -0.063 |
igsaw | -0.061 |
Token | he |
Token ID | 339 |
Feature activation | +3.56e-03 |
Pos logit contributions | |
sound | +0.061 |
inker | +0.057 |
tails | +0.051 |
ably | +0.049 |
ics | +0.049 |
Neg logit contributions | |
million | -0.077 |
piping | -0.074 |
ocol | -0.073 |
diamonds | -0.070 |
imet | -0.069 |
Token | might |
Token ID | 1244 |
Feature activation | +2.89e-02 |
Pos logit contributions | |
sound | +0.005 |
inker | +0.004 |
tails | +0.004 |
ics | +0.004 |
listen | +0.004 |
Neg logit contributions | |
endant | -0.006 |
dark | -0.006 |
piping | -0.006 |
million | -0.006 |
imet | -0.006 |
Token | be |
Token ID | 307 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
sound | +0.044 |
inker | +0.036 |
tails | +0.034 |
music | +0.033 |
loudly | +0.033 |
Neg logit contributions | |
endant | -0.047 |
million | -0.046 |
piping | -0.045 |
� | -0.045 |
pleasure | -0.044 |
Token | , |
Token ID | 11 |
Feature activation | +1.43e-02 |
Pos logit contributions | |
sound | +0.026 |
inker | +0.022 |
tails | +0.018 |
ably | +0.018 |
ani | +0.018 |
Neg logit contributions | |
million | -0.038 |
endant | -0.037 |
piping | -0.036 |
pleasure | -0.035 |
igsaw | -0.034 |
Token | sharing |
Token ID | 7373 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
sound | +0.020 |
inker | +0.017 |
tails | +0.016 |
ably | +0.016 |
ics | +0.015 |
Neg logit contributions | |
million | -0.025 |
piping | -0.024 |
pleasure | -0.024 |
endant | -0.024 |
ocol | -0.024 |
Token | old |
Token ID | 1468 |
Feature activation | -3.16e-02 |
Pos logit contributions | |
piping | +0.008 |
Wouldn | +0.008 |
million | +0.008 |
� | +0.008 |
Doesn | +0.008 |
Neg logit contributions | |
sound | -0.004 |
her | -0.002 |
do | -0.002 |
not | -0.002 |
loudly | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
endant | +0.067 |
piping | +0.067 |
million | +0.065 |
freshly | +0.063 |
umm | +0.062 |
Neg logit contributions | |
sound | -0.034 |
ics | -0.024 |
listen | -0.024 |
inker | -0.024 |
do | -0.023 |
Token | very |
Token ID | 845 |
Feature activation | +1.93e-02 |
Pos logit contributions | |
piping | +0.029 |
freshly | +0.029 |
brand | +0.027 |
million | +0.027 |
endant | +0.027 |
Neg logit contributions | |
sound | -0.026 |
inker | -0.024 |
ising | -0.024 |
ics | -0.022 |
communicate | -0.022 |
Token | smart |
Token ID | 4451 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
sound | +0.029 |
communicate | +0.022 |
inker | +0.022 |
ising | +0.022 |
listen | +0.021 |
Neg logit contributions | |
piping | -0.034 |
endant | -0.033 |
ocol | -0.032 |
million | -0.032 |
dark | -0.032 |
Token | . |
Token ID | 13 |
Feature activation | -3.06e-03 |
Pos logit contributions | |
sound | +0.020 |
communicate | +0.015 |
listen | +0.015 |
ics | +0.015 |
listened | +0.015 |
Neg logit contributions | |
million | -0.029 |
endant | -0.029 |
piping | -0.029 |
umm | -0.028 |
camps | -0.027 |
Token | One |
Token ID | 1881 |
Feature activation | +8.62e-03 |
Pos logit contributions | |
ocol | +0.006 |
endant | +0.006 |
piping | +0.006 |
umm | +0.006 |
million | +0.006 |
Neg logit contributions | |
sound | -0.004 |
do | -0.004 |
her | -0.004 |
not | -0.003 |
each | -0.003 |
Token | day |
Token ID | 1110 |
Feature activation | +1.26e-03 |
Pos logit contributions | |
sound | +0.015 |
inker | +0.013 |
tails | +0.013 |
ising | +0.013 |
communicate | +0.013 |
Neg logit contributions | |
piping | -0.012 |
dark | -0.012 |
endant | -0.011 |
million | -0.011 |
igsaw | -0.011 |
Token | she |
Token ID | 673 |
Feature activation | -5.36e-03 |
Pos logit contributions | |
sound | +0.002 |
listen | +0.001 |
behave | +0.001 |
do | +0.001 |
listened | +0.001 |
Neg logit contributions | |
piping | -0.003 |
million | -0.003 |
endant | -0.003 |
ocol | -0.003 |
imet | -0.003 |
Token | went |
Token ID | 1816 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
endant | +0.010 |
piping | +0.009 |
million | +0.009 |
dark | +0.009 |
camps | +0.009 |
Neg logit contributions | |
sound | -0.008 |
listen | -0.006 |
communicate | -0.006 |
tails | -0.006 |
inker | -0.006 |
Token | with |
Token ID | 351 |
Feature activation | -1.74e-02 |
Pos logit contributions | |
endant | +0.037 |
piping | +0.037 |
camps | +0.036 |
dark | +0.036 |
freshly | +0.035 |
Neg logit contributions | |
sound | -0.030 |
listened | -0.022 |
do | -0.022 |
inker | -0.022 |
communicate | -0.022 |
Token | her |
Token ID | 607 |
Feature activation | -2.79e-02 |
Pos logit contributions | |
piping | +0.048 |
endant | +0.047 |
million | +0.046 |
ocol | +0.046 |
umm | +0.045 |
Neg logit contributions | |
sound | -0.011 |
do | -0.004 |
listen | -0.004 |
listened | -0.004 |
not | -0.003 |
Token | icians |
Token ID | 5106 |
Feature activation | +4.11e-02 |
Pos logit contributions | |
ocol | +0.008 |
endant | +0.008 |
piping | +0.007 |
million | +0.007 |
pill | +0.007 |
Neg logit contributions | |
sound | -0.018 |
listen | -0.015 |
do | -0.015 |
say | -0.014 |
listened | -0.014 |
Token | do |
Token ID | 466 |
Feature activation | +3.69e-02 |
Pos logit contributions | |
sound | +0.061 |
inker | +0.052 |
obey | +0.048 |
ably | +0.047 |
Fine | +0.046 |
Neg logit contributions | |
endant | -0.061 |
oming | -0.060 |
berry | -0.059 |
piping | -0.059 |
ago | -0.059 |
Token | amazing |
Token ID | 4998 |
Feature activation | -1.31e-03 |
Pos logit contributions | |
sound | +0.052 |
bye | +0.050 |
w | +0.049 |
aunts | +0.047 |
obey | +0.046 |
Neg logit contributions | |
brand | -0.060 |
million | -0.052 |
freshly | -0.051 |
endant | -0.051 |
pill | -0.051 |
Token | tricks |
Token ID | 15910 |
Feature activation | +3.77e-02 |
Pos logit contributions | |
ocol | +0.002 |
brand | +0.002 |
million | +0.002 |
piping | +0.002 |
imet | +0.002 |
Neg logit contributions | |
sound | -0.002 |
behave | -0.002 |
listened | -0.002 |
ics | -0.002 |
not | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | -4.93e-03 |
Pos logit contributions | |
sound | +0.058 |
inker | +0.054 |
heads | +0.051 |
obey | +0.051 |
ignore | +0.050 |
Neg logit contributions | |
There | -0.050 |
brand | -0.050 |
million | -0.049 |
piping | -0.048 |
br | -0.048 |
Token | felt |
Token ID | 2936 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
piping | +0.008 |
million | +0.008 |
endant | +0.008 |
lettuce | +0.008 |
Would | +0.008 |
Neg logit contributions | |
sound | -0.006 |
oo | -0.006 |
ister | -0.006 |
ek | -0.006 |
inker | -0.006 |
Token | like |
Token ID | 588 |
Feature activation | +1.59e-02 |
Pos logit contributions | |
sound | +0.014 |
inker | +0.012 |
listened | +0.011 |
tails | +0.011 |
ably | +0.011 |
Neg logit contributions | |
piping | -0.020 |
pleasure | -0.020 |
brand | -0.019 |
ocol | -0.019 |
million | -0.019 |
Token | joining |
Token ID | 9679 |
Feature activation | +4.29e-02 |
Pos logit contributions | |
sound | +0.021 |
obey | +0.016 |
listen | +0.016 |
ising | +0.015 |
inker | +0.015 |
Neg logit contributions | |
piping | -0.030 |
endant | -0.029 |
million | -0.028 |
pleasure | -0.028 |
brand | -0.028 |
Token | in |
Token ID | 287 |
Feature activation | -1.75e-03 |
Pos logit contributions | |
sound | +0.063 |
obey | +0.052 |
behave | +0.052 |
listened | +0.052 |
listen | +0.051 |
Neg logit contributions | |
ocol | -0.070 |
piping | -0.060 |
joy | -0.060 |
diamonds | -0.060 |
igsaw | -0.059 |
Token | with |
Token ID | 351 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
piping | +0.003 |
million | +0.003 |
ocol | +0.003 |
freshly | +0.003 |
igsaw | +0.003 |
Neg logit contributions | |
sound | -0.002 |
listened | -0.002 |
ably | -0.002 |
listen | -0.001 |
ising | -0.001 |
Token | them |
Token ID | 606 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
piping | +0.023 |
ocol | +0.023 |
endant | +0.022 |
pleasure | +0.022 |
million | +0.021 |
Neg logit contributions | |
sound | -0.012 |
listened | -0.009 |
listen | -0.008 |
do | -0.008 |
behave | -0.008 |
Token | explore |
Token ID | 7301 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
sound | +0.005 |
ards | +0.004 |
inker | +0.004 |
tails | +0.004 |
ising | +0.004 |
Neg logit contributions | |
piping | -0.005 |
There | -0.005 |
tow | -0.005 |
pleasure | -0.005 |
million | -0.005 |
Token | further |
Token ID | 2252 |
Feature activation | +2.81e-02 |
Pos logit contributions | |
sound | +0.019 |
tails | +0.014 |
inker | +0.014 |
listened | +0.014 |
behave | +0.013 |
Neg logit contributions | |
piping | -0.032 |
endant | -0.032 |
ocol | -0.032 |
freshly | -0.031 |
million | -0.031 |
Token | , |
Token ID | 11 |
Feature activation | +1.51e-02 |
Pos logit contributions | |
sound | +0.039 |
behave | +0.033 |
listened | +0.033 |
inker | +0.032 |
communicate | +0.031 |
Neg logit contributions | |
million | -0.045 |
endant | -0.045 |
piping | -0.044 |
joy | -0.043 |
freshly | -0.043 |
Token | she |
Token ID | 673 |
Feature activation | -3.51e-03 |
Pos logit contributions | |
sound | +0.021 |
inker | +0.017 |
listened | +0.016 |
listen | +0.016 |
communicate | +0.016 |
Neg logit contributions | |
million | -0.026 |
joy | -0.025 |
freshly | -0.025 |
piping | -0.025 |
pleasure | -0.025 |
Token | heard |
Token ID | 2982 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
endant | +0.005 |
camps | +0.005 |
million | +0.005 |
piping | +0.005 |
imet | +0.005 |
Neg logit contributions | |
sound | -0.006 |
inker | -0.005 |
listen | -0.005 |
ards | -0.005 |
gging | -0.005 |
Token | an |
Token ID | 281 |
Feature activation | -6.02e-04 |
Pos logit contributions | |
sound | +0.017 |
behave | +0.016 |
ards | +0.015 |
gg | +0.015 |
inker | +0.015 |
Neg logit contributions | |
endant | -0.023 |
brand | -0.022 |
dark | -0.022 |
million | -0.022 |
piping | -0.022 |
Token | angry |
Token ID | 7954 |
Feature activation | +1.46e-02 |
Pos logit contributions | |
piping | +0.001 |
endant | +0.001 |
ocol | +0.001 |
million | +0.001 |
umm | +0.001 |
Neg logit contributions | |
sound | -0.001 |
listened | -0.001 |
listen | -0.001 |
do | -0.001 |
not | -0.001 |
Token | voice |
Token ID | 3809 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
ics | +0.017 |
listened | +0.016 |
sound | +0.015 |
behave | +0.015 |
obey | +0.015 |
Neg logit contributions | |
ocol | -0.025 |
umm | -0.025 |
piping | -0.024 |
endant | -0.024 |
igsaw | -0.024 |
Token | coming |
Token ID | 2406 |
Feature activation | -3.94e-03 |
Pos logit contributions | |
sound | +0.017 |
inker | +0.016 |
ics | +0.015 |
w | +0.015 |
behave | +0.015 |
Neg logit contributions | |
piping | -0.022 |
dark | -0.021 |
ocol | -0.021 |
endant | -0.021 |
million | -0.020 |
Token | from |
Token ID | 422 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
million | +0.006 |
camps | +0.006 |
ocol | +0.005 |
tow | +0.005 |
irst | +0.005 |
Neg logit contributions | |
listened | -0.005 |
sound | -0.005 |
behave | -0.005 |
ics | -0.005 |
gging | -0.005 |
Token | behind |
Token ID | 2157 |
Feature activation | -3.12e-02 |
Pos logit contributions | |
piping | +0.035 |
ocol | +0.035 |
endant | +0.034 |
freshly | +0.034 |
million | +0.034 |
Neg logit contributions | |
sound | -0.018 |
listened | -0.013 |
do | -0.012 |
listen | -0.012 |
behave | -0.011 |
Token | the |
Token ID | 262 |
Feature activation | +2.70e-03 |
Pos logit contributions | |
sound | +0.014 |
ics | +0.012 |
do | +0.011 |
listened | +0.011 |
inker | +0.010 |
Neg logit contributions | |
ocol | -0.026 |
piping | -0.026 |
million | -0.026 |
igsaw | -0.025 |
pleasure | -0.024 |
Token | box |
Token ID | 3091 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
sound | +0.005 |
do | +0.004 |
listen | +0.004 |
listened | +0.004 |
not | +0.004 |
Neg logit contributions | |
piping | -0.004 |
endant | -0.004 |
ocol | -0.004 |
million | -0.004 |
umm | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
endant | +0.055 |
million | +0.054 |
igsaw | +0.053 |
piping | +0.051 |
brand | +0.051 |
Neg logit contributions | |
sound | -0.043 |
listened | -0.035 |
do | -0.034 |
inker | -0.033 |
listen | -0.033 |
Token | so |
Token ID | 523 |
Feature activation | +2.95e-02 |
Pos logit contributions | |
million | +0.023 |
endant | +0.023 |
freshly | +0.023 |
piping | +0.023 |
brand | +0.022 |
Neg logit contributions | |
sound | -0.023 |
inker | -0.023 |
tails | -0.021 |
ics | -0.021 |
communicate | -0.020 |
Token | she |
Token ID | 673 |
Feature activation | -9.71e-03 |
Pos logit contributions | |
sound | +0.040 |
inker | +0.034 |
behave | +0.033 |
ising | +0.032 |
listen | +0.031 |
Neg logit contributions | |
million | -0.052 |
endant | -0.051 |
piping | -0.051 |
dark | -0.047 |
joy | -0.047 |
Token | went |
Token ID | 1816 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
endant | +0.019 |
piping | +0.018 |
million | +0.018 |
dark | +0.018 |
imet | +0.018 |
Neg logit contributions | |
sound | -0.012 |
do | -0.009 |
inker | -0.009 |
listen | -0.009 |
communicate | -0.008 |
Token | back |
Token ID | 736 |
Feature activation | -2.03e-02 |
Pos logit contributions | |
endant | +0.024 |
piping | +0.024 |
million | +0.023 |
ocol | +0.023 |
camps | +0.022 |
Neg logit contributions | |
sound | -0.022 |
do | -0.017 |
listened | -0.017 |
listen | -0.017 |
not | -0.016 |
Token | to |
Token ID | 284 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
piping | +0.042 |
endant | +0.042 |
million | +0.041 |
ocol | +0.041 |
imet | +0.039 |
Neg logit contributions | |
sound | -0.025 |
do | -0.018 |
listen | -0.017 |
listened | -0.017 |
not | -0.016 |
Token | the |
Token ID | 262 |
Feature activation | +1.67e-02 |
Pos logit contributions | |
sound | +0.018 |
ably | +0.014 |
ising | +0.013 |
listened | +0.013 |
ards | +0.013 |
Neg logit contributions | |
piping | -0.031 |
freshly | -0.030 |
endant | -0.030 |
ocol | -0.029 |
million | -0.029 |
Token | man |
Token ID | 582 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
sound | +0.028 |
listen | +0.022 |
do | +0.022 |
listened | +0.022 |
not | +0.021 |
Neg logit contributions | |
endant | -0.027 |
piping | -0.027 |
million | -0.026 |
ocol | -0.025 |
umm | -0.025 |
Token | and |
Token ID | 290 |
Feature activation | +4.33e-04 |
Pos logit contributions | |
sound | +0.014 |
do | +0.009 |
listen | +0.009 |
listened | +0.009 |
inker | +0.008 |
Neg logit contributions | |
endant | -0.026 |
piping | -0.026 |
million | -0.025 |
ocol | -0.025 |
dark | -0.025 |
Token | . |
Token ID | 13 |
Feature activation | +2.11e-02 |
Pos logit contributions | |
piping | +0.009 |
camps | +0.008 |
brand | +0.008 |
freshly | +0.008 |
endant | +0.008 |
Neg logit contributions | |
inker | -0.011 |
sound | -0.010 |
ani | -0.009 |
prove | -0.009 |
w | -0.009 |
Token | They |
Token ID | 1119 |
Feature activation | +3.02e-02 |
Pos logit contributions | |
sound | +0.025 |
not | +0.020 |
do | +0.019 |
each | +0.019 |
listen | +0.018 |
Neg logit contributions | |
ocol | -0.046 |
endant | -0.046 |
million | -0.045 |
igsaw | -0.044 |
umm | -0.044 |
Token | looked |
Token ID | 3114 |
Feature activation | -2.37e-02 |
Pos logit contributions | |
sound | +0.053 |
ising | +0.045 |
inker | +0.044 |
ourselves | +0.041 |
oo | +0.040 |
Neg logit contributions | |
endant | -0.042 |
million | -0.042 |
camps | -0.041 |
piping | -0.041 |
freshly | -0.039 |
Token | for |
Token ID | 329 |
Feature activation | +3.17e-02 |
Pos logit contributions | |
piping | +0.048 |
endant | +0.047 |
million | +0.046 |
ocol | +0.046 |
camps | +0.045 |
Neg logit contributions | |
sound | -0.030 |
do | -0.021 |
listened | -0.021 |
listen | -0.021 |
inker | -0.021 |
Token | their |
Token ID | 511 |
Feature activation | -5.19e-04 |
Pos logit contributions | |
sound | +0.042 |
listened | +0.031 |
do | +0.030 |
listen | +0.029 |
inker | +0.029 |
Neg logit contributions | |
piping | -0.062 |
ocol | -0.061 |
endant | -0.060 |
freshly | -0.057 |
million | -0.057 |
Token | gate |
Token ID | 8946 |
Feature activation | -2.22e-02 |
Pos logit contributions | |
endant | +0.001 |
piping | +0.001 |
pleasure | +0.001 |
camps | +0.001 |
imet | +0.001 |
Neg logit contributions | |
sound | -0.001 |
listened | -0.001 |
listen | -0.001 |
inker | -0.001 |
do | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
endant | +0.042 |
camps | +0.039 |
brand | +0.038 |
million | +0.037 |
piping | +0.037 |
Neg logit contributions | |
sound | -0.030 |
inker | -0.024 |
listen | -0.024 |
communicate | -0.023 |
do | -0.023 |
Token |
|
Token ID | 198 |
Feature activation | -8.56e-03 |
Pos logit contributions | |
sound | +0.019 |
do | +0.017 |
not | +0.017 |
each | +0.017 |
their | +0.015 |
Neg logit contributions | |
ocol | -0.041 |
endant | -0.040 |
igsaw | -0.039 |
million | -0.039 |
umm | -0.039 |
Token |
|
Token ID | 198 |
Feature activation | -7.49e-03 |
Pos logit contributions | |
umm | +0.019 |
ocol | +0.018 |
endant | +0.017 |
igsaw | +0.017 |
piping | +0.016 |
Neg logit contributions | |
sound | -0.012 |
not | -0.011 |
do | -0.011 |
each | -0.009 |
slowly | -0.009 |
Token | " |
Token ID | 1 |
Feature activation | +2.24e-02 |
Pos logit contributions | |
piping | +0.013 |
endant | +0.013 |
million | +0.013 |
ocol | +0.012 |
dark | +0.012 |
Neg logit contributions | |
sound | -0.012 |
do | -0.009 |
listen | -0.009 |
listened | -0.009 |
not | -0.008 |
Token | Look |
Token ID | 8567 |
Feature activation | -9.32e-02 |
Pos logit contributions | |
sound | +0.039 |
listened | +0.033 |
listen | +0.032 |
do | +0.032 |
behave | +0.029 |
Neg logit contributions | |
endant | -0.038 |
ocol | -0.036 |
igsaw | -0.035 |
piping | -0.034 |
umm | -0.033 |
Token | She |
Token ID | 1375 |
Feature activation | -2.09e-02 |
Pos logit contributions | |
endant | +0.013 |
piping | +0.013 |
ocol | +0.012 |
million | +0.012 |
umm | +0.011 |
Neg logit contributions | |
sound | -0.017 |
do | -0.014 |
listen | -0.014 |
listened | -0.014 |
not | -0.014 |
Token | stood |
Token ID | 6204 |
Feature activation | +3.34e-03 |
Pos logit contributions | |
piping | +0.039 |
endant | +0.039 |
dark | +0.038 |
million | +0.037 |
freshly | +0.037 |
Neg logit contributions | |
sound | -0.029 |
inker | -0.022 |
listen | -0.021 |
ising | -0.020 |
communicate | -0.020 |
Token | in |
Token ID | 287 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
sound | +0.004 |
listen | +0.003 |
do | +0.003 |
behave | +0.003 |
listened | +0.003 |
Neg logit contributions | |
endant | -0.007 |
piping | -0.007 |
ocol | -0.006 |
million | -0.006 |
camps | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
endant | +0.050 |
piping | +0.049 |
million | +0.048 |
ocol | +0.047 |
imet | +0.047 |
Neg logit contributions | |
sound | -0.015 |
do | -0.008 |
listen | -0.008 |
listened | -0.007 |
not | -0.007 |
Token | garden |
Token ID | 11376 |
Feature activation | +7.45e-04 |
Pos logit contributions | |
sound | +0.020 |
do | +0.016 |
listen | +0.015 |
listened | +0.015 |
her | +0.015 |
Neg logit contributions | |
endant | -0.015 |
ocol | -0.014 |
piping | -0.014 |
imet | -0.014 |
million | -0.013 |
Token | all |
Token ID | 477 |
Feature activation | -8.64e-03 |
Pos logit contributions | |
sound | +0.001 |
inker | +0.001 |
communicate | +0.001 |
tails | +0.001 |
ards | +0.001 |
Neg logit contributions | |
endant | -0.001 |
camps | -0.001 |
freshly | -0.001 |
piping | -0.001 |
joy | -0.001 |
Token | day |
Token ID | 1110 |
Feature activation | -1.03e-03 |
Pos logit contributions | |
piping | +0.015 |
endant | +0.015 |
dark | +0.014 |
million | +0.014 |
ocol | +0.014 |
Neg logit contributions | |
sound | -0.013 |
do | -0.010 |
inker | -0.010 |
listen | -0.010 |
communicate | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | -2.71e-03 |
Pos logit contributions | |
endant | +0.002 |
million | +0.002 |
piping | +0.002 |
� | +0.002 |
camps | +0.002 |
Neg logit contributions | |
sound | -0.002 |
communicate | -0.001 |
inker | -0.001 |
behave | -0.001 |
listen | -0.001 |
Token | soaking |
Token ID | 41714 |
Feature activation | +2.16e-02 |
Pos logit contributions | |
piping | +0.005 |
endant | +0.005 |
freshly | +0.005 |
million | +0.005 |
dark | +0.005 |
Neg logit contributions | |
sound | -0.004 |
inker | -0.003 |
tails | -0.003 |
communicate | -0.003 |
do | -0.003 |
Token | in |
Token ID | 287 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
sound | +0.025 |
communicate | +0.021 |
behave | +0.020 |
listen | +0.020 |
do | +0.020 |
Neg logit contributions | |
piping | -0.043 |
endant | -0.042 |
ocol | -0.042 |
million | -0.042 |
freshly | -0.041 |
Token | the |
Token ID | 262 |
Feature activation | +5.85e-03 |
Pos logit contributions | |
endant | +0.049 |
piping | +0.049 |
ocol | +0.047 |
million | +0.047 |
imet | +0.047 |
Neg logit contributions | |
sound | -0.015 |
do | -0.008 |
listen | -0.007 |
not | -0.007 |
listened | -0.007 |
Token | of |
Token ID | 286 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
million | +0.009 |
run | +0.008 |
dark | +0.007 |
ifying | +0.007 |
piping | +0.006 |
Neg logit contributions | |
behave | -0.025 |
sound | -0.024 |
listen | -0.024 |
ics | -0.023 |
listened | -0.023 |
Token | the |
Token ID | 262 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
piping | +0.030 |
endant | +0.030 |
ocol | +0.029 |
million | +0.029 |
umm | +0.028 |
Neg logit contributions | |
sound | -0.010 |
do | -0.006 |
listen | -0.006 |
listened | -0.006 |
not | -0.005 |
Token | dirt |
Token ID | 13647 |
Feature activation | -4.28e-03 |
Pos logit contributions | |
piping | +0.031 |
endant | +0.031 |
ocol | +0.030 |
million | +0.029 |
umm | +0.029 |
Neg logit contributions | |
sound | -0.027 |
do | -0.021 |
listen | -0.020 |
listened | -0.020 |
not | -0.019 |
Token | . |
Token ID | 13 |
Feature activation | -9.08e-03 |
Pos logit contributions | |
million | +0.008 |
endant | +0.008 |
umm | +0.007 |
camps | +0.007 |
lettuce | +0.007 |
Neg logit contributions | |
sound | -0.005 |
communicate | -0.005 |
listen | -0.005 |
obey | -0.005 |
inker | -0.005 |
Token | She |
Token ID | 1375 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
piping | +0.012 |
endant | +0.012 |
ocol | +0.011 |
million | +0.011 |
umm | +0.011 |
Neg logit contributions | |
sound | -0.019 |
do | -0.016 |
listen | -0.015 |
listened | -0.015 |
not | -0.015 |
Token | bent |
Token ID | 17157 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
endant | +0.033 |
piping | +0.033 |
million | +0.032 |
ocol | +0.031 |
dark | +0.031 |
Neg logit contributions | |
sound | -0.022 |
listen | -0.016 |
do | -0.016 |
behave | -0.015 |
listened | -0.015 |
Token | down |
Token ID | 866 |
Feature activation | -6.56e-03 |
Pos logit contributions | |
piping | +0.017 |
endant | +0.016 |
Wouldn | +0.015 |
imet | +0.015 |
joy | +0.015 |
Neg logit contributions | |
sound | -0.019 |
communicate | -0.016 |
behave | -0.016 |
ising | -0.016 |
do | -0.015 |
Token | and |
Token ID | 290 |
Feature activation | -4.50e-03 |
Pos logit contributions | |
imet | +0.012 |
� | +0.011 |
joy | +0.011 |
endant | +0.011 |
piping | +0.011 |
Neg logit contributions | |
sound | -0.009 |
tails | -0.007 |
communicate | -0.007 |
behave | -0.007 |
ics | -0.007 |
Token | carefully |
Token ID | 7773 |
Feature activation | +1.18e-03 |
Pos logit contributions | |
endant | +0.008 |
piping | +0.008 |
million | +0.007 |
imet | +0.007 |
dark | +0.007 |
Neg logit contributions | |
sound | -0.007 |
do | -0.005 |
inker | -0.005 |
communicate | -0.005 |
listen | -0.005 |
Token | poked |
Token ID | 47320 |
Feature activation | +7.52e-04 |
Pos logit contributions | |
sound | +0.002 |
do | +0.001 |
inker | +0.001 |
listen | +0.001 |
communicate | +0.001 |
Neg logit contributions | |
endant | -0.002 |
piping | -0.002 |
ocol | -0.002 |
imet | -0.002 |
dark | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
sound | +0.001 |
behave | +0.001 |
ics | +0.001 |
listened | +0.001 |
listen | +0.001 |
Neg logit contributions | |
piping | -0.001 |
endant | -0.001 |
ocol | -0.001 |
imet | -0.001 |
million | -0.001 |
Token | took |
Token ID | 1718 |
Feature activation | -5.55e-03 |
Pos logit contributions | |
sound | +0.068 |
inker | +0.051 |
listen | +0.050 |
do | +0.050 |
ising | +0.049 |
Neg logit contributions | |
piping | -0.076 |
million | -0.074 |
endant | -0.073 |
camps | -0.069 |
dark | -0.069 |
Token | the |
Token ID | 262 |
Feature activation | -6.02e-03 |
Pos logit contributions | |
endant | +0.013 |
piping | +0.013 |
ocol | +0.012 |
million | +0.012 |
umm | +0.012 |
Neg logit contributions | |
sound | -0.006 |
do | -0.004 |
listen | -0.004 |
listened | -0.003 |
not | -0.003 |
Token | cookies |
Token ID | 14746 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
piping | +0.009 |
endant | +0.008 |
million | +0.008 |
ocol | +0.008 |
umm | +0.008 |
Neg logit contributions | |
sound | -0.012 |
do | -0.010 |
listen | -0.009 |
listened | -0.009 |
not | -0.009 |
Token | out |
Token ID | 503 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
sound | +0.046 |
inker | +0.036 |
do | +0.035 |
communicate | +0.034 |
listened | +0.034 |
Neg logit contributions | |
piping | -0.063 |
endant | -0.063 |
million | -0.063 |
umbs | -0.062 |
imet | -0.062 |
Token | of |
Token ID | 286 |
Feature activation | -9.07e-03 |
Pos logit contributions | |
million | +0.019 |
piping | +0.019 |
endant | +0.017 |
dark | +0.017 |
ocol | +0.016 |
Neg logit contributions | |
sound | -0.032 |
do | -0.028 |
inker | -0.028 |
listen | -0.028 |
behave | -0.027 |
Token | the |
Token ID | 262 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
endant | +0.024 |
piping | +0.023 |
imet | +0.022 |
umm | +0.022 |
ocol | +0.022 |
Neg logit contributions | |
sound | -0.008 |
do | -0.004 |
not | -0.004 |
listen | -0.004 |
her | -0.004 |
Token | oven |
Token ID | 14361 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
endant | +0.018 |
ocol | +0.016 |
imet | +0.016 |
piping | +0.016 |
igsaw | +0.016 |
Neg logit contributions | |
sound | -0.025 |
do | -0.021 |
listen | -0.019 |
not | -0.019 |
sounds | -0.019 |
Token | and |
Token ID | 290 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
sound | +0.015 |
inker | +0.013 |
communicate | +0.013 |
listen | +0.012 |
behave | +0.012 |
Neg logit contributions | |
piping | -0.024 |
million | -0.024 |
endant | -0.024 |
umm | -0.024 |
imet | -0.023 |
Token | they |
Token ID | 484 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
piping | +0.021 |
endant | +0.021 |
million | +0.020 |
ocol | +0.019 |
dark | +0.019 |
Neg logit contributions | |
sound | -0.016 |
inker | -0.012 |
do | -0.012 |
listen | -0.012 |
communicate | -0.011 |
Token | were |
Token ID | 547 |
Feature activation | +9.01e-03 |
Pos logit contributions | |
sound | +0.028 |
inker | +0.023 |
ising | +0.022 |
listen | +0.021 |
do | +0.021 |
Neg logit contributions | |
piping | -0.031 |
million | -0.030 |
endant | -0.029 |
freshly | -0.028 |
camps | -0.028 |
Token | perfect |
Token ID | 2818 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
sound | +0.013 |
do | +0.010 |
listen | +0.010 |
inker | +0.010 |
listened | +0.009 |
Neg logit contributions | |
piping | -0.017 |
endant | -0.017 |
million | -0.016 |
ocol | -0.016 |
freshly | -0.016 |
Token | was |
Token ID | 373 |
Feature activation | -1.50e-02 |
Pos logit contributions | |
million | +0.059 |
endant | +0.057 |
dark | +0.057 |
piping | +0.057 |
brand | +0.057 |
Neg logit contributions | |
sound | -0.053 |
listen | -0.044 |
obey | -0.044 |
inker | -0.043 |
behave | -0.043 |
Token | the |
Token ID | 262 |
Feature activation | -2.54e-02 |
Pos logit contributions | |
endant | +0.028 |
piping | +0.028 |
million | +0.027 |
ocol | +0.026 |
freshly | +0.026 |
Neg logit contributions | |
sound | -0.020 |
listen | -0.016 |
inker | -0.015 |
do | -0.015 |
listened | -0.015 |
Token | most |
Token ID | 749 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
piping | +0.047 |
endant | +0.047 |
ocol | +0.046 |
million | +0.045 |
dark | +0.043 |
Neg logit contributions | |
sound | -0.039 |
do | -0.030 |
listen | -0.029 |
listened | -0.028 |
not | -0.028 |
Token | beautiful |
Token ID | 4950 |
Feature activation | -3.19e-02 |
Pos logit contributions | |
sound | +0.020 |
do | +0.015 |
not | +0.013 |
when | +0.013 |
listened | +0.013 |
Neg logit contributions | |
piping | -0.030 |
ocol | -0.029 |
endant | -0.028 |
million | -0.028 |
umbs | -0.028 |
Token | thing |
Token ID | 1517 |
Feature activation | +2.94e-03 |
Pos logit contributions | |
piping | +0.051 |
ocol | +0.050 |
endant | +0.049 |
imet | +0.048 |
umbs | +0.048 |
Neg logit contributions | |
sound | -0.064 |
do | -0.048 |
her | -0.046 |
listened | -0.045 |
listen | -0.045 |
Token | she |
Token ID | 673 |
Feature activation | -7.03e-02 |
Pos logit contributions | |
sound | +0.004 |
inker | +0.003 |
ising | +0.003 |
listen | +0.003 |
do | +0.003 |
Neg logit contributions | |
endant | -0.006 |
piping | -0.005 |
million | -0.005 |
dark | -0.005 |
imet | -0.005 |
Token | had |
Token ID | 550 |
Feature activation | -7.15e-02 |
Pos logit contributions | |
piping | +0.136 |
endant | +0.133 |
ocol | +0.131 |
million | +0.130 |
umm | +0.126 |
Neg logit contributions | |
sound | -0.101 |
do | -0.081 |
listened | -0.078 |
listen | -0.076 |
not | -0.074 |
Token | ever |
Token ID | 1683 |
Feature activation | -6.72e-02 |
Pos logit contributions | |
endant | +0.118 |
piping | +0.108 |
dark | +0.107 |
million | +0.104 |
ocol | +0.101 |
Neg logit contributions | |
sound | -0.117 |
tails | -0.088 |
listen | -0.088 |
loudly | -0.088 |
do | -0.087 |
Token | seen |
Token ID | 1775 |
Feature activation | -3.16e-02 |
Pos logit contributions | |
piping | +0.101 |
endant | +0.100 |
million | +0.095 |
ocol | +0.095 |
umm | +0.092 |
Neg logit contributions | |
sound | -0.123 |
do | -0.100 |
listen | -0.098 |
listened | -0.097 |
not | -0.094 |
Token | . |
Token ID | 13 |
Feature activation | -9.37e-04 |
Pos logit contributions | |
endant | +0.062 |
million | +0.061 |
piping | +0.061 |
ocol | +0.060 |
dark | +0.059 |
Neg logit contributions | |
sound | -0.038 |
listen | -0.029 |
do | -0.027 |
inker | -0.027 |
listened | -0.027 |
Token | But |
Token ID | 887 |
Feature activation | +8.46e-03 |
Pos logit contributions | |
ocol | +0.002 |
piping | +0.002 |
endant | +0.002 |
ifying | +0.002 |
ction | +0.002 |
Neg logit contributions | |
sound | -0.001 |
not | -0.001 |
when | -0.001 |
her | -0.001 |
do | -0.001 |
Token | He |
Token ID | 679 |
Feature activation | +5.82e-03 |
Pos logit contributions | |
sound | +0.006 |
do | +0.005 |
not | +0.005 |
listened | +0.004 |
listen | +0.004 |
Neg logit contributions | |
ocol | -0.007 |
piping | -0.007 |
endant | -0.007 |
million | -0.006 |
umm | -0.006 |
Token | said |
Token ID | 531 |
Feature activation | -2.54e-02 |
Pos logit contributions | |
sound | +0.009 |
inker | +0.008 |
ics | +0.007 |
ourselves | +0.007 |
ards | +0.007 |
Neg logit contributions | |
endant | -0.009 |
camps | -0.009 |
million | -0.009 |
imet | -0.008 |
brand | -0.008 |
Token | " |
Token ID | 366 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
piping | +0.042 |
imet | +0.042 |
million | +0.041 |
endant | +0.040 |
seventy | +0.040 |
Neg logit contributions | |
sound | -0.037 |
inker | -0.031 |
tails | -0.029 |
ards | -0.029 |
ising | -0.028 |
Token | Yes |
Token ID | 5297 |
Feature activation | -4.21e-02 |
Pos logit contributions | |
piping | +0.016 |
million | +0.016 |
umm | +0.015 |
endant | +0.015 |
dark | +0.015 |
Neg logit contributions | |
sound | -0.019 |
do | -0.016 |
not | -0.016 |
listen | -0.015 |
listened | -0.015 |
Token | , |
Token ID | 11 |
Feature activation | -3.03e-02 |
Pos logit contributions | |
piping | +0.077 |
million | +0.077 |
ocol | +0.076 |
pleasure | +0.075 |
imet | +0.075 |
Neg logit contributions | |
sound | -0.055 |
communicate | -0.043 |
inker | -0.043 |
tails | -0.043 |
listened | -0.042 |
Token | I |
Token ID | 314 |
Feature activation | -7.99e-02 |
Pos logit contributions | |
piping | +0.042 |
endant | +0.041 |
million | +0.039 |
ocol | +0.039 |
umm | +0.037 |
Neg logit contributions | |
sound | -0.058 |
do | -0.047 |
listened | -0.047 |
listen | -0.047 |
not | -0.045 |
Token | 'm |
Token ID | 1101 |
Feature activation | -5.02e-03 |
Pos logit contributions | |
endant | +0.122 |
dark | +0.116 |
pleasure | +0.115 |
piping | +0.114 |
Wouldn | +0.113 |
Neg logit contributions | |
sound | -0.130 |
ising | -0.102 |
inker | -0.100 |
ards | -0.100 |
ics | -0.100 |
Token | OK |
Token ID | 7477 |
Feature activation | -9.38e-03 |
Pos logit contributions | |
piping | +0.009 |
endant | +0.008 |
million | +0.008 |
ocol | +0.008 |
pleasure | +0.008 |
Neg logit contributions | |
sound | -0.008 |
do | -0.006 |
inker | -0.006 |
listened | -0.006 |
listen | -0.006 |
Token | ". |
Token ID | 1911 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
piping | +0.015 |
million | +0.015 |
endant | +0.014 |
pleasure | +0.014 |
Wouldn | +0.014 |
Neg logit contributions | |
sound | -0.015 |
listened | -0.011 |
do | -0.011 |
inker | -0.011 |
communicate | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | -5.50e-03 |
Pos logit contributions | |
sound | +0.029 |
do | +0.024 |
listen | +0.023 |
listened | +0.023 |
not | +0.023 |
Neg logit contributions | |
piping | -0.021 |
endant | -0.021 |
ocol | -0.020 |
million | -0.019 |
umm | -0.019 |
Token |
|
Token ID | 198 |
Feature activation | -5.69e-03 |
Pos logit contributions | |
ocol | +0.009 |
endant | +0.009 |
piping | +0.009 |
umm | +0.009 |
million | +0.008 |
Neg logit contributions | |
sound | -0.010 |
do | -0.008 |
not | -0.008 |
listened | -0.008 |
listen | -0.008 |
Token | elevator |
Token ID | 20932 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
endant | +0.020 |
piping | +0.019 |
million | +0.019 |
umm | +0.017 |
freshly | +0.017 |
Neg logit contributions | |
sound | -0.034 |
listen | -0.029 |
listened | -0.029 |
do | -0.029 |
behave | -0.029 |
Token | and |
Token ID | 290 |
Feature activation | -2.40e-02 |
Pos logit contributions | |
endant | +0.022 |
brand | +0.021 |
piping | +0.020 |
million | +0.020 |
imet | +0.019 |
Neg logit contributions | |
sound | -0.016 |
inker | -0.016 |
behave | -0.015 |
listened | -0.015 |
listen | -0.015 |
Token | said |
Token ID | 531 |
Feature activation | -2.15e-02 |
Pos logit contributions | |
million | +0.046 |
endant | +0.044 |
piping | +0.044 |
brand | +0.043 |
freshly | +0.042 |
Neg logit contributions | |
sound | -0.029 |
inker | -0.027 |
ics | -0.024 |
communicate | -0.023 |
do | -0.023 |
Token | , |
Token ID | 11 |
Feature activation | -4.57e-03 |
Pos logit contributions | |
piping | +0.038 |
endant | +0.038 |
imet | +0.036 |
ocol | +0.036 |
million | +0.036 |
Neg logit contributions | |
sound | -0.031 |
inker | -0.024 |
behave | -0.023 |
tails | -0.023 |
ising | -0.022 |
Token | " |
Token ID | 366 |
Feature activation | +4.45e-04 |
Pos logit contributions | |
piping | +0.006 |
endant | +0.005 |
million | +0.005 |
imet | +0.005 |
ocol | +0.005 |
Neg logit contributions | |
sound | -0.009 |
do | -0.008 |
inker | -0.008 |
listen | -0.008 |
tails | -0.007 |
Token | Look |
Token ID | 8567 |
Feature activation | -8.89e-02 |
Pos logit contributions | |
sound | +0.001 |
do | +0.001 |
listen | +0.001 |
listened | +0.001 |
not | +0.001 |
Neg logit contributions | |
piping | -0.001 |
endant | -0.001 |
million | -0.001 |
ocol | -0.001 |
umm | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
piping | +0.179 |
endant | +0.178 |
ocol | +0.171 |
million | +0.169 |
imet | +0.167 |
Neg logit contributions | |
sound | -0.118 |
do | -0.083 |
listened | -0.082 |
listen | -0.082 |
behave | -0.078 |
Token | Mom |
Token ID | 11254 |
Feature activation | -2.24e-02 |
Pos logit contributions | |
piping | +0.040 |
endant | +0.038 |
million | +0.038 |
ocol | +0.037 |
imet | +0.035 |
Neg logit contributions | |
sound | -0.044 |
do | -0.034 |
listened | -0.034 |
inker | -0.034 |
listen | -0.033 |
Token | my |
Token ID | 1820 |
Feature activation | -2.64e-02 |
Pos logit contributions | |
endant | +0.023 |
piping | +0.023 |
million | +0.022 |
berry | +0.020 |
dark | +0.019 |
Neg logit contributions | |
sound | -0.049 |
communicate | -0.043 |
inker | -0.042 |
listen | -0.041 |
loudly | -0.041 |
Token | ! |
Token ID | 0 |
Feature activation | -1.47e-02 |
Pos logit contributions | |
endant | +0.045 |
million | +0.042 |
piping | +0.042 |
imet | +0.041 |
pleasure | +0.041 |
Neg logit contributions | |
sound | -0.040 |
inker | -0.033 |
communicate | -0.032 |
ably | -0.030 |
ising | -0.028 |
Token | It |
Token ID | 632 |
Feature activation | -4.55e-02 |
Pos logit contributions | |
endant | +0.020 |
ocol | +0.019 |
piping | +0.019 |
million | +0.018 |
umm | +0.017 |
Neg logit contributions | |
sound | -0.028 |
do | -0.025 |
listen | -0.024 |
listened | -0.023 |
not | -0.023 |
Token | Bird |
Token ID | 14506 |
Feature activation | +2.92e-02 |
Pos logit contributions | |
piping | +0.001 |
endant | +0.001 |
ocol | +0.001 |
igsaw | +0.001 |
umm | +0.001 |
Neg logit contributions | |
sound | -0.001 |
do | -0.001 |
listened | -0.001 |
listen | -0.001 |
not | -0.001 |
Token | ie |
Token ID | 494 |
Feature activation | +1.81e-02 |
Pos logit contributions | |
sound | +0.045 |
do | +0.037 |
listen | +0.037 |
not | +0.035 |
behave | +0.035 |
Neg logit contributions | |
endant | -0.049 |
piping | -0.049 |
million | -0.049 |
dark | -0.046 |
ocol | -0.045 |
Token | said |
Token ID | 531 |
Feature activation | -1.79e-02 |
Pos logit contributions | |
sound | +0.024 |
inker | +0.023 |
ics | +0.020 |
communicate | +0.020 |
ourselves | +0.019 |
Neg logit contributions | |
endant | -0.030 |
million | -0.029 |
dark | -0.028 |
berry | -0.028 |
bead | -0.028 |
Token | , |
Token ID | 11 |
Feature activation | -9.06e-03 |
Pos logit contributions | |
piping | +0.033 |
million | +0.031 |
imet | +0.031 |
endant | +0.031 |
pleasure | +0.030 |
Neg logit contributions | |
sound | -0.023 |
inker | -0.022 |
tails | -0.019 |
ards | -0.018 |
ics | -0.018 |
Token | " |
Token ID | 366 |
Feature activation | +1.97e-03 |
Pos logit contributions | |
piping | +0.010 |
million | +0.010 |
endant | +0.010 |
imet | +0.010 |
freshly | +0.009 |
Neg logit contributions | |
sound | -0.019 |
inker | -0.016 |
do | -0.016 |
tails | -0.015 |
ising | -0.015 |
Token | I |
Token ID | 40 |
Feature activation | -6.91e-02 |
Pos logit contributions | |
sound | +0.004 |
do | +0.003 |
listen | +0.003 |
listened | +0.003 |
not | +0.003 |
Neg logit contributions | |
piping | -0.003 |
endant | -0.003 |
million | -0.003 |
umm | -0.003 |
dark | -0.003 |
Token | will |
Token ID | 481 |
Feature activation | +5.03e-03 |
Pos logit contributions | |
endant | +0.113 |
piping | +0.109 |
million | +0.105 |
pleasure | +0.103 |
ocol | +0.103 |
Neg logit contributions | |
sound | -0.115 |
inker | -0.087 |
ics | -0.084 |
ards | -0.084 |
music | -0.083 |
Token | help |
Token ID | 1037 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
sound | +0.007 |
inker | +0.007 |
ards | +0.006 |
ably | +0.006 |
ics | +0.006 |
Neg logit contributions | |
pleasure | -0.008 |
endant | -0.008 |
piping | -0.008 |
� | -0.008 |
freshly | -0.008 |
Token | you |
Token ID | 345 |
Feature activation | -4.16e-03 |
Pos logit contributions | |
sound | +0.036 |
inker | +0.034 |
listened | +0.032 |
ably | +0.031 |
ics | +0.031 |
Neg logit contributions | |
ocol | -0.040 |
million | -0.039 |
dark | -0.037 |
freshly | -0.037 |
lettuce | -0.037 |
Token | . |
Token ID | 13 |
Feature activation | -3.70e-03 |
Pos logit contributions | |
endant | +0.007 |
piping | +0.007 |
million | +0.007 |
dark | +0.007 |
pleasure | +0.007 |
Neg logit contributions | |
sound | -0.006 |
inker | -0.005 |
listened | -0.005 |
ards | -0.004 |
ably | -0.004 |
Token | I |
Token ID | 314 |
Feature activation | -6.65e-02 |
Pos logit contributions | |
endant | +0.007 |
piping | +0.006 |
million | +0.006 |
ocol | +0.006 |
camps | +0.006 |
Neg logit contributions | |
sound | -0.006 |
listen | -0.005 |
do | -0.005 |
not | -0.005 |
listened | -0.005 |
Token | L |
Token ID | 43 |
Feature activation | +4.94e-03 |
Pos logit contributions | |
endant | +0.036 |
piping | +0.035 |
umm | +0.035 |
ocol | +0.034 |
imet | +0.033 |
Neg logit contributions | |
sound | -0.031 |
do | -0.025 |
listen | -0.024 |
listened | -0.024 |
not | -0.024 |
Token | ily |
Token ID | 813 |
Feature activation | -2.56e-03 |
Pos logit contributions | |
sound | +0.008 |
do | +0.006 |
listened | +0.006 |
not | +0.006 |
listen | +0.006 |
Neg logit contributions | |
piping | -0.009 |
endant | -0.008 |
umm | -0.008 |
million | -0.008 |
pleasure | -0.008 |
Token | replied |
Token ID | 8712 |
Feature activation | -2.08e-02 |
Pos logit contributions | |
endant | +0.004 |
million | +0.004 |
piping | +0.004 |
� | +0.004 |
brand | +0.004 |
Neg logit contributions | |
sound | -0.004 |
inker | -0.003 |
ics | -0.003 |
communicate | -0.003 |
ourselves | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | -4.78e-03 |
Pos logit contributions | |
piping | +0.044 |
endant | +0.043 |
million | +0.042 |
ocol | +0.042 |
imet | +0.042 |
Neg logit contributions | |
sound | -0.024 |
inker | -0.016 |
do | -0.016 |
listen | -0.015 |
tails | -0.015 |
Token | " |
Token ID | 366 |
Feature activation | +3.19e-03 |
Pos logit contributions | |
piping | +0.006 |
endant | +0.006 |
million | +0.006 |
ocol | +0.006 |
imet | +0.006 |
Neg logit contributions | |
sound | -0.009 |
do | -0.008 |
inker | -0.007 |
listen | -0.007 |
listened | -0.007 |
Token | I |
Token ID | 40 |
Feature activation | -6.89e-02 |
Pos logit contributions | |
sound | +0.006 |
do | +0.005 |
listen | +0.005 |
listened | +0.005 |
not | +0.004 |
Neg logit contributions | |
piping | -0.005 |
endant | -0.005 |
ocol | -0.005 |
million | -0.005 |
umm | -0.004 |
Token | fell |
Token ID | 3214 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
endant | +0.115 |
piping | +0.115 |
million | +0.112 |
ocol | +0.107 |
dark | +0.107 |
Neg logit contributions | |
sound | -0.111 |
listen | -0.082 |
do | -0.082 |
listened | -0.081 |
inker | -0.080 |
Token | and |
Token ID | 290 |
Feature activation | +8.34e-04 |
Pos logit contributions | |
million | +0.040 |
piping | +0.037 |
endant | +0.036 |
imet | +0.035 |
dark | +0.035 |
Neg logit contributions | |
sound | -0.028 |
communicate | -0.025 |
listened | -0.024 |
do | -0.023 |
listen | -0.023 |
Token | my |
Token ID | 616 |
Feature activation | -8.31e-03 |
Pos logit contributions | |
sound | +0.001 |
inker | +0.001 |
do | +0.001 |
listen | +0.001 |
communicate | +0.001 |
Neg logit contributions | |
piping | -0.001 |
endant | -0.001 |
million | -0.001 |
dark | -0.001 |
ocol | -0.001 |
Token | leg |
Token ID | 1232 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
piping | +0.013 |
endant | +0.013 |
million | +0.013 |
ocol | +0.012 |
umm | +0.012 |
Neg logit contributions | |
sound | -0.014 |
do | -0.011 |
listen | -0.011 |
listened | -0.011 |
not | -0.011 |
Token | hurts |
Token ID | 20406 |
Feature activation | +3.19e-03 |
Pos logit contributions | |
sound | +0.016 |
inker | +0.015 |
communicate | +0.015 |
ani | +0.013 |
listen | +0.013 |
Neg logit contributions | |
million | -0.018 |
endant | -0.017 |
piping | -0.016 |
dark | -0.016 |
imet | -0.016 |