Token | sne |
Token ID | 10505 |
Feature activation | +6.29e-03 |
Pos logit contributions | |
groom | +0.002 |
scar | +0.002 |
burn | +0.002 |
pony | +0.002 |
salon | +0.002 |
Neg logit contributions | |
eway | -0.003 |
ining | -0.002 |
ered | -0.002 |
kered | -0.002 |
ooks | -0.002 |
Token | e |
Token ID | 68 |
Feature activation | +4.73e-04 |
Pos logit contributions | |
groom | +0.013 |
scar | +0.013 |
burn | +0.013 |
rob | +0.012 |
pony | +0.012 |
Neg logit contributions | |
eway | -0.009 |
ining | -0.007 |
ooks | -0.007 |
ered | -0.006 |
Turns | -0.006 |
Token | ze |
Token ID | 2736 |
Feature activation | +2.52e-02 |
Pos logit contributions | |
groom | +0.001 |
scar | +0.001 |
burn | +0.001 |
pony | +0.001 |
rob | +0.001 |
Neg logit contributions | |
eway | -0.001 |
ining | -0.001 |
ered | -0.000 |
kered | -0.000 |
earing | -0.000 |
Token | in |
Token ID | 287 |
Feature activation | -4.52e-03 |
Pos logit contributions | |
groom | +0.046 |
scar | +0.043 |
burn | +0.041 |
pony | +0.041 |
rob | +0.040 |
Neg logit contributions | |
eway | -0.042 |
ining | -0.037 |
ered | -0.035 |
kered | -0.035 |
rum | -0.034 |
Token | my |
Token ID | 616 |
Feature activation | +3.03e-03 |
Pos logit contributions | |
eway | +0.006 |
itself | +0.006 |
rum | +0.005 |
ining | +0.005 |
ered | +0.005 |
Neg logit contributions | |
groom | -0.009 |
rob | -0.008 |
pony | -0.008 |
burn | -0.008 |
scar | -0.008 |
Token | elbow |
Token ID | 22662 |
Feature activation | +6.12e-02 |
Pos logit contributions | |
groom | +0.005 |
burn | +0.005 |
rob | +0.004 |
scar | +0.004 |
ponies | +0.004 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.005 |
earing | -0.004 |
Turns | -0.004 |
aged | -0.004 |
Token | next |
Token ID | 1306 |
Feature activation | +1.80e-02 |
Pos logit contributions | |
groom | +0.119 |
scar | +0.114 |
pony | +0.109 |
avail | +0.105 |
rob | +0.105 |
Neg logit contributions | |
eway | -0.081 |
rum | -0.077 |
ining | -0.077 |
kered | -0.076 |
aged | -0.074 |
Token | time |
Token ID | 640 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
groom | +0.040 |
rob | +0.040 |
ponies | +0.036 |
burn | +0.035 |
pony | +0.035 |
Neg logit contributions | |
eway | -0.022 |
anny | -0.017 |
ining | -0.016 |
ered | -0.016 |
way | -0.015 |
Token | ." |
Token ID | 526 |
Feature activation | +5.62e-03 |
Pos logit contributions | |
groom | +0.050 |
rob | +0.049 |
scar | +0.048 |
pony | +0.045 |
burn | +0.045 |
Neg logit contributions | |
eway | -0.037 |
ining | -0.035 |
earing | -0.034 |
ooks | -0.033 |
rum | -0.032 |
Token | She |
Token ID | 1375 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
groom | +0.011 |
scar | +0.010 |
pony | +0.010 |
burn | +0.010 |
salon | +0.009 |
Neg logit contributions | |
eway | -0.010 |
ered | -0.008 |
ining | -0.008 |
kered | -0.008 |
rum | -0.007 |
Token | wiped |
Token ID | 21122 |
Feature activation | -6.18e-03 |
Pos logit contributions | |
groom | +0.022 |
burn | +0.021 |
ponies | +0.021 |
pony | +0.021 |
rob | +0.020 |
Neg logit contributions | |
eway | -0.019 |
kered | -0.018 |
ered | -0.018 |
ining | -0.018 |
aged | -0.017 |
Token | some |
Token ID | 617 |
Feature activation | -8.03e-04 |
Pos logit contributions | |
groom | +0.043 |
salon | +0.042 |
scar | +0.040 |
poet | +0.040 |
burn | +0.040 |
Neg logit contributions | |
eway | -0.026 |
itself | -0.024 |
Everyone | -0.024 |
ining | -0.024 |
ered | -0.024 |
Token | apples |
Token ID | 22514 |
Feature activation | +2.22e-02 |
Pos logit contributions | |
eway | +0.001 |
ered | +0.001 |
ining | +0.001 |
Everyone | +0.001 |
ooks | +0.001 |
Neg logit contributions | |
groom | -0.001 |
burn | -0.001 |
poet | -0.001 |
salon | -0.001 |
rob | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | +7.40e-03 |
Pos logit contributions | |
groom | +0.034 |
scar | +0.031 |
poet | +0.030 |
rob | +0.030 |
pony | +0.029 |
Neg logit contributions | |
eway | -0.040 |
ining | -0.037 |
ered | -0.036 |
itself | -0.036 |
earing | -0.036 |
Token | please |
Token ID | 3387 |
Feature activation | +8.09e-03 |
Pos logit contributions | |
groom | +0.012 |
rob | +0.012 |
burn | +0.011 |
poet | +0.010 |
salon | +0.010 |
Neg logit contributions | |
eway | -0.012 |
ered | -0.011 |
Suz | -0.010 |
ining | -0.010 |
Everyone | -0.010 |
Token | ?" |
Token ID | 1701 |
Feature activation | +3.68e-02 |
Pos logit contributions | |
groom | +0.010 |
rob | +0.010 |
burn | +0.010 |
scar | +0.009 |
pony | +0.009 |
Neg logit contributions | |
eway | -0.016 |
ered | -0.015 |
ining | -0.015 |
ooks | -0.015 |
earing | -0.015 |
Token | Anna |
Token ID | 11735 |
Feature activation | +5.98e-02 |
Pos logit contributions | |
burn | +0.068 |
rob | +0.064 |
groom | +0.062 |
scar | +0.061 |
salon | +0.055 |
Neg logit contributions | |
Everyone | -0.056 |
eway | -0.053 |
Turns | -0.052 |
Everything | -0.051 |
His | -0.051 |
Token | says |
Token ID | 1139 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
burn | +0.098 |
groom | +0.096 |
rob | +0.094 |
usual | +0.088 |
scar | +0.087 |
Neg logit contributions | |
From | -0.091 |
ining | -0.091 |
eway | -0.090 |
It | -0.087 |
Everyone | -0.086 |
Token | . |
Token ID | 13 |
Feature activation | +3.10e-02 |
Pos logit contributions | |
groom | +0.046 |
rob | +0.044 |
scar | +0.044 |
burn | +0.042 |
salon | +0.041 |
Neg logit contributions | |
eway | -0.038 |
kered | -0.034 |
ining | -0.034 |
ered | -0.033 |
earing | -0.033 |
Token |
|
Token ID | 198 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
groom | +0.083 |
scar | +0.082 |
rob | +0.080 |
burn | +0.080 |
salon | +0.079 |
Neg logit contributions | |
eway | -0.019 |
Everyone | -0.019 |
Everything | -0.017 |
In | -0.016 |
It | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | +8.28e-03 |
Pos logit contributions | |
groom | +0.048 |
burn | +0.046 |
scar | +0.045 |
salon | +0.044 |
rob | +0.044 |
Neg logit contributions | |
eway | -0.014 |
Everyone | -0.013 |
ining | -0.012 |
From | -0.011 |
ooks | -0.011 |
Token | Mr |
Token ID | 5246 |
Feature activation | +2.76e-02 |
Pos logit contributions | |
burn | +0.018 |
groom | +0.018 |
rob | +0.018 |
scar | +0.017 |
pony | +0.016 |
Neg logit contributions | |
eway | -0.008 |
ining | -0.008 |
kered | -0.007 |
ooks | -0.007 |
rum | -0.007 |
Token | " |
Token ID | 1 |
Feature activation | -3.15e-03 |
Pos logit contributions | |
eway | +0.015 |
ered | +0.013 |
ining | +0.012 |
kered | +0.012 |
rum | +0.011 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.014 |
burn | -0.013 |
salon | -0.013 |
rob | -0.012 |
Token | Are |
Token ID | 8491 |
Feature activation | +4.08e-03 |
Pos logit contributions | |
eway | +0.004 |
kered | +0.004 |
ining | +0.004 |
Everyone | +0.004 |
Turns | +0.004 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.006 |
pony | -0.006 |
burn | -0.006 |
ponies | -0.006 |
Token | you |
Token ID | 345 |
Feature activation | +8.23e-03 |
Pos logit contributions | |
groom | +0.008 |
burn | +0.007 |
scar | +0.007 |
pony | +0.007 |
rob | +0.007 |
Neg logit contributions | |
eway | -0.006 |
ining | -0.006 |
ered | -0.005 |
earing | -0.005 |
kered | -0.005 |
Token | OK |
Token ID | 7477 |
Feature activation | +7.33e-03 |
Pos logit contributions | |
groom | +0.019 |
salon | +0.019 |
pony | +0.019 |
rob | +0.019 |
ponies | +0.018 |
Neg logit contributions | |
ered | -0.007 |
ining | -0.006 |
eway | -0.006 |
aged | -0.006 |
earing | -0.006 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.31e-02 |
Pos logit contributions | |
groom | +0.011 |
rob | +0.010 |
scar | +0.010 |
pony | +0.009 |
ponies | +0.009 |
Neg logit contributions | |
eway | -0.014 |
ered | -0.013 |
ining | -0.013 |
Suz | -0.013 |
rum | -0.012 |
Token | Ben |
Token ID | 3932 |
Feature activation | +5.89e-02 |
Pos logit contributions | |
burn | +0.032 |
groom | +0.032 |
rob | +0.028 |
pony | +0.028 |
scar | +0.028 |
Neg logit contributions | |
eway | -0.045 |
Everyone | -0.043 |
Suz | -0.042 |
Everything | -0.042 |
ooks | -0.041 |
Token | asks |
Token ID | 7893 |
Feature activation | +8.83e-03 |
Pos logit contributions | |
burn | +0.094 |
rob | +0.086 |
groom | +0.085 |
usual | +0.083 |
salon | +0.077 |
Neg logit contributions | |
Everyone | -0.091 |
Everything | -0.090 |
ered | -0.089 |
ining | -0.089 |
It | -0.086 |
Token | . |
Token ID | 13 |
Feature activation | +2.96e-03 |
Pos logit contributions | |
groom | +0.016 |
scar | +0.015 |
burn | +0.015 |
pony | +0.014 |
rob | +0.014 |
Neg logit contributions | |
eway | -0.015 |
ered | -0.013 |
kered | -0.013 |
ooks | -0.013 |
ining | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | +1.95e-04 |
Pos logit contributions | |
groom | +0.006 |
scar | +0.006 |
burn | +0.006 |
pony | +0.006 |
salon | +0.005 |
Neg logit contributions | |
eway | -0.004 |
ining | -0.004 |
ered | -0.003 |
kered | -0.003 |
ooks | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -5.75e-03 |
Pos logit contributions | |
groom | +0.000 |
scar | +0.000 |
burn | +0.000 |
pony | +0.000 |
rob | +0.000 |
Neg logit contributions | |
eway | -0.000 |
ining | -0.000 |
ered | -0.000 |
kered | -0.000 |
earing | -0.000 |
Token | " |
Token ID | 1 |
Feature activation | -3.11e-03 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.008 |
ered | +0.008 |
kered | +0.008 |
earing | +0.008 |
Neg logit contributions | |
groom | -0.011 |
scar | -0.010 |
burn | -0.010 |
pony | -0.009 |
salon | -0.009 |
Token | still |
Token ID | 991 |
Feature activation | -3.96e-04 |
Pos logit contributions | |
groom | +0.001 |
scar | +0.001 |
burn | +0.001 |
pony | +0.001 |
salon | +0.001 |
Neg logit contributions | |
eway | -0.001 |
ining | -0.001 |
ered | -0.001 |
kered | -0.001 |
ooks | -0.001 |
Token | draw |
Token ID | 3197 |
Feature activation | +2.75e-02 |
Pos logit contributions | |
eway | +0.001 |
ining | +0.001 |
kered | +0.001 |
rum | +0.001 |
ooks | +0.001 |
Neg logit contributions | |
groom | -0.001 |
scar | -0.001 |
burn | -0.001 |
pony | -0.001 |
salon | -0.001 |
Token | our |
Token ID | 674 |
Feature activation | -8.71e-03 |
Pos logit contributions | |
groom | +0.053 |
burn | +0.050 |
pony | +0.047 |
salon | +0.047 |
scar | +0.047 |
Neg logit contributions | |
eway | -0.041 |
ining | -0.036 |
ered | -0.036 |
itself | -0.035 |
kered | -0.035 |
Token | clothes |
Token ID | 8242 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
eway | +0.017 |
ining | +0.015 |
ered | +0.014 |
kered | +0.014 |
rum | +0.014 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.013 |
pony | -0.012 |
burn | -0.012 |
ponies | -0.012 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.36e-02 |
Pos logit contributions | |
groom | +0.022 |
scar | +0.020 |
rob | +0.020 |
pony | +0.020 |
burn | +0.020 |
Neg logit contributions | |
eway | -0.016 |
ered | -0.015 |
ining | -0.015 |
earing | -0.014 |
itself | -0.014 |
Token | Anna |
Token ID | 11735 |
Feature activation | +5.85e-02 |
Pos logit contributions | |
burn | +0.041 |
rob | +0.039 |
groom | +0.037 |
scar | +0.037 |
pony | +0.033 |
Neg logit contributions | |
Everyone | -0.040 |
eway | -0.038 |
Everything | -0.037 |
Everybody | -0.036 |
From | -0.036 |
Token | asks |
Token ID | 7893 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
burn | +0.097 |
rob | +0.094 |
groom | +0.092 |
usual | +0.089 |
scar | +0.087 |
Neg logit contributions | |
From | -0.089 |
ining | -0.088 |
Everyone | -0.086 |
It | -0.084 |
Everything | -0.083 |
Token | . |
Token ID | 13 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
groom | +0.032 |
rob | +0.031 |
scar | +0.031 |
burn | +0.030 |
pony | +0.028 |
Neg logit contributions | |
eway | -0.020 |
itself | -0.018 |
kered | -0.018 |
ered | -0.018 |
ooks | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | +6.46e-03 |
Pos logit contributions | |
groom | +0.025 |
scar | +0.025 |
burn | +0.024 |
rob | +0.024 |
salon | +0.023 |
Neg logit contributions | |
eway | -0.012 |
ining | -0.009 |
Everyone | -0.009 |
ooks | -0.009 |
Turns | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -1.23e-03 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.014 |
burn | +0.013 |
pony | +0.013 |
salon | +0.013 |
Neg logit contributions | |
eway | -0.008 |
ining | -0.007 |
ooks | -0.007 |
ered | -0.007 |
kered | -0.006 |
Token | " |
Token ID | 1 |
Feature activation | +1.07e-03 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.001 |
kered | +0.001 |
ered | +0.001 |
ooks | +0.001 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.003 |
burn | -0.003 |
pony | -0.003 |
rob | -0.002 |
Token | read |
Token ID | 1100 |
Feature activation | +3.62e-02 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.007 |
rum | +0.007 |
kered | +0.007 |
ered | +0.007 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.007 |
pony | -0.006 |
burn | -0.006 |
salon | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | -6.19e-03 |
Pos logit contributions | |
groom | +0.064 |
burn | +0.060 |
scar | +0.057 |
pony | +0.056 |
salon | +0.056 |
Neg logit contributions | |
eway | -0.060 |
ining | -0.052 |
ered | -0.052 |
itself | -0.051 |
kered | -0.051 |
Token | book |
Token ID | 1492 |
Feature activation | +2.41e-02 |
Pos logit contributions | |
eway | +0.011 |
ining | +0.010 |
kered | +0.010 |
Turns | +0.009 |
earing | +0.009 |
Neg logit contributions | |
groom | -0.010 |
burn | -0.010 |
scar | -0.008 |
salon | -0.008 |
pony | -0.008 |
Token | together |
Token ID | 1978 |
Feature activation | +2.23e-02 |
Pos logit contributions | |
groom | +0.045 |
scar | +0.041 |
burn | +0.041 |
pony | +0.039 |
rob | +0.039 |
Neg logit contributions | |
eway | -0.040 |
ining | -0.035 |
ered | -0.033 |
earing | -0.033 |
kered | -0.033 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.64e-02 |
Pos logit contributions | |
groom | +0.036 |
burn | +0.033 |
scar | +0.033 |
rob | +0.033 |
pony | +0.032 |
Neg logit contributions | |
eway | -0.039 |
ining | -0.036 |
itself | -0.035 |
ered | -0.034 |
earing | -0.034 |
Token | Ben |
Token ID | 3932 |
Feature activation | +5.82e-02 |
Pos logit contributions | |
groom | +0.040 |
burn | +0.040 |
rob | +0.038 |
scar | +0.038 |
pony | +0.033 |
Neg logit contributions | |
Everyone | -0.048 |
From | -0.045 |
Everything | -0.044 |
Suz | -0.044 |
His | -0.044 |
Token | says |
Token ID | 1139 |
Feature activation | +1.14e-02 |
Pos logit contributions | |
burn | +0.105 |
groom | +0.101 |
usual | +0.098 |
salon | +0.095 |
rob | +0.094 |
Neg logit contributions | |
From | -0.082 |
ining | -0.079 |
Everyone | -0.079 |
Everything | -0.076 |
ered | -0.074 |
Token | . |
Token ID | 13 |
Feature activation | +6.57e-03 |
Pos logit contributions | |
groom | +0.019 |
scar | +0.018 |
burn | +0.018 |
pony | +0.017 |
rob | +0.017 |
Neg logit contributions | |
eway | -0.021 |
ining | -0.018 |
ered | -0.018 |
kered | -0.018 |
earing | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | -1.06e-03 |
Pos logit contributions | |
groom | +0.015 |
scar | +0.015 |
burn | +0.015 |
salon | +0.014 |
pony | +0.014 |
Neg logit contributions | |
eway | -0.008 |
ining | -0.006 |
ooks | -0.006 |
kered | -0.006 |
Turns | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -9.44e-03 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.001 |
ered | +0.001 |
kered | +0.001 |
earing | +0.001 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.002 |
burn | -0.002 |
pony | -0.002 |
salon | -0.002 |
Token | " |
Token ID | 1 |
Feature activation | -1.00e-02 |
Pos logit contributions | |
eway | +0.016 |
ining | +0.014 |
ered | +0.014 |
kered | +0.013 |
earing | +0.013 |
Neg logit contributions | |
groom | -0.017 |
scar | -0.016 |
burn | -0.016 |
pony | -0.015 |
salon | -0.015 |
Token | the |
Token ID | 262 |
Feature activation | +1.76e-03 |
Pos logit contributions | |
burn | +0.029 |
groom | +0.028 |
scar | +0.027 |
pony | +0.026 |
ponies | +0.026 |
Neg logit contributions | |
eway | -0.015 |
ining | -0.013 |
ered | -0.012 |
itself | -0.011 |
kered | -0.011 |
Token | music |
Token ID | 2647 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
burn | +0.003 |
scar | +0.003 |
please | +0.003 |
groom | +0.002 |
rob | +0.002 |
Neg logit contributions | |
eway | -0.003 |
ining | -0.003 |
kered | -0.002 |
Everyone | -0.002 |
taker | -0.002 |
Token | for |
Token ID | 329 |
Feature activation | -4.95e-03 |
Pos logit contributions | |
groom | +0.033 |
burn | +0.031 |
scar | +0.031 |
rob | +0.029 |
ponies | +0.028 |
Neg logit contributions | |
eway | -0.041 |
ining | -0.035 |
ered | -0.033 |
Everyone | -0.033 |
anny | -0.032 |
Token | me |
Token ID | 502 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
eway | +0.007 |
ered | +0.006 |
ining | +0.006 |
kered | +0.006 |
itself | +0.006 |
Neg logit contributions | |
groom | -0.010 |
burn | -0.010 |
pony | -0.009 |
rob | -0.009 |
scar | -0.009 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.85e-02 |
Pos logit contributions | |
groom | +0.033 |
rob | +0.030 |
burn | +0.029 |
scar | +0.028 |
pony | +0.028 |
Neg logit contributions | |
eway | -0.038 |
ining | -0.035 |
earing | -0.034 |
ered | -0.033 |
and | -0.033 |
Token | Anna |
Token ID | 11735 |
Feature activation | +5.82e-02 |
Pos logit contributions | |
burn | +0.046 |
groom | +0.046 |
rob | +0.044 |
scar | +0.041 |
please | +0.038 |
Neg logit contributions | |
eway | -0.049 |
Everyone | -0.048 |
Everything | -0.046 |
Turns | -0.045 |
From | -0.045 |
Token | says |
Token ID | 1139 |
Feature activation | +2.24e-02 |
Pos logit contributions | |
burn | +0.087 |
groom | +0.081 |
rob | +0.079 |
scar | +0.075 |
salon | +0.073 |
Neg logit contributions | |
ining | -0.102 |
eway | -0.100 |
Everyone | -0.097 |
From | -0.096 |
Everything | -0.096 |
Token | . |
Token ID | 13 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
groom | +0.044 |
rob | +0.041 |
scar | +0.041 |
burn | +0.040 |
pony | +0.039 |
Neg logit contributions | |
eway | -0.034 |
kered | -0.030 |
ered | -0.030 |
ining | -0.030 |
earing | -0.029 |
Token |
|
Token ID | 198 |
Feature activation | +7.69e-03 |
Pos logit contributions | |
groom | +0.040 |
scar | +0.039 |
burn | +0.038 |
rob | +0.038 |
salon | +0.036 |
Neg logit contributions | |
eway | -0.016 |
ining | -0.012 |
Everyone | -0.012 |
Everything | -0.012 |
Turns | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | +3.09e-04 |
Pos logit contributions | |
groom | +0.016 |
scar | +0.015 |
burn | +0.015 |
pony | +0.015 |
salon | +0.014 |
Neg logit contributions | |
eway | -0.011 |
ining | -0.009 |
ered | -0.009 |
kered | -0.008 |
ooks | -0.008 |
Token | " |
Token ID | 1 |
Feature activation | +3.18e-03 |
Pos logit contributions | |
groom | +0.001 |
scar | +0.001 |
burn | +0.000 |
pony | +0.000 |
salon | +0.000 |
Neg logit contributions | |
eway | -0.001 |
ining | -0.000 |
ered | -0.000 |
kered | -0.000 |
ooks | -0.000 |
Token | Can |
Token ID | 1680 |
Feature activation | +7.08e-03 |
Pos logit contributions | |
eway | +0.025 |
ered | +0.022 |
ining | +0.021 |
kered | +0.020 |
eways | +0.020 |
Neg logit contributions | |
groom | -0.022 |
scar | -0.021 |
pony | -0.021 |
burn | -0.020 |
Velvet | -0.020 |
Token | you |
Token ID | 345 |
Feature activation | +9.49e-04 |
Pos logit contributions | |
groom | +0.010 |
scar | +0.009 |
pony | +0.009 |
burn | +0.009 |
salon | +0.008 |
Neg logit contributions | |
eway | -0.015 |
ining | -0.014 |
kered | -0.013 |
ered | -0.013 |
ooks | -0.013 |
Token | help |
Token ID | 1037 |
Feature activation | -1.33e-03 |
Pos logit contributions | |
groom | +0.002 |
scar | +0.001 |
burn | +0.001 |
pony | +0.001 |
salon | +0.001 |
Neg logit contributions | |
eway | -0.002 |
ining | -0.002 |
kered | -0.001 |
ered | -0.001 |
ooks | -0.001 |
Token | us |
Token ID | 514 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
eway | +0.002 |
ered | +0.002 |
ining | +0.002 |
itself | +0.001 |
ooks | +0.001 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.003 |
burn | -0.003 |
rob | -0.003 |
pony | -0.003 |
Token | ?" |
Token ID | 1701 |
Feature activation | +3.55e-02 |
Pos logit contributions | |
eway | +0.034 |
ining | +0.031 |
ered | +0.030 |
kered | +0.030 |
ooks | +0.029 |
Neg logit contributions | |
groom | -0.019 |
scar | -0.018 |
burn | -0.017 |
pony | -0.017 |
salon | -0.016 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.81e-02 |
Pos logit contributions | |
groom | +0.067 |
burn | +0.064 |
rob | +0.061 |
scar | +0.060 |
pony | +0.056 |
Neg logit contributions | |
eway | -0.056 |
Everyone | -0.052 |
Suz | -0.049 |
Everything | -0.049 |
Turns | -0.049 |
Token | and |
Token ID | 290 |
Feature activation | +2.57e-02 |
Pos logit contributions | |
groom | +0.102 |
burn | +0.099 |
rob | +0.096 |
usual | +0.091 |
salon | +0.087 |
Neg logit contributions | |
From | -0.083 |
ining | -0.083 |
eway | -0.082 |
rum | -0.082 |
earing | -0.079 |
Token | Sam |
Token ID | 3409 |
Feature activation | +3.55e-02 |
Pos logit contributions | |
groom | +0.061 |
rob | +0.060 |
burn | +0.057 |
bride | +0.055 |
salon | +0.055 |
Neg logit contributions | |
eway | -0.025 |
Suz | -0.024 |
Maria | -0.021 |
Andy | -0.020 |
Jan | -0.020 |
Token | say |
Token ID | 910 |
Feature activation | +9.28e-03 |
Pos logit contributions | |
groom | +0.053 |
burn | +0.051 |
rob | +0.048 |
scar | +0.047 |
pony | +0.045 |
Neg logit contributions | |
eway | -0.068 |
ered | -0.064 |
ining | -0.061 |
earing | -0.060 |
kered | -0.059 |
Token | . |
Token ID | 13 |
Feature activation | +5.96e-03 |
Pos logit contributions | |
groom | +0.013 |
scar | +0.012 |
burn | +0.012 |
pony | +0.012 |
salon | +0.011 |
Neg logit contributions | |
eway | -0.019 |
ining | -0.017 |
ered | -0.017 |
ooks | -0.016 |
earing | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | +6.96e-03 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.013 |
burn | +0.013 |
pony | +0.012 |
salon | +0.012 |
Neg logit contributions | |
eway | -0.007 |
ining | -0.006 |
kered | -0.006 |
ooks | -0.006 |
Turns | -0.005 |
Token | Dad |
Token ID | 17415 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
groom | +0.028 |
burn | +0.027 |
scar | +0.027 |
rob | +0.027 |
pony | +0.026 |
Neg logit contributions | |
eway | -0.030 |
ining | -0.028 |
ered | -0.028 |
itself | -0.028 |
kered | -0.026 |
Token | 's |
Token ID | 338 |
Feature activation | -1.33e-02 |
Pos logit contributions | |
groom | +0.046 |
scar | +0.044 |
rob | +0.043 |
pony | +0.042 |
avail | +0.041 |
Neg logit contributions | |
ining | -0.038 |
ered | -0.038 |
earing | -0.036 |
eway | -0.035 |
and | -0.034 |
Token | birthday |
Token ID | 10955 |
Feature activation | +2.89e-02 |
Pos logit contributions | |
eway | +0.026 |
ining | +0.023 |
ered | +0.023 |
kered | +0.022 |
earing | +0.022 |
Neg logit contributions | |
groom | -0.020 |
scar | -0.019 |
burn | -0.019 |
pony | -0.018 |
rob | -0.018 |
Token | now |
Token ID | 783 |
Feature activation | +2.88e-02 |
Pos logit contributions | |
rob | +0.049 |
groom | +0.049 |
burn | +0.047 |
pony | +0.045 |
scar | +0.045 |
Neg logit contributions | |
eway | -0.037 |
ining | -0.037 |
and | -0.036 |
ered | -0.035 |
anny | -0.035 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.66e-02 |
Pos logit contributions | |
groom | +0.048 |
scar | +0.047 |
rob | +0.045 |
pony | +0.044 |
salon | +0.044 |
Neg logit contributions | |
ered | -0.044 |
ining | -0.044 |
eway | -0.041 |
earing | -0.041 |
itself | -0.040 |
Token | Mom |
Token ID | 11254 |
Feature activation | +5.81e-02 |
Pos logit contributions | |
groom | +0.052 |
burn | +0.050 |
scar | +0.050 |
rob | +0.049 |
pony | +0.046 |
Neg logit contributions | |
eway | -0.038 |
ooks | -0.033 |
ining | -0.033 |
Everyone | -0.033 |
ered | -0.032 |
Token | says |
Token ID | 1139 |
Feature activation | +5.82e-03 |
Pos logit contributions | |
groom | +0.072 |
burn | +0.064 |
scar | +0.064 |
pony | +0.060 |
rob | +0.059 |
Neg logit contributions | |
eway | -0.126 |
ining | -0.118 |
ered | -0.117 |
rum | -0.113 |
earing | -0.113 |
Token | . |
Token ID | 13 |
Feature activation | +1.73e-02 |
Pos logit contributions | |
groom | +0.008 |
scar | +0.008 |
burn | +0.008 |
pony | +0.008 |
salon | +0.007 |
Neg logit contributions | |
eway | -0.012 |
ining | -0.010 |
ered | -0.010 |
kered | -0.010 |
ooks | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +5.18e-03 |
Pos logit contributions | |
groom | +0.040 |
scar | +0.038 |
burn | +0.037 |
rob | +0.036 |
pony | +0.036 |
Neg logit contributions | |
eway | -0.020 |
ining | -0.017 |
ooks | -0.016 |
kered | -0.015 |
Turns | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | -1.96e-03 |
Pos logit contributions | |
groom | +0.011 |
scar | +0.011 |
burn | +0.010 |
pony | +0.010 |
salon | +0.010 |
Neg logit contributions | |
eway | -0.007 |
ining | -0.006 |
ered | -0.006 |
kered | -0.006 |
ooks | -0.006 |
Token | Anna |
Token ID | 31160 |
Feature activation | +3.67e-02 |
Pos logit contributions | |
eway | +0.004 |
ining | +0.004 |
ered | +0.004 |
kered | +0.004 |
earing | +0.003 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.003 |
burn | -0.003 |
pony | -0.002 |
salon | -0.002 |
Token | read |
Token ID | 1100 |
Feature activation | +4.17e-02 |
Pos logit contributions | |
groom | +0.007 |
scar | +0.007 |
burn | +0.006 |
pony | +0.006 |
rob | +0.006 |
Neg logit contributions | |
eway | -0.009 |
ining | -0.008 |
ered | -0.008 |
kered | -0.008 |
earing | -0.008 |
Token | it |
Token ID | 340 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
groom | +0.088 |
burn | +0.086 |
scar | +0.081 |
rob | +0.080 |
salon | +0.079 |
Neg logit contributions | |
eway | -0.055 |
ining | -0.046 |
itself | -0.046 |
ered | -0.046 |
Everyone | -0.042 |
Token | for |
Token ID | 329 |
Feature activation | +8.89e-04 |
Pos logit contributions | |
groom | +0.031 |
burn | +0.028 |
scar | +0.027 |
pony | +0.026 |
rob | +0.026 |
Neg logit contributions | |
eway | -0.033 |
ining | -0.028 |
ered | -0.027 |
itself | -0.026 |
earing | -0.026 |
Token | us |
Token ID | 514 |
Feature activation | +2.62e-03 |
Pos logit contributions | |
burn | +0.002 |
groom | +0.002 |
salon | +0.002 |
pony | +0.002 |
rob | +0.002 |
Neg logit contributions | |
eway | -0.001 |
ered | -0.001 |
itself | -0.001 |
ining | -0.001 |
Everyone | -0.001 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.45e-02 |
Pos logit contributions | |
groom | +0.003 |
rob | +0.003 |
burn | +0.003 |
scar | +0.003 |
pony | +0.003 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.005 |
ered | -0.005 |
earing | -0.005 |
ooks | -0.005 |
Token | Anna |
Token ID | 11735 |
Feature activation | +5.80e-02 |
Pos logit contributions | |
burn | +0.050 |
rob | +0.045 |
groom | +0.044 |
scar | +0.041 |
please | +0.039 |
Neg logit contributions | |
Everyone | -0.039 |
Everything | -0.034 |
From | -0.034 |
Everybody | -0.034 |
In | -0.034 |
Token | says |
Token ID | 1139 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
burn | +0.091 |
groom | +0.087 |
scar | +0.080 |
salon | +0.079 |
rob | +0.079 |
Neg logit contributions | |
ining | -0.098 |
eway | -0.098 |
From | -0.093 |
Everyone | -0.093 |
earing | -0.091 |
Token | . |
Token ID | 13 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
groom | +0.030 |
scar | +0.028 |
rob | +0.028 |
burn | +0.027 |
pony | +0.026 |
Neg logit contributions | |
eway | -0.025 |
kered | -0.023 |
ining | -0.022 |
ered | -0.022 |
earing | -0.022 |
Token | She |
Token ID | 1375 |
Feature activation | +3.69e-02 |
Pos logit contributions | |
groom | +0.048 |
scar | +0.047 |
burn | +0.047 |
rob | +0.046 |
salon | +0.045 |
Neg logit contributions | |
eway | -0.015 |
Everyone | -0.013 |
Everything | -0.012 |
ining | -0.012 |
Turns | -0.012 |
Token | offers |
Token ID | 4394 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
burn | +0.067 |
groom | +0.063 |
scar | +0.058 |
please | +0.058 |
rob | +0.058 |
Neg logit contributions | |
ining | -0.054 |
eway | -0.054 |
ered | -0.052 |
From | -0.051 |
Everything | -0.050 |
Token | the |
Token ID | 262 |
Feature activation | +7.48e-03 |
Pos logit contributions | |
rob | +0.036 |
groom | +0.036 |
burn | +0.036 |
scar | +0.035 |
salon | +0.033 |
Neg logit contributions | |
eway | -0.025 |
itself | -0.022 |
ered | -0.022 |
kered | -0.021 |
ining | -0.021 |
Token | fly |
Token ID | 6129 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
ered | +0.005 |
eway | +0.005 |
kered | +0.005 |
ining | +0.005 |
Everyone | +0.005 |
Neg logit contributions | |
rob | -0.007 |
groom | -0.007 |
ponies | -0.006 |
scar | -0.006 |
pony | -0.006 |
Token | your |
Token ID | 534 |
Feature activation | +9.67e-03 |
Pos logit contributions | |
groom | +0.037 |
rob | +0.032 |
burn | +0.032 |
ponies | +0.031 |
syrup | +0.031 |
Neg logit contributions | |
eway | -0.042 |
ining | -0.036 |
itself | -0.036 |
ered | -0.036 |
Suz | -0.033 |
Token | k |
Token ID | 479 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
rob | +0.016 |
poet | +0.014 |
groom | +0.014 |
please | +0.014 |
Nikki | +0.013 |
Neg logit contributions | |
eway | -0.014 |
ining | -0.014 |
aged | -0.014 |
itself | -0.013 |
Tears | -0.013 |
Token | ites |
Token ID | 2737 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
groom | +0.023 |
scar | +0.022 |
prince | +0.021 |
poet | +0.021 |
syrup | +0.020 |
Neg logit contributions | |
eway | -0.019 |
ining | -0.017 |
aged | -0.017 |
ooks | -0.016 |
kered | -0.016 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.54e-02 |
Pos logit contributions | |
groom | +0.024 |
syrup | +0.022 |
rob | +0.022 |
scar | +0.022 |
strawberries | +0.021 |
Neg logit contributions | |
eway | -0.030 |
ining | -0.028 |
ered | -0.027 |
itself | -0.026 |
earing | -0.025 |
Token | Mom |
Token ID | 11254 |
Feature activation | +5.78e-02 |
Pos logit contributions | |
rob | +0.052 |
burn | +0.049 |
scar | +0.046 |
groom | +0.045 |
salon | +0.044 |
Neg logit contributions | |
Everyone | -0.033 |
Suz | -0.031 |
eway | -0.030 |
ooks | -0.030 |
Turns | -0.030 |
Token | asks |
Token ID | 7893 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
groom | +0.070 |
burn | +0.067 |
scar | +0.061 |
rob | +0.060 |
salon | +0.057 |
Neg logit contributions | |
eway | -0.118 |
ining | -0.114 |
ered | -0.112 |
Everything | -0.109 |
Turns | -0.108 |
Token | . |
Token ID | 13 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
groom | +0.024 |
scar | +0.024 |
rob | +0.023 |
burn | +0.023 |
pony | +0.022 |
Neg logit contributions | |
eway | -0.018 |
ered | -0.016 |
ooks | -0.016 |
kered | -0.016 |
itself | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
groom | +0.041 |
scar | +0.040 |
burn | +0.039 |
rob | +0.039 |
salon | +0.037 |
Neg logit contributions | |
eway | -0.017 |
ining | -0.014 |
Turns | -0.013 |
ooks | -0.013 |
Everyone | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | +4.60e-03 |
Pos logit contributions | |
groom | +0.027 |
scar | +0.025 |
burn | +0.025 |
pony | +0.024 |
rob | +0.024 |
Neg logit contributions | |
eway | -0.015 |
ining | -0.012 |
ooks | -0.012 |
kered | -0.011 |
ered | -0.011 |
Token | " |
Token ID | 1 |
Feature activation | +3.67e-04 |
Pos logit contributions | |
groom | +0.011 |
scar | +0.010 |
burn | +0.010 |
rob | +0.010 |
pony | +0.010 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.004 |
ooks | -0.004 |
kered | -0.004 |
earing | -0.004 |
Token | we |
Token ID | 356 |
Feature activation | -2.54e-04 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.013 |
burn | +0.013 |
pony | +0.012 |
salon | +0.012 |
Neg logit contributions | |
eway | -0.016 |
ining | -0.014 |
ered | -0.014 |
kered | -0.014 |
ooks | -0.014 |
Token | be |
Token ID | 307 |
Feature activation | -9.32e-03 |
Pos logit contributions | |
eway | +0.001 |
ining | +0.000 |
kered | +0.000 |
ered | +0.000 |
ooks | +0.000 |
Neg logit contributions | |
groom | -0.000 |
scar | -0.000 |
burn | -0.000 |
pony | -0.000 |
salon | -0.000 |
Token | friends |
Token ID | 2460 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
eway | +0.016 |
ining | +0.014 |
ered | +0.014 |
kered | +0.013 |
earing | +0.013 |
Neg logit contributions | |
groom | -0.017 |
scar | -0.016 |
burn | -0.015 |
pony | -0.015 |
ponies | -0.014 |
Token | again |
Token ID | 757 |
Feature activation | +2.21e-02 |
Pos logit contributions | |
groom | +0.029 |
burn | +0.027 |
scar | +0.027 |
rob | +0.027 |
syrup | +0.026 |
Neg logit contributions | |
ining | -0.027 |
eway | -0.027 |
ered | -0.025 |
kered | -0.025 |
lived | -0.024 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.23e-02 |
Pos logit contributions | |
rob | +0.038 |
groom | +0.037 |
salon | +0.036 |
burn | +0.035 |
pony | +0.034 |
Neg logit contributions | |
ooks | -0.032 |
ining | -0.031 |
eway | -0.030 |
itself | -0.029 |
ered | -0.029 |
Token | Anna |
Token ID | 11735 |
Feature activation | +5.77e-02 |
Pos logit contributions | |
burn | +0.041 |
rob | +0.041 |
groom | +0.038 |
scar | +0.037 |
pony | +0.034 |
Neg logit contributions | |
Everyone | -0.034 |
His | -0.033 |
eway | -0.031 |
Turns | -0.031 |
From | -0.031 |
Token | says |
Token ID | 1139 |
Feature activation | +1.68e-02 |
Pos logit contributions | |
burn | +0.099 |
groom | +0.098 |
rob | +0.094 |
usual | +0.093 |
scar | +0.088 |
Neg logit contributions | |
From | -0.084 |
ining | -0.081 |
Everyone | -0.081 |
Everything | -0.079 |
It | -0.079 |
Token | . |
Token ID | 13 |
Feature activation | +1.67e-02 |
Pos logit contributions | |
groom | +0.030 |
scar | +0.028 |
rob | +0.026 |
burn | +0.026 |
pony | +0.026 |
Neg logit contributions | |
eway | -0.029 |
ining | -0.026 |
kered | -0.025 |
ered | -0.025 |
earing | -0.025 |
Token |
|
Token ID | 198 |
Feature activation | +6.17e-03 |
Pos logit contributions | |
groom | +0.043 |
scar | +0.042 |
burn | +0.041 |
rob | +0.041 |
salon | +0.040 |
Neg logit contributions | |
eway | -0.013 |
Everyone | -0.011 |
Everything | -0.011 |
ining | -0.010 |
Turns | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | -3.52e-03 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.013 |
burn | +0.013 |
pony | +0.013 |
salon | +0.012 |
Neg logit contributions | |
eway | -0.008 |
ining | -0.007 |
ooks | -0.006 |
kered | -0.006 |
ered | -0.006 |
Token | Anna |
Token ID | 31160 |
Feature activation | +4.02e-02 |
Pos logit contributions | |
eway | +0.007 |
ining | +0.006 |
kered | +0.006 |
ered | +0.006 |
earing | +0.006 |
Neg logit contributions | |
groom | -0.005 |
scar | -0.005 |
burn | -0.005 |
pony | -0.005 |
rob | -0.004 |
Token | Can |
Token ID | 1680 |
Feature activation | +1.96e-02 |
Pos logit contributions | |
groom | +0.036 |
scar | +0.034 |
pony | +0.033 |
burn | +0.033 |
salon | +0.032 |
Neg logit contributions | |
eway | -0.029 |
ining | -0.024 |
ered | -0.024 |
kered | -0.023 |
earing | -0.023 |
Token | she |
Token ID | 673 |
Feature activation | +2.09e-02 |
Pos logit contributions | |
groom | +0.032 |
scar | +0.030 |
burn | +0.029 |
pony | +0.028 |
rob | +0.027 |
Neg logit contributions | |
eway | -0.036 |
ining | -0.032 |
ered | -0.031 |
kered | -0.031 |
earing | -0.030 |
Token | wear |
Token ID | 5806 |
Feature activation | +1.95e-02 |
Pos logit contributions | |
rob | +0.037 |
groom | +0.035 |
burn | +0.035 |
scar | +0.035 |
ponies | +0.034 |
Neg logit contributions | |
eway | -0.030 |
ered | -0.030 |
ining | -0.029 |
Everyone | -0.027 |
kered | -0.027 |
Token | jeans |
Token ID | 21029 |
Feature activation | +5.19e-02 |
Pos logit contributions | |
groom | +0.036 |
burn | +0.033 |
scar | +0.032 |
salon | +0.032 |
pony | +0.031 |
Neg logit contributions | |
eway | -0.031 |
ining | -0.027 |
ered | -0.027 |
kered | -0.026 |
earing | -0.025 |
Token | and |
Token ID | 290 |
Feature activation | +7.69e-03 |
Pos logit contributions | |
groom | +0.085 |
rob | +0.078 |
scar | +0.077 |
burn | +0.075 |
strawberries | +0.074 |
Neg logit contributions | |
eway | -0.081 |
ining | -0.076 |
ered | -0.074 |
earing | -0.073 |
Everyone | -0.073 |
Token | sneakers |
Token ID | 42649 |
Feature activation | +5.76e-02 |
Pos logit contributions | |
rob | +0.009 |
groom | +0.009 |
burn | +0.009 |
salon | +0.008 |
poet | +0.008 |
Neg logit contributions | |
eway | -0.015 |
ered | -0.014 |
kered | -0.014 |
Everyone | -0.013 |
ining | -0.013 |
Token | ?" |
Token ID | 1701 |
Feature activation | +3.52e-02 |
Pos logit contributions | |
groom | +0.096 |
burn | +0.086 |
scar | +0.084 |
ponies | +0.083 |
rob | +0.083 |
Neg logit contributions | |
eway | -0.095 |
ining | -0.089 |
ered | -0.086 |
earing | -0.085 |
Everyone | -0.084 |
Token | Lily |
Token ID | 20037 |
Feature activation | +2.92e-02 |
Pos logit contributions | |
groom | +0.072 |
burn | +0.071 |
scar | +0.070 |
rob | +0.069 |
butter | +0.064 |
Neg logit contributions | |
eway | -0.043 |
Everyone | -0.042 |
Suz | -0.041 |
Turns | -0.039 |
Everything | -0.039 |
Token | said |
Token ID | 531 |
Feature activation | +2.34e-02 |
Pos logit contributions | |
burn | +0.049 |
groom | +0.048 |
rob | +0.047 |
scar | +0.047 |
pony | +0.044 |
Neg logit contributions | |
ining | -0.046 |
eway | -0.043 |
earing | -0.043 |
ered | -0.042 |
From | -0.040 |
Token | . |
Token ID | 13 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
groom | +0.043 |
scar | +0.042 |
rob | +0.041 |
burn | +0.039 |
pony | +0.038 |
Neg logit contributions | |
eway | -0.037 |
ining | -0.033 |
ered | -0.033 |
kered | -0.032 |
earing | -0.032 |
Token |
|
Token ID | 198 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
groom | +0.048 |
scar | +0.046 |
burn | +0.045 |
rob | +0.045 |
pony | +0.044 |
Neg logit contributions | |
eway | -0.021 |
ining | -0.017 |
Everyone | -0.017 |
Turns | -0.016 |
ooks | -0.016 |
Token | art |
Token ID | 1242 |
Feature activation | -6.29e-03 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.009 |
ered | +0.008 |
kered | +0.008 |
ooks | +0.008 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.008 |
burn | -0.008 |
pony | -0.008 |
rob | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | -3.22e-04 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.009 |
ered | +0.008 |
kered | +0.008 |
ooks | +0.008 |
Neg logit contributions | |
groom | -0.012 |
scar | -0.011 |
burn | -0.011 |
pony | -0.011 |
salon | -0.010 |
Token | Can |
Token ID | 1680 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
eway | +0.000 |
ered | +0.000 |
ining | +0.000 |
kered | +0.000 |
rum | +0.000 |
Neg logit contributions | |
groom | -0.001 |
scar | -0.001 |
pony | -0.001 |
burn | -0.001 |
ponies | -0.001 |
Token | we |
Token ID | 356 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
groom | +0.026 |
scar | +0.024 |
burn | +0.023 |
pony | +0.023 |
rob | +0.022 |
Neg logit contributions | |
eway | -0.035 |
ining | -0.031 |
ered | -0.030 |
kered | -0.030 |
ooks | -0.030 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.39e-02 |
Pos logit contributions | |
groom | +0.015 |
scar | +0.013 |
burn | +0.013 |
pony | +0.013 |
salon | +0.012 |
Neg logit contributions | |
eway | -0.022 |
ining | -0.019 |
kered | -0.018 |
rum | -0.018 |
ered | -0.018 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.74e-02 |
Pos logit contributions | |
groom | +0.045 |
burn | +0.044 |
scar | +0.041 |
rob | +0.041 |
pony | +0.039 |
Neg logit contributions | |
eway | -0.037 |
Everyone | -0.034 |
Suz | -0.033 |
Everything | -0.032 |
Turns | -0.031 |
Token | and |
Token ID | 290 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
burn | +0.094 |
groom | +0.093 |
rob | +0.082 |
salon | +0.081 |
scar | +0.081 |
Neg logit contributions | |
ining | -0.093 |
eway | -0.092 |
From | -0.089 |
earing | -0.086 |
Everyone | -0.085 |
Token | Sam |
Token ID | 3409 |
Feature activation | +3.35e-02 |
Pos logit contributions | |
groom | +0.039 |
burn | +0.038 |
rob | +0.036 |
salon | +0.036 |
scar | +0.035 |
Neg logit contributions | |
eway | -0.020 |
Suz | -0.018 |
ered | -0.016 |
Everyone | -0.016 |
ining | -0.016 |
Token | ask |
Token ID | 1265 |
Feature activation | +2.60e-03 |
Pos logit contributions | |
burn | +0.050 |
groom | +0.050 |
rob | +0.046 |
scar | +0.046 |
pony | +0.043 |
Neg logit contributions | |
eway | -0.061 |
ered | -0.058 |
ining | -0.056 |
Everyone | -0.054 |
earing | -0.054 |
Token | . |
Token ID | 13 |
Feature activation | +6.44e-03 |
Pos logit contributions | |
groom | +0.004 |
scar | +0.004 |
burn | +0.004 |
pony | +0.004 |
salon | +0.004 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.004 |
ered | -0.004 |
kered | -0.004 |
ooks | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +4.54e-03 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.014 |
burn | +0.013 |
pony | +0.013 |
salon | +0.013 |
Neg logit contributions | |
eway | -0.008 |
ining | -0.007 |
kered | -0.007 |
ooks | -0.006 |
ered | -0.006 |
Token | You |
Token ID | 921 |
Feature activation | +2.39e-03 |
Pos logit contributions | |
groom | +0.005 |
scar | +0.004 |
burn | +0.004 |
pony | +0.004 |
poet | +0.004 |
Neg logit contributions | |
eway | -0.004 |
ered | -0.004 |
ining | -0.004 |
kered | -0.003 |
aged | -0.003 |
Token | can |
Token ID | 460 |
Feature activation | +1.90e-02 |
Pos logit contributions | |
groom | +0.004 |
scar | +0.004 |
burn | +0.004 |
pony | +0.004 |
butter | +0.004 |
Neg logit contributions | |
eway | -0.004 |
ining | -0.004 |
ooks | -0.004 |
rum | -0.004 |
ered | -0.004 |
Token | have |
Token ID | 423 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
groom | +0.031 |
scar | +0.030 |
burn | +0.029 |
pony | +0.029 |
rob | +0.028 |
Neg logit contributions | |
eway | -0.033 |
ered | -0.030 |
ining | -0.030 |
kered | -0.029 |
ooks | -0.028 |
Token | blue |
Token ID | 4171 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
burn | +0.032 |
groom | +0.032 |
salon | +0.030 |
pony | +0.030 |
scar | +0.030 |
Neg logit contributions | |
eway | -0.026 |
ining | -0.024 |
ered | -0.024 |
itself | -0.024 |
Everyone | -0.022 |
Token | berry |
Token ID | 8396 |
Feature activation | +1.49e-02 |
Pos logit contributions | |
groom | +0.020 |
pony | +0.018 |
burn | +0.018 |
scar | +0.018 |
rider | +0.017 |
Neg logit contributions | |
eway | -0.022 |
ered | -0.019 |
ining | -0.019 |
ooks | -0.019 |
rum | -0.019 |
Token | yogurt |
Token ID | 32132 |
Feature activation | +5.72e-02 |
Pos logit contributions | |
groom | +0.022 |
burn | +0.020 |
scar | +0.020 |
pony | +0.019 |
rob | +0.019 |
Neg logit contributions | |
eway | -0.028 |
ining | -0.025 |
kered | -0.024 |
ered | -0.024 |
earing | -0.024 |
Token | today |
Token ID | 1909 |
Feature activation | +4.01e-02 |
Pos logit contributions | |
groom | +0.117 |
rob | +0.112 |
burn | +0.110 |
scar | +0.109 |
avail | +0.108 |
Neg logit contributions | |
eway | -0.059 |
ining | -0.058 |
and | -0.057 |
itself | -0.055 |
nicely | -0.055 |
Token | and |
Token ID | 290 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
groom | +0.080 |
rob | +0.079 |
burn | +0.077 |
scar | +0.077 |
pony | +0.072 |
Neg logit contributions | |
eway | -0.056 |
ining | -0.051 |
itself | -0.050 |
earing | -0.048 |
and | -0.047 |
Token | pink |
Token ID | 11398 |
Feature activation | +1.29e-02 |
Pos logit contributions | |
burn | +0.023 |
groom | +0.022 |
rob | +0.022 |
scar | +0.021 |
pony | +0.021 |
Neg logit contributions | |
eway | -0.026 |
ining | -0.023 |
ered | -0.023 |
itself | -0.023 |
Everyone | -0.023 |
Token | yogurt |
Token ID | 32132 |
Feature activation | +5.45e-02 |
Pos logit contributions | |
groom | +0.022 |
burn | +0.022 |
scar | +0.021 |
rob | +0.021 |
pony | +0.021 |
Neg logit contributions | |
eway | -0.020 |
kered | -0.017 |
ered | -0.017 |
ining | -0.017 |
rum | -0.017 |
Token | tomorrow |
Token ID | 9439 |
Feature activation | +5.83e-02 |
Pos logit contributions | |
scar | +0.109 |
groom | +0.109 |
burn | +0.107 |
rob | +0.107 |
avail | +0.104 |
Neg logit contributions | |
eway | -0.059 |
ining | -0.058 |
and | -0.055 |
itself | -0.054 |
earing | -0.054 |
Token | a |
Token ID | 257 |
Feature activation | -1.10e-03 |
Pos logit contributions | |
groom | +0.025 |
burn | +0.023 |
scar | +0.022 |
rob | +0.022 |
salon | +0.022 |
Neg logit contributions | |
eway | -0.015 |
ered | -0.014 |
ining | -0.013 |
itself | -0.012 |
Everyone | -0.012 |
Token | trick |
Token ID | 6908 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.001 |
earing | +0.001 |
ered | +0.001 |
kered | +0.001 |
Neg logit contributions | |
groom | -0.002 |
rob | -0.002 |
ponies | -0.002 |
burn | -0.002 |
strawberries | -0.002 |
Token | for |
Token ID | 329 |
Feature activation | +3.61e-03 |
Pos logit contributions | |
groom | +0.021 |
scar | +0.019 |
burn | +0.018 |
strawberries | +0.017 |
syrup | +0.017 |
Neg logit contributions | |
eway | -0.028 |
ered | -0.025 |
ining | -0.024 |
rum | -0.024 |
kered | -0.024 |
Token | us |
Token ID | 514 |
Feature activation | +2.84e-03 |
Pos logit contributions | |
groom | +0.007 |
burn | +0.007 |
rob | +0.007 |
pony | +0.007 |
scar | +0.007 |
Neg logit contributions | |
eway | -0.005 |
ered | -0.004 |
ining | -0.004 |
itself | -0.004 |
Everyone | -0.004 |
Token | ?" |
Token ID | 1701 |
Feature activation | +3.45e-02 |
Pos logit contributions | |
groom | +0.004 |
rob | +0.004 |
burn | +0.004 |
scar | +0.004 |
pony | +0.004 |
Neg logit contributions | |
eway | -0.005 |
ered | -0.005 |
ining | -0.005 |
earing | -0.005 |
rum | -0.005 |
Token | Ben |
Token ID | 3932 |
Feature activation | +5.72e-02 |
Pos logit contributions | |
groom | +0.064 |
burn | +0.061 |
rob | +0.057 |
scar | +0.056 |
salon | +0.054 |
Neg logit contributions | |
eway | -0.052 |
Everyone | -0.050 |
Everything | -0.049 |
Turns | -0.047 |
From | -0.046 |
Token | asks |
Token ID | 7893 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
burn | +0.093 |
groom | +0.090 |
usual | +0.087 |
rob | +0.083 |
salon | +0.082 |
Neg logit contributions | |
ining | -0.087 |
From | -0.085 |
ered | -0.085 |
eway | -0.084 |
Everything | -0.082 |
Token | . |
Token ID | 13 |
Feature activation | +1.59e-02 |
Pos logit contributions | |
groom | +0.038 |
burn | +0.034 |
scar | +0.034 |
rob | +0.034 |
salon | +0.033 |
Neg logit contributions | |
eway | -0.027 |
kered | -0.023 |
ered | -0.023 |
itself | -0.022 |
rum | -0.022 |
Token |
|
Token ID | 198 |
Feature activation | +9.23e-03 |
Pos logit contributions | |
groom | +0.038 |
scar | +0.036 |
burn | +0.036 |
salon | +0.035 |
pony | +0.034 |
Neg logit contributions | |
eway | -0.018 |
ining | -0.015 |
Turns | -0.013 |
kered | -0.013 |
Everyone | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | +2.82e-03 |
Pos logit contributions | |
groom | +0.020 |
scar | +0.019 |
burn | +0.019 |
pony | +0.018 |
salon | +0.018 |
Neg logit contributions | |
eway | -0.013 |
ining | -0.011 |
ered | -0.010 |
kered | -0.010 |
ooks | -0.010 |
Token | Max |
Token ID | 11518 |
Feature activation | +4.18e-02 |
Pos logit contributions | |
groom | +0.005 |
scar | +0.004 |
burn | +0.004 |
pony | +0.004 |
salon | +0.004 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.005 |
ered | -0.004 |
kered | -0.004 |
ooks | -0.004 |
Token | can |
Token ID | 460 |
Feature activation | +1.66e-02 |
Pos logit contributions | |
groom | +0.010 |
scar | +0.010 |
burn | +0.010 |
pony | +0.010 |
rob | +0.010 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.004 |
kered | -0.004 |
ered | -0.004 |
earing | -0.004 |
Token | we |
Token ID | 356 |
Feature activation | -1.14e-05 |
Pos logit contributions | |
groom | +0.030 |
scar | +0.029 |
burn | +0.028 |
rob | +0.028 |
pony | +0.027 |
Neg logit contributions | |
eway | -0.026 |
ered | -0.024 |
ining | -0.023 |
kered | -0.023 |
Everyone | -0.022 |
Token | fix |
Token ID | 4259 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
eway | +0.000 |
ining | +0.000 |
ooks | +0.000 |
kered | +0.000 |
ered | +0.000 |
Neg logit contributions | |
groom | -0.000 |
scar | -0.000 |
burn | -0.000 |
pony | -0.000 |
salon | -0.000 |
Token | it |
Token ID | 340 |
Feature activation | +9.36e-03 |
Pos logit contributions | |
groom | +0.031 |
burn | +0.029 |
scar | +0.028 |
pony | +0.028 |
salon | +0.027 |
Neg logit contributions | |
eway | -0.019 |
ered | -0.016 |
ining | -0.016 |
itself | -0.016 |
kered | -0.015 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.91e-02 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.012 |
pony | +0.012 |
burn | +0.012 |
ponies | +0.012 |
Neg logit contributions | |
eway | -0.018 |
ining | -0.017 |
ered | -0.017 |
itself | -0.016 |
earing | -0.016 |
Token | Mom |
Token ID | 11254 |
Feature activation | +5.71e-02 |
Pos logit contributions | |
rob | +0.069 |
burn | +0.066 |
scar | +0.065 |
groom | +0.064 |
cowboy | +0.059 |
Neg logit contributions | |
Everyone | -0.028 |
Suz | -0.026 |
eway | -0.026 |
Turns | -0.025 |
From | -0.025 |
Token | asks |
Token ID | 7893 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
groom | +0.086 |
burn | +0.079 |
scar | +0.075 |
rob | +0.071 |
pony | +0.071 |
Neg logit contributions | |
eway | -0.103 |
ered | -0.100 |
ining | -0.100 |
Everything | -0.096 |
earing | -0.095 |
Token | . |
Token ID | 13 |
Feature activation | +2.10e-02 |
Pos logit contributions | |
groom | +0.022 |
scar | +0.021 |
rob | +0.021 |
burn | +0.021 |
poet | +0.020 |
Neg logit contributions | |
eway | -0.015 |
ered | -0.014 |
itself | -0.013 |
kered | -0.013 |
earing | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | +8.79e-03 |
Pos logit contributions | |
groom | +0.050 |
scar | +0.049 |
burn | +0.048 |
rob | +0.048 |
salon | +0.046 |
Neg logit contributions | |
eway | -0.021 |
ining | -0.017 |
Turns | -0.016 |
Everyone | -0.016 |
Everything | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | +5.41e-04 |
Pos logit contributions | |
groom | +0.021 |
scar | +0.020 |
burn | +0.020 |
pony | +0.019 |
salon | +0.019 |
Neg logit contributions | |
eway | -0.010 |
ining | -0.008 |
ooks | -0.008 |
kered | -0.007 |
ered | -0.007 |
Token | S |
Token ID | 50 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
groom | +0.001 |
scar | +0.001 |
burn | +0.001 |
rob | +0.001 |
pony | +0.001 |
Neg logit contributions | |
eway | -0.001 |
ooks | -0.001 |
ining | -0.001 |
earing | -0.001 |
kered | -0.001 |
Token | ind |
Token ID | 521 |
Feature activation | -8.74e-03 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.009 |
ered | +0.009 |
kered | +0.009 |
ooks | +0.009 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.007 |
burn | -0.007 |
pony | -0.006 |
salon | -0.006 |
Token | eer |
Token ID | 28153 |
Feature activation | +2.38e-03 |
Pos logit contributions | |
eway | +0.017 |
ining | +0.015 |
rum | +0.015 |
kered | +0.015 |
ered | +0.014 |
Neg logit contributions | |
groom | -0.013 |
scar | -0.012 |
burn | -0.012 |
salon | -0.012 |
pony | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | -7.83e-03 |
Pos logit contributions | |
groom | +0.004 |
rob | +0.004 |
scar | +0.004 |
burn | +0.004 |
ponies | +0.004 |
Neg logit contributions | |
eway | -0.004 |
ered | -0.003 |
ining | -0.003 |
earing | -0.003 |
rum | -0.003 |
Token | please |
Token ID | 3387 |
Feature activation | +5.33e-03 |
Pos logit contributions | |
eway | +0.013 |
ining | +0.011 |
ered | +0.011 |
ooks | +0.011 |
earing | +0.010 |
Neg logit contributions | |
groom | -0.014 |
rob | -0.013 |
burn | -0.013 |
scar | -0.013 |
pony | -0.012 |
Token | ?" |
Token ID | 1701 |
Feature activation | +3.03e-02 |
Pos logit contributions | |
rob | +0.007 |
groom | +0.007 |
ponies | +0.007 |
scar | +0.007 |
burn | +0.007 |
Neg logit contributions | |
eway | -0.010 |
ered | -0.010 |
ining | -0.010 |
earing | -0.009 |
itself | -0.009 |
Token | Ben |
Token ID | 3932 |
Feature activation | +5.71e-02 |
Pos logit contributions | |
rob | +0.065 |
burn | +0.062 |
groom | +0.060 |
scar | +0.059 |
pony | +0.056 |
Neg logit contributions | |
Everyone | -0.037 |
Suz | -0.036 |
eway | -0.034 |
Everything | -0.033 |
From | -0.033 |
Token | asks |
Token ID | 7893 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
burn | +0.089 |
groom | +0.085 |
rob | +0.084 |
usual | +0.083 |
salon | +0.077 |
Neg logit contributions | |
ining | -0.092 |
From | -0.092 |
Everyone | -0.088 |
Everything | -0.088 |
It | -0.088 |
Token | Lily |
Token ID | 20037 |
Feature activation | +2.38e-02 |
Pos logit contributions | |
groom | +0.036 |
rob | +0.036 |
scar | +0.035 |
burn | +0.034 |
pony | +0.033 |
Neg logit contributions | |
eway | -0.026 |
ooks | -0.023 |
ered | -0.023 |
kered | -0.023 |
itself | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
groom | +0.048 |
rob | +0.047 |
scar | +0.046 |
burn | +0.044 |
strawberries | +0.042 |
Neg logit contributions | |
eway | -0.032 |
ining | -0.030 |
rum | -0.029 |
earing | -0.029 |
ered | -0.029 |
Token |
|
Token ID | 198 |
Feature activation | +5.23e-03 |
Pos logit contributions | |
groom | +0.024 |
scar | +0.023 |
burn | +0.023 |
rob | +0.022 |
salon | +0.022 |
Neg logit contributions | |
eway | -0.011 |
ining | -0.008 |
Turns | -0.008 |
ooks | -0.008 |
Everyone | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -3.18e-03 |
Pos logit contributions | |
groom | +0.011 |
scar | +0.010 |
burn | +0.010 |
pony | +0.010 |
salon | +0.010 |
Neg logit contributions | |
eway | -0.007 |
ining | -0.006 |
ered | -0.006 |
kered | -0.006 |
ooks | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | -9.83e-03 |
Pos logit contributions | |
groom | +0.008 |
scar | +0.007 |
burn | +0.007 |
pony | +0.007 |
rob | +0.007 |
Neg logit contributions | |
eway | -0.008 |
ining | -0.007 |
ered | -0.007 |
kered | -0.007 |
earing | -0.007 |
Token | Do |
Token ID | 2141 |
Feature activation | +2.34e-03 |
Pos logit contributions | |
eway | +0.013 |
ered | +0.011 |
ining | +0.011 |
kered | +0.010 |
earing | +0.010 |
Neg logit contributions | |
groom | -0.021 |
scar | -0.020 |
burn | -0.020 |
pony | -0.020 |
ponies | -0.019 |
Token | you |
Token ID | 345 |
Feature activation | +1.32e-03 |
Pos logit contributions | |
groom | +0.005 |
burn | +0.004 |
scar | +0.004 |
pony | +0.004 |
rob | +0.004 |
Neg logit contributions | |
eway | -0.003 |
ered | -0.003 |
ining | -0.003 |
kered | -0.003 |
earing | -0.003 |
Token | understand |
Token ID | 1833 |
Feature activation | +7.43e-03 |
Pos logit contributions | |
groom | +0.002 |
burn | +0.002 |
scar | +0.002 |
rob | +0.002 |
pony | +0.002 |
Neg logit contributions | |
eway | -0.002 |
ining | -0.002 |
ered | -0.002 |
earing | -0.002 |
ooks | -0.002 |
Token | ?" |
Token ID | 1701 |
Feature activation | +3.10e-02 |
Pos logit contributions | |
groom | +0.009 |
scar | +0.008 |
burn | +0.008 |
pony | +0.008 |
rob | +0.008 |
Neg logit contributions | |
eway | -0.016 |
ered | -0.015 |
ining | -0.015 |
itself | -0.014 |
ooks | -0.014 |
Token | Mom |
Token ID | 11254 |
Feature activation | +5.70e-02 |
Pos logit contributions | |
rob | +0.069 |
groom | +0.068 |
burn | +0.067 |
scar | +0.065 |
salon | +0.061 |
Neg logit contributions | |
Suz | -0.032 |
Everyone | -0.031 |
eway | -0.031 |
From | -0.030 |
ooks | -0.029 |
Token | asks |
Token ID | 7893 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
groom | +0.085 |
burn | +0.078 |
scar | +0.073 |
rob | +0.072 |
pony | +0.069 |
Neg logit contributions | |
eway | -0.101 |
ining | -0.101 |
ered | -0.099 |
Everything | -0.096 |
earing | -0.095 |
Token | . |
Token ID | 13 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
groom | +0.032 |
scar | +0.029 |
burn | +0.029 |
rob | +0.029 |
pony | +0.028 |
Neg logit contributions | |
eway | -0.022 |
ered | -0.019 |
itself | -0.019 |
kered | -0.019 |
ining | -0.019 |
Token |
|
Token ID | 198 |
Feature activation | +1.39e-02 |
Pos logit contributions | |
groom | +0.040 |
scar | +0.038 |
burn | +0.037 |
pony | +0.036 |
rob | +0.036 |
Neg logit contributions | |
eway | -0.022 |
ining | -0.018 |
ooks | -0.017 |
kered | -0.017 |
earing | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | +7.46e-03 |
Pos logit contributions | |
groom | +0.033 |
burn | +0.031 |
scar | +0.031 |
pony | +0.030 |
salon | +0.029 |
Neg logit contributions | |
eway | -0.016 |
ining | -0.014 |
ooks | -0.013 |
earing | -0.012 |
kered | -0.012 |
Token | " |
Token ID | 1 |
Feature activation | -4.71e-03 |
Pos logit contributions | |
groom | +0.016 |
scar | +0.015 |
burn | +0.015 |
pony | +0.014 |
rob | +0.014 |
Neg logit contributions | |
eway | -0.010 |
ining | -0.009 |
ooks | -0.008 |
kered | -0.008 |
ered | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -2.11e-03 |
Pos logit contributions | |
groom | +0.008 |
burn | +0.008 |
rob | +0.008 |
scar | +0.008 |
salon | +0.008 |
Neg logit contributions | |
eway | -0.005 |
rum | -0.004 |
ining | -0.004 |
kered | -0.004 |
itself | -0.004 |
Token | I |
Token ID | 314 |
Feature activation | -3.38e-04 |
Pos logit contributions | |
eway | +0.004 |
ered | +0.003 |
ining | +0.003 |
kered | +0.003 |
aged | +0.003 |
Neg logit contributions | |
groom | -0.004 |
scar | -0.003 |
pony | -0.003 |
burn | -0.003 |
chicken | -0.003 |
Token | like |
Token ID | 588 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
eway | +0.001 |
ining | +0.001 |
ered | +0.001 |
kered | +0.001 |
ooks | +0.001 |
Neg logit contributions | |
groom | -0.001 |
scar | -0.001 |
burn | -0.001 |
pony | -0.001 |
salon | -0.001 |
Token | blue |
Token ID | 4171 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
rob | +0.026 |
groom | +0.026 |
burn | +0.026 |
scar | +0.025 |
pony | +0.024 |
Neg logit contributions | |
eway | -0.023 |
ining | -0.021 |
itself | -0.020 |
ered | -0.020 |
earing | -0.019 |
Token | berry |
Token ID | 8396 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.013 |
burn | +0.013 |
pony | +0.013 |
rob | +0.013 |
Neg logit contributions | |
eway | -0.019 |
ered | -0.017 |
kered | -0.017 |
rum | -0.017 |
ining | -0.017 |
Token | yogurt |
Token ID | 32132 |
Feature activation | +5.70e-02 |
Pos logit contributions | |
groom | +0.022 |
burn | +0.020 |
scar | +0.020 |
pony | +0.019 |
rob | +0.019 |
Neg logit contributions | |
eway | -0.024 |
ining | -0.022 |
kered | -0.021 |
ered | -0.021 |
rum | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +7.09e-03 |
Pos logit contributions | |
groom | +0.125 |
avail | +0.121 |
scar | +0.121 |
burn | +0.120 |
rob | +0.118 |
Neg logit contributions | |
ining | -0.048 |
itself | -0.046 |
eway | -0.045 |
and | -0.044 |
kered | -0.043 |
Token | Can |
Token ID | 1680 |
Feature activation | +1.91e-02 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.013 |
pony | +0.012 |
burn | +0.012 |
ponies | +0.012 |
Neg logit contributions | |
eway | -0.011 |
ining | -0.010 |
ered | -0.010 |
kered | -0.009 |
earing | -0.009 |
Token | I |
Token ID | 314 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
groom | +0.031 |
scar | +0.029 |
burn | +0.028 |
pony | +0.027 |
rob | +0.027 |
Neg logit contributions | |
eway | -0.035 |
ining | -0.031 |
ered | -0.031 |
kered | -0.030 |
earing | -0.030 |
Token | have |
Token ID | 423 |
Feature activation | +2.73e-02 |
Pos logit contributions | |
groom | +0.020 |
scar | +0.019 |
burn | +0.019 |
pony | +0.019 |
rob | +0.019 |
Neg logit contributions | |
eway | -0.021 |
ining | -0.018 |
ered | -0.018 |
kered | -0.018 |
earing | -0.018 |
Token | more |
Token ID | 517 |
Feature activation | +7.34e-03 |
Pos logit contributions | |
burn | +0.052 |
rider | +0.051 |
groom | +0.050 |
rob | +0.049 |
pony | +0.049 |
Neg logit contributions | |
ered | -0.033 |
Everyone | -0.030 |
eway | -0.030 |
itself | -0.030 |
ining | -0.029 |
Token | is |
Token ID | 318 |
Feature activation | +9.49e-03 |
Pos logit contributions | |
groom | +0.017 |
scar | +0.016 |
burn | +0.015 |
pony | +0.015 |
salon | +0.014 |
Neg logit contributions | |
eway | -0.020 |
ining | -0.017 |
ered | -0.017 |
kered | -0.017 |
ooks | -0.017 |
Token | also |
Token ID | 635 |
Feature activation | +7.68e-03 |
Pos logit contributions | |
groom | +0.017 |
rob | +0.017 |
burn | +0.016 |
scar | +0.016 |
salon | +0.016 |
Neg logit contributions | |
eway | -0.015 |
ining | -0.014 |
ered | -0.013 |
itself | -0.013 |
ooks | -0.013 |
Token | a |
Token ID | 257 |
Feature activation | +3.84e-03 |
Pos logit contributions | |
groom | +0.013 |
rob | +0.012 |
burn | +0.012 |
salon | +0.012 |
scar | +0.012 |
Neg logit contributions | |
eway | -0.013 |
ining | -0.012 |
ered | -0.011 |
earing | -0.011 |
ooks | -0.011 |
Token | toy |
Token ID | 13373 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
groom | +0.006 |
rob | +0.006 |
burn | +0.006 |
scar | +0.006 |
salon | +0.005 |
Neg logit contributions | |
eway | -0.007 |
ining | -0.006 |
Turns | -0.006 |
ooks | -0.005 |
rum | -0.005 |
Token | ," |
Token ID | 553 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
groom | +0.032 |
burn | +0.030 |
scar | +0.029 |
rob | +0.029 |
strawberries | +0.027 |
Neg logit contributions | |
eway | -0.027 |
kered | -0.022 |
taker | -0.022 |
ining | -0.022 |
Everyone | -0.021 |
Token | Mom |
Token ID | 11254 |
Feature activation | +5.69e-02 |
Pos logit contributions | |
rob | +0.057 |
burn | +0.057 |
groom | +0.052 |
scar | +0.051 |
salon | +0.050 |
Neg logit contributions | |
Suz | -0.029 |
Everyone | -0.028 |
eway | -0.025 |
Everything | -0.025 |
His | -0.024 |
Token | says |
Token ID | 1139 |
Feature activation | +7.56e-03 |
Pos logit contributions | |
groom | +0.082 |
burn | +0.073 |
scar | +0.071 |
rob | +0.067 |
pony | +0.066 |
Neg logit contributions | |
eway | -0.110 |
ining | -0.102 |
ered | -0.101 |
rum | -0.098 |
earing | -0.097 |
Token | . |
Token ID | 13 |
Feature activation | +1.70e-02 |
Pos logit contributions | |
groom | +0.011 |
scar | +0.010 |
burn | +0.010 |
pony | +0.010 |
salon | +0.009 |
Neg logit contributions | |
eway | -0.016 |
ining | -0.014 |
ered | -0.013 |
kered | -0.013 |
ooks | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
groom | +0.039 |
scar | +0.037 |
burn | +0.036 |
pony | +0.035 |
rob | +0.035 |
Neg logit contributions | |
eway | -0.021 |
ining | -0.017 |
ooks | -0.016 |
earing | -0.016 |
kered | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | +5.69e-03 |
Pos logit contributions | |
groom | +0.029 |
scar | +0.027 |
burn | +0.027 |
pony | +0.026 |
salon | +0.026 |
Neg logit contributions | |
eway | -0.016 |
ining | -0.013 |
ooks | -0.012 |
kered | -0.012 |
ered | -0.012 |
Token | " |
Token ID | 1 |
Feature activation | -4.50e-03 |
Pos logit contributions | |
groom | +0.012 |
scar | +0.011 |
burn | +0.011 |
pony | +0.011 |
rob | +0.011 |
Neg logit contributions | |
eway | -0.008 |
ining | -0.007 |
kered | -0.007 |
ooks | -0.006 |
ered | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -4.30e-03 |
Pos logit contributions | |
eway | +0.011 |
ered | +0.010 |
rum | +0.009 |
kered | +0.009 |
aged | +0.009 |
Neg logit contributions | |
Velvet | -0.010 |
pony | -0.010 |
ponies | -0.010 |
chicken | -0.010 |
groom | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | -1.11e-02 |
Pos logit contributions | |
eway | +0.006 |
ered | +0.005 |
ining | +0.005 |
kered | +0.005 |
rum | +0.005 |
Neg logit contributions | |
groom | -0.008 |
scar | -0.008 |
pony | -0.008 |
rob | -0.008 |
burn | -0.008 |
Token | This |
Token ID | 1212 |
Feature activation | +7.84e-03 |
Pos logit contributions | |
eway | +0.021 |
rum | +0.019 |
ered | +0.019 |
aged | +0.019 |
ooks | +0.018 |
Neg logit contributions | |
groom | -0.016 |
scar | -0.015 |
pony | -0.015 |
salon | -0.014 |
chicken | -0.014 |
Token | story |
Token ID | 1621 |
Feature activation | -8.70e-03 |
Pos logit contributions | |
groom | +0.015 |
scar | +0.014 |
burn | +0.014 |
salon | +0.013 |
pony | +0.013 |
Neg logit contributions | |
eway | -0.013 |
ining | -0.011 |
ered | -0.011 |
kered | -0.011 |
earing | -0.010 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.83e-02 |
Pos logit contributions | |
eway | +0.017 |
ooks | +0.016 |
Suz | +0.015 |
rum | +0.015 |
earing | +0.014 |
Neg logit contributions | |
groom | -0.012 |
blows | -0.011 |
rider | -0.011 |
reads | -0.011 |
concert | -0.011 |
Token | us |
Token ID | 514 |
Feature activation | -6.28e-02 |
Pos logit contributions | |
eway | +0.050 |
ining | +0.043 |
ered | +0.042 |
kered | +0.041 |
ooks | +0.041 |
Neg logit contributions | |
groom | -0.050 |
scar | -0.047 |
burn | -0.045 |
pony | -0.045 |
ponies | -0.043 |
Token | a |
Token ID | 257 |
Feature activation | -3.03e-02 |
Pos logit contributions | |
eway | +0.137 |
Turns | +0.124 |
rum | +0.117 |
ooks | +0.115 |
ining | +0.114 |
Neg logit contributions | |
groom | -0.071 |
chicken | -0.069 |
scar | -0.066 |
ponies | -0.066 |
pony | -0.065 |
Token | valuable |
Token ID | 8119 |
Feature activation | -4.83e-02 |
Pos logit contributions | |
eway | +0.060 |
ered | +0.054 |
kered | +0.053 |
ining | +0.052 |
ooks | +0.052 |
Neg logit contributions | |
groom | -0.044 |
scar | -0.043 |
pony | -0.041 |
burn | -0.039 |
chicken | -0.039 |
Token | lesson |
Token ID | 11483 |
Feature activation | -1.77e-02 |
Pos logit contributions | |
eway | +0.096 |
ining | +0.090 |
ered | +0.089 |
kered | +0.087 |
Turns | +0.086 |
Neg logit contributions | |
groom | -0.062 |
pony | -0.060 |
scar | -0.059 |
horse | -0.057 |
chicken | -0.057 |
Token | - |
Token ID | 532 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
eway | +0.029 |
kered | +0.026 |
ining | +0.026 |
Turns | +0.025 |
ered | +0.025 |
Neg logit contributions | |
groom | -0.029 |
scar | -0.028 |
pony | -0.027 |
ponies | -0.027 |
salon | -0.027 |
Token | it |
Token ID | 340 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
eway | +0.034 |
ining | +0.030 |
kered | +0.030 |
rum | +0.029 |
ered | +0.029 |
Neg logit contributions | |
groom | -0.024 |
scar | -0.023 |
pony | -0.021 |
burn | -0.021 |
chicken | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | -8.07e-03 |
Pos logit contributions | |
eway | +0.018 |
kered | +0.017 |
ered | +0.017 |
amed | +0.016 |
eways | +0.015 |
Neg logit contributions | |
Rudy | -0.012 |
strawberry | -0.012 |
chicken | -0.011 |
fisherman | -0.011 |
Coco | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | -1.37e-02 |
Pos logit contributions | |
eway | +0.015 |
kered | +0.014 |
ered | +0.014 |
ining | +0.013 |
aged | +0.013 |
Neg logit contributions | |
groom | -0.010 |
pony | -0.009 |
scar | -0.009 |
chicken | -0.009 |
� | -0.009 |
Token | This |
Token ID | 1212 |
Feature activation | +6.85e-03 |
Pos logit contributions | |
eway | +0.026 |
ooks | +0.025 |
anny | +0.024 |
Acc | +0.024 |
ered | +0.024 |
Neg logit contributions | |
groom | -0.017 |
fisherman | -0.017 |
pony | -0.016 |
chicken | -0.016 |
strawberry | -0.016 |
Token | story |
Token ID | 1621 |
Feature activation | -1.56e-02 |
Pos logit contributions | |
groom | +0.013 |
burn | +0.012 |
scar | +0.012 |
salon | +0.012 |
pony | +0.012 |
Neg logit contributions | |
eway | -0.011 |
ining | -0.010 |
ered | -0.009 |
kered | -0.009 |
Turns | -0.009 |
Token | teaches |
Token ID | 17324 |
Feature activation | -3.07e-02 |
Pos logit contributions | |
ooks | +0.028 |
eway | +0.027 |
and | +0.024 |
Suz | +0.024 |
rum | +0.024 |
Neg logit contributions | |
blows | -0.021 |
butter | -0.021 |
groom | -0.021 |
rider | -0.021 |
chicken | -0.021 |
Token | us |
Token ID | 514 |
Feature activation | -6.12e-02 |
Pos logit contributions | |
eway | +0.058 |
ining | +0.050 |
ooks | +0.050 |
kered | +0.048 |
rum | +0.048 |
Neg logit contributions | |
groom | -0.050 |
scar | -0.047 |
pony | -0.045 |
ponies | -0.044 |
burn | -0.044 |
Token | that |
Token ID | 326 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
eway | +0.130 |
Turns | +0.121 |
ining | +0.113 |
ooks | +0.112 |
rum | +0.111 |
Neg logit contributions | |
groom | -0.070 |
chicken | -0.069 |
scar | -0.068 |
pony | -0.066 |
butter | -0.065 |
Token | sometimes |
Token ID | 3360 |
Feature activation | -7.62e-03 |
Pos logit contributions | |
eway | +0.021 |
ining | +0.019 |
kered | +0.019 |
ered | +0.019 |
ooks | +0.018 |
Neg logit contributions | |
groom | -0.017 |
scar | -0.016 |
pony | -0.015 |
burn | -0.015 |
chicken | -0.015 |
Token | it |
Token ID | 340 |
Feature activation | -1.35e-02 |
Pos logit contributions | |
eway | +0.014 |
ining | +0.012 |
kered | +0.012 |
ered | +0.012 |
ooks | +0.012 |
Neg logit contributions | |
groom | -0.013 |
scar | -0.012 |
pony | -0.011 |
burn | -0.011 |
ponies | -0.011 |
Token | 's |
Token ID | 338 |
Feature activation | -5.18e-04 |
Pos logit contributions | |
eway | +0.029 |
ooks | +0.024 |
kered | +0.024 |
rum | +0.023 |
ining | +0.023 |
Neg logit contributions | |
groom | -0.018 |
scar | -0.017 |
burn | -0.017 |
pony | -0.016 |
ponies | -0.016 |
Token | best |
Token ID | 1266 |
Feature activation | -4.31e-03 |
Pos logit contributions | |
eway | +0.001 |
ining | +0.001 |
ered | +0.001 |
ooks | +0.001 |
itself | +0.001 |
Neg logit contributions | |
groom | -0.001 |
rob | -0.001 |
salon | -0.001 |
pony | -0.001 |
scar | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
eway | +0.021 |
ining | +0.019 |
kered | +0.019 |
earing | +0.018 |
ooks | +0.018 |
Neg logit contributions | |
groom | -0.015 |
scar | -0.015 |
pony | -0.014 |
burn | -0.014 |
rob | -0.013 |
Token | tree |
Token ID | 5509 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
eway | +0.028 |
ining | +0.024 |
ered | +0.024 |
kered | +0.024 |
earing | +0.024 |
Neg logit contributions | |
groom | -0.019 |
scar | -0.017 |
burn | -0.017 |
rob | -0.016 |
pony | -0.016 |
Token | to |
Token ID | 284 |
Feature activation | -5.25e-03 |
Pos logit contributions | |
eway | +0.028 |
ining | +0.024 |
kered | +0.024 |
ooks | +0.024 |
rum | +0.023 |
Neg logit contributions | |
scar | -0.023 |
groom | -0.023 |
pony | -0.023 |
burn | -0.022 |
salon | -0.022 |
Token | its |
Token ID | 663 |
Feature activation | -1.89e-02 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.009 |
kered | +0.009 |
ooks | +0.009 |
earing | +0.009 |
Neg logit contributions | |
groom | -0.008 |
scar | -0.008 |
pony | -0.007 |
burn | -0.007 |
chicken | -0.007 |
Token | once |
Token ID | 1752 |
Feature activation | -9.99e-03 |
Pos logit contributions | |
eway | +0.034 |
ining | +0.030 |
ered | +0.029 |
kered | +0.028 |
ooks | +0.028 |
Neg logit contributions | |
groom | -0.031 |
scar | -0.029 |
burn | -0.029 |
rob | -0.028 |
pony | -0.028 |
Token | former |
Token ID | 1966 |
Feature activation | -6.10e-02 |
Pos logit contributions | |
eway | +0.020 |
ining | +0.017 |
kered | +0.017 |
ooks | +0.017 |
rum | +0.017 |
Neg logit contributions | |
groom | -0.015 |
scar | -0.014 |
burn | -0.014 |
pony | -0.013 |
butter | -0.013 |
Token | beauty |
Token ID | 8737 |
Feature activation | -1.69e-02 |
Pos logit contributions | |
eway | +0.109 |
kered | +0.091 |
ining | +0.090 |
Turns | +0.088 |
ered | +0.087 |
Neg logit contributions | |
scar | -0.100 |
groom | -0.099 |
ponies | -0.091 |
pony | -0.091 |
butter | -0.087 |
Token | . |
Token ID | 13 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
eway | +0.033 |
ered | +0.029 |
ining | +0.029 |
ooks | +0.029 |
kered | +0.029 |
Neg logit contributions | |
groom | -0.025 |
scar | -0.023 |
pony | -0.023 |
burn | -0.022 |
ponies | -0.022 |
Token | He |
Token ID | 679 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
eway | +0.026 |
kered | +0.025 |
ered | +0.024 |
aged | +0.023 |
amed | +0.022 |
Neg logit contributions | |
groom | -0.027 |
pony | -0.026 |
ponies | -0.025 |
strawberry | -0.025 |
salon | -0.025 |
Token | was |
Token ID | 373 |
Feature activation | -4.84e-03 |
Pos logit contributions | |
eway | +0.018 |
ooks | +0.015 |
ining | +0.015 |
rum | +0.015 |
eways | +0.014 |
Neg logit contributions | |
groom | -0.020 |
scar | -0.019 |
pony | -0.018 |
burn | -0.017 |
butter | -0.017 |
Token | happy |
Token ID | 3772 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
eway | +0.010 |
kered | +0.008 |
eways | +0.008 |
ooks | +0.008 |
rum | +0.008 |
Neg logit contributions | |
groom | -0.008 |
pony | -0.007 |
scar | -0.006 |
bald | -0.006 |
burn | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +1.17e-03 |
Pos logit contributions | |
eway | +0.002 |
ered | +0.001 |
kered | +0.001 |
eways | +0.001 |
aged | +0.001 |
Neg logit contributions | |
Rudy | -0.001 |
� | -0.001 |
Rudolph | -0.001 |
Velvet | -0.001 |
Star | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -4.05e-03 |
Pos logit contributions | |
groom | +0.002 |
scar | +0.002 |
rob | +0.002 |
pony | +0.002 |
burn | +0.002 |
Neg logit contributions | |
eway | -0.002 |
ered | -0.002 |
kered | -0.002 |
ining | -0.002 |
rum | -0.002 |
Token | This |
Token ID | 1212 |
Feature activation | +7.29e-03 |
Pos logit contributions | |
eway | +0.007 |
ered | +0.007 |
aged | +0.007 |
ooks | +0.007 |
Suz | +0.007 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.005 |
pony | -0.005 |
please | -0.005 |
cowboy | -0.005 |
Token | story |
Token ID | 1621 |
Feature activation | -9.32e-03 |
Pos logit contributions | |
groom | +0.013 |
burn | +0.012 |
scar | +0.012 |
rob | +0.011 |
salon | +0.011 |
Neg logit contributions | |
eway | -0.012 |
ining | -0.011 |
ered | -0.011 |
kered | -0.011 |
Turns | -0.010 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.73e-02 |
Pos logit contributions | |
ooks | +0.017 |
eway | +0.017 |
rum | +0.015 |
Suz | +0.015 |
and | +0.015 |
Neg logit contributions | |
groom | -0.013 |
blows | -0.013 |
scar | -0.012 |
rider | -0.012 |
butter | -0.012 |
Token | us |
Token ID | 514 |
Feature activation | -6.09e-02 |
Pos logit contributions | |
eway | +0.050 |
ining | +0.043 |
ooks | +0.042 |
rum | +0.042 |
kered | +0.041 |
Neg logit contributions | |
groom | -0.046 |
scar | -0.044 |
pony | -0.041 |
burn | -0.041 |
ponies | -0.040 |
Token | that |
Token ID | 326 |
Feature activation | -1.11e-02 |
Pos logit contributions | |
eway | +0.127 |
Turns | +0.117 |
ining | +0.110 |
rum | +0.109 |
ooks | +0.109 |
Neg logit contributions | |
groom | -0.075 |
scar | -0.072 |
chicken | -0.072 |
pony | -0.070 |
butter | -0.069 |
Token | courage |
Token ID | 11917 |
Feature activation | -1.00e-02 |
Pos logit contributions | |
eway | +0.023 |
ining | +0.020 |
kered | +0.020 |
ered | +0.020 |
ooks | +0.019 |
Neg logit contributions | |
groom | -0.017 |
scar | -0.015 |
pony | -0.015 |
burn | -0.015 |
chicken | -0.014 |
Token | can |
Token ID | 460 |
Feature activation | -5.29e-03 |
Pos logit contributions | |
eway | +0.021 |
ooks | +0.019 |
kered | +0.018 |
ining | +0.018 |
ered | +0.018 |
Neg logit contributions | |
groom | -0.013 |
scar | -0.012 |
pony | -0.012 |
ponies | -0.011 |
cane | -0.011 |
Token | help |
Token ID | 1037 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.009 |
kered | +0.008 |
ooks | +0.008 |
earing | +0.008 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.008 |
burn | -0.008 |
pony | -0.008 |
salon | -0.007 |
Token | us |
Token ID | 514 |
Feature activation | -2.99e-02 |
Pos logit contributions | |
eway | +0.030 |
ining | +0.026 |
kered | +0.026 |
earing | +0.025 |
ooks | +0.025 |
Neg logit contributions | |
groom | -0.025 |
scar | -0.024 |
pony | -0.023 |
burn | -0.022 |
chicken | -0.022 |
Token |
|
Token ID | 198 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
eway | +0.021 |
kered | +0.020 |
ered | +0.020 |
amed | +0.019 |
aged | +0.018 |
Neg logit contributions | |
strawberry | -0.013 |
Rudy | -0.013 |
bar | -0.012 |
cones | -0.012 |
fisherman | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
eway | +0.018 |
ered | +0.017 |
kered | +0.017 |
aged | +0.017 |
ooks | +0.016 |
Neg logit contributions | |
pony | -0.014 |
rob | -0.014 |
groom | -0.014 |
chicken | -0.014 |
horse | -0.014 |
Token | This |
Token ID | 1212 |
Feature activation | +6.19e-03 |
Pos logit contributions | |
eway | +0.028 |
ooks | +0.027 |
aged | +0.027 |
Acc | +0.026 |
Suz | +0.026 |
Neg logit contributions | |
pony | -0.018 |
groom | -0.018 |
fisherman | -0.017 |
strawberry | -0.017 |
chicken | -0.017 |
Token | story |
Token ID | 1621 |
Feature activation | -8.99e-03 |
Pos logit contributions | |
groom | +0.012 |
scar | +0.012 |
burn | +0.012 |
salon | +0.011 |
rob | +0.011 |
Neg logit contributions | |
eway | -0.009 |
ining | -0.008 |
ered | -0.008 |
kered | -0.008 |
earing | -0.007 |
Token | teaches |
Token ID | 17324 |
Feature activation | -3.33e-02 |
Pos logit contributions | |
eway | +0.017 |
ooks | +0.016 |
Suz | +0.014 |
rum | +0.014 |
eways | +0.014 |
Neg logit contributions | |
groom | -0.013 |
rider | -0.012 |
blows | -0.012 |
butter | -0.012 |
reads | -0.012 |
Token | us |
Token ID | 514 |
Feature activation | -6.06e-02 |
Pos logit contributions | |
eway | +0.068 |
ooks | +0.060 |
ining | +0.058 |
rum | +0.057 |
earing | +0.057 |
Neg logit contributions | |
groom | -0.049 |
scar | -0.047 |
ponies | -0.045 |
chicken | -0.045 |
pony | -0.044 |
Token | that |
Token ID | 326 |
Feature activation | -1.45e-02 |
Pos logit contributions | |
eway | +0.131 |
Turns | +0.118 |
ining | +0.111 |
ooks | +0.111 |
rum | +0.110 |
Neg logit contributions | |
groom | -0.074 |
chicken | -0.071 |
scar | -0.070 |
butter | -0.068 |
pony | -0.067 |
Token | it |
Token ID | 340 |
Feature activation | -2.43e-02 |
Pos logit contributions | |
eway | +0.028 |
ining | +0.025 |
ered | +0.024 |
kered | +0.024 |
earing | +0.024 |
Neg logit contributions | |
groom | -0.023 |
scar | -0.021 |
pony | -0.021 |
burn | -0.021 |
chicken | -0.020 |
Token | is |
Token ID | 318 |
Feature activation | -1.86e-02 |
Pos logit contributions | |
eway | +0.054 |
ooks | +0.047 |
rum | +0.044 |
kered | +0.044 |
Suz | +0.043 |
Neg logit contributions | |
groom | -0.029 |
blows | -0.028 |
chicken | -0.027 |
scar | -0.027 |
butter | -0.027 |
Token | important |
Token ID | 1593 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
eway | +0.032 |
ining | +0.027 |
kered | +0.026 |
ered | +0.026 |
ooks | +0.025 |
Neg logit contributions | |
groom | -0.034 |
scar | -0.032 |
burn | -0.031 |
pony | -0.030 |
ponies | -0.029 |
Token | to |
Token ID | 284 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
eway | +0.024 |
ining | +0.021 |
kered | +0.021 |
ered | +0.020 |
ooks | +0.020 |
Neg logit contributions | |
groom | -0.016 |
scar | -0.015 |
pony | -0.014 |
burn | -0.014 |
ponies | -0.014 |
Token |
|
Token ID | 198 |
Feature activation | -3.59e-03 |
Pos logit contributions | |
groom | +0.001 |
scar | +0.001 |
Velvet | +0.001 |
pony | +0.001 |
� | +0.001 |
Neg logit contributions | |
eway | -0.001 |
kered | -0.001 |
ered | -0.001 |
ining | -0.001 |
ooks | -0.001 |
Token | The |
Token ID | 464 |
Feature activation | +1.77e-02 |
Pos logit contributions | |
eway | +0.008 |
ered | +0.007 |
kered | +0.007 |
Suz | +0.007 |
ooks | +0.007 |
Neg logit contributions | |
groom | -0.004 |
Nik | -0.004 |
Ba | -0.004 |
scar | -0.004 |
pony | -0.004 |
Token | cat |
Token ID | 3797 |
Feature activation | -3.56e-03 |
Pos logit contributions | |
groom | +0.032 |
burn | +0.029 |
rob | +0.029 |
salon | +0.027 |
scar | +0.027 |
Neg logit contributions | |
eway | -0.027 |
Turns | -0.025 |
kered | -0.025 |
aged | -0.024 |
ining | -0.024 |
Token | grinned |
Token ID | 36268 |
Feature activation | -2.38e-02 |
Pos logit contributions | |
eway | +0.007 |
ooks | +0.006 |
eways | +0.006 |
ining | +0.006 |
rum | +0.006 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.006 |
pony | -0.005 |
horse | -0.005 |
chicken | -0.005 |
Token | mis |
Token ID | 2984 |
Feature activation | -3.10e-02 |
Pos logit contributions | |
eway | +0.050 |
ining | +0.044 |
ered | +0.043 |
ooks | +0.042 |
kered | +0.042 |
Neg logit contributions | |
groom | -0.032 |
scar | -0.031 |
pony | -0.030 |
burn | -0.029 |
ponies | -0.028 |
Token | chie |
Token ID | 3043 |
Feature activation | -6.05e-02 |
Pos logit contributions | |
eway | +0.041 |
ining | +0.031 |
Everything | +0.030 |
Turns | +0.030 |
Everyone | +0.029 |
Neg logit contributions | |
groom | -0.067 |
scar | -0.064 |
burn | -0.063 |
please | -0.061 |
pony | -0.060 |
Token | v |
Token ID | 85 |
Feature activation | -2.59e-02 |
Pos logit contributions | |
eway | +0.107 |
ooks | +0.099 |
ining | +0.088 |
ered | +0.087 |
Turns | +0.086 |
Neg logit contributions | |
groom | -0.088 |
rob | -0.086 |
scar | -0.085 |
pony | -0.085 |
poet | -0.084 |
Token | ously |
Token ID | 3481 |
Feature activation | -2.57e-02 |
Pos logit contributions | |
eway | +0.039 |
ining | +0.032 |
Turns | +0.032 |
ooks | +0.030 |
earing | +0.030 |
Neg logit contributions | |
burn | -0.047 |
groom | -0.044 |
chicken | -0.042 |
horse | -0.042 |
scar | -0.042 |
Token | . |
Token ID | 13 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
eway | +0.058 |
ooks | +0.051 |
anny | +0.049 |
eways | +0.049 |
ining | +0.049 |
Neg logit contributions | |
pony | -0.032 |
scar | -0.031 |
groom | -0.030 |
horse | -0.028 |
burn | -0.028 |
Token | " |
Token ID | 366 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
eway | +0.019 |
kered | +0.017 |
ered | +0.017 |
rum | +0.015 |
ooks | +0.015 |
Neg logit contributions | |
groom | -0.017 |
pony | -0.016 |
Velvet | -0.016 |
Nikki | -0.016 |
scar | -0.016 |
Token | Never |
Token ID | 12295 |
Feature activation | +8.58e-05 |
Pos logit contributions | |
eway | +0.022 |
ooks | +0.019 |
ered | +0.019 |
ining | +0.019 |
earing | +0.018 |
Neg logit contributions | |
groom | -0.016 |
burn | -0.014 |
scar | -0.013 |
pony | -0.013 |
rob | -0.013 |
Token | bad |
Token ID | 2089 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
eway | +0.018 |
ooks | +0.015 |
ining | +0.015 |
eways | +0.015 |
anny | +0.014 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.009 |
pony | -0.009 |
chicken | -0.009 |
butter | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | -4.21e-03 |
Pos logit contributions | |
eway | +0.026 |
ining | +0.023 |
ooks | +0.023 |
ered | +0.023 |
kered | +0.022 |
Neg logit contributions | |
scar | -0.014 |
pony | -0.014 |
groom | -0.013 |
burn | -0.013 |
ponies | -0.013 |
Token | apologized |
Token ID | 22893 |
Feature activation | -1.88e-03 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.007 |
ooks | +0.007 |
rum | +0.007 |
kered | +0.007 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.006 |
pony | -0.006 |
burn | -0.006 |
chicken | -0.006 |
Token | for |
Token ID | 329 |
Feature activation | -1.58e-02 |
Pos logit contributions | |
eway | +0.004 |
ining | +0.004 |
ooks | +0.004 |
ered | +0.004 |
kered | +0.004 |
Neg logit contributions | |
scar | -0.002 |
groom | -0.002 |
pony | -0.002 |
burn | -0.002 |
chicken | -0.002 |
Token | qu |
Token ID | 627 |
Feature activation | -2.85e-02 |
Pos logit contributions | |
eway | +0.031 |
kered | +0.027 |
ining | +0.027 |
ooks | +0.026 |
earing | +0.025 |
Neg logit contributions | |
groom | -0.025 |
scar | -0.024 |
burn | -0.022 |
pony | -0.022 |
butter | -0.022 |
Token | arre |
Token ID | 9624 |
Feature activation | -6.04e-02 |
Pos logit contributions | |
eway | +0.051 |
Turns | +0.041 |
ered | +0.039 |
To | +0.039 |
Suz | +0.038 |
Neg logit contributions | |
burn | -0.046 |
scar | -0.042 |
groom | -0.041 |
butter | -0.040 |
syrup | -0.040 |
Token | ling |
Token ID | 1359 |
Feature activation | -3.01e-02 |
Pos logit contributions | |
eway | +0.129 |
ooks | +0.117 |
Turns | +0.113 |
Everything | +0.112 |
Suz | +0.110 |
Neg logit contributions | |
groom | -0.071 |
rob | -0.069 |
scar | -0.068 |
burn | -0.066 |
chicken | -0.064 |
Token | . |
Token ID | 13 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
eway | +0.072 |
ooks | +0.067 |
ining | +0.066 |
Turns | +0.063 |
ered | +0.062 |
Neg logit contributions | |
scar | -0.027 |
pony | -0.026 |
groom | -0.026 |
chicken | -0.026 |
burn | -0.025 |
Token | " |
Token ID | 366 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
eway | +0.033 |
kered | +0.029 |
ered | +0.028 |
rum | +0.027 |
eways | +0.026 |
Neg logit contributions | |
groom | -0.021 |
pony | -0.021 |
salon | -0.020 |
strawberry | -0.020 |
chicken | -0.019 |
Token | I |
Token ID | 40 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
eway | +0.029 |
ered | +0.025 |
ining | +0.025 |
ooks | +0.025 |
rum | +0.025 |
Neg logit contributions | |
groom | -0.018 |
burn | -0.016 |
scar | -0.016 |
pony | -0.016 |
salon | -0.015 |
Token | 'm |
Token ID | 1101 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
eway | +0.026 |
ining | +0.022 |
ooks | +0.021 |
ered | +0.021 |
kered | +0.020 |
Neg logit contributions | |
groom | -0.030 |
scar | -0.028 |
burn | -0.027 |
pony | -0.027 |
salon | -0.026 |
Token |
|
Token ID | 198 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
eway | +0.018 |
kered | +0.016 |
ered | +0.016 |
rum | +0.015 |
eways | +0.015 |
Neg logit contributions | |
burn | -0.011 |
groom | -0.011 |
� | -0.011 |
rob | -0.011 |
scar | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
eway | +0.025 |
ered | +0.023 |
kered | +0.022 |
aged | +0.022 |
rum | +0.021 |
Neg logit contributions | |
rob | -0.014 |
scar | -0.014 |
� | -0.013 |
burn | -0.013 |
groom | -0.013 |
Token | This |
Token ID | 1212 |
Feature activation | +6.29e-03 |
Pos logit contributions | |
eway | +0.026 |
ered | +0.023 |
aged | +0.023 |
ooks | +0.023 |
rum | +0.022 |
Neg logit contributions | |
scar | -0.016 |
rob | -0.015 |
please | -0.015 |
butter | -0.015 |
pony | -0.015 |
Token | story |
Token ID | 1621 |
Feature activation | -7.80e-03 |
Pos logit contributions | |
groom | +0.013 |
scar | +0.012 |
burn | +0.012 |
pony | +0.011 |
salon | +0.011 |
Neg logit contributions | |
eway | -0.009 |
ining | -0.008 |
kered | -0.008 |
ered | -0.008 |
earing | -0.008 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.58e-02 |
Pos logit contributions | |
eway | +0.017 |
ooks | +0.017 |
Suz | +0.016 |
rum | +0.015 |
eways | +0.015 |
Neg logit contributions | |
blows | -0.008 |
rider | -0.008 |
groom | -0.008 |
reads | -0.008 |
butter | -0.007 |
Token | us |
Token ID | 514 |
Feature activation | -6.02e-02 |
Pos logit contributions | |
eway | +0.053 |
ooks | +0.045 |
rum | +0.045 |
ining | +0.045 |
kered | +0.043 |
Neg logit contributions | |
groom | -0.038 |
scar | -0.038 |
ponies | -0.034 |
butter | -0.034 |
pony | -0.034 |
Token | an |
Token ID | 281 |
Feature activation | -4.86e-02 |
Pos logit contributions | |
eway | +0.133 |
Turns | +0.118 |
ining | +0.112 |
ooks | +0.112 |
rum | +0.112 |
Neg logit contributions | |
groom | -0.069 |
chicken | -0.067 |
butter | -0.065 |
scar | -0.064 |
pony | -0.063 |
Token | important |
Token ID | 1593 |
Feature activation | -3.56e-02 |
Pos logit contributions | |
eway | +0.085 |
ining | +0.073 |
ooks | +0.072 |
kered | +0.071 |
Turns | +0.071 |
Neg logit contributions | |
groom | -0.077 |
scar | -0.074 |
pony | -0.073 |
ponies | -0.070 |
burn | -0.069 |
Token | lesson |
Token ID | 11483 |
Feature activation | -2.20e-02 |
Pos logit contributions | |
eway | +0.070 |
ining | +0.064 |
ered | +0.063 |
kered | +0.062 |
ooks | +0.061 |
Neg logit contributions | |
groom | -0.050 |
pony | -0.046 |
scar | -0.045 |
burn | -0.044 |
cane | -0.044 |
Token | - |
Token ID | 532 |
Feature activation | -1.81e-02 |
Pos logit contributions | |
eway | +0.034 |
ining | +0.031 |
kered | +0.031 |
Turns | +0.031 |
ered | +0.030 |
Neg logit contributions | |
groom | -0.035 |
scar | -0.034 |
ponies | -0.034 |
pony | -0.033 |
rob | -0.033 |
Token | we |
Token ID | 356 |
Feature activation | -2.36e-02 |
Pos logit contributions | |
eway | +0.037 |
ining | +0.032 |
kered | +0.032 |
ered | +0.031 |
amed | +0.030 |
Neg logit contributions | |
groom | -0.027 |
scar | -0.025 |
pony | -0.024 |
chicken | -0.024 |
butter | -0.024 |
Token | ending |
Token ID | 7464 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
groom | +0.009 |
scar | +0.009 |
rob | +0.009 |
burn | +0.009 |
salon | +0.008 |
Neg logit contributions | |
eway | -0.008 |
kered | -0.007 |
aged | -0.007 |
ered | -0.007 |
Turns | -0.007 |
Token | of |
Token ID | 286 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
eway | +0.020 |
ooks | +0.018 |
eways | +0.017 |
rum | +0.017 |
ining | +0.017 |
Neg logit contributions | |
salon | -0.013 |
blows | -0.013 |
last | -0.012 |
l | -0.012 |
Velvet | -0.012 |
Token | this |
Token ID | 428 |
Feature activation | +2.79e-04 |
Pos logit contributions | |
eway | +0.022 |
ining | +0.019 |
ered | +0.019 |
kered | +0.018 |
earing | +0.018 |
Neg logit contributions | |
groom | -0.021 |
scar | -0.020 |
burn | -0.020 |
pony | -0.019 |
salon | -0.019 |
Token | story |
Token ID | 1621 |
Feature activation | -3.28e-03 |
Pos logit contributions | |
groom | +0.000 |
scar | +0.000 |
burn | +0.000 |
pony | +0.000 |
rob | +0.000 |
Neg logit contributions | |
eway | -0.000 |
ining | -0.000 |
ered | -0.000 |
kered | -0.000 |
earing | -0.000 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.84e-02 |
Pos logit contributions | |
eway | +0.006 |
ooks | +0.005 |
ining | +0.005 |
rum | +0.005 |
ered | +0.005 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.005 |
pony | -0.005 |
salon | -0.005 |
burn | -0.005 |
Token | us |
Token ID | 514 |
Feature activation | -5.96e-02 |
Pos logit contributions | |
eway | +0.047 |
ining | +0.042 |
ered | +0.041 |
kered | +0.040 |
earing | +0.040 |
Neg logit contributions | |
groom | -0.052 |
scar | -0.048 |
burn | -0.048 |
pony | -0.047 |
rob | -0.045 |
Token | that |
Token ID | 326 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
eway | +0.142 |
Turns | +0.122 |
ining | +0.120 |
rum | +0.116 |
ooks | +0.113 |
Neg logit contributions | |
butter | -0.065 |
groom | -0.064 |
chicken | -0.064 |
scar | -0.060 |
pony | -0.059 |
Token | we |
Token ID | 356 |
Feature activation | -2.79e-02 |
Pos logit contributions | |
eway | +0.020 |
ining | +0.018 |
kered | +0.017 |
ered | +0.017 |
earing | +0.017 |
Neg logit contributions | |
groom | -0.016 |
scar | -0.015 |
pony | -0.014 |
burn | -0.014 |
butter | -0.014 |
Token | should |
Token ID | 815 |
Feature activation | -2.55e-02 |
Pos logit contributions | |
eway | +0.068 |
eways | +0.056 |
ooks | +0.055 |
rum | +0.055 |
kered | +0.054 |
Neg logit contributions | |
groom | -0.033 |
scar | -0.031 |
butter | -0.029 |
prince | -0.026 |
chicken | -0.026 |
Token | not |
Token ID | 407 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
eway | +0.060 |
eways | +0.052 |
and | +0.049 |
Turns | +0.048 |
ining | +0.048 |
Neg logit contributions | |
groom | -0.034 |
salon | -0.029 |
burn | -0.029 |
scar | -0.028 |
butter | -0.028 |
Token | take |
Token ID | 1011 |
Feature activation | -4.05e-03 |
Pos logit contributions | |
eway | +0.030 |
eways | +0.025 |
ining | +0.025 |
kered | +0.024 |
ooks | +0.024 |
Neg logit contributions | |
groom | -0.016 |
burn | -0.015 |
scar | -0.014 |
salon | -0.014 |
pony | -0.013 |
Token | € |
Token ID | 26391 |
Feature activation | +8.88e-03 |
Pos logit contributions | |
eway | +0.021 |
ooks | +0.018 |
eways | +0.017 |
aged | +0.016 |
rum | +0.016 |
Neg logit contributions | |
groom | -0.014 |
rob | -0.014 |
burn | -0.014 |
salon | -0.013 |
poet | -0.013 |
Token | â„¢ |
Token ID | 8151 |
Feature activation | +2.93e-03 |
Pos logit contributions | |
groom | +0.014 |
salon | +0.013 |
burn | +0.013 |
scar | +0.013 |
pony | +0.013 |
Neg logit contributions | |
eway | -0.016 |
kered | -0.014 |
ered | -0.014 |
rum | -0.013 |
ining | -0.013 |
Token | s |
Token ID | 82 |
Feature activation | -1.79e-02 |
Pos logit contributions | |
groom | +0.005 |
burn | +0.005 |
salon | +0.005 |
scar | +0.005 |
pony | +0.005 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.004 |
ered | -0.004 |
kered | -0.004 |
ooks | -0.004 |
Token | story |
Token ID | 1621 |
Feature activation | -9.65e-03 |
Pos logit contributions | |
eway | +0.036 |
ooks | +0.032 |
ining | +0.031 |
rum | +0.031 |
Turns | +0.031 |
Neg logit contributions | |
groom | -0.027 |
scar | -0.025 |
pony | -0.025 |
horse | -0.023 |
chicken | -0.023 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.86e-02 |
Pos logit contributions | |
eway | +0.015 |
ooks | +0.013 |
Turns | +0.012 |
ining | +0.012 |
rum | +0.012 |
Neg logit contributions | |
groom | -0.018 |
scar | -0.016 |
pony | -0.016 |
salon | -0.016 |
burn | -0.016 |
Token | us |
Token ID | 514 |
Feature activation | -5.93e-02 |
Pos logit contributions | |
eway | +0.046 |
ining | +0.040 |
ered | +0.040 |
kered | +0.039 |
earing | +0.038 |
Neg logit contributions | |
groom | -0.053 |
scar | -0.050 |
burn | -0.050 |
pony | -0.048 |
rob | -0.047 |
Token | an |
Token ID | 281 |
Feature activation | -4.04e-02 |
Pos logit contributions | |
eway | +0.123 |
Turns | +0.114 |
ining | +0.108 |
ooks | +0.106 |
kered | +0.106 |
Neg logit contributions | |
groom | -0.073 |
scar | -0.069 |
chicken | -0.068 |
pony | -0.067 |
ponies | -0.066 |
Token | important |
Token ID | 1593 |
Feature activation | -3.40e-02 |
Pos logit contributions | |
eway | +0.069 |
ining | +0.061 |
kered | +0.060 |
ooks | +0.059 |
aged | +0.059 |
Neg logit contributions | |
groom | -0.067 |
scar | -0.064 |
pony | -0.064 |
ponies | -0.061 |
horse | -0.059 |
Token | lesson |
Token ID | 11483 |
Feature activation | -2.42e-02 |
Pos logit contributions | |
eway | +0.063 |
ining | +0.057 |
kered | +0.056 |
ered | +0.056 |
ooks | +0.055 |
Neg logit contributions | |
groom | -0.053 |
scar | -0.050 |
pony | -0.050 |
burn | -0.047 |
horse | -0.046 |
Token | - |
Token ID | 532 |
Feature activation | -1.95e-02 |
Pos logit contributions | |
eway | +0.041 |
ining | +0.038 |
kered | +0.037 |
Turns | +0.036 |
aged | +0.035 |
Neg logit contributions | |
groom | -0.038 |
pony | -0.036 |
scar | -0.036 |
ponies | -0.036 |
salon | -0.035 |
Token | if |
Token ID | 611 |
Feature activation | +2.17e-03 |
Pos logit contributions | |
eway | +0.040 |
kered | +0.035 |
ining | +0.034 |
rum | +0.034 |
ered | +0.033 |
Neg logit contributions | |
groom | -0.030 |
scar | -0.027 |
pony | -0.027 |
ponies | -0.026 |
salon | -0.025 |
Token |
|
Token ID | 198 |
Feature activation | -7.76e-03 |
Pos logit contributions | |
eway | +0.017 |
ered | +0.017 |
kered | +0.017 |
aged | +0.016 |
amed | +0.015 |
Neg logit contributions | |
Rudy | -0.010 |
strawberry | -0.009 |
� | -0.009 |
cones | -0.009 |
cone | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
eway | +0.013 |
kered | +0.011 |
ining | +0.011 |
ered | +0.011 |
ooks | +0.011 |
Neg logit contributions | |
groom | -0.011 |
scar | -0.011 |
pony | -0.011 |
rob | -0.011 |
chicken | -0.011 |
Token | This |
Token ID | 1212 |
Feature activation | +5.34e-03 |
Pos logit contributions | |
eway | +0.022 |
ooks | +0.021 |
earing | +0.020 |
aged | +0.020 |
Suz | +0.020 |
Neg logit contributions | |
groom | -0.016 |
pony | -0.015 |
chicken | -0.015 |
strawberry | -0.015 |
fisherman | -0.015 |
Token | story |
Token ID | 1621 |
Feature activation | -8.97e-03 |
Pos logit contributions | |
groom | +0.009 |
scar | +0.008 |
burn | +0.008 |
pony | +0.008 |
salon | +0.007 |
Neg logit contributions | |
eway | -0.010 |
ining | -0.009 |
ered | -0.009 |
kered | -0.009 |
ooks | -0.009 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
eway | +0.018 |
ooks | +0.017 |
Suz | +0.015 |
rum | +0.015 |
earing | +0.015 |
Neg logit contributions | |
groom | -0.012 |
blows | -0.011 |
butter | -0.011 |
chicken | -0.011 |
rider | -0.011 |
Token | us |
Token ID | 514 |
Feature activation | -5.92e-02 |
Pos logit contributions | |
eway | +0.054 |
ooks | +0.047 |
ining | +0.046 |
rum | +0.046 |
earing | +0.045 |
Neg logit contributions | |
groom | -0.043 |
scar | -0.040 |
ponies | -0.038 |
pony | -0.038 |
chicken | -0.037 |
Token | that |
Token ID | 326 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
eway | +0.132 |
Turns | +0.119 |
rum | +0.114 |
ooks | +0.113 |
ining | +0.112 |
Neg logit contributions | |
groom | -0.066 |
chicken | -0.062 |
butter | -0.061 |
scar | -0.060 |
pony | -0.058 |
Token | it |
Token ID | 340 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
eway | +0.022 |
kered | +0.020 |
ining | +0.020 |
ered | +0.020 |
ooks | +0.019 |
Neg logit contributions | |
groom | -0.016 |
scar | -0.014 |
pony | -0.014 |
chicken | -0.014 |
burn | -0.014 |
Token | 's |
Token ID | 338 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
eway | +0.055 |
ooks | +0.048 |
rum | +0.046 |
kered | +0.044 |
eways | +0.044 |
Neg logit contributions | |
groom | -0.030 |
blows | -0.029 |
chicken | -0.027 |
butter | -0.027 |
reads | -0.026 |
Token | very |
Token ID | 845 |
Feature activation | -3.28e-02 |
Pos logit contributions | |
eway | +0.018 |
kered | +0.015 |
ining | +0.015 |
ered | +0.015 |
ooks | +0.015 |
Neg logit contributions | |
groom | -0.020 |
scar | -0.019 |
burn | -0.018 |
pony | -0.017 |
ponies | -0.017 |
Token | important |
Token ID | 1593 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
eway | +0.071 |
kered | +0.059 |
rum | +0.058 |
aun | +0.056 |
anish | +0.056 |
Neg logit contributions | |
groom | -0.042 |
scar | -0.040 |
bald | -0.038 |
chicken | -0.037 |
butter | -0.035 |
Token | . |
Token ID | 13 |
Feature activation | +3.77e-04 |
Pos logit contributions | |
eway | +0.004 |
ining | +0.003 |
ooks | +0.003 |
kered | +0.003 |
ered | +0.003 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.003 |
burn | -0.003 |
pony | -0.003 |
salon | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | +4.98e-03 |
Pos logit contributions | |
groom | +0.001 |
pony | +0.001 |
scar | +0.001 |
ponies | +0.001 |
salon | +0.001 |
Neg logit contributions | |
eway | -0.001 |
ered | -0.001 |
kered | -0.001 |
ining | -0.000 |
aged | -0.000 |
Token | This |
Token ID | 1212 |
Feature activation | +4.37e-03 |
Pos logit contributions | |
groom | +0.009 |
scar | +0.009 |
pony | +0.009 |
rob | +0.009 |
burn | +0.009 |
Neg logit contributions | |
eway | -0.007 |
kered | -0.006 |
ered | -0.006 |
ining | -0.006 |
ooks | -0.006 |
Token | story |
Token ID | 1621 |
Feature activation | -8.10e-03 |
Pos logit contributions | |
groom | +0.008 |
burn | +0.008 |
scar | +0.008 |
pony | +0.007 |
rob | +0.007 |
Neg logit contributions | |
eway | -0.007 |
ining | -0.006 |
ered | -0.006 |
kered | -0.006 |
earing | -0.006 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.81e-02 |
Pos logit contributions | |
eway | +0.016 |
ooks | +0.016 |
aged | +0.014 |
rum | +0.014 |
Suz | +0.014 |
Neg logit contributions | |
groom | -0.010 |
reads | -0.010 |
scar | -0.010 |
blows | -0.010 |
butter | -0.010 |
Token | us |
Token ID | 514 |
Feature activation | -5.91e-02 |
Pos logit contributions | |
eway | +0.053 |
ining | +0.045 |
ooks | +0.045 |
rum | +0.044 |
kered | +0.043 |
Neg logit contributions | |
groom | -0.046 |
scar | -0.044 |
pony | -0.041 |
ponies | -0.041 |
burn | -0.040 |
Token | that |
Token ID | 326 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
eway | +0.121 |
Turns | +0.114 |
ooks | +0.106 |
rum | +0.106 |
ining | +0.105 |
Neg logit contributions | |
groom | -0.073 |
scar | -0.069 |
chicken | -0.068 |
pony | -0.066 |
ponies | -0.065 |
Token | when |
Token ID | 618 |
Feature activation | -4.48e-03 |
Pos logit contributions | |
eway | +0.025 |
kered | +0.022 |
ining | +0.022 |
ooks | +0.021 |
ered | +0.021 |
Neg logit contributions | |
groom | -0.019 |
scar | -0.017 |
pony | -0.016 |
chicken | -0.016 |
butter | -0.016 |
Token | we |
Token ID | 356 |
Feature activation | -9.31e-03 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.007 |
kered | +0.007 |
ered | +0.007 |
earing | +0.007 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.007 |
burn | -0.006 |
pony | -0.006 |
ponies | -0.006 |
Token | work |
Token ID | 670 |
Feature activation | +2.59e-03 |
Pos logit contributions | |
eway | +0.020 |
ooks | +0.017 |
ining | +0.017 |
rum | +0.017 |
kered | +0.016 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.013 |
burn | -0.011 |
pony | -0.011 |
butter | -0.011 |
Token | hard |
Token ID | 1327 |
Feature activation | +1.31e-02 |
Pos logit contributions | |
groom | +0.005 |
scar | +0.005 |
burn | +0.005 |
pony | +0.005 |
salon | +0.005 |
Neg logit contributions | |
eway | -0.004 |
ining | -0.003 |
kered | -0.003 |
ooks | -0.003 |
rum | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | -4.30e-03 |
Pos logit contributions | |
eway | +0.046 |
ining | +0.040 |
ered | +0.040 |
ooks | +0.040 |
rum | +0.040 |
Neg logit contributions | |
groom | -0.024 |
scar | -0.021 |
burn | -0.021 |
pony | -0.021 |
chicken | -0.021 |
Token | leaving |
Token ID | 4305 |
Feature activation | -6.61e-03 |
Pos logit contributions | |
eway | +0.009 |
kered | +0.008 |
rum | +0.008 |
ered | +0.008 |
ooks | +0.008 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.006 |
pony | -0.005 |
burn | -0.005 |
butter | -0.005 |
Token | it |
Token ID | 340 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
eway | +0.014 |
ining | +0.012 |
rum | +0.012 |
earing | +0.012 |
kered | +0.012 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.008 |
chicken | -0.008 |
pony | -0.008 |
butter | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | -2.58e-03 |
Pos logit contributions | |
eway | +0.049 |
ooks | +0.044 |
kered | +0.042 |
rum | +0.042 |
ining | +0.041 |
Neg logit contributions | |
groom | -0.036 |
scar | -0.033 |
burn | -0.033 |
pony | -0.031 |
butter | -0.031 |
Token | its |
Token ID | 663 |
Feature activation | -9.15e-03 |
Pos logit contributions | |
eway | +0.005 |
ining | +0.004 |
kered | +0.004 |
earing | +0.004 |
ooks | +0.004 |
Neg logit contributions | |
groom | -0.004 |
scar | -0.004 |
burn | -0.004 |
pony | -0.004 |
chicken | -0.004 |
Token | former |
Token ID | 1966 |
Feature activation | -5.91e-02 |
Pos logit contributions | |
eway | +0.017 |
ining | +0.015 |
ered | +0.015 |
kered | +0.015 |
earing | +0.014 |
Neg logit contributions | |
groom | -0.015 |
scar | -0.014 |
burn | -0.013 |
pony | -0.013 |
salon | -0.013 |
Token | state |
Token ID | 1181 |
Feature activation | -2.99e-04 |
Pos logit contributions | |
eway | +0.114 |
taker | +0.098 |
kered | +0.096 |
Everything | +0.096 |
aun | +0.094 |
Neg logit contributions | |
scar | -0.087 |
groom | -0.081 |
strawberries | -0.071 |
butter | -0.070 |
horses | -0.069 |
Token | . |
Token ID | 13 |
Feature activation | +1.94e-03 |
Pos logit contributions | |
eway | +0.001 |
ining | +0.001 |
ered | +0.001 |
kered | +0.001 |
Turns | +0.001 |
Neg logit contributions | |
groom | -0.000 |
scar | -0.000 |
burn | -0.000 |
pony | -0.000 |
salon | -0.000 |
Token | |
Token ID | 220 |
Feature activation | -7.12e-03 |
Pos logit contributions | |
groom | +0.003 |
� | +0.002 |
Nikki | +0.002 |
Rudy | +0.002 |
Velvet | +0.002 |
Neg logit contributions | |
eway | -0.004 |
kered | -0.003 |
ered | -0.003 |
rum | -0.003 |
aged | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | +1.32e-03 |
Pos logit contributions | |
eway | +0.014 |
kered | +0.013 |
ered | +0.012 |
rum | +0.012 |
ining | +0.011 |
Neg logit contributions | |
groom | -0.008 |
� | -0.008 |
Velvet | -0.008 |
burn | -0.008 |
Rudy | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -2.29e-04 |
Pos logit contributions | |
groom | +0.002 |
rob | +0.002 |
scar | +0.002 |
Velvet | +0.002 |
chicken | +0.002 |
Neg logit contributions | |
eway | -0.003 |
ered | -0.002 |
kered | -0.002 |
earing | -0.002 |
rum | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | -3.08e-02 |
Pos logit contributions | |
eway | +0.073 |
kered | +0.064 |
ining | +0.064 |
ooks | +0.063 |
ered | +0.063 |
Neg logit contributions | |
groom | -0.044 |
scar | -0.043 |
burn | -0.040 |
rob | -0.040 |
pony | -0.040 |
Token | story |
Token ID | 1621 |
Feature activation | -2.75e-02 |
Pos logit contributions | |
eway | +0.058 |
ining | +0.052 |
ered | +0.050 |
ooks | +0.050 |
earing | +0.050 |
Neg logit contributions | |
groom | -0.048 |
scar | -0.047 |
pony | -0.044 |
burn | -0.043 |
chicken | -0.042 |
Token | is |
Token ID | 318 |
Feature activation | -4.39e-02 |
Pos logit contributions | |
eway | +0.066 |
ooks | +0.063 |
aded | +0.062 |
Suz | +0.062 |
aged | +0.061 |
Neg logit contributions | |
blows | -0.019 |
reads | -0.018 |
salon | -0.017 |
� | -0.017 |
rider | -0.016 |
Token | : |
Token ID | 25 |
Feature activation | -1.53e-02 |
Pos logit contributions | |
eway | +0.105 |
kered | +0.097 |
rum | +0.091 |
ining | +0.090 |
amed | +0.089 |
Neg logit contributions | |
chicken | -0.039 |
concert | -0.038 |
groom | -0.037 |
bald | -0.037 |
scar | -0.036 |
Token | Qu |
Token ID | 2264 |
Feature activation | -3.88e-04 |
Pos logit contributions | |
eway | +0.031 |
kered | +0.027 |
amed | +0.027 |
ered | +0.026 |
imm | +0.025 |
Neg logit contributions | |
groom | -0.021 |
chicken | -0.020 |
scar | -0.019 |
poet | -0.019 |
pony | -0.018 |
Token | arre |
Token ID | 9624 |
Feature activation | -5.90e-02 |
Pos logit contributions | |
eway | +0.001 |
ered | +0.001 |
aged | +0.001 |
Suz | +0.001 |
rum | +0.001 |
Neg logit contributions | |
scar | -0.000 |
poet | -0.000 |
ara | -0.000 |
groom | -0.000 |
burn | -0.000 |
Token | lling |
Token ID | 2680 |
Feature activation | -3.82e-02 |
Pos logit contributions | |
eway | +0.123 |
ooks | +0.109 |
Turns | +0.109 |
Suz | +0.108 |
To | +0.104 |
Neg logit contributions | |
blows | -0.069 |
groom | -0.069 |
scar | -0.069 |
rob | -0.065 |
butter | -0.062 |
Token | over |
Token ID | 625 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
eway | +0.085 |
ooks | +0.074 |
Suz | +0.072 |
Turns | +0.071 |
rum | +0.069 |
Neg logit contributions | |
groom | -0.041 |
scar | -0.040 |
chicken | -0.039 |
blows | -0.039 |
cane | -0.038 |
Token | small |
Token ID | 1402 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
eway | +0.027 |
ining | +0.024 |
kered | +0.024 |
ered | +0.023 |
ooks | +0.022 |
Neg logit contributions | |
groom | -0.023 |
scar | -0.022 |
pony | -0.021 |
ponies | -0.021 |
burn | -0.021 |
Token | things |
Token ID | 1243 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
eway | +0.022 |
ining | +0.019 |
ered | +0.018 |
kered | +0.018 |
ooks | +0.018 |
Neg logit contributions | |
groom | -0.019 |
scar | -0.018 |
burn | -0.017 |
pony | -0.017 |
salon | -0.017 |
Token | is |
Token ID | 318 |
Feature activation | -1.96e-02 |
Pos logit contributions | |
eway | +0.048 |
ooks | +0.044 |
kered | +0.041 |
Turns | +0.040 |
rum | +0.040 |
Neg logit contributions | |
groom | -0.029 |
scar | -0.028 |
pony | -0.026 |
butter | -0.026 |
cane | -0.025 |
Token | thanked |
Token ID | 26280 |
Feature activation | +5.30e-03 |
Pos logit contributions | |
eway | +0.024 |
ining | +0.020 |
ooks | +0.020 |
rum | +0.020 |
earing | +0.019 |
Neg logit contributions | |
groom | -0.021 |
scar | -0.020 |
burn | -0.019 |
pony | -0.019 |
salon | -0.018 |
Token | the |
Token ID | 262 |
Feature activation | +3.13e-03 |
Pos logit contributions | |
groom | +0.008 |
scar | +0.008 |
burn | +0.008 |
pony | +0.007 |
salon | +0.007 |
Neg logit contributions | |
eway | -0.010 |
ining | -0.009 |
ered | -0.009 |
kered | -0.009 |
ooks | -0.009 |
Token | girl |
Token ID | 2576 |
Feature activation | -8.39e-03 |
Pos logit contributions | |
burn | +0.005 |
scar | +0.005 |
rob | +0.005 |
groom | +0.005 |
syrup | +0.004 |
Neg logit contributions | |
eway | -0.006 |
ining | -0.005 |
ered | -0.005 |
Everyone | -0.005 |
kered | -0.005 |
Token | for |
Token ID | 329 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
eway | +0.016 |
ining | +0.014 |
ered | +0.013 |
kered | +0.013 |
ooks | +0.013 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.013 |
burn | -0.012 |
pony | -0.012 |
ponies | -0.012 |
Token | sharing |
Token ID | 7373 |
Feature activation | -4.93e-03 |
Pos logit contributions | |
eway | +0.028 |
ining | +0.024 |
ooks | +0.024 |
earing | +0.024 |
kered | +0.024 |
Neg logit contributions | |
groom | -0.024 |
scar | -0.022 |
pony | -0.021 |
burn | -0.020 |
butter | -0.020 |
Token | such |
Token ID | 884 |
Feature activation | -5.89e-02 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.008 |
ered | +0.008 |
kered | +0.008 |
ooks | +0.008 |
Neg logit contributions | |
groom | -0.008 |
scar | -0.008 |
burn | -0.007 |
pony | -0.007 |
salon | -0.007 |
Token | a |
Token ID | 257 |
Feature activation | -3.12e-02 |
Pos logit contributions | |
eway | +0.135 |
rum | +0.119 |
ooks | +0.118 |
Turns | +0.118 |
ining | +0.118 |
Neg logit contributions | |
groom | -0.076 |
scar | -0.068 |
pony | -0.064 |
chicken | -0.062 |
butter | -0.062 |
Token | wonderful |
Token ID | 7932 |
Feature activation | -3.27e-02 |
Pos logit contributions | |
eway | +0.063 |
ered | +0.055 |
ining | +0.055 |
rum | +0.054 |
kered | +0.054 |
Neg logit contributions | |
groom | -0.048 |
scar | -0.045 |
pony | -0.044 |
burn | -0.042 |
butter | -0.040 |
Token | gift |
Token ID | 6979 |
Feature activation | -1.63e-02 |
Pos logit contributions | |
eway | +0.069 |
rum | +0.062 |
ining | +0.062 |
kered | +0.062 |
ered | +0.061 |
Neg logit contributions | |
groom | -0.045 |
pony | -0.041 |
scar | -0.041 |
burn | -0.039 |
chicken | -0.037 |
Token | . |
Token ID | 13 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
eway | +0.032 |
ining | +0.028 |
ered | +0.027 |
kered | +0.027 |
ooks | +0.027 |
Neg logit contributions | |
groom | -0.025 |
scar | -0.023 |
burn | -0.023 |
pony | -0.023 |
salon | -0.021 |
Token | The |
Token ID | 383 |
Feature activation | +7.34e-03 |
Pos logit contributions | |
eway | +0.017 |
ered | +0.014 |
kered | +0.013 |
rum | +0.013 |
ining | +0.013 |
Neg logit contributions | |
groom | -0.023 |
pony | -0.021 |
burn | -0.021 |
ponies | -0.021 |
salon | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | -2.83e-03 |
Pos logit contributions | |
eway | +0.020 |
ered | +0.019 |
kered | +0.018 |
aged | +0.017 |
rum | +0.016 |
Neg logit contributions | |
groom | -0.014 |
Velvet | -0.014 |
Elsa | -0.013 |
Rudy | -0.013 |
� | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -8.33e-03 |
Pos logit contributions | |
eway | +0.004 |
ered | +0.004 |
kered | +0.004 |
ining | +0.004 |
earing | +0.004 |
Neg logit contributions | |
groom | -0.005 |
scar | -0.005 |
pony | -0.005 |
rob | -0.005 |
burn | -0.005 |
Token | This |
Token ID | 1212 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
eway | +0.016 |
ered | +0.014 |
aged | +0.014 |
rum | +0.014 |
earing | +0.014 |
Neg logit contributions | |
groom | -0.013 |
salon | -0.011 |
scar | -0.011 |
pony | -0.011 |
poet | -0.011 |
Token | story |
Token ID | 1621 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
groom | +0.021 |
burn | +0.020 |
scar | +0.020 |
rob | +0.019 |
pony | +0.019 |
Neg logit contributions | |
eway | -0.014 |
kered | -0.012 |
ining | -0.012 |
ered | -0.012 |
Everything | -0.011 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.65e-02 |
Pos logit contributions | |
eway | +0.023 |
ooks | +0.021 |
rum | +0.020 |
Suz | +0.020 |
eways | +0.019 |
Neg logit contributions | |
groom | -0.016 |
reads | -0.015 |
salon | -0.014 |
blows | -0.014 |
concert | -0.014 |
Token | us |
Token ID | 514 |
Feature activation | -5.86e-02 |
Pos logit contributions | |
eway | +0.049 |
ining | +0.042 |
ered | +0.040 |
kered | +0.040 |
ooks | +0.040 |
Neg logit contributions | |
groom | -0.045 |
scar | -0.043 |
burn | -0.041 |
pony | -0.040 |
ponies | -0.039 |
Token | an |
Token ID | 281 |
Feature activation | -4.04e-02 |
Pos logit contributions | |
eway | +0.133 |
Turns | +0.119 |
ooks | +0.112 |
ining | +0.112 |
rum | +0.112 |
Neg logit contributions | |
groom | -0.064 |
chicken | -0.060 |
butter | -0.060 |
scar | -0.059 |
pony | -0.058 |
Token | important |
Token ID | 1593 |
Feature activation | -3.28e-02 |
Pos logit contributions | |
eway | +0.067 |
ining | +0.058 |
kered | +0.056 |
ooks | +0.056 |
ered | +0.055 |
Neg logit contributions | |
groom | -0.071 |
scar | -0.068 |
pony | -0.066 |
burn | -0.064 |
ponies | -0.064 |
Token | lesson |
Token ID | 11483 |
Feature activation | -2.26e-02 |
Pos logit contributions | |
eway | +0.062 |
ining | +0.055 |
ered | +0.054 |
kered | +0.053 |
ooks | +0.053 |
Neg logit contributions | |
groom | -0.052 |
scar | -0.048 |
pony | -0.047 |
burn | -0.046 |
chicken | -0.045 |
Token | : |
Token ID | 25 |
Feature activation | -2.18e-02 |
Pos logit contributions | |
eway | +0.037 |
ining | +0.033 |
kered | +0.033 |
Turns | +0.033 |
earing | +0.032 |
Neg logit contributions | |
groom | -0.036 |
scar | -0.034 |
ponies | -0.034 |
pony | -0.034 |
salon | -0.033 |
Token | being |
Token ID | 852 |
Feature activation | -3.37e-02 |
Pos logit contributions | |
eway | +0.044 |
kered | +0.037 |
ining | +0.037 |
ered | +0.036 |
amed | +0.036 |
Neg logit contributions | |
groom | -0.034 |
scar | -0.030 |
chicken | -0.030 |
ponies | -0.029 |
salon | -0.029 |
Token | mom |
Token ID | 1995 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
rob | +0.017 |
groom | +0.016 |
burn | +0.016 |
scar | +0.015 |
pony | +0.014 |
Neg logit contributions | |
eway | -0.017 |
kered | -0.015 |
aged | -0.015 |
ered | -0.014 |
ooks | -0.014 |
Token | smiles |
Token ID | 21845 |
Feature activation | +6.08e-03 |
Pos logit contributions | |
groom | +0.032 |
burn | +0.030 |
pony | +0.028 |
scar | +0.028 |
rob | +0.027 |
Neg logit contributions | |
eway | -0.034 |
ered | -0.033 |
ining | -0.033 |
earing | -0.031 |
kered | -0.031 |
Token | . |
Token ID | 13 |
Feature activation | -4.60e-03 |
Pos logit contributions | |
groom | +0.011 |
scar | +0.011 |
rob | +0.010 |
salon | +0.010 |
burn | +0.010 |
Neg logit contributions | |
eway | -0.010 |
ining | -0.009 |
kered | -0.008 |
ered | -0.008 |
earing | -0.008 |
Token | She |
Token ID | 1375 |
Feature activation | +2.51e-02 |
Pos logit contributions | |
eway | +0.006 |
ining | +0.005 |
ooks | +0.004 |
earing | +0.004 |
kered | +0.004 |
Neg logit contributions | |
groom | -0.010 |
scar | -0.010 |
burn | -0.010 |
pony | -0.010 |
rob | -0.010 |
Token | teaches |
Token ID | 17324 |
Feature activation | -1.86e-02 |
Pos logit contributions | |
burn | +0.046 |
groom | +0.044 |
avail | +0.043 |
salon | +0.040 |
pony | +0.039 |
Neg logit contributions | |
ining | -0.036 |
From | -0.035 |
ered | -0.034 |
eway | -0.034 |
earing | -0.032 |
Token | them |
Token ID | 606 |
Feature activation | -5.86e-02 |
Pos logit contributions | |
eway | +0.023 |
Everyone | +0.020 |
ining | +0.020 |
ered | +0.020 |
kered | +0.020 |
Neg logit contributions | |
burn | -0.039 |
groom | -0.039 |
rob | -0.037 |
pony | -0.036 |
rider | -0.036 |
Token | how |
Token ID | 703 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
eway | +0.142 |
rum | +0.124 |
Turns | +0.124 |
ining | +0.123 |
ered | +0.118 |
Neg logit contributions | |
scar | -0.064 |
chicken | -0.064 |
groom | -0.064 |
strawberries | -0.063 |
butter | -0.061 |
Token | to |
Token ID | 284 |
Feature activation | -5.35e-03 |
Pos logit contributions | |
eway | +0.029 |
ining | +0.025 |
ered | +0.025 |
kered | +0.024 |
rum | +0.024 |
Neg logit contributions | |
groom | -0.023 |
scar | -0.021 |
burn | -0.020 |
pony | -0.020 |
ponies | -0.019 |
Token | be |
Token ID | 307 |
Feature activation | -1.81e-02 |
Pos logit contributions | |
eway | +0.011 |
ining | +0.010 |
kered | +0.009 |
ered | +0.009 |
earing | +0.009 |
Neg logit contributions | |
groom | -0.008 |
scar | -0.007 |
burn | -0.007 |
pony | -0.007 |
salon | -0.007 |
Token | safe |
Token ID | 3338 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
eway | +0.036 |
ered | +0.030 |
ining | +0.030 |
kered | +0.030 |
earing | +0.029 |
Neg logit contributions | |
groom | -0.030 |
scar | -0.028 |
pony | -0.026 |
burn | -0.026 |
chicken | -0.026 |
Token | with |
Token ID | 351 |
Feature activation | -2.28e-02 |
Pos logit contributions | |
eway | +0.027 |
ining | +0.024 |
ered | +0.023 |
kered | +0.023 |
ooks | +0.023 |
Neg logit contributions | |
groom | -0.027 |
scar | -0.025 |
burn | -0.024 |
pony | -0.024 |
salon | -0.023 |
Token |
|
Token ID | 198 |
Feature activation | -8.38e-03 |
Pos logit contributions | |
eway | +0.015 |
ered | +0.013 |
kered | +0.013 |
rum | +0.012 |
ining | +0.012 |
Neg logit contributions | |
groom | -0.012 |
burn | -0.012 |
scar | -0.012 |
pony | -0.011 |
Velvet | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | -8.84e-03 |
Pos logit contributions | |
eway | +0.015 |
ered | +0.013 |
ooks | +0.013 |
earing | +0.012 |
rum | +0.012 |
Neg logit contributions | |
groom | -0.013 |
scar | -0.012 |
rob | -0.012 |
pony | -0.012 |
burn | -0.012 |
Token | This |
Token ID | 1212 |
Feature activation | +4.84e-03 |
Pos logit contributions | |
eway | +0.016 |
ered | +0.015 |
ooks | +0.014 |
Suz | +0.014 |
rum | +0.014 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.012 |
pony | -0.012 |
burn | -0.012 |
poet | -0.012 |
Token | story |
Token ID | 1621 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
groom | +0.009 |
scar | +0.009 |
burn | +0.009 |
salon | +0.008 |
pony | +0.008 |
Neg logit contributions | |
eway | -0.008 |
ining | -0.007 |
ered | -0.007 |
kered | -0.007 |
earing | -0.006 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.97e-02 |
Pos logit contributions | |
eway | +0.022 |
ooks | +0.022 |
and | +0.020 |
rum | +0.020 |
Suz | +0.019 |
Neg logit contributions | |
groom | -0.013 |
blows | -0.012 |
scar | -0.012 |
butter | -0.012 |
reads | -0.011 |
Token | us |
Token ID | 514 |
Feature activation | -5.84e-02 |
Pos logit contributions | |
eway | +0.054 |
ining | +0.047 |
ooks | +0.045 |
ered | +0.045 |
kered | +0.045 |
Neg logit contributions | |
groom | -0.051 |
scar | -0.048 |
burn | -0.045 |
pony | -0.045 |
ponies | -0.044 |
Token | an |
Token ID | 281 |
Feature activation | -4.69e-02 |
Pos logit contributions | |
eway | +0.122 |
Turns | +0.112 |
ooks | +0.106 |
ining | +0.104 |
rum | +0.103 |
Neg logit contributions | |
groom | -0.072 |
scar | -0.070 |
chicken | -0.068 |
pony | -0.066 |
butter | -0.065 |
Token | important |
Token ID | 1593 |
Feature activation | -3.72e-02 |
Pos logit contributions | |
eway | +0.078 |
ining | +0.066 |
ooks | +0.065 |
kered | +0.065 |
Turns | +0.064 |
Neg logit contributions | |
groom | -0.081 |
scar | -0.078 |
pony | -0.076 |
burn | -0.074 |
ponies | -0.073 |
Token | lesson |
Token ID | 11483 |
Feature activation | -2.45e-02 |
Pos logit contributions | |
eway | +0.071 |
ining | +0.064 |
ered | +0.063 |
ooks | +0.062 |
kered | +0.062 |
Neg logit contributions | |
groom | -0.055 |
scar | -0.052 |
pony | -0.051 |
burn | -0.050 |
chicken | -0.048 |
Token | : |
Token ID | 25 |
Feature activation | -2.09e-02 |
Pos logit contributions | |
eway | +0.036 |
ining | +0.034 |
Turns | +0.033 |
kered | +0.033 |
aged | +0.033 |
Neg logit contributions | |
groom | -0.040 |
scar | -0.039 |
ponies | -0.039 |
pony | -0.038 |
horse | -0.037 |
Token | to |
Token ID | 284 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
eway | +0.040 |
kered | +0.034 |
ining | +0.033 |
ered | +0.033 |
rum | +0.032 |
Neg logit contributions | |
groom | -0.034 |
scar | -0.031 |
burn | -0.030 |
pony | -0.029 |
chicken | -0.029 |
Token |
|
Token ID | 198 |
Feature activation | -2.67e-03 |
Pos logit contributions | |
groom | +0.000 |
scar | +0.000 |
burn | +0.000 |
pony | +0.000 |
salon | +0.000 |
Neg logit contributions | |
eway | -0.000 |
kered | -0.000 |
ered | -0.000 |
ining | -0.000 |
rum | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | -7.03e-03 |
Pos logit contributions | |
eway | +0.004 |
ered | +0.004 |
kered | +0.004 |
ining | +0.004 |
aged | +0.003 |
Neg logit contributions | |
groom | -0.005 |
scar | -0.005 |
pony | -0.005 |
burn | -0.004 |
rob | -0.004 |
Token | This |
Token ID | 1212 |
Feature activation | +5.60e-03 |
Pos logit contributions | |
eway | +0.013 |
ered | +0.012 |
kered | +0.012 |
aged | +0.012 |
ining | +0.011 |
Neg logit contributions | |
groom | -0.011 |
scar | -0.010 |
pony | -0.010 |
salon | -0.009 |
burn | -0.009 |
Token | story |
Token ID | 1621 |
Feature activation | -7.40e-03 |
Pos logit contributions | |
groom | +0.010 |
burn | +0.010 |
scar | +0.010 |
rob | +0.009 |
pony | +0.009 |
Neg logit contributions | |
eway | -0.009 |
ining | -0.008 |
ered | -0.008 |
kered | -0.008 |
earing | -0.008 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.71e-02 |
Pos logit contributions | |
eway | +0.016 |
ooks | +0.015 |
rum | +0.014 |
Suz | +0.014 |
aged | +0.014 |
Neg logit contributions | |
groom | -0.009 |
reads | -0.008 |
butter | -0.008 |
salon | -0.008 |
pony | -0.008 |
Token | us |
Token ID | 514 |
Feature activation | -5.78e-02 |
Pos logit contributions | |
eway | +0.050 |
ining | +0.043 |
ooks | +0.042 |
ered | +0.042 |
kered | +0.041 |
Neg logit contributions | |
groom | -0.046 |
scar | -0.043 |
pony | -0.041 |
burn | -0.040 |
ponies | -0.040 |
Token | that |
Token ID | 326 |
Feature activation | -1.00e-02 |
Pos logit contributions | |
eway | +0.123 |
Turns | +0.109 |
ining | +0.105 |
rum | +0.103 |
ooks | +0.103 |
Neg logit contributions | |
groom | -0.072 |
chicken | -0.069 |
butter | -0.068 |
scar | -0.067 |
pony | -0.065 |
Token | when |
Token ID | 618 |
Feature activation | -1.63e-03 |
Pos logit contributions | |
eway | +0.020 |
ining | +0.018 |
kered | +0.017 |
ered | +0.017 |
ooks | +0.017 |
Neg logit contributions | |
groom | -0.015 |
scar | -0.014 |
butter | -0.014 |
chicken | -0.014 |
pony | -0.014 |
Token | we |
Token ID | 356 |
Feature activation | -5.19e-03 |
Pos logit contributions | |
eway | +0.003 |
ining | +0.003 |
kered | +0.003 |
ered | +0.003 |
earing | +0.003 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.002 |
burn | -0.002 |
pony | -0.002 |
ponies | -0.002 |
Token | do |
Token ID | 466 |
Feature activation | +2.09e-05 |
Pos logit contributions | |
eway | +0.011 |
ining | +0.010 |
ooks | +0.010 |
rum | +0.009 |
kered | +0.009 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.007 |
burn | -0.006 |
butter | -0.006 |
pony | -0.006 |
Token | something |
Token ID | 1223 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
groom | +0.000 |
scar | +0.000 |
pony | +0.000 |
butter | +0.000 |
chicken | +0.000 |
Neg logit contributions | |
eway | -0.000 |
ining | -0.000 |
kered | -0.000 |
ooks | -0.000 |
ered | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | +4.43e-03 |
Pos logit contributions | |
eway | +0.000 |
ered | +0.000 |
kered | +0.000 |
ining | +0.000 |
rum | +0.000 |
Neg logit contributions | |
scar | -0.000 |
groom | -0.000 |
Velvet | -0.000 |
burn | -0.000 |
bald | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | -1.38e-04 |
Pos logit contributions | |
groom | +0.008 |
scar | +0.008 |
burn | +0.008 |
pony | +0.008 |
rob | +0.008 |
Neg logit contributions | |
eway | -0.007 |
ining | -0.006 |
ered | -0.005 |
kered | -0.005 |
rum | -0.005 |
Token | This |
Token ID | 1212 |
Feature activation | +5.27e-03 |
Pos logit contributions | |
eway | +0.000 |
ered | +0.000 |
ining | +0.000 |
kered | +0.000 |
rum | +0.000 |
Neg logit contributions | |
scar | -0.000 |
groom | -0.000 |
burn | -0.000 |
pony | -0.000 |
rob | -0.000 |
Token | story |
Token ID | 1621 |
Feature activation | -8.74e-03 |
Pos logit contributions | |
groom | +0.009 |
burn | +0.009 |
scar | +0.009 |
pony | +0.008 |
salon | +0.008 |
Neg logit contributions | |
eway | -0.009 |
ining | -0.008 |
ered | -0.008 |
kered | -0.008 |
Turns | -0.007 |
Token | teaches |
Token ID | 17324 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
ooks | +0.016 |
eway | +0.016 |
rum | +0.014 |
and | +0.014 |
Suz | +0.014 |
Neg logit contributions | |
blows | -0.012 |
groom | -0.012 |
scar | -0.011 |
rider | -0.011 |
butter | -0.011 |
Token | us |
Token ID | 514 |
Feature activation | -5.77e-02 |
Pos logit contributions | |
eway | +0.048 |
ining | +0.041 |
ooks | +0.039 |
rum | +0.039 |
ered | +0.039 |
Neg logit contributions | |
groom | -0.044 |
scar | -0.043 |
burn | -0.040 |
pony | -0.040 |
ponies | -0.039 |
Token | that |
Token ID | 326 |
Feature activation | -9.98e-03 |
Pos logit contributions | |
eway | +0.123 |
Turns | +0.114 |
ining | +0.107 |
ooks | +0.107 |
rum | +0.105 |
Neg logit contributions | |
groom | -0.066 |
scar | -0.066 |
chicken | -0.065 |
pony | -0.063 |
butter | -0.062 |
Token | it |
Token ID | 340 |
Feature activation | -2.45e-02 |
Pos logit contributions | |
eway | +0.019 |
ining | +0.017 |
kered | +0.017 |
ered | +0.017 |
ooks | +0.017 |
Neg logit contributions | |
groom | -0.016 |
scar | -0.015 |
pony | -0.014 |
burn | -0.014 |
chicken | -0.014 |
Token | 's |
Token ID | 338 |
Feature activation | -9.74e-03 |
Pos logit contributions | |
eway | +0.054 |
ooks | +0.048 |
rum | +0.045 |
kered | +0.044 |
aun | +0.044 |
Neg logit contributions | |
groom | -0.029 |
blows | -0.028 |
chicken | -0.027 |
scar | -0.027 |
butter | -0.026 |
Token | important |
Token ID | 1593 |
Feature activation | -1.56e-02 |
Pos logit contributions | |
eway | +0.015 |
ining | +0.013 |
ered | +0.012 |
kered | +0.012 |
ooks | +0.012 |
Neg logit contributions | |
groom | -0.019 |
scar | -0.018 |
burn | -0.018 |
pony | -0.017 |
salon | -0.017 |
Token | to |
Token ID | 284 |
Feature activation | -9.87e-03 |
Pos logit contributions | |
eway | +0.034 |
kered | +0.031 |
ining | +0.031 |
ooks | +0.030 |
Turns | +0.030 |
Neg logit contributions | |
groom | -0.018 |
scar | -0.017 |
pony | -0.016 |
cane | -0.016 |
burn | -0.015 |
Token | They |
Token ID | 1119 |
Feature activation | -2.14e-03 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.008 |
ered | +0.008 |
kered | +0.008 |
rum | +0.007 |
Neg logit contributions | |
groom | -0.017 |
scar | -0.016 |
burn | -0.015 |
pony | -0.015 |
salon | -0.015 |
Token | liked |
Token ID | 8288 |
Feature activation | +2.14e-02 |
Pos logit contributions | |
eway | +0.004 |
ining | +0.004 |
ered | +0.003 |
kered | +0.003 |
ooks | +0.003 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.003 |
burn | -0.003 |
pony | -0.003 |
rob | -0.003 |
Token | to |
Token ID | 284 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
groom | +0.041 |
burn | +0.038 |
rob | +0.038 |
scar | +0.038 |
pony | +0.036 |
Neg logit contributions | |
eway | -0.033 |
ining | -0.028 |
ered | -0.027 |
earing | -0.026 |
kered | -0.026 |
Token | swing |
Token ID | 9628 |
Feature activation | +3.73e-02 |
Pos logit contributions | |
groom | +0.016 |
burn | +0.015 |
scar | +0.015 |
rob | +0.015 |
ponies | +0.014 |
Neg logit contributions | |
eway | -0.020 |
ered | -0.019 |
ining | -0.017 |
Suz | -0.016 |
kered | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
groom | +0.075 |
burn | +0.067 |
scar | +0.067 |
pony | +0.066 |
salon | +0.065 |
Neg logit contributions | |
eway | -0.058 |
ining | -0.049 |
ered | -0.048 |
kered | -0.047 |
ooks | -0.045 |
Token | slide |
Token ID | 10649 |
Feature activation | +3.30e-02 |
Pos logit contributions | |
groom | +0.018 |
burn | +0.016 |
scar | +0.016 |
pony | +0.015 |
rob | +0.015 |
Neg logit contributions | |
eway | -0.032 |
ered | -0.029 |
ining | -0.028 |
Suz | -0.028 |
kered | -0.028 |
Token | and |
Token ID | 290 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
groom | +0.068 |
poet | +0.061 |
scar | +0.060 |
burn | +0.059 |
salon | +0.058 |
Neg logit contributions | |
eway | -0.049 |
ining | -0.042 |
ered | -0.042 |
kered | -0.040 |
itself | -0.039 |
Token | run |
Token ID | 1057 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
groom | +0.020 |
burn | +0.018 |
scar | +0.018 |
rob | +0.017 |
pony | +0.017 |
Neg logit contributions | |
eway | -0.028 |
ered | -0.024 |
ining | -0.024 |
Suz | -0.023 |
kered | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | +3.86e-03 |
Pos logit contributions | |
groom | +0.038 |
scar | +0.036 |
burn | +0.034 |
pony | +0.034 |
rob | +0.032 |
Neg logit contributions | |
eway | -0.043 |
ining | -0.037 |
ered | -0.036 |
kered | -0.036 |
ooks | -0.036 |
Token | They |
Token ID | 1119 |
Feature activation | -1.32e-04 |
Pos logit contributions | |
groom | +0.008 |
scar | +0.008 |
burn | +0.008 |
pony | +0.008 |
salon | +0.007 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.004 |
ered | -0.004 |
kered | -0.004 |
ooks | -0.004 |
Token | saw |
Token ID | 2497 |
Feature activation | +1.17e-03 |
Pos logit contributions | |
eway | +0.000 |
ered | +0.000 |
lived | +0.000 |
ining | +0.000 |
Suz | +0.000 |
Neg logit contributions | |
burn | -0.000 |
groom | -0.000 |
scar | -0.000 |
rob | -0.000 |
pony | -0.000 |
Token | with |
Token ID | 351 |
Feature activation | -5.26e-03 |
Pos logit contributions | |
eway | +0.036 |
Turns | +0.031 |
ining | +0.030 |
ered | +0.030 |
kered | +0.030 |
Neg logit contributions | |
burn | -0.019 |
pony | -0.018 |
groom | -0.018 |
scar | -0.017 |
cane | -0.017 |
Token | his |
Token ID | 465 |
Feature activation | -5.57e-03 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.008 |
ered | +0.007 |
kered | +0.007 |
ooks | +0.007 |
Neg logit contributions | |
groom | -0.010 |
scar | -0.009 |
burn | -0.009 |
pony | -0.009 |
salon | -0.008 |
Token | cable |
Token ID | 7862 |
Feature activation | -5.37e-03 |
Pos logit contributions | |
eway | +0.011 |
ining | +0.010 |
ered | +0.010 |
kered | +0.010 |
ooks | +0.010 |
Neg logit contributions | |
groom | -0.008 |
scar | -0.008 |
pony | -0.007 |
burn | -0.007 |
ponies | -0.007 |
Token | so |
Token ID | 523 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.009 |
ered | +0.008 |
kered | +0.008 |
ooks | +0.008 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.008 |
burn | -0.008 |
pony | -0.008 |
salon | -0.008 |
Token | it |
Token ID | 340 |
Feature activation | -5.72e-03 |
Pos logit contributions | |
eway | +0.024 |
ining | +0.021 |
ered | +0.020 |
ooks | +0.020 |
rum | +0.020 |
Neg logit contributions | |
groom | -0.016 |
scar | -0.016 |
pony | -0.015 |
burn | -0.015 |
ponies | -0.014 |
Token | wouldn |
Token ID | 3636 |
Feature activation | +2.67e-02 |
Pos logit contributions | |
eway | +0.011 |
ooks | +0.010 |
rum | +0.009 |
ining | +0.009 |
earing | +0.009 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.009 |
pony | -0.008 |
burn | -0.008 |
butter | -0.008 |
Token | 't |
Token ID | 470 |
Feature activation | -4.39e-03 |
Pos logit contributions | |
groom | +0.054 |
scar | +0.051 |
burn | +0.050 |
pony | +0.050 |
salon | +0.048 |
Neg logit contributions | |
eway | -0.039 |
ining | -0.033 |
ered | -0.031 |
kered | -0.031 |
ooks | -0.031 |
Token | get |
Token ID | 651 |
Feature activation | +7.22e-03 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.008 |
ered | +0.008 |
kered | +0.008 |
ooks | +0.008 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.006 |
burn | -0.006 |
pony | -0.006 |
salon | -0.005 |
Token | lost |
Token ID | 2626 |
Feature activation | -7.65e-03 |
Pos logit contributions | |
groom | +0.010 |
scar | +0.010 |
burn | +0.009 |
pony | +0.009 |
salon | +0.009 |
Neg logit contributions | |
eway | -0.015 |
ining | -0.013 |
ered | -0.013 |
kered | -0.013 |
ooks | -0.013 |
Token | again |
Token ID | 757 |
Feature activation | +8.96e-03 |
Pos logit contributions | |
eway | +0.015 |
ining | +0.013 |
ered | +0.013 |
kered | +0.012 |
ooks | +0.012 |
Neg logit contributions | |
groom | -0.012 |
scar | -0.011 |
burn | -0.011 |
pony | -0.011 |
salon | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | -8.67e-03 |
Pos logit contributions | |
groom | +0.016 |
scar | +0.015 |
burn | +0.014 |
pony | +0.014 |
salon | +0.014 |
Neg logit contributions | |
eway | -0.016 |
ining | -0.014 |
ered | -0.013 |
rum | -0.013 |
kered | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | +6.27e-03 |
Pos logit contributions | |
groom | +0.020 |
scar | +0.019 |
burn | +0.018 |
pony | +0.018 |
salon | +0.017 |
Neg logit contributions | |
eway | -0.023 |
ining | -0.020 |
ered | -0.020 |
kered | -0.020 |
ooks | -0.019 |
Token | put |
Token ID | 1234 |
Feature activation | +9.68e-03 |
Pos logit contributions | |
groom | +0.010 |
rob | +0.010 |
burn | +0.010 |
ponies | +0.010 |
pony | +0.009 |
Neg logit contributions | |
ered | -0.010 |
eway | -0.010 |
kered | -0.009 |
aged | -0.009 |
ining | -0.009 |
Token | it |
Token ID | 340 |
Feature activation | -4.41e-03 |
Pos logit contributions | |
groom | +0.019 |
scar | +0.017 |
salon | +0.017 |
burn | +0.017 |
pony | +0.017 |
Neg logit contributions | |
eway | -0.014 |
ered | -0.013 |
ining | -0.013 |
kered | -0.012 |
itself | -0.012 |
Token | on |
Token ID | 319 |
Feature activation | -1.15e-03 |
Pos logit contributions | |
eway | +0.008 |
ining | +0.007 |
ooks | +0.007 |
ered | +0.007 |
kered | +0.007 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.007 |
burn | -0.007 |
pony | -0.007 |
butter | -0.006 |
Token | his |
Token ID | 465 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.002 |
ered | +0.002 |
kered | +0.002 |
earing | +0.002 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.002 |
burn | -0.002 |
rob | -0.002 |
pony | -0.002 |
Token | knee |
Token ID | 10329 |
Feature activation | +4.28e-02 |
Pos logit contributions | |
groom | +0.023 |
rob | +0.023 |
burn | +0.021 |
poet | +0.021 |
scar | +0.020 |
Neg logit contributions | |
eway | -0.014 |
aged | -0.014 |
itself | -0.014 |
rum | -0.013 |
kered | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -5.86e-04 |
Pos logit contributions | |
groom | +0.078 |
scar | +0.070 |
rob | +0.068 |
pony | +0.068 |
burn | +0.067 |
Neg logit contributions | |
eway | -0.071 |
ining | -0.062 |
kered | -0.062 |
ered | -0.061 |
aged | -0.060 |
Token | She |
Token ID | 1375 |
Feature activation | +9.77e-03 |
Pos logit contributions | |
eway | +0.001 |
ining | +0.001 |
ered | +0.001 |
kered | +0.001 |
rum | +0.001 |
Neg logit contributions | |
groom | -0.001 |
scar | -0.001 |
burn | -0.001 |
pony | -0.001 |
salon | -0.001 |
Token | said |
Token ID | 531 |
Feature activation | -5.14e-03 |
Pos logit contributions | |
groom | +0.017 |
burn | +0.017 |
avail | +0.017 |
ponies | +0.016 |
pony | +0.016 |
Neg logit contributions | |
ered | -0.013 |
kered | -0.013 |
aged | -0.013 |
ining | -0.013 |
lived | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | +2.30e-03 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.008 |
ered | +0.007 |
kered | +0.007 |
ooks | +0.007 |
Neg logit contributions | |
groom | -0.010 |
scar | -0.009 |
pony | -0.009 |
burn | -0.009 |
butter | -0.008 |
Token | " |
Token ID | 366 |
Feature activation | -2.05e-03 |
Pos logit contributions | |
groom | +0.004 |
scar | +0.004 |
pony | +0.004 |
burn | +0.004 |
chicken | +0.004 |
Neg logit contributions | |
eway | -0.004 |
ered | -0.003 |
kered | -0.003 |
ining | -0.003 |
ooks | -0.003 |
Token | cat |
Token ID | 3797 |
Feature activation | -8.90e-03 |
Pos logit contributions | |
groom | +0.004 |
scar | +0.004 |
pony | +0.004 |
burn | +0.004 |
ponies | +0.003 |
Neg logit contributions | |
eway | -0.006 |
ining | -0.005 |
ooks | -0.005 |
ered | -0.005 |
kered | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -1.34e-02 |
Pos logit contributions | |
eway | +0.017 |
ining | +0.015 |
ooks | +0.015 |
ered | +0.015 |
kered | +0.015 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.013 |
pony | -0.013 |
burn | -0.013 |
ponies | -0.012 |
Token | She |
Token ID | 1375 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
eway | +0.026 |
ered | +0.023 |
kered | +0.022 |
rum | +0.021 |
ining | +0.021 |
Neg logit contributions | |
pony | -0.021 |
groom | -0.020 |
scar | -0.020 |
Velvet | -0.020 |
chicken | -0.020 |
Token | never |
Token ID | 1239 |
Feature activation | +1.87e-02 |
Pos logit contributions | |
eway | +0.021 |
ining | +0.019 |
ered | +0.019 |
kered | +0.018 |
earing | +0.018 |
Neg logit contributions | |
groom | -0.021 |
scar | -0.019 |
burn | -0.019 |
pony | -0.019 |
rob | -0.018 |
Token | saw |
Token ID | 2497 |
Feature activation | +6.24e-03 |
Pos logit contributions | |
groom | +0.034 |
rob | +0.033 |
pony | +0.033 |
burn | +0.032 |
ponies | +0.032 |
Neg logit contributions | |
eway | -0.026 |
ered | -0.026 |
ining | -0.025 |
earing | -0.025 |
kered | -0.024 |
Token | Mitt |
Token ID | 16627 |
Feature activation | +3.01e-02 |
Pos logit contributions | |
groom | +0.012 |
scar | +0.011 |
rob | +0.011 |
burn | +0.011 |
salon | +0.011 |
Neg logit contributions | |
eway | -0.009 |
ered | -0.008 |
ining | -0.008 |
itself | -0.008 |
kered | -0.008 |
Token | ens |
Token ID | 641 |
Feature activation | -4.85e-03 |
Pos logit contributions | |
groom | +0.037 |
salon | +0.029 |
scar | +0.027 |
bride | +0.027 |
pony | +0.025 |
Neg logit contributions | |
eway | -0.066 |
kered | -0.063 |
ining | -0.063 |
earing | -0.062 |
Everything | -0.062 |
Token | again |
Token ID | 757 |
Feature activation | -7.59e-03 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.009 |
ered | +0.009 |
kered | +0.009 |
earing | +0.009 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.006 |
burn | -0.006 |
pony | -0.006 |
rob | -0.006 |
Token | and |
Token ID | 290 |
Feature activation | +5.31e-04 |
Pos logit contributions | |
eway | +0.014 |
ining | +0.012 |
ered | +0.012 |
kered | +0.011 |
ooks | +0.011 |
Neg logit contributions | |
groom | -0.013 |
scar | -0.012 |
burn | -0.012 |
pony | -0.012 |
salon | -0.011 |
Token | learned |
Token ID | 4499 |
Feature activation | -2.54e-02 |
Pos logit contributions | |
groom | +0.001 |
scar | +0.001 |
burn | +0.001 |
pony | +0.001 |
salon | +0.001 |
Neg logit contributions | |
eway | -0.001 |
ining | -0.001 |
kered | -0.001 |
ooks | -0.001 |
ered | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
eway | +0.052 |
ining | +0.046 |
ooks | +0.045 |
kered | +0.045 |
Turns | +0.044 |
Neg logit contributions | |
groom | -0.036 |
scar | -0.035 |
pony | -0.035 |
burn | -0.034 |
ponies | -0.032 |
Token | record |
Token ID | 1700 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
groom | +0.022 |
scar | +0.021 |
burn | +0.020 |
pony | +0.020 |
rob | +0.019 |
Neg logit contributions | |
eway | -0.027 |
ining | -0.024 |
ered | -0.023 |
kered | -0.023 |
earing | -0.023 |
Token | my |
Token ID | 616 |
Feature activation | +1.70e-02 |
Pos logit contributions | |
groom | +0.030 |
scar | +0.028 |
burn | +0.027 |
pony | +0.027 |
salon | +0.026 |
Neg logit contributions | |
eway | -0.031 |
ining | -0.027 |
ered | -0.026 |
kered | -0.026 |
ooks | -0.026 |
Token | voice |
Token ID | 3809 |
Feature activation | +9.41e-03 |
Pos logit contributions | |
groom | +0.027 |
burn | +0.025 |
scar | +0.025 |
rob | +0.024 |
salon | +0.024 |
Neg logit contributions | |
eway | -0.032 |
ining | -0.028 |
ered | -0.027 |
kered | -0.027 |
earing | -0.026 |
Token | later |
Token ID | 1568 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
groom | +0.014 |
rob | +0.013 |
scar | +0.013 |
burn | +0.013 |
pony | +0.012 |
Neg logit contributions | |
eway | -0.017 |
ining | -0.016 |
ered | -0.016 |
earing | -0.015 |
kered | -0.014 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
groom | +0.051 |
scar | +0.049 |
rob | +0.049 |
burn | +0.045 |
pony | +0.044 |
Neg logit contributions | |
eway | -0.044 |
ered | -0.041 |
Everyone | -0.040 |
ining | -0.040 |
To | -0.040 |
Token | he |
Token ID | 339 |
Feature activation | +3.64e-02 |
Pos logit contributions | |
groom | +0.053 |
scar | +0.050 |
pony | +0.050 |
burn | +0.048 |
chicken | +0.048 |
Neg logit contributions | |
eway | -0.046 |
ining | -0.039 |
kered | -0.038 |
ered | -0.037 |
ooks | -0.036 |
Token | asked |
Token ID | 1965 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
burn | +0.060 |
rob | +0.057 |
groom | +0.057 |
salon | +0.055 |
pony | +0.054 |
Neg logit contributions | |
eway | -0.058 |
ered | -0.057 |
ining | -0.056 |
kered | -0.056 |
aged | -0.054 |
Token | . |
Token ID | 13 |
Feature activation | +8.96e-03 |
Pos logit contributions | |
groom | +0.018 |
scar | +0.016 |
burn | +0.016 |
pony | +0.016 |
rob | +0.015 |
Neg logit contributions | |
eway | -0.020 |
ining | -0.017 |
ered | -0.017 |
kered | -0.017 |
ooks | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | +7.67e-03 |
Pos logit contributions | |
groom | +0.013 |
pony | +0.012 |
scar | +0.012 |
burn | +0.011 |
chicken | +0.011 |
Neg logit contributions | |
eway | -0.018 |
ered | -0.016 |
ining | -0.016 |
kered | -0.016 |
earing | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | -5.16e-03 |
Pos logit contributions | |
groom | +0.012 |
scar | +0.012 |
pony | +0.011 |
burn | +0.011 |
chicken | +0.011 |
Neg logit contributions | |
eway | -0.014 |
ining | -0.012 |
ered | -0.012 |
kered | -0.012 |
earing | -0.011 |
Token | " |
Token ID | 1 |
Feature activation | -1.39e-03 |
Pos logit contributions | |
eway | +0.010 |
ining | +0.009 |
ered | +0.009 |
eways | +0.009 |
Everything | +0.009 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.007 |
pony | -0.007 |
horse | -0.007 |
burn | -0.006 |
Token | make |
Token ID | 787 |
Feature activation | -1.76e-02 |
Pos logit contributions | |
groom | +0.019 |
scar | +0.018 |
burn | +0.017 |
rob | +0.017 |
pony | +0.017 |
Neg logit contributions | |
eway | -0.024 |
ered | -0.022 |
ining | -0.021 |
kered | -0.021 |
rum | -0.020 |
Token | fun |
Token ID | 1257 |
Feature activation | -7.78e-03 |
Pos logit contributions | |
eway | +0.032 |
ining | +0.028 |
ered | +0.027 |
kered | +0.027 |
ooks | +0.027 |
Neg logit contributions | |
groom | -0.030 |
scar | -0.028 |
burn | -0.027 |
pony | -0.027 |
ponies | -0.026 |
Token | of |
Token ID | 286 |
Feature activation | -4.34e-03 |
Pos logit contributions | |
eway | +0.012 |
ining | +0.011 |
ered | +0.011 |
earing | +0.011 |
ooks | +0.010 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.014 |
pony | -0.013 |
chicken | -0.013 |
burn | -0.013 |
Token | the |
Token ID | 262 |
Feature activation | -6.34e-03 |
Pos logit contributions | |
eway | +0.008 |
ining | +0.007 |
ered | +0.007 |
kered | +0.006 |
ooks | +0.006 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.007 |
burn | -0.007 |
pony | -0.007 |
salon | -0.006 |
Token | other |
Token ID | 584 |
Feature activation | +3.14e-03 |
Pos logit contributions | |
eway | +0.011 |
ining | +0.011 |
kered | +0.010 |
ered | +0.010 |
itself | +0.010 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.009 |
burn | -0.009 |
rob | -0.009 |
salon | -0.009 |
Token | ducks |
Token ID | 39694 |
Feature activation | -7.47e-03 |
Pos logit contributions | |
groom | +0.005 |
scar | +0.004 |
salon | +0.004 |
poet | +0.004 |
burn | +0.004 |
Neg logit contributions | |
eway | -0.006 |
ining | -0.005 |
ered | -0.005 |
kered | -0.005 |
itself | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -5.14e-03 |
Pos logit contributions | |
eway | +0.014 |
ining | +0.012 |
ered | +0.012 |
kered | +0.012 |
earing | +0.012 |
Neg logit contributions | |
groom | -0.012 |
scar | -0.011 |
burn | -0.011 |
pony | -0.011 |
salon | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +2.45e-03 |
Pos logit contributions | |
eway | +0.008 |
ered | +0.007 |
ining | +0.007 |
kered | +0.007 |
rum | +0.006 |
Neg logit contributions | |
scar | -0.009 |
groom | -0.009 |
pony | -0.009 |
chicken | -0.009 |
horse | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
groom | +0.005 |
scar | +0.004 |
pony | +0.004 |
burn | +0.004 |
rob | +0.004 |
Neg logit contributions | |
eway | -0.004 |
ining | -0.003 |
ered | -0.003 |
kered | -0.003 |
rum | -0.003 |
Token | " |
Token ID | 1 |
Feature activation | -2.45e-04 |
Pos logit contributions | |
eway | +0.024 |
ered | +0.021 |
ining | +0.021 |
rum | +0.021 |
Suz | +0.021 |
Neg logit contributions | |
groom | -0.016 |
scar | -0.015 |
pony | -0.014 |
salon | -0.014 |
chicken | -0.014 |
Token | Look |
Token ID | 8567 |
Feature activation | -5.71e-03 |
Pos logit contributions | |
eway | +0.000 |
ining | +0.000 |
kered | +0.000 |
Turns | +0.000 |
ered | +0.000 |
Neg logit contributions | |
scar | -0.000 |
groom | -0.000 |
burn | -0.000 |
pony | -0.000 |
salon | -0.000 |
Token | and |
Token ID | 290 |
Feature activation | +6.39e-04 |
Pos logit contributions | |
eway | +0.006 |
ining | +0.005 |
ered | +0.005 |
kered | +0.005 |
ooks | +0.005 |
Neg logit contributions | |
groom | -0.005 |
scar | -0.005 |
burn | -0.004 |
pony | -0.004 |
salon | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | -1.59e-03 |
Pos logit contributions | |
groom | +0.001 |
scar | +0.001 |
burn | +0.001 |
pony | +0.001 |
salon | +0.001 |
Neg logit contributions | |
eway | -0.001 |
ining | -0.001 |
ered | -0.001 |
kered | -0.001 |
ooks | -0.001 |
Token | family |
Token ID | 1641 |
Feature activation | -2.97e-02 |
Pos logit contributions | |
eway | +0.003 |
ining | +0.003 |
ered | +0.003 |
kered | +0.003 |
ooks | +0.003 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.002 |
burn | -0.002 |
pony | -0.002 |
rob | -0.002 |
Token | drove |
Token ID | 10357 |
Feature activation | +3.25e-03 |
Pos logit contributions | |
eway | +0.056 |
ooks | +0.046 |
ining | +0.045 |
rum | +0.044 |
eways | +0.044 |
Neg logit contributions | |
groom | -0.052 |
scar | -0.048 |
pony | -0.048 |
burn | -0.047 |
salon | -0.045 |
Token | away |
Token ID | 1497 |
Feature activation | -2.15e-02 |
Pos logit contributions | |
groom | +0.006 |
scar | +0.005 |
pony | +0.005 |
burn | +0.005 |
ponies | +0.005 |
Neg logit contributions | |
eway | -0.006 |
ining | -0.005 |
kered | -0.005 |
ooks | -0.005 |
rum | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -3.33e-03 |
Pos logit contributions | |
eway | +0.042 |
ining | +0.038 |
kered | +0.037 |
ered | +0.036 |
rum | +0.036 |
Neg logit contributions | |
groom | -0.032 |
scar | -0.030 |
pony | -0.029 |
burn | -0.029 |
salon | -0.028 |
Token | |
Token ID | 220 |
Feature activation | -8.33e-03 |
Pos logit contributions | |
eway | +0.006 |
ered | +0.005 |
kered | +0.005 |
rum | +0.005 |
ining | +0.004 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.006 |
burn | -0.006 |
salon | -0.005 |
pony | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | -4.23e-03 |
Pos logit contributions | |
eway | +0.016 |
kered | +0.015 |
ered | +0.015 |
rum | +0.014 |
ining | +0.013 |
Neg logit contributions | |
burn | -0.011 |
Velvet | -0.010 |
groom | -0.010 |
salon | -0.009 |
ponies | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -5.35e-03 |
Pos logit contributions | |
eway | +0.008 |
ered | +0.007 |
rum | +0.007 |
kered | +0.007 |
ining | +0.007 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.006 |
rob | -0.006 |
pony | -0.006 |
Velvet | -0.005 |
Token | J |
Token ID | 41 |
Feature activation | +7.77e-03 |
Pos logit contributions | |
eway | +0.010 |
rum | +0.009 |
ered | +0.008 |
aged | +0.008 |
ooks | +0.008 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.008 |
salon | -0.008 |
burn | -0.008 |
poet | -0.008 |
Token | enny |
Token ID | 11870 |
Feature activation | -8.79e-03 |
Pos logit contributions | |
groom | +0.013 |
burn | +0.012 |
scar | +0.012 |
poet | +0.012 |
salon | +0.012 |
Neg logit contributions | |
eway | -0.014 |
ered | -0.012 |
Turns | -0.011 |
ining | -0.011 |
rum | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | -6.00e-03 |
Pos logit contributions | |
groom | +0.028 |
burn | +0.025 |
scar | +0.024 |
salon | +0.024 |
pony | +0.023 |
Neg logit contributions | |
eway | -0.022 |
ining | -0.018 |
ered | -0.018 |
kered | -0.018 |
earing | -0.017 |
Token | so |
Token ID | 523 |
Feature activation | +1.60e-03 |
Pos logit contributions | |
eway | +0.012 |
ining | +0.010 |
ered | +0.010 |
kered | +0.010 |
rum | +0.010 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.009 |
pony | -0.008 |
burn | -0.008 |
salon | -0.008 |
Token | she |
Token ID | 673 |
Feature activation | -9.83e-04 |
Pos logit contributions | |
rob | +0.003 |
burn | +0.003 |
scar | +0.003 |
groom | +0.003 |
salon | +0.003 |
Neg logit contributions | |
eway | -0.002 |
ooks | -0.002 |
Everyone | -0.002 |
earing | -0.002 |
ered | -0.002 |
Token | had |
Token ID | 550 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.001 |
ered | +0.001 |
ooks | +0.001 |
kered | +0.001 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.002 |
burn | -0.002 |
pony | -0.002 |
salon | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | +4.27e-03 |
Pos logit contributions | |
groom | +0.029 |
rob | +0.028 |
burn | +0.027 |
scar | +0.027 |
salon | +0.026 |
Neg logit contributions | |
eway | -0.023 |
ining | -0.020 |
ered | -0.019 |
earing | -0.019 |
itself | -0.018 |
Token | surrender |
Token ID | 16908 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
groom | +0.007 |
rob | +0.007 |
scar | +0.007 |
burn | +0.007 |
pony | +0.006 |
Neg logit contributions | |
eway | -0.007 |
ered | -0.007 |
ining | -0.006 |
kered | -0.006 |
itself | -0.006 |
Token | her |
Token ID | 607 |
Feature activation | -2.53e-03 |
Pos logit contributions | |
groom | +0.027 |
scar | +0.025 |
burn | +0.025 |
pony | +0.024 |
salon | +0.023 |
Neg logit contributions | |
eway | -0.028 |
ining | -0.024 |
ered | -0.024 |
kered | -0.023 |
ooks | -0.023 |
Token | tall |
Token ID | 7331 |
Feature activation | -4.84e-03 |
Pos logit contributions | |
eway | +0.005 |
ining | +0.004 |
ered | +0.004 |
kered | +0.004 |
earing | +0.004 |
Neg logit contributions | |
groom | -0.004 |
burn | -0.004 |
rob | -0.003 |
scar | -0.003 |
salon | -0.003 |
Token | walking |
Token ID | 6155 |
Feature activation | +3.81e-04 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.008 |
ered | +0.008 |
earing | +0.008 |
rum | +0.008 |
Neg logit contributions | |
groom | -0.007 |
burn | -0.007 |
rob | -0.007 |
scar | -0.007 |
salon | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +3.05e-03 |
Pos logit contributions | |
groom | +0.001 |
scar | +0.001 |
pony | +0.001 |
burn | +0.001 |
ponies | +0.001 |
Neg logit contributions | |
eway | -0.001 |
ining | -0.001 |
ered | -0.000 |
kered | -0.000 |
ooks | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
groom | +0.007 |
scar | +0.007 |
burn | +0.006 |
rob | +0.006 |
poet | +0.006 |
Neg logit contributions | |
eway | -0.004 |
ining | -0.003 |
Everyone | -0.003 |
Everything | -0.003 |
earing | -0.003 |
Token | heard |
Token ID | 2982 |
Feature activation | -2.72e-03 |
Pos logit contributions | |
groom | +0.003 |
scar | +0.003 |
pony | +0.003 |
burn | +0.003 |
chicken | +0.002 |
Neg logit contributions | |
eway | -0.004 |
ining | -0.003 |
ooks | -0.003 |
kered | -0.003 |
rum | -0.003 |
Token | a |
Token ID | 257 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
eway | +0.006 |
ining | +0.005 |
ooks | +0.005 |
earing | +0.005 |
rum | +0.005 |
Neg logit contributions | |
groom | -0.004 |
scar | -0.004 |
pony | -0.004 |
ponies | -0.003 |
chicken | -0.003 |
Token | loud |
Token ID | 7812 |
Feature activation | -9.99e-03 |
Pos logit contributions | |
groom | +0.015 |
scar | +0.015 |
pony | +0.014 |
horse | +0.013 |
chicken | +0.013 |
Neg logit contributions | |
eway | -0.022 |
ooks | -0.020 |
ining | -0.020 |
ered | -0.019 |
earing | -0.019 |
Token | roar |
Token ID | 34532 |
Feature activation | -3.71e-03 |
Pos logit contributions | |
eway | +0.020 |
ooks | +0.020 |
earing | +0.018 |
ining | +0.018 |
amed | +0.017 |
Neg logit contributions | |
scar | -0.014 |
pony | -0.014 |
horse | -0.014 |
groom | -0.014 |
chicken | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -1.60e-03 |
Pos logit contributions | |
eway | +0.007 |
ining | +0.006 |
ooks | +0.006 |
ered | +0.006 |
earing | +0.006 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.006 |
burn | -0.005 |
pony | -0.005 |
chicken | -0.005 |
Token | He |
Token ID | 679 |
Feature activation | -2.71e-03 |
Pos logit contributions | |
eway | +0.002 |
ered | +0.002 |
ining | +0.002 |
kered | +0.002 |
earing | +0.002 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.003 |
chicken | -0.003 |
pony | -0.003 |
horse | -0.003 |
Token | felt |
Token ID | 2936 |
Feature activation | -5.19e-03 |
Pos logit contributions | |
eway | +0.005 |
ining | +0.004 |
ooks | +0.004 |
rum | +0.004 |
earing | +0.004 |
Neg logit contributions | |
groom | -0.004 |
scar | -0.004 |
pony | -0.004 |
burn | -0.004 |
chicken | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
eway | +0.011 |
ining | +0.010 |
ooks | +0.010 |
earing | +0.010 |
kered | +0.010 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.006 |
pony | -0.006 |
chicken | -0.006 |
horses | -0.006 |
Token | hot |
Token ID | 3024 |
Feature activation | +2.55e-03 |
Pos logit contributions | |
eway | +0.040 |
ining | +0.035 |
ered | +0.035 |
ooks | +0.035 |
kered | +0.033 |
Neg logit contributions | |
groom | -0.022 |
scar | -0.021 |
pony | -0.020 |
burn | -0.019 |
chicken | -0.019 |
Token | breath |
Token ID | 8033 |
Feature activation | +9.85e-03 |
Pos logit contributions | |
groom | +0.004 |
scar | +0.004 |
burn | +0.004 |
salon | +0.004 |
pony | +0.004 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.004 |
kered | -0.004 |
ered | -0.004 |
rum | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | +7.64e-03 |
Pos logit contributions | |
groom | +0.015 |
scar | +0.014 |
burn | +0.013 |
pony | +0.013 |
rob | +0.012 |
Neg logit contributions | |
eway | -0.020 |
ining | -0.017 |
ooks | -0.017 |
ered | -0.017 |
kered | -0.017 |
Token | was |
Token ID | 373 |
Feature activation | -6.30e-03 |
Pos logit contributions | |
groom | +0.013 |
scar | +0.013 |
pony | +0.012 |
burn | +0.012 |
salon | +0.011 |
Neg logit contributions | |
eway | -0.013 |
ooks | -0.011 |
ining | -0.010 |
rum | -0.010 |
ered | -0.010 |
Token | amazed |
Token ID | 24562 |
Feature activation | -8.16e-03 |
Pos logit contributions | |
eway | +0.012 |
ooks | +0.010 |
kered | +0.010 |
rum | +0.010 |
eways | +0.010 |
Neg logit contributions | |
groom | -0.010 |
burn | -0.010 |
scar | -0.009 |
pony | -0.009 |
salon | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +1.96e-03 |
Pos logit contributions | |
eway | +0.015 |
ining | +0.013 |
ered | +0.012 |
kered | +0.012 |
ooks | +0.012 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.013 |
burn | -0.013 |
pony | -0.013 |
salon | -0.012 |
Token | so |
Token ID | 523 |
Feature activation | +8.05e-03 |
Pos logit contributions | |
groom | +0.003 |
scar | +0.003 |
pony | +0.003 |
burn | +0.003 |
prince | +0.002 |
Neg logit contributions | |
eway | -0.004 |
ooks | -0.004 |
rum | -0.003 |
ining | -0.003 |
kered | -0.003 |
Token | relieved |
Token ID | 22598 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
groom | +0.013 |
scar | +0.011 |
pony | +0.011 |
burn | +0.011 |
bald | +0.010 |
Neg logit contributions | |
eway | -0.016 |
ooks | -0.013 |
rum | -0.013 |
Turns | -0.012 |
eways | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -8.34e-04 |
Pos logit contributions | |
eway | +0.030 |
ining | +0.027 |
ooks | +0.026 |
rum | +0.026 |
kered | +0.026 |
Neg logit contributions | |
groom | -0.021 |
scar | -0.020 |
pony | -0.019 |
burn | -0.018 |
ponies | -0.017 |
Token | She |
Token ID | 1375 |
Feature activation | -9.98e-03 |
Pos logit contributions | |
eway | +0.001 |
ered | +0.001 |
ining | +0.001 |
kered | +0.001 |
rum | +0.001 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.002 |
pony | -0.002 |
burn | -0.002 |
salon | -0.002 |
Token | had |
Token ID | 550 |
Feature activation | -5.11e-03 |
Pos logit contributions | |
eway | +0.019 |
ooks | +0.016 |
ining | +0.016 |
rum | +0.015 |
kered | +0.015 |
Neg logit contributions | |
groom | -0.017 |
scar | -0.016 |
pony | -0.015 |
burn | -0.015 |
prince | -0.014 |
Token | never |
Token ID | 1239 |
Feature activation | +7.08e-03 |
Pos logit contributions | |
eway | +0.009 |
ooks | +0.008 |
ining | +0.008 |
rum | +0.008 |
kered | +0.008 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.008 |
burn | -0.008 |
pony | -0.008 |
butter | -0.008 |
Token | been |
Token ID | 587 |
Feature activation | -6.56e-03 |
Pos logit contributions | |
groom | +0.013 |
scar | +0.013 |
pony | +0.013 |
burn | +0.012 |
rob | +0.012 |
Neg logit contributions | |
eway | -0.011 |
ered | -0.010 |
ining | -0.010 |
earing | -0.009 |
kered | -0.009 |
Token | so |
Token ID | 523 |
Feature activation | -6.80e-03 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.008 |
ered | +0.008 |
earing | +0.008 |
aged | +0.008 |
Neg logit contributions | |
groom | -0.013 |
scar | -0.012 |
rob | -0.012 |
burn | -0.012 |
pony | -0.012 |
Token | Once |
Token ID | 7454 |
Feature activation | -2.81e-04 |
Pos logit contributions | |
groom | +0.027 |
scar | +0.026 |
burn | +0.025 |
pony | +0.024 |
salon | +0.024 |
Neg logit contributions | |
eway | -0.019 |
ining | -0.016 |
kered | -0.015 |
ered | -0.015 |
ooks | -0.015 |
Token | upon |
Token ID | 2402 |
Feature activation | +1.66e-03 |
Pos logit contributions | |
eway | +0.000 |
ining | +0.000 |
ered | +0.000 |
earing | +0.000 |
ooks | +0.000 |
Neg logit contributions | |
groom | -0.001 |
scar | -0.001 |
burn | -0.001 |
pony | -0.001 |
rob | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +3.20e-02 |
Pos logit contributions | |
groom | +0.003 |
burn | +0.003 |
scar | +0.003 |
salon | +0.003 |
rob | +0.003 |
Neg logit contributions | |
eway | -0.003 |
ining | -0.002 |
kered | -0.002 |
ered | -0.002 |
itself | -0.002 |
Token | time |
Token ID | 640 |
Feature activation | -8.80e-03 |
Pos logit contributions | |
groom | +0.067 |
burn | +0.059 |
scar | +0.059 |
rob | +0.058 |
salon | +0.058 |
Neg logit contributions | |
eway | -0.047 |
ining | -0.043 |
earing | -0.042 |
ooks | -0.039 |
Turns | -0.037 |
Token | , |
Token ID | 11 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
kered | +0.019 |
eway | +0.018 |
ining | +0.017 |
aged | +0.017 |
age | +0.017 |
Neg logit contributions | |
pony | -0.010 |
scar | -0.009 |
salon | -0.009 |
horse | -0.008 |
ponies | -0.008 |
Token | there |
Token ID | 612 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
eway | +0.025 |
kered | +0.022 |
ining | +0.022 |
rum | +0.022 |
ooks | +0.022 |
Neg logit contributions | |
groom | -0.017 |
scar | -0.016 |
pony | -0.016 |
burn | -0.015 |
chicken | -0.015 |
Token | was |
Token ID | 373 |
Feature activation | +4.24e-03 |
Pos logit contributions | |
eway | +0.040 |
ooks | +0.036 |
rum | +0.035 |
ining | +0.034 |
taker | +0.034 |
Neg logit contributions | |
groom | -0.034 |
pony | -0.033 |
chicken | -0.032 |
scar | -0.032 |
strawberry | -0.032 |
Token | a |
Token ID | 257 |
Feature activation | +2.32e-02 |
Pos logit contributions | |
groom | +0.008 |
salon | +0.008 |
scar | +0.007 |
burn | +0.007 |
rob | +0.007 |
Neg logit contributions | |
eway | -0.007 |
ining | -0.006 |
kered | -0.006 |
ooks | -0.005 |
earing | -0.005 |
Token | boy |
Token ID | 2933 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
rob | +0.046 |
burn | +0.044 |
groom | +0.042 |
scar | +0.041 |
salon | +0.040 |
Neg logit contributions | |
eway | -0.025 |
ining | -0.025 |
Turns | -0.024 |
ooks | -0.024 |
earing | -0.023 |
Token | who |
Token ID | 508 |
Feature activation | +5.64e-03 |
Pos logit contributions | |
eway | +0.030 |
ining | +0.025 |
ered | +0.025 |
kered | +0.024 |
earing | +0.024 |
Neg logit contributions | |
groom | -0.034 |
scar | -0.032 |
burn | -0.031 |
pony | -0.031 |
salon | -0.030 |
Token | lived |
Token ID | 5615 |
Feature activation | -5.38e-03 |
Pos logit contributions | |
groom | +0.011 |
scar | +0.010 |
pony | +0.010 |
burn | +0.010 |
chicken | +0.010 |
Neg logit contributions | |
eway | -0.009 |
ining | -0.007 |
ered | -0.007 |
ooks | -0.007 |
kered | -0.007 |
Token | ack |
Token ID | 441 |
Feature activation | -6.98e-03 |
Pos logit contributions | |
groom | +0.018 |
scar | +0.017 |
burn | +0.017 |
pony | +0.016 |
salon | +0.016 |
Neg logit contributions | |
eway | -0.023 |
ining | -0.020 |
ered | -0.020 |
kered | -0.019 |
ooks | -0.019 |
Token | !" |
Token ID | 2474 |
Feature activation | +6.03e-03 |
Pos logit contributions | |
eway | +0.013 |
ining | +0.011 |
ered | +0.011 |
kered | +0.011 |
rum | +0.010 |
Neg logit contributions | |
groom | -0.012 |
scar | -0.011 |
burn | -0.011 |
salon | -0.010 |
pony | -0.010 |
Token | John |
Token ID | 1757 |
Feature activation | -1.78e-03 |
Pos logit contributions | |
groom | +0.010 |
scar | +0.010 |
pony | +0.009 |
rob | +0.009 |
horse | +0.009 |
Neg logit contributions | |
eway | -0.011 |
ooks | -0.009 |
ered | -0.009 |
kered | -0.009 |
ining | -0.009 |
Token | smiled |
Token ID | 13541 |
Feature activation | -9.76e-03 |
Pos logit contributions | |
eway | +0.003 |
ooks | +0.003 |
ining | +0.003 |
rum | +0.003 |
eways | +0.003 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.003 |
pony | -0.003 |
burn | -0.003 |
chicken | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +6.28e-03 |
Pos logit contributions | |
eway | +0.018 |
ining | +0.016 |
ered | +0.015 |
kered | +0.015 |
ooks | +0.015 |
Neg logit contributions | |
groom | -0.016 |
scar | -0.015 |
burn | -0.015 |
pony | -0.015 |
salon | -0.014 |
Token | said |
Token ID | 531 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
groom | +0.008 |
scar | +0.008 |
pony | +0.007 |
burn | +0.007 |
rob | +0.007 |
Neg logit contributions | |
eway | -0.014 |
ining | -0.012 |
ooks | -0.012 |
ered | -0.012 |
kered | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | -6.36e-04 |
Pos logit contributions | |
eway | +0.030 |
ooks | +0.026 |
ining | +0.026 |
Turns | +0.026 |
earing | +0.025 |
Neg logit contributions | |
groom | -0.022 |
pony | -0.020 |
scar | -0.018 |
prince | -0.018 |
horse | -0.018 |
Token | " |
Token ID | 366 |
Feature activation | -3.74e-03 |
Pos logit contributions | |
eway | +0.001 |
ered | +0.001 |
ooks | +0.001 |
kered | +0.001 |
ining | +0.001 |
Neg logit contributions | |
groom | -0.001 |
pony | -0.001 |
scar | -0.001 |
burn | -0.001 |
chicken | -0.001 |
Token | Hi |
Token ID | 17250 |
Feature activation | +4.02e-03 |
Pos logit contributions | |
eway | +0.007 |
ining | +0.006 |
ered | +0.006 |
kered | +0.006 |
ooks | +0.006 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.006 |
burn | -0.005 |
pony | -0.005 |
salon | -0.005 |
Token | Qu |
Token ID | 2264 |
Feature activation | +5.54e-03 |
Pos logit contributions | |
groom | +0.009 |
salon | +0.009 |
rob | +0.008 |
burn | +0.008 |
poet | +0.008 |
Neg logit contributions | |
eway | -0.004 |
ining | -0.004 |
Suz | -0.003 |
itself | -0.003 |
Everyone | -0.003 |
Token | ack |
Token ID | 441 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
groom | +0.008 |
scar | +0.007 |
burn | +0.007 |
pony | +0.007 |
salon | +0.007 |
Neg logit contributions | |
eway | -0.011 |
ered | -0.010 |
ining | -0.010 |
kered | -0.010 |
rum | -0.010 |
Token | said |
Token ID | 531 |
Feature activation | -9.56e-03 |
Pos logit contributions | |
eway | +0.041 |
ooks | +0.034 |
rum | +0.033 |
ining | +0.033 |
eways | +0.033 |
Neg logit contributions | |
groom | -0.035 |
scar | -0.032 |
pony | -0.031 |
prince | -0.029 |
burn | -0.029 |
Token | goodbye |
Token ID | 24829 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
eway | +0.020 |
ining | +0.017 |
ooks | +0.017 |
rum | +0.017 |
earing | +0.016 |
Neg logit contributions | |
groom | -0.015 |
pony | -0.014 |
scar | -0.013 |
ponies | -0.013 |
butter | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | -2.81e-05 |
Pos logit contributions | |
eway | +0.022 |
ered | +0.019 |
ining | +0.019 |
rum | +0.019 |
kered | +0.019 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.013 |
pony | -0.013 |
burn | -0.012 |
horse | -0.011 |
Token | the |
Token ID | 262 |
Feature activation | -1.19e-03 |
Pos logit contributions | |
eway | +0.000 |
ining | +0.000 |
ooks | +0.000 |
rum | +0.000 |
ered | +0.000 |
Neg logit contributions | |
groom | -0.000 |
scar | -0.000 |
burn | -0.000 |
pony | -0.000 |
salon | -0.000 |
Token | re |
Token ID | 302 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.002 |
ered | +0.002 |
kered | +0.002 |
Turns | +0.002 |
Neg logit contributions | |
groom | -0.002 |
burn | -0.002 |
scar | -0.002 |
salon | -0.002 |
rob | -0.001 |
Token | ind |
Token ID | 521 |
Feature activation | -2.44e-02 |
Pos logit contributions | |
eway | +0.030 |
Everything | +0.027 |
kered | +0.027 |
Turns | +0.027 |
ining | +0.027 |
Neg logit contributions | |
groom | -0.012 |
pony | -0.010 |
burn | -0.010 |
scar | -0.009 |
ponies | -0.009 |
Token | eer |
Token ID | 28153 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
eway | +0.059 |
ining | +0.053 |
ooks | +0.052 |
ered | +0.051 |
earing | +0.051 |
Neg logit contributions | |
groom | -0.027 |
pony | -0.023 |
scar | -0.022 |
ponies | -0.022 |
burn | -0.021 |
Token | took |
Token ID | 1718 |
Feature activation | -9.91e-04 |
Pos logit contributions | |
eway | +0.019 |
ooks | +0.016 |
ining | +0.016 |
earing | +0.016 |
rum | +0.015 |
Neg logit contributions | |
groom | -0.018 |
scar | -0.016 |
pony | -0.016 |
burn | -0.016 |
horse | -0.015 |
Token | off |
Token ID | 572 |
Feature activation | -1.33e-03 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.002 |
ooks | +0.002 |
rum | +0.002 |
earing | +0.002 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.002 |
pony | -0.001 |
burn | -0.001 |
ponies | -0.001 |
Token | into |
Token ID | 656 |
Feature activation | -7.27e-03 |
Pos logit contributions | |
eway | +0.003 |
ining | +0.002 |
ooks | +0.002 |
earing | +0.002 |
kered | +0.002 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.002 |
burn | -0.002 |
pony | -0.002 |
ponies | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | -1.34e-02 |
Pos logit contributions | |
eway | +0.012 |
ered | +0.010 |
ining | +0.010 |
itself | +0.010 |
rum | +0.010 |
Neg logit contributions | |
groom | -0.013 |
burn | -0.012 |
scar | -0.012 |
pony | -0.012 |
rob | -0.012 |
Token | badly |
Token ID | 11234 |
Feature activation | -1.78e-03 |
Pos logit contributions | |
eway | +0.044 |
ining | +0.038 |
ooks | +0.037 |
kered | +0.037 |
ered | +0.037 |
Neg logit contributions | |
groom | -0.039 |
scar | -0.037 |
burn | -0.036 |
pony | -0.036 |
salon | -0.034 |
Token | . |
Token ID | 13 |
Feature activation | -2.92e-03 |
Pos logit contributions | |
eway | +0.003 |
ining | +0.003 |
ered | +0.003 |
kered | +0.003 |
earing | +0.003 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.003 |
burn | -0.003 |
pony | -0.003 |
salon | -0.003 |
Token | Sadly |
Token ID | 27213 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
eway | +0.005 |
kered | +0.005 |
ered | +0.005 |
ining | +0.004 |
eways | +0.004 |
Neg logit contributions | |
Velvet | -0.004 |
Rudy | -0.004 |
groom | -0.004 |
scar | -0.004 |
chicken | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -9.45e-04 |
Pos logit contributions | |
eway | +0.032 |
ining | +0.027 |
ooks | +0.027 |
kered | +0.026 |
Turns | +0.025 |
Neg logit contributions | |
groom | -0.030 |
scar | -0.030 |
pony | -0.028 |
burn | -0.028 |
rob | -0.027 |
Token | the |
Token ID | 262 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.002 |
kered | +0.002 |
ered | +0.002 |
earing | +0.002 |
Neg logit contributions | |
groom | -0.001 |
scar | -0.001 |
pony | -0.001 |
burn | -0.001 |
ponies | -0.001 |
Token | man |
Token ID | 582 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
groom | +0.014 |
burn | +0.014 |
rob | +0.013 |
scar | +0.013 |
salon | +0.012 |
Neg logit contributions | |
eway | -0.022 |
ining | -0.019 |
kered | -0.019 |
ered | -0.019 |
Turns | -0.019 |
Token | never |
Token ID | 1239 |
Feature activation | +1.14e-02 |
Pos logit contributions | |
eway | +0.020 |
ining | +0.017 |
ooks | +0.016 |
kered | +0.016 |
rum | +0.015 |
Neg logit contributions | |
groom | -0.024 |
scar | -0.023 |
burn | -0.022 |
pony | -0.022 |
salon | -0.021 |
Token | danced |
Token ID | 39480 |
Feature activation | +1.24e-03 |
Pos logit contributions | |
groom | +0.021 |
scar | +0.020 |
rob | +0.019 |
pony | +0.019 |
burn | +0.019 |
Neg logit contributions | |
eway | -0.018 |
ered | -0.016 |
ining | -0.016 |
kered | -0.016 |
earing | -0.015 |
Token | again |
Token ID | 757 |
Feature activation | +6.13e-03 |
Pos logit contributions | |
groom | +0.002 |
scar | +0.002 |
burn | +0.002 |
pony | +0.002 |
salon | +0.002 |
Neg logit contributions | |
eway | -0.002 |
ining | -0.002 |
ered | -0.002 |
kered | -0.002 |
ooks | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
groom | +0.011 |
scar | +0.011 |
burn | +0.010 |
rob | +0.010 |
pony | +0.010 |
Neg logit contributions | |
eway | -0.010 |
ining | -0.009 |
ered | -0.008 |
earing | -0.008 |
rum | -0.008 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.32e-02 |
Pos logit contributions | |
eway | +0.036 |
ered | +0.034 |
kered | +0.034 |
amed | +0.030 |
eways | +0.030 |
Neg logit contributions | |
Velvet | -0.022 |
Star | -0.021 |
Rudy | -0.021 |
dentist | -0.021 |
prince | -0.021 |
Token | wanted |
Token ID | 2227 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
eway | +0.003 |
ining | +0.003 |
ered | +0.003 |
kered | +0.003 |
earing | +0.002 |
Neg logit contributions | |
groom | -0.004 |
scar | -0.004 |
burn | -0.004 |
pony | -0.004 |
rob | -0.004 |
Token | to |
Token ID | 284 |
Feature activation | -4.70e-04 |
Pos logit contributions | |
groom | +0.029 |
scar | +0.027 |
burn | +0.026 |
pony | +0.026 |
salon | +0.025 |
Neg logit contributions | |
eway | -0.033 |
ining | -0.029 |
ered | -0.028 |
kered | -0.028 |
ooks | -0.027 |
Token | welcome |
Token ID | 7062 |
Feature activation | +8.32e-03 |
Pos logit contributions | |
eway | +0.001 |
ining | +0.001 |
kered | +0.001 |
ered | +0.001 |
ooks | +0.001 |
Neg logit contributions | |
groom | -0.001 |
scar | -0.001 |
burn | -0.001 |
pony | -0.001 |
salon | -0.001 |
Token | her |
Token ID | 607 |
Feature activation | +5.67e-03 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.013 |
rob | +0.013 |
burn | +0.013 |
salon | +0.013 |
Neg logit contributions | |
eway | -0.014 |
ining | -0.013 |
ered | -0.012 |
kered | -0.012 |
ooks | -0.012 |
Token | baby |
Token ID | 5156 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
rob | +0.010 |
groom | +0.009 |
salon | +0.009 |
burn | +0.009 |
scar | +0.009 |
Neg logit contributions | |
eway | -0.008 |
ining | -0.008 |
ooks | -0.008 |
earing | -0.008 |
ered | -0.008 |
Token | chick |
Token ID | 17943 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
rob | +0.020 |
groom | +0.020 |
salon | +0.019 |
Ba | +0.018 |
avail | +0.018 |
Neg logit contributions | |
eway | -0.014 |
ining | -0.013 |
aged | -0.012 |
Suz | -0.012 |
ooks | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -6.41e-03 |
Pos logit contributions | |
eway | +0.030 |
ining | +0.026 |
ered | +0.025 |
ooks | +0.025 |
kered | +0.025 |
Neg logit contributions | |
groom | -0.033 |
rob | -0.031 |
scar | -0.030 |
burn | -0.030 |
salon | -0.029 |
Token | But |
Token ID | 887 |
Feature activation | +1.13e-03 |
Pos logit contributions | |
eway | +0.011 |
ered | +0.009 |
ining | +0.009 |
kered | +0.009 |
rum | +0.009 |
Neg logit contributions | |
groom | -0.012 |
scar | -0.011 |
pony | -0.011 |
burn | -0.011 |
ponies | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | +8.35e-03 |
Pos logit contributions | |
groom | +0.002 |
scar | +0.002 |
pony | +0.002 |
burn | +0.001 |
salon | +0.001 |
Neg logit contributions | |
eway | -0.002 |
ining | -0.002 |
kered | -0.002 |
ooks | -0.002 |
ered | -0.002 |
Token | it |
Token ID | 340 |
Feature activation | -1.11e-02 |
Pos logit contributions | |
groom | +0.014 |
scar | +0.013 |
burn | +0.013 |
rob | +0.012 |
pony | +0.012 |
Neg logit contributions | |
eway | -0.015 |
ining | -0.013 |
ered | -0.013 |
kered | -0.013 |
earing | -0.013 |
Token | was |
Token ID | 373 |
Feature activation | +3.09e-04 |
Pos logit contributions | |
eway | +0.015 |
ining | +0.012 |
ered | +0.012 |
kered | +0.012 |
earing | +0.011 |
Neg logit contributions | |
groom | -0.024 |
scar | -0.023 |
burn | -0.023 |
pony | -0.022 |
rob | -0.022 |
Token | the |
Token ID | 262 |
Feature activation | -4.23e-03 |
Pos logit contributions | |
eway | +0.013 |
ining | +0.011 |
ered | +0.011 |
kered | +0.011 |
ooks | +0.011 |
Neg logit contributions | |
groom | -0.009 |
scar | -0.009 |
burn | -0.008 |
pony | -0.008 |
ponies | -0.008 |
Token | dark |
Token ID | 3223 |
Feature activation | -5.53e-03 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.009 |
ooks | +0.008 |
ered | +0.008 |
kered | +0.008 |
Neg logit contributions | |
groom | -0.005 |
scar | -0.005 |
burn | -0.005 |
pony | -0.004 |
salon | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -3.60e-03 |
Pos logit contributions | |
eway | +0.012 |
ered | +0.010 |
ining | +0.010 |
kered | +0.010 |
earing | +0.010 |
Neg logit contributions | |
groom | -0.008 |
scar | -0.007 |
burn | -0.007 |
pony | -0.007 |
ponies | -0.006 |
Token | On |
Token ID | 1550 |
Feature activation | -9.15e-03 |
Pos logit contributions | |
eway | +0.005 |
ered | +0.005 |
ining | +0.005 |
aged | +0.004 |
rum | +0.004 |
Neg logit contributions | |
groom | -0.007 |
pony | -0.006 |
scar | -0.006 |
chicken | -0.006 |
ponies | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | -3.98e-03 |
Pos logit contributions | |
eway | +0.018 |
ining | +0.016 |
ered | +0.015 |
kered | +0.015 |
ooks | +0.015 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.013 |
burn | -0.013 |
pony | -0.012 |
salon | -0.012 |
Token | farm |
Token ID | 5318 |
Feature activation | -4.64e-02 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.008 |
Turns | +0.008 |
kered | +0.008 |
ered | +0.008 |
Neg logit contributions | |
groom | -0.004 |
salon | -0.004 |
burn | -0.004 |
scar | -0.004 |
rob | -0.004 |
Token | there |
Token ID | 612 |
Feature activation | -1.72e-02 |
Pos logit contributions | |
eway | +0.090 |
rum | +0.085 |
ining | +0.082 |
kered | +0.078 |
earing | +0.077 |
Neg logit contributions | |
groom | -0.061 |
chicken | -0.060 |
salon | -0.060 |
pony | -0.059 |
horse | -0.059 |
Token | lived |
Token ID | 5615 |
Feature activation | -1.67e-03 |
Pos logit contributions | |
eway | +0.023 |
ining | +0.019 |
rum | +0.019 |
ooks | +0.019 |
earing | +0.018 |
Neg logit contributions | |
groom | -0.035 |
pony | -0.033 |
scar | -0.032 |
burn | -0.032 |
salon | -0.032 |
Token | many |
Token ID | 867 |
Feature activation | -1.94e-02 |
Pos logit contributions | |
eway | +0.004 |
ining | +0.003 |
rum | +0.003 |
ered | +0.003 |
kered | +0.003 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.002 |
pony | -0.002 |
chicken | -0.002 |
burn | -0.002 |
Token | animals |
Token ID | 4695 |
Feature activation | -1.59e-02 |
Pos logit contributions | |
eway | +0.033 |
ining | +0.030 |
ooks | +0.029 |
ered | +0.029 |
kered | +0.029 |
Neg logit contributions | |
groom | -0.033 |
burn | -0.033 |
salon | -0.031 |
scar | -0.030 |
rob | -0.029 |
Token | â |
Token ID | 22940 |
Feature activation | -2.94e-03 |
Pos logit contributions | |
eway | +0.035 |
ered | +0.031 |
ining | +0.031 |
kered | +0.030 |
rum | +0.030 |
Neg logit contributions | |
groom | -0.019 |
scar | -0.018 |
pony | -0.018 |
ponies | -0.017 |
chicken | -0.017 |
Token | ! |
Token ID | 0 |
Feature activation | -6.65e-04 |
Pos logit contributions | |
eway | +0.023 |
ining | +0.020 |
ooks | +0.020 |
ered | +0.020 |
kered | +0.020 |
Neg logit contributions | |
groom | -0.018 |
scar | -0.017 |
burn | -0.017 |
pony | -0.016 |
butter | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | +3.81e-04 |
Pos logit contributions | |
eway | +0.001 |
kered | +0.001 |
ered | +0.001 |
aged | +0.001 |
ining | +0.001 |
Neg logit contributions | |
groom | -0.001 |
salon | -0.001 |
pony | -0.001 |
strawberry | -0.001 |
rob | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -5.19e-03 |
Pos logit contributions | |
groom | +0.001 |
scar | +0.001 |
pony | +0.001 |
rob | +0.001 |
salon | +0.001 |
Neg logit contributions | |
eway | -0.001 |
kered | -0.001 |
ining | -0.001 |
aged | -0.001 |
earing | -0.001 |
Token | M |
Token ID | 44 |
Feature activation | +3.30e-03 |
Pos logit contributions | |
eway | +0.009 |
aged | +0.008 |
ered | +0.008 |
kered | +0.008 |
ooks | +0.008 |
Neg logit contributions | |
groom | -0.008 |
salon | -0.007 |
scar | -0.007 |
rob | -0.007 |
pony | -0.007 |
Token | oral |
Token ID | 6864 |
Feature activation | -2.78e-02 |
Pos logit contributions | |
salon | +0.005 |
groom | +0.005 |
scar | +0.005 |
pony | +0.005 |
ponies | +0.005 |
Neg logit contributions | |
eway | -0.006 |
ining | -0.005 |
aged | -0.005 |
Turns | -0.005 |
kered | -0.004 |
Token | of |
Token ID | 286 |
Feature activation | -4.78e-02 |
Pos logit contributions | |
eway | +0.038 |
ining | +0.032 |
rum | +0.031 |
aged | +0.030 |
ooks | +0.030 |
Neg logit contributions | |
groom | -0.053 |
scar | -0.052 |
pony | -0.051 |
rob | -0.051 |
ponies | -0.051 |
Token | the |
Token ID | 262 |
Feature activation | -3.78e-02 |
Pos logit contributions | |
eway | +0.097 |
kered | +0.086 |
ining | +0.086 |
ooks | +0.084 |
ered | +0.084 |
Neg logit contributions | |
groom | -0.068 |
scar | -0.064 |
burn | -0.061 |
pony | -0.061 |
chicken | -0.059 |
Token | story |
Token ID | 1621 |
Feature activation | -3.07e-02 |
Pos logit contributions | |
eway | +0.069 |
ining | +0.061 |
kered | +0.059 |
ooks | +0.058 |
rum | +0.058 |
Neg logit contributions | |
groom | -0.063 |
scar | -0.060 |
pony | -0.058 |
burn | -0.056 |
ponies | -0.055 |
Token | : |
Token ID | 25 |
Feature activation | -3.12e-02 |
Pos logit contributions | |
eway | +0.046 |
kered | +0.041 |
aged | +0.039 |
ered | +0.039 |
Turns | +0.039 |
Neg logit contributions | |
salon | -0.048 |
reads | -0.046 |
groom | -0.044 |
ara | -0.044 |
Star | -0.044 |
Token | If |
Token ID | 1002 |
Feature activation | -2.02e-02 |
Pos logit contributions | |
eway | +0.055 |
kered | +0.047 |
amed | +0.047 |
ered | +0.045 |
eways | +0.044 |
Neg logit contributions | |
groom | -0.050 |
chicken | -0.047 |
salon | -0.046 |
reads | -0.045 |
ninety | -0.045 |
Token | something |
Token ID | 1223 |
Feature activation | -2.30e-02 |
Pos logit contributions | |
eway | +0.040 |
ining | +0.035 |
kered | +0.034 |
rum | +0.033 |
earing | +0.033 |
Neg logit contributions | |
groom | -0.032 |
scar | -0.030 |
burn | -0.028 |
pony | -0.027 |
salon | -0.027 |
Token | a |
Token ID | 257 |
Feature activation | -4.22e-03 |
Pos logit contributions | |
eway | +0.014 |
ooks | +0.013 |
ining | +0.013 |
earing | +0.013 |
rum | +0.012 |
Neg logit contributions | |
groom | -0.010 |
scar | -0.010 |
pony | -0.009 |
horses | -0.009 |
ponies | -0.009 |
Token | deep |
Token ID | 2769 |
Feature activation | -2.02e-02 |
Pos logit contributions | |
eway | +0.009 |
ining | +0.008 |
ered | +0.008 |
kered | +0.008 |
ooks | +0.008 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.005 |
pony | -0.005 |
burn | -0.005 |
salon | -0.005 |
Token | breath |
Token ID | 8033 |
Feature activation | +6.24e-03 |
Pos logit contributions | |
eway | +0.052 |
ining | +0.048 |
ooks | +0.047 |
kered | +0.046 |
rum | +0.046 |
Neg logit contributions | |
scar | -0.018 |
groom | -0.018 |
pony | -0.015 |
burn | -0.014 |
chicken | -0.014 |
Token | and |
Token ID | 290 |
Feature activation | +3.69e-03 |
Pos logit contributions | |
groom | +0.009 |
scar | +0.009 |
burn | +0.008 |
pony | +0.008 |
butter | +0.008 |
Neg logit contributions | |
eway | -0.012 |
ining | -0.011 |
ooks | -0.011 |
ered | -0.011 |
kered | -0.011 |
Token | showed |
Token ID | 3751 |
Feature activation | -9.50e-03 |
Pos logit contributions | |
groom | +0.006 |
scar | +0.005 |
pony | +0.005 |
burn | +0.005 |
chicken | +0.005 |
Neg logit contributions | |
eway | -0.007 |
ining | -0.006 |
ooks | -0.006 |
rum | -0.006 |
earing | -0.006 |
Token | them |
Token ID | 606 |
Feature activation | -4.75e-02 |
Pos logit contributions | |
eway | +0.018 |
ooks | +0.017 |
earing | +0.016 |
ining | +0.016 |
rum | +0.016 |
Neg logit contributions | |
groom | -0.015 |
pony | -0.014 |
scar | -0.014 |
ponies | -0.013 |
horses | -0.013 |
Token | his |
Token ID | 465 |
Feature activation | -1.01e-03 |
Pos logit contributions | |
eway | +0.096 |
ooks | +0.091 |
Turns | +0.089 |
ining | +0.088 |
kered | +0.087 |
Neg logit contributions | |
scar | -0.059 |
groom | -0.058 |
horses | -0.054 |
pony | -0.053 |
ponies | -0.053 |
Token | new |
Token ID | 649 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.002 |
ooks | +0.002 |
kered | +0.002 |
ered | +0.002 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.001 |
pony | -0.001 |
burn | -0.001 |
ponies | -0.001 |
Token | trick |
Token ID | 6908 |
Feature activation | -4.69e-03 |
Pos logit contributions | |
eway | +0.037 |
ining | +0.034 |
kered | +0.034 |
ooks | +0.033 |
earing | +0.033 |
Neg logit contributions | |
groom | -0.028 |
scar | -0.027 |
pony | -0.026 |
cane | -0.024 |
horse | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | -1.63e-03 |
Pos logit contributions | |
eway | +0.009 |
ooks | +0.009 |
ining | +0.008 |
Turns | +0.008 |
earing | +0.008 |
Neg logit contributions | |
groom | -0.006 |
scar | -0.006 |
pony | -0.006 |
burn | -0.006 |
horse | -0.006 |
Token | Hipp |
Token ID | 33812 |
Feature activation | -9.21e-03 |
Pos logit contributions | |
eway | +0.003 |
ered | +0.003 |
earing | +0.003 |
kered | +0.002 |
ining | +0.002 |
Neg logit contributions | |
groom | -0.003 |
pony | -0.003 |
horses | -0.003 |
Rudy | -0.002 |
chicken | -0.002 |
Token | their |
Token ID | 511 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
eway | +0.004 |
ered | +0.003 |
ining | +0.003 |
earing | +0.003 |
ooks | +0.003 |
Neg logit contributions | |
groom | -0.004 |
burn | -0.004 |
scar | -0.004 |
pony | -0.004 |
rob | -0.004 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.41e-04 |
Pos logit contributions | |
eway | +0.021 |
ining | +0.019 |
ered | +0.018 |
kered | +0.018 |
ooks | +0.018 |
Neg logit contributions | |
groom | -0.015 |
scar | -0.014 |
burn | -0.013 |
pony | -0.013 |
salon | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -2.35e-02 |
Pos logit contributions | |
eway | +0.000 |
ining | +0.000 |
ered | +0.000 |
earing | +0.000 |
kered | +0.000 |
Neg logit contributions | |
groom | -0.000 |
scar | -0.000 |
rob | -0.000 |
burn | -0.000 |
pony | -0.000 |
Token | She |
Token ID | 1375 |
Feature activation | -5.75e-03 |
Pos logit contributions | |
eway | +0.046 |
ered | +0.045 |
rum | +0.041 |
aged | +0.040 |
kered | +0.039 |
Neg logit contributions | |
groom | -0.027 |
Ben | -0.026 |
grocery | -0.025 |
syrup | -0.025 |
strawberries | -0.025 |
Token | showed |
Token ID | 3751 |
Feature activation | -4.40e-03 |
Pos logit contributions | |
eway | +0.011 |
ining | +0.009 |
kered | +0.009 |
ooks | +0.009 |
ered | +0.009 |
Neg logit contributions | |
groom | -0.010 |
scar | -0.009 |
burn | -0.009 |
pony | -0.009 |
salon | -0.008 |
Token | them |
Token ID | 606 |
Feature activation | -4.88e-02 |
Pos logit contributions | |
eway | +0.009 |
rum | +0.008 |
ining | +0.008 |
ooks | +0.008 |
earing | +0.007 |
Neg logit contributions | |
groom | -0.007 |
scar | -0.006 |
pony | -0.006 |
butter | -0.005 |
chicken | -0.005 |
Token | how |
Token ID | 703 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
eway | +0.112 |
ooks | +0.100 |
rum | +0.099 |
ining | +0.099 |
Turns | +0.097 |
Neg logit contributions | |
groom | -0.060 |
scar | -0.058 |
chicken | -0.054 |
pony | -0.053 |
strawberries | -0.053 |
Token | to |
Token ID | 284 |
Feature activation | -2.25e-03 |
Pos logit contributions | |
eway | +0.024 |
ining | +0.021 |
rum | +0.021 |
kered | +0.020 |
ered | +0.020 |
Neg logit contributions | |
groom | -0.011 |
scar | -0.010 |
butter | -0.010 |
chicken | -0.010 |
strawberries | -0.010 |
Token | organize |
Token ID | 16481 |
Feature activation | -3.41e-03 |
Pos logit contributions | |
eway | +0.005 |
ining | +0.004 |
Turns | +0.004 |
ooks | +0.004 |
kered | +0.004 |
Neg logit contributions | |
groom | -0.003 |
scar | -0.003 |
salon | -0.003 |
burn | -0.003 |
butter | -0.003 |
Token | their |
Token ID | 511 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
eway | +0.007 |
ining | +0.006 |
kered | +0.006 |
rum | +0.006 |
ooks | +0.006 |
Neg logit contributions | |
groom | -0.005 |
scar | -0.005 |
pony | -0.005 |
burn | -0.005 |
butter | -0.005 |
Token | toys |
Token ID | 14958 |
Feature activation | -2.86e-03 |
Pos logit contributions | |
eway | +0.037 |
ining | +0.031 |
kered | +0.031 |
ered | +0.031 |
rum | +0.031 |
Neg logit contributions | |
scar | -0.022 |
groom | -0.021 |
pony | -0.019 |
ponies | -0.019 |
horses | -0.019 |
Token | , |
Token ID | 11 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
kered | +0.017 |
eway | +0.016 |
ining | +0.016 |
age | +0.015 |
amed | +0.015 |
Neg logit contributions | |
pony | -0.007 |
scar | -0.007 |
salon | -0.007 |
horse | -0.006 |
Velvet | -0.006 |
Token | there |
Token ID | 612 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
eway | +0.033 |
kered | +0.030 |
ooks | +0.030 |
ining | +0.030 |
rum | +0.030 |
Neg logit contributions | |
groom | -0.018 |
pony | -0.017 |
scar | -0.017 |
burn | -0.016 |
chicken | -0.016 |
Token | was |
Token ID | 373 |
Feature activation | -7.12e-04 |
Pos logit contributions | |
eway | +0.046 |
ooks | +0.042 |
taker | +0.040 |
rum | +0.040 |
earing | +0.040 |
Neg logit contributions | |
groom | -0.034 |
pony | -0.033 |
chicken | -0.033 |
strawberry | -0.032 |
scar | -0.032 |
Token | an |
Token ID | 281 |
Feature activation | +2.35e-03 |
Pos logit contributions | |
eway | +0.001 |
ining | +0.001 |
kered | +0.001 |
ered | +0.001 |
ooks | +0.001 |
Neg logit contributions | |
groom | -0.001 |
scar | -0.001 |
burn | -0.001 |
salon | -0.001 |
pony | -0.001 |
Token | elderly |
Token ID | 13830 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
groom | +0.003 |
scar | +0.003 |
burn | +0.003 |
rob | +0.003 |
salon | +0.003 |
Neg logit contributions | |
eway | -0.005 |
ining | -0.004 |
ered | -0.004 |
earing | -0.004 |
kered | -0.004 |
Token | couple |
Token ID | 3155 |
Feature activation | -4.81e-02 |
Pos logit contributions | |
eway | +0.030 |
ining | +0.027 |
ooks | +0.026 |
kered | +0.026 |
earing | +0.026 |
Neg logit contributions | |
groom | -0.014 |
scar | -0.014 |
burn | -0.013 |
rob | -0.011 |
salon | -0.011 |
Token | who |
Token ID | 508 |
Feature activation | +5.63e-05 |
Pos logit contributions | |
eway | +0.075 |
ining | +0.064 |
ered | +0.062 |
kered | +0.061 |
ooks | +0.060 |
Neg logit contributions | |
groom | -0.094 |
scar | -0.088 |
burn | -0.086 |
pony | -0.085 |
salon | -0.082 |
Token | owned |
Token ID | 6898 |
Feature activation | -9.53e-04 |
Pos logit contributions | |
groom | +0.000 |
scar | +0.000 |
pony | +0.000 |
burn | +0.000 |
ponies | +0.000 |
Neg logit contributions | |
eway | -0.000 |
ining | -0.000 |
rum | -0.000 |
ooks | -0.000 |
earing | -0.000 |
Token | a |
Token ID | 257 |
Feature activation | +1.81e-02 |
Pos logit contributions | |
eway | +0.002 |
ining | +0.001 |
kered | +0.001 |
ered | +0.001 |
ooks | +0.001 |
Neg logit contributions | |
groom | -0.002 |
scar | -0.002 |
burn | -0.001 |
salon | -0.001 |
pony | -0.001 |
Token | big |
Token ID | 1263 |
Feature activation | +6.88e-03 |
Pos logit contributions | |
rob | +0.029 |
burn | +0.028 |
scar | +0.027 |
syrup | +0.026 |
Velvet | +0.026 |
Neg logit contributions | |
eway | -0.026 |
ining | -0.024 |
ooks | -0.023 |
Turns | -0.023 |
Everyone | -0.023 |
Token | farm |
Token ID | 5318 |
Feature activation | -2.84e-02 |
Pos logit contributions | |
burn | +0.011 |
rob | +0.010 |
groom | +0.010 |
scar | +0.010 |
Velvet | +0.010 |
Neg logit contributions | |
eway | -0.011 |
ining | -0.010 |
earing | -0.009 |
ooks | -0.009 |
Turns | -0.009 |