Token | take |
Token ID | 1011 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
spaghetti | +0.011 |
sidelines | +0.011 |
Seek | +0.010 |
menu | +0.009 |
bed | +0.009 |
Neg logit contributions | |
flew | -0.012 |
bul | -0.012 |
spe | -0.012 |
Bel | -0.011 |
pol | -0.011 |
Token | it |
Token ID | 340 |
Feature activation | +4.17e-03 |
Pos logit contributions | |
sidelines | +0.022 |
spaghetti | +0.020 |
menu | +0.019 |
Seek | +0.019 |
concession | +0.018 |
Neg logit contributions | |
flew | -0.017 |
bul | -0.015 |
soared | -0.014 |
pol | -0.014 |
hon | -0.014 |
Token | down |
Token ID | 866 |
Feature activation | +2.61e-03 |
Pos logit contributions | |
sidelines | +0.007 |
spaghetti | +0.007 |
menu | +0.006 |
Seek | +0.006 |
concession | +0.006 |
Neg logit contributions | |
flew | -0.006 |
bul | -0.005 |
spe | -0.005 |
esh | -0.005 |
pol | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
sidelines | +0.005 |
spaghetti | +0.004 |
Seek | +0.004 |
menu | +0.004 |
concession | +0.004 |
Neg logit contributions | |
flew | -0.004 |
bul | -0.003 |
spe | -0.003 |
soared | -0.003 |
mill | -0.003 |
Token | The |
Token ID | 383 |
Feature activation | +6.99e-03 |
Pos logit contributions | |
sidelines | +0.019 |
spaghetti | +0.018 |
menu | +0.017 |
bed | +0.016 |
hunting | +0.015 |
Neg logit contributions | |
bul | -0.015 |
spe | -0.014 |
paramed | -0.014 |
flew | -0.013 |
Or | -0.013 |
Token | company |
Token ID | 1664 |
Feature activation | +8.60e-02 |
Pos logit contributions | |
spaghetti | +0.012 |
sidelines | +0.011 |
Seek | +0.010 |
shady | +0.009 |
bed | +0.009 |
Neg logit contributions | |
spe | -0.010 |
flew | -0.010 |
bul | -0.010 |
rob | -0.009 |
paramed | -0.009 |
Token | paid |
Token ID | 3432 |
Feature activation | -6.18e-03 |
Pos logit contributions | |
spaghetti | +0.132 |
sidelines | +0.132 |
Seek | +0.116 |
menu | +0.112 |
bed | +0.110 |
Neg logit contributions | |
flew | -0.130 |
bul | -0.128 |
spe | -0.126 |
soared | -0.116 |
pre | -0.113 |
Token | a |
Token ID | 257 |
Feature activation | -2.60e-03 |
Pos logit contributions | |
flew | +0.011 |
bul | +0.011 |
spe | +0.010 |
pol | +0.010 |
soared | +0.010 |
Neg logit contributions | |
sidelines | -0.008 |
spaghetti | -0.008 |
menu | -0.007 |
Seek | -0.007 |
Want | -0.006 |
Token | lot |
Token ID | 1256 |
Feature activation | +2.95e-02 |
Pos logit contributions | |
spe | +0.004 |
bul | +0.004 |
flew | +0.004 |
paramed | +0.004 |
rob | +0.004 |
Neg logit contributions | |
spaghetti | -0.004 |
sidelines | -0.004 |
Seek | -0.004 |
concession | -0.003 |
bed | -0.003 |
Token | of |
Token ID | 286 |
Feature activation | -4.40e-03 |
Pos logit contributions | |
sidelines | +0.046 |
spaghetti | +0.044 |
Seek | +0.038 |
bed | +0.036 |
menu | +0.036 |
Neg logit contributions | |
bul | -0.046 |
flew | -0.045 |
spe | -0.045 |
Bel | -0.040 |
pol | -0.040 |
Token | money |
Token ID | 1637 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
flew | +0.007 |
bul | +0.006 |
spe | +0.006 |
rob | +0.006 |
paramed | +0.006 |
Neg logit contributions | |
sidelines | -0.007 |
spaghetti | -0.006 |
Seek | -0.006 |
Want | -0.006 |
concession | -0.005 |
Token | saw |
Token ID | 2497 |
Feature activation | +2.56e-02 |
Pos logit contributions | |
bul | +0.004 |
spe | +0.004 |
esh | +0.004 |
pre | +0.004 |
paramed | +0.004 |
Neg logit contributions | |
spaghetti | -0.006 |
sidelines | -0.006 |
Seek | -0.005 |
menu | -0.005 |
bed | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | +2.92e-02 |
Pos logit contributions | |
spaghetti | +0.041 |
sidelines | +0.041 |
Seek | +0.037 |
menu | +0.036 |
bed | +0.035 |
Neg logit contributions | |
flew | -0.036 |
bul | -0.036 |
spe | -0.035 |
paramed | -0.033 |
soared | -0.032 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
spaghetti | +0.048 |
Seek | +0.047 |
sidelines | +0.047 |
Control | +0.044 |
Want | +0.043 |
Neg logit contributions | |
flew | -0.037 |
spe | -0.035 |
blew | -0.033 |
bul | -0.032 |
soared | -0.031 |
Token | on |
Token ID | 319 |
Feature activation | +2.39e-02 |
Pos logit contributions | |
spaghetti | +0.022 |
sidelines | +0.022 |
Seek | +0.020 |
menu | +0.019 |
bed | +0.019 |
Neg logit contributions | |
flew | -0.020 |
bul | -0.020 |
spe | -0.019 |
soared | -0.018 |
pol | -0.018 |
Token | the |
Token ID | 262 |
Feature activation | +3.46e-02 |
Pos logit contributions | |
spaghetti | +0.041 |
sidelines | +0.040 |
Seek | +0.036 |
menu | +0.035 |
bed | +0.035 |
Neg logit contributions | |
bul | -0.031 |
flew | -0.031 |
spe | -0.031 |
Bel | -0.028 |
pol | -0.028 |
Token | other |
Token ID | 584 |
Feature activation | +8.35e-02 |
Pos logit contributions | |
spaghetti | +0.050 |
Want | +0.049 |
Seek | +0.048 |
Would | +0.046 |
Do | +0.045 |
Neg logit contributions | |
ostr | -0.048 |
flew | -0.047 |
k | -0.047 |
rob | -0.045 |
Or | -0.045 |
Token | side |
Token ID | 1735 |
Feature activation | +3.35e-02 |
Pos logit contributions | |
spaghetti | +0.112 |
sidelines | +0.107 |
Seek | +0.103 |
menu | +0.094 |
Want | +0.093 |
Neg logit contributions | |
flew | -0.130 |
spe | -0.124 |
ostr | -0.121 |
rob | -0.120 |
bul | -0.118 |
Token | and |
Token ID | 290 |
Feature activation | +4.34e-03 |
Pos logit contributions | |
sidelines | +0.057 |
spaghetti | +0.056 |
Seek | +0.052 |
menu | +0.049 |
robbers | +0.048 |
Neg logit contributions | |
spe | -0.045 |
flew | -0.045 |
bul | -0.044 |
soared | -0.038 |
mill | -0.038 |
Token | ran |
Token ID | 4966 |
Feature activation | -7.44e-03 |
Pos logit contributions | |
spaghetti | +0.008 |
sidelines | +0.008 |
Seek | +0.007 |
menu | +0.007 |
bed | +0.007 |
Neg logit contributions | |
bul | -0.005 |
spe | -0.005 |
flew | -0.005 |
pre | -0.005 |
paramed | -0.005 |
Token | across |
Token ID | 1973 |
Feature activation | -1.45e-02 |
Pos logit contributions | |
flew | +0.012 |
spe | +0.011 |
bul | +0.011 |
pol | +0.011 |
Bel | +0.011 |
Neg logit contributions | |
spaghetti | -0.011 |
sidelines | -0.011 |
Seek | -0.009 |
menu | -0.009 |
bed | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
flew | +0.018 |
spe | +0.018 |
bul | +0.017 |
soared | +0.016 |
esh | +0.016 |
Neg logit contributions | |
sidelines | -0.026 |
spaghetti | -0.026 |
Seek | -0.023 |
menu | -0.023 |
bed | -0.021 |
Token | liked |
Token ID | 8288 |
Feature activation | +2.90e-02 |
Pos logit contributions | |
spe | +0.005 |
bul | +0.005 |
xc | +0.004 |
paramed | +0.004 |
esh | +0.004 |
Neg logit contributions | |
spaghetti | -0.005 |
bone | -0.004 |
skeleton | -0.004 |
hunting | -0.004 |
menu | -0.004 |
Token | to |
Token ID | 284 |
Feature activation | +2.39e-02 |
Pos logit contributions | |
sidelines | +0.051 |
spaghetti | +0.046 |
Seek | +0.045 |
locker | +0.042 |
menu | +0.042 |
Neg logit contributions | |
flew | -0.038 |
bul | -0.037 |
spe | -0.034 |
paramed | -0.032 |
soared | -0.032 |
Token | hide |
Token ID | 7808 |
Feature activation | +4.37e-02 |
Pos logit contributions | |
spaghetti | +0.026 |
sidelines | +0.024 |
bed | +0.021 |
menu | +0.020 |
Seek | +0.020 |
Neg logit contributions | |
spe | -0.049 |
bul | -0.048 |
flew | -0.045 |
pre | -0.044 |
xc | -0.044 |
Token | in |
Token ID | 287 |
Feature activation | +1.32e-03 |
Pos logit contributions | |
sidelines | +0.079 |
spaghetti | +0.071 |
Seek | +0.067 |
Want | +0.066 |
menu | +0.064 |
Neg logit contributions | |
flew | -0.059 |
bul | -0.054 |
spe | -0.053 |
Bel | -0.050 |
esh | -0.050 |
Token | the |
Token ID | 262 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
sidelines | +0.003 |
icious | +0.003 |
ury | +0.003 |
spine | +0.003 |
ouring | +0.003 |
Neg logit contributions | |
flew | -0.001 |
esh | -0.001 |
spr | -0.001 |
bul | -0.001 |
spe | -0.001 |
Token | safe |
Token ID | 3338 |
Feature activation | +8.29e-02 |
Pos logit contributions | |
sidelines | +0.021 |
ours | +0.020 |
ouring | +0.020 |
gency | +0.020 |
assing | +0.019 |
Neg logit contributions | |
flew | -0.015 |
ostr | -0.014 |
went | -0.014 |
spr | -0.014 |
Bel | -0.013 |
Token | home |
Token ID | 1363 |
Feature activation | +4.09e-02 |
Pos logit contributions | |
sidelines | +0.113 |
spaghetti | +0.104 |
Seek | +0.092 |
ours | +0.090 |
Want | +0.089 |
Neg logit contributions | |
flew | -0.144 |
bul | -0.143 |
spe | -0.141 |
spr | -0.129 |
ostr | -0.129 |
Token | he |
Token ID | 339 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
sidelines | +0.092 |
spaghetti | +0.079 |
Want | +0.077 |
Seek | +0.076 |
concession | +0.074 |
Neg logit contributions | |
spe | -0.040 |
flew | -0.040 |
bul | -0.038 |
bel | -0.033 |
Or | -0.032 |
Token | had |
Token ID | 550 |
Feature activation | -5.62e-06 |
Pos logit contributions | |
sidelines | +0.045 |
spaghetti | +0.040 |
ours | +0.039 |
menu | +0.037 |
Seek | +0.036 |
Neg logit contributions | |
flew | -0.020 |
soared | -0.015 |
went | -0.014 |
walked | -0.014 |
blew | -0.013 |
Token | made |
Token ID | 925 |
Feature activation | -2.78e-03 |
Token | for |
Token ID | 329 |
Feature activation | +2.60e-02 |
Pos logit contributions | |
flew | +0.004 |
bul | +0.003 |
spe | +0.003 |
hon | +0.003 |
am | +0.003 |
Neg logit contributions | |
sidelines | -0.005 |
spaghetti | -0.004 |
Seek | -0.004 |
Want | -0.004 |
internet | -0.004 |
Token | take |
Token ID | 1011 |
Feature activation | +8.03e-03 |
Pos logit contributions | |
spaghetti | +0.005 |
sidelines | +0.004 |
Seek | +0.004 |
menu | +0.004 |
bed | +0.004 |
Neg logit contributions | |
flew | -0.005 |
bul | -0.005 |
spe | -0.005 |
Bel | -0.005 |
pol | -0.005 |
Token | it |
Token ID | 340 |
Feature activation | -1.06e-04 |
Pos logit contributions | |
sidelines | +0.014 |
spaghetti | +0.013 |
jar | +0.013 |
menu | +0.013 |
concession | +0.012 |
Neg logit contributions | |
flew | -0.011 |
bul | -0.009 |
soared | -0.009 |
pol | -0.009 |
hon | -0.008 |
Token | down |
Token ID | 866 |
Feature activation | -2.29e-03 |
Pos logit contributions | |
flew | +0.000 |
bul | +0.000 |
spe | +0.000 |
esh | +0.000 |
pol | +0.000 |
Neg logit contributions | |
sidelines | -0.000 |
spaghetti | -0.000 |
menu | -0.000 |
concession | -0.000 |
Seek | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +8.85e-03 |
Pos logit contributions | |
flew | +0.003 |
bul | +0.003 |
spe | +0.003 |
soared | +0.003 |
mill | +0.003 |
Neg logit contributions | |
sidelines | -0.004 |
spaghetti | -0.004 |
Seek | -0.003 |
menu | -0.003 |
concession | -0.003 |
Token | The |
Token ID | 383 |
Feature activation | +3.57e-03 |
Pos logit contributions | |
sidelines | +0.015 |
spaghetti | +0.015 |
menu | +0.014 |
bed | +0.013 |
hunting | +0.012 |
Neg logit contributions | |
bul | -0.012 |
spe | -0.011 |
paramed | -0.011 |
flew | -0.010 |
Or | -0.010 |
Token | company |
Token ID | 1664 |
Feature activation | +8.29e-02 |
Pos logit contributions | |
spaghetti | +0.006 |
sidelines | +0.006 |
Seek | +0.005 |
shady | +0.005 |
bed | +0.005 |
Neg logit contributions | |
spe | -0.005 |
bul | -0.005 |
flew | -0.005 |
rob | -0.005 |
paramed | -0.005 |
Token | paid |
Token ID | 3432 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
spaghetti | +0.128 |
sidelines | +0.128 |
Seek | +0.112 |
menu | +0.108 |
bed | +0.106 |
Neg logit contributions | |
flew | -0.125 |
bul | -0.123 |
spe | -0.121 |
soared | -0.111 |
pre | -0.109 |
Token | a |
Token ID | 257 |
Feature activation | -6.72e-03 |
Pos logit contributions | |
flew | +0.018 |
bul | +0.017 |
spe | +0.017 |
pol | +0.016 |
soared | +0.016 |
Neg logit contributions | |
sidelines | -0.013 |
spaghetti | -0.013 |
menu | -0.011 |
Seek | -0.011 |
Want | -0.010 |
Token | lot |
Token ID | 1256 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
spe | +0.010 |
bul | +0.010 |
flew | +0.010 |
paramed | +0.009 |
rob | +0.009 |
Neg logit contributions | |
spaghetti | -0.011 |
sidelines | -0.010 |
Seek | -0.009 |
concession | -0.008 |
bed | -0.008 |
Token | of |
Token ID | 286 |
Feature activation | -6.73e-03 |
Pos logit contributions | |
sidelines | +0.040 |
spaghetti | +0.038 |
Seek | +0.033 |
bed | +0.032 |
menu | +0.032 |
Neg logit contributions | |
bul | -0.041 |
flew | -0.041 |
spe | -0.040 |
blew | -0.036 |
Bel | -0.036 |
Token | money |
Token ID | 1637 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
flew | +0.010 |
bul | +0.010 |
rob | +0.009 |
spe | +0.009 |
paramed | +0.009 |
Neg logit contributions | |
sidelines | -0.010 |
spaghetti | -0.010 |
Seek | -0.009 |
Want | -0.009 |
concession | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -7.26e-03 |
Pos logit contributions | |
flew | +0.015 |
bul | +0.015 |
spe | +0.014 |
Bel | +0.013 |
pre | +0.013 |
Neg logit contributions | |
sidelines | -0.016 |
spaghetti | -0.015 |
Seek | -0.014 |
menu | -0.013 |
internet | -0.013 |
Token | Wra |
Token ID | 27323 |
Feature activation | -6.65e-03 |
Pos logit contributions | |
bul | +0.012 |
flew | +0.012 |
spe | +0.011 |
Bel | +0.011 |
paramed | +0.011 |
Neg logit contributions | |
spaghetti | -0.010 |
sidelines | -0.010 |
Seek | -0.009 |
menu | -0.009 |
bed | -0.008 |
Token | pped |
Token ID | 1496 |
Feature activation | +3.32e-02 |
Pos logit contributions | |
spe | +0.013 |
bul | +0.013 |
flew | +0.012 |
pre | +0.012 |
Or | +0.012 |
Neg logit contributions | |
sidelines | -0.007 |
spaghetti | -0.006 |
Seek | -0.005 |
liking | -0.005 |
mine | -0.005 |
Token | in |
Token ID | 287 |
Feature activation | +3.82e-03 |
Pos logit contributions | |
sidelines | +0.053 |
spaghetti | +0.053 |
Seek | +0.048 |
menu | +0.046 |
bed | +0.044 |
Neg logit contributions | |
flew | -0.048 |
bul | -0.047 |
spe | -0.045 |
soared | -0.042 |
pol | -0.042 |
Token | the |
Token ID | 262 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
sidelines | +0.007 |
spaghetti | +0.007 |
Seek | +0.006 |
menu | +0.006 |
internet | +0.006 |
Neg logit contributions | |
flew | -0.005 |
bul | -0.005 |
spe | -0.004 |
soared | -0.004 |
blew | -0.004 |
Token | cozy |
Token ID | 37438 |
Feature activation | +8.24e-02 |
Pos logit contributions | |
spaghetti | +0.016 |
sidelines | +0.015 |
Seek | +0.015 |
ours | +0.014 |
Want | +0.013 |
Neg logit contributions | |
bul | -0.020 |
flew | -0.019 |
spe | -0.019 |
paramed | -0.019 |
pre | -0.018 |
Token | qu |
Token ID | 627 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
spaghetti | +0.103 |
sidelines | +0.098 |
Seek | +0.092 |
ours | +0.084 |
menu | +0.081 |
Neg logit contributions | |
bul | -0.151 |
flew | -0.148 |
spe | -0.145 |
paramed | -0.138 |
esh | -0.136 |
Token | ilt |
Token ID | 2326 |
Feature activation | +2.74e-02 |
Pos logit contributions | |
spaghetti | +0.032 |
sidelines | +0.032 |
Seek | +0.029 |
menu | +0.029 |
robbers | +0.028 |
Neg logit contributions | |
bul | -0.024 |
flew | -0.024 |
spe | -0.023 |
Bel | -0.021 |
paramed | -0.021 |
Token | , |
Token ID | 11 |
Feature activation | +2.97e-03 |
Pos logit contributions | |
sidelines | +0.045 |
spaghetti | +0.044 |
Seek | +0.040 |
menu | +0.038 |
ours | +0.037 |
Neg logit contributions | |
flew | -0.038 |
bul | -0.037 |
spe | -0.036 |
soared | -0.033 |
Bel | -0.033 |
Token | he |
Token ID | 339 |
Feature activation | +1.80e-02 |
Pos logit contributions | |
sidelines | +0.005 |
spaghetti | +0.005 |
Seek | +0.004 |
menu | +0.004 |
bed | +0.004 |
Neg logit contributions | |
flew | -0.004 |
bul | -0.004 |
spe | -0.004 |
soared | -0.004 |
Bel | -0.004 |
Token | returned |
Token ID | 4504 |
Feature activation | +6.99e-03 |
Pos logit contributions | |
spaghetti | +0.031 |
sidelines | +0.029 |
Seek | +0.027 |
bed | +0.027 |
menu | +0.026 |
Neg logit contributions | |
bul | -0.023 |
paramed | -0.021 |
spe | -0.021 |
xc | -0.021 |
pre | -0.021 |
Token | saw |
Token ID | 2497 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
spaghetti | +0.039 |
sidelines | +0.039 |
Seek | +0.035 |
menu | +0.034 |
bed | +0.034 |
Neg logit contributions | |
bul | -0.030 |
flew | -0.029 |
spe | -0.029 |
paramed | -0.026 |
pol | -0.026 |
Token | her |
Token ID | 607 |
Feature activation | +2.19e-02 |
Pos logit contributions | |
spaghetti | +0.032 |
sidelines | +0.031 |
Seek | +0.027 |
bed | +0.026 |
menu | +0.026 |
Neg logit contributions | |
bul | -0.035 |
spe | -0.035 |
flew | -0.034 |
pol | -0.032 |
pre | -0.032 |
Token | mother |
Token ID | 2802 |
Feature activation | +2.47e-03 |
Pos logit contributions | |
sidelines | +0.047 |
spaghetti | +0.045 |
Seek | +0.043 |
Want | +0.041 |
menu | +0.040 |
Neg logit contributions | |
flew | -0.020 |
bul | -0.020 |
spe | -0.019 |
Bel | -0.017 |
rob | -0.016 |
Token | holding |
Token ID | 4769 |
Feature activation | +1.57e-03 |
Pos logit contributions | |
spaghetti | +0.004 |
sidelines | +0.004 |
Seek | +0.003 |
menu | +0.003 |
ours | +0.003 |
Neg logit contributions | |
flew | -0.004 |
bul | -0.004 |
spe | -0.004 |
soared | -0.003 |
pol | -0.003 |
Token | a |
Token ID | 257 |
Feature activation | +1.21e-03 |
Pos logit contributions | |
sidelines | +0.003 |
spaghetti | +0.003 |
Seek | +0.003 |
menu | +0.003 |
internet | +0.003 |
Neg logit contributions | |
flew | -0.002 |
bul | -0.002 |
pol | -0.002 |
Bel | -0.002 |
soared | -0.002 |
Token | freshly |
Token ID | 29026 |
Feature activation | +8.22e-02 |
Pos logit contributions | |
sidelines | +0.002 |
Seek | +0.002 |
spaghetti | +0.002 |
Want | +0.002 |
concession | +0.002 |
Neg logit contributions | |
bul | -0.002 |
flew | -0.002 |
rob | -0.002 |
paramed | -0.002 |
blew | -0.002 |
Token | - |
Token ID | 12 |
Feature activation | -5.99e-03 |
Pos logit contributions | |
sidelines | +0.146 |
spaghetti | +0.143 |
Seek | +0.130 |
menu | +0.125 |
bed | +0.124 |
Neg logit contributions | |
flew | -0.106 |
bul | -0.102 |
spe | -0.096 |
pol | -0.094 |
soared | -0.093 |
Token | b |
Token ID | 65 |
Feature activation | -3.34e-02 |
Pos logit contributions | |
bul | +0.009 |
flew | +0.009 |
spe | +0.009 |
soared | +0.008 |
paramed | +0.008 |
Neg logit contributions | |
spaghetti | -0.009 |
sidelines | -0.009 |
Seek | -0.008 |
menu | -0.008 |
bed | -0.007 |
Token | aked |
Token ID | 4335 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
spe | +0.050 |
flew | +0.046 |
Or | +0.046 |
paramed | +0.044 |
bul | +0.044 |
Neg logit contributions | |
spaghetti | -0.051 |
bed | -0.044 |
anywhere | -0.043 |
menu | -0.043 |
bone | -0.043 |
Token | muff |
Token ID | 27563 |
Feature activation | -3.02e-02 |
Pos logit contributions | |
bul | +0.018 |
spe | +0.018 |
flew | +0.018 |
Bel | +0.016 |
pre | +0.016 |
Neg logit contributions | |
spaghetti | -0.015 |
sidelines | -0.015 |
Seek | -0.013 |
menu | -0.013 |
bed | -0.012 |
Token | in |
Token ID | 259 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
bul | +0.026 |
flew | +0.025 |
spe | +0.025 |
pol | +0.021 |
Bel | +0.021 |
Neg logit contributions | |
sidelines | -0.066 |
spaghetti | -0.066 |
Seek | -0.060 |
menu | -0.059 |
bed | -0.058 |
Token | many |
Token ID | 867 |
Feature activation | +5.20e-02 |
Pos logit contributions | |
sidelines | +0.044 |
spaghetti | +0.043 |
Seek | +0.039 |
menu | +0.037 |
bed | +0.036 |
Neg logit contributions | |
flew | -0.041 |
bul | -0.041 |
spe | -0.040 |
paramed | -0.037 |
soared | -0.036 |
Token | books |
Token ID | 3835 |
Feature activation | +2.77e-02 |
Pos logit contributions | |
sidelines | +0.085 |
spine | +0.066 |
spaghetti | +0.066 |
Want | +0.065 |
ours | +0.064 |
Neg logit contributions | |
flew | -0.077 |
bul | -0.075 |
spe | -0.073 |
ira | -0.071 |
ele | -0.070 |
Token | on |
Token ID | 319 |
Feature activation | +2.52e-02 |
Pos logit contributions | |
sidelines | +0.058 |
spaghetti | +0.053 |
Seek | +0.050 |
robbers | +0.049 |
Want | +0.048 |
Neg logit contributions | |
flew | -0.033 |
bul | -0.028 |
spe | -0.025 |
blew | -0.025 |
soared | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | +3.84e-02 |
Pos logit contributions | |
sidelines | +0.048 |
spaghetti | +0.046 |
Seek | +0.043 |
menu | +0.040 |
Want | +0.040 |
Neg logit contributions | |
flew | -0.029 |
bul | -0.028 |
spe | -0.027 |
esh | -0.024 |
soared | -0.024 |
Token | books |
Token ID | 3835 |
Feature activation | +4.99e-02 |
Pos logit contributions | |
sidelines | +0.046 |
spaghetti | +0.043 |
Want | +0.041 |
Seek | +0.038 |
ours | +0.038 |
Neg logit contributions | |
ostr | -0.060 |
flew | -0.059 |
spe | -0.059 |
Or | -0.058 |
ira | -0.057 |
Token | he |
Token ID | 258 |
Feature activation | +8.20e-02 |
Pos logit contributions | |
sidelines | +0.097 |
spaghetti | +0.089 |
robbers | +0.085 |
Seek | +0.084 |
unnecessary | +0.083 |
Neg logit contributions | |
flew | -0.061 |
bul | -0.054 |
spe | -0.052 |
master | -0.051 |
blew | -0.049 |
Token | lf |
Token ID | 1652 |
Feature activation | +1.99e-04 |
Pos logit contributions | |
spaghetti | +0.113 |
sidelines | +0.110 |
Seek | +0.096 |
menu | +0.095 |
bed | +0.094 |
Neg logit contributions | |
bul | -0.136 |
flew | -0.134 |
spe | -0.133 |
Bel | -0.126 |
paramed | -0.126 |
Token | . |
Token ID | 13 |
Feature activation | +1.66e-02 |
Pos logit contributions | |
sidelines | +0.000 |
spaghetti | +0.000 |
Seek | +0.000 |
menu | +0.000 |
Want | +0.000 |
Neg logit contributions | |
flew | -0.000 |
spe | -0.000 |
bul | -0.000 |
soared | -0.000 |
pol | -0.000 |
Token | He |
Token ID | 679 |
Feature activation | +7.36e-03 |
Pos logit contributions | |
sidelines | +0.033 |
spaghetti | +0.029 |
Seek | +0.028 |
ours | +0.027 |
hunting | +0.027 |
Neg logit contributions | |
flew | -0.017 |
ira | -0.016 |
spe | -0.015 |
hon | -0.015 |
Ale | -0.015 |
Token | wanted |
Token ID | 2227 |
Feature activation | +1.45e-02 |
Pos logit contributions | |
spaghetti | +0.011 |
Seek | +0.010 |
sidelines | +0.009 |
robbers | +0.009 |
menu | +0.009 |
Neg logit contributions | |
bul | -0.012 |
spe | -0.011 |
esh | -0.011 |
pre | -0.011 |
paramed | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | +2.84e-02 |
Pos logit contributions | |
sidelines | +0.028 |
spaghetti | +0.024 |
Seek | +0.023 |
Want | +0.022 |
internet | +0.022 |
Neg logit contributions | |
flew | -0.018 |
bul | -0.017 |
spe | -0.017 |
pol | -0.015 |
paramed | -0.015 |
Token | saw |
Token ID | 2497 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
spaghetti | +0.010 |
sidelines | +0.009 |
Seek | +0.008 |
menu | +0.008 |
bed | +0.008 |
Neg logit contributions | |
bul | -0.012 |
paramed | -0.011 |
spe | -0.011 |
pre | -0.010 |
esh | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | +1.59e-02 |
Pos logit contributions | |
spaghetti | +0.024 |
sidelines | +0.023 |
Seek | +0.020 |
menu | +0.020 |
bed | +0.020 |
Neg logit contributions | |
bul | -0.025 |
spe | -0.025 |
flew | -0.024 |
pol | -0.023 |
pre | -0.023 |
Token | hoop |
Token ID | 44792 |
Feature activation | +2.88e-03 |
Pos logit contributions | |
sidelines | +0.028 |
spaghetti | +0.027 |
Seek | +0.026 |
ours | +0.025 |
spine | +0.024 |
Neg logit contributions | |
flew | -0.020 |
rob | -0.019 |
blew | -0.018 |
bul | -0.017 |
spr | -0.017 |
Token | at |
Token ID | 379 |
Feature activation | -1.33e-02 |
Pos logit contributions | |
spaghetti | +0.004 |
sidelines | +0.004 |
Seek | +0.004 |
menu | +0.004 |
bed | +0.004 |
Neg logit contributions | |
flew | -0.004 |
bul | -0.004 |
spe | -0.004 |
soared | -0.004 |
pol | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +3.56e-02 |
Pos logit contributions | |
flew | +0.016 |
bul | +0.016 |
spe | +0.015 |
Bel | +0.014 |
pol | +0.014 |
Neg logit contributions | |
spaghetti | -0.024 |
sidelines | -0.024 |
Seek | -0.022 |
menu | -0.021 |
Want | -0.020 |
Token | other |
Token ID | 584 |
Feature activation | +8.20e-02 |
Pos logit contributions | |
spaghetti | +0.063 |
Seek | +0.061 |
Want | +0.061 |
and | +0.060 |
run | +0.060 |
Neg logit contributions | |
flew | -0.037 |
spr | -0.037 |
k | -0.033 |
Bel | -0.032 |
ostr | -0.032 |
Token | end |
Token ID | 886 |
Feature activation | +2.97e-02 |
Pos logit contributions | |
sidelines | +0.123 |
spaghetti | +0.120 |
brand | +0.110 |
Seek | +0.109 |
ours | +0.108 |
Neg logit contributions | |
flew | -0.119 |
spr | -0.111 |
Bel | -0.105 |
went | -0.104 |
Or | -0.102 |
Token | of |
Token ID | 286 |
Feature activation | -5.48e-04 |
Pos logit contributions | |
spaghetti | +0.043 |
sidelines | +0.041 |
Seek | +0.037 |
menu | +0.036 |
bed | +0.036 |
Neg logit contributions | |
bul | -0.046 |
flew | -0.046 |
spe | -0.045 |
paramed | -0.043 |
Bel | -0.042 |
Token | the |
Token ID | 262 |
Feature activation | +1.02e-03 |
Pos logit contributions | |
flew | +0.001 |
bul | +0.001 |
spe | +0.001 |
Bel | +0.001 |
Sher | +0.000 |
Neg logit contributions | |
sidelines | -0.001 |
spaghetti | -0.001 |
Seek | -0.001 |
menu | -0.001 |
Want | -0.001 |
Token | field |
Token ID | 2214 |
Feature activation | +1.88e-02 |
Pos logit contributions | |
sidelines | +0.002 |
spaghetti | +0.002 |
Nice | +0.002 |
ocket | +0.002 |
Deal | +0.002 |
Neg logit contributions | |
flew | -0.001 |
Bel | -0.001 |
blew | -0.001 |
k | -0.001 |
went | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
sidelines | +0.034 |
spaghetti | +0.034 |
Seek | +0.031 |
menu | +0.029 |
robbers | +0.029 |
Neg logit contributions | |
flew | -0.024 |
spe | -0.022 |
bul | -0.022 |
soared | -0.020 |
Bel | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
spaghetti | +0.054 |
sidelines | +0.053 |
Seek | +0.048 |
menu | +0.047 |
bed | +0.046 |
Neg logit contributions | |
bul | -0.044 |
spe | -0.042 |
flew | -0.041 |
pol | -0.039 |
paramed | -0.039 |
Token |
|
Token ID | 198 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
sidelines | +0.028 |
spaghetti | +0.026 |
menu | +0.024 |
Seek | +0.024 |
internet | +0.023 |
Neg logit contributions | |
flew | -0.014 |
hon | -0.013 |
bul | -0.013 |
spe | -0.013 |
paramed | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | +1.54e-02 |
Pos logit contributions | |
sidelines | +0.023 |
spaghetti | +0.023 |
Seek | +0.020 |
menu | +0.020 |
bed | +0.019 |
Neg logit contributions | |
flew | -0.018 |
bul | -0.017 |
spe | -0.017 |
Bel | -0.016 |
pol | -0.016 |
Token | " |
Token ID | 1 |
Feature activation | -2.72e-03 |
Pos logit contributions | |
sidelines | +0.027 |
spaghetti | +0.027 |
Seek | +0.025 |
menu | +0.023 |
robbers | +0.023 |
Neg logit contributions | |
bul | -0.021 |
spe | -0.019 |
flew | -0.019 |
pre | -0.018 |
pol | -0.018 |
Token | W |
Token ID | 54 |
Feature activation | +3.42e-02 |
Pos logit contributions | |
spe | +0.005 |
bul | +0.005 |
imm | +0.005 |
am | +0.005 |
ered | +0.005 |
Neg logit contributions | |
sidelines | -0.003 |
spaghetti | -0.003 |
robbers | -0.003 |
Seek | -0.003 |
Want | -0.003 |
Token | OO |
Token ID | 6684 |
Feature activation | +8.19e-02 |
Pos logit contributions | |
sidelines | +0.062 |
spaghetti | +0.060 |
Seek | +0.058 |
bed | +0.053 |
internet | +0.053 |
Neg logit contributions | |
flew | -0.041 |
ah | -0.040 |
cker | -0.039 |
ck | -0.038 |
hon | -0.038 |
Token | F |
Token ID | 37 |
Feature activation | +4.36e-02 |
Pos logit contributions | |
spaghetti | +0.128 |
sidelines | +0.126 |
menu | +0.112 |
bed | +0.111 |
Seek | +0.109 |
Neg logit contributions | |
flew | -0.123 |
Bel | -0.111 |
hon | -0.110 |
bul | -0.109 |
spe | -0.109 |
Token | ! |
Token ID | 0 |
Feature activation | +3.26e-02 |
Pos logit contributions | |
spaghetti | +0.083 |
sidelines | +0.082 |
Seek | +0.076 |
menu | +0.072 |
bed | +0.070 |
Neg logit contributions | |
flew | -0.049 |
bul | -0.047 |
spe | -0.046 |
Bel | -0.043 |
pre | -0.043 |
Token | W |
Token ID | 370 |
Feature activation | +1.66e-03 |
Pos logit contributions | |
sidelines | +0.042 |
spaghetti | +0.041 |
Seek | +0.035 |
menu | +0.034 |
bed | +0.033 |
Neg logit contributions | |
flew | -0.056 |
spe | -0.056 |
bul | -0.056 |
paramed | -0.054 |
pre | -0.052 |
Token | OO |
Token ID | 6684 |
Feature activation | +7.42e-02 |
Pos logit contributions | |
spaghetti | +0.003 |
sidelines | +0.003 |
Seek | +0.003 |
bed | +0.003 |
robbers | +0.003 |
Neg logit contributions | |
flew | -0.002 |
ira | -0.002 |
pre | -0.002 |
hon | -0.002 |
irled | -0.002 |
Token | F |
Token ID | 37 |
Feature activation | +4.16e-02 |
Pos logit contributions | |
spaghetti | +0.115 |
sidelines | +0.113 |
menu | +0.102 |
bed | +0.101 |
internet | +0.099 |
Neg logit contributions | |
flew | -0.113 |
Bel | -0.102 |
hon | -0.101 |
soared | -0.099 |
swoop | -0.098 |
Token | 't |
Token ID | 470 |
Feature activation | +2.18e-02 |
Pos logit contributions | |
spaghetti | +0.002 |
sidelines | +0.002 |
Seek | +0.002 |
bed | +0.002 |
menu | +0.002 |
Neg logit contributions | |
spe | -0.004 |
flew | -0.004 |
bul | -0.004 |
xc | -0.004 |
soared | -0.004 |
Token | like |
Token ID | 588 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
spaghetti | +0.025 |
sidelines | +0.024 |
Seek | +0.021 |
bed | +0.021 |
menu | +0.020 |
Neg logit contributions | |
spe | -0.041 |
bul | -0.040 |
flew | -0.040 |
xc | -0.038 |
esh | -0.038 |
Token | to |
Token ID | 284 |
Feature activation | +2.11e-02 |
Pos logit contributions | |
spaghetti | +0.026 |
sidelines | +0.026 |
Seek | +0.023 |
menu | +0.022 |
bed | +0.022 |
Neg logit contributions | |
bul | -0.029 |
flew | -0.029 |
spe | -0.028 |
Bel | -0.026 |
pol | -0.026 |
Token | fill |
Token ID | 6070 |
Feature activation | +6.23e-03 |
Pos logit contributions | |
spaghetti | +0.028 |
sidelines | +0.027 |
Seek | +0.023 |
bed | +0.023 |
menu | +0.023 |
Neg logit contributions | |
bul | -0.037 |
spe | -0.036 |
flew | -0.036 |
Bel | -0.033 |
pre | -0.033 |
Token | the |
Token ID | 262 |
Feature activation | +2.16e-02 |
Pos logit contributions | |
sidelines | +0.015 |
spaghetti | +0.013 |
Seek | +0.013 |
Want | +0.013 |
robbers | +0.013 |
Neg logit contributions | |
flew | -0.005 |
bul | -0.004 |
pol | -0.004 |
Bel | -0.004 |
spe | -0.004 |
Token | usual |
Token ID | 6678 |
Feature activation | +8.17e-02 |
Pos logit contributions | |
sidelines | +0.033 |
Seek | +0.030 |
Want | +0.029 |
spaghetti | +0.029 |
robbers | +0.027 |
Neg logit contributions | |
bul | -0.033 |
spe | -0.031 |
flew | -0.031 |
pre | -0.031 |
spr | -0.031 |
Token | things |
Token ID | 1243 |
Feature activation | -1.75e-04 |
Pos logit contributions | |
sidelines | +0.107 |
spaghetti | +0.095 |
Seek | +0.090 |
Want | +0.087 |
ours | +0.080 |
Neg logit contributions | |
bul | -0.141 |
flew | -0.141 |
spe | -0.140 |
spr | -0.129 |
soared | -0.128 |
Token | like |
Token ID | 588 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
flew | +0.000 |
bul | +0.000 |
spe | +0.000 |
pol | +0.000 |
soared | +0.000 |
Neg logit contributions | |
sidelines | -0.000 |
spaghetti | -0.000 |
Seek | -0.000 |
robbers | -0.000 |
Want | -0.000 |
Token | buckets |
Token ID | 38674 |
Feature activation | +3.77e-02 |
Pos logit contributions | |
sidelines | +0.030 |
spaghetti | +0.030 |
Seek | +0.027 |
menu | +0.025 |
bed | +0.024 |
Neg logit contributions | |
flew | -0.030 |
bul | -0.030 |
spe | -0.029 |
soared | -0.027 |
pol | -0.027 |
Token | and |
Token ID | 290 |
Feature activation | +6.52e-03 |
Pos logit contributions | |
sidelines | +0.075 |
spaghetti | +0.068 |
Seek | +0.064 |
Want | +0.063 |
concession | +0.061 |
Neg logit contributions | |
flew | -0.044 |
bul | -0.042 |
spe | -0.039 |
soared | -0.036 |
pol | -0.035 |
Token | cups |
Token ID | 14180 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
sidelines | +0.010 |
spaghetti | +0.009 |
Seek | +0.008 |
Want | +0.008 |
oring | +0.008 |
Neg logit contributions | |
flew | -0.010 |
spe | -0.010 |
bul | -0.010 |
blew | -0.009 |
soared | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
spaghetti | +0.025 |
sidelines | +0.025 |
Seek | +0.022 |
menu | +0.021 |
bed | +0.021 |
Neg logit contributions | |
bul | -0.026 |
flew | -0.026 |
spe | -0.026 |
Bel | -0.023 |
pre | -0.023 |
Token | Ben |
Token ID | 3932 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
sidelines | +0.033 |
spaghetti | +0.031 |
Seek | +0.030 |
mine | +0.028 |
ours | +0.028 |
Neg logit contributions | |
flew | -0.020 |
Bel | -0.020 |
bul | -0.019 |
ira | -0.018 |
spe | -0.018 |
Token | lives |
Token ID | 3160 |
Feature activation | +5.17e-03 |
Pos logit contributions | |
spaghetti | +0.014 |
sidelines | +0.013 |
menu | +0.012 |
Seek | +0.012 |
bed | +0.011 |
Neg logit contributions | |
bul | -0.018 |
spe | -0.017 |
flew | -0.016 |
paramed | -0.016 |
pol | -0.016 |
Token | on |
Token ID | 319 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
sidelines | +0.009 |
spaghetti | +0.009 |
Seek | +0.008 |
menu | +0.007 |
bed | +0.007 |
Neg logit contributions | |
flew | -0.007 |
spe | -0.007 |
bul | -0.007 |
pol | -0.006 |
soared | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +2.93e-02 |
Pos logit contributions | |
sidelines | +0.032 |
spaghetti | +0.032 |
Seek | +0.029 |
menu | +0.028 |
Want | +0.027 |
Neg logit contributions | |
flew | -0.024 |
bul | -0.023 |
spe | -0.023 |
soared | -0.021 |
Bel | -0.021 |
Token | other |
Token ID | 584 |
Feature activation | +8.16e-02 |
Pos logit contributions | |
spaghetti | +0.045 |
Seek | +0.041 |
Want | +0.040 |
sidelines | +0.038 |
Do | +0.037 |
Neg logit contributions | |
flew | -0.043 |
spe | -0.042 |
ostr | -0.040 |
spr | -0.040 |
bul | -0.040 |
Token | part |
Token ID | 636 |
Feature activation | +2.78e-02 |
Pos logit contributions | |
spaghetti | +0.101 |
sidelines | +0.089 |
Seek | +0.084 |
menu | +0.074 |
Want | +0.074 |
Neg logit contributions | |
spe | -0.153 |
flew | -0.152 |
bul | -0.147 |
ostr | -0.139 |
rob | -0.139 |
Token | . |
Token ID | 13 |
Feature activation | +1.92e-02 |
Pos logit contributions | |
spaghetti | +0.043 |
sidelines | +0.043 |
Seek | +0.039 |
menu | +0.036 |
robbers | +0.035 |
Neg logit contributions | |
spe | -0.041 |
bul | -0.041 |
flew | -0.040 |
soared | -0.036 |
pre | -0.035 |
Token |
|
Token ID | 198 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
sidelines | +0.035 |
spaghetti | +0.034 |
Seek | +0.031 |
ours | +0.030 |
mine | +0.030 |
Neg logit contributions | |
flew | -0.021 |
spe | -0.021 |
bul | -0.021 |
Bel | -0.020 |
Ale | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
sidelines | +0.029 |
spaghetti | +0.029 |
Seek | +0.026 |
menu | +0.025 |
robbers | +0.025 |
Neg logit contributions | |
flew | -0.019 |
spe | -0.018 |
bul | -0.018 |
Bel | -0.018 |
Sher | -0.017 |
Token | One |
Token ID | 3198 |
Feature activation | +8.19e-03 |
Pos logit contributions | |
spaghetti | +0.029 |
sidelines | +0.029 |
Seek | +0.026 |
menu | +0.026 |
bed | +0.025 |
Neg logit contributions | |
bul | -0.022 |
flew | -0.022 |
spe | -0.021 |
pol | -0.019 |
pre | -0.019 |
Token | big |
Token ID | 1263 |
Feature activation | +5.39e-03 |
Pos logit contributions | |
sidelines | +0.039 |
spaghetti | +0.037 |
Seek | +0.036 |
ours | +0.033 |
concession | +0.033 |
Neg logit contributions | |
flew | -0.027 |
rob | -0.026 |
bul | -0.025 |
blew | -0.025 |
paramed | -0.025 |
Token | red |
Token ID | 2266 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
sidelines | +0.010 |
Seek | +0.010 |
spaghetti | +0.009 |
and | +0.009 |
concession | +0.009 |
Neg logit contributions | |
flew | -0.007 |
ostr | -0.006 |
spr | -0.006 |
rob | -0.006 |
k | -0.006 |
Token | ball |
Token ID | 2613 |
Feature activation | -5.68e-04 |
Pos logit contributions | |
flew | +0.015 |
bul | +0.015 |
paramed | +0.013 |
spe | +0.013 |
pre | +0.013 |
Neg logit contributions | |
sidelines | -0.016 |
spaghetti | -0.016 |
Seek | -0.015 |
ours | -0.013 |
internet | -0.013 |
Token | on |
Token ID | 319 |
Feature activation | +2.18e-02 |
Pos logit contributions | |
bul | +0.001 |
flew | +0.001 |
spe | +0.001 |
pol | +0.001 |
Bel | +0.001 |
Neg logit contributions | |
spaghetti | -0.001 |
sidelines | -0.001 |
Seek | -0.001 |
menu | -0.001 |
bed | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +3.41e-02 |
Pos logit contributions | |
spaghetti | +0.036 |
sidelines | +0.036 |
Seek | +0.032 |
menu | +0.031 |
bed | +0.031 |
Neg logit contributions | |
bul | -0.030 |
flew | -0.029 |
spe | -0.029 |
Bel | -0.026 |
pre | -0.026 |
Token | other |
Token ID | 584 |
Feature activation | +8.15e-02 |
Pos logit contributions | |
spaghetti | +0.052 |
Seek | +0.051 |
Want | +0.050 |
Would | +0.049 |
sidelines | +0.047 |
Neg logit contributions | |
ostr | -0.046 |
flew | -0.045 |
k | -0.045 |
rob | -0.043 |
spr | -0.042 |
Token | side |
Token ID | 1735 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
spaghetti | +0.112 |
sidelines | +0.109 |
Seek | +0.101 |
handsome | +0.093 |
menu | +0.092 |
Neg logit contributions | |
flew | -0.132 |
ostr | -0.123 |
spr | -0.121 |
rob | -0.120 |
spe | -0.118 |
Token | of |
Token ID | 286 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
sidelines | +0.051 |
spaghetti | +0.049 |
Seek | +0.045 |
menu | +0.044 |
robbers | +0.042 |
Neg logit contributions | |
flew | -0.039 |
bul | -0.039 |
spe | -0.039 |
pol | -0.034 |
soared | -0.034 |
Token | the |
Token ID | 262 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
sidelines | +0.038 |
spaghetti | +0.036 |
Seek | +0.036 |
menu | +0.034 |
Want | +0.034 |
Neg logit contributions | |
flew | -0.018 |
bul | -0.017 |
blew | -0.014 |
rob | -0.014 |
spe | -0.014 |
Token | fence |
Token ID | 13990 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
sidelines | +0.028 |
spaghetti | +0.028 |
Seek | +0.026 |
Want | +0.025 |
Nice | +0.025 |
Neg logit contributions | |
flew | -0.021 |
k | -0.020 |
spr | -0.020 |
ostr | -0.020 |
went | -0.019 |
Token | . |
Token ID | 13 |
Feature activation | +5.96e-03 |
Pos logit contributions | |
sidelines | +0.024 |
spaghetti | +0.023 |
Seek | +0.022 |
robbers | +0.021 |
menu | +0.021 |
Neg logit contributions | |
flew | -0.013 |
bul | -0.010 |
spe | -0.010 |
soared | -0.010 |
blew | -0.010 |
Token | they |
Token ID | 484 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
bul | +0.015 |
spe | +0.014 |
xc | +0.014 |
paramed | +0.014 |
Bel | +0.014 |
Neg logit contributions | |
spaghetti | -0.016 |
bed | -0.014 |
sidelines | -0.014 |
Seek | -0.013 |
menu | -0.013 |
Token | saw |
Token ID | 2497 |
Feature activation | +2.25e-02 |
Pos logit contributions | |
spaghetti | +0.034 |
sidelines | +0.032 |
Seek | +0.030 |
menu | +0.030 |
bed | +0.029 |
Neg logit contributions | |
bul | -0.022 |
spe | -0.021 |
esh | -0.020 |
xc | -0.020 |
paramed | -0.020 |
Token | animals |
Token ID | 4695 |
Feature activation | +7.45e-03 |
Pos logit contributions | |
spaghetti | +0.033 |
sidelines | +0.032 |
Seek | +0.028 |
menu | +0.027 |
bed | +0.027 |
Neg logit contributions | |
bul | -0.035 |
spe | -0.035 |
flew | -0.035 |
Bel | -0.032 |
pol | -0.032 |
Token | on |
Token ID | 319 |
Feature activation | +1.93e-02 |
Pos logit contributions | |
sidelines | +0.014 |
spaghetti | +0.014 |
Seek | +0.013 |
concession | +0.012 |
menu | +0.012 |
Neg logit contributions | |
flew | -0.009 |
bul | -0.008 |
soared | -0.008 |
spe | -0.008 |
blew | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | +3.48e-02 |
Pos logit contributions | |
sidelines | +0.039 |
spaghetti | +0.037 |
Seek | +0.035 |
menu | +0.033 |
Want | +0.033 |
Neg logit contributions | |
flew | -0.021 |
bul | -0.020 |
spe | -0.019 |
soared | -0.018 |
blew | -0.017 |
Token | other |
Token ID | 584 |
Feature activation | +8.13e-02 |
Pos logit contributions | |
Seek | +0.053 |
Want | +0.051 |
spaghetti | +0.051 |
Would | +0.050 |
sidelines | +0.048 |
Neg logit contributions | |
flew | -0.050 |
ostr | -0.049 |
Or | -0.046 |
k | -0.046 |
cker | -0.045 |
Token | side |
Token ID | 1735 |
Feature activation | +2.76e-02 |
Pos logit contributions | |
spaghetti | +0.096 |
sidelines | +0.095 |
Seek | +0.085 |
menu | +0.076 |
Want | +0.073 |
Neg logit contributions | |
flew | -0.154 |
spe | -0.143 |
bul | -0.142 |
Or | -0.140 |
cker | -0.139 |
Token | of |
Token ID | 286 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
sidelines | +0.048 |
spaghetti | +0.047 |
Seek | +0.043 |
menu | +0.040 |
robbers | +0.039 |
Neg logit contributions | |
flew | -0.037 |
spe | -0.037 |
bul | -0.037 |
soared | -0.032 |
cker | -0.031 |
Token | the |
Token ID | 262 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
sidelines | +0.024 |
spaghetti | +0.023 |
Seek | +0.022 |
menu | +0.021 |
Want | +0.020 |
Neg logit contributions | |
flew | -0.012 |
bul | -0.012 |
spe | -0.011 |
rob | -0.010 |
blew | -0.010 |
Token | fence |
Token ID | 13990 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
spaghetti | +0.023 |
sidelines | +0.023 |
Seek | +0.022 |
Want | +0.021 |
Would | +0.020 |
Neg logit contributions | |
flew | -0.022 |
ostr | -0.021 |
spr | -0.021 |
spe | -0.020 |
Or | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
sidelines | +0.024 |
spaghetti | +0.023 |
Seek | +0.022 |
menu | +0.020 |
robbers | +0.020 |
Neg logit contributions | |
flew | -0.015 |
bul | -0.014 |
spe | -0.013 |
soared | -0.012 |
blew | -0.012 |
Token | red |
Token ID | 2266 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
sidelines | +0.006 |
Seek | +0.006 |
spaghetti | +0.005 |
ours | +0.005 |
internet | +0.005 |
Neg logit contributions | |
flew | -0.005 |
bul | -0.004 |
paramed | -0.004 |
ostr | -0.004 |
spr | -0.004 |
Token | ball |
Token ID | 2613 |
Feature activation | +6.22e-04 |
Pos logit contributions | |
bul | +0.017 |
flew | +0.017 |
paramed | +0.015 |
ostr | +0.015 |
pre | +0.015 |
Neg logit contributions | |
sidelines | -0.014 |
Seek | -0.013 |
spaghetti | -0.013 |
ours | -0.012 |
internet | -0.011 |
Token | behind |
Token ID | 2157 |
Feature activation | +3.11e-02 |
Pos logit contributions | |
spaghetti | +0.001 |
sidelines | +0.001 |
Seek | +0.001 |
menu | +0.001 |
bed | +0.001 |
Neg logit contributions | |
bul | -0.001 |
spe | -0.001 |
flew | -0.001 |
Bel | -0.001 |
paramed | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +3.75e-02 |
Pos logit contributions | |
sidelines | +0.055 |
spaghetti | +0.053 |
Seek | +0.050 |
menu | +0.048 |
Want | +0.046 |
Neg logit contributions | |
flew | -0.040 |
bul | -0.038 |
spe | -0.037 |
esh | -0.034 |
soared | -0.034 |
Token | books |
Token ID | 3835 |
Feature activation | +4.72e-02 |
Pos logit contributions | |
sidelines | +0.060 |
unnecessary | +0.054 |
inations | +0.052 |
ours | +0.051 |
elsewhere | +0.051 |
Neg logit contributions | |
zo | -0.046 |
ostr | -0.045 |
aer | -0.044 |
k | -0.043 |
Ev | -0.041 |
Token | he |
Token ID | 258 |
Feature activation | +8.12e-02 |
Pos logit contributions | |
sidelines | +0.088 |
spaghetti | +0.085 |
Seek | +0.081 |
robbers | +0.076 |
Want | +0.073 |
Neg logit contributions | |
flew | -0.059 |
bul | -0.053 |
spe | -0.052 |
blew | -0.049 |
master | -0.048 |
Token | lf |
Token ID | 1652 |
Feature activation | +2.79e-03 |
Pos logit contributions | |
spaghetti | +0.118 |
sidelines | +0.117 |
Seek | +0.103 |
menu | +0.100 |
bed | +0.097 |
Neg logit contributions | |
bul | -0.126 |
flew | -0.126 |
spe | -0.125 |
pol | -0.115 |
Bel | -0.115 |
Token | . |
Token ID | 13 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
spaghetti | +0.005 |
sidelines | +0.005 |
Seek | +0.004 |
menu | +0.004 |
bed | +0.004 |
Neg logit contributions | |
bul | -0.004 |
flew | -0.004 |
spe | -0.004 |
pol | -0.003 |
Bel | -0.003 |
Token | Tom |
Token ID | 4186 |
Feature activation | +2.50e-02 |
Pos logit contributions | |
sidelines | +0.019 |
spaghetti | +0.018 |
Seek | +0.017 |
bed | +0.016 |
ours | +0.015 |
Neg logit contributions | |
flew | -0.017 |
spe | -0.016 |
bul | -0.016 |
paramed | -0.015 |
pol | -0.015 |
Token | tried |
Token ID | 3088 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
spaghetti | +0.037 |
Seek | +0.032 |
bone | +0.031 |
robbers | +0.031 |
mine | +0.031 |
Neg logit contributions | |
bul | -0.042 |
paramed | -0.038 |
spe | -0.038 |
pre | -0.037 |
Bel | -0.036 |
Token | to |
Token ID | 284 |
Feature activation | +2.45e-03 |
Pos logit contributions | |
sidelines | +0.031 |
spaghetti | +0.029 |
Seek | +0.027 |
concession | +0.026 |
menu | +0.026 |
Neg logit contributions | |
flew | -0.017 |
bul | -0.016 |
pol | -0.015 |
spe | -0.014 |
blew | -0.014 |
Token | just |
Token ID | 655 |
Feature activation | +2.95e-02 |
Pos logit contributions | |
sidelines | +0.039 |
spaghetti | +0.039 |
Seek | +0.035 |
menu | +0.033 |
bed | +0.032 |
Neg logit contributions | |
flew | -0.036 |
bul | -0.035 |
spe | -0.035 |
Bel | -0.032 |
soared | -0.032 |
Token | another |
Token ID | 1194 |
Feature activation | -6.37e-03 |
Pos logit contributions | |
sidelines | +0.042 |
spaghetti | +0.042 |
Seek | +0.038 |
menu | +0.035 |
bed | +0.034 |
Neg logit contributions | |
flew | -0.048 |
bul | -0.046 |
spe | -0.046 |
soared | -0.043 |
Bel | -0.042 |
Token | day |
Token ID | 1110 |
Feature activation | -1.74e-03 |
Pos logit contributions | |
flew | +0.010 |
bul | +0.010 |
spe | +0.010 |
Bel | +0.009 |
soared | +0.009 |
Neg logit contributions | |
sidelines | -0.009 |
spaghetti | -0.009 |
Seek | -0.008 |
menu | -0.007 |
ours | -0.007 |
Token | playing |
Token ID | 2712 |
Feature activation | +5.81e-04 |
Pos logit contributions | |
flew | +0.002 |
spe | +0.002 |
bul | +0.002 |
soared | +0.002 |
Or | +0.002 |
Neg logit contributions | |
sidelines | -0.003 |
spaghetti | -0.003 |
Seek | -0.003 |
internet | -0.003 |
ours | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
sidelines | +0.001 |
spaghetti | +0.001 |
Seek | +0.001 |
menu | +0.001 |
ours | +0.001 |
Neg logit contributions | |
flew | -0.001 |
bul | -0.001 |
spe | -0.001 |
soared | -0.001 |
Or | -0.001 |
Token | usual |
Token ID | 6678 |
Feature activation | +8.11e-02 |
Pos logit contributions | |
sidelines | +0.024 |
spaghetti | +0.023 |
Seek | +0.021 |
Want | +0.020 |
bed | +0.020 |
Neg logit contributions | |
flew | -0.029 |
spe | -0.028 |
bul | -0.027 |
soared | -0.027 |
Bel | -0.027 |
Token | game |
Token ID | 983 |
Feature activation | -6.00e-03 |
Pos logit contributions | |
sidelines | +0.112 |
spaghetti | +0.111 |
Seek | +0.099 |
menu | +0.093 |
ours | +0.091 |
Neg logit contributions | |
flew | -0.131 |
bul | -0.129 |
spe | -0.129 |
soared | -0.119 |
Bel | -0.118 |
Token | , |
Token ID | 11 |
Feature activation | -6.75e-03 |
Pos logit contributions | |
bul | +0.009 |
flew | +0.009 |
spe | +0.009 |
paramed | +0.008 |
Bel | +0.008 |
Neg logit contributions | |
spaghetti | -0.009 |
sidelines | -0.009 |
Seek | -0.008 |
menu | -0.008 |
bed | -0.008 |
Token | but |
Token ID | 475 |
Feature activation | +8.39e-03 |
Pos logit contributions | |
flew | +0.012 |
spe | +0.011 |
bul | +0.011 |
Or | +0.011 |
soared | +0.011 |
Neg logit contributions | |
spaghetti | -0.009 |
sidelines | -0.009 |
Seek | -0.008 |
menu | -0.007 |
bed | -0.007 |
Token | to |
Token ID | 284 |
Feature activation | +6.46e-03 |
Pos logit contributions | |
spaghetti | +0.013 |
sidelines | +0.013 |
Seek | +0.012 |
menu | +0.011 |
bed | +0.011 |
Neg logit contributions | |
flew | -0.012 |
bul | -0.012 |
spe | -0.012 |
soared | -0.011 |
Bel | -0.011 |
Token | his |
Token ID | 465 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
spaghetti | +0.010 |
sidelines | +0.010 |
Seek | +0.009 |
menu | +0.008 |
bed | +0.008 |
Neg logit contributions | |
bul | -0.010 |
flew | -0.010 |
spe | -0.010 |
pre | -0.009 |
pol | -0.009 |
Token | delicate |
Token ID | 19217 |
Feature activation | +1.37e-02 |
Pos logit contributions | |
sidelines | +0.041 |
spaghetti | +0.039 |
Seek | +0.038 |
ours | +0.036 |
Want | +0.034 |
Neg logit contributions | |
flew | -0.033 |
bul | -0.032 |
rob | -0.031 |
spe | -0.030 |
paramed | -0.030 |
Token | banana |
Token ID | 25996 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
sidelines | +0.023 |
spaghetti | +0.022 |
Seek | +0.022 |
ours | +0.019 |
robbers | +0.019 |
Neg logit contributions | |
flew | -0.019 |
bul | -0.019 |
spe | -0.017 |
rob | -0.017 |
paramed | -0.017 |
Token | tree |
Token ID | 5509 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
sidelines | +0.017 |
spaghetti | +0.016 |
Seek | +0.015 |
ours | +0.014 |
menu | +0.014 |
Neg logit contributions | |
flew | -0.015 |
bul | -0.014 |
soared | -0.013 |
spe | -0.013 |
blew | -0.012 |
Token | on |
Token ID | 319 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
sidelines | +0.036 |
spaghetti | +0.035 |
Seek | +0.032 |
menu | +0.030 |
robbers | +0.030 |
Neg logit contributions | |
flew | -0.029 |
bul | -0.028 |
spe | -0.027 |
soared | -0.025 |
pol | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | +3.49e-02 |
Pos logit contributions | |
spaghetti | +0.032 |
sidelines | +0.030 |
bed | +0.028 |
menu | +0.027 |
Seek | +0.025 |
Neg logit contributions | |
spe | -0.035 |
bul | -0.034 |
flew | -0.033 |
pre | -0.032 |
paramed | -0.032 |
Token | other |
Token ID | 584 |
Feature activation | +8.09e-02 |
Pos logit contributions | |
spaghetti | +0.045 |
sidelines | +0.042 |
Seek | +0.042 |
Want | +0.039 |
robbers | +0.035 |
Neg logit contributions | |
flew | -0.059 |
ostr | -0.057 |
rob | -0.056 |
bul | -0.055 |
spr | -0.053 |
Token | side |
Token ID | 1735 |
Feature activation | +2.99e-02 |
Pos logit contributions | |
sidelines | +0.094 |
spaghetti | +0.092 |
Seek | +0.082 |
ours | +0.073 |
menu | +0.072 |
Neg logit contributions | |
flew | -0.151 |
bul | -0.143 |
spe | -0.140 |
ostr | -0.139 |
rob | -0.139 |
Token | of |
Token ID | 286 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
sidelines | +0.047 |
spaghetti | +0.047 |
Seek | +0.042 |
menu | +0.041 |
robbers | +0.039 |
Neg logit contributions | |
flew | -0.044 |
bul | -0.043 |
spe | -0.043 |
soared | -0.038 |
pol | -0.038 |
Token | the |
Token ID | 262 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
sidelines | +0.024 |
spaghetti | +0.024 |
Seek | +0.022 |
menu | +0.021 |
Want | +0.021 |
Neg logit contributions | |
flew | -0.016 |
bul | -0.016 |
spe | -0.015 |
Bel | -0.014 |
soared | -0.014 |
Token | path |
Token ID | 3108 |
Feature activation | +9.00e-03 |
Pos logit contributions | |
spaghetti | +0.024 |
sidelines | +0.024 |
Seek | +0.022 |
ours | +0.021 |
Want | +0.021 |
Neg logit contributions | |
flew | -0.021 |
rob | -0.020 |
ostr | -0.020 |
bul | -0.019 |
spe | -0.019 |
Token | . |
Token ID | 13 |
Feature activation | +3.24e-03 |
Pos logit contributions | |
spaghetti | +0.016 |
sidelines | +0.016 |
Seek | +0.015 |
menu | +0.014 |
robbers | +0.014 |
Neg logit contributions | |
flew | -0.011 |
spe | -0.011 |
bul | -0.011 |
soared | -0.010 |
pol | -0.009 |
Token | problem |
Token ID | 1917 |
Feature activation | -2.82e-02 |
Pos logit contributions | |
bul | +0.032 |
flew | +0.032 |
spe | +0.032 |
Bel | +0.029 |
pol | +0.029 |
Neg logit contributions | |
spaghetti | -0.024 |
sidelines | -0.023 |
Seek | -0.020 |
menu | -0.019 |
bed | -0.019 |
Token | . |
Token ID | 13 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
spe | +0.036 |
bul | +0.036 |
flew | +0.035 |
Or | +0.031 |
pol | +0.031 |
Neg logit contributions | |
sidelines | -0.050 |
spaghetti | -0.049 |
Seek | -0.043 |
menu | -0.043 |
Want | -0.041 |
Token | He |
Token ID | 679 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
bul | +0.020 |
flew | +0.020 |
spe | +0.019 |
pre | +0.018 |
pol | +0.018 |
Neg logit contributions | |
spaghetti | -0.017 |
sidelines | -0.017 |
Seek | -0.015 |
menu | -0.014 |
bed | -0.014 |
Token | ate |
Token ID | 15063 |
Feature activation | +3.51e-02 |
Pos logit contributions | |
bul | +0.015 |
paramed | +0.015 |
pre | +0.015 |
xc | +0.014 |
hon | +0.014 |
Neg logit contributions | |
spaghetti | -0.016 |
sidelines | -0.014 |
Seek | -0.014 |
mine | -0.014 |
bed | -0.013 |
Token | the |
Token ID | 262 |
Feature activation | +6.71e-03 |
Pos logit contributions | |
sidelines | +0.061 |
Seek | +0.056 |
spaghetti | +0.055 |
robbers | +0.052 |
Want | +0.052 |
Neg logit contributions | |
flew | -0.045 |
bul | -0.043 |
spe | -0.041 |
Or | -0.038 |
soared | -0.038 |
Token | rest |
Token ID | 1334 |
Feature activation | +8.06e-02 |
Pos logit contributions | |
sidelines | +0.008 |
spaghetti | +0.008 |
Seek | +0.007 |
robbers | +0.007 |
ours | +0.007 |
Neg logit contributions | |
bul | -0.012 |
flew | -0.012 |
spe | -0.011 |
pre | -0.011 |
pol | -0.011 |
Token | of |
Token ID | 286 |
Feature activation | -8.67e-03 |
Pos logit contributions | |
sidelines | +0.124 |
spaghetti | +0.122 |
Seek | +0.110 |
menu | +0.106 |
bed | +0.102 |
Neg logit contributions | |
bul | -0.120 |
flew | -0.119 |
spe | -0.117 |
pre | -0.107 |
soared | -0.106 |
Token | his |
Token ID | 465 |
Feature activation | -8.21e-03 |
Pos logit contributions | |
flew | +0.010 |
bul | +0.010 |
spe | +0.010 |
pol | +0.009 |
soared | +0.009 |
Neg logit contributions | |
sidelines | -0.016 |
spaghetti | -0.016 |
Seek | -0.014 |
menu | -0.014 |
internet | -0.013 |
Token | cookie |
Token ID | 19751 |
Feature activation | +4.02e-03 |
Pos logit contributions | |
flew | +0.014 |
bul | +0.014 |
spe | +0.014 |
pre | +0.013 |
pol | +0.013 |
Neg logit contributions | |
sidelines | -0.010 |
spaghetti | -0.010 |
Seek | -0.009 |
menu | -0.008 |
ours | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | -4.13e-03 |
Pos logit contributions | |
sidelines | +0.007 |
spaghetti | +0.006 |
Seek | +0.006 |
menu | +0.006 |
Want | +0.005 |
Neg logit contributions | |
flew | -0.006 |
bul | -0.006 |
spe | -0.005 |
soared | -0.005 |
pol | -0.005 |
Token | went |
Token ID | 1816 |
Feature activation | -2.91e-02 |
Pos logit contributions | |
bul | +0.005 |
spe | +0.005 |
paramed | +0.005 |
flew | +0.005 |
pre | +0.004 |
Neg logit contributions | |
spaghetti | -0.008 |
sidelines | -0.007 |
Seek | -0.007 |
bed | -0.007 |
menu | -0.006 |
Token | The |
Token ID | 383 |
Feature activation | +9.63e-03 |
Pos logit contributions | |
sidelines | +0.026 |
spaghetti | +0.024 |
internet | +0.023 |
Seek | +0.022 |
ours | +0.022 |
Neg logit contributions | |
flew | -0.015 |
paramed | -0.012 |
hon | -0.012 |
Spr | -0.012 |
walked | -0.012 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
sidelines | +0.018 |
spaghetti | +0.018 |
Seek | +0.017 |
hunting | +0.017 |
concession | +0.017 |
Neg logit contributions | |
flew | -0.011 |
blew | -0.009 |
k | -0.009 |
soared | -0.009 |
went | -0.008 |
Token | was |
Token ID | 373 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
spaghetti | +0.018 |
sidelines | +0.017 |
mine | +0.016 |
bone | +0.015 |
bed | +0.015 |
Neg logit contributions | |
spe | -0.016 |
bul | -0.016 |
paramed | -0.015 |
xc | -0.015 |
Ale | -0.015 |
Token | on |
Token ID | 319 |
Feature activation | +2.34e-02 |
Pos logit contributions | |
sidelines | +0.026 |
spaghetti | +0.025 |
Seek | +0.023 |
menu | +0.022 |
concession | +0.021 |
Neg logit contributions | |
flew | -0.025 |
bul | -0.022 |
blew | -0.021 |
spe | -0.021 |
pol | -0.021 |
Token | the |
Token ID | 262 |
Feature activation | +3.35e-02 |
Pos logit contributions | |
spaghetti | +0.039 |
sidelines | +0.039 |
Seek | +0.035 |
menu | +0.034 |
bed | +0.033 |
Neg logit contributions | |
bul | -0.031 |
flew | -0.031 |
spe | -0.031 |
Bel | -0.028 |
pol | -0.028 |
Token | other |
Token ID | 584 |
Feature activation | +8.05e-02 |
Pos logit contributions | |
Want | +0.048 |
Seek | +0.048 |
spaghetti | +0.048 |
Would | +0.048 |
oring | +0.045 |
Neg logit contributions | |
flew | -0.045 |
ostr | -0.044 |
k | -0.042 |
Or | -0.040 |
blew | -0.040 |
Token | side |
Token ID | 1735 |
Feature activation | +2.91e-02 |
Pos logit contributions | |
sidelines | +0.105 |
spaghetti | +0.103 |
Seek | +0.098 |
menu | +0.093 |
jar | +0.092 |
Neg logit contributions | |
flew | -0.127 |
ostr | -0.119 |
Or | -0.114 |
rob | -0.114 |
went | -0.113 |
Token | of |
Token ID | 286 |
Feature activation | +1.73e-02 |
Pos logit contributions | |
sidelines | +0.058 |
spaghetti | +0.053 |
Seek | +0.050 |
menu | +0.050 |
concession | +0.049 |
Neg logit contributions | |
flew | -0.034 |
spe | -0.032 |
bul | -0.032 |
cker | -0.027 |
mill | -0.027 |
Token | the |
Token ID | 262 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
sidelines | +0.035 |
Seek | +0.033 |
spaghetti | +0.032 |
Want | +0.031 |
menu | +0.031 |
Neg logit contributions | |
flew | -0.018 |
bul | -0.017 |
blew | -0.015 |
soared | -0.014 |
rob | -0.014 |
Token | fence |
Token ID | 13990 |
Feature activation | +1.57e-02 |
Pos logit contributions | |
spaghetti | +0.027 |
sidelines | +0.027 |
Seek | +0.026 |
ocket | +0.026 |
Want | +0.026 |
Neg logit contributions | |
flew | -0.020 |
k | -0.019 |
went | -0.019 |
ostr | -0.019 |
blew | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +9.02e-03 |
Pos logit contributions | |
sidelines | +0.035 |
spaghetti | +0.033 |
Seek | +0.033 |
robbers | +0.031 |
concession | +0.031 |
Neg logit contributions | |
flew | -0.016 |
soared | -0.012 |
bul | -0.011 |
spr | -0.011 |
blew | -0.011 |
Token | He |
Token ID | 679 |
Feature activation | -2.85e-03 |
Pos logit contributions | |
sidelines | +0.013 |
spaghetti | +0.012 |
Seek | +0.011 |
menu | +0.011 |
bed | +0.010 |
Neg logit contributions | |
spe | -0.010 |
bul | -0.010 |
flew | -0.010 |
paramed | -0.010 |
Bel | -0.010 |
Token | made |
Token ID | 925 |
Feature activation | +4.76e-03 |
Pos logit contributions | |
bul | +0.004 |
esh | +0.004 |
xc | +0.004 |
spe | +0.004 |
paramed | +0.004 |
Neg logit contributions | |
spaghetti | -0.004 |
bone | -0.004 |
bones | -0.004 |
mine | -0.004 |
menu | -0.003 |
Token | faces |
Token ID | 6698 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
sidelines | +0.007 |
spaghetti | +0.007 |
Seek | +0.007 |
menu | +0.006 |
bed | +0.006 |
Neg logit contributions | |
flew | -0.007 |
bul | -0.007 |
spe | -0.007 |
pol | -0.006 |
paramed | -0.006 |
Token | at |
Token ID | 379 |
Feature activation | -1.49e-02 |
Pos logit contributions | |
spaghetti | +0.036 |
sidelines | +0.035 |
Seek | +0.030 |
menu | +0.030 |
bed | +0.030 |
Neg logit contributions | |
bul | -0.042 |
spe | -0.042 |
flew | -0.042 |
xc | -0.040 |
Bel | -0.040 |
Token | the |
Token ID | 262 |
Feature activation | +3.00e-02 |
Pos logit contributions | |
flew | +0.015 |
bul | +0.014 |
spe | +0.014 |
blew | +0.012 |
mill | +0.012 |
Neg logit contributions | |
sidelines | -0.030 |
Seek | -0.029 |
spaghetti | -0.028 |
Want | -0.026 |
menu | -0.026 |
Token | other |
Token ID | 584 |
Feature activation | +8.04e-02 |
Pos logit contributions | |
Seek | +0.047 |
sidelines | +0.047 |
spaghetti | +0.047 |
Want | +0.043 |
robbers | +0.042 |
Neg logit contributions | |
flew | -0.042 |
bul | -0.039 |
blew | -0.039 |
spe | -0.038 |
pre | -0.038 |
Token | kids |
Token ID | 3988 |
Feature activation | +2.67e-02 |
Pos logit contributions | |
sidelines | +0.137 |
spaghetti | +0.129 |
Seek | +0.124 |
Want | +0.115 |
menu | +0.115 |
Neg logit contributions | |
flew | -0.112 |
spe | -0.105 |
bul | -0.103 |
pre | -0.100 |
blew | -0.099 |
Token | and |
Token ID | 290 |
Feature activation | -9.08e-03 |
Pos logit contributions | |
sidelines | +0.046 |
spaghetti | +0.046 |
Seek | +0.042 |
menu | +0.040 |
Want | +0.039 |
Neg logit contributions | |
flew | -0.035 |
spe | -0.034 |
bul | -0.033 |
soared | -0.030 |
hon | -0.029 |
Token | said |
Token ID | 531 |
Feature activation | +8.73e-03 |
Pos logit contributions | |
bul | +0.012 |
esh | +0.012 |
xc | +0.012 |
spe | +0.012 |
Bel | +0.011 |
Neg logit contributions | |
spaghetti | -0.016 |
sidelines | -0.015 |
bed | -0.014 |
robbers | -0.013 |
Seek | -0.013 |
Token | , |
Token ID | 11 |
Feature activation | +1.07e-03 |
Pos logit contributions | |
spaghetti | +0.012 |
sidelines | +0.010 |
mine | +0.010 |
menu | +0.010 |
bed | +0.009 |
Neg logit contributions | |
bul | -0.015 |
spe | -0.014 |
Bel | -0.014 |
flew | -0.014 |
cker | -0.014 |
Token | " |
Token ID | 366 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
spaghetti | +0.001 |
sidelines | +0.001 |
Seek | +0.001 |
menu | +0.001 |
bed | +0.001 |
Neg logit contributions | |
bul | -0.002 |
flew | -0.002 |
spe | -0.002 |
paramed | -0.002 |
Bel | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -7.31e-03 |
Pos logit contributions | |
bul | +0.012 |
flew | +0.011 |
spe | +0.011 |
pol | +0.010 |
Bel | +0.010 |
Neg logit contributions | |
spaghetti | -0.011 |
sidelines | -0.010 |
Seek | -0.009 |
menu | -0.009 |
bed | -0.009 |
Token | Andy |
Token ID | 35314 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
spe | +0.011 |
bul | +0.011 |
pre | +0.010 |
flew | +0.010 |
pol | +0.010 |
Neg logit contributions | |
spaghetti | -0.011 |
sidelines | -0.010 |
Seek | -0.010 |
Want | -0.009 |
bed | -0.009 |
Token | looked |
Token ID | 3114 |
Feature activation | +3.61e-03 |
Pos logit contributions | |
pre | +0.018 |
bul | +0.018 |
paramed | +0.017 |
Or | +0.017 |
xc | +0.017 |
Neg logit contributions | |
spaghetti | -0.016 |
sidelines | -0.014 |
Seek | -0.013 |
mine | -0.013 |
bed | -0.013 |
Token | at |
Token ID | 379 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
sidelines | +0.006 |
spaghetti | +0.006 |
Seek | +0.005 |
menu | +0.005 |
bed | +0.005 |
Neg logit contributions | |
flew | -0.005 |
bul | -0.005 |
spe | -0.005 |
Bel | -0.004 |
pol | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +8.25e-03 |
Pos logit contributions | |
spe | +0.038 |
bul | +0.038 |
flew | +0.038 |
paramed | +0.035 |
pre | +0.035 |
Neg logit contributions | |
spaghetti | -0.043 |
sidelines | -0.042 |
Seek | -0.037 |
bed | -0.037 |
menu | -0.036 |
Token | freshly |
Token ID | 29026 |
Feature activation | +8.04e-02 |
Pos logit contributions | |
Seek | +0.013 |
sidelines | +0.013 |
robbers | +0.012 |
Want | +0.011 |
spaghetti | +0.011 |
Neg logit contributions | |
bul | -0.012 |
flew | -0.012 |
blew | -0.012 |
pre | -0.011 |
spr | -0.011 |
Token | printed |
Token ID | 10398 |
Feature activation | -1.01e-03 |
Pos logit contributions | |
spaghetti | +0.155 |
sidelines | +0.145 |
menu | +0.136 |
Seek | +0.134 |
bed | +0.130 |
Neg logit contributions | |
spe | -0.090 |
bul | -0.086 |
flew | -0.077 |
paramed | -0.076 |
xc | -0.075 |
Token | picture |
Token ID | 4286 |
Feature activation | -3.06e-03 |
Pos logit contributions | |
bul | +0.002 |
flew | +0.002 |
spe | +0.002 |
Bel | +0.001 |
pol | +0.001 |
Neg logit contributions | |
spaghetti | -0.001 |
sidelines | -0.001 |
menu | -0.001 |
bed | -0.001 |
Seek | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | -5.11e-03 |
Pos logit contributions | |
bul | +0.004 |
flew | +0.004 |
spe | +0.004 |
pol | +0.004 |
soared | +0.004 |
Neg logit contributions | |
sidelines | -0.005 |
spaghetti | -0.005 |
Seek | -0.004 |
menu | -0.004 |
robbers | -0.004 |
Token | smiled |
Token ID | 13541 |
Feature activation | -9.43e-03 |
Pos logit contributions | |
bul | +0.006 |
spe | +0.006 |
flew | +0.006 |
paramed | +0.006 |
pre | +0.006 |
Neg logit contributions | |
spaghetti | -0.009 |
sidelines | -0.009 |
Seek | -0.008 |
bed | -0.008 |
menu | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
bul | +0.016 |
flew | +0.016 |
spe | +0.016 |
soared | +0.015 |
paramed | +0.015 |
Neg logit contributions | |
spaghetti | -0.013 |
sidelines | -0.011 |
bed | -0.010 |
menu | -0.010 |
safe | -0.010 |
Token | and |
Token ID | 290 |
Feature activation | +5.60e-03 |
Pos logit contributions | |
spe | +0.067 |
paramed | +0.066 |
bul | +0.065 |
xc | +0.064 |
esh | +0.063 |
Neg logit contributions | |
spaghetti | -0.045 |
sidelines | -0.037 |
menu | -0.036 |
bed | -0.036 |
Seek | -0.035 |
Token | circles |
Token ID | 13332 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
spaghetti | +0.009 |
sidelines | +0.008 |
Seek | +0.007 |
bed | +0.007 |
robbers | +0.007 |
Neg logit contributions | |
spe | -0.009 |
paramed | -0.009 |
bul | -0.009 |
pre | -0.009 |
xc | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +2.05e-03 |
Pos logit contributions | |
spe | +0.047 |
bul | +0.046 |
paramed | +0.045 |
xc | +0.044 |
flew | +0.044 |
Neg logit contributions | |
spaghetti | -0.035 |
sidelines | -0.032 |
bed | -0.028 |
menu | -0.028 |
Seek | -0.028 |
Token | triangles |
Token ID | 44360 |
Feature activation | -8.06e-02 |
Pos logit contributions | |
spaghetti | +0.003 |
sidelines | +0.003 |
Seek | +0.003 |
bed | +0.003 |
robbers | +0.002 |
Neg logit contributions | |
spe | -0.003 |
xc | -0.003 |
bul | -0.003 |
paramed | -0.003 |
pre | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | -4.40e-03 |
Pos logit contributions | |
paramed | +0.160 |
spe | +0.157 |
xc | +0.154 |
bul | +0.151 |
esh | +0.147 |
Neg logit contributions | |
spaghetti | -0.091 |
bed | -0.074 |
chess | -0.070 |
sidelines | -0.069 |
menu | -0.068 |
Token | rect |
Token ID | 13621 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
spe | +0.007 |
xc | +0.007 |
bul | +0.007 |
paramed | +0.007 |
Bel | +0.007 |
Neg logit contributions | |
spaghetti | -0.006 |
sidelines | -0.006 |
bed | -0.005 |
Seek | -0.005 |
menu | -0.005 |
Token | angles |
Token ID | 27787 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
paramed | +0.265 |
rob | +0.251 |
bul | +0.247 |
spe | +0.240 |
ostr | +0.233 |
Neg logit contributions | |
spaghetti | -0.136 |
ours | -0.117 |
mine | -0.102 |
menu | -0.101 |
Seek | -0.093 |
Token | . |
Token ID | 13 |
Feature activation | -3.98e-03 |
Pos logit contributions | |
xc | +0.036 |
spe | +0.035 |
paramed | +0.034 |
Bel | +0.033 |
esh | +0.033 |
Neg logit contributions | |
spaghetti | -0.019 |
bed | -0.017 |
sidelines | -0.015 |
anywhere | -0.015 |
before | -0.015 |
Token | She |
Token ID | 1375 |
Feature activation | -7.67e-03 |
Pos logit contributions | |
bul | +0.006 |
flew | +0.006 |
spe | +0.006 |
soared | +0.006 |
cker | +0.005 |
Neg logit contributions | |
spaghetti | -0.006 |
sidelines | -0.006 |
Seek | -0.005 |
bed | -0.005 |
menu | -0.005 |
Token | made |
Token ID | 925 |
Feature activation | -5.61e-03 |
Pos logit contributions | |
paramed | +0.013 |
esh | +0.013 |
xc | +0.012 |
Bel | +0.012 |
Sher | +0.012 |
Neg logit contributions | |
spaghetti | -0.011 |
chess | -0.009 |
Seek | -0.009 |
table | -0.008 |
bed | -0.008 |
Token | her |
Token ID | 607 |
Feature activation | +7.22e-03 |
Pos logit contributions | |
bul | +0.010 |
spe | +0.010 |
paramed | +0.010 |
pre | +0.010 |
flew | +0.010 |
Neg logit contributions | |
spaghetti | -0.007 |
sidelines | -0.007 |
bed | -0.006 |
menu | -0.006 |
Seek | -0.006 |
Token | circles |
Token ID | 13332 |
Feature activation | +2.97e-03 |
Pos logit contributions | |
spaghetti | +0.018 |
sidelines | +0.017 |
Seek | +0.015 |
menu | +0.015 |
bed | +0.014 |
Neg logit contributions | |
bul | -0.018 |
spe | -0.018 |
flew | -0.018 |
paramed | -0.016 |
pol | -0.016 |
Token | , |
Token ID | 11 |
Feature activation | +9.00e-03 |
Pos logit contributions | |
spaghetti | +0.004 |
sidelines | +0.004 |
Seek | +0.004 |
menu | +0.004 |
bed | +0.004 |
Neg logit contributions | |
spe | -0.005 |
bul | -0.005 |
flew | -0.004 |
paramed | -0.004 |
pre | -0.004 |
Token | triangles |
Token ID | 44360 |
Feature activation | -4.12e-02 |
Pos logit contributions | |
spaghetti | +0.013 |
sidelines | +0.012 |
menu | +0.011 |
Seek | +0.011 |
bed | +0.010 |
Neg logit contributions | |
spe | -0.015 |
bul | -0.015 |
flew | -0.014 |
paramed | -0.014 |
pol | -0.014 |
Token | , |
Token ID | 11 |
Feature activation | +7.65e-03 |
Pos logit contributions | |
spe | +0.069 |
bul | +0.069 |
paramed | +0.067 |
xc | +0.065 |
pol | +0.064 |
Neg logit contributions | |
spaghetti | -0.057 |
sidelines | -0.050 |
bed | -0.048 |
menu | -0.047 |
Seek | -0.046 |
Token | and |
Token ID | 290 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
spaghetti | +0.010 |
sidelines | +0.010 |
menu | +0.008 |
bed | +0.008 |
Seek | +0.008 |
Neg logit contributions | |
spe | -0.013 |
bul | -0.013 |
paramed | -0.013 |
pol | -0.012 |
xc | -0.012 |
Token | rect |
Token ID | 13621 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
spaghetti | +0.019 |
sidelines | +0.018 |
Seek | +0.016 |
menu | +0.016 |
bed | +0.016 |
Neg logit contributions | |
bul | -0.016 |
spe | -0.016 |
flew | -0.016 |
paramed | -0.015 |
pre | -0.015 |
Token | angles |
Token ID | 27787 |
Feature activation | -4.31e-03 |
Pos logit contributions | |
paramed | +0.235 |
bul | +0.222 |
rob | +0.216 |
slit | +0.213 |
spe | +0.207 |
Neg logit contributions | |
spaghetti | -0.110 |
ours | -0.099 |
mine | -0.090 |
menu | -0.079 |
chess | -0.074 |
Token | ! |
Token ID | 0 |
Feature activation | -3.27e-03 |
Pos logit contributions | |
spe | +0.008 |
paramed | +0.008 |
xc | +0.008 |
bul | +0.007 |
esh | +0.007 |
Neg logit contributions | |
spaghetti | -0.005 |
sidelines | -0.005 |
bed | -0.005 |
anywhere | -0.004 |
menu | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +3.74e-03 |
Pos logit contributions | |
bul | +0.005 |
flew | +0.005 |
spe | +0.005 |
soared | +0.004 |
paramed | +0.004 |
Neg logit contributions | |
spaghetti | -0.005 |
sidelines | -0.005 |
Seek | -0.004 |
menu | -0.004 |
bed | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +7.23e-03 |
Pos logit contributions | |
spaghetti | +0.005 |
sidelines | +0.005 |
Seek | +0.005 |
menu | +0.005 |
bed | +0.005 |
Neg logit contributions | |
bul | -0.006 |
flew | -0.006 |
spe | -0.006 |
pre | -0.005 |
paramed | -0.005 |
Token | One |
Token ID | 3198 |
Feature activation | +4.36e-03 |
Pos logit contributions | |
spaghetti | +0.009 |
sidelines | +0.009 |
Seek | +0.008 |
Want | +0.007 |
menu | +0.007 |
Neg logit contributions | |
bul | -0.013 |
spe | -0.012 |
pre | -0.012 |
flew | -0.012 |
xc | -0.012 |
Token | |
Token ID | 220 |
Feature activation | -2.12e-03 |
Pos logit contributions | |
bul | +0.060 |
flew | +0.059 |
spe | +0.059 |
Bel | +0.055 |
pre | +0.055 |
Neg logit contributions | |
spaghetti | -0.046 |
sidelines | -0.045 |
Seek | -0.039 |
menu | -0.038 |
bed | -0.037 |
Token |
|
Token ID | 198 |
Feature activation | -2.43e-02 |
Pos logit contributions | |
bul | +0.003 |
flew | +0.003 |
spe | +0.003 |
paramed | +0.003 |
soared | +0.003 |
Neg logit contributions | |
spaghetti | -0.003 |
sidelines | -0.003 |
Seek | -0.003 |
menu | -0.002 |
bed | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
bul | +0.041 |
flew | +0.039 |
spe | +0.039 |
pre | +0.038 |
pol | +0.037 |
Neg logit contributions | |
spaghetti | -0.033 |
sidelines | -0.033 |
Seek | -0.029 |
bed | -0.028 |
Want | -0.027 |
Token | The |
Token ID | 464 |
Feature activation | -1.79e-02 |
Pos logit contributions | |
bul | +0.028 |
flew | +0.026 |
pre | +0.025 |
spe | +0.024 |
pol | +0.024 |
Neg logit contributions | |
sidelines | -0.029 |
spaghetti | -0.028 |
Seek | -0.027 |
robbers | -0.024 |
Want | -0.024 |
Token | town |
Token ID | 3240 |
Feature activation | +4.44e-04 |
Pos logit contributions | |
bul | +0.027 |
flew | +0.027 |
spe | +0.026 |
paramed | +0.024 |
Bel | +0.024 |
Neg logit contributions | |
spaghetti | -0.027 |
sidelines | -0.027 |
Seek | -0.024 |
menu | -0.023 |
bed | -0.023 |
Token | spe |
Token ID | 4125 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
sidelines | +0.001 |
spaghetti | +0.001 |
Seek | +0.001 |
menu | +0.001 |
mine | +0.001 |
Neg logit contributions | |
bul | -0.000 |
Bel | -0.000 |
esh | -0.000 |
pre | -0.000 |
Sher | -0.000 |
Token | ople |
Token ID | 643 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
Sab | +0.164 |
paramed | +0.160 |
Bel | +0.160 |
bul | +0.159 |
Sher | +0.156 |
Neg logit contributions | |
sidelines | -0.143 |
mine | -0.121 |
Seek | -0.119 |
spaghetti | -0.115 |
ours | -0.107 |
Token | had |
Token ID | 550 |
Feature activation | -6.64e-03 |
Pos logit contributions | |
bul | +0.015 |
pre | +0.014 |
pol | +0.014 |
paramed | +0.014 |
Bel | +0.014 |
Neg logit contributions | |
sidelines | -0.016 |
spaghetti | -0.015 |
Seek | -0.014 |
menu | -0.014 |
bed | -0.014 |
Token | to |
Token ID | 284 |
Feature activation | -2.28e-03 |
Pos logit contributions | |
bul | +0.011 |
pre | +0.010 |
flew | +0.010 |
spe | +0.010 |
pol | +0.010 |
Neg logit contributions | |
spaghetti | -0.009 |
sidelines | -0.009 |
Seek | -0.008 |
menu | -0.008 |
bed | -0.008 |
Token | find |
Token ID | 1064 |
Feature activation | +8.52e-03 |
Pos logit contributions | |
bul | +0.004 |
pre | +0.004 |
spe | +0.004 |
flew | +0.004 |
pol | +0.004 |
Neg logit contributions | |
sidelines | -0.003 |
spaghetti | -0.003 |
bed | -0.003 |
Seek | -0.002 |
mine | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
sidelines | +0.014 |
spaghetti | +0.014 |
Seek | +0.012 |
menu | +0.012 |
bed | +0.011 |
Neg logit contributions | |
bul | -0.012 |
flew | -0.012 |
spe | -0.012 |
paramed | -0.011 |
Bel | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | -5.23e-03 |
Pos logit contributions | |
flew | +0.012 |
bul | +0.012 |
spe | +0.012 |
soared | +0.011 |
Bel | +0.011 |
Neg logit contributions | |
spaghetti | -0.014 |
sidelines | -0.013 |
Seek | -0.012 |
menu | -0.012 |
bed | -0.011 |
Token | be |
Token ID | 307 |
Feature activation | -1.84e-02 |
Pos logit contributions | |
flew | +0.008 |
bul | +0.008 |
spe | +0.008 |
soared | +0.007 |
Bel | +0.007 |
Neg logit contributions | |
spaghetti | -0.008 |
sidelines | -0.008 |
Seek | -0.007 |
menu | -0.006 |
bed | -0.006 |
Token | as |
Token ID | 355 |
Feature activation | -2.85e-02 |
Pos logit contributions | |
bul | +0.032 |
spe | +0.031 |
flew | +0.031 |
pre | +0.029 |
paramed | +0.029 |
Neg logit contributions | |
spaghetti | -0.024 |
sidelines | -0.024 |
Seek | -0.021 |
menu | -0.020 |
bed | -0.020 |
Token | intelligent |
Token ID | 12661 |
Feature activation | -6.52e-02 |
Pos logit contributions | |
flew | +0.046 |
bul | +0.044 |
spe | +0.044 |
soared | +0.040 |
pol | +0.040 |
Neg logit contributions | |
sidelines | -0.045 |
spaghetti | -0.041 |
menu | -0.036 |
Seek | -0.036 |
café | -0.035 |
Token | as |
Token ID | 355 |
Feature activation | -4.62e-02 |
Pos logit contributions | |
flew | +0.093 |
bul | +0.092 |
spe | +0.090 |
soared | +0.083 |
Bel | +0.082 |
Neg logit contributions | |
spaghetti | -0.103 |
sidelines | -0.103 |
Seek | -0.091 |
menu | -0.089 |
bed | -0.087 |
Token | possible |
Token ID | 1744 |
Feature activation | -9.87e-02 |
Pos logit contributions | |
flew | +0.081 |
bul | +0.075 |
spe | +0.073 |
soared | +0.072 |
Bel | +0.070 |
Neg logit contributions | |
sidelines | -0.066 |
spaghetti | -0.062 |
menu | -0.054 |
Seek | -0.052 |
café | -0.050 |
Token | ! |
Token ID | 0 |
Feature activation | -2.03e-02 |
Pos logit contributions | |
flew | +0.134 |
bul | +0.131 |
spe | +0.128 |
soared | +0.119 |
Bel | +0.118 |
Neg logit contributions | |
sidelines | -0.166 |
spaghetti | -0.165 |
Seek | -0.146 |
menu | -0.143 |
bed | -0.139 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +2.70e-02 |
Pos logit contributions | |
flew | +0.031 |
bul | +0.031 |
spe | +0.030 |
soared | +0.028 |
pre | +0.028 |
Neg logit contributions | |
spaghetti | -0.030 |
sidelines | -0.029 |
Seek | -0.026 |
menu | -0.025 |
bed | -0.025 |
Token | Once |
Token ID | 7454 |
Feature activation | -2.78e-02 |
Pos logit contributions | |
sidelines | +0.055 |
spaghetti | +0.052 |
ours | +0.048 |
Seek | +0.048 |
mine | +0.047 |
Neg logit contributions | |
flew | -0.029 |
bul | -0.027 |
spe | -0.026 |
Bel | -0.024 |
Sher | -0.024 |
Token | upon |
Token ID | 2402 |
Feature activation | +1.92e-03 |
Pos logit contributions | |
bul | +0.059 |
flew | +0.058 |
spe | +0.057 |
paramed | +0.056 |
pre | +0.055 |
Neg logit contributions | |
spaghetti | -0.025 |
sidelines | -0.023 |
bed | -0.020 |
Seek | -0.019 |
menu | -0.019 |
Token | a |
Token ID | 257 |
Feature activation | -5.37e-03 |
Pos logit contributions | |
sidelines | +0.004 |
Seek | +0.003 |
spaghetti | +0.003 |
menu | +0.003 |
internet | +0.003 |
Neg logit contributions | |
flew | -0.002 |
soared | -0.002 |
Bel | -0.002 |
bul | -0.002 |
hon | -0.002 |
Token | new |
Token ID | 649 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
bul | +0.003 |
spe | +0.003 |
flew | +0.003 |
paramed | +0.003 |
Or | +0.003 |
Neg logit contributions | |
sidelines | -0.003 |
spaghetti | -0.003 |
Seek | -0.002 |
ours | -0.002 |
concession | -0.002 |
Token | tutor |
Token ID | 48680 |
Feature activation | -2.42e-02 |
Pos logit contributions | |
sidelines | +0.015 |
spaghetti | +0.014 |
Seek | +0.013 |
menu | +0.012 |
bed | +0.011 |
Neg logit contributions | |
bul | -0.018 |
flew | -0.017 |
spe | -0.017 |
Bel | -0.016 |
paramed | -0.016 |
Token | as |
Token ID | 355 |
Feature activation | -3.16e-02 |
Pos logit contributions | |
bul | +0.034 |
flew | +0.034 |
spe | +0.033 |
Or | +0.030 |
soared | +0.030 |
Neg logit contributions | |
sidelines | -0.039 |
spaghetti | -0.038 |
Seek | -0.034 |
menu | -0.033 |
bed | -0.032 |
Token | soon |
Token ID | 2582 |
Feature activation | -5.01e-02 |
Pos logit contributions | |
flew | +0.045 |
bul | +0.041 |
spe | +0.039 |
soared | +0.038 |
ira | +0.038 |
Neg logit contributions | |
sidelines | -0.055 |
spaghetti | -0.048 |
Seek | -0.046 |
menu | -0.043 |
café | -0.043 |
Token | as |
Token ID | 355 |
Feature activation | -4.44e-02 |
Pos logit contributions | |
flew | +0.068 |
bul | +0.065 |
spe | +0.063 |
soared | +0.059 |
blew | +0.058 |
Neg logit contributions | |
sidelines | -0.084 |
spaghetti | -0.083 |
Seek | -0.075 |
menu | -0.072 |
bed | -0.069 |
Token | possible |
Token ID | 1744 |
Feature activation | -9.74e-02 |
Pos logit contributions | |
flew | +0.071 |
bul | +0.065 |
spe | +0.063 |
ira | +0.062 |
soared | +0.060 |
Neg logit contributions | |
sidelines | -0.069 |
spaghetti | -0.057 |
Seek | -0.055 |
menu | -0.053 |
café | -0.053 |
Token | . |
Token ID | 13 |
Feature activation | +1.95e-03 |
Pos logit contributions | |
flew | +0.127 |
bul | +0.124 |
spe | +0.120 |
pol | +0.110 |
soared | +0.110 |
Neg logit contributions | |
sidelines | -0.170 |
spaghetti | -0.165 |
Seek | -0.149 |
menu | -0.143 |
bed | -0.139 |
Token | We |
Token ID | 775 |
Feature activation | -2.08e-03 |
Pos logit contributions | |
sidelines | +0.003 |
spaghetti | +0.003 |
menu | +0.002 |
Seek | +0.002 |
bed | +0.002 |
Neg logit contributions | |
bul | -0.003 |
flew | -0.003 |
spe | -0.003 |
paramed | -0.003 |
Bel | -0.003 |
Token | love |
Token ID | 1842 |
Feature activation | +2.42e-02 |
Pos logit contributions | |
bul | +0.004 |
spe | +0.003 |
flew | +0.003 |
esh | +0.003 |
xc | +0.003 |
Neg logit contributions | |
spaghetti | -0.003 |
sidelines | -0.003 |
Seek | -0.002 |
menu | -0.002 |
bed | -0.002 |
Token | you |
Token ID | 345 |
Feature activation | -7.75e-03 |
Pos logit contributions | |
sidelines | +0.029 |
spaghetti | +0.026 |
Seek | +0.025 |
menu | +0.023 |
locker | +0.022 |
Neg logit contributions | |
flew | -0.042 |
spe | -0.041 |
bul | -0.041 |
Bel | -0.039 |
ira | -0.038 |
Token | , |
Token ID | 11 |
Feature activation | -6.05e-03 |
Pos logit contributions | |
flew | +0.008 |
bul | +0.007 |
spe | +0.006 |
ilot | +0.006 |
Or | +0.006 |
Neg logit contributions | |
sidelines | -0.017 |
spaghetti | -0.015 |
Seek | -0.014 |
Want | -0.014 |
menu | -0.013 |
Token | coat |
Token ID | 31434 |
Feature activation | +1.92e-02 |
Pos logit contributions | |
bul | +0.063 |
spe | +0.062 |
flew | +0.061 |
paramed | +0.057 |
Bel | +0.057 |
Neg logit contributions | |
spaghetti | -0.060 |
sidelines | -0.057 |
Seek | -0.053 |
bed | -0.050 |
menu | -0.050 |
Token | and |
Token ID | 290 |
Feature activation | -1.87e-02 |
Pos logit contributions | |
sidelines | +0.033 |
spaghetti | +0.032 |
Seek | +0.029 |
menu | +0.028 |
ours | +0.028 |
Neg logit contributions | |
flew | -0.026 |
bul | -0.025 |
spe | -0.025 |
paramed | -0.023 |
pol | -0.023 |
Token | boots |
Token ID | 14412 |
Feature activation | -2.67e-02 |
Pos logit contributions | |
flew | +0.022 |
bul | +0.022 |
spe | +0.021 |
soared | +0.019 |
Bel | +0.019 |
Neg logit contributions | |
sidelines | -0.035 |
spaghetti | -0.035 |
Seek | -0.031 |
menu | -0.031 |
bed | -0.030 |
Token | when |
Token ID | 618 |
Feature activation | -4.54e-02 |
Pos logit contributions | |
flew | +0.039 |
bul | +0.039 |
spe | +0.038 |
paramed | +0.035 |
pol | +0.035 |
Neg logit contributions | |
spaghetti | -0.041 |
sidelines | -0.041 |
Seek | -0.036 |
menu | -0.036 |
bed | -0.034 |
Token | it |
Token ID | 340 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
flew | +0.055 |
bul | +0.052 |
spe | +0.051 |
soared | +0.047 |
pol | +0.046 |
Neg logit contributions | |
sidelines | -0.083 |
spaghetti | -0.082 |
Seek | -0.075 |
menu | -0.075 |
internet | -0.070 |
Token | r |
Token ID | 374 |
Feature activation | -9.68e-02 |
Pos logit contributions | |
spe | +0.033 |
bul | +0.032 |
Ale | +0.030 |
cker | +0.029 |
rob | +0.029 |
Neg logit contributions | |
spaghetti | -0.043 |
sidelines | -0.039 |
bed | -0.038 |
Seek | -0.037 |
Want | -0.036 |
Token | ained |
Token ID | 1328 |
Feature activation | -3.54e-02 |
Pos logit contributions | |
spe | +0.161 |
flew | +0.158 |
bul | +0.157 |
Bel | +0.150 |
Or | +0.148 |
Neg logit contributions | |
spaghetti | -0.131 |
sidelines | -0.126 |
Seek | -0.113 |
bed | -0.107 |
menu | -0.100 |
Token | . |
Token ID | 13 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
bul | +0.053 |
spe | +0.053 |
flew | +0.052 |
paramed | +0.049 |
Bel | +0.049 |
Neg logit contributions | |
spaghetti | -0.053 |
sidelines | -0.052 |
Seek | -0.046 |
bed | -0.045 |
menu | -0.044 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
bul | +0.023 |
flew | +0.022 |
spe | +0.022 |
Bel | +0.021 |
paramed | +0.021 |
Neg logit contributions | |
sidelines | -0.032 |
spaghetti | -0.031 |
Seek | -0.028 |
menu | -0.028 |
ours | -0.027 |
Token | Once |
Token ID | 7454 |
Feature activation | -3.39e-02 |
Pos logit contributions | |
sidelines | +0.040 |
spaghetti | +0.037 |
ours | +0.035 |
Seek | +0.035 |
mine | +0.034 |
Neg logit contributions | |
flew | -0.019 |
bul | -0.018 |
spe | -0.016 |
Sher | -0.016 |
Bel | -0.016 |
Token | upon |
Token ID | 2402 |
Feature activation | -1.45e-04 |
Pos logit contributions | |
bul | +0.070 |
flew | +0.069 |
spe | +0.069 |
paramed | +0.066 |
pre | +0.066 |
Neg logit contributions | |
spaghetti | -0.033 |
sidelines | -0.030 |
bed | -0.026 |
Seek | -0.024 |
menu | -0.024 |
Token | to |
Token ID | 284 |
Feature activation | -6.60e-03 |
Pos logit contributions | |
bul | +0.005 |
flew | +0.004 |
spe | +0.004 |
pol | +0.004 |
mill | +0.004 |
Neg logit contributions | |
sidelines | -0.007 |
spaghetti | -0.007 |
Seek | -0.006 |
ours | -0.006 |
menu | -0.006 |
Token | be |
Token ID | 307 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
flew | +0.010 |
bul | +0.010 |
spe | +0.010 |
Bel | +0.009 |
pol | +0.009 |
Neg logit contributions | |
spaghetti | -0.010 |
sidelines | -0.010 |
Seek | -0.008 |
menu | -0.008 |
bed | -0.008 |
Token | as |
Token ID | 355 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
bul | +0.018 |
spe | +0.018 |
flew | +0.017 |
Bel | +0.017 |
pre | +0.017 |
Neg logit contributions | |
spaghetti | -0.013 |
sidelines | -0.013 |
Seek | -0.011 |
bed | -0.011 |
safe | -0.011 |
Token | quiet |
Token ID | 5897 |
Feature activation | -5.10e-02 |
Pos logit contributions | |
bul | +0.046 |
flew | +0.045 |
spe | +0.044 |
Bel | +0.043 |
xc | +0.043 |
Neg logit contributions | |
spaghetti | -0.031 |
sidelines | -0.029 |
Seek | -0.026 |
menu | -0.024 |
bed | -0.024 |
Token | as |
Token ID | 355 |
Feature activation | -3.66e-02 |
Pos logit contributions | |
bul | +0.070 |
flew | +0.070 |
spe | +0.068 |
paramed | +0.062 |
esh | +0.061 |
Neg logit contributions | |
spaghetti | -0.083 |
sidelines | -0.083 |
Seek | -0.075 |
menu | -0.072 |
bed | -0.070 |
Token | possible |
Token ID | 1744 |
Feature activation | -9.65e-02 |
Pos logit contributions | |
flew | +0.049 |
spe | +0.048 |
bul | +0.047 |
soared | +0.042 |
blew | +0.041 |
Neg logit contributions | |
sidelines | -0.063 |
spaghetti | -0.060 |
menu | -0.055 |
Seek | -0.054 |
internet | -0.052 |
Token | . |
Token ID | 13 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
flew | +0.122 |
bul | +0.119 |
spe | +0.115 |
pol | +0.105 |
soared | +0.105 |
Neg logit contributions | |
sidelines | -0.174 |
spaghetti | -0.170 |
Seek | -0.152 |
menu | -0.148 |
bed | -0.144 |
Token |
|
Token ID | 198 |
Feature activation | -5.30e-03 |
Pos logit contributions | |
spe | +0.016 |
bul | +0.015 |
flew | +0.014 |
pol | +0.014 |
Bel | +0.014 |
Neg logit contributions | |
sidelines | -0.026 |
spaghetti | -0.024 |
ours | -0.024 |
Seek | -0.023 |
shady | -0.022 |
Token |
|
Token ID | 198 |
Feature activation | -1.02e-03 |
Pos logit contributions | |
flew | +0.006 |
spe | +0.006 |
bul | +0.006 |
Bel | +0.005 |
Sher | +0.005 |
Neg logit contributions | |
sidelines | -0.010 |
spaghetti | -0.010 |
Seek | -0.009 |
menu | -0.009 |
ours | -0.009 |
Token | He |
Token ID | 1544 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
spe | +0.001 |
flew | +0.001 |
bul | +0.001 |
Bel | +0.001 |
pol | +0.001 |
Neg logit contributions | |
spaghetti | -0.002 |
sidelines | -0.002 |
bed | -0.002 |
menu | -0.002 |
Seek | -0.002 |
Token | grabbed |
Token ID | 13176 |
Feature activation | +5.30e-03 |
Pos logit contributions | |
bul | +0.014 |
pre | +0.014 |
spe | +0.013 |
paramed | +0.013 |
xc | +0.013 |
Neg logit contributions | |
spaghetti | -0.019 |
sidelines | -0.017 |
Seek | -0.016 |
bed | -0.016 |
robbers | -0.016 |
Token | all |
Token ID | 477 |
Feature activation | +2.02e-02 |
Pos logit contributions | |
spaghetti | +0.001 |
sidelines | +0.001 |
Seek | +0.001 |
menu | +0.001 |
bed | +0.001 |
Neg logit contributions | |
flew | -0.001 |
bul | -0.001 |
spe | -0.001 |
soared | -0.001 |
pol | -0.001 |
Token | over |
Token ID | 625 |
Feature activation | -1.69e-02 |
Pos logit contributions | |
spaghetti | +0.023 |
sidelines | +0.023 |
Seek | +0.020 |
bed | +0.019 |
mine | +0.018 |
Neg logit contributions | |
pre | -0.038 |
bul | -0.037 |
Or | -0.037 |
spe | -0.037 |
paramed | -0.037 |
Token | and |
Token ID | 290 |
Feature activation | -4.15e-03 |
Pos logit contributions | |
flew | +0.019 |
bul | +0.019 |
spe | +0.018 |
Bel | +0.016 |
pol | +0.016 |
Neg logit contributions | |
sidelines | -0.031 |
spaghetti | -0.030 |
Seek | -0.029 |
menu | -0.028 |
ours | -0.028 |
Token | his |
Token ID | 465 |
Feature activation | -2.51e-02 |
Pos logit contributions | |
flew | +0.005 |
bul | +0.005 |
spe | +0.005 |
soared | +0.005 |
blew | +0.004 |
Neg logit contributions | |
spaghetti | -0.007 |
sidelines | -0.007 |
Seek | -0.007 |
menu | -0.007 |
internet | -0.006 |
Token | mum |
Token ID | 25682 |
Feature activation | -3.29e-02 |
Pos logit contributions | |
flew | +0.036 |
bul | +0.035 |
spe | +0.035 |
paramed | +0.032 |
pre | +0.032 |
Neg logit contributions | |
sidelines | -0.039 |
spaghetti | -0.039 |
Seek | -0.036 |
menu | -0.034 |
ours | -0.033 |
Token | r |
Token ID | 374 |
Feature activation | -9.59e-02 |
Pos logit contributions | |
bul | +0.042 |
spe | +0.041 |
flew | +0.040 |
Bel | +0.038 |
pre | +0.038 |
Neg logit contributions | |
spaghetti | -0.058 |
sidelines | -0.056 |
Seek | -0.051 |
bed | -0.049 |
menu | -0.049 |
Token | ins |
Token ID | 1040 |
Feature activation | -2.75e-02 |
Pos logit contributions | |
flew | +0.160 |
Or | +0.153 |
soared | +0.149 |
rob | +0.148 |
spe | +0.146 |
Neg logit contributions | |
spaghetti | -0.139 |
sidelines | -0.121 |
Seek | -0.114 |
amas | -0.108 |
bed | -0.104 |
Token | ed |
Token ID | 276 |
Feature activation | -3.90e-02 |
Pos logit contributions | |
bul | +0.036 |
spe | +0.034 |
Bel | +0.033 |
paramed | +0.033 |
flew | +0.033 |
Neg logit contributions | |
spaghetti | -0.047 |
sidelines | -0.043 |
Seek | -0.041 |
bed | -0.040 |
menu | -0.040 |
Token | the |
Token ID | 262 |
Feature activation | -1.53e-02 |
Pos logit contributions | |
bul | +0.057 |
flew | +0.057 |
spe | +0.056 |
pol | +0.051 |
paramed | +0.051 |
Neg logit contributions | |
sidelines | -0.060 |
spaghetti | -0.059 |
Seek | -0.054 |
menu | -0.052 |
ours | -0.050 |
Token | soap |
Token ID | 19533 |
Feature activation | +2.02e-03 |
Pos logit contributions | |
bul | +0.024 |
spe | +0.024 |
flew | +0.024 |
paramed | +0.023 |
blew | +0.022 |
Neg logit contributions | |
sidelines | -0.020 |
spaghetti | -0.020 |
Seek | -0.019 |
ours | -0.018 |
Want | -0.018 |
Token | off |
Token ID | 572 |
Feature activation | -7.24e-03 |
Pos logit contributions | |
spaghetti | +0.003 |
sidelines | +0.003 |
bed | +0.003 |
Seek | +0.003 |
menu | +0.003 |
Neg logit contributions | |
bul | -0.003 |
spe | -0.003 |
flew | -0.003 |
paramed | -0.003 |
Bel | -0.003 |
Token | eat |
Token ID | 4483 |
Feature activation | +3.63e-02 |
Pos logit contributions | |
spaghetti | +0.027 |
sidelines | +0.027 |
Seek | +0.024 |
menu | +0.023 |
bed | +0.022 |
Neg logit contributions | |
flew | -0.034 |
bul | -0.034 |
spe | -0.033 |
paramed | -0.031 |
pol | -0.031 |
Token | it |
Token ID | 340 |
Feature activation | +9.51e-03 |
Pos logit contributions | |
sidelines | +0.075 |
Seek | +0.069 |
robbers | +0.067 |
internet | +0.065 |
spine | +0.064 |
Neg logit contributions | |
flew | -0.037 |
bul | -0.032 |
spr | -0.032 |
aches | -0.032 |
pol | -0.031 |
Token | as |
Token ID | 355 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
sidelines | +0.020 |
spaghetti | +0.017 |
robbers | +0.017 |
concession | +0.017 |
Seek | +0.017 |
Neg logit contributions | |
flew | -0.010 |
bul | -0.009 |
spe | -0.008 |
pol | -0.008 |
imm | -0.007 |
Token | quickly |
Token ID | 2952 |
Feature activation | -2.80e-02 |
Pos logit contributions | |
bul | +0.024 |
flew | +0.024 |
spe | +0.024 |
paramed | +0.022 |
soared | +0.022 |
Neg logit contributions | |
spaghetti | -0.022 |
sidelines | -0.021 |
Seek | -0.019 |
menu | -0.018 |
bed | -0.018 |
Token | as |
Token ID | 355 |
Feature activation | -3.97e-02 |
Pos logit contributions | |
bul | +0.047 |
spe | +0.047 |
xc | +0.044 |
Bel | +0.043 |
flew | +0.043 |
Neg logit contributions | |
spaghetti | -0.040 |
sidelines | -0.038 |
menu | -0.034 |
bed | -0.034 |
mine | -0.032 |
Token | possible |
Token ID | 1744 |
Feature activation | -9.57e-02 |
Pos logit contributions | |
bul | +0.051 |
flew | +0.050 |
spe | +0.049 |
paramed | +0.045 |
pol | +0.045 |
Neg logit contributions | |
spaghetti | -0.070 |
sidelines | -0.068 |
Seek | -0.062 |
menu | -0.060 |
bed | -0.060 |
Token | , |
Token ID | 11 |
Feature activation | -2.18e-02 |
Pos logit contributions | |
bul | +0.142 |
spe | +0.141 |
flew | +0.139 |
paramed | +0.131 |
Bel | +0.129 |
Neg logit contributions | |
spaghetti | -0.148 |
sidelines | -0.142 |
Seek | -0.129 |
menu | -0.126 |
bed | -0.125 |
Token | but |
Token ID | 475 |
Feature activation | -1.33e-03 |
Pos logit contributions | |
flew | +0.037 |
bul | +0.035 |
spe | +0.034 |
Or | +0.034 |
blew | +0.033 |
Neg logit contributions | |
sidelines | -0.028 |
spaghetti | -0.027 |
Seek | -0.025 |
menu | -0.023 |
internet | -0.022 |
Token | her |
Token ID | 607 |
Feature activation | -7.48e-03 |
Pos logit contributions | |
flew | +0.001 |
spe | +0.001 |
bul | +0.001 |
blew | +0.001 |
pol | +0.001 |
Neg logit contributions | |
sidelines | -0.003 |
spaghetti | -0.003 |
menu | -0.002 |
Seek | -0.002 |
internet | -0.002 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.89e-02 |
Pos logit contributions | |
spe | +0.006 |
flew | +0.006 |
bul | +0.005 |
paramed | +0.005 |
ira | +0.005 |
Neg logit contributions | |
sidelines | -0.017 |
Seek | -0.016 |
spaghetti | -0.015 |
Want | -0.015 |
ours | -0.014 |
Token | my |
Token ID | 1820 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
bul | +0.032 |
flew | +0.032 |
spe | +0.032 |
pol | +0.030 |
paramed | +0.030 |
Neg logit contributions | |
spaghetti | -0.025 |
sidelines | -0.024 |
Seek | -0.021 |
menu | -0.020 |
bed | -0.020 |
Token | get |
Token ID | 651 |
Feature activation | -9.04e-03 |
Pos logit contributions | |
bul | +0.005 |
flew | +0.005 |
spe | +0.005 |
Bel | +0.005 |
pol | +0.005 |
Neg logit contributions | |
spaghetti | -0.005 |
sidelines | -0.005 |
Seek | -0.004 |
menu | -0.004 |
bed | -0.004 |
Token | it |
Token ID | 340 |
Feature activation | -5.19e-03 |
Pos logit contributions | |
flew | +0.013 |
bul | +0.013 |
spe | +0.013 |
soared | +0.012 |
pol | +0.012 |
Neg logit contributions | |
spaghetti | -0.014 |
sidelines | -0.014 |
Seek | -0.012 |
menu | -0.012 |
bed | -0.012 |
Token | as |
Token ID | 355 |
Feature activation | -3.14e-02 |
Pos logit contributions | |
bul | +0.008 |
flew | +0.008 |
spe | +0.008 |
paramed | +0.008 |
Bel | +0.008 |
Neg logit contributions | |
spaghetti | -0.007 |
sidelines | -0.007 |
Seek | -0.006 |
menu | -0.006 |
bed | -0.006 |
Token | close |
Token ID | 1969 |
Feature activation | -4.15e-02 |
Pos logit contributions | |
flew | +0.056 |
bul | +0.055 |
spe | +0.055 |
soared | +0.051 |
pol | +0.050 |
Neg logit contributions | |
sidelines | -0.040 |
spaghetti | -0.039 |
Seek | -0.033 |
menu | -0.033 |
bed | -0.031 |
Token | as |
Token ID | 355 |
Feature activation | -3.88e-02 |
Pos logit contributions | |
bul | +0.065 |
flew | +0.064 |
spe | +0.064 |
paramed | +0.062 |
Bel | +0.062 |
Neg logit contributions | |
spaghetti | -0.059 |
sidelines | -0.057 |
bed | -0.051 |
Seek | -0.050 |
menu | -0.049 |
Token | possible |
Token ID | 1744 |
Feature activation | -9.56e-02 |
Pos logit contributions | |
flew | +0.049 |
bul | +0.048 |
spe | +0.048 |
soared | +0.042 |
pre | +0.041 |
Neg logit contributions | |
sidelines | -0.069 |
spaghetti | -0.068 |
menu | -0.061 |
Seek | -0.061 |
bed | -0.057 |
Token | to |
Token ID | 284 |
Feature activation | -3.50e-02 |
Pos logit contributions | |
flew | +0.121 |
bul | +0.119 |
spe | +0.115 |
soared | +0.105 |
pol | +0.105 |
Neg logit contributions | |
sidelines | -0.171 |
spaghetti | -0.168 |
Seek | -0.150 |
menu | -0.146 |
bed | -0.141 |
Token | the |
Token ID | 262 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
flew | +0.051 |
bul | +0.047 |
spe | +0.045 |
soared | +0.045 |
rob | +0.042 |
Neg logit contributions | |
spaghetti | -0.058 |
sidelines | -0.054 |
menu | -0.051 |
Seek | -0.050 |
concession | -0.047 |
Token | bench |
Token ID | 7624 |
Feature activation | -4.38e-03 |
Pos logit contributions | |
flew | +0.018 |
spe | +0.017 |
rob | +0.016 |
k | +0.016 |
soared | +0.016 |
Neg logit contributions | |
spaghetti | -0.021 |
Seek | -0.018 |
Want | -0.018 |
hunting | -0.017 |
sidelines | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
flew | +0.006 |
bul | +0.006 |
spe | +0.006 |
pol | +0.005 |
Bel | +0.005 |
Neg logit contributions | |
spaghetti | -0.007 |
sidelines | -0.007 |
Seek | -0.006 |
menu | -0.006 |
bed | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -4.85e-03 |
Pos logit contributions | |
bul | +0.015 |
spe | +0.014 |
flew | +0.014 |
Sher | +0.013 |
Bel | +0.013 |
Neg logit contributions | |
sidelines | -0.019 |
spaghetti | -0.018 |
menu | -0.016 |
Seek | -0.016 |
ours | -0.016 |
Token | red |
Token ID | 2266 |
Feature activation | -1.87e-02 |
Pos logit contributions | |
bul | +0.004 |
flew | +0.004 |
spe | +0.004 |
soared | +0.004 |
pre | +0.004 |
Neg logit contributions | |
sidelines | -0.004 |
spaghetti | -0.004 |
Seek | -0.004 |
menu | -0.003 |
Want | -0.003 |
Token | cape |
Token ID | 36023 |
Feature activation | -1.60e-03 |
Pos logit contributions | |
bul | +0.030 |
flew | +0.030 |
spe | +0.029 |
soared | +0.027 |
Bel | +0.027 |
Neg logit contributions | |
sidelines | -0.026 |
spaghetti | -0.026 |
Seek | -0.023 |
menu | -0.022 |
ours | -0.021 |
Token | and |
Token ID | 290 |
Feature activation | +2.97e-03 |
Pos logit contributions | |
flew | +0.002 |
bul | +0.002 |
spe | +0.002 |
soared | +0.002 |
pol | +0.002 |
Neg logit contributions | |
sidelines | -0.003 |
spaghetti | -0.003 |
Seek | -0.002 |
menu | -0.002 |
Want | -0.002 |
Token | make |
Token ID | 787 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
sidelines | +0.005 |
spaghetti | +0.005 |
Seek | +0.004 |
menu | +0.004 |
bed | +0.004 |
Neg logit contributions | |
flew | -0.004 |
bul | -0.004 |
spe | -0.004 |
soared | -0.004 |
Bel | -0.004 |
Token | - |
Token ID | 12 |
Feature activation | -1.99e-02 |
Pos logit contributions | |
bul | +0.016 |
flew | +0.015 |
spe | +0.015 |
paramed | +0.014 |
pol | +0.014 |
Neg logit contributions | |
spaghetti | -0.015 |
sidelines | -0.015 |
Seek | -0.013 |
menu | -0.013 |
bed | -0.013 |
Token | bel |
Token ID | 6667 |
Feature activation | -9.54e-02 |
Pos logit contributions | |
bul | +0.012 |
flew | +0.011 |
spe | +0.010 |
esh | +0.010 |
slit | +0.010 |
Neg logit contributions | |
sidelines | -0.046 |
spaghetti | -0.045 |
Seek | -0.044 |
safe | -0.040 |
bed | -0.040 |
Token | ieve |
Token ID | 12311 |
Feature activation | -3.13e-02 |
Pos logit contributions | |
spe | +0.150 |
bul | +0.149 |
flew | +0.149 |
pre | +0.138 |
Bel | +0.138 |
Neg logit contributions | |
spaghetti | -0.136 |
sidelines | -0.135 |
Seek | -0.120 |
bed | -0.113 |
menu | -0.112 |
Token | he |
Token ID | 339 |
Feature activation | +8.22e-03 |
Pos logit contributions | |
bul | +0.045 |
flew | +0.045 |
spe | +0.044 |
soared | +0.040 |
Bel | +0.039 |
Neg logit contributions | |
sidelines | -0.050 |
spaghetti | -0.050 |
Seek | -0.044 |
menu | -0.043 |
bed | -0.041 |
Token | had |
Token ID | 550 |
Feature activation | -4.56e-05 |
Pos logit contributions | |
spaghetti | +0.014 |
sidelines | +0.013 |
Seek | +0.012 |
bed | +0.012 |
menu | +0.012 |
Neg logit contributions | |
paramed | -0.011 |
bul | -0.010 |
spe | -0.010 |
Bel | -0.010 |
xc | -0.010 |
Token | super |
Token ID | 2208 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
flew | +0.000 |
bul | +0.000 |
spe | +0.000 |
soared | +0.000 |
Bel | +0.000 |
Neg logit contributions | |
sidelines | -0.000 |
spaghetti | -0.000 |
Seek | -0.000 |
menu | -0.000 |
bed | -0.000 |
Token | powers |
Token ID | 30132 |
Feature activation | -4.65e-02 |
Pos logit contributions | |
bul | +0.019 |
flew | +0.019 |
spe | +0.019 |
paramed | +0.018 |
xc | +0.018 |
Neg logit contributions | |
spaghetti | -0.012 |
sidelines | -0.012 |
Seek | -0.011 |
menu | -0.010 |
bed | -0.010 |
Token | back |
Token ID | 736 |
Feature activation | +2.47e-03 |
Pos logit contributions | |
flew | +0.001 |
bul | +0.001 |
spe | +0.001 |
Bel | +0.000 |
soared | +0.000 |
Neg logit contributions | |
spaghetti | -0.001 |
sidelines | -0.001 |
Seek | -0.000 |
menu | -0.000 |
bed | -0.000 |
Token | away |
Token ID | 1497 |
Feature activation | +8.81e-03 |
Pos logit contributions | |
sidelines | +0.004 |
spaghetti | +0.004 |
Seek | +0.003 |
menu | +0.003 |
bed | +0.003 |
Neg logit contributions | |
flew | -0.004 |
bul | -0.004 |
spe | -0.004 |
Bel | -0.003 |
pol | -0.003 |
Token | as |
Token ID | 355 |
Feature activation | -2.36e-02 |
Pos logit contributions | |
spaghetti | +0.013 |
sidelines | +0.013 |
bed | +0.011 |
Seek | +0.011 |
menu | +0.011 |
Neg logit contributions | |
bul | -0.013 |
flew | -0.013 |
spe | -0.013 |
pre | -0.012 |
soared | -0.012 |
Token | quietly |
Token ID | 12703 |
Feature activation | -3.89e-02 |
Pos logit contributions | |
bul | +0.032 |
spe | +0.032 |
flew | +0.031 |
paramed | +0.030 |
pre | +0.029 |
Neg logit contributions | |
spaghetti | -0.039 |
sidelines | -0.039 |
bed | -0.034 |
Seek | -0.034 |
menu | -0.033 |
Token | as |
Token ID | 355 |
Feature activation | -4.15e-02 |
Pos logit contributions | |
spe | +0.070 |
bul | +0.067 |
xc | +0.066 |
Bel | +0.064 |
pre | +0.064 |
Neg logit contributions | |
spaghetti | -0.050 |
sidelines | -0.048 |
bed | -0.043 |
hunting | -0.041 |
menu | -0.041 |
Token | possible |
Token ID | 1744 |
Feature activation | -9.53e-02 |
Pos logit contributions | |
bul | +0.052 |
spe | +0.051 |
flew | +0.050 |
paramed | +0.047 |
pre | +0.047 |
Neg logit contributions | |
spaghetti | -0.074 |
sidelines | -0.073 |
Seek | -0.065 |
bed | -0.065 |
menu | -0.063 |
Token | , |
Token ID | 11 |
Feature activation | -2.11e-02 |
Pos logit contributions | |
spe | +0.159 |
bul | +0.157 |
paramed | +0.151 |
flew | +0.149 |
pre | +0.146 |
Neg logit contributions | |
spaghetti | -0.129 |
sidelines | -0.120 |
bed | -0.113 |
Seek | -0.111 |
menu | -0.107 |
Token | but |
Token ID | 475 |
Feature activation | +1.45e-03 |
Pos logit contributions | |
flew | +0.041 |
bul | +0.041 |
spe | +0.040 |
Bel | +0.038 |
soared | +0.038 |
Neg logit contributions | |
spaghetti | -0.023 |
sidelines | -0.022 |
Seek | -0.019 |
menu | -0.018 |
bed | -0.017 |
Token | Mom |
Token ID | 11254 |
Feature activation | -1.86e-02 |
Pos logit contributions | |
spaghetti | +0.002 |
sidelines | +0.002 |
Seek | +0.002 |
menu | +0.002 |
bed | +0.002 |
Neg logit contributions | |
bul | -0.002 |
flew | -0.002 |
spe | -0.002 |
pre | -0.002 |
paramed | -0.002 |
Token | my |
Token ID | 1820 |
Feature activation | -6.55e-03 |
Pos logit contributions | |
bul | +0.034 |
spe | +0.034 |
flew | +0.034 |
pre | +0.032 |
Bel | +0.032 |
Neg logit contributions | |
spaghetti | -0.022 |
sidelines | -0.021 |
Seek | -0.018 |
bed | -0.017 |
menu | -0.017 |
Token | noticed |
Token ID | 6810 |
Feature activation | +6.66e-03 |
Pos logit contributions | |
bul | +0.008 |
spe | +0.008 |
pre | +0.008 |
Bel | +0.008 |
xc | +0.008 |
Neg logit contributions | |
spaghetti | -0.011 |
sidelines | -0.010 |
Seek | -0.009 |
safe | -0.009 |
bone | -0.009 |
Token | It |
Token ID | 632 |
Feature activation | -7.46e-03 |
Pos logit contributions | |
flew | +0.003 |
Bel | +0.002 |
bul | +0.002 |
spe | +0.002 |
pol | +0.002 |
Neg logit contributions | |
sidelines | -0.003 |
spaghetti | -0.003 |
Seek | -0.003 |
ours | -0.003 |
menu | -0.003 |
Token | tasted |
Token ID | 29187 |
Feature activation | +4.48e-02 |
Pos logit contributions | |
spe | +0.011 |
paramed | +0.011 |
Ale | +0.010 |
xc | +0.010 |
pre | +0.010 |
Neg logit contributions | |
spaghetti | -0.012 |
bone | -0.009 |
Seek | -0.009 |
shady | -0.009 |
safe | -0.009 |
Token | terrible |
Token ID | 7818 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
sidelines | +0.061 |
spaghetti | +0.055 |
Seek | +0.052 |
robbers | +0.049 |
menu | +0.048 |
Neg logit contributions | |
flew | -0.078 |
bul | -0.075 |
spe | -0.072 |
pol | -0.070 |
Bel | -0.070 |
Token | and |
Token ID | 290 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
flew | +0.013 |
bul | +0.012 |
spe | +0.011 |
spr | +0.011 |
esh | +0.010 |
Neg logit contributions | |
sidelines | -0.019 |
Seek | -0.017 |
spaghetti | -0.017 |
robbers | -0.016 |
internet | -0.016 |
Token | she |
Token ID | 673 |
Feature activation | +6.51e-03 |
Pos logit contributions | |
sidelines | +0.025 |
spaghetti | +0.025 |
Seek | +0.023 |
menu | +0.022 |
bed | +0.021 |
Neg logit contributions | |
flew | -0.020 |
bul | -0.019 |
spe | -0.018 |
soared | -0.017 |
blew | -0.017 |
Token | rec |
Token ID | 664 |
Feature activation | -9.51e-02 |
Pos logit contributions | |
spaghetti | +0.011 |
sidelines | +0.009 |
bone | +0.009 |
mine | +0.009 |
Seek | +0.008 |
Neg logit contributions | |
bul | -0.009 |
paramed | -0.009 |
spe | -0.009 |
esh | -0.009 |
xc | -0.008 |
Token | o |
Token ID | 78 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
bul | +0.162 |
flew | +0.156 |
spe | +0.154 |
rob | +0.154 |
paramed | +0.153 |
Neg logit contributions | |
sidelines | -0.119 |
spaghetti | -0.112 |
Seek | -0.109 |
mine | -0.094 |
Want | -0.094 |
Token | iled |
Token ID | 3902 |
Feature activation | -9.16e-03 |
Pos logit contributions | |
bul | +0.019 |
spe | +0.017 |
Sher | +0.017 |
paramed | +0.017 |
Sab | +0.017 |
Neg logit contributions | |
spaghetti | -0.021 |
sidelines | -0.018 |
bone | -0.017 |
safe | -0.016 |
mine | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | -7.32e-04 |
Pos logit contributions | |
bul | +0.014 |
spe | +0.013 |
flew | +0.013 |
Bel | +0.012 |
pre | +0.012 |
Neg logit contributions | |
spaghetti | -0.014 |
sidelines | -0.014 |
Seek | -0.012 |
menu | -0.012 |
bed | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | +2.03e-03 |
Pos logit contributions | |
flew | +0.001 |
bul | +0.001 |
Bel | +0.001 |
spe | +0.001 |
pol | +0.001 |
Neg logit contributions | |
sidelines | -0.001 |
spaghetti | -0.001 |
Seek | -0.001 |
menu | -0.001 |
ours | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +4.42e-03 |
Pos logit contributions | |
sidelines | +0.003 |
spaghetti | +0.003 |
Seek | +0.003 |
menu | +0.003 |
ours | +0.003 |
Neg logit contributions | |
flew | -0.003 |
bul | -0.003 |
spe | -0.002 |
Bel | -0.002 |
Sher | -0.002 |
Token | - |
Token ID | 12 |
Feature activation | -2.87e-03 |
Pos logit contributions | |
sidelines | +0.035 |
spaghetti | +0.035 |
Seek | +0.032 |
menu | +0.031 |
robbers | +0.030 |
Neg logit contributions | |
flew | -0.020 |
bul | -0.020 |
spe | -0.019 |
pol | -0.018 |
paramed | -0.018 |
Token | up |
Token ID | 929 |
Feature activation | +5.29e-03 |
Pos logit contributions | |
bul | +0.003 |
spe | +0.003 |
flew | +0.003 |
slit | +0.003 |
Or | +0.003 |
Neg logit contributions | |
spaghetti | -0.006 |
sidelines | -0.005 |
Seek | -0.005 |
menu | -0.005 |
bed | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | +8.94e-03 |
Pos logit contributions | |
sidelines | +0.009 |
spaghetti | +0.009 |
Seek | +0.008 |
menu | +0.007 |
Want | +0.007 |
Neg logit contributions | |
flew | -0.007 |
bul | -0.007 |
spe | -0.007 |
pol | -0.006 |
soared | -0.006 |
Token | make |
Token ID | 787 |
Feature activation | -8.94e-03 |
Pos logit contributions | |
sidelines | +0.014 |
spaghetti | +0.014 |
Seek | +0.012 |
menu | +0.012 |
ours | +0.011 |
Neg logit contributions | |
flew | -0.013 |
bul | -0.013 |
spe | -0.013 |
soared | -0.012 |
Bel | -0.012 |
Token | - |
Token ID | 12 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
bul | +0.015 |
spe | +0.015 |
flew | +0.014 |
cker | +0.014 |
pre | +0.014 |
Neg logit contributions | |
spaghetti | -0.013 |
sidelines | -0.012 |
bed | -0.011 |
Seek | -0.010 |
menu | -0.010 |
Token | bel |
Token ID | 6667 |
Feature activation | -9.41e-02 |
Pos logit contributions | |
bul | +0.015 |
flew | +0.014 |
spe | +0.013 |
slit | +0.013 |
esh | +0.013 |
Neg logit contributions | |
spaghetti | -0.037 |
sidelines | -0.037 |
Seek | -0.035 |
bed | -0.033 |
menu | -0.033 |
Token | ieve |
Token ID | 12311 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
spe | +0.144 |
bul | +0.143 |
flew | +0.142 |
Bel | +0.132 |
pre | +0.132 |
Neg logit contributions | |
spaghetti | -0.138 |
sidelines | -0.138 |
Seek | -0.124 |
bed | -0.115 |
menu | -0.114 |
Token | . |
Token ID | 13 |
Feature activation | +1.72e-03 |
Pos logit contributions | |
bul | +0.041 |
flew | +0.041 |
spe | +0.040 |
Bel | +0.037 |
paramed | +0.037 |
Neg logit contributions | |
spaghetti | -0.040 |
sidelines | -0.039 |
Seek | -0.035 |
menu | -0.034 |
bed | -0.033 |
Token | One |
Token ID | 1881 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
sidelines | +0.003 |
spaghetti | +0.003 |
Seek | +0.003 |
ours | +0.003 |
robbers | +0.003 |
Neg logit contributions | |
bul | -0.002 |
flew | -0.002 |
Bel | -0.002 |
pol | -0.002 |
spe | -0.002 |
Token | day |
Token ID | 1110 |
Feature activation | +2.37e-02 |
Pos logit contributions | |
sidelines | +0.021 |
spaghetti | +0.019 |
Seek | +0.018 |
menu | +0.017 |
ours | +0.016 |
Neg logit contributions | |
flew | -0.018 |
bul | -0.018 |
spe | -0.018 |
pol | -0.017 |
pre | -0.016 |
Token | , |
Token ID | 11 |
Feature activation | +7.53e-03 |
Pos logit contributions | |
spaghetti | +0.040 |
sidelines | +0.040 |
Seek | +0.036 |
menu | +0.035 |
bed | +0.034 |
Neg logit contributions | |
flew | -0.032 |
bul | -0.031 |
spe | -0.031 |
pol | -0.028 |
paramed | -0.028 |
Token | things |
Token ID | 1243 |
Feature activation | -3.28e-02 |
Pos logit contributions | |
sidelines | +0.006 |
spaghetti | +0.005 |
Seek | +0.005 |
Want | +0.004 |
internet | +0.004 |
Neg logit contributions | |
flew | -0.006 |
bul | -0.006 |
spe | -0.006 |
soared | -0.006 |
Bel | -0.006 |
Token | â |
Token ID | 22940 |
Feature activation | -5.23e-05 |
Pos logit contributions | |
flew | +0.046 |
bul | +0.046 |
spe | +0.044 |
pol | +0.041 |
soared | +0.040 |
Neg logit contributions | |
sidelines | -0.054 |
spaghetti | -0.053 |
Seek | -0.047 |
menu | -0.045 |
bed | -0.045 |
Token | € |
Token ID | 26391 |
Feature activation | -3.30e-03 |
Pos logit contributions | |
bul | +0.000 |
flew | +0.000 |
spe | +0.000 |
pol | +0.000 |
Bel | +0.000 |
Neg logit contributions | |
spaghetti | -0.000 |
sidelines | -0.000 |
Seek | -0.000 |
menu | -0.000 |
bed | -0.000 |
Token | � |
Token ID | 447 |
Feature activation | -6.61e-02 |
Pos logit contributions | |
flew | +0.005 |
spe | +0.005 |
bul | +0.005 |
soared | +0.004 |
Bel | +0.004 |
Neg logit contributions | |
sidelines | -0.005 |
spaghetti | -0.005 |
Seek | -0.005 |
menu | -0.005 |
bed | -0.004 |
Token | � |
Token ID | 251 |
Feature activation | -2.31e-02 |
Pos logit contributions | |
bul | +0.122 |
spe | +0.122 |
flew | +0.120 |
paramed | +0.113 |
Bel | +0.112 |
Neg logit contributions | |
spaghetti | -0.078 |
sidelines | -0.075 |
Seek | -0.064 |
menu | -0.062 |
bed | -0.061 |
Token | col |
Token ID | 4033 |
Feature activation | -9.38e-02 |
Pos logit contributions | |
spe | +0.041 |
bul | +0.040 |
flew | +0.039 |
cker | +0.039 |
pol | +0.037 |
Neg logit contributions | |
spaghetti | -0.031 |
sidelines | -0.029 |
bed | -0.027 |
Seek | -0.024 |
menu | -0.024 |
Token | ouring |
Token ID | 21823 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
flew | +0.210 |
spe | +0.207 |
bul | +0.204 |
Or | +0.202 |
soared | +0.197 |
Neg logit contributions | |
sidelines | -0.078 |
spaghetti | -0.074 |
Seek | -0.056 |
menu | -0.051 |
mine | -0.050 |
Token | books |
Token ID | 3835 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
spaghetti | +0.024 |
sidelines | +0.023 |
bed | +0.021 |
menu | +0.020 |
Seek | +0.020 |
Neg logit contributions | |
bul | -0.022 |
spe | -0.021 |
flew | -0.021 |
pre | -0.020 |
xc | -0.020 |
Token | , |
Token ID | 11 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
flew | +0.020 |
bul | +0.020 |
spe | +0.019 |
soared | +0.017 |
pol | +0.017 |
Neg logit contributions | |
sidelines | -0.026 |
spaghetti | -0.026 |
Seek | -0.024 |
menu | -0.023 |
robbers | -0.022 |
Token | stickers |
Token ID | 28568 |
Feature activation | -1.28e-02 |
Pos logit contributions | |
flew | +0.045 |
bul | +0.044 |
spe | +0.043 |
soared | +0.040 |
Bel | +0.039 |
Neg logit contributions | |
sidelines | -0.049 |
spaghetti | -0.048 |
Seek | -0.044 |
menu | -0.042 |
internet | -0.041 |
Token | and |
Token ID | 290 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
bul | +0.020 |
spe | +0.019 |
flew | +0.019 |
Bel | +0.018 |
paramed | +0.018 |
Neg logit contributions | |
spaghetti | -0.019 |
sidelines | -0.018 |
Seek | -0.016 |
menu | -0.016 |
bed | -0.016 |
Token | slices |
Token ID | 24314 |
Feature activation | +1.17e-03 |
Pos logit contributions | |
bul | +0.020 |
flew | +0.020 |
spe | +0.020 |
paramed | +0.019 |
Bel | +0.019 |
Neg logit contributions | |
spaghetti | -0.018 |
sidelines | -0.017 |
Seek | -0.015 |
menu | -0.015 |
bed | -0.015 |
Token | look |
Token ID | 804 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
sidelines | +0.002 |
spaghetti | +0.002 |
Seek | +0.002 |
menu | +0.002 |
bed | +0.001 |
Neg logit contributions | |
bul | -0.002 |
flew | -0.002 |
spe | -0.002 |
pol | -0.002 |
pre | -0.002 |
Token | as |
Token ID | 355 |
Feature activation | -2.29e-02 |
Pos logit contributions | |
sidelines | +0.016 |
spaghetti | +0.015 |
Seek | +0.014 |
bed | +0.013 |
robbers | +0.013 |
Neg logit contributions | |
flew | -0.020 |
bul | -0.020 |
spe | -0.020 |
pol | -0.018 |
soared | -0.018 |
Token | tidy |
Token ID | 43044 |
Feature activation | -4.16e-02 |
Pos logit contributions | |
bul | +0.040 |
flew | +0.040 |
spe | +0.040 |
pol | +0.037 |
pre | +0.037 |
Neg logit contributions | |
sidelines | -0.029 |
spaghetti | -0.028 |
Seek | -0.025 |
menu | -0.024 |
bed | -0.023 |
Token | as |
Token ID | 355 |
Feature activation | -3.57e-02 |
Pos logit contributions | |
bul | +0.059 |
flew | +0.059 |
spe | +0.058 |
pol | +0.053 |
paramed | +0.053 |
Neg logit contributions | |
sidelines | -0.066 |
spaghetti | -0.066 |
Seek | -0.059 |
menu | -0.057 |
bed | -0.056 |
Token | possible |
Token ID | 1744 |
Feature activation | -9.32e-02 |
Pos logit contributions | |
flew | +0.050 |
bul | +0.050 |
spe | +0.049 |
pre | +0.044 |
pol | +0.044 |
Neg logit contributions | |
sidelines | -0.059 |
spaghetti | -0.056 |
Seek | -0.051 |
menu | -0.049 |
bed | -0.048 |
Token | . |
Token ID | 13 |
Feature activation | -9.48e-03 |
Pos logit contributions | |
flew | +0.118 |
bul | +0.117 |
spe | +0.112 |
pol | +0.102 |
soared | +0.102 |
Neg logit contributions | |
sidelines | -0.166 |
spaghetti | -0.160 |
Seek | -0.145 |
menu | -0.140 |
bed | -0.137 |
Token | Once |
Token ID | 4874 |
Feature activation | -3.78e-02 |
Pos logit contributions | |
bul | +0.015 |
spe | +0.015 |
flew | +0.015 |
paramed | +0.013 |
Bel | +0.013 |
Neg logit contributions | |
sidelines | -0.014 |
spaghetti | -0.014 |
Seek | -0.012 |
menu | -0.012 |
bed | -0.011 |
Token | he |
Token ID | 339 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
bul | +0.061 |
spe | +0.060 |
flew | +0.059 |
Bel | +0.057 |
paramed | +0.056 |
Neg logit contributions | |
spaghetti | -0.054 |
sidelines | -0.052 |
Seek | -0.046 |
menu | -0.045 |
bed | -0.044 |
Token | was |
Token ID | 373 |
Feature activation | -1.38e-02 |
Pos logit contributions | |
spaghetti | +0.020 |
sidelines | +0.018 |
Seek | +0.017 |
menu | +0.017 |
bed | +0.016 |
Neg logit contributions | |
spe | -0.016 |
bul | -0.016 |
paramed | -0.016 |
Bel | -0.015 |
esh | -0.015 |
Token | finished |
Token ID | 5201 |
Feature activation | -1.81e-03 |
Pos logit contributions | |
bul | +0.021 |
flew | +0.021 |
spe | +0.021 |
Bel | +0.019 |
pol | +0.019 |
Neg logit contributions | |
spaghetti | -0.020 |
sidelines | -0.020 |
Seek | -0.018 |
menu | -0.017 |
bed | -0.017 |
Token | and |
Token ID | 290 |
Feature activation | -1.76e-02 |
Pos logit contributions | |
flew | +0.004 |
bul | +0.004 |
spe | +0.003 |
blew | +0.003 |
soared | +0.003 |
Neg logit contributions | |
sidelines | -0.007 |
spaghetti | -0.006 |
Seek | -0.006 |
Want | -0.006 |
menu | -0.006 |
Token | they |
Token ID | 484 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
flew | +0.024 |
bul | +0.023 |
spe | +0.023 |
soared | +0.021 |
blew | +0.021 |
Neg logit contributions | |
sidelines | -0.030 |
spaghetti | -0.029 |
Seek | -0.026 |
menu | -0.025 |
internet | -0.024 |
Token | played |
Token ID | 2826 |
Feature activation | -2.22e-02 |
Pos logit contributions | |
bul | +0.020 |
paramed | +0.019 |
xc | +0.019 |
esh | +0.019 |
spe | +0.019 |
Neg logit contributions | |
spaghetti | -0.022 |
sidelines | -0.021 |
Seek | -0.019 |
bed | -0.019 |
menu | -0.019 |
Token | make |
Token ID | 787 |
Feature activation | -9.15e-03 |
Pos logit contributions | |
flew | +0.025 |
spe | +0.022 |
bul | +0.022 |
Or | +0.021 |
soared | +0.021 |
Neg logit contributions | |
sidelines | -0.043 |
spaghetti | -0.040 |
menu | -0.037 |
ours | -0.037 |
Seek | -0.037 |
Token | - |
Token ID | 12 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
flew | +0.013 |
spe | +0.012 |
bul | +0.012 |
soared | +0.012 |
hon | +0.011 |
Neg logit contributions | |
sidelines | -0.015 |
spaghetti | -0.013 |
menu | -0.013 |
Seek | -0.012 |
robbers | -0.012 |
Token | bel |
Token ID | 6667 |
Feature activation | -9.27e-02 |
Pos logit contributions | |
flew | +0.010 |
bul | +0.010 |
spe | +0.008 |
esh | +0.008 |
soared | +0.008 |
Neg logit contributions | |
spaghetti | -0.053 |
sidelines | -0.053 |
Seek | -0.050 |
menu | -0.049 |
bed | -0.047 |
Token | ieve |
Token ID | 12311 |
Feature activation | -3.19e-02 |
Pos logit contributions | |
bul | +0.139 |
flew | +0.138 |
spe | +0.137 |
Bel | +0.126 |
paramed | +0.126 |
Neg logit contributions | |
spaghetti | -0.140 |
sidelines | -0.139 |
Seek | -0.123 |
menu | -0.118 |
bed | -0.116 |
Token | . |
Token ID | 13 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
spe | +0.042 |
flew | +0.042 |
bul | +0.042 |
soared | +0.036 |
Or | +0.036 |
Neg logit contributions | |
sidelines | -0.056 |
spaghetti | -0.054 |
Seek | -0.048 |
menu | -0.047 |
bed | -0.045 |
Token | Finally |
Token ID | 9461 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
flew | +0.017 |
Bel | +0.016 |
Ale | +0.016 |
irled | +0.015 |
ira | +0.015 |
Neg logit contributions | |
sidelines | -0.020 |
Seek | -0.018 |
spaghetti | -0.017 |
ours | -0.017 |
anywhere | -0.016 |
Token | , |
Token ID | 11 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
bul | +0.016 |
spe | +0.015 |
flew | +0.015 |
pre | +0.014 |
pol | +0.014 |
Neg logit contributions | |
spaghetti | -0.017 |
sidelines | -0.017 |
Seek | -0.015 |
menu | -0.015 |
bed | -0.015 |
Token | they |
Token ID | 484 |
Feature activation | -7.91e-03 |
Pos logit contributions | |
flew | +0.022 |
bul | +0.021 |
spe | +0.020 |
Bel | +0.020 |
blew | +0.020 |
Neg logit contributions | |
sidelines | -0.025 |
spaghetti | -0.024 |
Seek | -0.022 |
internet | -0.021 |
menu | -0.021 |
Token | to |
Token ID | 284 |
Feature activation | -3.29e-03 |
Pos logit contributions | |
flew | +0.002 |
bul | +0.002 |
spe | +0.002 |
Sher | +0.002 |
Bel | +0.002 |
Neg logit contributions | |
sidelines | -0.003 |
spaghetti | -0.003 |
Seek | -0.003 |
ours | -0.003 |
menu | -0.002 |
Token | be |
Token ID | 307 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
bul | +0.005 |
flew | +0.005 |
spe | +0.005 |
pol | +0.005 |
Bel | +0.005 |
Neg logit contributions | |
spaghetti | -0.005 |
sidelines | -0.005 |
Seek | -0.004 |
menu | -0.004 |
bed | -0.004 |
Token | as |
Token ID | 355 |
Feature activation | -1.68e-02 |
Pos logit contributions | |
bul | +0.018 |
spe | +0.018 |
flew | +0.018 |
pre | +0.017 |
paramed | +0.017 |
Neg logit contributions | |
spaghetti | -0.014 |
sidelines | -0.013 |
Seek | -0.012 |
bed | -0.011 |
menu | -0.011 |
Token | ready |
Token ID | 3492 |
Feature activation | -1.84e-02 |
Pos logit contributions | |
bul | +0.031 |
flew | +0.030 |
spe | +0.029 |
esh | +0.029 |
pre | +0.029 |
Neg logit contributions | |
spaghetti | -0.021 |
sidelines | -0.018 |
Seek | -0.017 |
bed | -0.016 |
safe | -0.015 |
Token | as |
Token ID | 355 |
Feature activation | -3.35e-02 |
Pos logit contributions | |
flew | +0.028 |
bul | +0.027 |
spe | +0.027 |
Bel | +0.024 |
pol | +0.024 |
Neg logit contributions | |
sidelines | -0.028 |
spaghetti | -0.027 |
Seek | -0.025 |
menu | -0.023 |
robbers | -0.022 |
Token | possible |
Token ID | 1744 |
Feature activation | -9.26e-02 |
Pos logit contributions | |
flew | +0.039 |
bul | +0.038 |
spe | +0.037 |
Bel | +0.033 |
soared | +0.033 |
Neg logit contributions | |
sidelines | -0.063 |
spaghetti | -0.063 |
menu | -0.056 |
Seek | -0.056 |
internet | -0.053 |
Token | . |
Token ID | 13 |
Feature activation | -8.08e-03 |
Pos logit contributions | |
spe | +0.146 |
bul | +0.146 |
flew | +0.139 |
paramed | +0.137 |
pre | +0.134 |
Neg logit contributions | |
spaghetti | -0.135 |
sidelines | -0.128 |
Seek | -0.118 |
bed | -0.117 |
menu | -0.115 |
Token | She |
Token ID | 1375 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
bul | +0.011 |
spe | +0.011 |
flew | +0.010 |
Bel | +0.010 |
pol | +0.010 |
Neg logit contributions | |
sidelines | -0.013 |
spaghetti | -0.013 |
Seek | -0.012 |
menu | -0.012 |
ours | -0.012 |
Token | straight |
Token ID | 3892 |
Feature activation | -2.79e-02 |
Pos logit contributions | |
bul | +0.013 |
spe | +0.012 |
pre | +0.012 |
paramed | +0.012 |
pol | +0.011 |
Neg logit contributions | |
spaghetti | -0.019 |
sidelines | -0.017 |
Seek | -0.016 |
bed | -0.016 |
menu | -0.016 |
Token | ened |
Token ID | 2945 |
Feature activation | -2.99e-02 |
Pos logit contributions | |
spe | +0.042 |
pre | +0.042 |
bul | +0.041 |
rob | +0.040 |
paramed | +0.040 |
Neg logit contributions | |
spaghetti | -0.042 |
sidelines | -0.038 |
bed | -0.037 |
Seek | -0.036 |
menu | -0.034 |
Token | her |
Token ID | 607 |
Feature activation | -2.35e-03 |
Pos logit contributions | |
bul | +0.036 |
spe | +0.035 |
flew | +0.035 |
pre | +0.032 |
paramed | +0.032 |
Neg logit contributions | |
spaghetti | -0.055 |
sidelines | -0.054 |
Seek | -0.049 |
menu | -0.048 |
bed | -0.048 |
Token | send |
Token ID | 3758 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
bul | +0.012 |
spe | +0.012 |
xc | +0.012 |
esh | +0.012 |
pre | +0.011 |
Neg logit contributions | |
spaghetti | -0.008 |
sidelines | -0.008 |
menu | -0.007 |
bed | -0.007 |
Seek | -0.007 |
Token | them |
Token ID | 606 |
Feature activation | -8.18e-03 |
Pos logit contributions | |
spaghetti | +0.020 |
sidelines | +0.019 |
Seek | +0.018 |
menu | +0.017 |
bed | +0.017 |
Neg logit contributions | |
bul | -0.012 |
flew | -0.012 |
spe | -0.012 |
Bel | -0.011 |
pol | -0.011 |
Token | some |
Token ID | 617 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
bul | +0.014 |
spe | +0.014 |
flew | +0.014 |
pre | +0.013 |
paramed | +0.013 |
Neg logit contributions | |
spaghetti | -0.011 |
sidelines | -0.009 |
Seek | -0.009 |
menu | -0.009 |
bed | -0.009 |
Token | jokes |
Token ID | 14532 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
bul | +0.023 |
flew | +0.023 |
spe | +0.022 |
pre | +0.021 |
paramed | +0.021 |
Neg logit contributions | |
sidelines | -0.023 |
spaghetti | -0.022 |
Seek | -0.020 |
Want | -0.018 |
menu | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
spe | +0.025 |
bul | +0.025 |
flew | +0.024 |
pol | +0.023 |
xc | +0.023 |
Neg logit contributions | |
spaghetti | -0.023 |
sidelines | -0.021 |
menu | -0.019 |
Seek | -0.019 |
bed | -0.019 |
Token | r |
Token ID | 374 |
Feature activation | -9.25e-02 |
Pos logit contributions | |
bul | +0.026 |
flew | +0.025 |
spe | +0.025 |
pol | +0.023 |
Bel | +0.023 |
Neg logit contributions | |
spaghetti | -0.024 |
sidelines | -0.024 |
Seek | -0.021 |
menu | -0.020 |
bed | -0.020 |
Token | iddles |
Token ID | 29319 |
Feature activation | -5.04e-02 |
Pos logit contributions | |
flew | +0.155 |
spe | +0.147 |
bul | +0.142 |
rob | +0.142 |
slit | +0.141 |
Neg logit contributions | |
spaghetti | -0.128 |
sidelines | -0.109 |
Seek | -0.109 |
menu | -0.103 |
amas | -0.103 |
Token | . |
Token ID | 13 |
Feature activation | +2.90e-03 |
Pos logit contributions | |
bul | +0.083 |
flew | +0.080 |
xc | +0.079 |
pol | +0.078 |
spe | +0.077 |
Neg logit contributions | |
spaghetti | -0.068 |
sidelines | -0.063 |
menu | -0.060 |
bed | -0.057 |
Seek | -0.057 |
Token |
|
Token ID | 198 |
Feature activation | +7.30e-03 |
Pos logit contributions | |
spaghetti | +0.005 |
sidelines | +0.005 |
Seek | +0.004 |
menu | +0.004 |
bed | +0.004 |
Neg logit contributions | |
bul | -0.004 |
flew | -0.004 |
spe | -0.004 |
Bel | -0.004 |
paramed | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | +9.57e-03 |
Pos logit contributions | |
spaghetti | +0.012 |
sidelines | +0.012 |
Seek | +0.010 |
menu | +0.010 |
bed | +0.010 |
Neg logit contributions | |
flew | -0.010 |
bul | -0.010 |
spe | -0.010 |
Bel | -0.009 |
paramed | -0.009 |
Token | " |
Token ID | 1 |
Feature activation | -1.72e-02 |
Pos logit contributions | |
spaghetti | +0.018 |
sidelines | +0.018 |
Seek | +0.016 |
menu | +0.016 |
bed | +0.015 |
Neg logit contributions | |
bul | -0.012 |
flew | -0.011 |
spe | -0.011 |
pol | -0.010 |
pre | -0.010 |
Token | it |
Token ID | 340 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
spe | +0.040 |
bul | +0.040 |
paramed | +0.038 |
flew | +0.038 |
pre | +0.037 |
Neg logit contributions | |
sidelines | -0.030 |
spaghetti | -0.030 |
Seek | -0.026 |
bed | -0.025 |
mine | -0.024 |
Token | for |
Token ID | 329 |
Feature activation | +2.31e-02 |
Pos logit contributions | |
spaghetti | +0.017 |
sidelines | +0.017 |
menu | +0.015 |
Seek | +0.015 |
robbers | +0.014 |
Neg logit contributions | |
flew | -0.017 |
bul | -0.017 |
spe | -0.016 |
soared | -0.015 |
Bel | -0.015 |
Token | as |
Token ID | 355 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
sidelines | +0.037 |
spaghetti | +0.036 |
menu | +0.034 |
ours | +0.033 |
concession | +0.033 |
Neg logit contributions | |
flew | -0.033 |
Bel | -0.029 |
Sher | -0.029 |
soared | -0.028 |
bul | -0.028 |
Token | long |
Token ID | 890 |
Feature activation | -3.55e-02 |
Pos logit contributions | |
bul | +0.026 |
spe | +0.026 |
flew | +0.025 |
paramed | +0.025 |
xc | +0.024 |
Neg logit contributions | |
spaghetti | -0.021 |
sidelines | -0.020 |
Seek | -0.017 |
bed | -0.017 |
menu | -0.016 |
Token | as |
Token ID | 355 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
spe | +0.077 |
xc | +0.074 |
bul | +0.073 |
pre | +0.072 |
paramed | +0.071 |
Neg logit contributions | |
sidelines | -0.035 |
spaghetti | -0.035 |
bed | -0.030 |
before | -0.028 |
mine | -0.026 |
Token | possible |
Token ID | 1744 |
Feature activation | -9.23e-02 |
Pos logit contributions | |
bul | +0.039 |
spe | +0.039 |
flew | +0.038 |
paramed | +0.036 |
pre | +0.035 |
Neg logit contributions | |
spaghetti | -0.055 |
sidelines | -0.053 |
Seek | -0.048 |
menu | -0.047 |
bed | -0.047 |
Token | , |
Token ID | 11 |
Feature activation | -2.10e-02 |
Pos logit contributions | |
bul | +0.136 |
spe | +0.135 |
flew | +0.133 |
paramed | +0.126 |
pre | +0.123 |
Neg logit contributions | |
spaghetti | -0.142 |
sidelines | -0.138 |
Seek | -0.124 |
menu | -0.121 |
bed | -0.120 |
Token | until |
Token ID | 1566 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
flew | +0.035 |
bul | +0.035 |
spe | +0.034 |
soared | +0.032 |
Bel | +0.032 |
Neg logit contributions | |
spaghetti | -0.028 |
sidelines | -0.028 |
Seek | -0.024 |
menu | -0.024 |
bed | -0.023 |
Token | she |
Token ID | 673 |
Feature activation | -8.00e-03 |
Pos logit contributions | |
bul | +0.021 |
spe | +0.021 |
cker | +0.020 |
pre | +0.020 |
paramed | +0.020 |
Neg logit contributions | |
spaghetti | -0.019 |
sidelines | -0.018 |
bed | -0.016 |
Seek | -0.015 |
mine | -0.015 |
Token | was |
Token ID | 373 |
Feature activation | -1.96e-02 |
Pos logit contributions | |
bul | +0.012 |
paramed | +0.012 |
esh | +0.012 |
cker | +0.011 |
spe | +0.011 |
Neg logit contributions | |
spaghetti | -0.012 |
sidelines | -0.011 |
Seek | -0.010 |
bed | -0.010 |
forgetting | -0.010 |
Token | too |
Token ID | 1165 |
Feature activation | -9.21e-03 |
Pos logit contributions | |
bul | +0.034 |
flew | +0.034 |
spe | +0.033 |
paramed | +0.031 |
Bel | +0.031 |
Neg logit contributions | |
spaghetti | -0.025 |
sidelines | -0.025 |
Seek | -0.022 |
menu | -0.021 |
bed | -0.021 |
Token | was |
Token ID | 373 |
Feature activation | -9.21e-04 |
Pos logit contributions | |
bul | +0.006 |
flew | +0.006 |
spe | +0.005 |
paramed | +0.005 |
pol | +0.005 |
Neg logit contributions | |
spaghetti | -0.007 |
sidelines | -0.007 |
Seek | -0.007 |
menu | -0.006 |
bed | -0.006 |
Token | carrying |
Token ID | 6872 |
Feature activation | +2.11e-02 |
Pos logit contributions | |
flew | +0.002 |
spe | +0.002 |
bul | +0.002 |
paramed | +0.001 |
blew | +0.001 |
Neg logit contributions | |
sidelines | -0.001 |
spaghetti | -0.001 |
Seek | -0.001 |
menu | -0.001 |
internet | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +8.50e-04 |
Pos logit contributions | |
sidelines | +0.041 |
spaghetti | +0.036 |
Seek | +0.035 |
Want | +0.035 |
internet | +0.033 |
Neg logit contributions | |
flew | -0.025 |
bul | -0.023 |
spe | -0.022 |
pol | -0.021 |
soared | -0.021 |
Token | big |
Token ID | 1263 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
sidelines | +0.001 |
spaghetti | +0.001 |
Seek | +0.001 |
Want | +0.001 |
forgetting | +0.001 |
Neg logit contributions | |
bul | -0.001 |
flew | -0.001 |
spe | -0.001 |
paramed | -0.001 |
rob | -0.001 |
Token | bag |
Token ID | 6131 |
Feature activation | +2.09e-02 |
Pos logit contributions | |
flew | +0.015 |
bul | +0.015 |
spe | +0.013 |
spr | +0.013 |
paramed | +0.013 |
Neg logit contributions | |
sidelines | -0.016 |
Seek | -0.015 |
spaghetti | -0.014 |
ours | -0.013 |
forgetting | -0.013 |
Token | full |
Token ID | 1336 |
Feature activation | +4.06e-02 |
Pos logit contributions | |
sidelines | +0.039 |
spaghetti | +0.037 |
Seek | +0.034 |
robbers | +0.034 |
Want | +0.033 |
Neg logit contributions | |
flew | -0.026 |
bul | -0.024 |
spe | -0.024 |
pol | -0.021 |
esh | -0.020 |
Token | of |
Token ID | 286 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
sidelines | +0.085 |
assing | +0.076 |
Seek | +0.076 |
spaghetti | +0.073 |
Want | +0.073 |
Neg logit contributions | |
bul | -0.040 |
flew | -0.038 |
spe | -0.037 |
spr | -0.031 |
paramed | -0.031 |
Token | mail |
Token ID | 6920 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
sidelines | +0.021 |
Want | +0.018 |
Seek | +0.018 |
spine | +0.017 |
oring | +0.017 |
Neg logit contributions | |
flew | -0.022 |
paramed | -0.021 |
bul | -0.021 |
spe | -0.020 |
ostr | -0.020 |
Token | for |
Token ID | 329 |
Feature activation | +2.00e-02 |
Pos logit contributions | |
sidelines | +0.024 |
spaghetti | +0.021 |
Seek | +0.020 |
Want | +0.019 |
internet | +0.019 |
Neg logit contributions | |
bul | -0.015 |
flew | -0.015 |
spe | -0.015 |
pre | -0.013 |
master | -0.013 |
Token | everyone |
Token ID | 2506 |
Feature activation | -1.17e-03 |
Pos logit contributions | |
sidelines | +0.040 |
Want | +0.036 |
oring | +0.035 |
Seek | +0.035 |
spaghetti | +0.034 |
Neg logit contributions | |
flew | -0.020 |
spe | -0.018 |
Wil | -0.018 |
il | -0.017 |
ered | -0.017 |
Token | in |
Token ID | 287 |
Feature activation | -2.17e-02 |
Pos logit contributions | |
bul | +0.002 |
flew | +0.002 |
spe | +0.002 |
paramed | +0.002 |
Bel | +0.002 |
Neg logit contributions | |
spaghetti | -0.002 |
sidelines | -0.002 |
Seek | -0.001 |
menu | -0.001 |
bed | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -5.53e-03 |
Pos logit contributions | |
flew | +0.012 |
bul | +0.012 |
spe | +0.011 |
pol | +0.011 |
Bel | +0.010 |
Neg logit contributions | |
sidelines | -0.010 |
spaghetti | -0.010 |
Seek | -0.009 |
menu | -0.008 |
Want | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | +4.12e-04 |
Pos logit contributions | |
bul | +0.009 |
flew | +0.009 |
spe | +0.009 |
pre | +0.009 |
soared | +0.009 |
Neg logit contributions | |
spaghetti | -0.008 |
sidelines | -0.007 |
Seek | -0.006 |
bed | -0.006 |
menu | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +3.94e-03 |
Pos logit contributions | |
spaghetti | +0.000 |
sidelines | +0.000 |
Seek | +0.000 |
bed | +0.000 |
Want | +0.000 |
Neg logit contributions | |
bul | -0.001 |
flew | -0.001 |
spe | -0.001 |
pre | -0.001 |
cker | -0.001 |
Token | The |
Token ID | 464 |
Feature activation | -5.55e-03 |
Pos logit contributions | |
sidelines | +0.006 |
Seek | +0.006 |
spaghetti | +0.005 |
Want | +0.005 |
concession | +0.005 |
Neg logit contributions | |
bul | -0.006 |
pre | -0.006 |
flew | -0.006 |
cker | -0.006 |
imm | -0.006 |
Token | girl |
Token ID | 2576 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
flew | +0.008 |
bul | +0.008 |
spe | +0.008 |
paramed | +0.007 |
blew | +0.007 |
Neg logit contributions | |
spaghetti | -0.009 |
sidelines | -0.008 |
Seek | -0.008 |
menu | -0.007 |
ours | -0.007 |
Token | hugged |
Token ID | 41130 |
Feature activation | +3.91e-02 |
Pos logit contributions | |
spaghetti | +0.018 |
sidelines | +0.016 |
bed | +0.015 |
menu | +0.015 |
Seek | +0.015 |
Neg logit contributions | |
bul | -0.018 |
xc | -0.016 |
pre | -0.016 |
esh | -0.016 |
pol | -0.016 |
Token | her |
Token ID | 607 |
Feature activation | -5.35e-04 |
Pos logit contributions | |
spaghetti | +0.063 |
sidelines | +0.062 |
Seek | +0.054 |
bed | +0.054 |
menu | +0.053 |
Neg logit contributions | |
bul | -0.056 |
spe | -0.055 |
flew | -0.055 |
pre | -0.051 |
soared | -0.050 |
Token | new |
Token ID | 649 |
Feature activation | -4.94e-05 |
Pos logit contributions | |
bul | +0.001 |
flew | +0.001 |
spe | +0.001 |
paramed | +0.001 |
pre | +0.001 |
Neg logit contributions | |
sidelines | -0.001 |
spaghetti | -0.001 |
Seek | -0.001 |
menu | -0.001 |
Want | -0.001 |
Token | friend |
Token ID | 1545 |
Feature activation | -5.59e-03 |
Pos logit contributions | |
bul | +0.000 |
flew | +0.000 |
spe | +0.000 |
paramed | +0.000 |
pol | +0.000 |
Neg logit contributions | |
spaghetti | -0.000 |
sidelines | -0.000 |
Seek | -0.000 |
menu | -0.000 |
bed | -0.000 |
Token | , |
Token ID | 11 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
flew | +0.008 |
bul | +0.008 |
spe | +0.007 |
Bel | +0.007 |
pol | +0.007 |
Neg logit contributions | |
sidelines | -0.009 |
spaghetti | -0.009 |
Seek | -0.008 |
menu | -0.008 |
internet | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | -3.04e-03 |
Pos logit contributions | |
bul | +0.029 |
flew | +0.028 |
spe | +0.028 |
pol | +0.026 |
pre | +0.026 |
Neg logit contributions | |
spaghetti | -0.026 |
sidelines | -0.026 |
Seek | -0.022 |
menu | -0.022 |
bed | -0.022 |
Token | it |
Token ID | 340 |
Feature activation | +1.89e-03 |
Pos logit contributions | |
flew | +0.019 |
spe | +0.018 |
bul | +0.018 |
soared | +0.017 |
Bel | +0.017 |
Neg logit contributions | |
sidelines | -0.029 |
spaghetti | -0.028 |
Seek | -0.026 |
menu | -0.026 |
internet | -0.025 |
Token | involved |
Token ID | 2950 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
spaghetti | +0.003 |
sidelines | +0.003 |
Seek | +0.003 |
bed | +0.003 |
menu | +0.003 |
Neg logit contributions | |
bul | -0.002 |
spe | -0.002 |
paramed | -0.002 |
Ale | -0.002 |
pre | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | -5.95e-03 |
Pos logit contributions | |
flew | +0.039 |
bul | +0.038 |
spe | +0.038 |
soared | +0.035 |
pol | +0.034 |
Neg logit contributions | |
sidelines | -0.042 |
spaghetti | -0.041 |
Seek | -0.037 |
menu | -0.036 |
robbers | -0.034 |
Token | bit |
Token ID | 1643 |
Feature activation | -4.14e-03 |
Pos logit contributions | |
bul | +0.010 |
spe | +0.010 |
flew | +0.010 |
paramed | +0.009 |
Bel | +0.009 |
Neg logit contributions | |
spaghetti | -0.008 |
sidelines | -0.008 |
Seek | -0.007 |
ours | -0.007 |
menu | -0.007 |
Token | of |
Token ID | 286 |
Feature activation | -4.34e-03 |
Pos logit contributions | |
bul | +0.006 |
flew | +0.006 |
spe | +0.006 |
pol | +0.006 |
paramed | +0.006 |
Neg logit contributions | |
sidelines | -0.006 |
spaghetti | -0.006 |
Seek | -0.005 |
menu | -0.005 |
bed | -0.005 |
Token | rest |
Token ID | 1334 |
Feature activation | +4.68e-02 |
Pos logit contributions | |
flew | +0.007 |
bul | +0.007 |
spe | +0.007 |
soared | +0.007 |
paramed | +0.006 |
Neg logit contributions | |
sidelines | -0.006 |
spaghetti | -0.006 |
Seek | -0.005 |
menu | -0.005 |
robbers | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | -2.17e-02 |
Pos logit contributions | |
sidelines | +0.083 |
spaghetti | +0.080 |
Seek | +0.074 |
menu | +0.071 |
robbers | +0.069 |
Neg logit contributions | |
flew | -0.060 |
bul | -0.060 |
spe | -0.059 |
pre | -0.052 |
pol | -0.052 |
Token | being |
Token ID | 852 |
Feature activation | -2.87e-02 |
Pos logit contributions | |
flew | +0.034 |
bul | +0.032 |
spe | +0.032 |
soared | +0.030 |
blew | +0.029 |
Neg logit contributions | |
sidelines | -0.033 |
spaghetti | -0.032 |
Seek | -0.029 |
menu | -0.028 |
robbers | -0.027 |
Token | a |
Token ID | 257 |
Feature activation | -2.11e-02 |
Pos logit contributions | |
bul | +0.051 |
spe | +0.050 |
flew | +0.050 |
pre | +0.047 |
paramed | +0.047 |
Neg logit contributions | |
spaghetti | -0.036 |
sidelines | -0.034 |
Seek | -0.030 |
bed | -0.028 |
menu | -0.028 |
Token | little |
Token ID | 1310 |
Feature activation | -3.09e-02 |
Pos logit contributions | |
bul | +0.037 |
flew | +0.037 |
spe | +0.036 |
xc | +0.036 |
esh | +0.035 |
Neg logit contributions | |
spaghetti | -0.025 |
sidelines | -0.025 |
Seek | -0.022 |
bed | -0.021 |
menu | -0.021 |
Token | hurt |
Token ID | 5938 |
Feature activation | -8.34e-03 |
Pos logit contributions | |
flew | +0.049 |
spe | +0.049 |
bul | +0.048 |
esh | +0.047 |
xc | +0.047 |
Neg logit contributions | |
spaghetti | -0.043 |
sidelines | -0.042 |
bed | -0.036 |
Seek | -0.036 |
menu | -0.035 |
Token | a |
Token ID | 257 |
Feature activation | +2.67e-02 |
Pos logit contributions | |
spaghetti | +0.037 |
sidelines | +0.033 |
bed | +0.029 |
menu | +0.028 |
Seek | +0.028 |
Neg logit contributions | |
bul | -0.046 |
spe | -0.046 |
flew | -0.043 |
pol | -0.042 |
esh | -0.041 |
Token | big |
Token ID | 1263 |
Feature activation | +5.64e-03 |
Pos logit contributions | |
sidelines | +0.045 |
spaghetti | +0.044 |
Seek | +0.042 |
Want | +0.039 |
internet | +0.039 |
Neg logit contributions | |
flew | -0.036 |
bul | -0.033 |
rob | -0.033 |
spe | -0.033 |
blew | -0.032 |
Token | sack |
Token ID | 23704 |
Feature activation | +3.03e-02 |
Pos logit contributions | |
Seek | +0.010 |
sidelines | +0.010 |
spaghetti | +0.009 |
internet | +0.009 |
Want | +0.008 |
Neg logit contributions | |
flew | -0.007 |
ostr | -0.007 |
rob | -0.007 |
bul | -0.007 |
spr | -0.006 |
Token | on |
Token ID | 319 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
spaghetti | +0.047 |
sidelines | +0.047 |
Seek | +0.041 |
menu | +0.040 |
bed | +0.039 |
Neg logit contributions | |
flew | -0.045 |
bul | -0.044 |
spe | -0.043 |
pol | -0.040 |
soared | -0.040 |
Token | a |
Token ID | 257 |
Feature activation | +2.66e-02 |
Pos logit contributions | |
spaghetti | +0.031 |
sidelines | +0.030 |
bed | +0.026 |
menu | +0.026 |
Seek | +0.026 |
Neg logit contributions | |
bul | -0.030 |
spe | -0.030 |
flew | -0.029 |
pre | -0.028 |
paramed | -0.028 |
Token | bench |
Token ID | 7624 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
Seek | +0.041 |
sidelines | +0.040 |
spaghetti | +0.038 |
Want | +0.038 |
Do | +0.035 |
Neg logit contributions | |
flew | -0.037 |
ostr | -0.035 |
swoop | -0.034 |
spr | -0.033 |
rob | -0.033 |
Token | . |
Token ID | 13 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
sidelines | +0.061 |
spaghetti | +0.061 |
Seek | +0.056 |
menu | +0.052 |
bed | +0.051 |
Neg logit contributions | |
flew | -0.045 |
bul | -0.043 |
spe | -0.043 |
pol | -0.038 |
soared | -0.038 |
Token | They |
Token ID | 1119 |
Feature activation | +9.03e-03 |
Pos logit contributions | |
sidelines | +0.021 |
spaghetti | +0.021 |
Seek | +0.019 |
menu | +0.017 |
hunting | +0.017 |
Neg logit contributions | |
spe | -0.016 |
flew | -0.016 |
bul | -0.015 |
paramed | -0.014 |
Ale | -0.014 |
Token | ran |
Token ID | 4966 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
spaghetti | +0.015 |
sidelines | +0.014 |
robbers | +0.013 |
Seek | +0.013 |
menu | +0.013 |
Neg logit contributions | |
bul | -0.013 |
pre | -0.012 |
spe | -0.012 |
paramed | -0.011 |
esh | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | +7.56e-03 |
Pos logit contributions | |
spaghetti | +0.019 |
sidelines | +0.019 |
Seek | +0.017 |
menu | +0.016 |
bed | +0.016 |
Neg logit contributions | |
flew | -0.020 |
bul | -0.019 |
spe | -0.019 |
Bel | -0.018 |
pol | -0.018 |
Token | the |
Token ID | 262 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
spaghetti | +0.014 |
sidelines | +0.014 |
Seek | +0.013 |
menu | +0.012 |
internet | +0.012 |
Neg logit contributions | |
flew | -0.009 |
spe | -0.008 |
Bel | -0.008 |
soared | -0.008 |
bul | -0.008 |
Token | ily |
Token ID | 813 |
Feature activation | -2.89e-03 |
Pos logit contributions | |
spaghetti | +0.005 |
sidelines | +0.005 |
Seek | +0.004 |
menu | +0.004 |
bed | +0.004 |
Neg logit contributions | |
bul | -0.003 |
flew | -0.003 |
spe | -0.003 |
pol | -0.003 |
paramed | -0.003 |
Token | loved |
Token ID | 6151 |
Feature activation | +2.85e-02 |
Pos logit contributions | |
bul | +0.006 |
spe | +0.006 |
paramed | +0.005 |
xc | +0.005 |
pol | +0.005 |
Neg logit contributions | |
spaghetti | -0.004 |
menu | -0.003 |
bed | -0.003 |
sidelines | -0.003 |
bone | -0.003 |
Token | music |
Token ID | 2647 |
Feature activation | +5.99e-03 |
Pos logit contributions | |
spaghetti | +0.040 |
sidelines | +0.035 |
menu | +0.031 |
bed | +0.031 |
Seek | +0.030 |
Neg logit contributions | |
spe | -0.051 |
bul | -0.050 |
flew | -0.050 |
soared | -0.047 |
Bel | -0.047 |
Token | . |
Token ID | 13 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
spaghetti | +0.008 |
sidelines | +0.008 |
bed | +0.007 |
menu | +0.007 |
Seek | +0.007 |
Neg logit contributions | |
spe | -0.010 |
flew | -0.010 |
bul | -0.010 |
Bel | -0.010 |
xc | -0.010 |
Token | She |
Token ID | 1375 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
spaghetti | +0.025 |
sidelines | +0.023 |
Seek | +0.020 |
bed | +0.020 |
menu | +0.020 |
Neg logit contributions | |
flew | -0.026 |
spe | -0.026 |
bul | -0.025 |
soared | -0.024 |
pre | -0.024 |
Token | liked |
Token ID | 8288 |
Feature activation | +3.46e-02 |
Pos logit contributions | |
spaghetti | +0.014 |
bed | +0.012 |
sidelines | +0.011 |
chess | +0.011 |
Seek | +0.011 |
Neg logit contributions | |
xc | -0.021 |
paramed | -0.021 |
bul | -0.021 |
spe | -0.020 |
esh | -0.019 |
Token | to |
Token ID | 284 |
Feature activation | +2.48e-02 |
Pos logit contributions | |
spaghetti | +0.050 |
sidelines | +0.049 |
Seek | +0.043 |
menu | +0.042 |
bed | +0.041 |
Neg logit contributions | |
bul | -0.055 |
flew | -0.054 |
spe | -0.054 |
Bel | -0.050 |
pol | -0.050 |
Token | sing |
Token ID | 1702 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
spaghetti | +0.031 |
sidelines | +0.030 |
bed | +0.026 |
Seek | +0.025 |
menu | +0.025 |
Neg logit contributions | |
spe | -0.046 |
bul | -0.045 |
flew | -0.043 |
paramed | -0.042 |
pre | -0.042 |
Token | and |
Token ID | 290 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
sidelines | +0.023 |
spaghetti | +0.023 |
Seek | +0.021 |
menu | +0.020 |
bed | +0.020 |
Neg logit contributions | |
bul | -0.021 |
flew | -0.021 |
spe | -0.020 |
Bel | -0.019 |
paramed | -0.019 |
Token | dance |
Token ID | 9280 |
Feature activation | -3.50e-02 |
Pos logit contributions | |
sidelines | +0.027 |
spaghetti | +0.027 |
Seek | +0.024 |
menu | +0.024 |
ours | +0.023 |
Neg logit contributions | |
flew | -0.024 |
bul | -0.024 |
spe | -0.023 |
soared | -0.021 |
blew | -0.021 |
Token | and |
Token ID | 290 |
Feature activation | +7.67e-03 |
Pos logit contributions | |
bul | +0.052 |
spe | +0.052 |
flew | +0.051 |
paramed | +0.048 |
pol | +0.047 |
Neg logit contributions | |
spaghetti | -0.054 |
sidelines | -0.052 |
Seek | -0.047 |
menu | -0.046 |
bed | -0.046 |
Token | ran |
Token ID | 4966 |
Feature activation | +1.14e-02 |
Pos logit contributions | |
spaghetti | +0.003 |
sidelines | +0.002 |
Seek | +0.002 |
bed | +0.002 |
bone | +0.002 |
Neg logit contributions | |
spe | -0.002 |
bul | -0.002 |
esh | -0.002 |
xc | -0.002 |
paramed | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | +7.14e-03 |
Pos logit contributions | |
spaghetti | +0.018 |
sidelines | +0.018 |
Seek | +0.016 |
menu | +0.015 |
bed | +0.015 |
Neg logit contributions | |
flew | -0.016 |
bul | -0.016 |
spe | -0.015 |
Bel | -0.015 |
pol | -0.015 |
Token | the |
Token ID | 262 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
spaghetti | +0.013 |
sidelines | +0.012 |
Seek | +0.012 |
menu | +0.011 |
internet | +0.011 |
Neg logit contributions | |
flew | -0.008 |
Bel | -0.007 |
Ale | -0.007 |
Sher | -0.007 |
bul | -0.007 |
Token | bag |
Token ID | 6131 |
Feature activation | +3.63e-02 |
Pos logit contributions | |
Seek | +0.020 |
spaghetti | +0.020 |
sidelines | +0.020 |
Want | +0.019 |
ours | +0.018 |
Neg logit contributions | |
flew | -0.020 |
rob | -0.019 |
paramed | -0.019 |
spr | -0.018 |
blew | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
sidelines | +0.071 |
spaghetti | +0.070 |
Seek | +0.065 |
robbers | +0.061 |
menu | +0.061 |
Neg logit contributions | |
flew | -0.041 |
bul | -0.039 |
spe | -0.038 |
pol | -0.034 |
Or | -0.034 |
Token | the |
Token ID | 262 |
Feature activation | -8.71e-03 |
Pos logit contributions | |
spaghetti | +0.024 |
sidelines | +0.024 |
Seek | +0.022 |
menu | +0.021 |
bed | +0.021 |
Neg logit contributions | |
spe | -0.013 |
bul | -0.013 |
flew | -0.013 |
pre | -0.012 |
paramed | -0.012 |
Token | gum |
Token ID | 27142 |
Feature activation | -1.37e-02 |
Pos logit contributions | |
flew | +0.013 |
pre | +0.012 |
bul | +0.012 |
paramed | +0.012 |
rob | +0.012 |
Neg logit contributions | |
sidelines | -0.013 |
Seek | -0.013 |
spaghetti | -0.012 |
Want | -0.011 |
ours | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
bul | +0.022 |
spe | +0.021 |
flew | +0.020 |
paramed | +0.020 |
Bel | +0.020 |
Neg logit contributions | |
spaghetti | -0.020 |
sidelines | -0.019 |
bed | -0.017 |
menu | -0.017 |
Seek | -0.016 |
Token | She |
Token ID | 1375 |
Feature activation | -3.61e-03 |
Pos logit contributions | |
spaghetti | +0.023 |
sidelines | +0.023 |
Seek | +0.021 |
menu | +0.020 |
bed | +0.019 |
Neg logit contributions | |
flew | -0.018 |
bul | -0.018 |
spe | -0.018 |
Bel | -0.016 |
paramed | -0.016 |
Token | picked |
Token ID | 6497 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
spe | +0.005 |
bul | +0.005 |
esh | +0.004 |
xc | +0.004 |
paramed | +0.004 |
Neg logit contributions | |
spaghetti | -0.006 |
sidelines | -0.006 |
Seek | -0.005 |
bed | -0.005 |
bone | -0.005 |
Token | them |
Token ID | 606 |
Feature activation | +9.75e-03 |
Pos logit contributions | |
spaghetti | +0.032 |
sidelines | +0.031 |
Seek | +0.027 |
menu | +0.026 |
bed | +0.026 |
Neg logit contributions | |
bul | -0.038 |
flew | -0.038 |
spe | -0.038 |
paramed | -0.035 |
Bel | -0.035 |
Token | , |
Token ID | 11 |
Feature activation | -1.53e-03 |
Pos logit contributions | |
spaghetti | +0.009 |
sidelines | +0.009 |
Seek | +0.008 |
menu | +0.008 |
mine | +0.008 |
Neg logit contributions | |
bul | -0.013 |
spe | -0.012 |
cker | -0.012 |
flew | -0.012 |
pre | -0.012 |
Token | " |
Token ID | 366 |
Feature activation | +4.54e-03 |
Pos logit contributions | |
bul | +0.003 |
flew | +0.003 |
spe | +0.003 |
pol | +0.002 |
Bel | +0.002 |
Neg logit contributions | |
spaghetti | -0.002 |
sidelines | -0.002 |
Seek | -0.002 |
menu | -0.002 |
bed | -0.002 |
Token | Okay |
Token ID | 16454 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
Seek | +0.006 |
sidelines | +0.006 |
spaghetti | +0.006 |
Want | +0.006 |
Do | +0.005 |
Neg logit contributions | |
bul | -0.007 |
flew | -0.007 |
paramed | -0.007 |
slit | -0.007 |
spe | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | +1.14e-03 |
Pos logit contributions | |
sidelines | +0.045 |
spaghetti | +0.044 |
Seek | +0.039 |
menu | +0.038 |
internet | +0.037 |
Neg logit contributions | |
flew | -0.034 |
bul | -0.033 |
spe | -0.033 |
esh | -0.030 |
pol | -0.029 |
Token | I |
Token ID | 314 |
Feature activation | +7.37e-03 |
Pos logit contributions | |
sidelines | +0.002 |
spaghetti | +0.002 |
menu | +0.001 |
internet | +0.001 |
Seek | +0.001 |
Neg logit contributions | |
flew | -0.002 |
bul | -0.002 |
spe | -0.002 |
rob | -0.002 |
soared | -0.002 |
Token | 'll |
Token ID | 1183 |
Feature activation | +3.02e-02 |
Pos logit contributions | |
spaghetti | +0.010 |
sidelines | +0.010 |
Seek | +0.009 |
menu | +0.009 |
bed | +0.009 |
Neg logit contributions | |
bul | -0.012 |
spe | -0.011 |
flew | -0.011 |
paramed | -0.011 |
pol | -0.011 |
Token | take |
Token ID | 1011 |
Feature activation | +5.50e-03 |
Pos logit contributions | |
spaghetti | +0.040 |
sidelines | +0.040 |
Seek | +0.035 |
bed | +0.034 |
menu | +0.033 |
Neg logit contributions | |
spe | -0.051 |
bul | -0.051 |
flew | -0.049 |
paramed | -0.047 |
pre | -0.047 |
Token | the |
Token ID | 262 |
Feature activation | -3.63e-03 |
Pos logit contributions | |
sidelines | +0.007 |
spaghetti | +0.007 |
menu | +0.006 |
Seek | +0.006 |
internet | +0.005 |
Neg logit contributions | |
flew | -0.010 |
bul | -0.009 |
soared | -0.009 |
spe | -0.009 |
xc | -0.009 |
Token | test |
Token ID | 1332 |
Feature activation | -4.35e-03 |
Pos logit contributions | |
bul | +0.005 |
flew | +0.005 |
spe | +0.005 |
blew | +0.004 |
soared | +0.004 |
Neg logit contributions | |
spaghetti | -0.006 |
sidelines | -0.006 |
ours | -0.005 |
Seek | -0.005 |
menu | -0.005 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
bul | +0.007 |
spe | +0.007 |
flew | +0.007 |
soared | +0.006 |
pol | +0.006 |
Neg logit contributions | |
sidelines | -0.006 |
spaghetti | -0.006 |
Seek | -0.005 |
menu | -0.005 |
bed | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
flew | +0.022 |
bul | +0.022 |
spe | +0.022 |
pol | +0.021 |
paramed | +0.021 |
Neg logit contributions | |
spaghetti | -0.016 |
sidelines | -0.016 |
Seek | -0.014 |
bed | -0.014 |
menu | -0.013 |
Token | looked |
Token ID | 3114 |
Feature activation | +4.21e-03 |
Pos logit contributions | |
bul | +0.006 |
spe | +0.006 |
Sab | +0.005 |
Ev | +0.005 |
esh | +0.005 |
Neg logit contributions | |
spaghetti | -0.004 |
bone | -0.003 |
skeleton | -0.003 |
café | -0.003 |
robbers | -0.003 |
Token | at |
Token ID | 379 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
sidelines | +0.008 |
spaghetti | +0.008 |
Seek | +0.008 |
internet | +0.007 |
menu | +0.007 |
Neg logit contributions | |
flew | -0.005 |
bul | -0.004 |
spe | -0.004 |
blew | -0.004 |
Bel | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
spe | +0.044 |
bul | +0.043 |
paramed | +0.041 |
pre | +0.040 |
flew | +0.039 |
Neg logit contributions | |
spaghetti | -0.033 |
sidelines | -0.032 |
ours | -0.028 |
bed | -0.028 |
mine | -0.028 |
Token | spike |
Token ID | 20240 |
Feature activation | +5.14e-05 |
Pos logit contributions | |
spaghetti | +0.026 |
sidelines | +0.026 |
Seek | +0.024 |
menu | +0.023 |
bed | +0.022 |
Neg logit contributions | |
flew | -0.016 |
bul | -0.015 |
spe | -0.014 |
pol | -0.014 |
soared | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | +5.51e-03 |
Pos logit contributions | |
sidelines | +0.000 |
spaghetti | +0.000 |
Seek | +0.000 |
menu | +0.000 |
Want | +0.000 |
Neg logit contributions | |
flew | -0.000 |
bul | -0.000 |
spe | -0.000 |
pol | -0.000 |
pre | -0.000 |
Token | said |
Token ID | 531 |
Feature activation | +3.98e-03 |
Pos logit contributions | |
spaghetti | +0.010 |
sidelines | +0.010 |
Seek | +0.009 |
menu | +0.009 |
bed | +0.009 |
Neg logit contributions | |
bul | -0.007 |
spe | -0.007 |
paramed | -0.006 |
flew | -0.006 |
pre | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +3.24e-04 |
Pos logit contributions | |
spaghetti | +0.005 |
sidelines | +0.004 |
mine | +0.004 |
bed | +0.004 |
Seek | +0.004 |
Neg logit contributions | |
bul | -0.007 |
spe | -0.007 |
cker | -0.007 |
Bel | -0.007 |
Sher | -0.007 |
Token | " |
Token ID | 366 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
spaghetti | +0.000 |
sidelines | +0.000 |
Seek | +0.000 |
menu | +0.000 |
bed | +0.000 |
Neg logit contributions | |
flew | -0.001 |
bul | -0.001 |
spe | -0.001 |
paramed | -0.000 |
pre | -0.000 |
Token | You |
Token ID | 1639 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
sidelines | +0.016 |
spaghetti | +0.015 |
Seek | +0.013 |
Want | +0.013 |
robbers | +0.012 |
Neg logit contributions | |
bul | -0.018 |
spe | -0.017 |
flew | -0.016 |
irled | -0.016 |
xc | -0.015 |
Token | 're |
Token ID | 821 |
Feature activation | +3.41e-02 |
Pos logit contributions | |
flew | +0.023 |
bul | +0.022 |
spe | +0.022 |
soared | +0.021 |
pol | +0.020 |
Neg logit contributions | |
sidelines | -0.018 |
spaghetti | -0.018 |
Seek | -0.015 |
menu | -0.015 |
bed | -0.014 |
Token | right |
Token ID | 826 |
Feature activation | -9.62e-03 |
Pos logit contributions | |
sidelines | +0.065 |
café | +0.058 |
spaghetti | +0.058 |
menu | +0.057 |
concession | +0.056 |
Neg logit contributions | |
flew | -0.041 |
rob | -0.036 |
exc | -0.034 |
pol | -0.033 |
known | -0.033 |
Token | Let |
Token ID | 5756 |
Feature activation | +7.74e-03 |
Pos logit contributions | |
sidelines | +0.015 |
spaghetti | +0.014 |
Seek | +0.014 |
Want | +0.013 |
robbers | +0.012 |
Neg logit contributions | |
bul | -0.016 |
flew | -0.016 |
spe | -0.015 |
irled | -0.015 |
slit | -0.015 |
Token | 's |
Token ID | 338 |
Feature activation | -2.86e-03 |
Pos logit contributions | |
spaghetti | +0.009 |
sidelines | +0.008 |
Seek | +0.007 |
bed | +0.007 |
mine | +0.007 |
Neg logit contributions | |
bul | -0.015 |
spe | -0.015 |
pre | -0.014 |
flew | -0.014 |
Or | -0.014 |
Token | go |
Token ID | 467 |
Feature activation | -1.38e-02 |
Pos logit contributions | |
bul | +0.004 |
flew | +0.004 |
spe | +0.004 |
pre | +0.004 |
Bel | +0.004 |
Neg logit contributions | |
spaghetti | -0.004 |
sidelines | -0.004 |
Seek | -0.004 |
menu | -0.004 |
bed | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | +1.70e-02 |
Pos logit contributions | |
flew | +0.019 |
bul | +0.018 |
esh | +0.017 |
Sher | +0.017 |
Ale | +0.016 |
Neg logit contributions | |
spaghetti | -0.023 |
sidelines | -0.022 |
internet | -0.019 |
menu | -0.019 |
Seek | -0.019 |
Token | get |
Token ID | 651 |
Feature activation | -8.53e-03 |
Pos logit contributions | |
spaghetti | +0.027 |
sidelines | +0.026 |
menu | +0.024 |
internet | +0.023 |
Seek | +0.022 |
Neg logit contributions | |
flew | -0.025 |
bul | -0.023 |
spe | -0.023 |
blew | -0.022 |
soared | -0.022 |
Token | ice |
Token ID | 4771 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
flew | +0.013 |
bul | +0.013 |
spe | +0.012 |
soared | +0.011 |
blew | +0.011 |
Neg logit contributions | |
sidelines | -0.013 |
spaghetti | -0.012 |
menu | -0.011 |
Seek | -0.011 |
internet | -0.011 |
Token | cream |
Token ID | 8566 |
Feature activation | -4.65e-03 |
Pos logit contributions | |
bul | +0.016 |
flew | +0.016 |
spe | +0.016 |
Bel | +0.015 |
paramed | +0.015 |
Neg logit contributions | |
spaghetti | -0.017 |
sidelines | -0.016 |
Seek | -0.015 |
menu | -0.014 |
bed | -0.014 |
Token | , |
Token ID | 11 |
Feature activation | -2.14e-05 |
Pos logit contributions | |
bul | +0.007 |
flew | +0.007 |
spe | +0.007 |
blew | +0.007 |
pre | +0.007 |
Neg logit contributions | |
sidelines | -0.007 |
spaghetti | -0.006 |
Seek | -0.006 |
internet | -0.005 |
robbers | -0.005 |
Token | sweet |
Token ID | 6029 |
Feature activation | +1.51e-02 |
Pos logit contributions | |
flew | +0.000 |
bul | +0.000 |
spe | +0.000 |
paramed | +0.000 |
Bel | +0.000 |
Neg logit contributions | |
sidelines | -0.000 |
spaghetti | -0.000 |
Seek | -0.000 |
menu | -0.000 |
hunting | -0.000 |
Token | ie |
Token ID | 494 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
sidelines | +0.026 |
spaghetti | +0.026 |
Seek | +0.023 |
menu | +0.022 |
bed | +0.022 |
Neg logit contributions | |
flew | -0.020 |
bul | -0.020 |
spe | -0.019 |
paramed | -0.018 |
Bel | -0.017 |
Token | ." |
Token ID | 526 |
Feature activation | -8.89e-03 |
Pos logit contributions | |
spaghetti | +0.021 |
sidelines | +0.020 |
Seek | +0.017 |
menu | +0.017 |
bed | +0.017 |
Neg logit contributions | |
bul | -0.035 |
flew | -0.034 |
spe | -0.034 |
Bel | -0.033 |
pol | -0.033 |
Token | forest |
Token ID | 8222 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
sidelines | +0.022 |
spaghetti | +0.021 |
ours | +0.021 |
Seek | +0.020 |
menu | +0.020 |
Neg logit contributions | |
flew | -0.025 |
Bel | -0.023 |
soared | -0.022 |
bul | -0.022 |
spr | -0.021 |
Token | when |
Token ID | 618 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
sidelines | +0.024 |
spaghetti | +0.023 |
Seek | +0.022 |
ours | +0.021 |
menu | +0.021 |
Neg logit contributions | |
flew | -0.016 |
spe | -0.014 |
Bel | -0.014 |
soared | -0.014 |
cker | -0.013 |
Token | he |
Token ID | 339 |
Feature activation | -7.62e-03 |
Pos logit contributions | |
flew | +0.021 |
bul | +0.020 |
spe | +0.019 |
soared | +0.018 |
Bel | +0.018 |
Neg logit contributions | |
spaghetti | -0.024 |
sidelines | -0.024 |
Seek | -0.021 |
menu | -0.021 |
ours | -0.020 |
Token | saw |
Token ID | 2497 |
Feature activation | +7.71e-03 |
Pos logit contributions | |
flew | +0.010 |
bul | +0.009 |
spe | +0.008 |
soared | +0.008 |
Bel | +0.008 |
Neg logit contributions | |
sidelines | -0.014 |
spaghetti | -0.014 |
Seek | -0.013 |
menu | -0.012 |
ours | -0.012 |
Token | a |
Token ID | 257 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
spaghetti | +0.012 |
sidelines | +0.011 |
Seek | +0.010 |
bed | +0.010 |
menu | +0.010 |
Neg logit contributions | |
spe | -0.012 |
bul | -0.012 |
flew | -0.012 |
pre | -0.011 |
pol | -0.011 |
Token | little |
Token ID | 1310 |
Feature activation | +8.14e-03 |
Pos logit contributions | |
sidelines | +0.022 |
spaghetti | +0.021 |
Seek | +0.020 |
ours | +0.019 |
internet | +0.018 |
Neg logit contributions | |
flew | -0.016 |
rob | -0.015 |
bul | -0.015 |
swoop | -0.014 |
spr | -0.014 |
Token | bird |
Token ID | 6512 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
sidelines | +0.017 |
spaghetti | +0.016 |
Seek | +0.016 |
internet | +0.015 |
ours | +0.015 |
Neg logit contributions | |
bul | -0.008 |
flew | -0.008 |
rob | -0.008 |
spr | -0.007 |
ostr | -0.007 |
Token | sh |
Token ID | 427 |
Feature activation | -2.46e-02 |
Pos logit contributions | |
spe | +0.016 |
bul | +0.016 |
paramed | +0.015 |
Or | +0.015 |
xc | +0.015 |
Neg logit contributions | |
spaghetti | -0.015 |
sidelines | -0.014 |
bed | -0.013 |
hunting | -0.012 |
Seek | -0.012 |
Token | ivering |
Token ID | 35598 |
Feature activation | +2.42e-02 |
Pos logit contributions | |
spe | +0.052 |
bul | +0.052 |
flew | +0.051 |
Or | +0.049 |
soared | +0.048 |
Neg logit contributions | |
sidelines | -0.022 |
spaghetti | -0.021 |
Seek | -0.017 |
bed | -0.015 |
menu | -0.015 |
Token | in |
Token ID | 287 |
Feature activation | -8.94e-03 |
Pos logit contributions | |
sidelines | +0.042 |
spaghetti | +0.041 |
Seek | +0.037 |
menu | +0.036 |
bed | +0.035 |
Neg logit contributions | |
flew | -0.032 |
bul | -0.032 |
spe | -0.031 |
pol | -0.028 |
pre | -0.028 |
Token | the |
Token ID | 262 |
Feature activation | +4.70e-03 |
Pos logit contributions | |
flew | +0.011 |
bul | +0.011 |
spe | +0.010 |
soared | +0.010 |
Bel | +0.010 |
Neg logit contributions | |
sidelines | -0.016 |
spaghetti | -0.015 |
Seek | -0.015 |
menu | -0.014 |
internet | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -7.98e-03 |
Pos logit contributions | |
spaghetti | +0.038 |
sidelines | +0.037 |
Seek | +0.033 |
bed | +0.032 |
menu | +0.031 |
Neg logit contributions | |
bul | -0.043 |
flew | -0.042 |
spe | -0.042 |
soared | -0.039 |
paramed | -0.038 |
Token |
|
Token ID | 198 |
Feature activation | -5.25e-03 |
Pos logit contributions | |
bul | +0.011 |
flew | +0.011 |
spe | +0.011 |
Bel | +0.010 |
pol | +0.010 |
Neg logit contributions | |
spaghetti | -0.013 |
sidelines | -0.013 |
Seek | -0.011 |
menu | -0.011 |
bed | -0.011 |
Token | Then |
Token ID | 6423 |
Feature activation | -2.09e-02 |
Pos logit contributions | |
bul | +0.007 |
flew | +0.007 |
spe | +0.006 |
pre | +0.006 |
soared | +0.006 |
Neg logit contributions | |
sidelines | -0.009 |
spaghetti | -0.009 |
Seek | -0.008 |
menu | -0.008 |
bed | -0.008 |
Token | Sarah |
Token ID | 10490 |
Feature activation | +9.19e-04 |
Pos logit contributions | |
bul | +0.032 |
spe | +0.031 |
flew | +0.031 |
pre | +0.030 |
hon | +0.029 |
Neg logit contributions | |
spaghetti | -0.032 |
sidelines | -0.030 |
Seek | -0.028 |
bed | -0.027 |
menu | -0.026 |
Token | and |
Token ID | 290 |
Feature activation | -5.34e-03 |
Pos logit contributions | |
spaghetti | +0.001 |
sidelines | +0.001 |
bed | +0.001 |
menu | +0.001 |
Seek | +0.001 |
Neg logit contributions | |
bul | -0.001 |
pre | -0.001 |
spe | -0.001 |
pol | -0.001 |
esh | -0.001 |
Token | her |
Token ID | 607 |
Feature activation | -3.12e-02 |
Pos logit contributions | |
bul | +0.007 |
pre | +0.007 |
hon | +0.007 |
flew | +0.007 |
cker | +0.007 |
Neg logit contributions | |
spaghetti | -0.009 |
sidelines | -0.009 |
bed | -0.008 |
Seek | -0.008 |
mine | -0.008 |
Token | mom |
Token ID | 1995 |
Feature activation | -3.92e-02 |
Pos logit contributions | |
bul | +0.038 |
flew | +0.038 |
spe | +0.037 |
paramed | +0.034 |
pre | +0.033 |
Neg logit contributions | |
spaghetti | -0.056 |
sidelines | -0.056 |
Seek | -0.051 |
menu | -0.049 |
bed | -0.048 |
Token | went |
Token ID | 1816 |
Feature activation | -2.93e-02 |
Pos logit contributions | |
bul | +0.043 |
spe | +0.042 |
pre | +0.041 |
pol | +0.040 |
Bel | +0.040 |
Neg logit contributions | |
spaghetti | -0.075 |
sidelines | -0.070 |
Seek | -0.066 |
bed | -0.065 |
menu | -0.063 |
Token | outside |
Token ID | 2354 |
Feature activation | -3.53e-03 |
Pos logit contributions | |
flew | +0.041 |
bul | +0.039 |
paramed | +0.038 |
spe | +0.037 |
Sher | +0.036 |
Neg logit contributions | |
spaghetti | -0.046 |
sidelines | -0.045 |
Seek | -0.041 |
ours | -0.040 |
internet | -0.039 |
Token | to |
Token ID | 284 |
Feature activation | -7.12e-03 |
Pos logit contributions | |
bul | +0.005 |
flew | +0.005 |
spe | +0.005 |
Bel | +0.005 |
pol | +0.005 |
Neg logit contributions | |
spaghetti | -0.005 |
sidelines | -0.005 |
Seek | -0.005 |
menu | -0.004 |
bed | -0.004 |
Token | enjoy |
Token ID | 2883 |
Feature activation | +1.68e-02 |
Pos logit contributions | |
flew | +0.011 |
bul | +0.011 |
blew | +0.010 |
spe | +0.010 |
paramed | +0.010 |
Neg logit contributions | |
sidelines | -0.010 |
spaghetti | -0.010 |
Seek | -0.009 |
menu | -0.009 |
internet | -0.009 |
Token | he |
Token ID | 339 |
Feature activation | +9.42e-03 |
Pos logit contributions | |
spaghetti | +0.011 |
bed | +0.009 |
sidelines | +0.009 |
Seek | +0.008 |
safe | +0.008 |
Neg logit contributions | |
bul | -0.017 |
spe | -0.017 |
pre | -0.017 |
Bel | -0.017 |
xc | -0.017 |
Token | gave |
Token ID | 2921 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
spaghetti | +0.015 |
robbers | +0.013 |
safe | +0.013 |
Seek | +0.012 |
bed | +0.012 |
Neg logit contributions | |
spe | -0.015 |
pre | -0.014 |
bul | -0.014 |
mill | -0.013 |
imm | -0.012 |
Token | her |
Token ID | 607 |
Feature activation | -5.70e-03 |
Pos logit contributions | |
spaghetti | +0.020 |
sidelines | +0.020 |
Seek | +0.018 |
bed | +0.017 |
menu | +0.017 |
Neg logit contributions | |
spe | -0.015 |
bul | -0.015 |
flew | -0.014 |
pre | -0.013 |
paramed | -0.013 |
Token | his |
Token ID | 465 |
Feature activation | -2.44e-03 |
Pos logit contributions | |
spe | +0.009 |
flew | +0.009 |
bul | +0.009 |
pre | +0.008 |
hon | +0.008 |
Neg logit contributions | |
spaghetti | -0.009 |
sidelines | -0.008 |
bed | -0.007 |
Seek | -0.007 |
menu | -0.007 |
Token | favorite |
Token ID | 4004 |
Feature activation | +1.49e-02 |
Pos logit contributions | |
bul | +0.003 |
flew | +0.003 |
spe | +0.003 |
pol | +0.003 |
paramed | +0.003 |
Neg logit contributions | |
sidelines | -0.004 |
spaghetti | -0.004 |
Seek | -0.004 |
menu | -0.003 |
Want | -0.003 |
Token | toy |
Token ID | 13373 |
Feature activation | -2.14e-02 |
Pos logit contributions | |
sidelines | +0.028 |
Seek | +0.025 |
spaghetti | +0.025 |
ours | +0.023 |
assing | +0.022 |
Neg logit contributions | |
bul | -0.020 |
flew | -0.018 |
pol | -0.016 |
spe | -0.016 |
esh | -0.015 |
Token | car |
Token ID | 1097 |
Feature activation | -1.74e-02 |
Pos logit contributions | |
spe | +0.037 |
flew | +0.036 |
bul | +0.035 |
Bel | +0.034 |
soared | +0.034 |
Neg logit contributions | |
spaghetti | -0.029 |
sidelines | -0.027 |
bed | -0.024 |
Seek | -0.023 |
menu | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | -3.37e-03 |
Pos logit contributions | |
bul | +0.027 |
flew | +0.027 |
spe | +0.027 |
Bel | +0.025 |
soared | +0.025 |
Neg logit contributions | |
spaghetti | -0.026 |
sidelines | -0.025 |
Seek | -0.022 |
menu | -0.022 |
bed | -0.022 |
Token | The |
Token ID | 383 |
Feature activation | -1.85e-03 |
Pos logit contributions | |
flew | +0.006 |
bul | +0.006 |
spe | +0.006 |
soared | +0.006 |
cker | +0.006 |
Neg logit contributions | |
spaghetti | -0.004 |
sidelines | -0.004 |
Seek | -0.004 |
bed | -0.004 |
menu | -0.003 |
Token | little |
Token ID | 1310 |
Feature activation | +8.79e-03 |
Pos logit contributions | |
bul | +0.003 |
flew | +0.003 |
spe | +0.003 |
paramed | +0.002 |
pol | +0.002 |
Neg logit contributions | |
spaghetti | -0.003 |
sidelines | -0.003 |
Seek | -0.003 |
menu | -0.003 |
bed | -0.002 |
Token | girl |
Token ID | 2576 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
spaghetti | +0.012 |
sidelines | +0.010 |
bed | +0.010 |
Seek | +0.009 |
bone | +0.009 |
Neg logit contributions | |
spe | -0.015 |
bul | -0.014 |
hon | -0.014 |
Ale | -0.014 |
pre | -0.014 |
Token | the |
Token ID | 262 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
spaghetti | +0.007 |
sidelines | +0.006 |
Seek | +0.006 |
menu | +0.006 |
bed | +0.005 |
Neg logit contributions | |
bul | -0.006 |
flew | -0.006 |
spe | -0.006 |
paramed | -0.005 |
pol | -0.005 |
Token | magical |
Token ID | 10883 |
Feature activation | -1.99e-02 |
Pos logit contributions | |
bul | +0.017 |
spe | +0.017 |
flew | +0.016 |
pol | +0.016 |
esh | +0.015 |
Neg logit contributions | |
sidelines | -0.018 |
spaghetti | -0.018 |
Seek | -0.015 |
menu | -0.015 |
bed | -0.015 |
Token | voice |
Token ID | 3809 |
Feature activation | -3.91e-02 |
Pos logit contributions | |
xc | +0.032 |
bul | +0.031 |
pol | +0.031 |
hon | +0.031 |
Ale | +0.030 |
Neg logit contributions | |
sidelines | -0.026 |
spaghetti | -0.024 |
menu | -0.023 |
mine | -0.023 |
bed | -0.022 |
Token | was |
Token ID | 373 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
xc | +0.054 |
paramed | +0.052 |
Ale | +0.051 |
esh | +0.051 |
pre | +0.051 |
Neg logit contributions | |
spaghetti | -0.052 |
sidelines | -0.052 |
safe | -0.051 |
Seek | -0.049 |
mine | -0.048 |
Token | so |
Token ID | 523 |
Feature activation | +1.94e-03 |
Pos logit contributions | |
pre | +0.028 |
bul | +0.027 |
xc | +0.027 |
spe | +0.026 |
hon | +0.026 |
Neg logit contributions | |
spaghetti | -0.022 |
sidelines | -0.020 |
safe | -0.019 |
mine | -0.018 |
bed | -0.018 |
Token | impressed |
Token ID | 12617 |
Feature activation | -3.28e-02 |
Pos logit contributions | |
spaghetti | +0.002 |
sidelines | +0.002 |
Seek | +0.002 |
safe | +0.002 |
menu | +0.002 |
Neg logit contributions | |
bul | -0.004 |
xc | -0.004 |
flew | -0.004 |
pre | -0.004 |
paramed | -0.004 |
Token | that |
Token ID | 326 |
Feature activation | -1.48e-03 |
Pos logit contributions | |
bul | +0.060 |
paramed | +0.060 |
spe | +0.058 |
flew | +0.057 |
soared | +0.055 |
Neg logit contributions | |
spaghetti | -0.039 |
sidelines | -0.034 |
Seek | -0.032 |
mine | -0.031 |
menu | -0.030 |
Token | it |
Token ID | 340 |
Feature activation | +6.85e-03 |
Pos logit contributions | |
bul | +0.002 |
flew | +0.002 |
spe | +0.002 |
paramed | +0.002 |
pre | +0.002 |
Neg logit contributions | |
spaghetti | -0.002 |
sidelines | -0.002 |
Seek | -0.002 |
menu | -0.002 |
bed | -0.002 |
Token | granted |
Token ID | 7520 |
Feature activation | -7.64e-03 |
Pos logit contributions | |
spaghetti | +0.009 |
sidelines | +0.009 |
Seek | +0.009 |
mine | +0.008 |
safe | +0.008 |
Neg logit contributions | |
paramed | -0.011 |
xc | -0.010 |
bul | -0.010 |
pre | -0.010 |
Ale | -0.010 |
Token | the |
Token ID | 262 |
Feature activation | -1.35e-02 |
Pos logit contributions | |
flew | +0.010 |
bul | +0.010 |
spe | +0.010 |
Bel | +0.009 |
soared | +0.009 |
Neg logit contributions | |
sidelines | -0.013 |
spaghetti | -0.012 |
Seek | -0.011 |
menu | -0.011 |
bed | -0.011 |
Token | bird |
Token ID | 6512 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
bul | +0.022 |
flew | +0.022 |
spe | +0.021 |
Bel | +0.020 |
paramed | +0.020 |
Neg logit contributions | |
spaghetti | -0.019 |
sidelines | -0.019 |
Seek | -0.016 |
menu | -0.016 |
bed | -0.015 |
Token | up |
Token ID | 510 |
Feature activation | -5.42e-03 |
Pos logit contributions | |
flew | +0.008 |
bul | +0.007 |
esh | +0.007 |
Bel | +0.007 |
ck | +0.007 |
Neg logit contributions | |
sidelines | -0.013 |
Seek | -0.012 |
spaghetti | -0.011 |
jar | -0.011 |
robbers | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
flew | +0.008 |
bul | +0.008 |
spe | +0.007 |
Bel | +0.007 |
blew | +0.007 |
Neg logit contributions | |
sidelines | -0.009 |
spaghetti | -0.008 |
Seek | -0.008 |
ours | -0.007 |
Want | -0.007 |
Token | grab |
Token ID | 5552 |
Feature activation | -1.49e-02 |
Pos logit contributions | |
sidelines | +0.025 |
spaghetti | +0.025 |
Seek | +0.023 |
menu | +0.022 |
ours | +0.021 |
Neg logit contributions | |
flew | -0.024 |
bul | -0.023 |
soared | -0.022 |
spe | -0.022 |
blew | -0.021 |
Token | his |
Token ID | 465 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
flew | +0.018 |
bul | +0.017 |
soared | +0.016 |
Bel | +0.016 |
spe | +0.016 |
Neg logit contributions | |
sidelines | -0.028 |
spaghetti | -0.025 |
Seek | -0.024 |
internet | -0.023 |
Want | -0.023 |
Token | special |
Token ID | 2041 |
Feature activation | -2.05e-02 |
Pos logit contributions | |
flew | +0.017 |
bul | +0.017 |
spe | +0.015 |
pre | +0.015 |
soared | +0.015 |
Neg logit contributions | |
sidelines | -0.018 |
spaghetti | -0.016 |
Seek | -0.016 |
Want | -0.014 |
internet | -0.014 |
Token | drum |
Token ID | 13026 |
Feature activation | -3.30e-02 |
Pos logit contributions | |
bul | +0.032 |
flew | +0.031 |
spe | +0.028 |
pol | +0.028 |
pre | +0.028 |
Neg logit contributions | |
sidelines | -0.031 |
Seek | -0.028 |
spaghetti | -0.028 |
ours | -0.026 |
forgetting | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | +2.64e-03 |
Pos logit contributions | |
spe | +0.050 |
bul | +0.049 |
flew | +0.049 |
Bel | +0.046 |
pol | +0.046 |
Neg logit contributions | |
spaghetti | -0.051 |
sidelines | -0.048 |
Seek | -0.044 |
bed | -0.043 |
menu | -0.042 |
Token | He |
Token ID | 679 |
Feature activation | -6.96e-04 |
Pos logit contributions | |
sidelines | +0.005 |
spaghetti | +0.004 |
Seek | +0.004 |
menu | +0.004 |
ours | +0.004 |
Neg logit contributions | |
bul | -0.003 |
flew | -0.003 |
spe | -0.003 |
Bel | -0.003 |
Ale | -0.003 |
Token | would |
Token ID | 561 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
paramed | +0.001 |
bul | +0.001 |
spe | +0.001 |
pre | +0.001 |
xc | +0.001 |
Neg logit contributions | |
spaghetti | -0.001 |
bed | -0.001 |
safe | -0.001 |
bone | -0.001 |
bones | -0.001 |
Token | th |
Token ID | 294 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
sidelines | +0.034 |
spaghetti | +0.034 |
bed | +0.030 |
mine | +0.028 |
menu | +0.027 |
Neg logit contributions | |
spe | -0.042 |
bul | -0.040 |
pre | -0.039 |
pol | -0.038 |
xc | -0.038 |
Token | ump |
Token ID | 931 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
spaghetti | +0.041 |
sidelines | +0.040 |
Seek | +0.036 |
bed | +0.035 |
menu | +0.034 |
Neg logit contributions | |
spe | -0.034 |
bul | -0.034 |
flew | -0.033 |
paramed | -0.030 |
pre | -0.030 |
Token | , |
Token ID | 11 |
Feature activation | +6.99e-03 |
Pos logit contributions | |
sidelines | +0.017 |
spaghetti | +0.017 |
Seek | +0.016 |
menu | +0.015 |
bed | +0.015 |
Neg logit contributions | |
flew | -0.014 |
bul | -0.014 |
spe | -0.014 |
soared | -0.013 |
Bel | -0.012 |
Token | but |
Token ID | 475 |
Feature activation | +1.94e-02 |
Pos logit contributions | |
sidelines | +0.010 |
spaghetti | +0.009 |
Seek | +0.009 |
menu | +0.008 |
locker | +0.008 |
Neg logit contributions | |
flew | -0.012 |
spe | -0.010 |
bul | -0.010 |
soared | -0.010 |
Or | -0.010 |
Token | sometimes |
Token ID | 3360 |
Feature activation | -2.96e-02 |
Pos logit contributions | |
sidelines | +0.041 |
spaghetti | +0.038 |
Seek | +0.035 |
menu | +0.035 |
internet | +0.034 |
Neg logit contributions | |
flew | -0.022 |
spe | -0.019 |
soared | -0.018 |
blew | -0.017 |
bul | -0.017 |
Token | they |
Token ID | 484 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
flew | +0.035 |
bul | +0.034 |
spe | +0.034 |
soared | +0.030 |
pol | +0.030 |
Neg logit contributions | |
sidelines | -0.055 |
spaghetti | -0.054 |
Seek | -0.049 |
menu | -0.048 |
bed | -0.047 |
Token | would |
Token ID | 561 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
spaghetti | +0.017 |
sidelines | +0.016 |
Seek | +0.015 |
mine | +0.015 |
robbers | +0.015 |
Neg logit contributions | |
bul | -0.015 |
esh | -0.014 |
spe | -0.014 |
paramed | -0.014 |
xc | -0.014 |
Token | fight |
Token ID | 1907 |
Feature activation | -2.11e-02 |
Pos logit contributions | |
spaghetti | +0.015 |
sidelines | +0.015 |
Seek | +0.013 |
menu | +0.013 |
bed | +0.013 |
Neg logit contributions | |
bul | -0.015 |
flew | -0.015 |
spe | -0.015 |
Bel | -0.014 |
pol | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | +8.67e-04 |
Pos logit contributions | |
flew | +0.028 |
bul | +0.027 |
spe | +0.026 |
pol | +0.024 |
soared | +0.024 |
Neg logit contributions | |
sidelines | -0.038 |
spaghetti | -0.036 |
menu | -0.032 |
Seek | -0.032 |
bed | -0.031 |
Token |
|
Token ID | 198 |
Feature activation | +8.10e-03 |
Pos logit contributions | |
sidelines | +0.002 |
spaghetti | +0.002 |
Seek | +0.001 |
menu | +0.001 |
bed | +0.001 |
Neg logit contributions | |
flew | -0.001 |
spe | -0.001 |
bul | -0.001 |
hon | -0.001 |
Bel | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
spaghetti | +0.013 |
sidelines | +0.013 |
Seek | +0.011 |
menu | +0.011 |
bed | +0.011 |
Neg logit contributions | |
bul | -0.011 |
flew | -0.011 |
spe | -0.011 |
Bel | -0.010 |
pol | -0.010 |
Token | One |
Token ID | 3198 |
Feature activation | +6.72e-03 |
Pos logit contributions | |
spaghetti | +0.017 |
sidelines | +0.017 |
Seek | +0.015 |
menu | +0.015 |
bed | +0.015 |
Neg logit contributions | |
bul | -0.015 |
spe | -0.014 |
flew | -0.014 |
pre | -0.013 |
paramed | -0.013 |
Token | day |
Token ID | 1110 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
sidelines | +0.012 |
spaghetti | +0.011 |
Seek | +0.011 |
internet | +0.010 |
menu | +0.010 |
Neg logit contributions | |
flew | -0.009 |
bul | -0.008 |
spe | -0.008 |
cker | -0.008 |
ira | -0.008 |
Token | , |
Token ID | 11 |
Feature activation | -3.15e-02 |
Pos logit contributions | |
bul | +0.128 |
spe | +0.123 |
flew | +0.122 |
paramed | +0.118 |
pol | +0.117 |
Neg logit contributions | |
spaghetti | -0.127 |
sidelines | -0.123 |
Seek | -0.108 |
menu | -0.108 |
bed | -0.108 |
Token | swinging |
Token ID | 25635 |
Feature activation | -4.35e-02 |
Pos logit contributions | |
bul | +0.054 |
flew | +0.052 |
spe | +0.052 |
pol | +0.049 |
pre | +0.049 |
Neg logit contributions | |
spaghetti | -0.042 |
sidelines | -0.041 |
Seek | -0.036 |
menu | -0.035 |
bed | -0.035 |
Token | and |
Token ID | 290 |
Feature activation | +8.44e-03 |
Pos logit contributions | |
bul | +0.075 |
spe | +0.073 |
paramed | +0.071 |
pre | +0.069 |
pol | +0.069 |
Neg logit contributions | |
spaghetti | -0.056 |
sidelines | -0.054 |
mine | -0.048 |
Seek | -0.047 |
bed | -0.046 |
Token | laughing |
Token ID | 14376 |
Feature activation | -2.78e-02 |
Pos logit contributions | |
spaghetti | +0.013 |
sidelines | +0.013 |
menu | +0.011 |
Seek | +0.011 |
bed | +0.011 |
Neg logit contributions | |
flew | -0.013 |
bul | -0.012 |
spe | -0.012 |
soared | -0.012 |
Bel | -0.011 |
Token | as |
Token ID | 355 |
Feature activation | -3.09e-02 |
Pos logit contributions | |
bul | +0.044 |
spe | +0.043 |
flew | +0.042 |
paramed | +0.041 |
pol | +0.040 |
Neg logit contributions | |
spaghetti | -0.041 |
sidelines | -0.039 |
Seek | -0.035 |
menu | -0.034 |
bed | -0.034 |
Token | high |
Token ID | 1029 |
Feature activation | -7.24e-02 |
Pos logit contributions | |
bul | +0.051 |
spe | +0.048 |
flew | +0.048 |
paramed | +0.047 |
pol | +0.046 |
Neg logit contributions | |
spaghetti | -0.043 |
sidelines | -0.042 |
Seek | -0.037 |
bed | -0.035 |
menu | -0.035 |
Token | as |
Token ID | 355 |
Feature activation | -3.32e-02 |
Pos logit contributions | |
spe | +0.147 |
bul | +0.142 |
paramed | +0.141 |
Bel | +0.138 |
Sab | +0.135 |
Neg logit contributions | |
spaghetti | -0.076 |
sidelines | -0.076 |
mine | -0.066 |
menu | -0.060 |
bed | -0.060 |
Token | he |
Token ID | 339 |
Feature activation | -3.52e-02 |
Pos logit contributions | |
bul | +0.051 |
spe | +0.051 |
flew | +0.049 |
paramed | +0.048 |
pol | +0.047 |
Neg logit contributions | |
spaghetti | -0.049 |
sidelines | -0.047 |
Seek | -0.042 |
bed | -0.041 |
menu | -0.040 |
Token | could |
Token ID | 714 |
Feature activation | -3.82e-02 |
Pos logit contributions | |
bul | +0.054 |
paramed | +0.053 |
spe | +0.053 |
esh | +0.051 |
xc | +0.048 |
Neg logit contributions | |
spaghetti | -0.051 |
sidelines | -0.049 |
Seek | -0.046 |
Want | -0.045 |
menu | -0.044 |
Token | . |
Token ID | 13 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
bul | +0.067 |
spe | +0.066 |
paramed | +0.064 |
xc | +0.062 |
pre | +0.060 |
Neg logit contributions | |
sidelines | -0.049 |
spaghetti | -0.045 |
bed | -0.043 |
safe | -0.039 |
anywhere | -0.039 |
Token |
|
Token ID | 198 |
Feature activation | -9.53e-04 |
Pos logit contributions | |
spe | +0.019 |
flew | +0.019 |
bul | +0.019 |
Bel | +0.017 |
paramed | +0.017 |
Neg logit contributions | |
sidelines | -0.020 |
spaghetti | -0.020 |
Seek | -0.018 |
menu | -0.017 |
ours | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | +4.74e-03 |
Pos logit contributions | |
spaghetti | +0.005 |
sidelines | +0.005 |
Seek | +0.005 |
menu | +0.004 |
bed | +0.004 |
Neg logit contributions | |
bul | -0.005 |
flew | -0.005 |
spe | -0.005 |
pol | -0.004 |
Bel | -0.004 |
Token | M |
Token ID | 44 |
Feature activation | -3.10e-02 |
Pos logit contributions | |
sidelines | +0.009 |
spaghetti | +0.009 |
Seek | +0.008 |
menu | +0.007 |
bed | +0.007 |
Neg logit contributions | |
bul | -0.006 |
flew | -0.006 |
spe | -0.006 |
pre | -0.005 |
pol | -0.005 |
Token | ama |
Token ID | 1689 |
Feature activation | +9.46e-04 |
Pos logit contributions | |
flew | +0.047 |
bul | +0.046 |
spe | +0.046 |
soared | +0.045 |
Or | +0.043 |
Neg logit contributions | |
spaghetti | -0.046 |
sidelines | -0.045 |
bed | -0.040 |
Seek | -0.040 |
menu | -0.039 |
Token | smiled |
Token ID | 13541 |
Feature activation | +1.48e-02 |
Pos logit contributions | |
spaghetti | +0.002 |
sidelines | +0.001 |
menu | +0.001 |
Seek | +0.001 |
bed | +0.001 |
Neg logit contributions | |
bul | -0.001 |
spe | -0.001 |
pol | -0.001 |
Or | -0.001 |
pre | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | -4.70e-03 |
Pos logit contributions | |
spaghetti | +0.019 |
sidelines | +0.017 |
bed | +0.015 |
menu | +0.015 |
safe | +0.014 |
Neg logit contributions | |
bul | -0.026 |
spe | -0.026 |
flew | -0.026 |
soared | -0.025 |
pre | -0.025 |
Token | r |
Token ID | 374 |
Feature activation | -8.73e-02 |
Pos logit contributions | |
bul | +0.007 |
spe | +0.007 |
cker | +0.006 |
pre | +0.006 |
esh | +0.006 |
Neg logit contributions | |
spaghetti | -0.008 |
sidelines | -0.007 |
Seek | -0.007 |
bed | -0.006 |
safe | -0.006 |
Token | uff |
Token ID | 1648 |
Feature activation | -2.57e-02 |
Pos logit contributions | |
flew | +0.133 |
bul | +0.126 |
Or | +0.126 |
rob | +0.126 |
soared | +0.125 |
Neg logit contributions | |
spaghetti | -0.128 |
sidelines | -0.121 |
Seek | -0.113 |
amas | -0.105 |
menu | -0.098 |
Token | led |
Token ID | 992 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
bul | +0.035 |
spe | +0.033 |
Bel | +0.033 |
Or | +0.031 |
rob | +0.031 |
Neg logit contributions | |
spaghetti | -0.042 |
sidelines | -0.040 |
menu | -0.035 |
Seek | -0.034 |
mine | -0.034 |
Token | the |
Token ID | 262 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
bul | +0.030 |
flew | +0.029 |
spe | +0.029 |
soared | +0.028 |
pre | +0.027 |
Neg logit contributions | |
spaghetti | -0.032 |
sidelines | -0.030 |
bed | -0.027 |
Seek | -0.027 |
menu | -0.026 |
Token | three |
Token ID | 1115 |
Feature activation | -3.66e-02 |
Pos logit contributions | |
flew | +0.028 |
spe | +0.028 |
bul | +0.027 |
paramed | +0.027 |
blew | +0.026 |
Neg logit contributions | |
spaghetti | -0.019 |
sidelines | -0.019 |
Seek | -0.018 |
ours | -0.017 |
Want | -0.016 |
Token | - |
Token ID | 12 |
Feature activation | -4.22e-02 |
Pos logit contributions | |
bul | +0.058 |
flew | +0.056 |
spe | +0.055 |
Bel | +0.053 |
pol | +0.053 |
Neg logit contributions | |
spaghetti | -0.055 |
sidelines | -0.053 |
menu | -0.047 |
Seek | -0.046 |
bed | -0.045 |
Token | and |
Token ID | 290 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
bul | +0.019 |
flew | +0.019 |
spe | +0.019 |
paramed | +0.018 |
Bel | +0.018 |
Neg logit contributions | |
spaghetti | -0.018 |
sidelines | -0.017 |
Seek | -0.015 |
menu | -0.015 |
bed | -0.015 |
Token | always |
Token ID | 1464 |
Feature activation | -2.57e-02 |
Pos logit contributions | |
bul | +0.014 |
spe | +0.013 |
flew | +0.013 |
paramed | +0.012 |
Bel | +0.012 |
Neg logit contributions | |
spaghetti | -0.021 |
sidelines | -0.021 |
Seek | -0.019 |
bed | -0.018 |
menu | -0.018 |
Token | had |
Token ID | 550 |
Feature activation | -2.26e-02 |
Pos logit contributions | |
bul | +0.028 |
spe | +0.027 |
flew | +0.026 |
paramed | +0.024 |
pre | +0.024 |
Neg logit contributions | |
spaghetti | -0.050 |
sidelines | -0.049 |
Seek | -0.045 |
menu | -0.044 |
bed | -0.044 |
Token | plenty |
Token ID | 6088 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
bul | +0.039 |
spe | +0.039 |
flew | +0.038 |
pre | +0.036 |
paramed | +0.036 |
Neg logit contributions | |
spaghetti | -0.030 |
sidelines | -0.029 |
Seek | -0.025 |
bed | -0.024 |
menu | -0.024 |
Token | of |
Token ID | 286 |
Feature activation | -1.49e-02 |
Pos logit contributions | |
sidelines | +0.020 |
spaghetti | +0.019 |
Seek | +0.018 |
Want | +0.017 |
internet | +0.017 |
Neg logit contributions | |
bul | -0.014 |
flew | -0.013 |
pre | -0.012 |
spe | -0.012 |
pol | -0.012 |
Token | rad |
Token ID | 2511 |
Feature activation | -7.21e-02 |
Pos logit contributions | |
flew | +0.027 |
bul | +0.026 |
spe | +0.025 |
soared | +0.024 |
pol | +0.024 |
Neg logit contributions | |
sidelines | -0.019 |
spaghetti | -0.018 |
Seek | -0.016 |
menu | -0.015 |
bed | -0.015 |
Token | ishes |
Token ID | 5614 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
spe | +0.086 |
bul | +0.086 |
flew | +0.085 |
paramed | +0.079 |
Bel | +0.076 |
Neg logit contributions | |
spaghetti | -0.130 |
sidelines | -0.125 |
Seek | -0.116 |
menu | -0.113 |
robbers | -0.110 |
Token | to |
Token ID | 284 |
Feature activation | -9.10e-03 |
Pos logit contributions | |
bul | +0.018 |
flew | +0.018 |
spe | +0.018 |
pre | +0.016 |
pol | +0.016 |
Neg logit contributions | |
sidelines | -0.019 |
spaghetti | -0.018 |
Seek | -0.016 |
menu | -0.016 |
bed | -0.015 |
Token | eat |
Token ID | 4483 |
Feature activation | +2.87e-02 |
Pos logit contributions | |
flew | +0.015 |
bul | +0.014 |
spe | +0.014 |
soared | +0.013 |
Bel | +0.013 |
Neg logit contributions | |
spaghetti | -0.013 |
sidelines | -0.013 |
Seek | -0.011 |
menu | -0.011 |
bed | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | -7.08e-03 |
Pos logit contributions | |
sidelines | +0.050 |
spaghetti | +0.048 |
Seek | +0.045 |
menu | +0.042 |
robbers | +0.042 |
Neg logit contributions | |
flew | -0.037 |
bul | -0.037 |
spe | -0.035 |
pol | -0.033 |
pre | -0.032 |
Token | The |
Token ID | 383 |
Feature activation | +9.25e-04 |
Pos logit contributions | |
flew | +0.011 |
bul | +0.011 |
spe | +0.011 |
soared | +0.010 |
pol | +0.010 |
Neg logit contributions | |
spaghetti | -0.010 |
sidelines | -0.010 |
Seek | -0.009 |
bed | -0.008 |
menu | -0.008 |
Token | red |
Token ID | 2266 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
spaghetti | +0.005 |
sidelines | +0.004 |
bed | +0.004 |
mine | +0.004 |
ours | +0.004 |
Neg logit contributions | |
spe | -0.008 |
bul | -0.007 |
xc | -0.007 |
pre | -0.007 |
Bel | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | +3.94e-02 |
Pos logit contributions | |
flew | +0.014 |
bul | +0.014 |
spe | +0.012 |
spr | +0.012 |
pre | +0.012 |
Neg logit contributions | |
sidelines | -0.024 |
Seek | -0.022 |
spaghetti | -0.022 |
Want | -0.020 |
robbers | -0.020 |
Token | white |
Token ID | 2330 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
spaghetti | +0.057 |
sidelines | +0.056 |
Seek | +0.050 |
menu | +0.048 |
bed | +0.048 |
Neg logit contributions | |
bul | -0.061 |
flew | -0.061 |
spe | -0.061 |
paramed | -0.056 |
Bel | -0.056 |
Token | and |
Token ID | 290 |
Feature activation | +2.45e-02 |
Pos logit contributions | |
flew | +0.019 |
bul | +0.018 |
spe | +0.016 |
soared | +0.016 |
pre | +0.016 |
Neg logit contributions | |
sidelines | -0.030 |
spaghetti | -0.028 |
Seek | -0.027 |
menu | -0.025 |
robbers | -0.025 |
Token | it |
Token ID | 340 |
Feature activation | -4.77e-04 |
Pos logit contributions | |
sidelines | +0.040 |
spaghetti | +0.040 |
Seek | +0.035 |
menu | +0.035 |
bed | +0.033 |
Neg logit contributions | |
flew | -0.035 |
bul | -0.035 |
spe | -0.034 |
soared | -0.032 |
pol | -0.031 |
Token | r |
Token ID | 374 |
Feature activation | -7.07e-02 |
Pos logit contributions | |
paramed | +0.001 |
xc | +0.001 |
spe | +0.001 |
Bel | +0.001 |
esh | +0.001 |
Neg logit contributions | |
spaghetti | -0.001 |
safe | -0.001 |
Seek | -0.001 |
cozy | -0.000 |
bed | -0.000 |
Token | ipp |
Token ID | 3974 |
Feature activation | -1.68e-02 |
Pos logit contributions | |
bul | +0.122 |
flew | +0.122 |
spe | +0.120 |
Bel | +0.117 |
Or | +0.116 |
Neg logit contributions | |
spaghetti | -0.084 |
sidelines | -0.081 |
Seek | -0.072 |
ours | -0.069 |
menu | -0.067 |
Token | led |
Token ID | 992 |
Feature activation | -9.87e-03 |
Pos logit contributions | |
paramed | +0.025 |
bul | +0.023 |
Or | +0.021 |
Sher | +0.020 |
esh | +0.020 |
Neg logit contributions | |
spaghetti | -0.022 |
ours | -0.022 |
food | -0.021 |
mine | -0.021 |
oring | -0.020 |
Token | in |
Token ID | 287 |
Feature activation | -1.40e-02 |
Pos logit contributions | |
flew | +0.012 |
bul | +0.012 |
spe | +0.011 |
soared | +0.011 |
pol | +0.010 |
Neg logit contributions | |
sidelines | -0.019 |
spaghetti | -0.018 |
Seek | -0.016 |
menu | -0.016 |
robbers | -0.016 |
Token | the |
Token ID | 262 |
Feature activation | +4.00e-03 |
Pos logit contributions | |
flew | +0.017 |
bul | +0.017 |
spe | +0.016 |
soared | +0.015 |
Bel | +0.015 |
Neg logit contributions | |
sidelines | -0.026 |
spaghetti | -0.025 |
Seek | -0.023 |
menu | -0.023 |
robbers | -0.022 |
Token | wind |
Token ID | 2344 |
Feature activation | -9.19e-04 |
Pos logit contributions | |
spaghetti | +0.005 |
sidelines | +0.004 |
bed | +0.004 |
menu | +0.004 |
Seek | +0.004 |
Neg logit contributions | |
bul | -0.008 |
spe | -0.007 |
flew | -0.007 |
paramed | -0.007 |
pol | -0.007 |
Token | tub |
Token ID | 12202 |
Feature activation | +5.39e-03 |
Pos logit contributions | |
flew | +0.017 |
bul | +0.017 |
spe | +0.016 |
paramed | +0.016 |
blew | +0.015 |
Neg logit contributions | |
sidelines | -0.016 |
spaghetti | -0.015 |
Seek | -0.014 |
internet | -0.012 |
ours | -0.012 |
Token | of |
Token ID | 286 |
Feature activation | -3.60e-03 |
Pos logit contributions | |
spaghetti | +0.006 |
sidelines | +0.006 |
bed | +0.005 |
menu | +0.005 |
Seek | +0.005 |
Neg logit contributions | |
flew | -0.010 |
soared | -0.010 |
bul | -0.009 |
spe | -0.009 |
Bel | -0.009 |
Token | ice |
Token ID | 4771 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
bul | +0.006 |
flew | +0.006 |
spe | +0.006 |
Bel | +0.006 |
pre | +0.006 |
Neg logit contributions | |
spaghetti | -0.005 |
sidelines | -0.005 |
Seek | -0.004 |
menu | -0.004 |
bed | -0.004 |
Token | cream |
Token ID | 8566 |
Feature activation | -2.48e-03 |
Pos logit contributions | |
spe | +0.021 |
bul | +0.020 |
flew | +0.020 |
Bel | +0.020 |
soared | +0.019 |
Neg logit contributions | |
spaghetti | -0.016 |
menu | -0.013 |
bed | -0.013 |
sidelines | -0.013 |
food | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | -9.40e-03 |
Pos logit contributions | |
spe | +0.004 |
flew | +0.004 |
bul | +0.004 |
Bel | +0.004 |
soared | +0.004 |
Neg logit contributions | |
spaghetti | -0.004 |
sidelines | -0.003 |
menu | -0.003 |
bed | -0.003 |
Seek | -0.003 |
Token | two |
Token ID | 734 |
Feature activation | -7.16e-02 |
Pos logit contributions | |
bul | +0.011 |
spe | +0.011 |
flew | +0.010 |
Bel | +0.010 |
paramed | +0.010 |
Neg logit contributions | |
spaghetti | -0.018 |
sidelines | -0.017 |
Seek | -0.015 |
bed | -0.015 |
menu | -0.015 |
Token | pops |
Token ID | 26384 |
Feature activation | -3.47e-02 |
Pos logit contributions | |
bul | +0.127 |
spe | +0.119 |
Bel | +0.118 |
pre | +0.117 |
xc | +0.117 |
Neg logit contributions | |
spaghetti | -0.099 |
sidelines | -0.087 |
menu | -0.079 |
bed | -0.078 |
Seek | -0.074 |
Token | icles |
Token ID | 2983 |
Feature activation | -2.11e-02 |
Pos logit contributions | |
spe | +0.055 |
Bel | +0.053 |
bul | +0.051 |
flew | +0.050 |
Sher | +0.050 |
Neg logit contributions | |
spaghetti | -0.056 |
sidelines | -0.046 |
menu | -0.046 |
bed | -0.045 |
food | -0.044 |
Token | . |
Token ID | 13 |
Feature activation | -4.08e-03 |
Pos logit contributions | |
spe | +0.038 |
bul | +0.038 |
Bel | +0.037 |
xc | +0.036 |
Sher | +0.036 |
Neg logit contributions | |
spaghetti | -0.027 |
sidelines | -0.023 |
menu | -0.022 |
bed | -0.021 |
safe | -0.019 |
Token | They |
Token ID | 1119 |
Feature activation | -7.08e-03 |
Pos logit contributions | |
bul | +0.006 |
spe | +0.006 |
flew | +0.006 |
Bel | +0.006 |
soared | +0.006 |
Neg logit contributions | |
spaghetti | -0.006 |
sidelines | -0.006 |
Seek | -0.005 |
menu | -0.005 |
bed | -0.005 |
Token | closed |
Token ID | 4838 |
Feature activation | +6.62e-04 |
Pos logit contributions | |
bul | +0.010 |
esh | +0.010 |
xc | +0.009 |
spe | +0.009 |
Bel | +0.009 |
Neg logit contributions | |
spaghetti | -0.012 |
sidelines | -0.011 |
menu | -0.010 |
bed | -0.010 |
Seek | -0.010 |